Registry Review MCP Server

test_llm_json_validation.py•13.1 KiB

"""Tests for LLM JSON response validation and error handling.""" import pytest from registry_review_mcp.extractors.llm_extractors import ( DateExtractor, LandTenureExtractor, ProjectIDExtractor, ) # Import factory infrastructure from tests.factories import ( unique_doc_name, create_llm_mock_response, create_llm_client_mock, mock_date_extraction, mock_tenure_extraction, mock_project_id_extraction, ) class TestInvalidJSON: """Test handling of invalid JSON responses.""" @pytest.mark.asyncio async def test_malformed_json_syntax_error(self): """Test that malformed JSON is handled gracefully.""" # Invalid JSON: missing closing bracket malformed_json = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "confidence": 0.95, "reasoning": "test" ''' response = create_llm_mock_response(malformed_json) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("malformed_json")) # Should return empty list instead of crashing assert isinstance(results, list) assert len(results) == 0 @pytest.mark.asyncio async def test_json_without_code_fence(self): """Test JSON response without markdown code fence.""" response = create_llm_mock_response(mock_date_extraction("2022-01-01"), use_code_fence=False) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("json_without_fence")) # Should still parse successfully assert len(results) == 1 assert results[0].value == "2022-01-01" @pytest.mark.asyncio async def test_non_json_text_response(self): """Test handling of plain text instead of JSON.""" response = create_llm_mock_response("I found the project start date to be January 1, 2022.", use_code_fence=False) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("non_json_text")) # Should return 
empty list when JSON parsing fails assert isinstance(results, list) assert len(results) == 0 @pytest.mark.asyncio async def test_empty_json_array(self): """Test handling of empty JSON array response.""" response = create_llm_mock_response("[]") client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("empty_array")) # Empty array is valid - just means no fields found assert isinstance(results, list) assert len(results) == 0 @pytest.mark.asyncio async def test_json_object_instead_of_array(self): """Test handling when LLM returns object instead of array.""" json_object = '''{ "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "confidence": 0.95, "reasoning": "test" }''' response = create_llm_mock_response(json_object) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("json_object")) # Should handle gracefully - either convert to array or return empty assert isinstance(results, list) class TestMissingRequiredFields: """Test handling of JSON with missing required fields.""" @pytest.mark.asyncio async def test_missing_value_field(self): """Test handling when 'value' field is missing.""" json_content = '''[ { "field_type": "project_start_date", "source": "test", "confidence": 0.95, "reasoning": "test" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("missing_value")) # Should skip invalid entries assert len(results) == 0 @pytest.mark.asyncio async def test_missing_field_type(self): """Test handling when 'field_type' is missing.""" json_content = '''[ { "value": "2022-01-01", "source": "test", "confidence": 0.95, "reasoning": "test" } ]''' response = create_llm_mock_response(json_content) client = 
create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("missing_field_type")) # Should skip entries without field_type assert len(results) == 0 @pytest.mark.asyncio async def test_missing_confidence(self): """Test handling when 'confidence' is missing.""" json_content = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "reasoning": "test" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("missing_confidence")) # Should skip or use default confidence assert len(results) == 0 or results[0].confidence >= 0.0 @pytest.mark.asyncio async def test_missing_optional_fields(self): """Test that optional fields (raw_text, page_number) can be missing.""" json_content = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test.pdf", "confidence": 0.95, "reasoning": "Found in document" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("missing_optional")) # Should work fine - raw_text and page_number are optional assert len(results) == 1 assert results[0].value == "2022-01-01" class TestInvalidFieldValues: """Test handling of invalid field values.""" @pytest.mark.asyncio async def test_confidence_above_one(self): """Test handling when confidence > 1.0.""" response = create_llm_mock_response(mock_date_extraction("2022-01-01", confidence=1.5)) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("confidence_above_one")) # Should either skip or clamp to 1.0 if len(results) > 0: assert results[0].confidence <= 1.0 @pytest.mark.asyncio async def 
test_confidence_below_zero(self): """Test handling when confidence < 0.0.""" response = create_llm_mock_response(mock_date_extraction("2022-01-01", confidence=-0.5)) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("confidence_below_zero")) # Should either skip or clamp to 0.0 if len(results) > 0: assert results[0].confidence >= 0.0 @pytest.mark.asyncio async def test_confidence_as_string(self): """Test handling when confidence is string instead of number.""" json_content = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "confidence": "high", "reasoning": "test" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("confidence_string")) # Should skip entries with invalid confidence type assert len(results) == 0 @pytest.mark.asyncio async def test_null_value(self): """Test handling when value is null.""" json_content = '''[ { "value": null, "field_type": "project_start_date", "source": "test", "confidence": 0.95, "reasoning": "test" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("null_value")) # Implementation preserves null values (they can be filtered downstream) assert len(results) >= 0 # Either skips or preserves as None if len(results) > 0: assert results[0].value is None class TestPartiallyValidResponses: """Test handling when some entries are valid and others aren't.""" @pytest.mark.asyncio async def test_mixed_valid_and_invalid_entries(self): """Test that valid entries are preserved when some are invalid.""" json_content = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "confidence": 0.95, 
"reasoning": "Valid entry" }, { "value": "2022-06-15", "field_type": "baseline_imagery_date", "source": "test", "confidence": 2.5, "reasoning": "Invalid confidence" }, { "field_type": "project_end_date", "source": "test", "confidence": 0.9, "reasoning": "Missing value" }, { "value": "2024-01-01", "field_type": "reporting_period_end", "source": "test", "confidence": 0.85, "reasoning": "Another valid entry" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("mixed_valid_invalid")) # Implementation uses strict validation: rejects entire response if ANY entry is invalid # This is good for data quality - better to fail and get it fixed than accept partial data assert isinstance(results, list) # With strict validation, invalid confidence (2.5) causes entire response to be rejected # So we expect empty results (or all entries have valid confidence) for result in results: assert 0.0 <= result.confidence <= 1.0, "All results should have valid confidence" class TestLandTenureJSONValidation: """Test JSON validation for land tenure extractor.""" @pytest.mark.asyncio async def test_invalid_area_value(self): """Test handling when area is not a number.""" response = create_llm_mock_response(mock_tenure_extraction("very large")) client = create_llm_client_mock(response) extractor = LandTenureExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("invalid_area")) # Should handle gracefully - either skip or keep as string assert isinstance(results, list) class TestProjectIDJSONValidation: """Test JSON validation for project ID extractor.""" @pytest.mark.asyncio async def test_duplicate_project_ids_in_response(self): """Test deduplication when LLM returns duplicate IDs.""" json_content = '''[ { "value": "C06-4997", "field_type": "regen_project_id", "source": "page 1", "confidence": 0.95, "reasoning": 
"Found in header" }, { "value": "C06-4997", "field_type": "regen_project_id", "source": "page 3", "confidence": 0.90, "reasoning": "Found in footer" } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = ProjectIDExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("duplicate_ids")) # Should deduplicate (per the implementation in llm_extractors.py) assert len(results) == 1 assert results[0].value == "C06-4997" # Should keep the highest confidence assert results[0].confidence == 0.95 class TestExtraFields: """Test that extra unexpected fields don't break parsing.""" @pytest.mark.asyncio async def test_extra_fields_ignored(self): """Test that extra fields in JSON don't cause errors.""" json_content = '''[ { "value": "2022-01-01", "field_type": "project_start_date", "source": "test", "confidence": 0.95, "reasoning": "test", "extra_field": "should be ignored", "another_extra": 12345 } ]''' response = create_llm_mock_response(json_content) client = create_llm_client_mock(response) extractor = DateExtractor(client) results = await extractor.extract("test content", [], unique_doc_name("extra_fields")) # Should parse successfully, ignoring extra fields assert len(results) == 1 assert results[0].value == "2022-01-01"

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/gaiaaiagent/regen-registry-review-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

test_llm_json_validation.py•13.1 KiB