mcp-run-python

Official

Overview Schema Related Servers Score Discussions

test_openrouter.py•25.1 kB

"""Tests for the OpenRouter model and provider integration."""

from collections.abc import Sequence
from typing import Literal, cast

import pytest
from inline_snapshot import snapshot
from pydantic import BaseModel

from pydantic_ai import (
    Agent,
    BinaryContent,
    ModelHTTPError,
    ModelMessage,
    ModelRequest,
    ModelResponse,
    PartEndEvent,
    PartStartEvent,
    RunUsage,
    TextPart,
    ThinkingPart,
    ToolCallPart,
    ToolDefinition,
    UnexpectedModelBehavior,
)
from pydantic_ai.direct import model_request, model_request_stream
from pydantic_ai.models import ModelRequestParameters

from ..conftest import try_import

# The OpenRouter model depends on the optional `openai` package; record whether the import worked
# so the whole module can be skipped when it is missing.
with try_import() as imports_successful:
    from openai.types.chat import ChatCompletion
    from openai.types.chat.chat_completion import Choice

    from pydantic_ai.models.openrouter import OpenRouterModel, OpenRouterModelSettings
    from pydantic_ai.providers.openrouter import OpenRouterProvider

pytestmark = [
    pytest.mark.skipif(not imports_successful(), reason='openai not installed'),
    pytest.mark.vcr,
    pytest.mark.anyio,
]


async def test_openrouter_with_preset(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Send a request with an `openrouter_preset` setting and check the returned text."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.5-flash-lite', provider=provider)
    settings = OpenRouterModelSettings(openrouter_preset='@preset/comedian')
    response = await model_request(model, [ModelRequest.user_text_prompt('Trains')], model_settings=settings)
    text_part = cast(TextPart, response.parts[0])
    # NOTE(review): line breaks inside this snapshot text could not be recovered from the flattened
    # source - confirm against the recorded cassette.
    assert text_part.content == snapshot(
        """\
Why did the train break up with the track? Because it felt like their relationship was going nowhere.\
"""
    )


async def test_openrouter_with_native_options(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that OpenRouter-specific routing settings end up selecting the xAI fallback model."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.0-flash-exp:free', provider=provider)
    # These specific settings will force OpenRouter to use the fallback model, since Gemini is not available via the xAI provider.
    settings = OpenRouterModelSettings(
        openrouter_models=['x-ai/grok-4'],
        openrouter_transforms=['middle-out'],
        openrouter_provider={'only': ['xai']},
    )
    response = await model_request(model, [ModelRequest.user_text_prompt('Who are you')], model_settings=settings)
    text_part = cast(TextPart, response.parts[0])
    # NOTE(review): line breaks inside this snapshot text could not be recovered from the flattened
    # source - confirm against the recorded cassette.
    assert text_part.content == snapshot(
        """\
I'm Grok, a helpful and maximally truthful AI built by xAI. I'm not based on any other companies' models—instead, I'm inspired by the Hitchhiker's Guide to the Galaxy and JARVIS from Iron Man. My goal is to assist with questions, provide information, and maybe crack a joke or two along the way. What can I help you with today?\
"""
    )
    assert response.provider_details is not None
    assert response.provider_details['downstream_provider'] == 'xAI'
    assert response.provider_details['finish_reason'] == 'stop'


async def test_openrouter_stream_with_native_options(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that provider details and finish reason are only populated once the stream is consumed."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.0-flash-exp:free', provider=provider)
    # These specific settings will force OpenRouter to use the fallback model, since Gemini is not available via the xAI provider.
    settings = OpenRouterModelSettings(
        openrouter_models=['x-ai/grok-4'],
        openrouter_transforms=['middle-out'],
        openrouter_provider={'only': ['xai']},
    )

    async with model_request_stream(
        model, [ModelRequest.user_text_prompt('Who are you')], model_settings=settings
    ) as stream:
        # Nothing has been read yet, so no details are available.
        assert stream.provider_details == snapshot(None)
        assert stream.finish_reason == snapshot(None)

        _ = [chunk async for chunk in stream]

        assert stream.provider_details == snapshot({'finish_reason': 'completed', 'downstream_provider': 'xAI'})
        assert stream.finish_reason == snapshot('stop')


async def test_openrouter_stream_with_reasoning(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check the thinking part carried by the first two streamed events of a reasoning model."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel(
        'openai/o3',
        provider=provider,
        settings=OpenRouterModelSettings(openrouter_reasoning={'effort': 'high'}),
    )

    async with model_request_stream(model, [ModelRequest.user_text_prompt('Who are you')]) as stream:
        chunks = [chunk async for chunk in stream]

        thinking_event_start = chunks[0]
        assert isinstance(thinking_event_start, PartStartEvent)

        thinking_part = thinking_event_start.part
        assert isinstance(thinking_part, ThinkingPart)
        assert thinking_part.id == 'rs_0aa4f2c435e6d1dc0169082486816c8193a029b5fc4ef1764f'
        assert thinking_part.content == ''
        assert thinking_part.provider_name == 'openrouter'
        # After fix: signature and provider_details are now properly preserved
        assert thinking_part.signature is not None
        assert thinking_part.provider_details is not None
        assert thinking_part.provider_details['type'] == 'reasoning.encrypted'
        assert thinking_part.provider_details['format'] == 'openai-responses-v1'

        thinking_event_end = chunks[1]
        assert isinstance(thinking_event_end, PartEndEvent)

        thinking_part_end = thinking_event_end.part
        assert isinstance(thinking_part_end, ThinkingPart)
        assert thinking_part_end.id == 'rs_0aa4f2c435e6d1dc0169082486816c8193a029b5fc4ef1764f'
        assert thinking_part_end.signature is not None


async def test_openrouter_stream_error(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that consuming this stream raises `ModelHTTPError`."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('minimax/minimax-m2:free', provider=provider)
    settings = OpenRouterModelSettings(max_tokens=10)

    with pytest.raises(ModelHTTPError):
        async with model_request_stream(
            model, [ModelRequest.user_text_prompt('Hello there')], model_settings=settings
        ) as stream:
            _ = [chunk async for chunk in stream]


async def test_openrouter_tool_calling(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check a single tool call response and how it maps back to a chat-completions message."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)

    class Divide(BaseModel):
        """Divide two numbers."""

        numerator: float
        denominator: float
        on_inf: Literal['error', 'infinity'] = 'infinity'

    model = OpenRouterModel('mistralai/mistral-small', provider=provider)
    response = await model_request(
        model,
        [ModelRequest.user_text_prompt('What is 123 / 456?')],
        model_request_parameters=ModelRequestParameters(
            function_tools=[
                ToolDefinition(
                    name=Divide.__name__.lower(),
                    description=Divide.__doc__,
                    parameters_json_schema=Divide.model_json_schema(),
                )
            ],
            allow_text_output=True,  # Allow model to either use tools or respond directly
        ),
    )

    assert len(response.parts) == 1

    tool_call_part = response.parts[0]
    assert isinstance(tool_call_part, ToolCallPart)
    assert tool_call_part.tool_call_id == snapshot('3sniiMddS')
    assert tool_call_part.tool_name == 'divide'
    assert tool_call_part.args == snapshot('{"numerator": 123, "denominator": 456, "on_inf": "infinity"}')

    mapped_messages = await model._map_messages([response], None)  # type: ignore[reportPrivateUsage]
    tool_call_message = mapped_messages[0]
    assert tool_call_message['role'] == 'assistant'
    assert tool_call_message.get('content') is None
    assert tool_call_message.get('tool_calls') == snapshot(
        [
            {
                'id': '3sniiMddS',
                'type': 'function',
                'function': {
                    'name': 'divide',
                    'arguments': '{"numerator": 123, "denominator": 456, "on_inf": "infinity"}',
                },
            }
        ]
    )


async def test_openrouter_with_reasoning(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that the response starts with an unsigned thinking part that has no id."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    request = ModelRequest.user_text_prompt(
        "What was the impact of Voltaire's writings on modern french culture? Think about your answer."
    )

    model = OpenRouterModel('z-ai/glm-4.6', provider=provider)
    response = await model_request(model, [request])

    assert len(response.parts) == 2

    thinking_part = response.parts[0]
    assert isinstance(thinking_part, ThinkingPart)
    assert thinking_part.id == snapshot(None)
    assert thinking_part.content is not None
    assert thinking_part.signature is None


async def test_openrouter_preserve_reasoning_block(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check which mapped assistant messages carry `reasoning_details` across a two-turn exchange."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('openai/gpt-5-mini', provider=provider)

    messages: Sequence[ModelMessage] = []
    messages.append(ModelRequest.user_text_prompt('Hello!'))
    messages.append(await model_request(model, messages))
    messages.append(
        ModelRequest.user_text_prompt("What was the impact of Voltaire's writings on modern french culture?")
    )
    messages.append(await model_request(model, messages))

    openai_messages = await model._map_messages(messages, None)  # type: ignore[reportPrivateUsage]

    # First assistant turn (reply to 'Hello!') has no reasoning details.
    assistant_message = openai_messages[1]
    assert assistant_message['role'] == 'assistant'
    assert 'reasoning_details' not in assistant_message

    # Second assistant turn carries a summary entry followed by an encrypted entry.
    assistant_message = openai_messages[3]
    assert assistant_message['role'] == 'assistant'
    assert 'reasoning_details' in assistant_message

    reasoning_details = assistant_message['reasoning_details']
    assert len(reasoning_details) == 2

    reasoning_summary = reasoning_details[0]
    assert 'summary' in reasoning_summary
    assert reasoning_summary['type'] == 'reasoning.summary'
    assert reasoning_summary['format'] == 'openai-responses-v1'

    reasoning_encrypted = reasoning_details[1]
    assert 'data' in reasoning_encrypted
    assert reasoning_encrypted['type'] == 'reasoning.encrypted'
    assert reasoning_encrypted['format'] == 'openai-responses-v1'


async def test_openrouter_errors_raised(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that a 429 from the upstream provider surfaces as `ModelHTTPError` with the full body."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.0-flash-exp:free', provider=provider)
    agent = Agent(model, instructions='Be helpful.', retries=1)

    with pytest.raises(ModelHTTPError) as exc_info:
        await agent.run('Tell me a joke.')

    assert str(exc_info.value) == snapshot(
        "status_code: 429, model_name: google/gemini-2.0-flash-exp:free, body: {'code': 429, 'message': 'Provider returned error', 'metadata': {'provider_name': 'Google', 'raw': 'google/gemini-2.0-flash-exp:free is temporarily rate-limited upstream. Please retry shortly, or add your own key to accumulate your rate limits: https://openrouter.ai/settings/integrations'}}"
    )


async def test_openrouter_usage(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Compare reported usage with and without the `openrouter_usage` include setting."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('openai/gpt-5-mini', provider=provider)
    agent = Agent(model, instructions='Be helpful.', retries=1)

    result = await agent.run('Tell me about Venus')

    assert result.usage() == snapshot(
        RunUsage(input_tokens=17, output_tokens=1515, details={'reasoning_tokens': 704}, requests=1)
    )

    settings = OpenRouterModelSettings(openrouter_usage={'include': True})

    result = await agent.run('Tell me about Mars', model_settings=settings)

    assert result.usage() == snapshot(
        RunUsage(
            input_tokens=17,
            output_tokens=2177,
            details={'is_byok': 0, 'reasoning_tokens': 960, 'image_tokens': 0},
            requests=1,
        )
    )

    last_message = result.all_messages()[-1]

    assert isinstance(last_message, ModelResponse)
    assert last_message.provider_details is not None
    for key in ['cost', 'upstream_inference_cost', 'is_byok']:
        assert key in last_message.provider_details


async def test_openrouter_validate_non_json_response(openrouter_api_key: str) -> None:
    """Check that a plain string passed to `_process_response` raises `UnexpectedModelBehavior`."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.0-flash-exp:free', provider=provider)

    with pytest.raises(UnexpectedModelBehavior) as exc_info:
        model._process_response('This is not JSON!')  # type: ignore[reportPrivateUsage]

    assert str(exc_info.value) == snapshot(
        'Invalid response from openrouter chat completions endpoint, expected JSON data'
    )


async def test_openrouter_validate_error_response(openrouter_api_key: str) -> None:
    """Check that a response object carrying an `error` attribute raises `ModelHTTPError`."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('google/gemini-2.0-flash-exp:free', provider=provider)

    choice = Choice.model_construct(
        index=0, message={'role': 'assistant'}, finish_reason='error', native_finish_reason='stop'
    )
    response = ChatCompletion.model_construct(
        id='', choices=[choice], created=0, object='chat.completion', model='test', provider='test'
    )
    response.error = {'message': 'This response has an error attribute', 'code': 200}  # type: ignore[reportAttributeAccessIssue]

    with pytest.raises(ModelHTTPError) as exc_info:
        model._process_response(response)  # type: ignore[reportPrivateUsage]

    assert str(exc_info.value) == snapshot(
        'status_code: 200, model_name: test, body: This response has an error attribute'
    )


async def test_openrouter_map_messages_reasoning(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check the `reasoning_details` produced when mapping a response that contains thinking."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('anthropic/claude-3.7-sonnet:thinking', provider=provider)

    user_message = ModelRequest.user_text_prompt('Who are you. Think about it.')
    response = await model_request(model, [user_message])

    mapped_messages = await model._map_messages([user_message, response], None)  # type: ignore[reportPrivateUsage]

    assert len(mapped_messages) == 2
    # NOTE(review): line breaks inside the 'text' snapshot could not be recovered from the flattened
    # source - confirm against the recorded cassette.
    assert mapped_messages[1]['reasoning_details'] == snapshot(  # type: ignore[reportGeneralTypeIssues]
        [
            {
                'id': None,
                'type': 'reasoning.text',
                'text': """\
This question is asking me about my identity. Let me think about how to respond clearly and accurately. I am Claude, an AI assistant created by Anthropic. I'm designed to be helpful, harmless, and honest in my interactions with humans. I don't have a physical form - I exist as a large language model running on computer hardware. I don't have consciousness, sentience, or feelings in the way humans do. I don't have personal experiences or a life outside of these conversations. My capabilities include understanding and generating natural language text, reasoning about various topics, and attempting to be helpful to users in a wide range of contexts. I have been trained on a large corpus of text data, but my training data has a cutoff date, so I don't have knowledge of events that occurred after my training. I have certain limitations - I don't have the ability to access the internet, run code, or interact with external systems unless given specific tools to do so. I don't have perfect knowledge and can make mistakes. I'm designed to be conversational and to engage with users in a way that's helpful and informative, while respecting important ethical boundaries.\
""",
                'signature': 'ErcBCkgICBACGAIiQHtMxpqcMhnwgGUmSDWGoOL9ZHTbDKjWnhbFm0xKzFl0NmXFjQQxjFj5mieRYY718fINsJMGjycTVYeiu69npakSDDrsnKYAD/fdcpI57xoMHlQBxI93RMa5CSUZIjAFVCMQF5GfLLQCibyPbb7LhZ4kLIFxw/nqsTwDDt6bx3yipUcq7G7eGts8MZ6LxOYqHTlIDx0tfHRIlkkcNCdB2sUeMqP8e7kuQqIHoD52GAI=',
                'format': 'anthropic-claude-v1',
                'index': 0,
            }
        ]
    )


async def test_openrouter_tool_optional_parameters(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check that a tool call with no arguments is mapped with `'{}'` as its arguments string."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)

    class FindEducationContentFilters(BaseModel):
        title: str | None = None

    model = OpenRouterModel('anthropic/claude-sonnet-4.5', provider=provider)
    response = await model_request(
        model,
        [ModelRequest.user_text_prompt('Can you find me any education content?')],
        model_request_parameters=ModelRequestParameters(
            function_tools=[
                ToolDefinition(
                    name='find_education_content',
                    description='',
                    parameters_json_schema=FindEducationContentFilters.model_json_schema(),
                )
            ],
            allow_text_output=True,  # Allow model to either use tools or respond directly
        ),
    )

    assert len(response.parts) == 2

    tool_call_part = response.parts[1]
    assert isinstance(tool_call_part, ToolCallPart)
    assert tool_call_part.tool_call_id == snapshot('toolu_vrtx_015QAXScZzRDPttiPoc34AdD')
    assert tool_call_part.tool_name == 'find_education_content'
    assert tool_call_part.args == snapshot(None)

    mapped_messages = await model._map_messages([response], None)  # type: ignore[reportPrivateUsage]
    tool_call_message = mapped_messages[0]
    assert tool_call_message['role'] == 'assistant'
    assert tool_call_message.get('content') == snapshot("I'll search for education content for you.")
    assert tool_call_message.get('tool_calls') == snapshot(
        [
            {
                'id': 'toolu_vrtx_015QAXScZzRDPttiPoc34AdD',
                'type': 'function',
                'function': {
                    'name': 'find_education_content',
                    'arguments': '{}',
                },
            }
        ]
    )


async def test_openrouter_streaming_reasoning(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Check the thinking and text parts collected by `Agent.run_stream` with reasoning enabled."""
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('anthropic/claude-sonnet-4.5', provider=provider)
    agent = Agent(
        model=model,
        model_settings=OpenRouterModelSettings(openrouter_reasoning={'enabled': True}),
    )

    async with agent.run_stream('What is 2+2?') as stream:
        _ = await stream.get_output()

        assert stream.response.parts == snapshot(
            [
                ThinkingPart(
                    content='This is a simple arithmetic question. 2+2 equals 4.',
                    signature='Et0BCkgIChACGAIqQA2s7h7tA7IG35fbwVkou9PM2hANVJNUwcEM4q12fTRDK6y3v6YoEvJ+7bko8wnW/GLsQFXadaJPAEMCpLkhI9ISDLjFkeR1aVUIvdCtyBoMrUTovh0jwk+wpnZWIjANV3e6VVdgbGSsEyyTHO6KMmVtqqs79f9blnVdJmmMIwMyTi6bEtG59+jTU7v1zlsqQ2IKGZILOlr6adh0Aam7zYttvisys+wjyZZXU1y/Srz0nmp1cFgVOJe1BLKQI3SSRrjsqQC0uAEUZy0GX0Rq1AXjvIcYAQ==',
                    provider_name='openrouter',
                    provider_details={'format': 'anthropic-claude-v1', 'index': 0, 'type': 'reasoning.text'},
                ),
                TextPart(content='2 + 2 = 4'),
            ]
        )


async def test_openrouter_google_nested_schema(allow_model_requests: None, openrouter_api_key: str) -> None:
    """Test that nested schemas with $defs/$ref work correctly with OpenRouter + Gemini.

    This verifies the fix for https://github.com/pydantic/pydantic-ai/issues/3617
    where OpenRouter's translation layer didn't support modern JSON Schema features.
    """
    from enum import Enum

    provider = OpenRouterProvider(api_key=openrouter_api_key)

    class LevelType(str, Enum):
        ground = 'ground'
        basement = 'basement'
        floor = 'floor'
        attic = 'attic'

    class SpaceType(str, Enum):
        entryway = 'entryway'
        living_room = 'living-room'
        kitchen = 'kitchen'
        bedroom = 'bedroom'
        bathroom = 'bathroom'
        garage = 'garage'

    class InsertLevelArg(BaseModel):
        level_name: str
        level_type: LevelType

    class SpaceArg(BaseModel):
        space_name: str
        space_type: SpaceType

    class InsertedLevel(BaseModel):
        """Result of inserting a level."""

        level_name: str
        level_type: LevelType
        space_count: int

    model = OpenRouterModel('google/gemini-2.5-flash', provider=provider)
    agent: Agent[None, InsertedLevel] = Agent(model, output_type=InsertedLevel)

    @agent.tool_plain
    def insert_level_with_spaces(level: InsertLevelArg | None, spaces: list[SpaceArg]) -> str:
        """Insert a level with its spaces."""
        return f'Inserted level {level} with {len(spaces)} spaces'

    result = await agent.run("It's a house with a ground floor that has an entryway, a living room and a garage.")

    tool_call_message = result.all_messages()[1]
    assert tool_call_message.parts == snapshot(
        [
            ToolCallPart(
                tool_name='insert_level_with_spaces',
                args='{"spaces":[{"space_type":"entryway","space_name":"entryway"},{"space_name":"living_room","space_type":"living-room"},{"space_name":"garage","space_type":"garage"}],"level":{"level_type":"ground","level_name":"ground_floor"}}',
                tool_call_id='tool_insert_level_with_spaces_3ZiChYzj8xER8HixJe7W',
            )
        ]
    )

    assert result.output.level_type == LevelType.ground
    assert result.output.space_count == 3


async def test_openrouter_file_annotation(
    allow_model_requests: None, openrouter_api_key: str, document_content: BinaryContent
) -> None:
    """Test that file annotations from OpenRouter are handled correctly.

    When sending files (e.g., PDFs) to OpenRouter, the response can include
    annotations with type="file". This test ensures those annotations are parsed
    without validation errors.
    """
    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('openai/gpt-5.1-codex-mini', provider=provider)
    agent = Agent(model)

    result = await agent.run(
        user_prompt=[
            'What does this PDF contain? Answer in one short sentence.',
            document_content,
        ]
    )

    # The response should contain text (model may or may not include file annotations)
    assert isinstance(result.output, str)
    assert len(result.output) > 0


async def test_openrouter_file_annotation_validation(openrouter_api_key: str) -> None:
    """Test that file annotations from OpenRouter are correctly validated.

    This unit test verifies that responses containing type="file" annotations
    are parsed without validation errors, which was failing before the fix.
    """
    from openai.types.chat.chat_completion_message import ChatCompletionMessage

    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('openai/gpt-4.1-mini', provider=provider)

    message = ChatCompletionMessage.model_construct(
        role='assistant',
        content='Here is the summary of your file.',
        annotations=[
            {'type': 'file', 'file': {'filename': 'test.pdf', 'file_id': 'file-123'}},
        ],
    )
    choice = Choice.model_construct(index=0, message=message, finish_reason='stop', native_finish_reason='stop')
    response = ChatCompletion.model_construct(
        id='test', choices=[choice], created=0, object='chat.completion', model='test', provider='test'
    )

    # This should not raise a validation error
    result = model._process_response(response)  # type: ignore[reportPrivateUsage]
    text_part = cast(TextPart, result.parts[0])
    assert text_part.content == 'Here is the summary of your file.'


async def test_openrouter_url_citation_annotation_validation(openrouter_api_key: str) -> None:
    """Test that url_citation annotations from OpenRouter are correctly validated."""
    from openai.types.chat.chat_completion_message import ChatCompletionMessage

    provider = OpenRouterProvider(api_key=openrouter_api_key)
    model = OpenRouterModel('openai/gpt-4.1-mini', provider=provider)

    message = ChatCompletionMessage.model_construct(
        role='assistant',
        content='According to the source, this is the answer.',
        annotations=[
            {
                'type': 'url_citation',
                'url_citation': {'url': 'https://example.com', 'title': 'Example', 'start_index': 0, 'end_index': 10},
            },
        ],
    )
    choice = Choice.model_construct(index=0, message=message, finish_reason='stop', native_finish_reason='stop')
    response = ChatCompletion.model_construct(
        id='test', choices=[choice], created=0, object='chat.completion', model='test', provider='test'
    )

    # This should not raise a validation error
    result = model._process_response(response)  # type: ignore[reportPrivateUsage]
    text_part = cast(TextPart, result.parts[0])
    assert text_part.content == 'According to the source, this is the answer.'

Latest Blog Posts

Model Context Protocol Proxies: Enabling Enterprise Control with Virtual MCPs
By Om-Shree-0709 on December 9, 2025.
AI Security
Virtual MCP
Kubernetes Operator
The State of MCP in 2025: Who's Building What and Why It Matters
By punkpeye on December 7, 2025.
mcp
startups
MCP hosting with persistent storage
By punkpeye on December 6, 2025.
changelog

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/pydantic/pydantic-ai'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.