DM20 Protocol

Overview Schema Related Servers Score Discussions

dm20-protocol
tests
claudmaster

test_llm_client.py•21.8 KiB

"""
Unit tests for LLM Client implementations.

Tests MockLLMClient, AnthropicLLMClient, and MultiModelClient.
All tests of AnthropicLLMClient mock the SDK to avoid real API calls.
"""

import os
from contextlib import contextmanager
from typing import Any, Iterator
from unittest.mock import AsyncMock, MagicMock, patch

import pytest

from dm20_protocol.claudmaster.llm_client import (
    AnthropicLLMClient,
    MockLLMClient,
    MultiModelClient,
    LLMClientError,
    LLMConfigurationError,
    LLMAPIError,
    LLMRateLimitError,
    LLMDependencyError,
)
from dm20_protocol.claudmaster.config import ClaudmasterConfig


# ---------------------------------------------------------------------------
# Helpers
# ---------------------------------------------------------------------------

# Dotted path of the module under test; every SDK-related patch targets it.
_LLM_CLIENT_MODULE = "dm20_protocol.claudmaster.llm_client"


@contextmanager
def _patched_anthropic_sdk(
    sdk_module: Any = None,
    async_client: Any = None,
) -> Iterator[MagicMock]:
    """Patch the three SDK hooks of ``llm_client`` for the duration of a test.

    Sets ``_HAS_ANTHROPIC`` to True, replaces ``_anthropic_module`` and
    replaces ``AsyncAnthropic`` with a mock constructor.

    Args:
        sdk_module: Object installed as ``_anthropic_module``. A fresh
            ``MagicMock`` is used when omitted.
        async_client: Object returned by the patched ``AsyncAnthropic``
            constructor. When omitted the constructor is a plain
            ``MagicMock`` with its default return value.

    Yields:
        The mock that stands in for ``AsyncAnthropic``.
    """
    module_stub = MagicMock() if sdk_module is None else sdk_module
    if async_client is None:
        constructor = MagicMock()
    else:
        constructor = MagicMock(return_value=async_client)

    with patch(f"{_LLM_CLIENT_MODULE}._HAS_ANTHROPIC", True), \
         patch(f"{_LLM_CLIENT_MODULE}._anthropic_module", module_stub), \
         patch(f"{_LLM_CLIENT_MODULE}.AsyncAnthropic", constructor):
        yield constructor


def _make_async_client(**create_config: Any) -> AsyncMock:
    """Build a mock async SDK client whose ``messages.create`` is an AsyncMock.

    Args:
        **create_config: Keyword arguments forwarded to the ``AsyncMock`` used
            for ``messages.create`` (for example ``return_value`` or
            ``side_effect``).
    """
    async_client = AsyncMock()
    async_client.messages.create = AsyncMock(**create_config)
    return async_client


def _make_fake_sdk_module() -> MagicMock:
    """Build a stand-in SDK module exposing real exception classes.

    ``APIError`` and ``RateLimitError`` are created as independent
    ``Exception`` subclasses so they can be raised and caught.
    """
    fake_module = MagicMock()
    fake_module.APIError = type("APIError", (Exception,), {})
    fake_module.RateLimitError = type("RateLimitError", (Exception,), {})
    return fake_module


# ---------------------------------------------------------------------------
# Fixtures
# ---------------------------------------------------------------------------

@pytest.fixture
def mock_llm_client() -> MockLLMClient:
    """Create a basic MockLLMClient."""
    return MockLLMClient()


@pytest.fixture
def mock_llm_with_responses() -> MockLLMClient:
    """Create a MockLLMClient with predefined responses."""
    return MockLLMClient(
        responses=[
            "First response",
            "Second response",
            "Third response",
        ]
    )


@pytest.fixture
def mock_anthropic_message() -> MagicMock:
    """Create a mock Anthropic message response."""
    message = MagicMock()

    # Mock content block with text
    content_block = MagicMock()
    content_block.text = "This is a generated response from Claude."
    message.content = [content_block]

    # Mock usage stats
    message.usage = MagicMock()
    message.usage.input_tokens = 50
    message.usage.output_tokens = 100

    return message


# ---------------------------------------------------------------------------
# MockLLMClient Tests
# ---------------------------------------------------------------------------

@pytest.mark.anyio
async def test_mock_llm_basic_generate(mock_llm_client: MockLLMClient) -> None:
    """Test basic MockLLMClient generation."""
    response = await mock_llm_client.generate("Test prompt")

    assert response == "Mock LLM response."
    assert mock_llm_client.call_count == 1
    assert len(mock_llm_client.calls) == 1
    assert mock_llm_client.calls[0]["prompt"] == "Test prompt"
    assert mock_llm_client.calls[0]["max_tokens"] == 1024


@pytest.mark.anyio
async def test_mock_llm_custom_max_tokens(mock_llm_client: MockLLMClient) -> None:
    """Test MockLLMClient with custom max_tokens."""
    # Only the recorded call is inspected, so the return value is not bound.
    await mock_llm_client.generate("Test prompt", max_tokens=2048)

    assert mock_llm_client.calls[0]["max_tokens"] == 2048


@pytest.mark.anyio
async def test_mock_llm_multiple_responses(mock_llm_with_responses: MockLLMClient) -> None:
    """Test MockLLMClient cycling through multiple responses."""
    response1 = await mock_llm_with_responses.generate("Prompt 1")
    response2 = await mock_llm_with_responses.generate("Prompt 2")
    response3 = await mock_llm_with_responses.generate("Prompt 3")
    response4 = await mock_llm_with_responses.generate("Prompt 4")  # Should cycle back

    assert response1 == "First response"
    assert response2 == "Second response"
    assert response3 == "Third response"
    assert response4 == "First response"  # Cycled back
    assert mock_llm_with_responses.call_count == 4


@pytest.mark.anyio
async def test_mock_llm_reset(mock_llm_client: MockLLMClient) -> None:
    """Test MockLLMClient reset functionality."""
    await mock_llm_client.generate("Test 1")
    await mock_llm_client.generate("Test 2")

    assert mock_llm_client.call_count == 2
    assert len(mock_llm_client.calls) == 2

    mock_llm_client.reset()

    assert mock_llm_client.call_count == 0
    assert len(mock_llm_client.calls) == 0


def test_mock_llm_effort_stored() -> None:
    """Test that MockLLMClient stores effort parameter."""
    mock = MockLLMClient(effort="high")
    assert mock.effort == "high"


def test_mock_llm_effort_none_by_default() -> None:
    """Test that MockLLMClient effort is None by default."""
    mock = MockLLMClient()
    assert mock.effort is None


@pytest.mark.anyio
async def test_mock_llm_stream(mock_llm_client: MockLLMClient) -> None:
    """Test MockLLMClient streaming generation."""
    chunks = [chunk async for chunk in mock_llm_client.generate_stream("Test prompt")]

    # Should split "Mock LLM response." into words with spaces
    assert len(chunks) == 3
    assert "".join(chunks).strip() == "Mock LLM response."


# ---------------------------------------------------------------------------
# AnthropicLLMClient Tests - Initialization
# ---------------------------------------------------------------------------

def test_anthropic_client_missing_dependency() -> None:
    """Test that AnthropicLLMClient raises error when anthropic package is missing."""
    with patch(f"{_LLM_CLIENT_MODULE}._HAS_ANTHROPIC", False):
        with pytest.raises(LLMDependencyError, match="anthropic"):
            AnthropicLLMClient(api_key="test-key")


def test_anthropic_client_missing_api_key() -> None:
    """Test that AnthropicLLMClient raises error when API key is missing."""
    # The environment is emptied so no key can be picked up from it.
    with _patched_anthropic_sdk(), patch.dict(os.environ, {}, clear=True):
        with pytest.raises(LLMConfigurationError, match="API key is required"):
            AnthropicLLMClient()


def test_anthropic_client_with_api_key_param() -> None:
    """Test AnthropicLLMClient initialization with API key parameter."""
    with _patched_anthropic_sdk():
        client = AnthropicLLMClient(api_key="test-key-123")

        assert client.api_key == "test-key-123"
        assert client.model == "claude-sonnet-4-5-20250929"
        assert client.temperature == 0.7
        assert client.default_max_tokens == 1024


def test_anthropic_client_with_env_var() -> None:
    """Test AnthropicLLMClient initialization with environment variable."""
    with _patched_anthropic_sdk(), \
         patch.dict(os.environ, {"ANTHROPIC_API_KEY": "env-key-456"}):
        client = AnthropicLLMClient()

        assert client.api_key == "env-key-456"


def test_anthropic_client_custom_params() -> None:
    """Test AnthropicLLMClient with custom parameters."""
    with _patched_anthropic_sdk():
        client = AnthropicLLMClient(
            api_key="test-key",
            model="claude-haiku-4-5-20251001",
            temperature=0.9,
            default_max_tokens=2048,
        )

        assert client.model == "claude-haiku-4-5-20251001"
        assert client.temperature == 0.9
        assert client.default_max_tokens == 2048


def test_anthropic_client_with_effort() -> None:
    """Test AnthropicLLMClient with effort parameter."""
    with _patched_anthropic_sdk():
        client = AnthropicLLMClient(
            api_key="test-key",
            model="claude-opus-4-5-20250929",
            effort="medium",
        )

        assert client.effort == "medium"


def test_anthropic_client_effort_none_by_default() -> None:
    """Test that effort is None by default."""
    with _patched_anthropic_sdk():
        client = AnthropicLLMClient(api_key="test-key")

        assert client.effort is None


def test_anthropic_client_invalid_effort() -> None:
    """Test that invalid effort level raises error."""
    with _patched_anthropic_sdk():
        with pytest.raises(LLMConfigurationError, match="Invalid effort level"):
            AnthropicLLMClient(api_key="test-key", effort="ultra")


# ---------------------------------------------------------------------------
# AnthropicLLMClient Tests - Generation
# ---------------------------------------------------------------------------

@pytest.mark.anyio
async def test_anthropic_generate_success(mock_anthropic_message: MagicMock) -> None:
    """Test successful generation with AnthropicLLMClient."""
    mock_async_client = _make_async_client(return_value=mock_anthropic_message)

    with _patched_anthropic_sdk(async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key")
        response = await client.generate("Test prompt", max_tokens=512)

        assert response == "This is a generated response from Claude."
        mock_async_client.messages.create.assert_called_once()

        call_kwargs = mock_async_client.messages.create.call_args.kwargs
        assert call_kwargs["model"] == "claude-sonnet-4-5-20250929"
        assert call_kwargs["max_tokens"] == 512
        assert call_kwargs["temperature"] == 0.7
        assert call_kwargs["messages"][0]["content"] == "Test prompt"


@pytest.mark.anyio
async def test_anthropic_generate_with_effort(mock_anthropic_message: MagicMock) -> None:
    """Test that effort parameter is passed as output_config in API call."""
    mock_async_client = _make_async_client(return_value=mock_anthropic_message)

    with _patched_anthropic_sdk(async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key", effort="medium")
        await client.generate("Test prompt", max_tokens=512)

        call_kwargs = mock_async_client.messages.create.call_args.kwargs
        assert call_kwargs["output_config"] == {"effort": "medium"}


@pytest.mark.anyio
async def test_anthropic_generate_without_effort(mock_anthropic_message: MagicMock) -> None:
    """Test that output_config is not included when effort is None."""
    mock_async_client = _make_async_client(return_value=mock_anthropic_message)

    with _patched_anthropic_sdk(async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key")
        await client.generate("Test prompt", max_tokens=512)

        call_kwargs = mock_async_client.messages.create.call_args.kwargs
        assert "output_config" not in call_kwargs


@pytest.mark.anyio
async def test_anthropic_generate_default_max_tokens(mock_anthropic_message: MagicMock) -> None:
    """Test that AnthropicLLMClient uses default_max_tokens when not specified."""
    mock_async_client = _make_async_client(return_value=mock_anthropic_message)

    with _patched_anthropic_sdk(async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key", default_max_tokens=2048)
        await client.generate("Test prompt")

        call_kwargs = mock_async_client.messages.create.call_args.kwargs
        assert call_kwargs["max_tokens"] == 2048


@pytest.mark.anyio
async def test_anthropic_generate_api_error() -> None:
    """Test AnthropicLLMClient handles API errors."""
    # Create mock anthropic module with exception classes
    mock_module = _make_fake_sdk_module()
    mock_async_client = _make_async_client(
        side_effect=mock_module.APIError("API request failed")
    )

    with _patched_anthropic_sdk(sdk_module=mock_module, async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key")

        with pytest.raises(LLMAPIError, match="API error"):
            await client.generate("Test prompt")


@pytest.mark.anyio
async def test_anthropic_generate_rate_limit_error() -> None:
    """Test AnthropicLLMClient handles rate limit errors."""
    mock_module = _make_fake_sdk_module()
    mock_async_client = _make_async_client(
        side_effect=mock_module.RateLimitError("Rate limit exceeded")
    )

    with _patched_anthropic_sdk(sdk_module=mock_module, async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key")

        with pytest.raises(LLMRateLimitError, match="Rate limit exceeded"):
            await client.generate("Test prompt")


@pytest.mark.anyio
async def test_anthropic_generate_stream_success() -> None:
    """Test successful streaming generation with AnthropicLLMClient."""
    # Create a mock stream context manager
    async def text_stream_generator():
        for chunk in ["This ", "is ", "a ", "streamed ", "response."]:
            yield chunk

    mock_stream = MagicMock()
    mock_stream.text_stream = text_stream_generator()

    mock_async_client = AsyncMock()
    # The stream method is a regular method returning an async context manager
    mock_stream_cm = AsyncMock()
    mock_stream_cm.__aenter__ = AsyncMock(return_value=mock_stream)
    mock_stream_cm.__aexit__ = AsyncMock(return_value=False)
    mock_async_client.messages.stream = MagicMock(return_value=mock_stream_cm)

    # Mock the final message (called after the 'async with' block)
    final_message = MagicMock()
    final_message.usage.input_tokens = 50
    final_message.usage.output_tokens = 100
    mock_stream.get_final_message = AsyncMock(return_value=final_message)

    with _patched_anthropic_sdk(async_client=mock_async_client):
        client = AnthropicLLMClient(api_key="test-key")

        chunks = [
            chunk
            async for chunk in client.generate_stream("Test prompt", max_tokens=512)
        ]

        assert len(chunks) == 5
        assert "".join(chunks) == "This is a streamed response."


# ---------------------------------------------------------------------------
# MultiModelClient Tests
# ---------------------------------------------------------------------------

def test_multi_model_client_initialization() -> None:
    """A MultiModelClient reports exactly the roles it was built with."""
    clients_by_role = {
        "narrator": MockLLMClient(default_response="Narrator response"),
        "arbiter": MockLLMClient(default_response="Arbiter response"),
    }

    router = MultiModelClient(clients_by_role)

    assert router.has_role("narrator")
    assert router.has_role("arbiter")
    assert not router.has_role("unknown")
    assert set(router.list_roles()) == {"narrator", "arbiter"}


def test_multi_model_client_get_client() -> None:
    """``get_client`` hands back the very object registered for a role."""
    narrator = MockLLMClient(default_response="Narrator response")
    arbiter = MockLLMClient(default_response="Arbiter response")
    router = MultiModelClient({"narrator": narrator, "arbiter": arbiter})

    assert router.get_client("narrator") is narrator
    assert router.get_client("arbiter") is arbiter


def test_multi_model_client_unknown_role() -> None:
    """Asking for an unregistered role raises LLMConfigurationError."""
    router = MultiModelClient({"narrator": MockLLMClient()})

    with pytest.raises(
        LLMConfigurationError,
        match="No LLM client configured for role 'unknown'",
    ):
        router.get_client("unknown")


@pytest.mark.anyio
async def test_multi_model_client_routing() -> None:
    """Each role's prompt reaches only that role's underlying client."""
    narrator = MockLLMClient(default_response="Narrator response")
    arbiter = MockLLMClient(default_response="Arbiter response")
    router = MultiModelClient({"narrator": narrator, "arbiter": arbiter})

    # One generation per role, narrator first
    narrator_text = await router.get_client("narrator").generate("Describe a scene")
    arbiter_text = await router.get_client("arbiter").generate("Apply rules")

    assert narrator_text == "Narrator response"
    assert arbiter_text == "Arbiter response"
    assert narrator.call_count == 1
    assert arbiter.call_count == 1


# ---------------------------------------------------------------------------
# Config Integration Tests
# ---------------------------------------------------------------------------

def test_config_per_agent_fields() -> None:
    """A default ClaudmasterConfig exposes the expected per-agent values."""
    defaults = ClaudmasterConfig()

    # Narrator settings
    assert defaults.narrator_model == "claude-haiku-4-5-20251001"
    assert defaults.narrator_max_tokens == 1024
    assert defaults.narrator_temperature == 0.8

    # Arbiter settings
    assert defaults.arbiter_model == "claude-sonnet-4-5-20250929"
    assert defaults.arbiter_max_tokens == 2048
    assert defaults.arbiter_temperature == 0.3


def test_config_per_agent_custom_values() -> None:
    """Per-agent values passed to ClaudmasterConfig are stored unchanged."""
    overrides = {
        "narrator_model": "claude-opus-4-6",
        "arbiter_model": "claude-haiku-4-5-20251001",
        "narrator_max_tokens": 2048,
        "arbiter_max_tokens": 4096,
        "narrator_temperature": 0.9,
        "arbiter_temperature": 0.2,
    }

    custom = ClaudmasterConfig(**overrides)

    for field_name, expected in overrides.items():
        assert getattr(custom, field_name) == expected


def test_config_temperature_validation() -> None:
    """Per-agent temperatures accept 0.0 and 2.0 and reject values outside."""
    # Both ends of the accepted range
    at_limits = ClaudmasterConfig(
        narrator_temperature=0.0,
        arbiter_temperature=2.0,
    )
    assert at_limits.narrator_temperature == 0.0
    assert at_limits.arbiter_temperature == 2.0

    # narrator_temperature above 2.0 is rejected
    with pytest.raises(ValueError):
        ClaudmasterConfig(narrator_temperature=3.0)

    # arbiter_temperature below 0.0 is rejected
    with pytest.raises(ValueError):
        ClaudmasterConfig(arbiter_temperature=-0.1)


def test_config_max_tokens_bounds() -> None:
    """Per-agent max_tokens accept 256 and 16384 and reject values outside."""
    at_limits = ClaudmasterConfig(
        narrator_max_tokens=256,  # Minimum
        arbiter_max_tokens=16384,  # Maximum
    )
    assert at_limits.narrator_max_tokens == 256
    assert at_limits.arbiter_max_tokens == 16384

    # narrator_max_tokens under the minimum is rejected
    with pytest.raises(ValueError):
        ClaudmasterConfig(narrator_max_tokens=100)

    # arbiter_max_tokens over the maximum is rejected
    with pytest.raises(ValueError):
        ClaudmasterConfig(arbiter_max_tokens=20000)


# ---------------------------------------------------------------------------
# Integration Test: Create Clients from Config
# ---------------------------------------------------------------------------

def test_create_multi_model_client_from_config() -> None:
    """Build a config and a two-role MultiModelClient, then check routing."""
    # NOTE(review): the config object is constructed but never read below;
    # the mock clients are not derived from it.
    config = ClaudmasterConfig(
        narrator_model="claude-haiku-4-5-20251001",
        arbiter_model="claude-sonnet-4-5-20250929",
        narrator_temperature=0.8,
        arbiter_temperature=0.3,
        narrator_max_tokens=1024,
        arbiter_max_tokens=2048,
    )

    # Stand-in clients, one per role
    narrator = MockLLMClient(default_response="Narrator response")
    arbiter = MockLLMClient(default_response="Arbiter response")
    router = MultiModelClient({"narrator": narrator, "arbiter": arbiter})

    # Each role resolves to the client registered for it
    assert router.get_client("narrator") is narrator
    assert router.get_client("arbiter") is arbiter

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Polloinfilzato/dm20-protocol'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

test_llm_client.py•21.8 KiB