"""Tests for tiny LLM implementation."""
import asyncio
import time
import pytest
from src.tiny_llm import TinyLLM, TinyLLMClient, TinyLLMResponse
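
# NOTE: the async tests in this module rely on the pytest-asyncio plugin,
# which provides the @pytest.mark.asyncio marker used below.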


class TestTinyLLM:
    """Test the TinyLLM class."""

    @pytest.fixture
    def tiny_llm(self):
        """Create TinyLLM instance for testing."""
        return TinyLLM(
            model_name="test-tiny-llm",
            base_delay=0.1,  # Fast for testing
            max_delay=0.2,
            token_per_char=0.25,
        )

    @pytest.mark.asyncio
    async def test_generate_response_basic(self, tiny_llm):
        """Test basic response generation."""
        response = await tiny_llm.generate_response(
            prompt="Show me all servers", tools=None, max_tokens=50
        )
        assert isinstance(response, TinyLLMResponse)
        assert response.content is not None
        assert len(response.content) > 0
        assert response.tokens_used > 0
        assert response.processing_time > 0
        assert response.model_name == "test-tiny-llm"
        assert 0.0 <= response.confidence <= 1.0

    @pytest.mark.asyncio
    async def test_generate_response_with_tools(self, tiny_llm):
        """Test response generation with tools."""
        tools = [
            {"name": "list_hosts", "category": "hosts"},
            {"name": "get_host", "category": "hosts"},
        ]
        response = await tiny_llm.generate_response(
            prompt="Show me all web servers", tools=tools, max_tokens=100
        )
        assert isinstance(response, TinyLLMResponse)
        assert (
            "host" in response.content.lower()
            or "server" in response.content.lower()
        )
        assert response.tokens_used > 0
        assert response.confidence > 0.5

    @pytest.mark.asyncio
    async def test_response_delay_simulation(self, tiny_llm):
        """Test that response delay is simulated correctly."""
        start_time = time.time()
        await tiny_llm.generate_response(
            prompt="Test query", tools=None, max_tokens=50
        )
        end_time = time.time()
        actual_delay = end_time - start_time
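
        # Wall-clock time includes event-loop scheduling and bookkeeping overhead
        # on top of the simulated delay, so the upper bound allows a small margin.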
        # Should have some delay (at least about half of base_delay)
        assert (
            actual_delay >= tiny_llm.base_delay * 0.5
        )  # Allow for some variation
        assert actual_delay <= tiny_llm.max_delay + 0.1

    def test_calculate_delay(self, tiny_llm):
        """Test delay calculation."""
        # Test with short prompt
        short_delay = tiny_llm._calculate_delay("short", [])
        assert (
            tiny_llm.base_delay * 0.5 <= short_delay <= tiny_llm.max_delay
        )  # Allow for random variation
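
        # The comparisons below assume the short-prompt delay has not already
        # been clamped to max_delay by the random variation.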
        # Test with long prompt
        long_prompt = "x" * 2000
        long_delay = tiny_llm._calculate_delay(long_prompt, [])
        assert long_delay > short_delay
        # Test with tools
        tools = [{"name": "tool1"}, {"name": "tool2"}, {"name": "tool3"}]
        tool_delay = tiny_llm._calculate_delay("test", tools)
        assert tool_delay > short_delay

    def test_classify_query(self, tiny_llm):
        """Test query classification."""
        assert tiny_llm._classify_query("Show me all servers") == "hosts"
        assert (
            tiny_llm._classify_query("List virtual machines") == "vms"
            or tiny_llm._classify_query("List virtual machines") == "hosts"
        )  # May classify as hosts due to "machines"
        assert tiny_llm._classify_query("Find IP addresses") == "ips"
        assert tiny_llm._classify_query("Show VLANs") == "vlans"
        assert tiny_llm._classify_query("Search for something") == "search"
        assert tiny_llm._classify_query("Random query") == "default"

    def test_calculate_confidence(self, tiny_llm):
        """Test confidence calculation."""
        # Test basic confidence
        confidence = tiny_llm._calculate_confidence("test", [])
        assert 0.0 <= confidence <= 1.0
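
        # The monotonicity checks below assume the baseline confidence for a
        # short, tool-free prompt is not already saturated at 1.0.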
        # Test with longer prompt
        long_prompt = "x" * 1000
        long_confidence = tiny_llm._calculate_confidence(long_prompt, [])
        assert long_confidence > confidence
        # Test with tools
        tools = [{"name": "tool1"}]
        tool_confidence = tiny_llm._calculate_confidence("test", tools)
        assert tool_confidence > confidence

    @pytest.mark.asyncio
    async def test_generate_tool_calls(self, tiny_llm):
        """Test tool call generation."""
        tools = [
            {"name": "list_hosts", "category": "hosts"},
            {"name": "list_vms", "category": "vms"},
            {"name": "list_ips", "category": "ips"},
        ]
        tool_calls = await tiny_llm.generate_tool_calls(
            "Show me all servers", tools
        )
        assert isinstance(tool_calls, list)
        assert len(tool_calls) > 0
        assert len(tool_calls) <= 3  # Max 3 tools
        for tool_call in tool_calls:
            assert "tool_name" in tool_call
            assert "parameters" in tool_call
            assert "reasoning" in tool_call

    def test_generate_content(self, tiny_llm):
        """Test content generation."""
        content = tiny_llm._generate_content("Show me all servers", [])
        assert isinstance(content, str)
        assert len(content) > 0
        assert "host" in content.lower() or "server" in content.lower()

    def test_response_templates(self, tiny_llm):
        """Test response templates."""
        # Test that all query types have templates
        for query_type in [
            "hosts",
            "vms",
            "ips",
            "vlans",
            "search",
            "default",
        ]:
            assert query_type in tiny_llm.response_templates
            assert len(tiny_llm.response_templates[query_type]) > 0
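

# The client tests below assume TinyLLMClient returns an OpenAI-style
# chat-completion response shape (id / object / choices / usage), which is
# what the assertions that follow exercise.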


class TestTinyLLMClient:
    """Test the TinyLLMClient class."""

    @pytest.fixture
    def client(self):
        """Create TinyLLMClient instance for testing."""
        return TinyLLMClient("test-client")

    @pytest.mark.asyncio
    async def test_chat_completion_basic(self, client):
        """Test basic chat completion."""
        messages = [{"role": "user", "content": "Hello, world!"}]
        response = await client.chat_completion(
            messages=messages, tools=None, max_tokens=50
        )
        assert isinstance(response, dict)
        assert "id" in response
        assert "object" in response
        assert "choices" in response
        assert "usage" in response
        # Check response structure
        assert response["object"] == "chat.completion"
        assert len(response["choices"]) == 1
        assert response["choices"][0]["message"]["role"] == "assistant"
        assert "content" in response["choices"][0]["message"]

    @pytest.mark.asyncio
    async def test_chat_completion_with_tools(self, client):
        """Test chat completion with tools."""
        messages = [{"role": "user", "content": "Show me all servers"}]
        tools = [
            {"name": "list_hosts", "category": "hosts"},
            {"name": "get_host", "category": "hosts"},
        ]
        response = await client.chat_completion(
            messages=messages, tools=tools, max_tokens=100
        )
        assert isinstance(response, dict)
        assert "tool_calls" in response["choices"][0]["message"]
        assert len(response["choices"][0]["message"]["tool_calls"]) > 0

    @pytest.mark.asyncio
    async def test_function_calling(self, client):
        """Test function calling."""
        prompt = "Show me all servers"
        functions = [
            {"name": "list_hosts", "description": "List all hosts"},
            {"name": "get_host", "description": "Get specific host"},
        ]
        response = await client.function_calling(prompt, functions)
        assert isinstance(response, dict)
        assert "function_calls" in response
        assert "reasoning" in response
        assert "confidence" in response
        assert (
            len(response["function_calls"]) >= 0
        )  # May be empty due to random selection

    @pytest.mark.asyncio
    async def test_response_time_measurement(self, client):
        """Test that response time is measured correctly."""
        messages = [{"role": "user", "content": "Test query"}]
        start_time = time.time()
        response = await client.chat_completion(messages, max_tokens=50)
        end_time = time.time()
        actual_time = end_time - start_time
        reported_time = response.get("response_time", 0)
        # Reported time should be positive and within the measured wall-clock time
        assert 0 < reported_time < actual_time + 0.1

    @pytest.mark.asyncio
    async def test_token_counting(self, client):
        """Test token counting accuracy."""
        messages = [
            {
                "role": "user",
                "content": "This is a test message with multiple words",
            }
        ]
        response = await client.chat_completion(messages, max_tokens=100)
        usage = response["usage"]
        assert usage["prompt_tokens"] > 0
        assert usage["completion_tokens"] > 0
        assert (
            usage["total_tokens"]
            == usage["prompt_tokens"] + usage["completion_tokens"]
        )

    @pytest.mark.asyncio
    async def test_confidence_scoring(self, client):
        """Test confidence scoring."""
        messages = [{"role": "user", "content": "Simple query"}]
        response = await client.chat_completion(messages, max_tokens=50)
        assert "confidence" in response
        assert 0.0 <= response["confidence"] <= 1.0

    def test_error_handling(self, client):
        """Test error handling."""
        # This test is synchronous, so it drives the async API with asyncio.run()
        # instead of the pytest-asyncio marker used elsewhere in this module.
        # Test with empty messages
        with pytest.raises(ValueError):
            asyncio.run(client.chat_completion([], max_tokens=50))
        # Test with no user message
        with pytest.raises(ValueError):
            asyncio.run(
                client.chat_completion(
                    [{"role": "assistant", "content": "test"}], max_tokens=50
                )
            )
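

# The integration tests below assume src.structured_protocol provides
# StructuredProtocol and ProtocolOptimizer with the interfaces exercised here.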


class TestTinyLLMIntegration:
    """Integration tests for tiny LLM with MCP server."""

    @pytest.mark.asyncio
    async def test_end_to_end_workflow(self):
        """Test complete workflow with tiny LLM."""
        from src.structured_protocol import (
            ProtocolOptimizer,
            StructuredProtocol,
        )

        protocol = StructuredProtocol()
        optimizer = ProtocolOptimizer()
        client = TinyLLMClient("integration-test")
        # Create query
        query = protocol.create_query(
            user_id="test_user",
            query="Show me all web servers",
            context={"test": True},
        )
        # Router decision
        decision = optimizer.optimize_router_decision(query)
        # LLM request
        llm_request = optimizer.optimize_llm_request(query, decision)
        # Chat completion
        messages = [{"role": "user", "content": query.query}]
        response = await client.chat_completion(
            messages=messages,
            tools=llm_request.tools_available,
            max_tokens=llm_request.max_tokens,
        )
        # Verify response
        assert response["choices"][0]["message"]["role"] == "assistant"
        assert len(response["choices"][0]["message"]["content"]) > 0
        assert response["usage"]["total_tokens"] > 0

    @pytest.mark.asyncio
    async def test_performance_characteristics(self):
        """Test performance characteristics of tiny LLM."""
        client = TinyLLMClient("performance-test")
        # Test multiple requests
        start_time = time.time()
        tasks = []
        for i in range(5):
            messages = [{"role": "user", "content": f"Test query {i}"}]
            task = client.chat_completion(messages, max_tokens=50)
            tasks.append(task)
        responses = await asyncio.gather(*tasks)
        total_time = time.time() - start_time
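
        # The five requests run concurrently via asyncio.gather, so total_time is
        # roughly the latency of the slowest single request, not the sum of five.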

        # Verify all responses
        assert len(responses) == 5
        for response in responses:
            assert response["choices"][0]["message"]["role"] == "assistant"
        # Average latency should reflect the simulated delay without being excessive
        avg_time = total_time / 5
        assert 0.1 < avg_time < 2.0
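

# The edge-case tests below document the mock's current permissive behavior
# (no input validation) rather than a required contract.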


class TestTinyLLMEdgeCases:
    """Test edge cases for tiny LLM."""

    @pytest.fixture
    def tiny_llm(self):
        """Create TinyLLM instance for edge case testing."""
        return TinyLLM(
            model_name="edge-test-llm",
            base_delay=0.01,  # Very fast for edge case testing
            max_delay=0.02,
            token_per_char=0.25,
        )

    @pytest.mark.asyncio
    async def test_empty_prompt(self, tiny_llm):
        """Test with empty prompt."""
        response = await tiny_llm.generate_response(
            "", tools=None, max_tokens=10
        )
        assert isinstance(response, TinyLLMResponse)
        assert response.content is not None
        assert response.tokens_used >= 0

    @pytest.mark.asyncio
    async def test_very_long_prompt(self, tiny_llm):
        """Test with very long prompt."""
        long_prompt = "x" * 10000
        response = await tiny_llm.generate_response(
            long_prompt, tools=None, max_tokens=100
        )
        assert isinstance(response, TinyLLMResponse)
        assert response.content is not None
        assert response.tokens_used > 0

    @pytest.mark.asyncio
    async def test_many_tools(self, tiny_llm):
        """Test with many tools."""
        many_tools = [
            {"name": f"tool_{i}", "category": "test"} for i in range(20)
        ]
        response = await tiny_llm.generate_response(
            "Test query", tools=many_tools, max_tokens=100
        )
        assert isinstance(response, TinyLLMResponse)
        assert response.content is not None

    @pytest.mark.asyncio
    async def test_zero_max_tokens(self, tiny_llm):
        """Test with zero max tokens."""
        response = await tiny_llm.generate_response(
            "Test query", tools=None, max_tokens=0
        )
        assert isinstance(response, TinyLLMResponse)
        assert response.tokens_used >= 0

    def test_negative_delay_values(self):
        """Test with negative delay values."""
        # TinyLLM doesn't validate input, so these won't raise errors.
        # This is acceptable for a testing mock.
        llm1 = TinyLLM(base_delay=-1.0)
        assert llm1.base_delay == -1.0

        llm2 = TinyLLM(max_delay=-1.0)
        assert llm2.max_delay == -1.0

        llm3 = TinyLLM(base_delay=2.0, max_delay=1.0)
        assert llm3.base_delay == 2.0
        assert llm3.max_delay == 1.0