ChunkHound

Overview Schema Related Servers Score Discussions

chunkhound
tests

test_smoke.py•17.6 KiB

#!/usr/bin/env python3 """ Smoke tests to catch basic import and startup failures. These tests are designed to catch crashes that occur during: 1. Module import time (like type annotation syntax errors) 2. CLI command initialization 3. Basic server startup They run quickly and should be part of every test run. """ import subprocess import importlib import pkgutil import sys import os import asyncio import pytest from pathlib import Path # Import Windows-safe subprocess utilities from tests.utils.windows_subprocess import create_subprocess_exec_safe, get_safe_subprocess_env from tests.utils.windows_compat import windows_safe_tempdir from tests.utils import SubprocessJsonRpcClient # Add parent directory to path to import chunkhound sys.path.insert(0, str(Path(__file__).parent.parent)) import chunkhound class TestModuleImports: """Test that all modules can be imported without errors.""" def test_all_modules_import(self): """Test that all chunkhound modules can be imported.""" failed_imports = [] # Walk through all chunkhound modules for _, module_name, _ in pkgutil.walk_packages( chunkhound.__path__, prefix="chunkhound." ): try: importlib.import_module(module_name) except Exception as e: failed_imports.append((module_name, str(e))) if failed_imports: error_msg = "Failed to import modules:\n" for module, error in failed_imports: error_msg += f" - {module}: {error}\n" pytest.fail(error_msg) def test_critical_imports(self): """Test critical modules that have caused issues before.""" critical_modules = [ "chunkhound.mcp_server.stdio", "chunkhound.api.cli.main", "chunkhound.database", "chunkhound.embeddings", ] for module_name in critical_modules: try: importlib.import_module(module_name) except Exception as e: pytest.fail(f"Failed to import {module_name}: {e}") def test_v3_research_imports(self): """Test v3 parallel research services can be imported.""" from chunkhound.services.research.shared.exploration import ( ExplorationStrategy, BFSExplorationStrategy, WideCoverageStrategy, ParallelExplorationStrategy, ) from chunkhound.services.research.factory import ResearchServiceFactory from chunkhound.services.research.protocol import ResearchServiceProtocol assert ExplorationStrategy is not None assert BFSExplorationStrategy is not None assert WideCoverageStrategy is not None assert ParallelExplorationStrategy is not None assert ResearchServiceFactory is not None assert ResearchServiceProtocol is not None class TestCLICommands: """Test that CLI commands at least show help without crashing.""" @pytest.mark.parametrize( "command", [ ["chunkhound", "--help"], ["chunkhound", "--version"], ["chunkhound", "index", "--help"], ["chunkhound", "search", "--help"], ["chunkhound", "research", "--help"], ["chunkhound", "map", "--help"], ["chunkhound", "mcp", "--help"], ["chunkhound", "calibrate", "--help"], ], ) def test_cli_help_commands(self, command): """Test that CLI help commands work without crashing.""" result = subprocess.run( ["uv", "run"] + command, capture_output=True, text=True, timeout=5 ) # Help commands should exit with 0 assert result.returncode == 0, ( f"Command {' '.join(command)} failed with code {result.returncode}\n" f"stderr: {result.stderr}" ) # Should have some output assert result.stdout or result.stderr, ( f"Command {' '.join(command)} produced no output" ) class TestServerStartup: """Test that servers can at least start without immediate crashes.""" @pytest.mark.asyncio async def test_mcp_stdio_server_help(self): """Test that MCP stdio server responds to help.""" proc = await create_subprocess_exec_safe( "uv", "run", "chunkhound", "mcp", "--stdio", "--help", stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE, env=get_safe_subprocess_env(), ) stdout, stderr = await proc.communicate() assert proc.returncode == 0, ( f"MCP stdio help failed with code {proc.returncode}\n" f"stderr: {stderr.decode()}" ) @pytest.mark.asyncio async def test_mcp_stdio_server_starts(self): """Test that MCP stdio server can start without immediate crashes.""" import tempfile import json # Create a temporary directory to avoid indexing the current directory with tempfile.TemporaryDirectory() as temp_dir: temp_path = Path(temp_dir) # Create minimal config file (required for Config() creation) config_path = temp_path / ".chunkhound.json" db_path = temp_path / ".chunkhound" / "test.db" db_path.parent.mkdir(exist_ok=True) config = { "database": {"path": str(db_path), "provider": "duckdb"}, "indexing": {"include": ["*.py"]} } config_path.write_text(json.dumps(config)) # Test that the server starts without crashing proc = await create_subprocess_exec_safe( "uv", "run", "python", "-c", f''' import sys import os sys.path.insert(0, "{os.getcwd()}") from chunkhound.mcp_server.stdio import main import asyncio async def test(): # Set minimal config os.environ["CHUNKHOUND_EMBEDDING__PROVIDER"] = "openai" os.environ["CHUNKHOUND_EMBEDDING__API_KEY"] = "test" # Test we can import without immediate crash try: # Just test that critical imports work - this catches most startup issues from chunkhound.mcp_server.stdio import StdioMCPServer from chunkhound.core.config.config import Config # Test config creation config = Config() print("SUCCESS: MCP server imports and config creation work") return 0 except Exception as e: print(f"FAILED: {{e}}") return 1 sys.exit(asyncio.run(test())) ''', stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE, cwd=temp_dir, # Run from temp directory that has .chunkhound.json ) try: stdout, stderr = await asyncio.wait_for(proc.communicate(), timeout=10.0) if proc.returncode != 0: pytest.fail( f"MCP stdio server initialization failed with code {proc.returncode}\n" f"stdout: {stdout.decode()}\n" f"stderr: {stderr.decode()}" ) # Check for success message assert "SUCCESS:" in stdout.decode(), f"Expected success message, got: {stdout.decode()}" except asyncio.TimeoutError: proc.kill() await proc.wait() pytest.fail("MCP stdio server test timed out") @pytest.mark.asyncio async def test_mcp_stdio_protocol_handshake(self): """Test MCP stdio server completes full protocol handshake with tool discovery.""" import json with windows_safe_tempdir() as temp_path: # Create minimal test content (server will auto-index on startup) test_file = temp_path / "test.py" test_file.write_text("def hello(): return 'world'") # Create minimal config config_path = temp_path / ".chunkhound.json" db_path = temp_path / ".chunkhound" / "test.db" db_path.parent.mkdir(exist_ok=True) config = { "database": {"path": str(db_path), "provider": "duckdb"}, "indexing": {"include": ["*.py"]} } # Add embedding config if API key available # Note: code_research requires reranker+LLM to EXECUTE, but only embeddings to REGISTER api_key = os.environ.get("OPENAI_API_KEY") if api_key: config["embedding"] = { "provider": "openai", "model": "text-embedding-3-small" } config_path.write_text(json.dumps(config)) # Start MCP server (it will auto-index on startup) mcp_env = get_safe_subprocess_env(os.environ) mcp_env["CHUNKHOUND_MCP_MODE"] = "1" proc = await create_subprocess_exec_safe( "uv", "run", "chunkhound", "mcp", str(temp_path), cwd=str(temp_path), env=mcp_env, stdin=asyncio.subprocess.PIPE, stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE ) client = SubprocessJsonRpcClient(proc) await client.start() try: # 1. Send initialize request init_result = await client.send_request( "initialize", { "protocolVersion": "2024-11-05", "capabilities": {}, "clientInfo": {"name": "test", "version": "1.0"} }, timeout=10.0 ) # Verify response structure assert "serverInfo" in init_result, f"No serverInfo in result: {init_result}" assert init_result["serverInfo"]["name"] == "ChunkHound Code Search" # 2. Send initialized notification await client.send_notification("notifications/initialized") # 3. Request tool list tools_result = await client.send_request("tools/list", timeout=5.0) # Verify tools tools = tools_result.get("tools", []) tool_names = [t["name"] for t in tools] # Should have at least regex search (works without embeddings) assert "search_regex" in tool_names, f"search_regex not in tools: {tool_names}" assert "get_stats" in tool_names, f"get_stats not in tools: {tool_names}" assert "health_check" in tool_names, f"health_check not in tools: {tool_names}" # Semantic search and code_research only if embeddings available if api_key: assert "search_semantic" in tool_names, f"search_semantic not in tools: {tool_names}" assert "code_research" in tool_names, f"code_research not in tools: {tool_names}" except asyncio.TimeoutError: pytest.fail("MCP stdio protocol handshake timed out") finally: await client.close() class TestParserLoading: """Test that all parsers can be loaded and created.""" def test_all_parsers_load(self): """Test that all supported language parsers can be created and initialized.""" from chunkhound.core.types.common import FileId, Language from chunkhound.parsers.parser_factory import get_parser_factory from chunkhound.parsers.universal_engine import SetupError # Minimal valid code samples for smoke testing language_samples = { Language.PYTHON: "def hello(): pass", Language.JAVA: "class Test { }", Language.CSHARP: "class Test { }", Language.TYPESCRIPT: "const x = 1;", Language.JAVASCRIPT: "const x = 1;", Language.TSX: "const x = <div>hello</div>;", Language.JSX: "const x = <div>hello</div>;", Language.GROOVY: "def hello() { }", Language.KOTLIN: "fun hello() { }", Language.GO: "package main\nfunc main() { }", Language.RUST: "fn main() { }", Language.BASH: "echo hello", Language.MAKEFILE: "all:\n\techo hello", Language.C: "int main() { return 0; }", Language.CPP: "int main() { return 0; }", Language.MATLAB: "function result = hello()\nresult = 1;\nend", Language.MARKDOWN: "# Hello\nWorld", Language.JSON: '{"hello": "world"}', Language.YAML: "hello: world", Language.TOML: "hello = 'world'", Language.TEXT: "hello world", Language.PDF: "hello world", Language.SWIFT: "struct Point { let x: Int; let y: Int }", } factory = get_parser_factory() failed_parsers = [] setup_errors = [] # Test all languages except UNKNOWN (not a real parser) for language in Language: if language == Language.UNKNOWN: continue try: parser = factory.create_parser(language) assert parser is not None, f"Parser for {language.value} was None" # Actually test parsing to trigger tree-sitter Language initialization sample_code = language_samples.get(language, "") if sample_code: chunks = parser.parse_content(sample_code, f"test.{language.value}", FileId(1)) assert isinstance(chunks, list), f"Parser for {language.value} didn't return a list" except SetupError as e: # SetupError indicates critical issues like version incompatibility setup_errors.append((language.value, str(e))) except Exception as e: failed_parsers.append((language.value, str(e))) # SetupErrors should cause immediate test failure (critical issues) if setup_errors: error_msg = "CRITICAL: Parser setup failures (version incompatibility or missing dependencies):\n" for language, error in setup_errors: error_msg += f" - {language}: {error}\n" pytest.fail(error_msg) # Other failures are also important but less critical if failed_parsers: error_msg = "Failed to initialize parsers:\n" for language, error in failed_parsers: error_msg += f" - {language}: {error}\n" pytest.fail(error_msg) class TestTypeAnnotations: """Test for specific type annotation patterns that have caused issues.""" def test_no_invalid_forward_reference_unions(self): """Check for problematic forward reference union patterns.""" import ast import glob problematic_files = [] # Find all Python files in chunkhound, excluding test files themselves for py_file in glob.glob("chunkhound/**/*.py", recursive=True): if "/tests/" in py_file.replace("\\", "/"): continue with open(py_file, "r", encoding="utf-8") as f: content = f.read() # Check for the problematic pattern: "ClassName" | None # This is a simple regex check, not a full AST analysis import re pattern = r':\s*"[^"]+"\s*\|\s*None' if re.search(pattern, content): # Found potential issue, let's verify it's not in a string try: tree = ast.parse(content) # This is where we'd do more sophisticated checking # For now, just flag the file problematic_files.append(py_file) except SyntaxError: # If it's a syntax error, our other tests will catch it pass if problematic_files: pytest.fail( f"Found problematic forward reference union patterns in:\n" + "\n".join(f" - {f}" for f in problematic_files) ) class TestConfigurationSmoke: """Test that new configuration parameters don't break imports or config.""" def test_rerank_format_configuration(self): """Verify rerank_format parameter doesn't break imports or config. This test ensures the new TEI reranking format configuration can be instantiated without errors, catching import-time or validation issues. """ from chunkhound.core.config.embedding_config import EmbeddingConfig # Should not raise during import or instantiation with TEI format config_tei = EmbeddingConfig( provider="openai", model="text-embedding-3-small", base_url="http://localhost:8001", rerank_format="tei", ) assert config_tei.rerank_format == "tei" # Should not raise with Cohere format config_cohere = EmbeddingConfig( provider="openai", model="text-embedding-3-small", base_url="http://localhost:8001", rerank_model="rerank-model", rerank_format="cohere", ) assert config_cohere.rerank_format == "cohere" # Should not raise with auto format (default) config_auto = EmbeddingConfig( provider="openai", model="text-embedding-3-small", base_url="http://localhost:8001", ) assert config_auto.rerank_format == "auto" if __name__ == "__main__": # Allow running directly for debugging pytest.main([__file__, "-v"])

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/ofriw/chunkhound'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_smoke.py•17.6 KiB