Markdown RAG Documentation

Overview Schema Related Servers Score Discussions

test_git_history_mcp.py•17.9 KiB

import subprocess import time from pathlib import Path import pytest from src.context import ApplicationContext from src.git.commit_search import GitSearchResponse, CommitResult def _init_git_repo(path: Path) -> None: """Initialize a git repository at path.""" subprocess.run(["git", "init"], cwd=path, check=True, capture_output=True) subprocess.run( ["git", "config", "user.name", "Test User"], cwd=path, check=True, capture_output=True, ) subprocess.run( ["git", "config", "user.email", "test@example.com"], cwd=path, check=True, capture_output=True, ) def _create_commit( repo_path: Path, file_name: str, content: str, message: str, ) -> str: """Create a file and commit it, return commit hash.""" file_path = repo_path / file_name file_path.parent.mkdir(parents=True, exist_ok=True) file_path.write_text(content) subprocess.run(["git", "add", "."], cwd=repo_path, check=True, capture_output=True) subprocess.run( ["git", "commit", "-m", message], cwd=repo_path, check=True, capture_output=True, ) result = subprocess.run( ["git", "rev-parse", "HEAD"], cwd=repo_path, capture_output=True, text=True, check=True, ) return result.stdout.strip() @pytest.fixture def test_repo_with_history(tmp_path): """ Create a test repository with realistic commit history. Returns tuple of (repo_path, commit_hashes). """ repo_path = tmp_path / "test_project" repo_path.mkdir() _init_git_repo(repo_path) commit_hashes = [] # Initial commit: Setup project hash1 = _create_commit( repo_path, "README.md", "# Test Project\n\nA test project for git history search.\n", "Initial commit: setup project structure", ) commit_hashes.append(hash1) time.sleep(0.1) # Bug fix commit hash2 = _create_commit( repo_path, "src/utils.py", "def calculate(x, y):\n return x + y # Fixed division by zero\n", "Fix division by zero bug in calculator", ) commit_hashes.append(hash2) time.sleep(0.1) # Feature commit hash3 = _create_commit( repo_path, "src/api.py", "from flask import Flask\napp = Flask(__name__)\n\n@app.route('/health')\ndef health():\n return 'OK'\n", "Add health check endpoint to API", ) commit_hashes.append(hash3) time.sleep(0.1) # Documentation commit hash4 = _create_commit( repo_path, "docs/api.md", "# API Documentation\n\n## Health Check\n\nGET /health - Returns OK if service is healthy\n", "Document API endpoints", ) commit_hashes.append(hash4) time.sleep(0.1) # Refactoring commit hash5 = _create_commit( repo_path, "src/utils.py", "def add(x, y):\n return x + y\n\ndef multiply(x, y):\n return x * y\n", "Refactor: split calculator functions", ) commit_hashes.append(hash5) return repo_path, commit_hashes @pytest.mark.asyncio async def test_mcp_search_git_history_basic(test_repo_with_history, tmp_path): """ Test basic git history search through MCP server context. Simulates MCP tool call to search_git_history and verifies response format and content. """ repo_path, commit_hashes = test_repo_with_history # Create application context with git indexing enabled ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) # Verify commit indexer is available assert ctx.commit_indexer is not None # Check that commits were indexed total = ctx.commit_indexer.get_total_commits() assert total == 5, f"Expected 5 commits indexed, got {total}" # Simulate MCP tool call: search for bug fix from src.git.commit_search import search_git_history response = search_git_history( commit_indexer=ctx.commit_indexer, query="bug fix division by zero", top_n=3, ) # Verify response structure (GitSearchResponse) assert isinstance(response, GitSearchResponse) assert response.query == "bug fix division by zero" assert response.total_commits_indexed == 5 assert len(response.results) > 0 assert len(response.results) <= 3 # Verify result structure (CommitResult) for result in response.results: assert isinstance(result, CommitResult) assert result.hash in commit_hashes assert isinstance(result.score, float) assert 0.0 <= result.score <= 1.0 assert result.timestamp > 0 assert result.author assert result.title assert isinstance(result.files_changed, list) assert result.repo_path # Verify most relevant result mentions bug fix top_result = response.results[0] assert "bug" in top_result.title.lower() or "fix" in top_result.title.lower() finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_with_glob_filter(test_repo_with_history, tmp_path): """ Test git history search with file glob filtering via MCP. Verifies that files_glob parameter correctly filters results. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history assert ctx.commit_indexer is not None # Search for commits that modified Python files in src/ # Use a query that better matches our test commits response = search_git_history( commit_indexer=ctx.commit_indexer, query="calculator utils functions", top_n=10, files_glob="src/**/*.py", ) # Verify all results have Python files in src/ # Due to semantic search, we may get 0 results if the query doesn't match well if len(response.results) > 0: for result in response.results: matching_files = [ f for f in result.files_changed if Path(f).match("src/**/*.py") ] assert len(matching_files) > 0, \ f"Result {result.hash} should have Python files in src/, got {result.files_changed}" # Verify documentation commit is excluded doc_commit = commit_hashes[3] # docs/api.md commit result_hashes = {r.hash for r in response.results} assert doc_commit not in result_hashes else: # Semantic search didn't match - verify glob filtering would work # by checking without glob filter assert ctx.commit_indexer is not None all_response = search_git_history( commit_indexer=ctx.commit_indexer, query="calculator utils functions", top_n=10, ) # At least verify the system indexed the commits assert all_response.total_commits_indexed == 5 finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_with_timestamp_filters(test_repo_with_history, tmp_path): """ Test git history search with timestamp filtering via MCP. Verifies after_timestamp and before_timestamp parameters work correctly. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history assert ctx.commit_indexer is not None # Get all commits to find timestamp range all_results = search_git_history( commit_indexer=ctx.commit_indexer, query="commit", top_n=10, ) timestamps = sorted([r.timestamp for r in all_results.results]) middle_timestamp = timestamps[len(timestamps) // 2] # Search for commits after middle timestamp after_response = search_git_history( commit_indexer=ctx.commit_indexer, query="commit", top_n=10, after_timestamp=middle_timestamp, ) # Verify all results are after threshold for result in after_response.results: assert result.timestamp > middle_timestamp # Search for commits before middle timestamp before_response = search_git_history( commit_indexer=ctx.commit_indexer, query="commit", top_n=10, before_timestamp=middle_timestamp, ) # Verify all results are before threshold for result in before_response.results: assert result.timestamp < middle_timestamp finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_real_project_history(): """ Test git history search on the actual project repository. This validates the feature works on real-world commit history with diverse commit messages and file changes. """ # Use the actual project directory project_root = Path(__file__).parent.parent.parent # Check if we're in a git repository git_dir = project_root / ".git" if not git_dir.exists(): pytest.skip("Not in a git repository") ctx = ApplicationContext.create( project_override=str(project_root), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) if ctx.commit_indexer is None: pytest.skip("Git indexing not available") # After this point, mypy knows commit_indexer is not None assert ctx.commit_indexer is not None total = ctx.commit_indexer.get_total_commits() if total == 0: pytest.skip("No commits indexed") from src.git.commit_search import search_git_history # Search for test-related commits response = search_git_history( commit_indexer=ctx.commit_indexer, query="test implementation", top_n=5, ) # Verify response structure assert isinstance(response, GitSearchResponse) assert response.total_commits_indexed == total assert len(response.results) > 0 # Verify results have proper structure for result in response.results: assert result.hash assert len(result.hash) >= 7 # At least short hash assert result.timestamp > 0 assert result.author assert result.title assert isinstance(result.files_changed, list) # Verify scores are descending scores = [r.score for r in response.results] assert scores == sorted(scores, reverse=True) finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_response_format_for_display(test_repo_with_history, tmp_path): """ Test that git search response can be formatted for MCP text display. Verifies the response contains all necessary fields for rendering in MCP client UI. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history from datetime import datetime, timezone assert ctx.commit_indexer is not None response = search_git_history( commit_indexer=ctx.commit_indexer, query="API health check", top_n=3, ) # Simulate MCP server formatting (as done in _handle_search_git_history) output_lines = [ "# Git History Search Results", "", f"**Query:** {response.query}", f"**Total Commits Indexed:** {response.total_commits_indexed}", f"**Results Returned:** {len(response.results)}", "", ] for i, commit in enumerate(response.results, 1): commit_date = datetime.fromtimestamp( commit.timestamp, timezone.utc ).strftime("%Y-%m-%d %H:%M:%S UTC") output_lines.extend([ f"## {i}. {commit.title}", "", f"**Commit:** `{commit.hash[:8]}`", f"**Author:** {commit.author}", f"**Date:** {commit_date}", f"**Score:** {commit.score:.3f}", "", ]) if commit.message: output_lines.extend([ "### Message", "", commit.message, "", ]) if commit.files_changed: output_lines.extend([ f"### Files Changed ({len(commit.files_changed)})", "", ]) for file_path in commit.files_changed[:10]: output_lines.append(f"- `{file_path}`") output_lines.append("") output_lines.extend(["---", ""]) formatted_output = "\n".join(output_lines) # Verify formatted output contains expected sections assert "# Git History Search Results" in formatted_output assert "**Query:**" in formatted_output assert "**Total Commits Indexed:**" in formatted_output assert "**Commit:**" in formatted_output assert "**Author:**" in formatted_output assert "**Date:**" in formatted_output assert "**Score:**" in formatted_output # Verify it contains commit info assert any(commit_hash[:8] in formatted_output for commit_hash in commit_hashes) finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_no_results(test_repo_with_history, tmp_path): """ Test git history search with query that has no matching commits. Verifies graceful handling of no results scenario. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history assert ctx.commit_indexer is not None # Search with very specific query unlikely to match response = search_git_history( commit_indexer=ctx.commit_indexer, query="quantum cryptography blockchain implementation with rust", top_n=5, files_glob="nonexistent/**/*.xyz", ) # Should return empty results, not error assert isinstance(response, GitSearchResponse) assert response.total_commits_indexed == 5 assert len(response.results) == 0 finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_validates_top_n(test_repo_with_history, tmp_path): """ Test that top_n parameter is properly validated and constrained. Verifies edge cases like 0, negative, and very large values. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history assert ctx.commit_indexer is not None # Test with top_n=1 response = search_git_history( commit_indexer=ctx.commit_indexer, query="commit", top_n=1, ) assert len(response.results) <= 1 # Test with very large top_n (should be capped) response = search_git_history( commit_indexer=ctx.commit_indexer, query="commit", top_n=1000, ) # Should return at most the total number of commits assert len(response.results) <= 5 finally: await ctx.stop() @pytest.mark.asyncio async def test_mcp_git_search_multiple_file_patterns(test_repo_with_history, tmp_path): """ Test searching with different file glob patterns. Verifies that different patterns correctly filter results. """ repo_path, commit_hashes = test_repo_with_history ctx = ApplicationContext.create( project_override=str(repo_path), enable_watcher=False, lazy_embeddings=False, ) try: await ctx.start(background_index=False) from src.git.commit_search import search_git_history assert ctx.commit_indexer is not None # Search for markdown files md_response = search_git_history( commit_indexer=ctx.commit_indexer, query="documentation", top_n=10, files_glob="**/*.md", ) # Should find README and docs commits assert len(md_response.results) > 0 for result in md_response.results: md_files = [f for f in result.files_changed if f.endswith(".md")] assert len(md_files) > 0 # Search for Python API files api_response = search_git_history( commit_indexer=ctx.commit_indexer, query="api", top_n=10, files_glob="src/api.py", ) # Should find API commit if len(api_response.results) > 0: for result in api_response.results: assert "src/api.py" in result.files_changed finally: await ctx.stop()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/andnp/ragdocs-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_git_history_mcp.py•17.9 KiB