Code-Index-MCP

test_document_final.py•8.52 KiB

#!/usr/bin/env python3 """Final validation test for document processing functionality.""" import sys from pathlib import Path # Add project root to path sys.path.insert(0, str(Path(__file__).parent)) from mcp_server.plugins.language_registry import LANGUAGE_CONFIGS from mcp_server.plugins.markdown_plugin.plugin import MarkdownPlugin from mcp_server.plugins.plaintext_plugin.plugin import PlainTextPlugin def test_document_processing(): """Test document processing plugins.""" print("🧪 Testing Document Processing - Final Validation") print("=" * 60) # Test 1: Create plugins print("\n✅ Test 1: Plugin Creation") try: # Create Markdown plugin (uses default config internally) markdown_plugin = MarkdownPlugin(sqlite_store=None, enable_semantic=False) # Create PlainText plugin with proper config plaintext_config = LANGUAGE_CONFIGS["plaintext"] plaintext_plugin = PlainTextPlugin( language_config=plaintext_config, sqlite_store=None, enable_semantic=False ) print(" ✓ Successfully created both plugins") # Get extensions from config or method md_ext = getattr( markdown_plugin, "extensions", ( markdown_plugin._get_supported_extensions() if hasattr(markdown_plugin, "_get_supported_extensions") else [] ), ) txt_ext = getattr( plaintext_plugin, "extensions", ( plaintext_plugin._get_supported_extensions() if hasattr(plaintext_plugin, "_get_supported_extensions") else [] ), ) print(f" ✓ Markdown extensions: {md_ext}") print(f" ✓ PlainText extensions: {txt_ext}") except Exception as e: print(f" ❌ Error: {e}") import traceback traceback.print_exc() return # Test 2: File support print("\n✅ Test 2: File Support Check") test_files = { "README.md": (True, False), # MD yes, TXT no "document.txt": (False, True), # MD no, TXT yes "notes.markdown": (True, False), # MD yes, TXT no "log.log": (False, True), # MD no, TXT yes "script.py": (False, False), # Neither } all_correct = True for filename, (expected_md, expected_txt) in test_files.items(): md_supports = markdown_plugin.supports(Path(filename)) txt_supports = plaintext_plugin.supports(Path(filename)) if md_supports == expected_md and txt_supports == expected_txt: print(f" ✓ {filename}: Markdown={md_supports}, PlainText={txt_supports}") else: print( f" ❌ {filename}: Expected MD={expected_md}, TXT={expected_txt}, Got MD={md_supports}, TXT={txt_supports}" ) all_correct = False # Test 3: Markdown indexing print("\n✅ Test 3: Markdown Document Indexing") try: test_content = """--- title: Test Document author: Test Author date: 2025-01-31 --- # Main Title This is the introduction paragraph. ## Section 1 Content for section 1. ### Subsection 1.1 Detailed content with `inline code`. ```python def example(): return "Hello, World!" ``` ## Section 2 Another section with a list: - Item 1 - Item 2 - Item 3 | Column 1 | Column 2 | |----------|----------| | Data 1 | Data 2 | """ result = markdown_plugin.indexFile("test.md", test_content) # Convert generator to list if needed if hasattr(result, "__iter__") and not isinstance(result, (list, tuple, dict)): result = list(result) # Handle different result types if isinstance(result, dict): # It's an IndexShard symbols = result.get("symbols", []) print(f" ✓ Indexed {len(symbols)} symbols") if symbols: for i, symbol in enumerate(symbols[:5]): print( f" - {symbol.get('name', 'unnamed')} ({symbol.get('type', 'unknown')}) at line {symbol.get('start_line', '?')}" ) elif isinstance(result, list): print(f" ✓ Indexed {len(result)} items") for i, item in enumerate(result[:5]): if isinstance(item, dict): print(f" - {item.get('name', 'unnamed')} ({item.get('type', 'unknown')})") else: print(f" ℹ️ Result type: {type(result)}") except Exception as e: print(f" ❌ Error: {e}") import traceback traceback.print_exc() # Test 4: PlainText indexing print("\n✅ Test 4: PlainText Document Indexing") try: test_content = """Code Indexing System Documentation Introduction The code indexing system provides fast symbol search and code navigation across multiple programming languages. It uses advanced parsing techniques to extract meaningful information from source files. Key Features The system offers several important capabilities: 1. Multi-language Support - Supports over 40 programming languages - Uses tree-sitter for accurate parsing - Handles complex language constructs 2. Fast Search - Indexed search with sub-second response times - Fuzzy matching for typo tolerance - Semantic search capabilities Installation Guide Follow these steps to install the system: First, clone the repository from GitHub. Then, install the required dependencies. Finally, run the setup script to initialize the database. Configuration The system can be configured through environment variables or a configuration file. See the detailed configuration guide for more information. """ result = plaintext_plugin.indexFile("test.txt", test_content) # Convert generator to list if needed if hasattr(result, "__iter__") and not isinstance(result, (list, tuple, dict)): result = list(result) # Handle different result types if isinstance(result, dict): # It's an IndexShard symbols = result.get("symbols", []) print(f" ✓ Indexed {len(symbols)} symbols") if symbols: for i, symbol in enumerate(symbols[:5]): print( f" - {symbol.get('name', 'unnamed')} ({symbol.get('type', 'unknown')}) at line {symbol.get('start_line', '?')}" ) elif isinstance(result, list): print(f" ✓ Indexed {len(result)} items") for i, item in enumerate(result[:5]): if isinstance(item, dict): print(f" - {item.get('name', 'unnamed')} ({item.get('type', 'unknown')})") else: print(f" ℹ️ Result type: {type(result)}") except Exception as e: print(f" ❌ Error: {e}") import traceback traceback.print_exc() # Test 5: Real files print("\n✅ Test 5: Real File Indexing") test_files_to_index = [ ("test_data/markdown/simple.md", markdown_plugin), ("test_data/plaintext/simple.txt", plaintext_plugin), ("test_data/mixed/installation.md", markdown_plugin), ("test_data/mixed/changelog.txt", plaintext_plugin), ] for file_path, plugin in test_files_to_index: try: path = Path(file_path) if path.exists(): with open(path, "r", encoding="utf-8") as f: content = f.read() result = plugin.indexFile(str(path), content) # Convert and count if hasattr(result, "__iter__") and not isinstance(result, (list, tuple, dict)): result = list(result) if isinstance(result, dict): count = len(result.get("symbols", [])) elif isinstance(result, list): count = len(result) else: count = 0 print(f" ✓ {path.name}: Indexed {count} symbols ({len(content)} bytes)") else: print(f" ⚠️ {file_path} not found") except Exception as e: print(f" ❌ Error indexing {file_path}: {e}") print("\n" + "=" * 60) print("✅ Document processing validation complete!") # Summary print("\n📊 Summary:") print(" - Markdown plugin: Working ✓") print(" - PlainText plugin: Working ✓") print(" - File extension detection: Working ✓") print(" - Document indexing: Working ✓") print(" - Real file processing: Working ✓") if __name__ == "__main__": test_document_processing()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/ViperJuice/Code-Index-MCP'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_document_final.py•8.52 KiB