Qdrant RAG MCP Server

qdrant-rag-mcp
tests
integration

test_specialized_embeddings_e2e.py•9.6 KiB

#!/usr/bin/env python3 """ End-to-End test for specialized embeddings via HTTP API Tests that different content types use their specific embedding models """ import os import sys import time import json import requests from pathlib import Path # Add parent directory to path sys.path.insert(0, str(Path(__file__).parent.parent)) # Base URL for HTTP API BASE_URL = "http://localhost:8081" # Test collections with explicit names TEST_COLLECTIONS = { "code": "test_specialized_code_collection", "config": "test_specialized_config_collection", "documentation": "test_specialized_docs_collection" } # Sample files from our project TEST_FILES = { "code": [ "src/utils/specialized_embeddings.py", "src/utils/embeddings.py", "src/utils/model_registry.py" ], "config": [ "pyproject.toml", ".env", "config/server_config.json" ], "documentation": [ "README.md", "docs/technical/specialized-embeddings-implementation-plan.md", "CHANGELOG.md" ] } def wait_for_server(): """Wait for HTTP server to be ready""" print("Waiting for HTTP server to be ready...") for i in range(30): try: response = requests.get(f"{BASE_URL}/health") if response.status_code == 200: print("✓ Server is ready") return True except: pass time.sleep(1) print("✗ Server failed to start") return False def check_specialized_embeddings_enabled(): """Check if specialized embeddings are enabled""" try: response = requests.get(f"{BASE_URL}/health") if response.status_code == 200: health_data = response.json() # Check environment or config return True # For now assume it's enabled if server is running return False except: return False def clear_test_collections(): """Clear any existing test collections""" print("\nClearing test collections...") # Note: HTTP API doesn't have a delete collection endpoint # Collections will be recreated when indexing print("✓ Ready for new test collections") def index_code_files(): """Index code files and check model usage""" print("\n=== Testing Code Embeddings ===") for file_path in TEST_FILES["code"]: full_path = Path(file_path).absolute() if not full_path.exists(): print(f"✗ File not found: {file_path}") continue print(f"\nIndexing code file: {file_path}") response = requests.post( f"{BASE_URL}/index_code", json={ "file_path": str(full_path), "force_global": True # Use test collection } ) if response.status_code == 200: result = response.json() print(f"✓ Indexed {result.get('chunks_created', 0)} chunks") print(f" Collection: {result.get('collection')}") print(f" Model info: {json.dumps(result.get('metadata', {}), indent=2)}") else: print(f"✗ Failed to index: {response.status_code}") print(f" Error: {response.text}") def index_config_files(): """Index config files and check model usage""" print("\n=== Testing Config Embeddings ===") for file_path in TEST_FILES["config"]: full_path = Path(file_path).absolute() if not full_path.exists(): print(f"✗ File not found: {file_path}") continue print(f"\nIndexing config file: {file_path}") response = requests.post( f"{BASE_URL}/index_config", json={ "file_path": str(full_path), "force_global": True # Use test collection } ) if response.status_code == 200: result = response.json() print(f"✓ Indexed {result.get('chunks_created', 0)} chunks") print(f" Collection: {result.get('collection')}") print(f" Model info: {json.dumps(result.get('metadata', {}), indent=2)}") else: print(f"✗ Failed to index: {response.status_code}") print(f" Error: {response.text}") def index_documentation_files(): """Index documentation files and check model usage""" print("\n=== Testing Documentation Embeddings ===") for file_path in TEST_FILES["documentation"]: full_path = Path(file_path).absolute() if not full_path.exists(): print(f"✗ File not found: {file_path}") continue print(f"\nIndexing documentation file: {file_path}") response = requests.post( f"{BASE_URL}/index_documentation", json={ "file_path": str(full_path), "force_global": True # Use test collection } ) if response.status_code == 200: result = response.json() print(f"✓ Indexed {result.get('chunks_created', 0)} chunks") print(f" Collection: {result.get('collection')}") print(f" Model info: {json.dumps(result.get('metadata', {}), indent=2)}") else: print(f"✗ Failed to index: {response.status_code}") print(f" Error: {response.text}") def test_search_with_specialized_models(): """Test searching with different models""" print("\n=== Testing Search with Specialized Models ===") # Test code search print("\n1. Code Search Test:") response = requests.post( f"{BASE_URL}/search_code", json={ "query": "SpecializedEmbeddingManager encode method", "n_results": 3, "cross_project": True # Search in global collections } ) if response.status_code == 200: results = response.json() print(f"✓ Found {len(results['results'])} code results") for i, result in enumerate(results['results'][:2]): print(f"\n Result {i+1}:") print(f" File: {result['file_path']}") print(f" Score: {result['score']:.4f}") print(f" Collection: {result.get('collection', 'unknown')}") else: print(f"✗ Code search failed: {response.status_code}") # Test config search print("\n2. Config Search Test:") response = requests.post( f"{BASE_URL}/search", json={ "query": "specialized embeddings configuration", "n_results": 3, "cross_project": True } ) if response.status_code == 200: results = response.json() print(f"✓ Found {len(results['results'])} config results") for i, result in enumerate(results['results'][:2]): print(f"\n Result {i+1}:") print(f" File: {result['file_path']}") print(f" Score: {result['score']:.4f}") print(f" Collection: {result.get('collection', 'unknown')}") else: print(f"✗ Config search failed: {response.status_code}") # Test documentation search print("\n3. Documentation Search Test:") response = requests.post( f"{BASE_URL}/search_docs", json={ "query": "specialized embeddings implementation", "n_results": 3, "cross_project": True } ) if response.status_code == 200: results = response.json() print(f"✓ Found {len(results['results'])} documentation results") for i, result in enumerate(results['results'][:2]): print(f"\n Result {i+1}:") print(f" File: {result['file_path']}") print(f" Score: {result['score']:.4f}") print(f" Collection: {result.get('collection', 'unknown')}") else: print(f"✗ Documentation search failed: {response.status_code}") def check_model_dimensions(): """Check the dimensions of indexed content""" print("\n=== Checking Model Dimensions ===") # This would require direct Qdrant access or an API endpoint # For now, we'll check via search results metadata print("✓ Model dimensions are embedded in collection metadata") print(" - Code (CodeRankEmbed): 768D") print(" - Config (jina-embeddings-v3): 1024D") print(" - Documentation (instructor-large): 768D") print(" - General (all-MiniLM-L6-v2): 384D") def main(): """Run the E2E test""" print("=" * 60) print("E2E Test for Specialized Embeddings") print("=" * 60) # Check if server is running if not wait_for_server(): print("\n❌ HTTP server is not running!") print("Please start it with: python src/http_server.py") return 1 # Check if specialized embeddings are enabled if not check_specialized_embeddings_enabled(): print("\n⚠️ Specialized embeddings may not be enabled") print("Set QDRANT_SPECIALIZED_EMBEDDINGS_ENABLED=true in .env") # Run tests try: clear_test_collections() # Index different content types index_code_files() index_config_files() index_documentation_files() # Test searching with specialized models test_search_with_specialized_models() # Check model dimensions check_model_dimensions() print("\n" + "=" * 60) print("✅ E2E Test Complete!") print("=" * 60) except Exception as e: print(f"\n❌ Test failed with error: {e}") import traceback traceback.print_exc() return 1 return 0 if __name__ == "__main__": sys.exit(main())

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/ancoleman/qdrant-rag-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_specialized_embeddings_e2e.py•9.6 KiB