M.I.M.I.R - Multi-agent Intelligent Memory & Insight Repository

Overview Schema Related Servers Score Discussions

Mimir
src
tools

vectorSearch.tools.ts•11.6 KiB

/** * @file src/tools/vectorSearch.tools.ts * @description Vector search MCP tools for semantic file search * Now uses UnifiedSearchService for automatic fallback to full-text search */ import { Tool } from '@modelcontextprotocol/sdk/types.js'; import { Driver } from 'neo4j-driver'; import { UnifiedSearchService } from '../managers/UnifiedSearchService.js'; export function createVectorSearchTools(driver: Driver): Tool[] { return [ // ======================================================================== // vector_search_nodes // ======================================================================== { name: 'vector_search_nodes', description: 'Semantic search across all nodes using vector embeddings (with automatic fallback to full-text search). Returns nodes most similar to the query by MEANING (not exact text match). If embeddings are disabled or no results found, automatically falls back to keyword search. For files, searches individual chunks and returns parent file context. Use this to find related concepts, similar problems, or relevant context when you don\'t know exact keywords. Works with todos, memories, file chunks, and all other node types. Supports multi-hop graph traversal via depth parameter.', inputSchema: { type: 'object', properties: { query: { type: 'string', description: 'Natural language search query (e.g., "authentication code", "database connections", "pending tasks")' }, types: { type: 'array', items: { type: 'string' }, description: 'Optional: Filter by node types (e.g., ["todo", "memory", "file", "file_chunk"]). If not provided, searches all types.' }, limit: { type: 'number', description: 'Maximum number of results to return (default: 10)', default: 10 }, min_similarity: { type: 'number', description: 'Minimum cosine similarity threshold 0-1 (default: 0.75)', default: 0.75 }, depth: { type: 'number', description: 'Graph traversal depth for multi-hop search (1-3). At depth 1 (default), returns only direct matches. At depth 2+, also fetches connected nodes via relationships. Higher depth = wider context but more results.', default: 1, minimum: 1, maximum: 3 } }, required: ['query'] } }, // ======================================================================== // get_embedding_stats // ======================================================================== { name: 'get_embedding_stats', description: 'Get statistics about nodes with embeddings, broken down by type', inputSchema: { type: 'object', properties: {}, required: [] } }, ]; } /** * Handle vector_search_nodes tool call - Semantic search across all nodes * * @description Performs semantic search using vector embeddings to find nodes * by meaning rather than exact keywords. Automatically falls back to full-text * search if embeddings are disabled or no results found. Supports multi-hop * graph traversal to discover connected nodes at specified depth. * * @param params - Search parameters * @param params.query - Natural language search query * @param params.types - Optional array of node types to filter (e.g., ['todo', 'memory', 'file']) * @param params.limit - Maximum results to return (default: 10) * @param params.min_similarity - Minimum cosine similarity 0-1 (default: 0.75) * @param params.depth - Graph traversal depth 1-3 (default: 1) * @param driver - Neo4j driver instance * * @returns Promise with search results and metadata * * @example * ```typescript * // Basic semantic search * const result = await handleVectorSearchNodes({ * query: 'authentication implementation', * limit: 10 * }, driver); * // Returns: { results: [...], total_candidates: 10, search_method: 'vector' } * ``` * * @example * ```typescript * // Search specific node types * const result = await handleVectorSearchNodes({ * query: 'database connection', * types: ['file', 'file_chunk'], * limit: 20, * min_similarity: 0.8 * }, driver); * ``` * * @example * ```typescript * // Multi-hop search to find connected nodes * const result = await handleVectorSearchNodes({ * query: 'user authentication', * depth: 2, * limit: 15 * }, driver); * // Returns direct matches + connected nodes within 2 hops * ``` */ export async function handleVectorSearchNodes( params: any, driver: Driver ): Promise<any> { const searchService = new UnifiedSearchService(driver); await searchService.initialize(); try { const depth = Math.max(1, Math.min(3, params.depth || 1)); // Clamp 1-3 const limit = params.limit || 10; // Initial vector search (with optional advanced search) const result = await searchService.search(params.query, { types: params.types, limit, minSimilarity: params.min_similarity || 0.5, offset: 0, rrfK: params.rrf_k, rrfVectorWeight: params.rrf_vector_weight, rrfBm25Weight: params.rrf_bm25_weight, rrfMinScore: params.rrf_min_score }); // If depth > 1, perform multi-hop graph traversal if (depth > 1 && result.results && result.results.length > 0) { const session = driver.session(); try { // Get connected nodes for top results (up to 5 to avoid explosion) const topResults = result.results.slice(0, Math.min(5, result.results.length)); const nodeIds = topResults.map((r: any) => r.id); // Multi-hop traversal query const traversalResult = await session.run( ` MATCH (start:Node) WHERE start.id IN $nodeIds CALL apoc.path.subgraphNodes(start, { maxLevel: $maxDepth, relationshipFilter: "EDGE", labelFilter: "+Node" }) YIELD node WHERE node.id <> start.id RETURN DISTINCT node.id as id, node.type as type, node.title as title, node.content as content, labels(node) as labels, properties(node) as props LIMIT $expandLimit `, { nodeIds, maxDepth: depth - 1, expandLimit: limit * 2 // Fetch more connected nodes } ); // Format connected nodes const connectedNodes = traversalResult.records.map(record => ({ id: record.get('id'), type: record.get('type'), title: record.get('title') || 'Untitled', description: `Connected via graph traversal (depth ${depth})`, content_preview: (record.get('content') || '').substring(0, 200), similarity: 0.0, // Mark as connected, not direct match })); // Merge with original results (cast to any to allow custom properties on result object) const enhancedResult = result as any; enhancedResult.results = [...result.results, ...connectedNodes]; enhancedResult.total_candidates = enhancedResult.results.length; enhancedResult.returned = enhancedResult.results.length; enhancedResult.depth_used = depth; enhancedResult.multi_hop_enabled = true; enhancedResult.connected_nodes_count = connectedNodes.length; } catch (traversalError: any) { // If APOC is not available, fall back to simple neighbor query console.warn('APOC traversal failed, using simple neighbor query:', traversalError.message); const topResults = result.results.slice(0, Math.min(5, result.results.length)); const nodeIds = topResults.map((r: any) => r.id); const neighborResult = await session.run( ` MATCH (start:Node)-[r:EDGE*1..${depth - 1}]-(connected:Node) WHERE start.id IN $nodeIds AND connected.id <> start.id RETURN DISTINCT connected.id as id, connected.type as type, connected.title as title, connected.content as content LIMIT ${limit * 2} `, { nodeIds } ); const connectedNodes = neighborResult.records.map(record => ({ id: record.get('id'), type: record.get('type'), title: record.get('title') || 'Untitled', description: `Connected via simple neighbor query (depth ${depth})`, content_preview: (record.get('content') || '').substring(0, 200), similarity: 0.0, })); const enhancedResult = result as any; enhancedResult.results = [...result.results, ...connectedNodes]; enhancedResult.total_candidates = enhancedResult.results.length; enhancedResult.returned = enhancedResult.results.length; enhancedResult.depth_used = depth; enhancedResult.multi_hop_enabled = true; enhancedResult.connected_nodes_count = connectedNodes.length; } finally { await session.close(); } } return result; } catch (error: any) { return { status: 'error', message: error.message }; } } /** * Handle get_embedding_stats tool call - Get embedding statistics * * @description Returns statistics about nodes with vector embeddings, * broken down by node type. Useful for monitoring indexing progress * and understanding what content is available for semantic search. * * @param params - No parameters required * @param driver - Neo4j driver instance * * @returns Promise with embedding statistics * * @example * ```typescript * // Get embedding statistics * const result = await handleGetEmbeddingStats({}, driver); * // Returns: { * // status: 'success', * // embeddings_enabled: true, * // total_nodes_with_embeddings: 1523, * // breakdown_by_type: { * // file_chunk: 1200, * // todo: 150, * // memory: 100, * // file: 73 * // } * // } * ``` * * @example * ```typescript * // Check if embeddings are enabled * const stats = await handleGetEmbeddingStats({}, driver); * if (stats.embeddings_enabled) { * console.log(`${stats.total_nodes_with_embeddings} nodes indexed`); * } * ``` */ export async function handleGetEmbeddingStats( params: any, driver: Driver ): Promise<any> { const searchService = new UnifiedSearchService(driver); await searchService.initialize(); const session = driver.session(); try { // Get total count and breakdown by type (including FileChunk) // Match nodes with embeddings, but exclude system nodes like WatchConfig const result = await session.run(` MATCH (n) WHERE n.embedding IS NOT NULL AND NOT n:WatchConfig AND n.type IS NOT NULL RETURN n.type AS type, count(*) AS count ORDER BY count DESC `); const byType: Record<string, number> = {}; let total = 0; for (const record of result.records) { const type = record.get('type'); const countValue = record.get('count'); const count = typeof countValue === 'object' && countValue.toNumber ? countValue.toNumber() : Number(countValue); byType[type] = count; total += count; } return { status: 'success', embeddings_enabled: searchService.isEmbeddingsEnabled(), total_nodes_with_embeddings: total, breakdown_by_type: byType }; } catch (error: any) { return { status: 'error', message: error.message }; } finally { await session.close(); } }

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/orneryd/Mimir'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

vectorSearch.tools.ts•11.6 KiB