import { VoyageAIClient } from 'voyageai';
import type { CodeChunk } from '../types/memory-v5.js';
import { logger } from '../utils/logger.js';
// Don't read the API key at module level; it is read lazily inside getVoyageClient()
const BATCH_SIZE = 100; // Process chunks in batches
let voyageClient: VoyageAIClient | null = null;
function getVoyageClient(): VoyageAIClient {
if (!voyageClient) {
const apiKey = process.env.VOYAGE_API_KEY;
if (!apiKey) {
throw new Error('VOYAGE_API_KEY environment variable is not set');
}
voyageClient = new VoyageAIClient({ apiKey });
}
return voyageClient;
}
/**
 * Generate embeddings for code chunks using the voyage-code-3 model.
* Each chunk is embedded with its signature, content, and metadata.
*/
export async function generateCodeEmbeddings(
chunks: Omit<CodeChunk, '_id' | 'contentVector' | 'createdAt' | 'updatedAt'>[]
): Promise<number[][]> {
const client = getVoyageClient();
  // Build one descriptive text per chunk and embed in batches with the standard
  // embed API; the contextualized API (contextualizedEmbed) is avoided here
  // because it appears to have issues (see the note at the end of this file)
const chunkTexts = chunks.map(chunk => {
// Combine signature, content, and metadata for rich embedding
const text = `${chunk.chunk.signature || chunk.chunk.name}
${chunk.chunk.content}
File: ${chunk.filePath} | Type: ${chunk.chunk.type} | Patterns: ${chunk.metadata.patterns.join(', ')}`;
return text;
});
// Generate embeddings in batches using regular embed (not contextualized)
const allEmbeddings: number[][] = [];
for (let i = 0; i < chunkTexts.length; i += BATCH_SIZE) {
const batch = chunkTexts.slice(i, i + BATCH_SIZE);
try {
      logger.info(`Generating embeddings: ${batch.length} chunks -> voyage-code-3`);
// Use regular embed which is more stable
const response = await client.embed({
input: batch,
model: 'voyage-code-3', // Use code-optimized model for better accuracy
inputType: 'document'
});
      logger.info(`Received ${response.data?.length || 0} vectors from Voyage AI`);
// Extract embeddings from regular embed response
// The response structure is simpler: response.data[index].embedding
if (response.data && Array.isArray(response.data)) {
for (const item of response.data) {
if (item.embedding && Array.isArray(item.embedding) && item.embedding.length > 0) {
allEmbeddings.push(item.embedding);
            logger.debug(`Embedding captured: ${item.embedding.length} dimensions`);
} else {
            logger.error('Invalid embedding in response item', item);
}
}
} else {
        logger.error('Voyage AI returned an empty or malformed response', response);
}
      logger.info(`Embedding progress: ${allEmbeddings.length} vectors ready`);
} catch (error: any) {
// More robust error handling for embed API
if (error.message?.includes('invalid model')) {
        throw new Error(`Model voyage-code-3 not available. Please check your Voyage AI account permissions.`);
} else if (error.response?.status === 401) {
        throw new Error('Voyage AI returned 401: VOYAGE_API_KEY is invalid or expired. Generate a new key at voyageai.com.');
} else {
        logger.error('Embedding generation failed', error);
throw error;
}
}
}
  // Return all embeddings in the order they were generated; the embed API
  // preserves input order, so this matches the order of the input chunks
  logger.debug(`Final count: ${allEmbeddings.length} embeddings for ${chunks.length} chunks`);
if (allEmbeddings.length !== chunks.length) {
    logger.error(`Embedding count mismatch: ${allEmbeddings.length} vectors for ${chunks.length} chunks`);
// Pad with empty arrays if we have fewer embeddings
while (allEmbeddings.length < chunks.length) {
allEmbeddings.push([]);
}
// Truncate if we have too many embeddings
if (allEmbeddings.length > chunks.length) {
allEmbeddings.splice(chunks.length);
}
}
  logger.info(`Embedding run complete: ${allEmbeddings.filter(e => e.length > 0).length}/${chunks.length} valid vectors`);
return allEmbeddings;
}
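
/**
 * Usage sketch (illustrative only). The chunk literal below is hypothetical,
 * shaped from the fields this module actually reads (chunk.{name, signature,
 * content, type}, filePath, metadata.patterns); the real CodeChunk type may
 * require additional fields.
 *
 *   const vectors = await generateCodeEmbeddings([{
 *     filePath: 'src/services/userService.ts',
 *     chunk: {
 *       name: 'authenticate',
 *       signature: 'async authenticate(email: string, password: string)',
 *       content: 'async authenticate(email, password) { ... }',
 *       type: 'method',
 *     },
 *     metadata: { patterns: ['service', 'auth'] },
 *   }]);
 *   // vectors[0] holds the embedding for the chunk, or [] if generation failed
 */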
/**
 * Generate an embedding for a code search query using the voyage-code-3 model
 * (the same model used for documents, so query and document vectors are comparable).
 */
export async function generateCodeQueryEmbedding(query: string): Promise<number[]> {
const client = getVoyageClient();
try {
    logger.info(`Generating query embedding: "${query.substring(0, 100)}"`);
// Use regular embed API which is more stable
const response = await client.embed({
input: [query], // Single query
      model: 'voyage-code-3', // Same model as the documents so vectors are comparable
inputType: 'query' // This is a search query
});
// Extract embedding from response
if (response.data && response.data.length > 0) {
const item = response.data[0];
if (item && item.embedding && Array.isArray(item.embedding) && item.embedding.length > 0) {
        logger.info(`Query vector ready: ${item.embedding.length} dimensions`);
return item.embedding;
}
}
    throw new Error('Failed to generate query embedding: Voyage AI returned no valid vector.');
} catch (error: any) {
// Provide specific error messages
if (error.message?.includes('invalid model')) {
      throw new Error(`Model voyage-code-3 not available for queries.`);
} else if (error.response?.status === 401) {
      throw new Error('Voyage AI returned 401 while embedding the query: check your VOYAGE_API_KEY.');
} else {
      logger.error('Query embedding failed', error);
throw error;
}
}
}
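
/**
 * Usage sketch (illustrative only): ranking previously embedded chunks against
 * a query by cosine similarity. `storedChunks` is a hypothetical array of
 * CodeChunk records with populated contentVector fields.
 *
 *   const queryVector = await generateCodeQueryEmbedding('UserService authenticate');
 *   const cosine = (a: number[], b: number[]): number => {
 *     let dot = 0, normA = 0, normB = 0;
 *     for (let i = 0; i < a.length; i++) {
 *       dot += a[i] * b[i];
 *       normA += a[i] * a[i];
 *       normB += b[i] * b[i];
 *     }
 *     return dot / (Math.sqrt(normA) * Math.sqrt(normB));
 *   };
 *   const ranked = storedChunks
 *     .filter(c => c.contentVector.length > 0) // skip padded empty vectors
 *     .map(c => ({ chunk: c, score: cosine(queryVector, c.contentVector) }))
 *     .sort((a, b) => b.score - a.score);
 */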
/**
 * Example of how contextualized embeddings (not currently used by this module)
 * solve the "golden chunk" problem:
*
* File: userService.ts
* Chunks:
* 1. "import { User } from './models/User';"
* 2. "export class UserService { ... }"
* 3. "async authenticate(email: string, password: string) { ... }"
*
* With standard embeddings:
* - Chunk 3 loses context about UserService class
* - Search for "UserService authenticate" might not find chunk 3
*
* With contextualized embeddings:
* - Chunk 3 is embedded knowing it's part of UserService
* - Search for "UserService authenticate" correctly finds chunk 3
* - Each chunk "knows" about the imports and class structure
*/
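
/*
 * A minimal sketch of what the contextualized path might look like, assuming the
 * SDK's contextualizedEmbed method (mentioned in generateCodeEmbeddings) accepts
 * grouped inputs; the request/response shape and the model name
 * 'voyage-context-3' below are assumptions, not verified against the SDK:
 *
 *   const response = await getVoyageClient().contextualizedEmbed({
 *     inputs: [fileChunks.map(c => c.chunk.content)], // one inner array per source file
 *     model: 'voyage-context-3',
 *     inputType: 'document',
 *   });
 *   // Each returned vector would correspond to one chunk, embedded with
 *   // awareness of its sibling chunks from the same file.
 */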