// src/core/embedder.ts
import { GoogleGenerativeAI } from '@google/generative-ai';
import { CodeChunk, QuotaUsage } from '../types/index.js';
const SUPPORTED_MODELS = ['text-embedding-004', 'gemini-embedding-001'] as const;
type SupportedModel = typeof SUPPORTED_MODELS[number];
// Default output dimension per model (the maximum each model supports)
const MODEL_DEFAULT_DIMENSIONS: Record<SupportedModel, number> = {
  'text-embedding-004': 768,    // Fixed 768-dimension output; optimized for English text and code (recommended)
  'gemini-embedding-001': 3072  // Flexible output dimension (128-3072); strict free-tier rate limits
};
// Rate limits per model (free tier)
const MODEL_RATE_LIMITS: Record<SupportedModel, { rpm: number; tpm: number; rpd: number | null }> = {
'text-embedding-004': { rpm: 1500, tpm: 1000000, rpd: null }, // No daily limit
'gemini-embedding-001': { rpm: 90, tpm: 27000, rpd: 950 } // Has daily limit
};
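// Throughput implied by these limits: 1,500 RPM supports 25 requests/second,
// while 90 RPM requires spacing requests at least ~0.67 s apart.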
export class CodeEmbedder {
private genAI: GoogleGenerativeAI;
private model: SupportedModel;
private outputDimension: number;
// Quota tracking
private requestsThisMinute: number = 0;
private tokensThisMinute: number = 0;
private requestsToday: number = 0;
private currentMinuteStart: number = Date.now();
private currentDayStart: string = this.getTodayString();
constructor(apiKey: string, model?: string, outputDimension?: number) {
this.genAI = new GoogleGenerativeAI(apiKey);
// Get model from parameter or environment variable, default to text-embedding-004
const selectedModel = model || process.env.EMBEDDING_MODEL || 'text-embedding-004';
// Validate model
if (!SUPPORTED_MODELS.includes(selectedModel as SupportedModel)) {
throw new Error(
`Unsupported embedding model: ${selectedModel}. ` +
`Supported models: ${SUPPORTED_MODELS.join(', ')}`
);
}
this.model = selectedModel as SupportedModel;
    // Resolve output dimension: explicit arg > EMBEDDING_DIMENSION env var > model default
    // (parseInt('') is NaN, which is falsy, so an unset env var falls through)
this.outputDimension = outputDimension ||
parseInt(process.env.EMBEDDING_DIMENSION || '') ||
MODEL_DEFAULT_DIMENSIONS[this.model];
// Validate dimension for gemini-embedding-001
if (this.model === 'gemini-embedding-001') {
if (this.outputDimension < 128 || this.outputDimension > 3072) {
throw new Error(
`Invalid output dimension for gemini-embedding-001: ${this.outputDimension}. ` +
        `Must be between 128 and 3072. Recommended values: 768, 1536, or 3072.`
);
}
}
    // Validate dimension for text-embedding-004. This class never passes
    // outputDimensionality for this model, so anything other than 768 would
    // silently mismatch the vectors actually returned.
    if (this.model === 'text-embedding-004' && this.outputDimension !== 768) {
      throw new Error(
        `Invalid output dimension for ${this.model}: ${this.outputDimension}. ` +
        `This model returns 768-dimensional vectors.`
      );
    }
console.log(`[Embedder] Using embedding model: ${this.model} (dimension: ${this.outputDimension})`);
}
/**
   * Get the configured output dimension (not necessarily the model maximum)
*/
getDimension(): number {
return this.outputDimension;
}
/**
   * Get today's date string (YYYY-MM-DD, UTC; the daily counter therefore resets at UTC midnight)
*/
private getTodayString(): string {
return new Date().toISOString().split('T')[0];
}
/**
* Reset minute counters if a new minute has started
*/
private resetMinuteCountersIfNeeded(): void {
const now = Date.now();
const minuteElapsed = now - this.currentMinuteStart;
if (minuteElapsed >= 60000) {
this.requestsThisMinute = 0;
this.tokensThisMinute = 0;
this.currentMinuteStart = now;
}
}
/**
* Reset daily counters if a new day has started
*/
private resetDailyCountersIfNeeded(): void {
const today = this.getTodayString();
if (this.currentDayStart !== today) {
this.requestsToday = 0;
this.currentDayStart = today;
}
}
/**
* Track a request and estimate tokens
*/
private trackRequest(text: string): void {
this.resetMinuteCountersIfNeeded();
this.resetDailyCountersIfNeeded();
this.requestsThisMinute++;
this.requestsToday++;
// Estimate tokens (rough approximation: 1 token ≈ 4 characters)
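    // e.g. a 2,000-character chunk is counted as ceil(2000 / 4) = 500 tokens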
const estimatedTokens = Math.ceil(text.length / 4);
this.tokensThisMinute += estimatedTokens;
}
/**
* Get current quota usage
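   * Example return shape (hypothetical values):
   *   { rpm: { current: 12, limit: 1500, percentage: 0.8 }, tpm: {...}, rpd: {...}, tier: 'free', model: 'text-embedding-004' }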
*/
getQuotaUsage(): QuotaUsage {
this.resetMinuteCountersIfNeeded();
this.resetDailyCountersIfNeeded();
const limits = MODEL_RATE_LIMITS[this.model];
return {
rpm: {
current: this.requestsThisMinute,
limit: limits.rpm,
percentage: (this.requestsThisMinute / limits.rpm) * 100
},
tpm: {
current: this.tokensThisMinute,
limit: limits.tpm,
percentage: (this.tokensThisMinute / limits.tpm) * 100
},
rpd: {
current: this.requestsToday,
        limit: limits.rpd || 0, // 0 signals "no daily limit"
percentage: limits.rpd ? (this.requestsToday / limits.rpd) * 100 : 0
},
tier: 'free', // Assuming free tier for now
model: this.model
};
}
/**
* Embed a code chunk
*/
async embedChunk(chunk: CodeChunk): Promise<number[]> {
try {
// Track request before making API call
this.trackRequest(chunk.content);
const embeddingModel = this.genAI.getGenerativeModel({ model: this.model });
// For gemini-embedding-001, specify output dimension and task type
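      // Note: the request object is cast to `any` below because older
      // @google/generative-ai typings may not declare outputDimensionality
      // on EmbedContentRequest.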
let result;
if (this.model === 'gemini-embedding-001') {
result = await embeddingModel.embedContent({
content: { parts: [{ text: chunk.content }] },
taskType: 'RETRIEVAL_DOCUMENT',
outputDimensionality: this.outputDimension
} as any);
} else {
result = await embeddingModel.embedContent(chunk.content);
}
return result.embedding.values;
} catch (error) {
console.error('Embedding error:', error);
throw error;
}
}
/**
* Embed multiple chunks in batch with rate limiting
*/
async embedChunks(chunks: CodeChunk[]): Promise<(number[] | null)[]> {
// text-embedding-004 has better rate limits, use parallel processing
// gemini-embedding-001 needs sequential processing to avoid 429 errors
if (this.model === 'text-embedding-004') {
return this.embedChunksParallel(chunks);
} else {
return this.embedChunksSequential(chunks);
}
}
/**
* Parallel embedding for models with good rate limits (text-embedding-004)
* text-embedding-004: 1,500 RPM = 25 requests per second
*/
private async embedChunksParallel(chunks: CodeChunk[]): Promise<(number[] | null)[]> {
const results: (number[] | null)[] = [];
    const BATCH_SIZE = 25;        // Process 25 chunks at a time
    const DELAY_PER_BATCH = 1000; // >= 1 s between batch starts keeps throughput at or under 25 RPS
    console.log(`[Embedder] Processing ${chunks.length} chunks with parallel batching at up to 25 RPS (1,500 RPM limit)`);
for (let i = 0; i < chunks.length; i += BATCH_SIZE) {
const batch = chunks.slice(i, i + BATCH_SIZE);
const batchNumber = Math.floor(i / BATCH_SIZE) + 1;
const totalBatches = Math.ceil(chunks.length / BATCH_SIZE);
try {
// Process batch in parallel
const promises = batch.map(chunk => this.delayedEmbedWithRetry(chunk, 0, 3));
const batchResults = await Promise.all(promises);
results.push(...batchResults);
const processed = Math.min(i + BATCH_SIZE, chunks.length);
console.log(`[Embedder] Batch ${batchNumber}/${totalBatches}: ${processed}/${chunks.length} chunks (${((processed / chunks.length) * 100).toFixed(1)}%)`);
// Wait between batches to respect rate limit (except for last batch)
if (i + BATCH_SIZE < chunks.length) {
await new Promise(resolve => setTimeout(resolve, DELAY_PER_BATCH));
}
} catch (error) {
console.error(`[Embedder] Batch ${batchNumber} error:`, error);
        // Defensive: delayedEmbedWithRetry resolves to null rather than throwing,
        // so this path should rarely trigger; fill the failed batch with nulls anyway
results.push(...new Array(batch.length).fill(null));
}
}
return results;
}
/**
* Sequential embedding for models with strict rate limits (gemini-embedding-001)
*/
private async embedChunksSequential(chunks: CodeChunk[]): Promise<(number[] | null)[]> {
const results: (number[] | null)[] = [];
    const DELAY_BETWEEN_REQUESTS = 1500; // 1.5 s between requests = ~40 RPM, well under the 90 RPM limit
console.log(`[Embedder] Processing ${chunks.length} chunks sequentially (rate-limited model)...`);
for (let i = 0; i < chunks.length; i++) {
try {
if (i > 0) {
await new Promise(resolve => setTimeout(resolve, DELAY_BETWEEN_REQUESTS));
}
const result = await this.delayedEmbedWithRetry(chunks[i], 0, 5);
results.push(result);
if ((i + 1) % 5 === 0 || i === chunks.length - 1) {
console.log(`[Embedder] Processed ${i + 1}/${chunks.length} chunks`);
}
} catch (error) {
console.error(`[Embedder] Error processing chunk ${i}:`, error);
results.push(null);
}
}
return results;
}
/**
* Embed with delay and retry logic for rate limits
*/
private async delayedEmbedWithRetry(
chunk: CodeChunk,
delayMs: number,
maxRetries: number = 3
): Promise<number[] | null> {
await new Promise(resolve => setTimeout(resolve, delayMs));
for (let attempt = 0; attempt < maxRetries; attempt++) {
try {
return await this.embedChunk(chunk);
} catch (err: any) {
// Check if it's a 429 rate limit error
if (err?.status === 429 || err?.message?.includes('429') || err?.message?.includes('quota')) {
// Exponential backoff based on model
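        // Resulting schedule, e.g.: gemini-embedding-001 waits 5 s, 10 s, 20 s;
        // text-embedding-004 waits 2 s, 4 s, 8 s (capped at 60 s)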
const baseDelay = this.model === 'gemini-embedding-001' ? 5000 : 2000;
const retryDelay = Math.min(Math.pow(2, attempt) * baseDelay, 60000);
console.warn(`[Rate Limit] ${chunk.id}: Retry ${attempt + 1}/${maxRetries} after ${retryDelay}ms`);
await new Promise(resolve => setTimeout(resolve, retryDelay));
continue;
}
        // Non-rate-limit errors: fail fast, don't retry
console.error(`Failed to embed ${chunk.id}:`, err.message || err);
return null;
}
}
console.error(`Failed to embed ${chunk.id} after ${maxRetries} retries`);
return null;
}
/**
* Embed a query
*/
async embedQuery(query: string): Promise<number[]> {
try {
// Track request before making API call
this.trackRequest(query);
const embeddingModel = this.genAI.getGenerativeModel({ model: this.model });
// For gemini-embedding-001, specify output dimension and task type for queries
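      // (same `as any` typing caveat as in embedChunk above)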
let result;
if (this.model === 'gemini-embedding-001') {
result = await embeddingModel.embedContent({
content: { parts: [{ text: query }] },
taskType: 'RETRIEVAL_QUERY',
outputDimensionality: this.outputDimension
} as any);
} else {
result = await embeddingModel.embedContent(query);
}
return result.embedding.values;
} catch (error) {
console.error('Query embedding error:', error);
throw error;
}
}
}
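
/*
 * Usage sketch (hypothetical values; CodeChunk shape comes from ../types):
 *
 *   const embedder = new CodeEmbedder(process.env.GEMINI_API_KEY!); // defaults to text-embedding-004
 *   const vector = await embedder.embedQuery('where is request auth handled?');
 *   console.log(vector.length);                // 768 for text-embedding-004
 *   console.log(embedder.getQuotaUsage().rpm); // e.g. { current: 1, limit: 1500, percentage: ~0.07 }
 */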