Local RAG

Overview Inspect Schema Related Servers Score Discussions

index.ts•5.46 kB

// Embedder implementation with Transformers.js

import { env, pipeline } from '@huggingface/transformers'

// ============================================
// Type Definitions
// ============================================

/**
 * Embedder configuration
 */
export interface EmbedderConfig {
  /** HuggingFace model path */
  modelPath: string
  /** Batch size: number of texts embedded concurrently per step of embedBatch(). Must be a finite number >= 1. */
  batchSize: number
  /** Model cache directory */
  cacheDir: string
}

// ============================================
// Constants
// ============================================

/** Length of the zero vector returned by embed() for an empty string. */
const EMBEDDING_DIMENSION = 384

// ============================================
// Error Classes
// ============================================

/**
 * Embedding generation error
 *
 * Carries the underlying failure (if any) in `cause` so callers can inspect it.
 */
export class EmbeddingError extends Error {
  constructor(
    message: string,
    public readonly cause?: Error
  ) {
    super(message)
    this.name = 'EmbeddingError'
  }
}

/**
 * Normalize an arbitrary thrown value into an Error instance.
 *
 * JavaScript allows throwing any value; this keeps error messages meaningful
 * (instead of "undefined") and guarantees `EmbeddingError.cause` is a real Error.
 */
function toError(value: unknown): Error {
  return value instanceof Error ? value : new Error(String(value))
}

// ============================================
// Embedder Class
// ============================================

/**
 * Embedding generation class using Transformers.js
 *
 * Responsibilities:
 * - Generate embedding vectors (documented as 384 dimensions; the actual length
 *   is whatever the configured model returns)
 * - Transformers.js wrapper
 * - Batch processing (batch size taken from `config.batchSize`)
 */
export class Embedder {
  /** Loaded feature-extraction pipeline, or null until initialization succeeds. */
  private model: Awaited<ReturnType<typeof pipeline>> | null = null
  /** In-flight (or completed) lazy initialization; reset to null on failure so it can be retried. */
  private initPromise: Promise<void> | null = null
  private readonly config: EmbedderConfig

  constructor(config: EmbedderConfig) {
    this.config = config
  }

  /**
   * Initialize Transformers.js model
   *
   * No-op when the model is already loaded.
   *
   * @throws EmbeddingError if the pipeline cannot be created
   */
  async initialize(): Promise<void> {
    // Skip if already initialized
    if (this.model) {
      return
    }

    try {
      // Set cache directory BEFORE creating pipeline
      env.cacheDir = this.config.cacheDir

      // Progress goes through console.error, as in the rest of this file
      console.error(`Embedder: Setting cache directory to "${this.config.cacheDir}"`)
      console.error(`Embedder: Loading model "${this.config.modelPath}"...`)
      this.model = await pipeline('feature-extraction', this.config.modelPath)
      console.error('Embedder: Model loaded successfully')
    } catch (error: unknown) {
      const cause = toError(error)
      throw new EmbeddingError(`Failed to initialize Embedder: ${cause.message}`, cause)
    }
  }

  /**
   * Ensure model is initialized (lazy initialization)
   * This method is called automatically by embed() and embedBatch()
   *
   * Concurrent callers share a single initialization promise.
   *
   * @throws EmbeddingError (with troubleshooting guidance) if initialization fails
   */
  private async ensureInitialized(): Promise<void> {
    // Already initialized
    if (this.model) {
      return
    }

    // Initialization already in progress, wait for it
    if (this.initPromise) {
      await this.initPromise
      return
    }

    // Start initialization
    console.error(
      'Embedder: First use detected. Initializing model (downloading ~90MB, may take 1-2 minutes)...'
    )

    this.initPromise = this.initialize().catch((error: unknown) => {
      // Clear initPromise on failure to allow retry
      this.initPromise = null

      // Enhance error message with detailed guidance
      const cause = toError(error)
      throw new EmbeddingError(
        `Failed to initialize embedder on first use: ${cause.message}\n\nPossible causes:\n • Network connectivity issues during model download\n • Insufficient disk space (need ~90MB)\n • Corrupted model cache\n\nRecommended actions:\n 1. Check your internet connection and try again\n 2. Ensure sufficient disk space is available\n 3. If problem persists, delete cache: ${this.config.cacheDir}\n 4. Then retry your query\n`,
        cause
      )
    })

    await this.initPromise
  }

  /**
   * Convert single text to embedding vector
   *
   * @param text - Text
   * @returns Embedding vector (a 384-element zero vector for an empty string)
   * @throws EmbeddingError if initialization or inference fails
   */
  async embed(text: string): Promise<number[]> {
    // Lazy initialization: initialize on first use if not already initialized
    await this.ensureInitialized()

    try {
      // Return zero vector for empty string
      if (text.length === 0) {
        return new Array<number>(EMBEDDING_DIMENSION).fill(0)
      }

      // Use type assertion to avoid complex Transformers.js type definitions
      // This is due to external library type definition constraints
      const options = { pooling: 'mean', normalize: true }
      const modelCall = this.model as (
        text: string,
        options: unknown
      ) => Promise<{ data: Float32Array }>
      const output = await modelCall(text, options)

      // Access raw data via .data property and copy it into a plain number[]
      return Array.from(output.data)
    } catch (error: unknown) {
      const cause = toError(error)
      throw new EmbeddingError(`Failed to generate embedding: ${cause.message}`, cause)
    }
  }

  /**
   * Convert multiple texts to embedding vectors with batch processing
   *
   * Texts are processed in slices of `config.batchSize`; the texts within a
   * slice are embedded concurrently and slices run one after another. Output
   * order matches input order.
   *
   * @param texts - Array of texts
   * @returns Array of embedding vectors, one per input text
   * @throws EmbeddingError if `config.batchSize` is not a finite number >= 1,
   *   or if initialization or any embedding fails
   */
  async embedBatch(texts: string[]): Promise<number[][]> {
    // Lazy initialization: initialize on first use if not already initialized
    await this.ensureInitialized()

    if (texts.length === 0) {
      return []
    }

    // A batch size of 0 or below would never advance the loop index (infinite
    // loop), and NaN would silently drop every text, so reject both up front.
    const { batchSize } = this.config
    if (!Number.isFinite(batchSize) || batchSize < 1) {
      throw new EmbeddingError(`Invalid batchSize ${batchSize}: must be a finite number >= 1`)
    }

    try {
      const embeddings: number[][] = []

      // Process in batches according to batch size
      for (let start = 0; start < texts.length; start += batchSize) {
        const batch = texts.slice(start, start + batchSize)
        const batchEmbeddings = await Promise.all(batch.map((text) => this.embed(text)))
        embeddings.push(...batchEmbeddings)
      }

      return embeddings
    } catch (error: unknown) {
      const cause = toError(error)
      throw new EmbeddingError(`Failed to generate batch embeddings: ${cause.message}`, cause)
    }
  }
}

Latest Blog Posts

What Is Context Bloat in MCP?
By Om-Shree-0709 on December 16, 2025.
mcp
Context Bloat
MCP Moves to the Linux Foundation: Neutral Stewardship for Agentic Infrastructure
By Om-Shree-0709 on December 15, 2025.
mcp
anthropic
Linux Foundation
Code Execution with MCP: Architecting Agentic Efficiency
By Om-Shree-0709 on December 14, 2025.
mcp
Token bloat

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/shinpr/mcp-local-rag'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.