import type { EmbeddingConfig } from "@/types";
import { TransformersEmbeddingClient } from "./transformers";
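/**
 * Common contract for every embedding backend: `embed` maps a single text to
 * a dense vector; `embedBatch` maps many texts to vectors in the same order.
 */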
export interface EmbeddingClient {
embed(text: string): Promise<number[]>;
embedBatch(texts: string[]): Promise<number[][]>;
}
export { CachedEmbeddingClient } from "./cached";
export type {
TransformersEmbeddingConfig,
TransformersModelName,
} from "./transformers";
export {
TRANSFORMERS_MODELS,
TransformersEmbeddingClient,
} from "./transformers";
export function createEmbeddingClient(
config: EmbeddingConfig,
): EmbeddingClient {
switch (config.provider) {
case "local":
return new LocalTEIClient(config.endpoint);
case "openai":
return new OpenAIClient(config.apiKey, config.model);
case "nomic":
return new NomicClient(config.apiKey, config.model);
case "voyage":
return new VoyageClient(config.apiKey, config.model);
case "ollama":
return new OllamaClient(config.endpoint, config.model);
case "transformers":
return new TransformersEmbeddingClient({
model: config.model,
cacheDir: config.cacheDir,
dimensions: config.dimensions,
});
}
}
// Local HuggingFace Text Embeddings Inference
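//
// Batch size and timeout defaults can be overridden through environment
// variables, read once at construction time. An illustrative tuning sketch
// (values are examples, not recommendations):
//
//   process.env.DOCLEA_LOCAL_EMBED_PROFILE = "qwen_cpu"; // defaults: batch 8, timeout 180s
//   process.env.DOCLEA_LOCAL_EMBED_MAX_BATCH_SIZE = "4"; // explicit batch override
//   process.env.DOCLEA_LOCAL_EMBED_TIMEOUT_MS = "300000"; // explicit timeout override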
class LocalTEIClient implements EmbeddingClient {
private readonly maxBatchSize: number;
private readonly timeoutMs: number;
  constructor(private endpoint: string) {
    // The "qwen_cpu" profile assumes slower CPU inference: smaller default
    // batches and a longer default timeout.
    const profile = (process.env.DOCLEA_LOCAL_EMBED_PROFILE ?? "")
      .trim()
      .toLowerCase();
    const profileIsQwenCpu = profile === "qwen_cpu";
    const defaultBatchSize = profileIsQwenCpu ? 8 : 32;
    const parsedBatchSize = Number.parseInt(
      process.env.DOCLEA_LOCAL_EMBED_MAX_BATCH_SIZE ?? `${defaultBatchSize}`,
      10,
    );
    // Fall back to the profile default on NaN, zero, or negative overrides.
    this.maxBatchSize =
      Number.isFinite(parsedBatchSize) && parsedBatchSize > 0
        ? parsedBatchSize
        : defaultBatchSize;
    const defaultTimeoutMs = profileIsQwenCpu ? 180_000 : 120_000;
    const parsedTimeoutMs = Number.parseInt(
      process.env.DOCLEA_LOCAL_EMBED_TIMEOUT_MS ?? `${defaultTimeoutMs}`,
      10,
    );
    this.timeoutMs =
      Number.isFinite(parsedTimeoutMs) && parsedTimeoutMs > 0
        ? parsedTimeoutMs
        : defaultTimeoutMs;
  }
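  // POST the payload to TEI's /embed endpoint, aborting the request once
  // timeoutMs elapses so a stalled server cannot hang callers indefinitely.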
private async fetchEmbed(payload: unknown): Promise<Response> {
const controller = new AbortController();
const timeout = setTimeout(() => controller.abort(), this.timeoutMs);
try {
return await fetch(`${this.endpoint}/embed`, {
method: "POST",
headers: { "Content-Type": "application/json" },
body: JSON.stringify(payload),
signal: controller.signal,
});
} finally {
clearTimeout(timeout);
}
}
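  // Embed a batch of texts, splitting client-side when the batch exceeds
  // maxBatchSize and bisecting further if the server rejects the payload.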
private async requestBatch(texts: string[]): Promise<number[][]> {
if (texts.length > this.maxBatchSize) {
const vectors: number[][] = [];
for (let i = 0; i < texts.length; i += this.maxBatchSize) {
const chunk = texts.slice(i, i + this.maxBatchSize);
const chunkVectors = await this.requestBatch(chunk);
vectors.push(...chunkVectors);
}
return vectors;
}
    const response = await this.fetchEmbed({ inputs: texts });
    if (response.ok) {
      // TEI returns one embedding vector per input, in input order.
      return (await response.json()) as number[][];
    }
const responseText = await response.text().catch(() => "");
const normalizedError =
`${response.statusText} ${responseText}`.toLowerCase();
const isPayloadTooLarge =
response.status === 413 ||
normalizedError.includes("payload too large") ||
normalizedError.includes("entity too large") ||
normalizedError.includes("request body too large");
if (isPayloadTooLarge && texts.length > 1) {
const midpoint = Math.ceil(texts.length / 2);
const left = await this.requestBatch(texts.slice(0, midpoint));
const right = await this.requestBatch(texts.slice(midpoint));
return [...left, ...right];
}
const detail = responseText ? `: ${responseText.slice(0, 240)}` : "";
throw new Error(
`TEI embed batch failed: ${response.status} ${response.statusText}${detail}`,
);
}
async embed(text: string): Promise<number[]> {
const response = await this.fetchEmbed({ inputs: text });
    if (!response.ok) {
      throw new Error(
        `TEI embed failed: ${response.status} ${response.statusText}`,
      );
    }
const result = await response.json();
// TEI returns [[...embedding...]] for single input
return Array.isArray(result[0]) ? result[0] : result;
}
async embedBatch(texts: string[]): Promise<number[][]> {
if (texts.length === 0) return [];
return this.requestBatch(texts);
}
}
// OpenAI Embeddings
class OpenAIClient implements EmbeddingClient {
constructor(
private apiKey: string,
private model: string,
) {}
async embed(text: string): Promise<number[]> {
const response = await fetch("https://api.openai.com/v1/embeddings", {
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
input: text,
}),
});
if (!response.ok) {
      throw new Error(
        `OpenAI embed failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.data[0].embedding;
}
async embedBatch(texts: string[]): Promise<number[][]> {
const response = await fetch("https://api.openai.com/v1/embeddings", {
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
input: texts,
}),
});
if (!response.ok) {
      throw new Error(
        `OpenAI embed batch failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.data.map((d: { embedding: number[] }) => d.embedding);
}
}
// Nomic Embeddings
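// (task_type "search_document" targets the document side of Nomic's
// asymmetric retrieval scheme; query-side embedding would typically use
// "search_query" instead.)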
class NomicClient implements EmbeddingClient {
constructor(
private apiKey: string,
private model: string,
) {}
async embed(text: string): Promise<number[]> {
const response = await fetch(
"https://api-atlas.nomic.ai/v1/embedding/text",
{
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
texts: [text],
task_type: "search_document",
}),
},
);
if (!response.ok) {
      throw new Error(
        `Nomic embed failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.embeddings[0];
}
async embedBatch(texts: string[]): Promise<number[][]> {
const response = await fetch(
"https://api-atlas.nomic.ai/v1/embedding/text",
{
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
texts,
task_type: "search_document",
}),
},
);
if (!response.ok) {
      throw new Error(
        `Nomic embed batch failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.embeddings;
}
}
// Voyage AI Embeddings
class VoyageClient implements EmbeddingClient {
constructor(
private apiKey: string,
private model: string,
) {}
async embed(text: string): Promise<number[]> {
const response = await fetch("https://api.voyageai.com/v1/embeddings", {
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
input: text,
}),
});
if (!response.ok) {
      throw new Error(
        `Voyage embed failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.data[0].embedding;
}
async embedBatch(texts: string[]): Promise<number[][]> {
const response = await fetch("https://api.voyageai.com/v1/embeddings", {
method: "POST",
headers: {
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: this.model,
input: texts,
}),
});
if (!response.ok) {
      throw new Error(
        `Voyage embed batch failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.data.map((d: { embedding: number[] }) => d.embedding);
}
}
// Ollama Embeddings
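// (Targets the legacy /api/embeddings endpoint, which embeds one prompt per
// request; Ollama's newer /api/embed endpoint also accepts an array input.)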
class OllamaClient implements EmbeddingClient {
constructor(
private endpoint: string,
private model: string,
) {}
async embed(text: string): Promise<number[]> {
const response = await fetch(`${this.endpoint}/api/embeddings`, {
method: "POST",
headers: { "Content-Type": "application/json" },
body: JSON.stringify({
model: this.model,
prompt: text,
}),
});
if (!response.ok) {
      throw new Error(
        `Ollama embed failed: ${response.status} ${response.statusText}`,
      );
}
const result = await response.json();
return result.embedding;
}
  async embedBatch(texts: string[]): Promise<number[][]> {
    // The /api/embeddings endpoint takes a single prompt per request, so fan
    // out one request per text (concurrently via Promise.all).
    return Promise.all(texts.map((text) => this.embed(text)));
  }
}