"""
OpenAI embedding wrapper with batching, retries, and logging.
"""
import logging
import os
from dataclasses import dataclass

from openai import APIConnectionError, APITimeoutError, OpenAI, RateLimitError
from tenacity import (
    Retrying,
    before_sleep_log,
    retry,
    retry_if_exception_type,
    stop_after_attempt,
    wait_exponential,
)
logger = logging.getLogger(__name__)
@dataclass
class EmbedderConfig:
"""Configuration for the embedder."""
model: str = "text-embedding-3-small"
batch_size: int = 100 # OpenAI allows up to 2048
dimensions: int | None = None # Use model default
max_retries: int = 3
query_max_chars: int = 8000 # Stricter limit for queries
class OpenAIEmbedder:
"""
Wrapper around OpenAI's embedding API.
Features:
- Batched embedding for efficiency
- Automatic retries with exponential backoff
- Configurable model and dimensions
- Simple interface
"""
def __init__(
self, api_key: str | None = None, config: EmbedderConfig | None = None
):
self.config = config or EmbedderConfig()
self.client = OpenAI(api_key=api_key or os.getenv("OPENAI_API_KEY"))
# Validate API key
if not self.client.api_key:
raise ValueError(
"OpenAI API key required. Set OPENAI_API_KEY environment variable."
)
logger.debug(f"Initialized embedder with model={self.config.model}")
def embed_text(self, text: str, is_query: bool = True) -> list[float]:
"""
Embed a single text string.
Args:
text: Text to embed
is_query: If True, apply stricter length limit for queries
Returns:
Embedding vector as list of floats
"""
result = self.embed_texts([text], is_query=is_query)
return result[0]
def embed_texts(
self, texts: list[str], is_query: bool = False
) -> list[list[float]]:
"""
Embed multiple texts efficiently with batching.
Args:
texts: List of texts to embed
is_query: If True, apply stricter length limits
Returns:
List of embedding vectors
"""
if not texts:
return []
all_embeddings = []
total_batches = (
len(texts) + self.config.batch_size - 1
) // self.config.batch_size
logger.debug(f"Embedding {len(texts)} texts in {total_batches} batches")
# Process in batches
for batch_num, i in enumerate(range(0, len(texts), self.config.batch_size)):
batch = texts[i : i + self.config.batch_size]
# Clean texts (remove null bytes, excessive whitespace)
max_chars = self.config.query_max_chars if is_query else 30000
batch = [self._clean_text(t, max_chars) for t in batch]
# Call OpenAI API with retries
batch_embeddings = self._embed_batch(batch)
all_embeddings.extend(batch_embeddings)
logger.debug(f"Completed batch {batch_num + 1}/{total_batches}")
return all_embeddings
@retry(
retry=retry_if_exception_type(
(RateLimitError, APIConnectionError, APITimeoutError)
),
stop=stop_after_attempt(3),
wait=wait_exponential(multiplier=1, min=1, max=10),
before_sleep=before_sleep_log(logger, logging.WARNING),
)
def _embed_batch(self, batch: list[str]) -> list[list[float]]:
"""
Embed a single batch with retry logic.
Args:
batch: List of cleaned texts to embed
Returns:
List of embedding vectors
"""
kwargs = {
"model": self.config.model,
"input": batch,
}
if self.config.dimensions:
kwargs["dimensions"] = self.config.dimensions
response = self.client.embeddings.create(**kwargs)
# Extract embeddings in order
batch_embeddings: list[list[float] | None] = [None] * len(batch)
for item in response.data:
batch_embeddings[item.index] = item.embedding
# Type narrowing - we know all slots are filled
return [e for e in batch_embeddings if e is not None]
def _clean_text(self, text: str, max_chars: int = 30000) -> str:
"""Clean text for embedding."""
# Remove null bytes
text = text.replace("\x00", "")
# Normalize whitespace
text = " ".join(text.split())
# Truncate if too long
if len(text) > max_chars:
text = text[:max_chars]
logger.debug(f"Truncated text to {max_chars} characters")
return text
@property
def embedding_dimension(self) -> int:
"""Get the embedding dimension for the current model."""
if self.config.dimensions:
return self.config.dimensions
# Default dimensions by model
defaults = {
"text-embedding-3-small": 1536,
"text-embedding-3-large": 3072,
"text-embedding-ada-002": 1536,
}
return defaults.get(self.config.model, 1536)