/**
* OpenRouter Adapter - Clean implementation with centralized SSE streaming
* Supports 400+ models through OpenRouter's unified API
* Uses BaseAdapter's processStream for reliable streaming
*/
import { BaseAdapter } from '../BaseAdapter';
import {
GenerateOptions,
StreamChunk,
LLMResponse,
ModelInfo,
ProviderCapabilities,
ModelPricing,
SearchResult
} from '../types';
import { ModelRegistry } from '../ModelRegistry';
import { ReasoningPreserver } from '../shared/ReasoningPreserver';
import { WebSearchUtils } from '../../utils/WebSearchUtils';
import { BRAND_NAME } from '../../../../constants/branding';
import { MCPToolExecution } from '../shared/ToolExecutionUtils';
export class OpenRouterAdapter extends BaseAdapter {
readonly name = 'openrouter';
readonly baseUrl = 'https://openrouter.ai/api/v1';
private httpReferer: string;
private xTitle: string;
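/**
* @example
* // Hypothetical wiring; the key and header values are illustrative
* const adapter = new OpenRouterAdapter(process.env.OPENROUTER_API_KEY ?? '', {
*   httpReferer: 'https://example.com',
*   xTitle: 'My App'
* });
*/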
constructor(
apiKey: string,
options?: { httpReferer?: string; xTitle?: string }
) {
super(apiKey, 'anthropic/claude-3.5-sonnet');
this.httpReferer = options?.httpReferer?.trim() || 'https://synapticlabs.ai';
this.xTitle = options?.xTitle?.trim() || BRAND_NAME;
this.initializeCache();
}
/**
* Generate response without caching
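*
* @example
* // Sketch: one-shot completion (model id illustrative)
* const res = await adapter.generateUncached('Summarize the release notes', {
*   model: 'anthropic/claude-3.5-sonnet',
*   maxTokens: 512
* });
* // res is the LLMResponse assembled by buildLLMResponse (text, usage, finish reason)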
*/
async generateUncached(prompt: string, options?: GenerateOptions): Promise<LLMResponse> {
try {
// Validate web search support
if (options?.webSearch) {
WebSearchUtils.validateWebSearchRequest('openrouter', options.webSearch);
}
const baseModel = options?.model || this.currentModel;
// Add :online suffix for web search
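// e.g. 'anthropic/claude-3.5-sonnet' becomes 'anthropic/claude-3.5-sonnet:online'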
const model = options?.webSearch ? `${baseModel}:online` : baseModel;
// Post-stream tool execution: when detectedToolCalls are provided, run them and return the follow-up response
if (options?.detectedToolCalls && options.detectedToolCalls.length > 0) {
return await this.executeDetectedToolCalls(options.detectedToolCalls, model, prompt, options);
}
// Tool execution requires streaming - use generateStreamAsync instead
if (options?.tools && options.tools.length > 0) {
throw new Error('Tool execution requires streaming. Use generateStreamAsync() instead.');
}
const requestBody = {
model,
messages: this.buildMessages(prompt, options?.systemPrompt),
temperature: options?.temperature,
max_tokens: options?.maxTokens,
top_p: options?.topP,
frequency_penalty: options?.frequencyPenalty,
presence_penalty: options?.presencePenalty,
response_format: options?.jsonMode ? { type: 'json_object' } : undefined,
stop: options?.stopSequences,
tools: options?.tools?.length ? this.convertTools(options.tools) : undefined,
usage: { include: true } // Enable token usage and cost tracking
};
const response = await fetch(`${this.baseUrl}/chat/completions`, {
method: 'POST',
headers: {
...this.buildHeaders(),
'Authorization': `Bearer ${this.apiKey}`,
'HTTP-Referer': this.httpReferer,
'X-Title': this.xTitle
},
body: JSON.stringify(requestBody)
});
if (!response.ok) {
throw new Error(`HTTP ${response.status}: ${response.statusText}`);
}
const data = await response.json();
const text = data.choices?.[0]?.message?.content || '';
const usage = this.extractUsage(data);
const finishReason = data.choices?.[0]?.finish_reason || 'stop';
// Extract web search results if web search was enabled
const webSearchResults = options?.webSearch
? this.extractOpenRouterSources(data)
: undefined;
return this.buildLLMResponse(
text,
baseModel, // Use base model name, not :online version
usage,
{ webSearchResults },
finishReason as 'stop' | 'length' | 'tool_calls' | 'content_filter'
);
} catch (error) {
throw this.handleError(error, 'generation');
}
}
/**
* Generate streaming response using unified stream processing
* Uses processStream which automatically handles SSE parsing and tool call accumulation
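*
* @example
* // Sketch: consuming the stream; chunk fields follow StreamChunk in ../types
* for await (const chunk of adapter.generateStreamAsync('Hello', { maxTokens: 256 })) {
*   // chunks may carry text content, accumulated tool calls, or a finish reason
* }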
*/
async* generateStreamAsync(prompt: string, options?: GenerateOptions): AsyncGenerator<StreamChunk, void, unknown> {
try {
// Validate web search support
if (options?.webSearch) {
WebSearchUtils.validateWebSearchRequest('openrouter', options.webSearch);
}
const baseModel = options?.model || this.currentModel;
// Add :online suffix for web search
const model = options?.webSearch ? `${baseModel}:online` : baseModel;
const messages = options?.conversationHistory || this.buildMessages(prompt, options?.systemPrompt);
// Check if this model requires reasoning preservation (Gemini via OpenRouter)
const needsReasoning = ReasoningPreserver.requiresReasoningPreservation(baseModel, 'openrouter');
const hasTools = options?.tools && options.tools.length > 0;
const requestBody: any = {
model,
messages,
temperature: options?.temperature,
max_tokens: options?.maxTokens,
top_p: options?.topP,
frequency_penalty: options?.frequencyPenalty,
presence_penalty: options?.presencePenalty,
response_format: options?.jsonMode ? { type: 'json_object' } : undefined,
stop: options?.stopSequences,
tools: options?.tools?.length ? this.convertTools(options.tools) : undefined,
stream: true,
// Enable reasoning for Gemini models to capture thought signatures
...ReasoningPreserver.getReasoningRequestParams(baseModel, 'openrouter', hasTools || false)
};
const response = await fetch(`${this.baseUrl}/chat/completions`, {
method: 'POST',
headers: {
...this.buildHeaders(),
'Authorization': `Bearer ${this.apiKey}`,
'HTTP-Referer': this.httpReferer,
'X-Title': this.xTitle
},
body: JSON.stringify(requestBody)
});
if (!response.ok) {
const errorBody = await response.text();
throw new Error(`HTTP ${response.status}: ${response.statusText} - ${errorBody}`);
}
// Track generation ID for async usage retrieval
let generationId: string | null = null;
let usageFetchTriggered = false;
// Track reasoning data for models that need preservation (Gemini via OpenRouter)
// Gemini requires TWO different fields for tool continuations:
// - reasoning_details: array of reasoning objects from OpenRouter
// - thought_signature: string signature required by Google for function call continuations
let capturedReasoning: any[] | undefined = undefined;
let capturedThoughtSignature: string | undefined = undefined;
// Use unified stream processing (automatically uses SSE parsing for Response objects)
yield* this.processStream(response, {
debugLabel: 'OpenRouter',
extractContent: (parsed: any) => {
// Capture generation ID from first chunk
if (!generationId && parsed.id) {
generationId = parsed.id;
}
// Capture reasoning_details for Gemini models (required for tool continuations)
if (needsReasoning && !capturedReasoning) {
capturedReasoning =
parsed.reasoning_details ||
parsed.choices?.[0]?.message?.reasoning_details ||
parsed.choices?.[0]?.delta?.reasoning_details ||
parsed.choices?.[0]?.reasoning_details ||
ReasoningPreserver.extractFromStreamChunk(parsed);
}
// Capture thought_signature for Gemini models (OpenAI compatibility format)
// Per Google docs, this can be in: extra_content.google.thought_signature
// or directly on the delta/message
if (needsReasoning && !capturedThoughtSignature) {
const delta = parsed.choices?.[0]?.delta;
const message = parsed.choices?.[0]?.message;
capturedThoughtSignature =
// OpenAI compatibility format per Google docs
delta?.extra_content?.google?.thought_signature ||
message?.extra_content?.google?.thought_signature ||
parsed.extra_content?.google?.thought_signature ||
// Direct formats
delta?.thought_signature ||
delta?.thoughtSignature ||
message?.thought_signature ||
message?.thoughtSignature ||
parsed.thought_signature ||
parsed.thoughtSignature;
}
// Process all available choices - reasoning models may use multiple choices
for (const choice of parsed.choices || []) {
const delta = choice?.delta;
const content = delta?.content || delta?.text || choice?.text;
if (content) {
return content;
}
}
return null;
},
extractToolCalls: (parsed: any) => {
// Extract tool calls from any choice that has them
for (const choice of parsed.choices || []) {
let toolCalls = choice?.delta?.tool_calls || choice?.delta?.toolCalls;
if (toolCalls) {
// Extract reasoning_details from this chunk (it may contain encrypted thought signatures)
const chunkReasoningDetails = choice?.delta?.reasoning_details;
if (chunkReasoningDetails && Array.isArray(chunkReasoningDetails)) {
// Look for reasoning.encrypted entries - these contain the thought_signature
for (const entry of chunkReasoningDetails) {
if (entry.type === 'reasoning.encrypted' && entry.data && entry.id) {
// Match encrypted entry to tool call by id
for (const tc of toolCalls) {
if (tc.id === entry.id || tc.id?.startsWith(entry.id?.split('_').slice(0, -1).join('_'))) {
tc.thought_signature = entry.data;
}
}
// Also store as fallback
if (!capturedThoughtSignature) {
capturedThoughtSignature = entry.data;
}
}
}
// Update capturedReasoning to include all entries (both text and encrypted)
if (!capturedReasoning) {
capturedReasoning = chunkReasoningDetails;
} else if (Array.isArray(capturedReasoning)) {
// Merge in new entries
capturedReasoning = [...capturedReasoning, ...chunkReasoningDetails];
}
}
// Also check direct thought_signature fields (fallback)
for (const tc of toolCalls) {
const tcThoughtSig =
tc.thought_signature ||
tc.thoughtSignature ||
tc.extra_content?.google?.thought_signature;
if (tcThoughtSig && !tc.thought_signature) {
tc.thought_signature = tcThoughtSig;
}
}
// Attach reasoning data (both reasoning_details AND thought_signature)
const hasReasoning = capturedReasoning || capturedThoughtSignature;
if (hasReasoning) {
toolCalls = ReasoningPreserver.attachToToolCalls(
toolCalls,
{
reasoning_details: capturedReasoning,
thought_signature: capturedThoughtSignature
}
);
}
return toolCalls;
}
}
return null;
},
extractFinishReason: (parsed: any) => {
// Extract finish reason from any choice
for (const choice of parsed.choices || []) {
if (choice?.finish_reason) {
// Last chance to capture thought_signature from final chunk
if (needsReasoning && !capturedThoughtSignature) {
const delta = choice?.delta;
const message = choice?.message;
capturedThoughtSignature =
delta?.extra_content?.google?.thought_signature ||
message?.extra_content?.google?.thought_signature ||
parsed.extra_content?.google?.thought_signature ||
delta?.thought_signature ||
message?.thought_signature ||
parsed.thought_signature ||
choice?.thought_signature;
}
// When we detect completion, trigger async usage fetch (only once)
if (generationId && options?.onUsageAvailable && !usageFetchTriggered) {
usageFetchTriggered = true;
// Fire and forget - don't await
this.fetchAndNotifyUsage(generationId, baseModel, options.onUsageAvailable).catch(() => undefined);
}
return choice.finish_reason;
}
}
return null;
},
extractUsage: (_parsed: any) => {
// OpenRouter doesn't include usage in streaming responses;
// it is fetched asynchronously via the generation ID once completion is detected
return null;
},
// Extract reasoning from reasoning_details array (OpenRouter unified format)
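// Entry shapes handled below (fields inferred from this extractor, not an exhaustive schema):
//   { type: 'reasoning.text', text: '...' }
//   { type: 'reasoning.summary', summary: '...' }
//   { type: 'reasoning.encrypted', id: '...', data: '...' } - consumed in extractToolCalls above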
extractReasoning: (parsed: any) => {
// Check for reasoning_details in delta or message
const reasoningDetails =
parsed.choices?.[0]?.delta?.reasoning_details ||
parsed.choices?.[0]?.message?.reasoning_details ||
parsed.reasoning_details;
if (reasoningDetails && Array.isArray(reasoningDetails)) {
// Find reasoning.text entries (these contain the actual reasoning text)
const textEntries = reasoningDetails.filter((r) => r.type === 'reasoning.text');
if (textEntries.length > 0) {
const reasoningText = textEntries.map((r) => r.text || '').join('');
if (reasoningText) {
return {
text: reasoningText,
complete: false // We can't know if reasoning is complete from streaming
};
}
}
// Also check for reasoning.summary entries
const summaryEntries = reasoningDetails.filter((r) => r.type === 'reasoning.summary');
if (summaryEntries.length > 0) {
const summaryText = summaryEntries.map((r) => r.text || r.summary || '').join('');
if (summaryText) {
return {
text: summaryText,
complete: false
};
}
}
}
return null;
}
});
} catch (error) {
throw this.handleError(error, 'streaming generation');
}
}
/**
* Fetch usage data and notify via callback - runs asynchronously after streaming completes
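*
* @example
* // Sketch: a caller supplies the callback via GenerateOptions (names per this file)
* // onUsageAvailable: (usage, cost) => console.log(usage.totalTokens, cost?.totalCost)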
*/
private async fetchAndNotifyUsage(
generationId: string,
model: string,
onUsageAvailable: (usage: any, cost?: any) => void
): Promise<void> {
const stats = await this.fetchGenerationStats(generationId);
if (!stats) {
return;
}
const usage = {
promptTokens: stats.promptTokens,
completionTokens: stats.completionTokens,
totalTokens: stats.totalTokens
};
// Calculate cost - prefer provider total_cost when present, otherwise fall back to pricing calculation
let cost;
if (stats.totalCost !== undefined) {
cost = {
totalCost: stats.totalCost,
currency: stats.currency || 'USD'
};
} else {
cost = await this.calculateCost(usage, model);
}
// Notify via callback
onUsageAvailable(usage, cost || undefined);
}
/**
* Fetch generation statistics from OpenRouter using the generation ID, with linear backoff
* This is the proper way to get token usage and cost for streaming requests
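* Retry schedule (linear): 1400ms, 1900ms, ..., 6400ms; worst case roughly 43s across 12 attempts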
*/
private async fetchGenerationStats(generationId: string): Promise<{
promptTokens: number;
completionTokens: number;
totalTokens: number;
totalCost?: number;
currency?: string;
} | null> {
// OpenRouter stats can lag ~3-6s; extend retries to reduce 404 noise
const maxRetries = 12;
const baseDelay = 900; // ms; first retry waits baseDelay + incrementDelay = 1400ms
const incrementDelay = 500; // each retry waits 500ms longer than the last
for (let attempt = 0; attempt < maxRetries; attempt++) {
try {
// Linear backoff: 1400ms, 1900ms, 2400ms, ... (baseDelay + incrementDelay * attempt)
if (attempt > 0) {
const delay = baseDelay + (incrementDelay * attempt);
await new Promise(resolve => setTimeout(resolve, delay));
}
const response = await fetch(`${this.baseUrl}/generation?id=${generationId}`, {
method: 'GET',
headers: {
'Authorization': `Bearer ${this.apiKey}`,
'HTTP-Referer': this.httpReferer,
'X-Title': this.xTitle
}
});
if (response.status === 404) {
// Stats not ready yet, retry
continue;
}
if (!response.ok) {
return null;
}
const data = await response.json();
// Extract token counts from response
// OpenRouter returns: tokens_prompt, tokens_completion, native_tokens_prompt, native_tokens_completion
const promptTokens = data.data?.native_tokens_prompt || data.data?.tokens_prompt || 0;
const completionTokens = data.data?.native_tokens_completion || data.data?.tokens_completion || 0;
const totalCost = data.data?.total_cost ?? undefined;
const currency = 'USD';
if (promptTokens > 0 || completionTokens > 0) {
return {
promptTokens,
completionTokens,
totalTokens: promptTokens + completionTokens,
totalCost,
currency
};
}
// Data returned but no tokens - might not be ready yet
} catch (error) {
if (attempt === maxRetries - 1) {
return null;
}
}
}
return null;
}
/**
* List available models
*/
async listModels(): Promise<ModelInfo[]> {
try {
// Use centralized model registry
const openrouterModels = ModelRegistry.getProviderModels('openrouter');
return openrouterModels.map(model => ModelRegistry.toModelInfo(model));
} catch (error) {
this.handleError(error, 'listing models');
return [];
}
}
/**
* Get provider capabilities
*/
getCapabilities(): ProviderCapabilities {
return {
supportsStreaming: true,
supportsJSON: true,
supportsImages: true,
supportsFunctions: true,
supportsThinking: false,
maxContextWindow: 2000000, // Upper bound; the effective window varies by model
supportedFeatures: [
'streaming',
'json_mode',
'function_calling',
'image_input',
'400+ models'
]
};
}
/**
* Execute detected tool calls from streaming and get AI response
* Used for post-stream tool execution - implements pingpong pattern
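*
* @example
* // Message sequence for the pingpong round trip:
* //   user prompt -> assistant message w/ tool_calls -> tool result messages -> final completion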
*/
private async executeDetectedToolCalls(detectedToolCalls: any[], model: string, prompt: string, options?: GenerateOptions): Promise<LLMResponse> {
try {
// Convert to MCP format
const mcpToolCalls: any[] = detectedToolCalls.map((tc) => ({
id: tc.id,
function: {
name: tc.function?.name || tc.name,
arguments: tc.function?.arguments || JSON.stringify(tc.parameters || {})
}
}));
// Execute tool calls directly using MCPToolExecution
// Note: This path is deprecated - tool execution now happens in StreamingOrchestrator
// Passing null will return error results for all tools
const toolResults = await MCPToolExecution.executeToolCalls(
null, // No toolExecutor available in adapter context
mcpToolCalls,
'openrouter',
options?.onToolEvent
);
// Now do the "pingpong" - send the conversation with tool results back to the LLM
const messages = this.buildMessages(prompt, options?.systemPrompt);
// Build assistant message with reasoning preserved using centralized utility
const assistantMessage = ReasoningPreserver.buildAssistantMessageWithReasoning(
detectedToolCalls,
'' // Empty content since this was a tool call
);
messages.push(assistantMessage);
// Add tool result messages
const toolMessages = MCPToolExecution.buildToolMessages(toolResults, 'openrouter');
messages.push(...toolMessages);
// Make API call to get AI's response to the tool results
const requestBody = {
model,
messages,
temperature: options?.temperature,
max_tokens: options?.maxTokens,
top_p: options?.topP,
frequency_penalty: options?.frequencyPenalty,
presence_penalty: options?.presencePenalty,
response_format: options?.jsonMode ? { type: 'json_object' } : undefined,
stop: options?.stopSequences,
usage: { include: true } // Enable token usage and cost tracking
};
const response = await fetch(`${this.baseUrl}/chat/completions`, {
method: 'POST',
headers: {
...this.buildHeaders(),
'Authorization': `Bearer ${this.apiKey}`,
'HTTP-Referer': this.httpReferer,
'X-Title': this.xTitle
},
body: JSON.stringify(requestBody)
});
if (!response.ok) {
throw new Error(`HTTP ${response.status}: ${response.statusText}`);
}
const data = await response.json();
const choice = data.choices?.[0];
const finalContent = choice?.message?.content || 'No response from AI after tool execution';
const usage = this.extractUsage(data);
// Combine original tool calls with their execution results
const completeToolCalls = detectedToolCalls.map(originalCall => {
const result = toolResults.find(r => r.id === originalCall.id);
// Guard against malformed argument strings so one bad tool call can't crash the response
let parameters: Record<string, unknown> = {};
try {
parameters = JSON.parse(originalCall.function?.arguments || '{}');
} catch {
parameters = originalCall.parameters || {};
}
return {
id: originalCall.id,
name: originalCall.function?.name || originalCall.name,
parameters,
result: result?.result,
success: result?.success || false,
error: result?.error,
executionTime: result?.executionTime
};
});
// Return LLMResponse with AI's natural language response to tool results
return this.buildLLMResponse(
finalContent,
model,
usage,
MCPToolExecution.buildToolMetadata(toolResults),
choice?.finish_reason || 'stop',
completeToolCalls
);
} catch (error) {
console.error('OpenRouter adapter post-stream tool execution failed:', error);
throw this.handleError(error, 'post-stream tool execution');
}
}
/**
* Extract search results from OpenRouter response annotations
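*
* @example
* // Annotation shape consumed here (fields inferred from this extractor; payloads may vary):
* // { type: 'url_citation', url_citation: { url: '...', title: '...', date: '...' } }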
*/
private extractOpenRouterSources(response: any): SearchResult[] {
try {
type UrlCitation = { title?: string; text?: string; url?: string; date?: string; timestamp?: string };
type Annotation = { type: string; url_citation?: UrlCitation };
const annotations: Annotation[] = response.choices?.[0]?.message?.annotations || [];
return annotations
.filter((ann) => ann.type === 'url_citation')
.map((ann) => {
const citation = ann.url_citation;
return WebSearchUtils.validateSearchResult({
title: citation?.title || citation?.text || 'Unknown Source',
url: citation?.url,
date: citation?.date || citation?.timestamp
});
})
.filter((result: SearchResult | null): result is SearchResult => result !== null);
} catch (error) {
return [];
}
}
/**
* Get model pricing
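*
* @example
* // Sketch: USD-per-million-token rates from the local ModelRegistry (model id illustrative)
* const pricing = await adapter.getModelPricing('anthropic/claude-3.5-sonnet');
* // pricing?.rateInputPerMillion / pricing?.rateOutputPerMillion, or null if unknown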
*/
async getModelPricing(modelId: string): Promise<ModelPricing | null> {
try {
const models = ModelRegistry.getProviderModels('openrouter');
const model = models.find(m => m.apiName === modelId);
if (!model) {
return null;
}
return {
rateInputPerMillion: model.inputCostPerMillion,
rateOutputPerMillion: model.outputCostPerMillion,
currency: 'USD'
};
} catch (error) {
return null;
}
}
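/**
* Normalize tool definitions into OpenRouter's nested Chat Completions shape.
*
* @example
* // Both inputs normalize to the same nested output (tool name illustrative):
* // flat (Responses API):      { type: 'function', name: 'get_time', parameters: {...} }
* // nested (Chat Completions): { type: 'function', function: { name: 'get_time', parameters: {...} } }
*/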
private convertTools(tools: any[]): any[] {
return tools.map(tool => {
if (tool.type === 'function') {
// Handle both nested (Chat Completions) and flat (Responses API) formats
const toolDef = tool.function || tool;
return {
type: 'function',
function: {
name: toolDef.name,
description: toolDef.description,
parameters: toolDef.parameters || toolDef.input_schema
}
};
}
return tool;
});
}
}