/**
 * Vercel AI Provider Implementation
 *
 * Implements the AIProvider interface using the Vercel AI SDK.
 * Supports OpenAI, Google Gemini, and Anthropic through a unified interface.
 */
import { generateText, jsonSchema, tool, stepCountIs } from 'ai';
import { createOpenAI } from '@ai-sdk/openai';
import { createGoogleGenerativeAI } from '@ai-sdk/google';
import { createAnthropic } from '@ai-sdk/anthropic';
import {
AIProvider,
AIResponse,
AIProviderConfig,
ToolLoopConfig,
AgenticResult
} from '../ai-provider.interface';
import { generateDebugId, debugLogInteraction, logMetrics, createAndLogAgenticResult } from './provider-debug-utils';
/**
* Provider-specific default models
*/
const PROVIDER_MODELS = {
openai: 'gpt-5',
google: 'gemini-2.5-pro',
anthropic: 'claude-sonnet-4-5-20250929'
} as const;
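// e.g. `new VercelProvider({ provider: 'google', apiKey })` resolves to
// 'gemini-2.5-pro' unless config.model overrides it (see the constructor below).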
type SupportedProvider = keyof typeof PROVIDER_MODELS;
export class VercelProvider implements AIProvider {
private providerType: SupportedProvider;
private model: string;
private apiKey: string;
private debugMode: boolean;
private modelInstance: any; // Vercel AI SDK model instance
constructor(config: AIProviderConfig) {
this.apiKey = config.apiKey;
this.providerType = config.provider as SupportedProvider;
this.model = config.model || this.getDefaultModel();
this.debugMode = config.debugMode ?? (process.env.DEBUG_DOT_AI === 'true');
this.validateConfiguration();
this.initializeModel();
}
private validateConfiguration(): void {
if (!this.apiKey) {
throw new Error(`API key is required for ${this.providerType} provider`);
}
    if (!(this.providerType in PROVIDER_MODELS)) {
      throw new Error(`Unsupported provider: ${this.providerType}. Must be one of: ${Object.keys(PROVIDER_MODELS).join(', ')}`);
    }
}
private initializeModel(): void {
try {
switch (this.providerType) {
case 'openai': {
const provider = createOpenAI({
apiKey: this.apiKey
});
this.modelInstance = provider(this.model);
break;
}
case 'google': {
const provider = createGoogleGenerativeAI({
apiKey: this.apiKey
});
this.modelInstance = provider(this.model);
break;
}
case 'anthropic': {
const provider = createAnthropic({
apiKey: this.apiKey
});
this.modelInstance = provider(this.model);
break;
}
default:
throw new Error(`Cannot initialize model for provider: ${this.providerType}`);
}
} catch (error) {
      throw new Error(`Failed to initialize ${this.providerType} model: ${error instanceof Error ? error.message : String(error)}`);
}
}
getProviderType(): string {
return 'vercel';
}
getDefaultModel(): string {
return PROVIDER_MODELS[this.providerType];
}
isInitialized(): boolean {
return this.modelInstance !== undefined;
}
private logDebugIfEnabled(
operation: string,
prompt: string,
response: AIResponse,
durationMs: number
): void {
if (!this.debugMode) return;
const debugId = generateDebugId(operation);
debugLogInteraction(debugId, prompt, response, operation, this.getProviderType(), this.model, this.debugMode);
// Use logMetrics for sendMessage calls (simple token structure, no extended metrics)
logMetrics(operation, this.getProviderType(), {
totalTokens: {
input: response.usage.input_tokens,
output: response.usage.output_tokens,
cacheCreation: response.usage.cache_creation_input_tokens,
cacheRead: response.usage.cache_read_input_tokens
}
}, durationMs, this.debugMode);
}
async sendMessage(message: string, operation: string = 'generic'): Promise<AIResponse> {
if (!this.isInitialized()) {
throw new Error(`${this.providerType} provider not initialized`);
}
const startTime = Date.now();
try {
// Use Vercel AI SDK generateText
// Note: maxTokens omitted - let SDK/provider use model-specific optimal defaults
const result = await generateText({
model: this.modelInstance,
prompt: message,
});
const response: AIResponse = {
content: result.text,
usage: {
input_tokens: result.usage.inputTokens || 0,
output_tokens: result.usage.outputTokens || 0
}
};
const durationMs = Date.now() - startTime;
      // Debug log the interaction if enabled (delegates to logDebugIfEnabled so
      // sendMessage and future call sites share a single logging path)
      this.logDebugIfEnabled(operation, message, response, durationMs);
return response;
} catch (error) {
      throw new Error(`${this.providerType} API error: ${error instanceof Error ? error.message : String(error)}`);
}
}
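  // Illustrative call and normalized result shape (values hypothetical):
  //   const reply = await provider.sendMessage('ping', 'healthcheck');
  //   // => { content: 'pong', usage: { input_tokens: 3, output_tokens: 1 } }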
  /**
   * Agentic tool loop using the Vercel AI SDK
   *
   * Implements multi-turn tool calling via generateText with
   * `stopWhen: stepCountIs(maxIterations)`; the SDK runs the
   * conversation loop automatically.
   *
   * Provider-specific caching:
   * - Anthropic: manual cache control via providerOptions
   * - OpenAI: automatic caching (no code changes needed)
   * - Google: not yet wired up; see the Gemini TODOs below
   *
   * See PRD #143 Milestone 2.5 for Vercel provider implementation details.
   */
async toolLoop(config: ToolLoopConfig): Promise<AgenticResult> {
if (!this.isInitialized()) {
throw new Error(`${this.providerType} provider not initialized`);
}
const startTime = Date.now();
const maxIterations = config.maxIterations || 20;
const operation = config.operation || 'tool-loop';
// Convert AITool[] to Vercel AI SDK tool format
const tools: Record<string, any> = {};
for (let i = 0; i < config.tools.length; i++) {
const aiTool = config.tools[i];
const isLastTool = i === config.tools.length - 1;
const toolDef = tool({
description: aiTool.description,
inputSchema: jsonSchema(aiTool.inputSchema),
execute: async (input: any) => {
return await config.toolExecutor(aiTool.name, input);
}
});
// Add cache control ONLY to last tool for Anthropic (max 4 cache breakpoints)
// This caches the system prompt + all tools together
if (this.providerType === 'anthropic' && isLastTool) {
(toolDef as any).providerOptions = {
anthropic: {
cacheControl: { type: 'ephemeral' }
}
};
}
// TODO: Check if Google Gemini supports caching in future SDK versions
// Google Gemini may have caching capabilities - research providerOptions.google syntax
// if (this.providerType === 'google' && isLastTool) {
// (toolDef as any).providerOptions = {
// google: { /* caching config if available */ }
// };
// }
tools[aiTool.name] = toolDef;
}
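    // Illustrative shape of the converted record (tool names hypothetical):
    //   tools = { get_pod_logs: tool({ description, inputSchema, execute }), ... }
    // with providerOptions.anthropic.cacheControl attached only to the final
    // entry, so the system prompt + all tool definitions cache as one prefix.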
// Build messages array with system prompt caching for Anthropic
// Anthropic caching requires system messages in messages array with providerOptions
const messages: any[] = [];
let systemParam: string | undefined;
if (this.providerType === 'anthropic') {
// For Anthropic: Put system in messages array with cacheControl
messages.push({
role: 'system',
content: config.systemPrompt,
providerOptions: {
anthropic: {
cacheControl: { type: 'ephemeral' }
}
}
});
// Don't use system parameter for Anthropic when caching
systemParam = undefined;
} else {
// For OpenAI/Google: Use system parameter (string)
systemParam = config.systemPrompt;
}
// Add user message
messages.push({
role: 'user',
content: config.userMessage
});
// TODO: Check if Google Gemini supports system prompt caching in future SDK versions
// if (this.providerType === 'google') {
// messages.unshift({
// role: 'system',
// content: config.systemPrompt,
// providerOptions: {
// google: { /* caching config if available */ }
// }
// });
// systemParam = undefined;
// }
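    // Resulting request shape at this point (illustrative):
    //   Anthropic:     messages = [system (cacheControl: ephemeral), user]; no `system` param
    //   OpenAI/Google: messages = [user]; system = config.systemPrompt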
try {
// Use Vercel AI SDK's generateText with stopWhen for automatic loop
// Default is stepCountIs(1) - we need to increase for multi-step investigation
const generateConfig: any = {
model: this.modelInstance,
messages,
tools,
stopWhen: stepCountIs(maxIterations)
};
// Add system parameter for non-Anthropic providers
if (systemParam) {
generateConfig.system = systemParam;
}
const result = await generateText(generateConfig);
// Debug: Log the full cumulative context that was actually sent to the AI
if (this.debugMode && result.response?.messages) {
const path = await import('path');
const debugId = generateDebugId(`${operation}-final-context`);
const debugDir = path.join(process.cwd(), 'tmp', 'debug-ai');
const contextFile = path.join(debugDir, `${debugId}_full-context.md`);
        // Build full conversation history representation
        // (renamed to avoid shadowing the request `messages` array built above)
        const responseMessages = result.response.messages;
        const contextParts = [`# Full Conversation Context - ${operation}\n`];
        contextParts.push(`\nTimestamp: ${new Date().toISOString()}`);
        contextParts.push(`Provider: ${this.getProviderType()}`);
        contextParts.push(`Model: ${this.model}`);
        contextParts.push(`Total Messages: ${responseMessages.length}`);
        contextParts.push(`Total Steps: ${result.steps?.length || 0}`);
        contextParts.push('\n---\n');
        for (let i = 0; i < responseMessages.length; i++) {
          const msg = responseMessages[i];
          contextParts.push(`\n## Message ${i + 1} - Role: ${msg.role}\n`);
if (typeof msg.content === 'string') {
contextParts.push(msg.content);
} else if (Array.isArray(msg.content)) {
for (const part of msg.content) {
if (part.type === 'text') {
contextParts.push((part as any).text || '');
} else if (part.type === 'tool-call') {
contextParts.push(`\n[TOOL CALL: ${(part as any).toolName}]`);
                contextParts.push(JSON.stringify((part as any).input ?? (part as any).args, null, 2)); // AI SDK v5 renamed args -> input
} else if (part.type === 'tool-result') {
contextParts.push(`\n[TOOL RESULT: ${(part as any).toolName}]`);
const resultData = (part as any).output || (part as any).result || (part as any).content || part;
contextParts.push(JSON.stringify(resultData, null, 2));
}
}
}
}
        const fs = await import('fs');
        fs.mkdirSync(debugDir, { recursive: true }); // ensure tmp/debug-ai exists before writing
        fs.writeFileSync(contextFile, contextParts.join('\n'));
console.log(`🐛 DEBUG: Full conversation context logged to ${contextFile}`);
}
// Extract tool call history from steps
const toolCallsExecuted: Array<{ tool: string; input: any; output: any }> = [];
for (const step of result.steps || []) {
for (const toolCall of step.toolCalls || []) {
const toolResult = step.toolResults?.find(
(tr: any) => tr.toolCallId === toolCall.toolCallId
);
          toolCallsExecuted.push({
            tool: (toolCall as any).toolName,
            input: (toolCall as any).input ?? (toolCall as any).args, // AI SDK v5 renamed args -> input
            output: (toolResult as any)?.output ?? (toolResult as any)?.result // v5 renamed result -> output
          });
}
}
// Normalize token metrics across providers
// NOTE: Vercel AI SDK had token reporting bugs that were fixed in PR #8945 (merged Sept 26, 2025)
// - GitHub Issue #8349: cache tokens only reflected last step, not summed across all steps
// - GitHub Issue #8795: Token reporting issues with Anthropic provider (streaming)
// Our version (5.0.60, released Oct 2, 2025) includes these fixes.
// However, testing still shows ~70% fewer tokens reported vs Anthropic native SDK.
// Root cause unknown - may be additional unreported bugs or different calculation methods.
const usage = result.usage;
let cacheReadTokens = 0;
let cacheCreationTokens = 0;
// Anthropic via Vercel uses cachedInputTokens
if ((usage as any).cachedInputTokens) {
cacheReadTokens = (usage as any).cachedInputTokens;
}
// OpenAI uses cached_tokens or cachedTokens (automatic caching, no config needed)
if ('cachedTokens' in usage || (usage as any).cached_tokens) {
cacheReadTokens = (usage as any).cachedTokens || (usage as any).cached_tokens || 0;
}
// Anthropic native SDK uses separate cache_creation and cache_read fields
if ((usage as any).cache_creation_input_tokens) {
cacheCreationTokens = (usage as any).cache_creation_input_tokens;
}
if ((usage as any).cache_read_input_tokens) {
cacheReadTokens = (usage as any).cache_read_input_tokens;
}
// TODO: Check if Google Gemini reports cache metrics in future SDK versions
// Google Gemini may return cache-related metrics - check usage object structure
// Possible fields: cachedTokens, cacheHits, or provider-specific naming
// Add normalization logic here when Gemini caching is confirmed
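      // Illustrative usage payloads this normalization expects (fields vary by
      // provider and SDK version; presence of each is probed defensively above):
      //   Anthropic via Vercel: { inputTokens, outputTokens, cachedInputTokens }
      //   OpenAI via Vercel:    { inputTokens, outputTokens, cachedTokens | cached_tokens }
      //   Anthropic native:     { ..., cache_creation_input_tokens, cache_read_input_tokens }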
// Extract final text from the last step (result.text might be empty if last step had tool calls)
let finalText = result.text;
if (!finalText || finalText.trim().length === 0) {
// If result.text is empty, find the last text response from steps
for (let i = (result.steps || []).length - 1; i >= 0; i--) {
const step = result.steps![i];
if (step.text && step.text.trim().length > 0) {
finalText = step.text;
break;
}
}
}
return createAndLogAgenticResult({
finalMessage: finalText || '',
iterations: result.steps?.length || 1,
toolCallsExecuted,
totalTokens: {
input: usage.inputTokens || 0,
output: usage.outputTokens || 0,
cacheCreation: cacheCreationTokens,
cacheRead: cacheReadTokens
},
status: 'success',
        completionReason: 'investigation_complete', // also reported when the stepCountIs cap halts the loop
modelVersion: this.model,
operation: `${operation}-summary`,
sdk: this.getProviderType(),
startTime,
debugMode: this.debugMode
});
} catch (error) {
// Return error result with extended metrics
return createAndLogAgenticResult({
finalMessage: `Error during investigation: ${error instanceof Error ? error.message : String(error)}`,
iterations: 0,
toolCallsExecuted: [],
totalTokens: {
input: 0,
output: 0,
cacheCreation: 0,
cacheRead: 0
},
status: 'failed',
completionReason: 'error',
modelVersion: this.model,
operation: `${operation}-error`,
sdk: this.getProviderType(),
startTime,
debugMode: this.debugMode
});
}
}
}
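
// ---------------------------------------------------------------------------
// Usage sketch (illustrative only; never invoked at runtime). Shows how a
// caller might drive the provider end to end. The tool name, schema, executor,
// and the exact ToolLoopConfig/AgenticResult field names are inferred from how
// this file consumes them, so treat this as a sketch rather than a contract.
// ---------------------------------------------------------------------------
export async function exampleVercelProviderUsage(): Promise<void> {
  const provider = new VercelProvider({
    provider: 'anthropic',
    apiKey: process.env.ANTHROPIC_API_KEY || ''
  } as AIProviderConfig);

  // One-shot prompt: returns text plus normalized token usage.
  const reply = await provider.sendMessage('Summarize the cluster state', 'summary');
  console.log(reply.content, reply.usage);

  // Agentic loop: the SDK keeps calling the hypothetical get_pod_logs tool
  // until the model stops requesting tools or maxIterations is reached.
  const result = await provider.toolLoop({
    systemPrompt: 'You are a Kubernetes troubleshooting assistant.',
    userMessage: 'Why is pod web-7f9c crash-looping?',
    tools: [{
      name: 'get_pod_logs',
      description: 'Fetch recent logs for a named pod',
      inputSchema: {
        type: 'object',
        properties: { pod: { type: 'string' } },
        required: ['pod']
      }
    }],
    toolExecutor: async (_name: string, input: any) => ({ logs: `logs for ${input.pod}` }),
    maxIterations: 10,
    operation: 'diagnose-pod'
  } as ToolLoopConfig);
  console.log(result.finalMessage);
}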