AutoDev Codebase MCP Server

openai-compatible.spec.ts•16.7 KiB

import { vitest, describe, it, expect, beforeEach, afterEach, vi } from "vitest" import type { MockedClass, MockedFunction } from "vitest" import { OpenAI } from "openai" import { OpenAICompatibleEmbedder } from "../openai-compatible" import { MAX_BATCH_TOKENS, MAX_ITEM_TOKENS, MAX_BATCH_RETRIES, INITIAL_RETRY_DELAY_MS } from "../../constants" // Mock the OpenAI SDK vitest.mock("openai") const MockedOpenAI = OpenAI as MockedClass<typeof OpenAI> describe("OpenAICompatibleEmbedder", () => { let embedder: OpenAICompatibleEmbedder let mockOpenAIInstance: any let mockEmbeddingsCreate: MockedFunction<any> const testBaseUrl = "https://api.siliconflow.cn/v1" const testApiKey = "sk-xxxxx" const testModelId = "Qwen/Qwen3-Embedding-4B" beforeEach(() => { vitest.clearAllMocks() vitest.spyOn(console, "warn").mockImplementation(() => {}) vitest.spyOn(console, "error").mockImplementation(() => {}) // Setup mock OpenAI instance mockEmbeddingsCreate = vitest.fn() mockOpenAIInstance = { embeddings: { create: mockEmbeddingsCreate, }, } MockedOpenAI.mockImplementation(() => mockOpenAIInstance) }) afterEach(() => { vitest.restoreAllMocks() }) describe("constructor", () => { it("should create embedder with valid configuration", () => { embedder = new OpenAICompatibleEmbedder(testBaseUrl, testApiKey, testModelId) expect(MockedOpenAI).toHaveBeenCalledWith({ baseURL: testBaseUrl, apiKey: testApiKey, }) expect(embedder).toBeDefined() }) it("should use default model when modelId is not provided", () => { embedder = new OpenAICompatibleEmbedder(testBaseUrl, testApiKey) expect(MockedOpenAI).toHaveBeenCalledWith({ baseURL: testBaseUrl, apiKey: testApiKey, }) expect(embedder).toBeDefined() }) it("should throw error when baseUrl is missing", () => { expect(() => new OpenAICompatibleEmbedder("", testApiKey, testModelId)).toThrow( "Base URL is required for OpenAI Compatible embedder", ) }) it("should throw error when apiKey is missing", () => { expect(() => new OpenAICompatibleEmbedder(testBaseUrl, "", testModelId)).toThrow( "API key is required for OpenAI Compatible embedder", ) }) it("should throw error when both baseUrl and apiKey are missing", () => { expect(() => new OpenAICompatibleEmbedder("", "", testModelId)).toThrow( "Base URL is required for OpenAI Compatible embedder", ) }) }) describe("embedderInfo", () => { beforeEach(() => { embedder = new OpenAICompatibleEmbedder(testBaseUrl, testApiKey, testModelId) }) it("should return correct embedder info", () => { const info = embedder.embedderInfo expect(info).toEqual({ name: "openai-compatible", }) }) }) describe("createEmbeddings", () => { beforeEach(() => { embedder = new OpenAICompatibleEmbedder(testBaseUrl, testApiKey, testModelId) }) it("should create embeddings for single text", async () => { const testTexts = ["Hello world"] const mockResponse = { data: [{ embedding: [0.1, 0.2, 0.3] }], usage: { prompt_tokens: 10, total_tokens: 15 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(mockEmbeddingsCreate).toHaveBeenCalledWith({ input: testTexts, model: testModelId, encoding_format: "base64", }) expect(result).toEqual({ embeddings: [[0.1, 0.2, 0.3]], usage: { promptTokens: 10, totalTokens: 15 }, }) }) it("should create embeddings for multiple texts", async () => { const testTexts = ["Hello world", "Goodbye world"] const mockResponse = { data: [{ embedding: [0.1, 0.2, 0.3] }, { embedding: [0.4, 0.5, 0.6] }], usage: { prompt_tokens: 20, total_tokens: 30 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(mockEmbeddingsCreate).toHaveBeenCalledWith({ input: testTexts, model: testModelId, encoding_format: "base64", }) expect(result).toEqual({ embeddings: [ [0.1, 0.2, 0.3], [0.4, 0.5, 0.6], ], usage: { promptTokens: 20, totalTokens: 30 }, }) }) it("should use custom model when provided", async () => { const testTexts = ["Hello world"] const customModel = "custom-embedding-model" const mockResponse = { data: [{ embedding: [0.1, 0.2, 0.3] }], usage: { prompt_tokens: 10, total_tokens: 15 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) await embedder.createEmbeddings(testTexts, customModel) expect(mockEmbeddingsCreate).toHaveBeenCalledWith({ input: testTexts, model: customModel, encoding_format: "base64", }) }) it("should handle missing usage data gracefully", async () => { const testTexts = ["Hello world"] const mockResponse = { data: [{ embedding: [0.1, 0.2, 0.3] }], usage: undefined, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(result).toEqual({ embeddings: [[0.1, 0.2, 0.3]], usage: { promptTokens: 0, totalTokens: 0 }, }) }) /** * Test base64 conversion logic */ describe("base64 conversion", () => { it("should convert base64 encoded embeddings to float arrays", async () => { const testTexts = ["Hello world"] // Create a Float32Array with test values that can be exactly represented in Float32 const testEmbedding = new Float32Array([0.25, 0.5, 0.75, 1.0]) // Convert to base64 string (simulating what OpenAI API returns) const buffer = Buffer.from(testEmbedding.buffer) const base64String = buffer.toString("base64") const mockResponse = { data: [{ embedding: base64String }], // Base64 string instead of array usage: { prompt_tokens: 10, total_tokens: 15 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(mockEmbeddingsCreate).toHaveBeenCalledWith({ input: testTexts, model: testModelId, encoding_format: "base64", }) // Verify the base64 string was converted back to the original float array expect(result).toEqual({ embeddings: [[0.25, 0.5, 0.75, 1.0]], usage: { promptTokens: 10, totalTokens: 15 }, }) }) it("should handle multiple base64 encoded embeddings", async () => { const testTexts = ["Hello world", "Goodbye world"] // Create test embeddings with values that can be exactly represented in Float32 const embedding1 = new Float32Array([0.25, 0.5, 0.75]) const embedding2 = new Float32Array([1.0, 1.25, 1.5]) // Convert to base64 strings const base64String1 = Buffer.from(embedding1.buffer).toString("base64") const base64String2 = Buffer.from(embedding2.buffer).toString("base64") const mockResponse = { data: [{ embedding: base64String1 }, { embedding: base64String2 }], usage: { prompt_tokens: 20, total_tokens: 30 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(result).toEqual({ embeddings: [ [0.25, 0.5, 0.75], [1.0, 1.25, 1.5], ], usage: { promptTokens: 20, totalTokens: 30 }, }) }) it("should handle mixed base64 and array embeddings", async () => { const testTexts = ["Hello world", "Goodbye world"] // Create one base64 embedding and one regular array (edge case) const embedding1 = new Float32Array([0.25, 0.5, 0.75]) const base64String1 = Buffer.from(embedding1.buffer).toString("base64") const mockResponse = { data: [ { embedding: base64String1 }, // Base64 string { embedding: [1.0, 1.25, 1.5] }, // Regular array ], usage: { prompt_tokens: 20, total_tokens: 30 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) const result = await embedder.createEmbeddings(testTexts) expect(result).toEqual({ embeddings: [ [0.25, 0.5, 0.75], [1.0, 1.25, 1.5], ], usage: { promptTokens: 20, totalTokens: 30 }, }) }) }) /** * Test batching logic when texts exceed token limits */ describe("batching logic", () => { it("should process texts in batches", async () => { // Use normal sized texts that won't be skipped const testTexts = ["text1", "text2", "text3"] mockEmbeddingsCreate.mockResolvedValue({ data: [ { embedding: [0.1, 0.2, 0.3] }, { embedding: [0.4, 0.5, 0.6] }, { embedding: [0.7, 0.8, 0.9] }, ], usage: { prompt_tokens: 10, total_tokens: 15 }, }) await embedder.createEmbeddings(testTexts) // Should be called once for normal texts expect(mockEmbeddingsCreate).toHaveBeenCalledTimes(1) }) it("should skip texts that exceed MAX_ITEM_TOKENS", async () => { const normalText = "Hello world" const oversizedText = "a".repeat(MAX_ITEM_TOKENS * 5) // Exceeds MAX_ITEM_TOKENS const testTexts = [normalText, oversizedText, normalText] const mockResponse = { data: [{ embedding: [0.1, 0.2, 0.3] }, { embedding: [0.4, 0.5, 0.6] }], usage: { prompt_tokens: 10, total_tokens: 15 }, } mockEmbeddingsCreate.mockResolvedValue(mockResponse) await embedder.createEmbeddings(testTexts) // Should warn about oversized text expect(console.warn).toHaveBeenCalledWith(expect.stringContaining("exceeds maximum token limit")) // Should only process normal texts (1 call for 2 normal texts batched together) expect(mockEmbeddingsCreate).toHaveBeenCalledTimes(1) }) it("should return correct usage statistics", async () => { const testTexts = ["text1", "text2"] mockEmbeddingsCreate.mockResolvedValue({ data: [{ embedding: [0.1, 0.2, 0.3] }, { embedding: [0.4, 0.5, 0.6] }], usage: { prompt_tokens: 10, total_tokens: 15 }, }) const result = await embedder.createEmbeddings(testTexts) expect(result.usage).toEqual({ promptTokens: 10, totalTokens: 15, }) }) }) /** * Test retry logic with exponential backoff */ describe("retry logic", () => { beforeEach(() => { vitest.useFakeTimers() }) afterEach(() => { vitest.useRealTimers() }) it("should retry on rate limit errors with exponential backoff", async () => { const testTexts = ["Hello world"] const rateLimitError = { status: 429, message: "Rate limit exceeded" } // Create base64 encoded embedding for successful response const testEmbedding = new Float32Array([0.25, 0.5, 0.75]) const base64String = Buffer.from(testEmbedding.buffer).toString("base64") mockEmbeddingsCreate .mockRejectedValueOnce(rateLimitError) .mockRejectedValueOnce(rateLimitError) .mockResolvedValueOnce({ data: [{ embedding: base64String }], usage: { prompt_tokens: 10, total_tokens: 15 }, }) const resultPromise = embedder.createEmbeddings(testTexts) // Fast-forward through the delays await vitest.advanceTimersByTimeAsync(INITIAL_RETRY_DELAY_MS) // First retry delay await vitest.advanceTimersByTimeAsync(INITIAL_RETRY_DELAY_MS * 2) // Second retry delay const result = await resultPromise expect(mockEmbeddingsCreate).toHaveBeenCalledTimes(3) expect(console.warn).toHaveBeenCalledWith(expect.stringContaining("Rate limit hit, retrying in")) expect(result).toEqual({ embeddings: [[0.25, 0.5, 0.75]], usage: { promptTokens: 10, totalTokens: 15 }, }) }) it("should not retry on non-rate-limit errors", async () => { const testTexts = ["Hello world"] const authError = new Error("Unauthorized") ;(authError as any).status = 401 mockEmbeddingsCreate.mockRejectedValue(authError) await expect(embedder.createEmbeddings(testTexts)).rejects.toThrow( "Failed to create embeddings: batch processing error", ) expect(mockEmbeddingsCreate).toHaveBeenCalledTimes(1) expect(console.warn).not.toHaveBeenCalledWith(expect.stringContaining("Rate limit hit")) }) it("should throw error immediately on non-retryable errors", async () => { const testTexts = ["Hello world"] const serverError = new Error("Internal server error") ;(serverError as any).status = 500 mockEmbeddingsCreate.mockRejectedValue(serverError) await expect(embedder.createEmbeddings(testTexts)).rejects.toThrow( "Failed to create embeddings: batch processing error", ) expect(mockEmbeddingsCreate).toHaveBeenCalledTimes(1) }) }) /** * Test error handling scenarios */ describe("error handling", () => { it("should handle API errors gracefully", async () => { const testTexts = ["Hello world"] const apiError = new Error("API connection failed") mockEmbeddingsCreate.mockRejectedValue(apiError) await expect(embedder.createEmbeddings(testTexts)).rejects.toThrow( "Failed to create embeddings: batch processing error", ) expect(console.error).toHaveBeenCalledWith( expect.stringContaining("Failed to process batch"), expect.any(Error), ) }) it("should handle batch processing errors", async () => { const testTexts = ["text1", "text2"] const batchError = new Error("Batch processing failed") mockEmbeddingsCreate.mockRejectedValue(batchError) await expect(embedder.createEmbeddings(testTexts)).rejects.toThrow( "Failed to create embeddings: batch processing error", ) expect(console.error).toHaveBeenCalledWith("Failed to process batch:", batchError) }) it("should handle empty text arrays", async () => { const testTexts: string[] = [] const result = await embedder.createEmbeddings(testTexts) expect(result).toEqual({ embeddings: [], usage: { promptTokens: 0, totalTokens: 0 }, }) expect(mockEmbeddingsCreate).not.toHaveBeenCalled() }) it("should handle malformed API responses", async () => { const testTexts = ["Hello world"] const malformedResponse = { data: null, usage: { prompt_tokens: 10, total_tokens: 15 }, } mockEmbeddingsCreate.mockResolvedValue(malformedResponse) await expect(embedder.createEmbeddings(testTexts)).rejects.toThrow() }) }) /** * Test to confirm OpenAI package bug with base64 encoding * This test verifies that when we request encoding_format: "base64", * the OpenAI package returns unparsed base64 strings as expected. * This is the behavior we rely on in our workaround. */ describe("OpenAI package base64 behavior verification", () => { it("should return unparsed base64 when encoding_format is base64", async () => { const testTexts = ["Hello world"] // Create a real OpenAI instance to test the actual package behavior const realOpenAI = new ((await vi.importActual("openai")) as any).OpenAI({ baseURL: testBaseUrl, apiKey: testApiKey, }) // Create test embedding data as base64 using values that can be exactly represented in Float32 const testEmbedding = new Float32Array([0.25, 0.5, 0.75, 1.0]) const buffer = Buffer.from(testEmbedding.buffer) const base64String = buffer.toString("base64") // Mock the raw API response that would come from OpenAI const mockApiResponse = { data: [ { object: "embedding", embedding: base64String, // Raw base64 string from API index: 0, }, ], model: "text-embedding-3-small", object: "list", usage: { prompt_tokens: 2, total_tokens: 2, }, } // Mock the methodRequest method which is called by post() const mockMethodRequest = vi.fn() const mockAPIPromise = { then: vi.fn().mockImplementation((callback) => { return Promise.resolve(callback(mockApiResponse)) }), catch: vi.fn(), finally: vi.fn(), } mockMethodRequest.mockReturnValue(mockAPIPromise) // Replace the methodRequest method on the client ;(realOpenAI as any).post = vi.fn().mockImplementation((path, opts) => { return mockMethodRequest("post", path, opts) }) // Call the embeddings.create method with base64 encoding const response = await realOpenAI.embeddings.create({ input: testTexts, model: "text-embedding-3-small", encoding_format: "base64", }) // Verify that the response contains the raw base64 string // This confirms the OpenAI package doesn't parse base64 when explicitly requested expect(response.data[0].embedding).toBe(base64String) expect(typeof response.data[0].embedding).toBe("string") // Verify we can manually convert it back to the original float array const returnedBuffer = Buffer.from(response.data[0].embedding as string, "base64") const returnedFloat32Array = new Float32Array( returnedBuffer.buffer, returnedBuffer.byteOffset, returnedBuffer.byteLength / 4, ) const returnedArray = Array.from(returnedFloat32Array) expect(returnedArray).toEqual([0.25, 0.5, 0.75, 1.0]) }) }) }) })

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/anrgct/autodev-codebase'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

openai-compatible.spec.ts•16.7 KiB