Ollama MCP Server

client.ts•3.36 KiB

import type { z } from "zod";
import {
  OllamaApiError,
  OllamaNetworkError,
  OllamaResponseError,
  OllamaError,
} from "./errors.js";

/**
 * Read and validate the Ollama base URL.
 *
 * The value comes from the `OLLAMA_BASE_URL` environment variable and falls
 * back to `http://localhost:11434` when the variable is not set. Only the
 * `http:` and `https:` protocols are accepted.
 *
 * @returns The serialized URL with any trailing slashes removed.
 * @throws Error with a generic message when the value cannot be parsed as a
 *   URL or uses another protocol.
 */
function getOllamaBaseUrl(): string {
  const raw = process.env.OLLAMA_BASE_URL ?? "http://localhost:11434";
  try {
    const url = new URL(raw);
    if (!["http:", "https:"].includes(url.protocol)) {
      throw new Error(`Invalid protocol: ${url.protocol}`);
    }
    // Remove trailing slash so endpoints (which start with "/") can be appended
    return url.toString().replace(/\/+$/, "");
  } catch {
    // Do not log raw env value - it may contain secrets.
    // This also replaces the more specific "Invalid protocol" error above.
    throw new Error("Invalid OLLAMA_BASE_URL configuration");
  }
}

// Resolved once at module load; an invalid configuration throws on import.
const OLLAMA_BASE_URL = getOllamaBaseUrl();

// Default timeout for simple API requests (30 seconds)
const DEFAULT_TIMEOUT_MS = 30_000;

// Extended timeout for inference operations (5 minutes)
// Reasoning models may take significant time to generate responses
const INFERENCE_TIMEOUT_MS = 300_000;

// Extended timeout for model pull operations (10 minutes)
const PULL_TIMEOUT_MS = 600_000;

/**
 * Make a request to the Ollama API with timeout, validation, and error handling.
 *
 * @param endpoint - Path appended verbatim to the configured base URL.
 * @param init - Options forwarded to `fetch`. Headers may be given in any
 *   `HeadersInit` form; `Content-Type: application/json` is added only when
 *   the caller did not set a content type. A caller-supplied `signal` is
 *   honoured in addition to the internal timeout.
 * @param timeoutMs - Milliseconds before the request is aborted.
 * @param responseSchema - Optional zod schema used to validate the JSON body.
 * @returns The parsed JSON body: schema output when a schema is given,
 *   otherwise the raw value cast to `T` without validation.
 * @throws OllamaApiError when the response status is not OK (carries the
 *   status and the response body text).
 * @throws OllamaResponseError when the body does not match `responseSchema`.
 * @throws OllamaNetworkError when the request times out or the connection
 *   fails ("fetch failed" / "ECONNREFUSED").
 * @throws The original error in every other case, including an abort
 *   triggered by the caller's own signal and a body that is not valid JSON.
 */
export async function ollamaRequest<T>(
  endpoint: string,
  init: RequestInit = {},
  timeoutMs: number = DEFAULT_TIMEOUT_MS,
  responseSchema?: z.ZodSchema<T>
): Promise<T> {
  const controller = new AbortController();

  // Remember whether the abort came from our timer, so a caller-initiated
  // abort is not misreported as a timeout.
  let timedOut = false;
  const timeout = setTimeout(() => {
    timedOut = true;
    controller.abort();
  }, timeoutMs);

  // Chain the caller's signal (if any) onto our controller; previously it was
  // overwritten by the timeout signal and therefore ignored.
  const callerSignal = init.signal ?? null;
  const forwardAbort = (): void => controller.abort();
  if (callerSignal) {
    if (callerSignal.aborted) {
      forwardAbort();
    } else {
      callerSignal.addEventListener("abort", forwardAbort, { once: true });
    }
  }

  try {
    // Normalize through Headers: spreading `init.headers` into an object
    // literal loses everything when it is a Headers instance or a tuple array,
    // and treats differently-cased names as distinct keys.
    const headers = new Headers(init.headers);
    if (!headers.has("Content-Type")) {
      headers.set("Content-Type", "application/json");
    }

    const url = `${OLLAMA_BASE_URL}${endpoint}`;
    const response = await fetch(url, {
      ...init,
      signal: controller.signal,
      headers,
    });

    if (!response.ok) {
      const body = await response.text();
      throw new OllamaApiError(response.status, body);
    }

    const raw: unknown = await response.json();

    // Validate response if schema provided
    if (responseSchema) {
      const parsed = responseSchema.safeParse(raw);
      if (!parsed.success) {
        throw new OllamaResponseError(
          `Invalid response shape: ${parsed.error.message}`,
          parsed.error
        );
      }
      return parsed.data;
    }

    return raw as T;
  } catch (error) {
    // Errors already expressed in the project's own error types pass through.
    if (error instanceof OllamaError) {
      throw error;
    }
    if (error instanceof Error) {
      if (error.name === "AbortError") {
        // The caller cancelled before our timer fired: surface their abort.
        if (!timedOut && callerSignal?.aborted) {
          throw error;
        }
        throw new OllamaNetworkError("Request timed out", error);
      }
      if (
        error.message.includes("fetch failed") ||
        error.message.includes("ECONNREFUSED")
      ) {
        throw new OllamaNetworkError(
          `Failed to connect to Ollama: ${error.message}`,
          error
        );
      }
    }
    throw error;
  } finally {
    clearTimeout(timeout);
    callerSignal?.removeEventListener("abort", forwardAbort);
  }
}

/**
 * Make a request with extended timeout for inference operations
 * (generate, chat - reasoning models may take several minutes).
 *
 * Delegates to `ollamaRequest` with `INFERENCE_TIMEOUT_MS`.
 */
export async function ollamaRequestInference<T>(
  endpoint: string,
  init: RequestInit = {},
  responseSchema?: z.ZodSchema<T>
): Promise<T> {
  return ollamaRequest<T>(endpoint, init, INFERENCE_TIMEOUT_MS, responseSchema);
}

/**
 * Make a request with extended timeout (for model pull operations).
 *
 * Delegates to `ollamaRequest` with `PULL_TIMEOUT_MS`.
 */
export async function ollamaRequestPull<T>(
  endpoint: string,
  init: RequestInit = {},
  responseSchema?: z.ZodSchema<T>
): Promise<T> {
  return ollamaRequest<T>(endpoint, init, PULL_TIMEOUT_MS, responseSchema);
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/ngc-shj/ollama-mcp-server'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

client.ts•3.36 KiB