MCP Prompt Tester

MIT License

Overview InspectNew Endpoints Schema Related Servers Reviews Score

openai.py•10.1 kB

"""OpenAI provider implementation.""" import time from typing import Dict, Any, Optional, List from langfuse.decorators import observe from openai import OpenAI, APIError, APIConnectionError, RateLimitError from .base import ProviderBase, ProviderError from ..env import get_api_key class OpenAIProvider(ProviderBase): """Provider implementation for OpenAI API.""" def __init__(self): """Initialize the OpenAI provider with API key from environment.""" try: # Get API key using the utility function api_key = get_api_key("openai") self.client = OpenAI(api_key=api_key) except ValueError as e: raise ProviderError(str(e)) @observe(as_type="generation") async def generate( self, model: str, system_prompt: str, user_prompt: str, temperature: Optional[float] = 0.7, max_tokens: Optional[int] = 1000, top_p: Optional[float] = 1.0, **kwargs: Any, ) -> Dict[str, Any]: """Generate a response using OpenAI's API.""" try: # Prepare the messages messages = [ {"role": "system", "content": system_prompt}, {"role": "user", "content": user_prompt} ] # Build the request params request_params = { "model": model, "messages": messages, "temperature": temperature if temperature is not None else 0.7, "max_tokens": max_tokens if max_tokens is not None else 1000, "top_p": top_p if top_p is not None else 1.0, } # Add any additional kwargs for key, value in kwargs.items(): if value is not None: request_params[key] = value # Make the API call start_time = time.time() response = self.client.chat.completions.create(**request_params) end_time = time.time() response_time = end_time - start_time # Get the generated text generated_text = response.choices[0].message.content # Prepare the result result = { "text": generated_text, "model": model, "usage": { "prompt_tokens": response.usage.prompt_tokens, "completion_tokens": response.usage.completion_tokens, "total_tokens": response.usage.total_tokens, }, "finish_reason": response.choices[0].finish_reason, "response_time": response_time, } # Calculate cost if the model is in our default models default_models = self.get_default_models() model_info = None # Find the model in our default models for model_type, info in default_models.items(): if info["name"] == model: model_info = info break # If we have pricing data for this model, calculate and add costs if model_info: input_cost = (response.usage.prompt_tokens / 1_000_000) * model_info["input_cost"] output_cost = (response.usage.completion_tokens / 1_000_000) * model_info["output_cost"] total_cost = input_cost + output_cost result["costs"] = { "input_cost": input_cost, "output_cost": output_cost, "total_cost": total_cost, "currency": "USD", "rates": { "input_rate": model_info["input_cost"], "output_rate": model_info["output_cost"], } } return result except APIConnectionError as e: raise ProviderError(f"Connection error: {str(e)}") except RateLimitError as e: raise ProviderError(f"Rate limit exceeded: {str(e)}") except APIError as e: raise ProviderError(f"API error: {str(e)}") except Exception as e: raise ProviderError(f"Unexpected error: {str(e)}") @observe(as_type="generation") async def generate_with_history( self, model: str, system_prompt: str, message_history: List[Dict[str, str]], temperature: Optional[float] = 0.7, max_tokens: Optional[int] = 1000, top_p: Optional[float] = 1.0, **kwargs: Any, ) -> Dict[str, Any]: """Generate a response using OpenAI's API with a message history.""" try: # Prepare the messages with system message first messages = [{"role": "system", "content": system_prompt}] # Add all messages from history messages.extend(message_history) # Build the request params request_params = { "model": model, "messages": messages, "temperature": temperature, "max_tokens": max_tokens, "top_p": top_p, } # Add any additional parameters request_params.update(kwargs) # Record the start time start_time = time.time() # Make the API call response = self.client.chat.completions.create(**request_params) # Calculate the response time response_time = time.time() - start_time # Extract the result text result_text = response.choices[0].message.content # Calculate token usage and cost input_tokens = response.usage.prompt_tokens output_tokens = response.usage.completion_tokens total_tokens = response.usage.total_tokens # Model ID and name model_id = getattr(response, "model", model) # Calculate the cost # Calculate cost if the model is in our default models default_models = self.get_default_models() model_info = None # Find the model in our default models for model_type, info in default_models.items(): if info["name"] == model: model_info = info break # If we have pricing data for this model, calculate and add costs if model_info: input_cost = (input_tokens / 1_000_000) * model_info["input_cost"] output_cost = (output_tokens / 1_000_000) * model_info["output_cost"] total_cost = input_cost + output_cost result = { "text": result_text, "model": model_id, "usage": { "prompt_tokens": input_tokens, "completion_tokens": output_tokens, "total_tokens": total_tokens, }, "finish_reason": response.choices[0].finish_reason, "response_time": response_time, "costs": { "input_cost": input_cost, "output_cost": output_cost, "total_cost": total_cost, "currency": "USD", "rates": { "input_rate": model_info["input_cost"], "output_rate": model_info["output_cost"], } } } else: # If we don't have pricing info for this model result = { "text": result_text, "model": model_id, "usage": { "prompt_tokens": input_tokens, "completion_tokens": output_tokens, "total_tokens": total_tokens, }, "finish_reason": response.choices[0].finish_reason, "response_time": response_time, } return result except APIConnectionError as e: raise ProviderError(f"Network error connecting to OpenAI: {str(e)}") except RateLimitError as e: raise ProviderError(f"OpenAI rate limit exceeded: {str(e)}") except APIError as e: raise ProviderError(f"OpenAI API error: {str(e)}") except Exception as e: raise ProviderError(f"Unexpected error with OpenAI: {str(e)}") # TODO: We should call the API to get available models # the only issue is that we don't have any information about the models themselves, quality, token limits, etc. @classmethod def get_default_models(cls) -> Dict[str, Dict[str, Any]]: """Get the default OpenAI models with pricing information.""" return { "fast": { "name": "gpt-4o-mini", "input_cost": 0.15, # $0.15 per million tokens "output_cost": 0.60, # $0.60 per million tokens "description": "Fast and cost-effective model for most use cases" }, "smart": { "name": "o1-mini", "input_cost": 1.1, # $1.10 per million tokens "output_cost": 4.4, # $4.40 per million tokens "description": "Advanced reasoning capabilities with superior performance" }, "vision": { "name": "gpt-4o", "input_cost": 2.5, # $2.50 per million tokens "output_cost": 10.0, # $10.00 per million tokens "description": "Multimodal model that can process images and text" }, }

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/rt96-hub/prompt-tester'

If you have feedback or need assistance with the MCP directory API, please join our Discord server