OpenAI Vector Store MCP Server

server.py•7.45 kB

""" Sample MCP Server for ChatGPT Integration This server implements the Model Context Protocol (MCP) with search and fetch capabilities designed to work with ChatGPT's chat and deep research features. """ import logging import os from typing import Dict, List, Any from fastmcp import FastMCP from openai import OpenAI from dotenv import load_dotenv # .env에서 환경변수 불러옴 load_dotenv() # 로거 세팅 logging.basicConfig(level=logging.INFO) logger = logging.getLogger(__name__) # 각종 키 OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY") VECTOR_STORE_ID = os.environ.get("VECTOR_STORE_ID", "") openai_client = OpenAI() server_instructions = """ This MCP server provides search and document retrieval capabilities for chat and deep research connectors. Use the search tool to find relevant documents based on keywords, then use the fetch tool to retrieve complete document content with citations. """ def create_server(): """Create and configure the MCP server with search and fetch tools.""" # Initialize the FastMCP server mcp = FastMCP(name="Sample MCP Server", instructions=server_instructions) @mcp.tool() async def search(query: str) -> Dict[str, List[Dict[str, Any]]]: """ Search for documents using OpenAI Vector Store search. This tool searches through the vector store to find semantically relevant matches. Returns a list of search results with basic information. Use the fetch tool to get complete document content. Args: query: Search query string. Natural language queries work best for semantic search. Returns: Dictionary with 'results' key containing list of matching documents. Each result includes id, title, text snippet, and optional URL. """ if not query or not query.strip(): return {"results": []} if not openai_client: logger.error("OpenAI client not initialized - API key missing") raise ValueError( "OpenAI API key is required for vector store search") # Search the vector store using OpenAI API logger.info(f"Searching {VECTOR_STORE_ID} for query: '{query}'") response = openai_client.vector_stores.search( vector_store_id=VECTOR_STORE_ID, query=query) results = [] # Process the vector store search results if hasattr(response, 'data') and response.data: for i, item in enumerate(response.data): # Extract file_id, filename, and content item_id = getattr(item, 'file_id', f"vs_{i}") item_filename = getattr(item, 'filename', f"Document {i+1}") # Extract text content from the content array content_list = getattr(item, 'content', []) text_content = "" if content_list and len(content_list) > 0: # Get text from the first content item first_content = content_list[0] if hasattr(first_content, 'text'): text_content = first_content.text elif isinstance(first_content, dict): text_content = first_content.get('text', '') if not text_content: text_content = "No content available" # Create a snippet from content text_snippet = text_content[:200] + "..." if len( text_content) > 200 else text_content result = { "id": item_id, "title": item_filename, "text": text_snippet, "url": f"https://platform.openai.com/storage/files/{item_id}" } results.append(result) logger.info(f"Vector store search returned {len(results)} results") return {"results": results} @mcp.tool() async def fetch(id: str) -> Dict[str, Any]: """ Retrieve complete document content by ID for detailed analysis and citation. This tool fetches the full document content from OpenAI Vector Store. Use this after finding relevant documents with the search tool to get complete information for analysis and proper citation. Args: id: File ID from vector store (file-xxx) or local document ID Returns: Complete document with id, title, full text content, optional URL, and metadata Raises: ValueError: If the specified ID is not found """ if not id: raise ValueError("Document ID is required") if not openai_client: logger.error("OpenAI client not initialized - API key missing") raise ValueError( "OpenAI API key is required for vector store file retrieval") logger.info(f"Fetching content from vector store for file ID: {id}") # Fetch file content from vector store content_response = openai_client.vector_stores.files.content( vector_store_id=VECTOR_STORE_ID, file_id=id) # Get file metadata file_info = openai_client.vector_stores.files.retrieve( vector_store_id=VECTOR_STORE_ID, file_id=id) # Extract content from paginated response file_content = "" if hasattr(content_response, 'data') and content_response.data: # Combine all content chunks from FileContentResponse objects content_parts = [] for content_item in content_response.data: if hasattr(content_item, 'text'): content_parts.append(content_item.text) file_content = "\n".join(content_parts) else: file_content = "No content available" # Use filename as title and create proper URL for citations filename = getattr(file_info, 'filename', f"Document {id}") result = { "id": id, "title": filename, "text": file_content, "url": f"https://platform.openai.com/storage/files/{id}", "metadata": None } # Add metadata if available from file info if hasattr(file_info, 'attributes') and file_info.attributes: result["metadata"] = file_info.attributes logger.info(f"Fetched vector store file: {id}") return result return mcp def main(): """Main function to start the MCP server.""" # Verify OpenAI client is initialized if not openai_client: logger.error( "OpenAI API key not found. Please set OPENAI_API_KEY environment variable." ) raise ValueError("OpenAI API key is required") logger.info(f"Using vector store: {VECTOR_STORE_ID}") # Create the MCP server server = create_server() # Configure and start the server logger.info("Starting MCP server on 0.0.0.0:8000") logger.info("Server will be accessible via SSE transport") try: # Use FastMCP's built-in run method with SSE transport server.run(transport="sse", host="0.0.0.0", port=8000) except KeyboardInterrupt: logger.info("Server stopped by user") except Exception as e: logger.error(f"Server error: {e}") raise if __name__ == "__main__": main()

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/kkyy3402/openai-mcp-test'

If you have feedback or need assistance with the MCP directory API, please join our Discord server