pdf4vllm

server.py•8.47 KiB

"""
PDF MCP for vLLM - Block-based PDF extraction for LLM consumption

Exports PDFs as structured content blocks (text, tables, images) that LLMs
can easily process. Preserves document reading order and handles corrupted
text automatically.

Tools exposed by this server:
1. list_pdfs: List all PDF files recursively from working directory
2. read_pdf: Extract PDF content as ordered blocks with intelligent limits
"""

import asyncio
import sys
import logging
from pathlib import Path

# Debug log lives in the user's home directory; records are also mirrored to
# stderr.
log_file = Path.home() / '.pdf4vllm_mcp_debug.log'
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
    handlers=[
        logging.FileHandler(str(log_file), mode='a'),
        logging.StreamHandler(sys.stderr),
    ],
)

# Put the directory two levels above this file on sys.path so the `src`
# package resolves no matter where the server is launched from.
SCRIPT_DIR = Path(__file__).parent.parent
if str(SCRIPT_DIR) not in sys.path:
    sys.path.insert(0, str(SCRIPT_DIR))

# These imports intentionally come after the sys.path adjustment above.
from mcp.server import Server  # noqa: E402
from mcp.server.stdio import stdio_server  # noqa: E402
from mcp.server.fastmcp.utilities.types import Image  # noqa: E402
from mcp.types import Tool, TextContent, CallToolResult  # noqa: E402

from src.pdf_tools import list_pdfs_handler, read_pdf_handler  # noqa: E402
from src.config import config  # noqa: E402

# The MCP server instance that the decorators below register handlers on.
server = Server("pdf4vllm")


def _get_read_pdf_description() -> str:
    """
    Build the read_pdf tool description for the configured extraction mode.

    The description always starts with a common sentence stating the
    per-request page limit. For the three known modes ("auto", "text_only",
    "image_only") a mode-specific hint is appended after a single space; any
    other mode yields the common sentence alone.
    """
    mode = config.default_extraction_mode
    base = f"Read PDF content. Always prefer this over cat or file read for PDF files. Limits: {config.max_pages_per_request} pages per request."

    if mode == "auto":
        hint = (
            "Works with both text and scanned documents. "
            "Use 'image_only' to see actual page layout, or 'text_only' for pure text."
        )
    elif mode == "text_only":
        hint = (
            "Extracts text and tables only. "
            "Use 'image_only' to see actual page layout, or 'auto' for smart detection."
        )
    elif mode == "image_only":
        hint = (
            "Returns page images for visual analysis. "
            "Use 'text_only' for pure text extraction, or 'auto' for smart detection."
        )
    else:
        return base

    return f"{base} {hint}"


def _list_pdfs_input_schema() -> dict:
    """Return the JSON schema for list_pdfs arguments (config read per call)."""
    depth_limit = config.max_recursion_depth
    return {
        "type": "object",
        "properties": {
            "working_directory": {
                "type": "string",
                "description": "Working directory to search (relative or absolute path, default: current directory)",
                "default": ".",
            },
            "include_subdirectories": {
                "type": "boolean",
                "description": "Whether to include subdirectories",
                "default": True,
            },
            "max_depth": {
                "type": "integer",
                "description": f"Maximum recursion depth (default: {depth_limit})",
                "default": depth_limit,
                "minimum": 1,
            },
        },
    }


def _read_pdf_input_schema() -> dict:
    """Return the JSON schema for read_pdf arguments (config read per call)."""
    mode_help = "\n".join(
        [
            "Content extraction mode:",
            "- 'auto' (default): Smart detection - extract text/tables, add page image only if corrupted",
            "- 'text_only': Extract text/tables only, no images",
            "- 'image_only': Skip text extraction, provide only full page images",
        ]
    )
    dimension_limit = config.max_image_dimension
    render_dpi = config.page_image_dpi
    return {
        "type": "object",
        "properties": {
            "file_path": {
                "type": "string",
                "description": "PDF file path (relative or absolute path)",
            },
            "start_page": {
                "type": "integer",
                "description": "Start page (1-indexed, inclusive)",
                "default": 1,
                "minimum": 1,
            },
            "end_page": {
                "type": "integer",
                "description": "End page (1-indexed, inclusive). None = last page",
                "default": None,
                "minimum": 1,
            },
            "extraction_mode": {
                "type": "string",
                "description": mode_help,
                "enum": ["auto", "text_only", "image_only"],
                "default": config.default_extraction_mode,
            },
            "filter_header_footer": {
                "type": "boolean",
                "description": "Whether to filter out header/footer images (top/bottom 6% of page)",
                "default": True,
            },
            "crop_images": {
                "type": "boolean",
                "description": "Whether to crop images to max_image_dimension",
                "default": True,
            },
            "max_image_dimension": {
                "type": "integer",
                "description": f"Maximum image dimension in pixels (default: {dimension_limit}, A4 height)",
                "default": dimension_limit,
                "minimum": 100,
                "maximum": 4096,
            },
            "page_image_dpi": {
                "type": "integer",
                "description": f"DPI for page image rendering (default: {render_dpi})",
                "default": render_dpi,
                "minimum": 50,
                "maximum": 300,
            },
        },
        "required": ["file_path"],
    }


@server.list_tools()
async def list_tools() -> list[Tool]:
    """
    Describe the tools offered by PDF MCP for vLLM.

    Returns:
        Two Tool definitions, list_pdfs followed by read_pdf, each carrying
        its description and JSON input schema.
    """
    pdf_lister = Tool(
        name="list_pdfs",
        description="Find all PDF files in a directory. Always prefer this over ls or find for PDF files. Returns name, path, pages, and size for each PDF. Use the returned 'path' directly with read_pdf.",
        inputSchema=_list_pdfs_input_schema(),
    )
    pdf_reader = Tool(
        name="read_pdf",
        description=_get_read_pdf_description(),
        inputSchema=_read_pdf_input_schema(),
    )
    return [pdf_lister, pdf_reader]


@server.call_tool()
async def call_tool(name: str, arguments: dict) -> CallToolResult:
    """
    Dispatch a tool invocation to the matching handler.

    Args:
        name: Tool name ("list_pdfs" or "read_pdf")
        arguments: Tool arguments, forwarded untouched to the handler

    Returns:
        CallToolResult whose content list starts with a TextContent holding
        the handler's JSON text. For read_pdf, one image content item per
        image returned by the handler follows it.

    Raises:
        ValueError: If ``name`` is not one of the two known tools.
    """
    if name == "list_pdfs":
        # The handler returns a pair; only the JSON text is sent back.
        listing_json, _unused_images = await list_pdfs_handler(arguments)
        return CallToolResult(
            content=[TextContent(type="text", text=listing_json)],
            isError=False,
        )

    if name == "read_pdf":
        document_json, page_images = await read_pdf_handler(arguments)

        # Text goes first; each image is then wrapped in the SDK's Image
        # helper and converted with to_image_content().
        payload = [TextContent(type="text", text=document_json)]
        payload.extend(
            Image(data=entry["data"], format=entry["format"]).to_image_content()
            for entry in page_images
        )
        return CallToolResult(content=payload, isError=False)

    raise ValueError(f"Unknown tool: {name}")


async def main():
    """
    Async entry point for the PDF for vLLM MCP server.

    Opens the stdio transport and runs the server on its read/write streams
    using the server's own initialization options.
    """
    async with stdio_server() as (read_stream, write_stream):
        init_options = server.create_initialization_options()
        await server.run(read_stream, write_stream, init_options)


def run():
    """Synchronous entry point; exits with status 0 on Ctrl-C."""
    try:
        asyncio.run(main())
    except KeyboardInterrupt:
        sys.exit(0)


if __name__ == "__main__":
    run()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/PyJudge/pdf4vllm-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

server.py•8.47 KiB