MyAIGist MCP

Overview Schema Related Servers Score Discussions

myaigist_mcp
mcp_agents

document_processor.py•2.19 KiB

"""Document processing agent - extracts text from various file formats."""
import os

from PyPDF2 import PdfReader
from docx import Document


class DocumentProcessor:
    """Agent responsible for extracting text from documents.

    Picks a format-specific reader from the file extension and returns the
    document's text as one whitespace-stripped string.
    """

    def __init__(self) -> None:
        # Lower-case extensions (with leading dot) that extract_text accepts.
        self.supported_formats = ['.pdf', '.docx', '.txt']

    def extract_text(self, file_path: str) -> str:
        """Extract text from a document based on its file extension.

        Args:
            file_path: Path to the document file.

        Returns:
            Extracted text content, stripped of leading/trailing whitespace.

        Raises:
            FileNotFoundError: If ``file_path`` does not exist.
            ValueError: If the extension is not .pdf, .docx or .txt.
            RuntimeError: If the format-specific reader fails.
        """
        if not os.path.exists(file_path):
            raise FileNotFoundError(f"File not found: {file_path}")

        # Compare case-insensitively so "REPORT.PDF" is handled like "report.pdf".
        file_ext = os.path.splitext(file_path)[1].lower()

        # Bound methods are looked up on self so subclass overrides are honoured.
        handlers = {
            '.pdf': self._extract_from_pdf,
            '.docx': self._extract_from_docx,
            '.txt': self._extract_from_txt,
        }
        handler = handlers.get(file_ext)
        if handler is None:
            raise ValueError(f"Unsupported file format: {file_ext}")
        return handler(file_path)

    def _extract_from_pdf(self, file_path: str) -> str:
        """Extract text from a PDF file, one line-separated chunk per page.

        Raises:
            RuntimeError: If the file cannot be opened or parsed; the original
                exception is attached as ``__cause__``.
        """
        try:
            with open(file_path, 'rb') as file:
                reader = PdfReader(file)
                # `or ""` is defensive: if the library yields None for a page
                # with no extractable text, treat it as empty instead of
                # failing the whole document.
                # NOTE(review): confirm against the installed PyPDF2 version.
                page_texts = [page.extract_text() or "" for page in reader.pages]
            return "\n".join(page_texts).strip()
        except Exception as e:
            raise RuntimeError(f"Error extracting PDF: {e}") from e

    def _extract_from_docx(self, file_path: str) -> str:
        """Extract text from a DOCX file, one line per paragraph.

        Only ``doc.paragraphs`` is read; text stored elsewhere in the document
        (e.g. tables) is presumably not included - confirm against python-docx.

        Raises:
            RuntimeError: If the file cannot be opened or parsed; the original
                exception is attached as ``__cause__``.
        """
        try:
            doc = Document(file_path)
            return "\n".join(
                paragraph.text for paragraph in doc.paragraphs
            ).strip()
        except Exception as e:
            raise RuntimeError(f"Error extracting DOCX: {e}") from e

    def _extract_from_txt(self, file_path: str) -> str:
        """Extract text from a UTF-8 encoded TXT file.

        Raises:
            RuntimeError: If the file cannot be read or is not valid UTF-8;
                the original exception is attached as ``__cause__``.
        """
        try:
            # utf-8-sig decodes plain UTF-8 identically but also drops a
            # leading byte-order mark, which str.strip() would leave in place.
            with open(file_path, 'r', encoding='utf-8-sig') as file:
                return file.read().strip()
        except Exception as e:
            raise RuntimeError(f"Error extracting TXT: {e}") from e

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/schwim23/myaigist_mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

document_processor.py•2.19 KiB