LLM Graph Builder MCP

Overview Schema Related Servers Score Discussions

local_file.py•4.08 KiB

import logging
from pathlib import Path

import chardet
from langchain_community.document_loaders import PyMuPDFLoader
from langchain_community.document_loaders import UnstructuredFileLoader
from langchain_core.document_loaders import BaseLoader
from langchain_core.documents import Document


class ListLoader(BaseLoader):
    """A wrapper to make a list of Documents compatible with BaseLoader."""

    def __init__(self, documents):
        # Documents are stored as given; no copy is made.
        self.documents = documents

    def load(self):
        """Return the wrapped list of Documents unchanged."""
        return self.documents


def detect_encoding(file_path):
    """Detects the file encoding to avoid UnicodeDecodeError.

    Only the first 4096 bytes of the file are handed to ``chardet``.

    Args:
        file_path: Path of the file to inspect.

    Returns:
        The encoding name reported by ``chardet``, or ``"utf-8"`` when
        ``chardet`` reports no encoding.
    """
    with open(file_path, 'rb') as f:
        raw_data = f.read(4096)
    result = chardet.detect(raw_data)
    return result['encoding'] or "utf-8"


def load_document_content(file_path):
    """Pick a document loader for ``file_path`` based on its extension.

    * ``.pdf`` files use ``PyMuPDFLoader``.
    * ``.txt`` files whose detected encoding is not UTF-8 are read directly
      with that encoding (undecodable bytes are replaced) and wrapped in a
      ``ListLoader`` holding a single Document.
    * Everything else, including UTF-8 ``.txt`` files, uses
      ``UnstructuredFileLoader`` in ``"elements"`` mode.

    Args:
        file_path: Path (``str`` or ``Path``) of the file to load.

    Returns:
        A ``(loader, encoding_flag)`` tuple. ``encoding_flag`` is ``True``
        only when the file was read directly because of a non-UTF-8
        encoding.
    """
    file_extension = Path(file_path).suffix.lower()

    if file_extension == '.pdf':
        return PyMuPDFLoader(file_path), False

    if file_extension == ".txt":
        encoding = detect_encoding(file_path)
        logging.info(f"Detected encoding for {file_path}: {encoding}")
        if encoding.lower() != "utf-8":
            with open(file_path, encoding=encoding, errors="replace") as f:
                content = f.read()
            # Store the source as a plain string so the metadata does not
            # carry a Path object when the caller passed one.
            document = Document(
                page_content=content,
                metadata={"source": str(file_path)},
            )
            return ListLoader([document]), True

    loader = UnstructuredFileLoader(
        file_path, mode="elements", autodetect_encoding=True
    )
    return loader, False


def get_documents_from_file_by_path(file_path, file_name):
    """Load a local file and return its content as page Documents.

    Args:
        file_path: Location of the file on disk.
        file_name: Name used in log and error messages and echoed back in
            the result.

    Returns:
        A ``(file_name, pages, file_extension)`` tuple, where ``pages`` is a
        list of Documents and ``file_extension`` is the lower-cased suffix
        of ``file_path``.

    Raises:
        Exception: If the file does not exist, or if loading/parsing fails
            (the underlying error is chained as the cause).
    """
    file_path = Path(file_path)
    if not file_path.exists():
        logging.info(f'File {file_name} does not exist')
        raise Exception(f'File {file_name} does not exist')

    logging.info(f'file {file_name} processing')
    file_extension = file_path.suffix.lower()
    try:
        loader, encoding_flag = load_document_content(file_path)
        if file_extension == ".pdf" or (file_extension == ".txt" and encoding_flag):
            # These loaders already return the final Documents.
            pages = loader.load()
        else:
            # Element-mode output has to be regrouped into pages.
            unstructured_pages = loader.load()
            pages = get_pages_with_page_numbers(unstructured_pages)
    except Exception as e:
        raise Exception(
            f'Error while reading the file content or metadata, {e}'
        ) from e
    return file_name, pages, file_extension


def _page_metadata(element_metadata, page_number):
    """Build page-level metadata from one element's metadata dict."""
    return {
        'source': element_metadata.get('source'),
        'page_number': page_number,
        'filename': element_metadata.get('filename'),
        'filetype': element_metadata.get('filetype'),
    }


def get_pages_with_page_numbers(unstructured_pages):
    """Group element-level Documents into one Document per page.

    Elements that carry a ``page_number`` in their metadata are grouped by
    that number. Elements without one are grouped sequentially, starting at
    page 1, and a ``PageBreak`` element (any but the very first element)
    closes the current page and advances the counter.

    Element texts are concatenated without a separator. Every returned
    Document carries ``source``, ``page_number``, ``filename`` and
    ``filetype`` metadata taken from the last element added to that page.
    Pages that received no elements are not emitted.

    Args:
        unstructured_pages: Sequence of Documents, one per element.

    Returns:
        A list of page-level Documents in the order they were encountered.
    """
    pages = []
    page_number = 1
    parts = []
    metadata = {}

    for index, element in enumerate(unstructured_pages):
        element_metadata = element.metadata
        element_page = element_metadata.get('page_number')

        if element_page is not None:
            if element_page != page_number:
                # A new page starts: close the previous one, then jump to
                # the element's own page number (pages may be skipped).
                if parts:
                    pages.append(
                        Document(page_content=''.join(parts), metadata=metadata)
                    )
                    parts = []
                page_number = element_page
        elif element_metadata.get('category') == 'PageBreak' and index > 0:
            # Explicit page break in a document without page numbers.
            if parts:
                pages.append(
                    Document(page_content=''.join(parts), metadata=metadata)
                )
                parts = []
            page_number += 1
            continue

        # The element belongs to the current page, including the element
        # that opened it.
        parts.append(element.page_content)
        metadata = _page_metadata(element_metadata, page_number)

    # Flush the trailing page once, after the loop, instead of comparing
    # each element with the last one by value.
    if parts:
        pages.append(Document(page_content=''.join(parts), metadata=metadata))
    return pages

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/henrardo/llm-graph-builder-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

local_file.py•4.08 KiB