Local DeepWiki MCP Server

Overview Schema Related Servers Score Discussions

wiki.py•20.3 KiB

"""Wiki documentation generator using LLM providers."""

import re
import time
from pathlib import Path
from typing import Any

from local_deepwiki.config import Config, get_config
from local_deepwiki.core.vectorstore import VectorStore
from local_deepwiki.models import CodeChunk, IndexStatus, WikiPage, WikiStructure
from local_deepwiki.providers.base import LLMProvider
from local_deepwiki.providers.llm import get_llm_provider

SYSTEM_PROMPT = """You are a technical documentation expert. Generate clear, concise documentation for code.
- Use markdown formatting
- Include code examples where helpful
- Focus on explaining what the code does and how to use it
- Be accurate and avoid speculation
- Keep explanations practical and actionable"""

# Matches ``def name(`` and ``async def name(`` so method names can be pulled
# out of a class body when no separate METHOD chunks were indexed.
_METHOD_DEF_RE = re.compile(r'(?:async\s+)?def\s+(\w+)\s*\(')

# Matches a "## Class Diagram" heading followed by a mermaid classDiagram
# fence, i.e. a diagram section the LLM wrote despite being told not to.
_LLM_CLASS_DIAGRAM_RE = re.compile(
    r'\n*##\s*Class\s*Diagram\s*\n+```mermaid\s*\n+classDiagram.*?```',
    flags=re.DOTALL | re.IGNORECASE,
)

# Anything that is not a word character or a dash is replaced before a name
# is emitted into a Mermaid diagram.
_MERMAID_UNSAFE_RE = re.compile(r"[^\w-]")

# Bucket name used for files that live directly at the repository top level.
_ROOT_MODULE = "root"


def _top_level_dir(path: str) -> str:
    """Return the first path component of *path*, or ``"root"`` for bare filenames."""
    parts = Path(path).parts
    return parts[0] if len(parts) > 1 else _ROOT_MODULE


def _sanitize_mermaid_name(name: str) -> str:
    """Replace characters that are not word characters or dashes with ``_``."""
    return _MERMAID_UNSAFE_RE.sub("_", name)


def generate_class_diagram(chunks: list) -> str | None:
    """Generate a Mermaid class diagram from code chunks.

    Args:
        chunks: List of CodeChunk objects, or of objects exposing the chunk
            through a ``.chunk`` attribute (e.g. search results).

    Returns:
        Mermaid class diagram markdown string, or None if no class with at
        least one method was found.
    """
    from local_deepwiki.models import ChunkType

    classes: dict[str, list[str]] = {}  # class name -> method names
    class_contents: dict[str, str] = {}  # class name -> source, for fallback extraction
    inheritance: dict[str, list[str]] = {}  # child -> [parents]

    for chunk in chunks:
        # Handle both CodeChunk objects and SearchResult objects (which have .chunk)
        if hasattr(chunk, "chunk"):
            chunk = chunk.chunk

        if chunk.chunk_type == ChunkType.CLASS:
            class_name = chunk.name or "Unknown"
            classes.setdefault(class_name, [])
            class_contents[class_name] = chunk.content
            parent_classes = chunk.metadata.get("parent_classes", [])
            if parent_classes:
                inheritance[class_name] = parent_classes
        elif chunk.chunk_type == ChunkType.METHOD:
            owner = chunk.parent_name or "Unknown"
            method_name = chunk.name or "unknown"
            owner_methods = classes.setdefault(owner, [])
            if method_name not in owner_methods:  # avoid duplicates
                owner_methods.append(method_name)
        # Other chunk types (functions, imports, ...) do not appear in the diagram.

    # For classes without METHOD chunks, fall back to scanning the class source.
    # NOTE: this also picks up functions nested inside methods.
    for class_name, methods in classes.items():
        if methods or class_name not in class_contents:
            continue
        for found in _METHOD_DEF_RE.findall(class_contents[class_name]):
            if found not in methods:
                methods.append(found)

    # Empty classes cause Mermaid syntax errors, so only keep classes with methods.
    classes_with_methods = {name: methods for name, methods in classes.items() if methods}
    if not classes_with_methods:
        return None

    lines = ["```mermaid", "classDiagram"]

    for class_name, methods in sorted(classes_with_methods.items()):
        lines.append(f"    class {_sanitize_mermaid_name(class_name)} {{")
        for method in methods:
            # Leading underscore -> private ("-"), everything else public ("+").
            visibility = "-" if method.startswith("_") else "+"
            lines.append(f"        {visibility}{_sanitize_mermaid_name(method)}()")
        lines.append("    }")

    for child, parents in sorted(inheritance.items()):
        if child not in classes_with_methods:
            continue
        safe_child = _sanitize_mermaid_name(child)
        for parent in parents:
            # "--|>" is Mermaid's inheritance arrow (child inherits from parent).
            lines.append(f"    {safe_child} --|> {_sanitize_mermaid_name(parent)}")

    lines.append("```")
    return "\n".join(lines)


class WikiGenerator:
    """Generate wiki documentation from indexed code."""

    def __init__(
        self,
        wiki_path: Path,
        vector_store: VectorStore,
        config: Config | None = None,
        llm_provider_name: str | None = None,
    ):
        """Initialize the wiki generator.

        Args:
            wiki_path: Path to wiki output directory.
            vector_store: Vector store with indexed code.
            config: Optional configuration; falls back to ``get_config()``.
            llm_provider_name: Override LLM provider ("ollama", "anthropic", "openai").
        """
        self.wiki_path = wiki_path
        self.vector_store = vector_store
        self.config = config or get_config()

        # Override LLM provider if specified.
        # NOTE(review): this mutates the config object that was passed in (or
        # returned by get_config()), so the override is visible to any other
        # holder of that object -- confirm this is intended.
        if llm_provider_name:
            self.config.llm.provider = llm_provider_name  # type: ignore

        self.llm = get_llm_provider(self.config.llm)

    async def generate(
        self,
        index_status: IndexStatus,
        progress_callback: Any = None,
    ) -> WikiStructure:
        """Generate wiki documentation for the indexed repository.

        Pages are written to disk as each section finishes.

        Args:
            index_status: The index status with file information.
            progress_callback: Optional callable invoked as
                ``progress_callback(message, step, total_steps)``.

        Returns:
            WikiStructure with generated pages.
        """
        pages: list[WikiPage] = []
        total_steps = 5  # overview, architecture, modules, files, dependencies

        def report(message: str, step: int) -> None:
            if progress_callback:
                progress_callback(message, step, total_steps)

        def publish(new_pages: list[WikiPage]) -> None:
            for page in new_pages:
                pages.append(page)
                self._write_page(page)

        report("Generating overview", 0)
        publish([await self._generate_overview(index_status)])

        report("Generating architecture docs", 1)
        publish([await self._generate_architecture(index_status)])

        report("Generating module documentation", 2)
        publish(await self._generate_module_docs(index_status))

        report("Generating file documentation", 3)
        publish(await self._generate_file_docs(index_status, progress_callback))

        report("Generating dependencies", 4)
        publish([await self._generate_dependencies(index_status)])

        report("Wiki generation complete", total_steps)

        return WikiStructure(root=str(self.wiki_path), pages=pages)

    async def _generate_overview(self, index_status: IndexStatus) -> WikiPage:
        """Generate the main overview/index page (``index.md``)."""
        languages = ", ".join(
            f"{lang} ({count} files)" for lang, count in index_status.languages.items()
        )

        prompt = f"""Generate a README-style overview for this codebase:

Repository: {Path(index_status.repo_path).name}
Total Files: {index_status.total_files}
Languages: {languages}
Total Code Chunks: {index_status.total_chunks}

Generate a clear overview that includes:
1. Project title and brief description (infer from the code structure)
2. Key features/capabilities
3. Technology stack
4. Directory structure overview
5. Quick start guide

Format as markdown with proper headings."""

        content = await self.llm.generate(prompt, system_prompt=SYSTEM_PROMPT)

        return WikiPage(
            path="index.md",
            title="Overview",
            content=content,
            generated_at=time.time(),
        )

    async def _generate_architecture(self, index_status: IndexStatus) -> WikiPage:
        """Generate architecture documentation with diagrams (``architecture.md``)."""
        # Get module-level chunks for architecture overview
        search_results = await self.vector_store.search(
            "architecture structure main module",
            limit=20,
        )

        context = "\n\n".join(
            f"File: {r.chunk.file_path}\n{r.chunk.content[:500]}" for r in search_results
        )

        prompt = f"""Based on this codebase context, generate architecture documentation:

{context}

Generate documentation that includes:
1. System architecture overview
2. Key components and their responsibilities
3. Data flow between components
4. A Mermaid diagram showing the architecture (use ```mermaid code blocks)
5. Design patterns used

Format as markdown with clear sections."""

        content = await self.llm.generate(prompt, system_prompt=SYSTEM_PROMPT)

        return WikiPage(
            path="architecture.md",
            title="Architecture",
            content=content,
            generated_at=time.time(),
        )

    async def _generate_module_docs(self, index_status: IndexStatus) -> list[WikiPage]:
        """Generate documentation for each module/directory.

        Files are grouped by their top-level directory; files at the top level
        go into a ``"root"`` group. Groups with fewer than two files, or for
        which the search returns no chunk from that group, are skipped.

        Returns:
            Module pages, preceded by a ``modules/index.md`` page when at
            least one module page was generated.
        """
        pages: list[WikiPage] = []

        # Group files by top-level directory
        directories: dict[str, list[str]] = {}
        for file_info in index_status.files:
            directories.setdefault(_top_level_dir(file_info.path), []).append(file_info.path)

        for dir_name, files in directories.items():
            if len(files) < 2:
                continue

            search_results = await self.vector_store.search(
                f"module {dir_name}",
                limit=15,
            )

            # Compare the top-level path component rather than a raw string
            # prefix: a prefix test never matches the "root" group and would
            # let "src" capture "src_old/..." as well.
            relevant_chunks = [
                r for r in search_results if _top_level_dir(r.chunk.file_path) == dir_name
            ]
            if not relevant_chunks:
                continue

            context = "\n\n".join(
                f"File: {r.chunk.file_path}\n"
                f"Type: {r.chunk.chunk_type.value}\n"
                f"Name: {r.chunk.name}\n"
                f"{r.chunk.content[:400]}"
                for r in relevant_chunks[:10]
            )
            file_listing = ", ".join(files[:10]) + ("..." if len(files) > 10 else "")

            prompt = f"""Generate documentation for the '{dir_name}' module:

Files in module: {file_listing}

Code context:
{context}

Generate documentation that includes:
1. Module purpose and responsibilities
2. Key classes/functions and their purposes
3. Usage examples
4. Dependencies on other modules

Format as markdown."""

            content = await self.llm.generate(prompt, system_prompt=SYSTEM_PROMPT)

            pages.append(
                WikiPage(
                    path=f"modules/{dir_name}.md",
                    title=f"Module: {dir_name}",
                    content=content,
                    generated_at=time.time(),
                )
            )

        # Create modules index
        if pages:
            modules_index = WikiPage(
                path="modules/index.md",
                title="Modules",
                content=self._generate_modules_index(pages),
                generated_at=time.time(),
            )
            pages.insert(0, modules_index)

        return pages

    def _generate_modules_index(self, module_pages: list[WikiPage]) -> str:
        """Generate the markdown body of the modules index page.

        Links are relative to ``modules/index.md``, so only the file name of
        each page is used.
        """
        lines = ["# Modules\n", "This section contains documentation for each module.\n"]
        lines.extend(
            f"- [{page.title}]({Path(page.path).stem}.md)"
            for page in module_pages
            if page.path != "modules/index.md"
        )
        return "\n".join(lines)

    async def _generate_file_docs(
        self, index_status: IndexStatus, progress_callback: Any = None
    ) -> list[WikiPage]:
        """Generate documentation for individual source files.

        Only files with at least two chunks that are not ``__init__.py`` are
        documented, capped at the 20 files with the most chunks.

        Args:
            index_status: The index status with file information.
            progress_callback: Accepted for interface symmetry; currently unused.

        Returns:
            File pages, preceded by a ``files/index.md`` page when at least
            one file page was generated.
        """
        pages: list[WikiPage] = []

        significant_files = [
            f
            for f in index_status.files
            if not f.path.endswith("__init__.py") and f.chunk_count >= 2
        ]

        # Limit to avoid too many LLM calls; prefer files with more chunks.
        max_files = 20
        if len(significant_files) > max_files:
            significant_files = sorted(
                significant_files, key=lambda f: f.chunk_count, reverse=True
            )[:max_files]

        for file_info in significant_files:
            file_path = Path(file_info.path)

            search_results = await self.vector_store.search(
                f"file:{file_info.path}",
                limit=50,
            )
            file_chunks = [r for r in search_results if r.chunk.file_path == file_info.path]

            if not file_chunks:
                # Fallback: search by filename
                search_results = await self.vector_store.search(
                    file_path.stem,
                    limit=30,
                )
                file_chunks = [
                    r for r in search_results if r.chunk.file_path == file_info.path
                ]

            if not file_chunks:
                continue

            # Build context from chunks (limited to keep the prompt small)
            context = "\n\n".join(
                f"Type: {r.chunk.chunk_type.value}\n"
                f"Name: {r.chunk.name}\n"
                f"Lines: {r.chunk.start_line}-{r.chunk.end_line}\n"
                f"```\n{r.chunk.content[:600]}\n```"
                for r in file_chunks[:15]
            )

            prompt = f"""Generate documentation for the file '{file_info.path}':

Language: {file_info.language}
Total code chunks: {file_info.chunk_count}

Code contents:
{context}

Generate comprehensive documentation that includes:
1. **File Overview**: Purpose and responsibility of this file
2. **Classes**: Document each class with its purpose, key methods, and usage
3. **Functions**: Document each function with parameters, return values, and purpose
4. **Usage Examples**: Show how to use the main components
5. **Dependencies**: What this file imports/depends on

Format as markdown with clear sections. Be specific about the actual code.
Do NOT include mermaid class diagrams - they will be auto-generated."""

            content = await self.llm.generate(prompt, system_prompt=SYSTEM_PROMPT)

            # Strip any LLM-generated class diagram section (we add our own)
            content = _LLM_CLASS_DIAGRAM_RE.sub("", content)

            # Use get_chunks_by_file for the complete chunk list (not just search results)
            all_file_chunks = await self.vector_store.get_chunks_by_file(file_info.path)
            class_diagram = generate_class_diagram(all_file_chunks)
            if class_diagram:
                content += "\n\n## Class Diagram\n\n" + class_diagram

            # Nested path structure: files/<dirs...>/<stem>.md
            wiki_path = "/".join(["files", *file_path.parts[:-1], f"{file_path.stem}.md"])

            pages.append(
                WikiPage(
                    path=wiki_path,
                    title=f"{file_path.name}",
                    content=content,
                    generated_at=time.time(),
                )
            )

        # Create files index
        if pages:
            files_index = WikiPage(
                path="files/index.md",
                title="Source Files",
                content=self._generate_files_index(pages),
                generated_at=time.time(),
            )
            pages.insert(0, files_index)

        return pages

    def _generate_files_index(self, file_pages: list[WikiPage]) -> str:
        """Generate the markdown body of the file documentation index.

        Pages are grouped under a heading per first directory below
        ``files/`` (``root`` for pages directly in ``files/``) and sorted by
        title within each group.
        """
        lines = [
            "# Source Files\n",
            "Detailed documentation for individual source files.\n",
        ]

        # Group by directory
        by_dir: dict[str, list[WikiPage]] = {}
        for page in file_pages:
            if page.path == "files/index.md":
                continue
            parts = Path(page.path).parts
            # files/DIR/file.md -> DIR
            dir_name = parts[1] if len(parts) > 2 else "root"
            by_dir.setdefault(dir_name, []).append(page)

        for dir_name, dir_pages in sorted(by_dir.items()):
            lines.append(f"\n## {dir_name}\n")
            for page in sorted(dir_pages, key=lambda p: p.title):
                # Link relative to files/index.md. Only the leading "files/"
                # is dropped so nested directories named "files" survive.
                rel_path = page.path.removeprefix("files/")
                lines.append(f"- [{page.title}]({rel_path})")

        return "\n".join(lines)

    async def _generate_dependencies(self, index_status: IndexStatus) -> WikiPage:
        """Generate dependencies documentation (``dependencies.md``)."""
        search_results = await self.vector_store.search(
            "import require include dependencies",
            limit=30,
        )

        import_chunks = [r for r in search_results if r.chunk.chunk_type.value == "import"]

        context = "\n\n".join(
            f"File: {r.chunk.file_path}\n{r.chunk.content}" for r in import_chunks[:20]
        )

        prompt = f"""Based on these import statements, generate a dependencies overview:

{context}

Generate documentation that includes:
1. External dependencies (libraries, packages)
2. Internal module dependencies
3. A Mermaid diagram showing dependency relationships (use ```mermaid code blocks)
4. Any notable dependency patterns

Format as markdown."""

        content = await self.llm.generate(prompt, system_prompt=SYSTEM_PROMPT)

        return WikiPage(
            path="dependencies.md",
            title="Dependencies",
            content=content,
            generated_at=time.time(),
        )

    def _write_page(self, page: WikiPage) -> None:
        """Write a wiki page to disk under ``self.wiki_path``, creating parent dirs."""
        page_path = self.wiki_path / page.path
        page_path.parent.mkdir(parents=True, exist_ok=True)
        # Explicit UTF-8: the platform default encoding may not be able to
        # represent everything in the generated markdown.
        page_path.write_text(page.content, encoding="utf-8")


async def generate_wiki(
    repo_path: Path,
    wiki_path: Path,
    vector_store: VectorStore,
    index_status: IndexStatus,
    config: Config | None = None,
    llm_provider: str | None = None,
    progress_callback: Any = None,
) -> WikiStructure:
    """Convenience function to generate wiki documentation.

    Args:
        repo_path: Path to the repository. Not used by this function; the
            repository location is read from ``index_status``.
        wiki_path: Path for wiki output.
        vector_store: Indexed vector store.
        index_status: Index status.
        config: Optional configuration.
        llm_provider: Optional LLM provider override.
        progress_callback: Optional progress callback.

    Returns:
        WikiStructure with generated pages.
    """
    generator = WikiGenerator(
        wiki_path=wiki_path,
        vector_store=vector_store,
        config=config,
        llm_provider_name=llm_provider,
    )
    return await generator.generate(index_status, progress_callback)

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/UrbanDiver/local-deepwiki-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

wiki.py•20.3 KiB