Local DeepWiki MCP Server

Overview Schema Related Servers Score Discussions

docstring_examples.py•8.88 KiB

"""Parse code examples from docstrings. This module extracts code examples from docstrings in two styles: 1. Python doctest-style (>>> prompts) 2. Google-style Examples sections These parsers are used by the example extraction pipeline to find usage examples embedded in documentation. """ from __future__ import annotations import re from dataclasses import dataclass from textwrap import dedent @dataclass(frozen=True, slots=True) class CodeExample: """A code example extracted from tests or docstrings. This is the unified data class for examples from any source. """ source: str # "test" or "docstring" code: str # The actual code snippet description: str | None = None # Description or context test_file: str | None = None # Path to test file (for test examples) language: str = "python" # Programming language expected_output: str | None = None # Expected output (for doctest examples) entity_name: str | None = None # Name of the function/class being demonstrated def parse_doctest_examples(docstring: str) -> list[CodeExample]: """Extract >>> doctest examples from a docstring. Parses Python doctest-style examples with >>> prompts and expected output. Args: docstring: The docstring to parse. Returns: List of CodeExample objects extracted from doctests. Example: >>> parse_doctest_examples(''' ... >>> add(1, 2) ... 3 ... >>> add(-1, 1) ... 0 ... 
''') [CodeExample(source='docstring', code='add(1, 2)', expected_output='3', ...)] """ if not docstring: return [] examples: list[CodeExample] = [] lines = docstring.split("\n") current_code_lines: list[str] = [] current_output_lines: list[str] = [] in_code = False for line in lines: stripped = line.strip() # Check for >>> prompt (start of code) if stripped.startswith(">>>"): # If we have accumulated code from before, save it if current_code_lines: code = "\n".join(current_code_lines) output = ( "\n".join(current_output_lines) if current_output_lines else None ) examples.append( CodeExample( source="docstring", code=code, expected_output=output, language="python", ) ) current_code_lines = [] current_output_lines = [] # Start new code block code_part = stripped[3:].strip() # Remove >>> if code_part: current_code_lines.append(code_part) in_code = True # Check for ... continuation elif stripped.startswith("...") and in_code: cont_part = stripped[3:].strip() # Remove ... current_code_lines.append(cont_part) # Expected output (non-empty line after code, not starting with >>> or ...) 
elif in_code and stripped and not stripped.startswith((">>>", "...")): current_output_lines.append(stripped) # Empty line may end the example elif in_code and not stripped and current_code_lines: # Save the accumulated example code = "\n".join(current_code_lines) output = "\n".join(current_output_lines) if current_output_lines else None examples.append( CodeExample( source="docstring", code=code, expected_output=output, language="python", ) ) current_code_lines = [] current_output_lines = [] in_code = False # Don't forget the last example if current_code_lines: code = "\n".join(current_code_lines) output = "\n".join(current_output_lines) if current_output_lines else None examples.append( CodeExample( source="docstring", code=code, expected_output=output, language="python", ) ) return examples def parse_google_style_examples(docstring: str) -> list[CodeExample]: """Extract examples from Google-style docstring Examples section. Parses the Examples: section of a Google-style docstring, extracting code blocks and their descriptions. Args: docstring: The docstring to parse. Returns: List of CodeExample objects from the Examples section. Example: >>> doc = ''' ... Examples: ... Basic usage: ... result = process("input") ... print(result) ... ... With options: ... result = process("input", verbose=True) ... ''' >>> examples = parse_google_style_examples(doc) >>> len(examples) 2 """ if not docstring: return [] examples: list[CodeExample] = [] # Find the Examples: section # Match "Examples:", "Example:", with optional leading whitespace example_pattern = re.compile( r"^\s*(Examples?)\s*:\s*$", re.MULTILINE | re.IGNORECASE, ) match = example_pattern.search(docstring) if not match: return [] # Extract from Examples: to end or next section start_idx = match.end() # Find the next section (Args:, Returns:, Raises:, etc.) 
section_pattern = re.compile( r"^\s*(Args?|Returns?|Raises?|Yields?|Attributes?|Note|Notes|Warning|Warnings|See Also|References?)\s*:", re.MULTILINE | re.IGNORECASE, ) end_match = section_pattern.search(docstring, start_idx) if end_match: examples_text = docstring[start_idx : end_match.start()] else: examples_text = docstring[start_idx:] # Parse the examples section lines = examples_text.split("\n") current_description: str | None = None current_code_lines: list[str] = [] base_indent: int | None = None def save_current_example() -> None: """Save the current accumulated example.""" nonlocal current_description, current_code_lines if current_code_lines: code = dedent("\n".join(current_code_lines)).strip() if code: examples.append( CodeExample( source="docstring", code=code, description=current_description, language="python", ) ) current_description = None current_code_lines = [] for line in lines: # Skip empty lines at the start if not line.strip() and not current_code_lines: continue # Calculate indentation stripped = line.lstrip() indent = len(line) - len(stripped) # Detect base indent level if base_indent is None and stripped: base_indent = indent if not stripped: # Empty line might separate examples if current_code_lines: current_code_lines.append("") continue # Line at base indent level might be a description if base_indent is not None and indent == base_indent: # Check if it looks like a description (ends with :) if stripped.endswith(":") and not stripped.startswith((">>>", "...")): # Save previous example if any save_current_example() current_description = stripped.rstrip(":") continue # Code line (more indented than base) if base_indent is not None and indent > base_indent: current_code_lines.append(line) elif stripped: # At base level, could be code if we're already collecting if current_code_lines: current_code_lines.append(line) else: # Could be description or start of code current_code_lines.append(line) # Save the last example save_current_example() 
return examples def parse_docstring_examples(docstring: str) -> list[CodeExample]: """Extract all examples from a docstring (doctests and Google-style). Combines doctest-style (>>>) examples and Google-style Examples section into a unified list. Args: docstring: The docstring to parse. Returns: List of CodeExample objects from all sources. """ if not docstring: return [] examples: list[CodeExample] = [] # Extract doctest examples doctest_examples = parse_doctest_examples(docstring) examples.extend(doctest_examples) # Extract Google-style examples (only if no doctests found, to avoid duplication) if not doctest_examples: google_examples = parse_google_style_examples(docstring) examples.extend(google_examples) return examples

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/UrbanDiver/local-deepwiki-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

docstring_examples.py•8.88 KiB