MCP Code Analysis Server

utils.py•10.2 KiB

"""Utility functions for MCP tools."""

import asyncio
import json
import math
from datetime import UTC, datetime
from pathlib import Path
from typing import Any, cast

from sqlalchemy import select
from sqlalchemy.ext.asyncio import AsyncSession

from src.database.models import Class, File, Function, Module
from src.logger import get_logger

logger = get_logger(__name__)

# Single source of truth for the supported entity types and their ORM models.
_EntityModel = type[Function] | type[Class] | type[Module] | type[File]
_ENTITY_MODELS: dict[str, _EntityModel] = {
    "function": Function,
    "class": Class,
    "module": Module,
    "file": File,
}

# Substrings that mark a dictionary key as sensitive (matched case-insensitively).
_SENSITIVE_KEY_PARTS = frozenset(
    {
        "password",
        "secret",
        "token",
        "key",
        "api_key",
        "access_token",
        "refresh_token",
        "private_key",
    },
)


class InvalidEntityTypeError(ValueError):
    """Raised when an entity type is invalid."""

    def __init__(self, entity_type: str) -> None:
        super().__init__(f"Invalid entity type: {entity_type}")


def format_file_path(path: str, repo_root: str | None = None) -> str:
    """Format file path for display.

    Backslashes are converted to forward slashes, a single leading ``./`` is
    dropped, and ``repo_root`` (if given) is stripped when it is a real
    directory prefix of ``path``.

    Args:
        path: File path to format
        repo_root: Repository root to strip from absolute paths

    Returns:
        Formatted file path
    """
    if not path:
        return path

    # Normalize separators so Windows and POSIX paths compare equal.
    path = path.replace("\\", "/")

    # Remove leading ./
    if path.startswith("./"):
        path = path[2:]

    if repo_root:
        # Normalize the root the same way as the path, and drop trailing
        # slashes so "/repo" and "/repo/" behave identically.
        root = repo_root.replace("\\", "/").rstrip("/")
        if path == root:
            return ""
        # Require a separator after the root: "/repo" must not match
        # "/repository/file.py".
        if path.startswith(root + "/"):
            path = path[len(root) :].lstrip("/")

    return path


def format_function_signature(
    name: str,
    parameters: str | None = None,
    return_type: str | None = None,
) -> str:
    """Format function signature for display.

    Args:
        name: Function name
        parameters: JSON string of parameters or None
        return_type: Return type annotation or None

    Returns:
        Formatted function signature
    """
    param_str = ""
    if parameters:
        try:
            params = json.loads(parameters)
        except (ValueError, TypeError):
            # Undecodable parameters are rendered as an empty parameter list.
            param_str = ""
        else:
            if isinstance(params, list):
                param_str = ", ".join(str(p) for p in params)
            elif isinstance(params, dict):
                # Support dict-style {name: type}
                param_str = ", ".join(f"{k}: {v}" for k, v in params.items())
            else:
                param_str = str(params)

    signature = f"{name}({param_str})"
    if return_type:
        signature += f" -> {return_type}"
    return signature


def _ago(count: int, unit: str) -> str:
    """Render a count of units as e.g. "1 minute ago" or "3 minutes ago"."""
    suffix = "" if count == 1 else "s"
    return f"{count} {unit}{suffix} ago"


def format_timestamp(timestamp: datetime | None) -> str:
    """Format timestamp for human-readable display.

    Args:
        timestamp: Datetime to format; naive values are treated as UTC.
            A falsy value (e.g. None) yields "never".

    Returns:
        Human-readable time string
    """
    if not timestamp:
        return "never"

    # Ensure timezone awareness so the subtraction below is valid.
    if timestamp.tzinfo is None:
        timestamp = timestamp.replace(tzinfo=UTC)

    elapsed_seconds = (datetime.now(UTC) - timestamp).total_seconds()

    # Also covers timestamps in the future (negative elapsed time).
    if elapsed_seconds < 60:
        return "just now"

    minutes = int(elapsed_seconds / 60)
    if minutes < 60:
        return _ago(minutes, "minute")

    hours = minutes // 60
    if hours < 24:
        return _ago(hours, "hour")

    days = hours // 24
    if days < 30:
        return _ago(days, "day")

    # Older - show actual date
    return timestamp.strftime("%Y-%m-%d %H:%M")


def validate_entity_type(entity_type: str) -> bool:
    """Validate entity type.

    Args:
        entity_type: Entity type to validate

    Returns:
        True if valid, False otherwise
    """
    return entity_type in _ENTITY_MODELS


def validate_file_path(path: str) -> bool:
    """Validate file path for safety.

    Args:
        path: File path to validate

    Returns:
        True if valid and safe, False otherwise
    """
    if not path or not path.strip():
        return False

    # Null bytes and line breaks are never legitimate in a path here.
    if "\x00" in path or "\n" in path or "\r" in path:
        return False

    # Reject excessive path traversal (more than three ".." occurrences).
    return path.count("..") <= 3


def parse_entity_reference(reference: str) -> tuple[str | None, str | None, str | None]:
    """Parse entity reference string.

    Format: "type:name[@file]"

    Args:
        reference: Entity reference string

    Returns:
        Tuple of (entity_type, entity_name, file_path); all None when the
        reference is empty, has no ":" or has nothing after the ":".
    """
    if not reference:
        return None, None, None

    entity_type, colon, rest = reference.partition(":")
    if not colon or not rest:
        return None, None, None

    # Everything after the first "@" is the optional file path.
    entity_name, at_sign, file_path = rest.partition("@")
    return entity_type, entity_name, (file_path if at_sign else None)


def paginate_results(
    items: list[Any],
    page: int = 1,
    page_size: int = 20,
) -> dict[str, Any]:
    """Paginate a list of results.

    Args:
        items: List of items to paginate
        page: Page number (1-based); values below 1 are treated as 1
        page_size: Items per page; a non-positive size yields no items

    Returns:
        Dictionary with paginated results
    """
    total = len(items)

    # A page below 1 would produce negative slice indices and silently
    # return items counted from the end of the list.
    page = max(page, 1)

    if page_size > 0:
        pages = math.ceil(total / page_size)
        start = (page - 1) * page_size
        page_items = items[start : start + page_size]
    else:
        # Avoid division by zero and negative-length slices.
        pages = 1
        page_items = []

    return {
        "items": page_items,
        "total": total,
        "page": page,
        "pages": pages,
        "page_size": page_size,
        "has_next": page < pages,
        "has_prev": page > 1,
    }


async def get_entity_by_type_and_id(
    db_session: AsyncSession,
    entity_type: str,
    entity_id: int,
) -> Function | Class | Module | File | None:
    """Get entity by type and ID.

    Args:
        db_session: Database session
        entity_type: Type of entity
        entity_id: Entity ID

    Returns:
        Entity object or None

    Raises:
        InvalidEntityTypeError: If ``entity_type`` is not a supported type
            (a ``ValueError`` subclass).
    """
    if not validate_entity_type(entity_type):
        raise InvalidEntityTypeError(entity_type)

    model = _ENTITY_MODELS[entity_type]

    result = await db_session.execute(
        select(model).where(model.id == entity_id),
    )
    return cast("Function | Class | Module | File | None", result.scalar_one_or_none())


def _read_text_limited(path: Path, max_size: int) -> str | None:
    """Read at most ``max_size`` characters of UTF-8 text, or None if too large."""
    # Fail fast on very large files
    try:
        if path.stat().st_size > max_size:
            return None
    except OSError:
        # If stat fails, fall back to best-effort read with size limit
        pass

    # Bound the read itself instead of loading the whole file and slicing.
    with path.open(encoding="utf-8") as handle:
        return handle.read(max(max_size, 0))


async def get_file_content_safe(
    file_path: str,
    max_size: int = 1_000_000,  # 1MB default
) -> str | None:
    """Safely read file content with size limit.

    All filesystem access (stat and read) runs in a worker thread so the
    event loop is not blocked.

    Args:
        file_path: Path to file
        max_size: Maximum file size to read

    Returns:
        File content or None if error
    """
    try:
        return await asyncio.to_thread(_read_text_limited, Path(file_path), max_size)
    except OSError:
        # Missing file, permission problems and other I/O errors are expected.
        return None
    except Exception:
        logger.exception("Error reading file %s", file_path)
        return None


def format_error_response(
    message: str,
    code: str | None = None,
    details: dict[str, Any] | None = None,
) -> dict[str, Any]:
    """Format error response for consistency.

    Args:
        message: Error message
        code: Optional error code
        details: Optional error details

    Returns:
        Formatted error response
    """
    response: dict[str, Any] = {
        "status": "error",
        "error": message,
    }

    if code:
        response["code"] = code

    if details is not None:
        response["details"] = details

    return response


def sanitize_output(data: dict[str, Any]) -> dict[str, Any]:
    """Sanitize output by removing sensitive data.

    A value is replaced with "[REDACTED]" when its key contains any of the
    sensitive substrings, compared case-insensitively. Only top-level keys
    are inspected; nested containers are passed through unchanged.

    Args:
        data: Data dictionary to sanitize

    Returns:
        Sanitized data
    """
    sanitized: dict[str, Any] = {}
    for key, value in data.items():
        lowered = key.lower()
        is_sensitive = any(part in lowered for part in _SENSITIVE_KEY_PARTS)
        sanitized[key] = "[REDACTED]" if is_sensitive else value
    return sanitized


def calculate_similarity_score(
    text1: str,
    text2: str,
    case_sensitive: bool = True,
) -> float:
    """Calculate simple similarity score between two strings.

    The score is the number of positions at which both strings hold the same
    character, divided by the length of the longer string.

    Args:
        text1: First text
        text2: Second text
        case_sensitive: Whether to consider case

    Returns:
        Similarity score between 0 and 1
    """
    if not case_sensitive:
        text1 = text1.lower()
        text2 = text2.lower()

    if text1 == text2:
        return 1.0

    # The strings differ, so at least one is non-empty and the divisor is > 0.
    longer = max(len(text1), len(text2))
    matches = sum(c1 == c2 for c1, c2 in zip(text1, text2, strict=False))
    return matches / longer


def parse_code_location(location: str) -> tuple[str | None, int | None, int | None]:
    """Parse code location string.

    Format: "file:line:column" or "file:line" or "file". A leading Windows
    drive prefix such as ``C:\\`` or ``C:/`` is kept as part of the file.

    Args:
        location: Location string

    Returns:
        Tuple of (file_path, line, column); all None when the location is
        empty or malformed.
    """
    if not location:
        return None, None, None

    # Set a drive prefix aside so its colon is not mistaken for a separator.
    drive = ""
    rest = location
    if (
        len(location) >= 3
        and location[0].isascii()
        and location[0].isalpha()
        and location[1] == ":"
        and location[2] in "\\/"
    ):
        drive, rest = location[:2], location[2:]

    file_part, *numbers = rest.split(":")
    if len(numbers) > 2:
        return None, None, None

    try:
        parsed = [int(number) for number in numbers]
    except ValueError:
        return None, None, None

    line = parsed[0] if parsed else None
    column = parsed[1] if len(parsed) > 1 else None
    return drive + file_part, line, column

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/johannhartmann/mcpcodeanalysis'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

utils.py•10.2 KiB