"""Offline query optimization helper consuming cached manifest + history data."""
from __future__ import annotations

import json
from dataclasses import asdict, dataclass
from pathlib import Path
from typing import Any

from .path_utils import find_repo_root, resolve_history_path


@dataclass
class OptimizationFinding:
    """A single optimization hint derived from cached execution metadata."""

    level: str
    message: str
    detail: str | None = None
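

# Illustrative shape of one history JSONL entry, inferred from the keys this
# module reads; the exact schema is an assumption and unknown keys are ignored:
# {"execution_id": "abc123", "status": "success", "duration_ms": 1200,
#  "rowcount": 42, "cache_manifest": ".cache/manifest.json",
#  "artifacts": {"sql_path": ".cache/query.sql"}}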


def _read_history_entries(history_path: Path) -> list[dict[str, Any]]:
    """Return every parseable JSON object from a JSONL history file."""
    if not history_path.exists():
        raise FileNotFoundError(f"history file not found: {history_path}")
    entries: list[dict[str, Any]] = []
    with history_path.open("r", encoding="utf-8") as fh:
        for line in fh:
            line = line.strip()
            if not line:
                continue
            try:
                entries.append(json.loads(line))
            except json.JSONDecodeError:
                # Skip malformed lines instead of failing the whole report.
                continue
    return entries


def _select_entry(entries: list[dict[str, Any]], execution_id: str | None) -> dict[str, Any]:
    """Pick the requested execution, or fall back to the most recent usable entry."""
    if execution_id:
        for entry in reversed(entries):
            if str(entry.get("execution_id")) == execution_id:
                return entry
        raise ValueError(f"execution_id {execution_id} not found in history")
    # Default to the latest successful or cache_hit entry.
    for entry in reversed(entries):
        if entry.get("status") in {"success", "cache_hit"}:
            return entry
    if entries:
        return entries[-1]
    raise ValueError("history file is empty")


def _load_manifest(entry: dict[str, Any]) -> dict[str, Any]:
    """Load the cache manifest referenced by a history entry, or {} if unavailable."""
    artifacts = entry.get("artifacts") or {}
    manifest_path = entry.get("cache_manifest") or artifacts.get("cache_manifest")
    if not manifest_path:
        return {}
    path = Path(manifest_path)
    if not path.is_absolute():
        repo_root = find_repo_root()
        path = (repo_root / path).resolve()
    if not path.exists():
        return {}
    try:
        return json.loads(path.read_text(encoding="utf-8"))
    except (OSError, json.JSONDecodeError):
        return {}


def _load_sql_text(entry: dict[str, Any]) -> str | None:
    """Read the SQL text recorded for the execution, or None if it is missing."""
    artifacts = entry.get("artifacts") or {}
    sql_path = artifacts.get("sql_path")
    if not sql_path:
        return None
    path = Path(sql_path)
    if not path.is_absolute():
        repo_root = find_repo_root()
        path = (repo_root / path).resolve()
    if not path.exists():
        return None
    try:
        return path.read_text(encoding="utf-8")
    except OSError:
        return None
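

# Illustrative cache-manifest shape the heuristics below rely on; only the keys
# actually read (duration_ms, rowcount, objects[].name) matter, and the rest of
# the schema is an assumption:
# {"duration_ms": 73000, "rowcount": 120,
#  "objects": [{"name": "SALES.ORDERS"}, {"name": "SALES.CUSTOMERS"}]}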


def _detect_findings(
    sql: str | None,
    manifest: dict[str, Any],
    entry: dict[str, Any],
) -> list[OptimizationFinding]:
    """Apply simple offline heuristics to the execution metadata and SQL text."""
    findings: list[OptimizationFinding] = []
    duration = entry.get("duration_ms") or manifest.get("duration_ms") or 0
    rowcount = entry.get("rowcount") or manifest.get("rowcount") or 0
    objects = manifest.get("objects") or []
    if sql and "select *" in sql.lower():
        findings.append(
            OptimizationFinding(
                level="info",
                message="Replace SELECT * with an explicit column list",
                detail="Selecting all columns prevents column pruning and increases scan time.",
            )
        )
    if duration and duration > 60_000 and rowcount and rowcount < 5_000:
        findings.append(
            OptimizationFinding(
                level="warn",
                message="Long runtime for a small result set",
                detail="Add WHERE clauses or leverage clustering/filters to reduce the data scanned.",
            )
        )
    if len(objects) > 3:
        names = [o.get("name") for o in objects if isinstance(o, dict)]
        findings.append(
            OptimizationFinding(
                level="info",
                message="Query joins many objects",
                detail=f"Referenced objects: {', '.join(filter(None, names))}",
            )
        )
    if entry.get("status") == "timeout":
        findings.append(
            OptimizationFinding(
                level="error",
                message="Query timed out",
                detail=(
                    "Consider filtering by clustering keys or adding WHERE clauses to reduce data scanned "
                    "before increasing timeout_seconds. Alternatively, run asynchronously or sample with LIMIT."
                ),
            )
        )
    if not findings:
        findings.append(
            OptimizationFinding(
                level="info",
                message="No obvious issues detected",
                detail=(
                    "Query metadata looks healthy. Review warehouse size or predicate selectivity if latency persists."
                ),
            )
        )
    return findings


def optimize_execution(
    execution_id: str | None = None,
    *,
    history_path: str | None = None,
) -> dict[str, Any]:
    """Build an offline optimization report for one recorded execution."""
    path = Path(history_path).expanduser() if history_path else resolve_history_path()
    entries = _read_history_entries(path)
    entry = _select_entry(entries, execution_id)
    manifest = _load_manifest(entry)
    sql = _load_sql_text(entry)
    findings = _detect_findings(sql, manifest, entry)
    return {
        "execution_id": entry.get("execution_id"),
        "status": entry.get("status"),
        "duration_ms": entry.get("duration_ms") or manifest.get("duration_ms"),
        "rowcount": entry.get("rowcount") or manifest.get("rowcount"),
        "objects": manifest.get("objects"),
        "sql_path": (entry.get("artifacts") or {}).get("sql_path"),
        "findings": [asdict(finding) for finding in findings],
    }
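

if __name__ == "__main__":
    # Minimal usage sketch: print the report for the most recent usable history
    # entry. Assumes a history file resolvable via resolve_history_path(); pass
    # history_path="..." or an execution_id to inspect a specific run instead.
    report = optimize_execution()
    print(json.dumps(report, indent=2, default=str))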