Relace MCP Server

analyze.py•5.63 KiB

"""Print a human-readable analysis of benchmark results stored as JSON or JSONL."""

import json
import statistics
import sys
from pathlib import Path
from typing import Any

from ..config import get_results_dir

# Width of the left-aligned "Case ID" column and the number of characters of
# the case id that are actually shown inside it.
_CASE_ID_WIDTH = 40
_CASE_ID_MAX_CHARS = 38

# Narrowest metric column; wide enough for a cell such as "100.0%".
_MIN_METRIC_WIDTH = 6

# (column header, result key) pairs for the detailed table.
_FILE_COLUMNS: tuple[tuple[str, str], ...] = (
    ("F.Rec", "file_recall"),
    ("F.Prec", "file_precision"),
)
_TARGET_ONLY_COLUMNS: tuple[tuple[str, str], ...] = _FILE_COLUMNS + (
    ("L.Cov", "line_coverage"),
    ("L.Prec(M)", "line_precision_matched"),
)
_CONTEXT_COLUMNS: tuple[tuple[str, str], ...] = _FILE_COLUMNS + (
    ("T.Cov", "line_coverage"),
    ("T.Prec(M)", "line_precision_matched"),
    ("C.Cov", "context_line_coverage"),
    ("C.Prec(M)", "context_line_precision_matched"),
)


def load_results(path: str) -> dict[str, Any]:
    """Load benchmark results from a JSON or JSONL file.

    A ``.jsonl`` file is read as one JSON document per non-blank line and
    returned as ``{"results": [...]}``. Any other file is parsed as a single
    JSON document: a top-level list is wrapped as ``{"results": [...]}`` and a
    top-level object is returned unchanged.

    Args:
        path: Location of the results file.

    Returns:
        A dict; for list and JSONL inputs the entries are under ``"results"``.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the content is not valid JSON.
        ValueError: If the top-level JSON value is neither a list nor an
            object.
    """
    path_obj = Path(path)

    if path_obj.suffix.lower() == ".jsonl":
        with path_obj.open(encoding="utf-8") as f:
            stripped_lines = (line.strip() for line in f)
            return {"results": [json.loads(s) for s in stripped_lines if s]}

    with path_obj.open(encoding="utf-8") as f:
        data = json.load(f)

    if isinstance(data, list):
        return {"results": data}
    if isinstance(data, dict):
        return data
    raise ValueError(
        f"Unsupported top-level JSON type in {path}: {type(data).__name__}"
    )


def _has_context_metrics(results: list[dict[str, Any]]) -> bool:
    """Return True when every result has both context-line metric keys."""
    return all(
        "context_line_precision_matched" in r and "context_line_coverage" in r
        for r in results
    )


def print_detailed_table(results: list[dict[str, Any]]) -> None:
    """Print one table row per result with its metrics shown as percentages.

    The context-line columns are included only when every result carries both
    context-line metrics. Header, separator and data rows are all generated
    from the same column widths so the column borders line up.

    Args:
        results: Result dicts. Each must contain ``case_id`` and the metric
            keys of the selected column set.
    """
    print("\n" + "=" * 80)
    print("DETAILED RESULTS")
    print("=" * 80)

    columns = _CONTEXT_COLUMNS if _has_context_metrics(results) else _TARGET_ONLY_COLUMNS
    widths = [max(len(header), _MIN_METRIC_WIDTH) for header, _ in columns]

    header_cells = [f"{'Case ID':<{_CASE_ID_WIDTH}}"]
    header_cells += [f"{header:<{w}}" for (header, _), w in zip(columns, widths)]
    # rstrip keeps the header free of trailing padding from the last column.
    print(" | ".join(header_cells).rstrip())
    print("-+-".join("-" * w for w in (_CASE_ID_WIDTH, *widths)))

    for r in results:
        case_id = r["case_id"][:_CASE_ID_MAX_CHARS]
        cells = [f"{case_id:<{_CASE_ID_WIDTH}}"]
        cells += [
            f"{r[key] * 100:.1f}%".rjust(w)
            for (_, key), w in zip(columns, widths)
        ]
        print(" | ".join(cells))


def print_distribution(results: list[dict[str, Any]], key: str, label: str) -> None:
    """Print a text histogram of ``results[*][key]`` in ten-point buckets.

    Values are multiplied by 100 before bucketing. Buckets are 0-10, 10-20,
    ..., 90-100, plus a final bucket for values of 100 and above.

    Args:
        results: Result dicts, each containing ``key``.
        key: Name of the metric to bucket.
        label: Human-readable metric name used in the heading.
    """
    values = [r[key] * 100 for r in results]
    buckets = [0] * 11
    last = len(buckets) - 1
    for v in values:
        # Clamp at both ends: a negative value must not wrap around to the
        # last bucket through negative indexing.
        idx = max(0, min(int(v // 10), last))
        buckets[idx] += 1

    print(f"\n{label} Distribution:")
    total = len(values)
    for i, count in enumerate(buckets):
        label_str = "100%" if i == last else f"{i * 10:2d}-{(i + 1) * 10:2d}%"
        bar = "█" * count
        pct = count / total * 100 if total else 0
        # Width 7 fits the longest label ("90-100%") so the bars line up.
        print(f" {label_str:>7}: {bar:<15} {count} ({pct:.0f}%)")


def print_worst_cases(results: list[dict[str, Any]], key: str, label: str, n: int = 3) -> None:
    """Print the ``n`` results with the lowest value of ``key``.

    Args:
        results: Result dicts. Each must contain ``key``, ``case_id``,
            ``line_coverage``, ``turns_used`` and ``latency_ms``;
            ``context_line_coverage`` and ``error`` are printed when present.
        key: Name of the metric to rank by (ascending).
        label: Human-readable metric name used in the output.
        n: Number of cases to show.
    """
    worst = sorted(results, key=lambda r: r[key])[:n]

    print(f"\nWorst {n} cases by {label}:")
    for r in worst:
        print(f" - {r['case_id']}")
        print(f" {label}: {r[key] * 100:.1f}%")
        print(f" Target Line Coverage: {r['line_coverage'] * 100:.1f}%")
        if "context_line_coverage" in r:
            print(f" Context Line Coverage: {r['context_line_coverage'] * 100:.1f}%")
        print(f" Turns: {r['turns_used']}, Latency: {r['latency_ms']:.0f}ms")
        if r.get("error"):
            print(f" Error: {r['error']}")
        print()


def print_summary_stats(results: list[dict[str, Any]], key: str, label: str) -> None:
    """Print mean, median, min, max and range of ``results[*][key]``.

    Values are multiplied by 100 and shown as percentages. Nothing is printed
    when ``results`` is empty.

    Args:
        results: Result dicts, each containing ``key``.
        key: Name of the metric to summarize.
        label: Human-readable metric name used in the heading.
    """
    values = sorted(r[key] * 100 for r in results)
    if not values:
        return

    mean = statistics.fmean(values)
    median = statistics.median(values)
    # The list is sorted, so the extremes are its two ends.
    min_v, max_v = values[0], values[-1]

    print(f"\n{label} Stats:")
    print(f" Mean: {mean:.1f}%")
    print(f" Median: {median:.1f}%")
    print(f" Min: {min_v:.1f}%")
    print(f" Max: {max_v:.1f}%")
    print(f" Range: {max_v - min_v:.1f}%")


def main() -> None:
    """Analyze the results file named on the command line and print a report.

    The first command-line argument is the results path; without it,
    ``benchmark_results.json`` inside ``get_results_dir()`` is used. Exits
    with status 1 (message on stderr) when the file is missing, cannot be
    loaded, or contains no results.
    """
    default_path = get_results_dir() / "benchmark_results.json"
    path = sys.argv[1] if len(sys.argv) > 1 else str(default_path)

    if not Path(path).exists():
        print(f"Error: File not found: {path}", file=sys.stderr)
        sys.exit(1)

    try:
        data = load_results(path)
    except (OSError, ValueError) as exc:
        # json.JSONDecodeError is a ValueError subclass, so malformed JSON
        # lands here too instead of producing a traceback.
        print(f"Error: Could not load {path}: {exc}", file=sys.stderr)
        sys.exit(1)

    results = data.get("results", [])
    if not results:
        print("No results found.", file=sys.stderr)
        sys.exit(1)

    print(f"Analyzing {len(results)} benchmark results from: {path}")
    has_context = _has_context_metrics(results)

    # Detailed table
    print_detailed_table(results)

    # Distribution
    print_distribution(results, "line_precision_matched", "Line Prec(M)")
    if has_context:
        print_distribution(results, "context_line_precision_matched", "Context Line Prec(M)")

    # Summary stats
    print_summary_stats(results, "line_precision_matched", "Line Prec(M)")
    print_summary_stats(results, "line_coverage", "Line Coverage")
    if has_context:
        print_summary_stats(results, "context_line_precision_matched", "Context Line Prec(M)")
        print_summary_stats(results, "context_line_coverage", "Context Line Coverage")

    # Worst cases
    print_worst_cases(results, "line_precision_matched", "Line Prec(M)", n=3)


if __name__ == "__main__":
    main()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/possible055/relace-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

analyze.py•5.63 KiB