"""Tests for REPL integration."""

import shutil
from pathlib import Path
import pytest
import pytest_asyncio
from lean_lsp_mcp.repl import Repl, _split_imports, find_repl_binary


# =============================================================================
# Unit Tests
# =============================================================================


def test_find_repl_binary_from_lake_packages(tmp_path: Path, monkeypatch):
"""Auto-detect REPL in .lake/packages."""
monkeypatch.delenv("LEAN_REPL_PATH", raising=False)
repl_path = tmp_path / ".lake" / "packages" / "repl" / ".lake" / "build" / "bin"
repl_path.mkdir(parents=True)
(repl_path / "repl").touch()
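    # A plain empty file is enough here: this test only exercises path discovery.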
found = find_repl_binary(str(tmp_path))
assert found == str(repl_path / "repl")


def test_find_repl_binary_env_var_takes_precedence(tmp_path: Path, monkeypatch):
"""LEAN_REPL_PATH env var takes precedence."""
custom = tmp_path / "custom_repl"
custom.touch()
monkeypatch.setenv("LEAN_REPL_PATH", str(custom))
found = find_repl_binary(str(tmp_path))
assert found == str(custom)
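

# A hedged sketch, assuming find_repl_binary signals "not found" by returning
# None; if the real contract raises instead, swap the assert for pytest.raises.
def test_find_repl_binary_not_found(tmp_path: Path, monkeypatch):
    monkeypatch.delenv("LEAN_REPL_PATH", raising=False)
    assert find_repl_binary(str(tmp_path)) is None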


@pytest.mark.parametrize(
"code,header,body",
[
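        # single import block split cleanly from the body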
("import Mathlib\n\ndef x := 1", "import Mathlib", "def x := 1"),
(
"import Foo\nimport Bar\n\ndef x := 1",
"import Foo\nimport Bar",
"def x := 1",
),
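        # no imports: header is empty, body passes through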
("def x := 1", "", "def x := 1"),
("import Foo\nimport Foo\n\ndef x := 1", "import Foo", "def x := 1"),
("import Foo\n\n\ndef x := 1", "import Foo", "def x := 1"),
],
)
def test_split_imports(code: str, header: str, body: str):
h, b = _split_imports(code)
assert h == header
assert b == body


def test_split_imports_preserves_specific_mathlib():
"""Specific Mathlib imports are preserved (faster than import Mathlib)."""
code = (
"import Mathlib.Data.Nat\nimport Mathlib.Data.List\nimport Other\n\ndef x := 1"
)
header, _ = _split_imports(code)
assert "import Mathlib.Data.Nat" in header
assert "import Mathlib.Data.List" in header
assert "import Other" in header


# =============================================================================
# Integration Tests (require REPL binary)
# =============================================================================


@pytest_asyncio.fixture
async def repl(test_project_path: Path, monkeypatch):
# Check multiple possible locations for REPL binary
candidates = [
test_project_path / ".lake" / "build" / "bin" / "repl",
test_project_path
/ ".lake"
/ "packages"
/ "repl"
/ ".lake"
/ "build"
/ "bin"
/ "repl",
]
repl_bin = next((p for p in candidates if p.exists()), None)
if not repl_bin:
found = shutil.which("repl")
repl_bin = Path(found) if found else None
if not repl_bin:
pytest.skip("REPL binary not found")
monkeypatch.setenv("LEAN_REPL_PATH", str(repl_bin))
monkeypatch.setenv("LEAN_REPL_TIMEOUT", "30")
r = Repl(project_dir=str(test_project_path))
yield r
await r.close()


@pytest.mark.asyncio
async def test_run_snippets_returns_results(repl: Repl):
results = await repl.run_snippets("theorem t : 1 = 1 := by\n", ["rfl", "simp"])
assert len(results) == 2
assert any(r.error is None for r in results)


@pytest.mark.asyncio
async def test_header_caching_reuses_repl(repl: Repl):
"""Header caching keeps same REPL across calls with same imports."""
base = "theorem t : 1 = 1 := by\n"
await repl.run_snippets(base, ["rfl"])
proc1 = repl._proc
await repl.run_snippets(base, ["rfl"])
proc2 = repl._proc
assert proc1 is proc2 # Same process reused
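

# A hedged sketch of the inverse case: this assumes the REPL cache is keyed on
# the import header, so a different header should spawn a fresh process.
@pytest.mark.asyncio
async def test_header_change_restarts_repl(repl: Repl):
    await repl.run_snippets("theorem t : 1 = 1 := by\n", ["rfl"])
    proc1 = repl._proc
    # `import Mathlib.Tactic` produces a different header than the bare body above.
    await repl.run_snippets(
        "import Mathlib.Tactic\n\ntheorem t : 1 = 1 := by\n", ["rfl"]
    )
    proc2 = repl._proc
    assert proc1 is not proc2  # new header => new process (assumed behavior)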


@pytest.mark.asyncio
async def test_backtracking_isolation(repl: Repl):
base = "theorem t : 1 + 1 = 2 := by\n"
results = await repl.run_snippets(
base,
[
"have h : False := sorry; exact h.elim",
"rfl",
],
)
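    # The failing sorry-based snippet must not leak its state into the next one.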
assert len(results) == 2
assert results[1].error is None # rfl specifically should work


@pytest.mark.skip(reason="Manual benchmark; unskip to compare REPL vs LSP timings.")
@pytest.mark.asyncio
async def test_benchmark_repl_vs_lsp(repl: Repl, mcp_client_factory, test_project_path):
"""Benchmark: REPL vs LSP for multi_attempt.
Uses GoalSample.lean which has `import Mathlib` - same as most test files.
REPL advantage: tactic mode runs tactics without reparsing body.
"""
import json
import time
from tests.helpers.mcp_client import result_text
tactics = ["rfl", "simp", "omega", "decide", "trivial", "rfl", "simp", "rfl"]
# Same as BenchmarkTest.lean - fair comparison with LSP
# Goal: 1 = 1 (solvable by rfl, simp, omega, decide)
base = """\
import Mathlib
theorem benchmark : 1 = 1 := by
"""
# Cold REPL (starts subprocess + loads Mathlib + first body parse)
start = time.perf_counter()
await repl.run_snippets(base, tactics)
repl_cold = time.perf_counter() - start
# Warm REPL (subprocess cached with Mathlib, body re-parsed but tactics fast)
start = time.perf_counter()
repl_results = await repl.run_snippets(base, tactics)
repl_warm = time.perf_counter() - start
# Cold LSP - use BenchmarkTest.lean which has same `import Mathlib`
# Line 6 is `sorry` - multi_attempt replaces it with each tactic
async with mcp_client_factory() as client:
start = time.perf_counter()
await client.call_tool(
"lean_multi_attempt",
{
"file_path": str(test_project_path / "BenchmarkTest.lean"),
"line": 6,
"snippets": tactics,
},
)
lsp_cold = time.perf_counter() - start
# Warm LSP (file compiled, but each tactic is separate edit)
start = time.perf_counter()
lsp_result = await client.call_tool(
"lean_multi_attempt",
{
"file_path": str(test_project_path / "BenchmarkTest.lean"),
"line": 6,
"snippets": tactics,
},
)
lsp_warm = time.perf_counter() - start
lsp_data = json.loads(result_text(lsp_result))
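    # Reduce both backends to per-tactic "goal closed" booleans so the final
    # assertion compares outcomes rather than timings.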
repl_success = [r.goals == [] and r.error is None for r in repl_results]
lsp_success = [a["goals"] == [] for a in lsp_data["items"]]
# Per-tactic timing
repl_per = repl_warm / len(tactics) * 1000
lsp_per = lsp_warm / len(tactics) * 1000
print(f"\n{'=' * 60}")
print(f"Tactics: {len(tactics)}")
print(
f"REPL cold: {repl_cold:.2f}s | warm: {repl_warm * 1000:.0f}ms ({repl_per:.0f}ms/tactic)"
)
print(
f"LSP cold: {lsp_cold:.2f}s | warm: {lsp_warm * 1000:.0f}ms ({lsp_per:.0f}ms/tactic)"
)
if repl_warm < lsp_warm:
print(f"REPL is {lsp_warm / repl_warm:.1f}x faster (warm)")
else:
print(f"LSP is {repl_warm / lsp_warm:.1f}x faster (warm)")
print(f"{'=' * 60}")
assert repl_success == lsp_success, "Results differ!"