Tea Rags MCP

reranker.test.ts•22.7 KiB

import { describe, expect, it } from "vitest";

import {
  getAvailablePresets,
  rerankSearchCodeResults,
  rerankSemanticSearchResults,
  type RerankableResult,
} from "./reranker.js";

/**
 * Partial override for the `git` section of a result payload.
 *
 * The type is derived from `RerankableResult` itself so the fixtures below
 * follow whatever fields the reranker declares for git metadata.
 */
type GitOverrides = Partial<
  RerankableResult["payload"] extends infer P ? (P extends { git?: infer G } ? G : never) : never
>;

describe("reranker", () => {
  /**
   * Builds a mock search result that carries git metadata.
   *
   * @param score - similarity score; also embedded in the generated path
   * @param ageDays - value stored in `git.ageDays`
   * @param commitCount - value stored in `git.commitCount`
   * @param isDoc - value stored in `payload.isDocumentation`
   * @param extraGit - extra git fields, spread last so they win over the defaults
   */
  function createResult(
    score: number,
    ageDays: number,
    commitCount: number,
    isDoc = false,
    extraGit: GitOverrides = {},
  ): RerankableResult {
    return {
      score,
      payload: {
        relativePath: `src/file-${score}.ts`,
        startLine: 1,
        endLine: 50,
        language: "typescript",
        isDocumentation: isDoc,
        git: {
          ageDays,
          commitCount,
          dominantAuthor: "alice",
          authors: ["alice"],
          ...extraGit,
        },
      },
    };
  }

  describe("rerankSemanticSearchResults", () => {
    // Fixture shared by every test in this suite.
    const mockResults: RerankableResult[] = [
      createResult(0.9, 10, 2), // high similarity, recent, stable
      createResult(0.8, 100, 20), // medium similarity, old, high churn
      createResult(0.7, 5, 1), // lower similarity, very recent, very stable
    ];

    it("should not change order for 'relevance' preset (default)", () => {
      const ranked = rerankSemanticSearchResults(mockResults, "relevance");

      // Scores must come back in the same order as the fixture.
      [0.9, 0.8, 0.7].forEach((expectedScore, position) => {
        expect(ranked[position].score).toBe(expectedScore);
      });
    });

    it("should boost old and high-churn code for 'techDebt' preset", () => {
      const ranked = rerankSemanticSearchResults(mockResults, "techDebt");

      // The old (ageDays=100), high-churn (commitCount=20) entry is the one
      // this preset is meant to favour.
      // NOTE(review): this only checks the entry is still present, not its rank.
      const agedChurnyEntry = ranked.find((entry) => entry.payload?.git?.ageDays === 100);
      expect(agedChurnyEntry).toBeDefined();
    });

    it("should boost recent changes for 'codeReview' preset", () => {
      const ranked = rerankSemanticSearchResults(mockResults, "codeReview");

      // The freshest entry (ageDays=5) is the one this preset is meant to favour.
      // NOTE(review): this only checks the entry is still present, not its rank.
      const freshEntry = ranked.find((entry) => entry.payload?.git?.ageDays === 5);
      expect(freshEntry).toBeDefined();
    });

    it("should boost documentation for 'onboarding' preset", () => {
      const codeEntry = createResult(0.8, 30, 5, false);
      const docEntry = createResult(0.7, 30, 5, true);
      const resultsWithDocs: RerankableResult[] = [codeEntry, docEntry];

      const ranked = rerankSemanticSearchResults(resultsWithDocs, "onboarding");

      // NOTE(review): this only checks the documentation entry is still present.
      const rankedDoc = ranked.find((entry) => entry.payload?.isDocumentation === true);
      expect(rankedDoc).toBeDefined();
    });

    it("should support custom weights", () => {
      const customWeights = { similarity: 0.5, recency: 0.5 };

      const ranked = rerankSemanticSearchResults(mockResults, { custom: customWeights });

      // Every input must still be present after reranking with custom weights.
      expect(ranked).toHaveLength(3);
    });

    it("should handle results without git metadata", () => {
      const noGitResults: RerankableResult[] = [
        { score: 0.9, payload: { relativePath: "file1.ts" } },
        { score: 0.8, payload: { relativePath: "file2.ts" } },
      ];

      const ranked = rerankSemanticSearchResults(noGitResults, "techDebt");

      // Must not throw when `git` is absent; both entries are returned.
      expect(ranked).toHaveLength(2);
    });
  });

  describe("rerankSearchCodeResults", () => {
    // Fixture shared by every test in this suite.
    const mockResults: RerankableResult[] = [
      createResult(0.9, 100, 10), // high similarity, old
      createResult(0.8, 5, 2), // medium similarity, very recent
      createResult(0.7, 50, 1), // lower similarity, stable
    ];

    it("should not change order for 'relevance' preset", () => {
      const ranked = rerankSearchCodeResults(mockResults, "relevance");

      // Scores must come back in the same order as the fixture.
      [0.9, 0.8, 0.7].forEach((expectedScore, position) => {
        expect(ranked[position].score).toBe(expectedScore);
      });
    });

    it("should boost recent code for 'recent' preset", () => {
      const ranked = rerankSearchCodeResults(mockResults, "recent");

      // The ageDays=5 entry is the one this preset is meant to favour.
      // NOTE(review): this only checks the entry is still present, not its rank.
      const freshEntry = ranked.find((entry) => entry.payload?.git?.ageDays === 5);
      expect(freshEntry).toBeDefined();
    });

    it("should boost stable code for 'stable' preset", () => {
      const ranked = rerankSearchCodeResults(mockResults, "stable");

      // commitCount=1 is the most stable entry in the fixture.
      // NOTE(review): this only checks the entry is still present, not its rank.
      const steadyEntry = ranked.find((entry) => entry.payload?.git?.commitCount === 1);
      expect(steadyEntry).toBeDefined();
    });

    it("should support custom weights", () => {
      const customWeights = { similarity: 0.7, stability: 0.3 };

      const ranked = rerankSearchCodeResults(mockResults, { custom: customWeights });

      expect(ranked).toHaveLength(3);
    });
  });

  describe("getAvailablePresets", () => {
    it("should return semantic_search presets", () => {
      const presets = getAvailablePresets("semantic_search");

      const expectedPresets = [
        "relevance",
        "techDebt",
        "hotspots",
        "codeReview",
        "onboarding",
        "securityAudit",
        "refactoring",
        "ownership",
        "impactAnalysis",
      ];
      for (const presetName of expectedPresets) {
        expect(presets).toContain(presetName);
      }
    });

    it("should return search_code presets", () => {
      const presets = getAvailablePresets("search_code");

      for (const presetName of ["relevance", "recent", "stable"]) {
        expect(presets).toContain(presetName);
      }
      // techDebt belongs to semantic_search only.
      expect(presets).not.toContain("techDebt");
    });
  });

  describe("new signals: bugFix, volatility, density, chunkChurn", () => {
    it("should normalize bugFix signal correctly (50% → 0.5)", () => {
      const candidates = [
        createResult(0.8, 30, 5, false, { bugFixRate: 50 }),
        createResult(0.8, 30, 5, false, { bugFixRate: 0 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { bugFix: 1.0 },
      });

      // The 50% bugFixRate entry must lead, with a strictly higher score.
      expect(ordered[0].payload?.git?.bugFixRate).toBe(50);
      expect(ordered[0].score).toBeGreaterThan(ordered[1].score);
    });

    it("should prefer chunk-level churn over file-level in hotspots", () => {
      // Churny file (20 commits) whose chunk is cold (chunkCommitCount=1).
      const coldChunkInHotFile = createResult(0.8, 10, 20, false, { chunkCommitCount: 1 });
      // Quiet file (3 commits) whose chunk is hot (chunkCommitCount=15).
      const hotChunkInQuietFile = createResult(0.8, 10, 3, false, { chunkCommitCount: 15 });

      const ordered = rerankSemanticSearchResults([coldChunkInHotFile, hotChunkInQuietFile], "hotspots");

      // The hot chunk must win regardless of its file-level churn.
      expect(ordered[0].payload?.git?.chunkCommitCount).toBe(15);
    });

    it("should boost high bugFixRate + old code in techDebt preset", () => {
      const candidates = [
        createResult(0.8, 200, 10, false, { bugFixRate: 80, churnVolatility: 30 }),
        createResult(0.8, 10, 10, false, { bugFixRate: 5, churnVolatility: 2 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "techDebt");

      // Old code with a high bug-fix rate must lead.
      expect(ordered[0].payload?.git?.bugFixRate).toBe(80);
    });

    it("should not crash when mixing chunk-level and file-level results", () => {
      const withChunkData = createResult(0.9, 10, 5, false, { chunkCommitCount: 8 });
      const fileLevelOnly = createResult(0.8, 20, 3, false);

      const ordered = rerankSemanticSearchResults([withChunkData, fileLevelOnly], "hotspots");

      expect(ordered).toHaveLength(2);
    });

    it("should use dominantAuthorPct for ownership when available", () => {
      const candidates = [
        createResult(0.8, 30, 5, false, { dominantAuthorPct: 90, authors: ["alice", "bob", "charlie"] as any }),
        createResult(0.8, 30, 5, false, { dominantAuthorPct: 30, authors: ["a", "b", "c", "d"] as any }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "ownership");

      // The 90% dominant-author entry must lead.
      expect(ordered[0].payload?.git?.dominantAuthorPct).toBe(90);
    });

    it("should boost density signal in codeReview preset", () => {
      const denseChange = createResult(0.8, 5, 3, false, { changeDensity: 15 });
      const sparseChange = createResult(0.8, 5, 3, false, { changeDensity: 1 });

      const ordered = rerankSemanticSearchResults([denseChange, sparseChange], "codeReview");

      expect(ordered[0].payload?.git?.changeDensity).toBe(15);
    });
  });

  describe("new signals: relativeChurnNorm, burstActivity, pathRisk, knowledgeSilo, chunkRelativeChurn", () => {
    it("should normalize relativeChurn via relativeChurnNorm signal", () => {
      // The LOW value goes first, so the assertion fails if the signal has no effect.
      const candidates = [
        createResult(0.8, 100, 10, false, { relativeChurn: 0.1 }),
        createResult(0.8, 100, 10, false, { relativeChurn: 4.0 }),
      ];

      // Custom weights isolate the signal under test.
      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, relativeChurnNorm: 0.9 },
      });

      // The high relativeChurn entry must have moved to the front.
      expect(ordered[0].payload?.git?.relativeChurn).toBe(4.0);
    });

    it("should normalize recencyWeightedFreq via burstActivity signal", () => {
      // The LOW value goes first, so the assertion fails if the signal has no effect.
      const candidates = [
        createResult(0.8, 5, 3, false, { recencyWeightedFreq: 0.5 }),
        createResult(0.8, 5, 3, false, { recencyWeightedFreq: 8.0 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, burstActivity: 0.9 },
      });

      // The high recencyWeightedFreq entry must have moved to the front.
      expect(ordered[0].payload?.git?.recencyWeightedFreq).toBe(8.0);
    });

    it("should wire pathRisk into securityAudit preset", () => {
      // Two results that differ only in their path.
      const atPath = (relativePath: string): RerankableResult => ({
        score: 0.8,
        payload: {
          relativePath,
          startLine: 1,
          endLine: 50,
          language: "typescript",
          git: { ageDays: 100, commitCount: 10, bugFixRate: 50 },
        },
      });
      // The non-auth path goes first; the preset must lift the auth path above it.
      const candidates: RerankableResult[] = [atPath("src/utils/format.ts"), atPath("src/auth/login.ts")];

      const ordered = rerankSemanticSearchResults(candidates, "securityAudit");

      expect(ordered[0].payload?.relativePath).toBe("src/auth/login.ts");
    });

    it("should flag single-contributor code via knowledgeSilo signal", () => {
      // Both entries share dominantAuthorPct=80, so only contributorCount differs.
      // The multi-contributor entry goes first; it must be displaced.
      const candidates = [
        createResult(0.8, 30, 5, false, {
          contributorCount: 5,
          dominantAuthorPct: 80,
          authors: ["a", "b", "c", "d", "e"] as any,
        }),
        createResult(0.8, 30, 5, false, { contributorCount: 1, dominantAuthorPct: 80, authors: ["alice"] as any }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, knowledgeSilo: 0.9 },
      });

      // The single-contributor entry must lead.
      expect(ordered[0].payload?.git?.contributorCount).toBe(1);
    });

    it("should normalize chunkChurnRatio via chunkRelativeChurn signal", () => {
      // chunkCommitCount is identical; only the ratio differs. LOW ratio first.
      const candidates = [
        createResult(0.8, 10, 10, false, { chunkCommitCount: 5, chunkChurnRatio: 0.1 }),
        createResult(0.8, 10, 10, false, { chunkCommitCount: 5, chunkChurnRatio: 0.9 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, chunkRelativeChurn: 0.9 },
      });

      // The high chunkChurnRatio entry must have moved to the front.
      expect(ordered[0].payload?.git?.chunkChurnRatio).toBe(0.9);
    });
  });

  describe("chunk-level preference for bugFix and knowledgeSilo", () => {
    it("should prefer chunkBugFixRate over file-level bugFixRate", () => {
      // Entry 1: file-level rate is high (80) but chunk-level rate is low (10).
      // Entry 2: file-level rate is low (10) but chunk-level rate is high (80).
      // Entry 2 can only lead if the chunk-level value is the one consulted.
      const candidates = [
        createResult(0.8, 30, 10, false, { bugFixRate: 80, chunkBugFixRate: 10 }),
        createResult(0.8, 30, 10, false, { bugFixRate: 10, chunkBugFixRate: 80 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, bugFix: 0.9 },
      });

      expect(ordered[0].payload?.git?.chunkBugFixRate).toBe(80);
    });

    it("should prefer chunkContributorCount over file-level contributorCount for knowledgeSilo", () => {
      // Entry 1: one contributor at file level, three at chunk level.
      // Entry 2: five contributors at file level, one at chunk level.
      // Entry 2 can only lead if the chunk-level count is the one consulted.
      const candidates = [
        createResult(0.8, 30, 10, false, { contributorCount: 1, chunkContributorCount: 3 }),
        createResult(0.8, 30, 10, false, { contributorCount: 5, chunkContributorCount: 1 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.1, knowledgeSilo: 0.9 },
      });

      expect(ordered[0].payload?.git?.chunkContributorCount).toBe(1);
    });
  });

  describe("blockPenalty: penalize block chunks without chunk-level data", () => {
    /**
     * Builds a mock result with an explicit `chunkType` and fixed file-level
     * git defaults; `git` overrides are spread last.
     */
    function createResultWithChunkType(score: number, chunkType: string, git: GitOverrides = {}): RerankableResult {
      return {
        score,
        payload: {
          relativePath: `src/file-${score}.ts`,
          startLine: 1,
          endLine: 50,
          language: "typescript",
          chunkType,
          git: {
            ageDays: 10,
            commitCount: 20,
            dominantAuthor: "alice",
            authors: ["alice"],
            recencyWeightedFreq: 5.0,
            bugFixRate: 40,
            churnVolatility: 20,
            ...git,
          },
        },
      };
    }

    it("should penalize block chunks without chunk-level data in hotspots", () => {
      // Same file-level data on both; only the chunk type differs.
      const bareBlock = createResultWithChunkType(0.8, "block", {});
      const bareFunction = createResultWithChunkType(0.8, "function", {});

      const ordered = rerankSemanticSearchResults([bareBlock, bareFunction], "hotspots");

      // The function must outrank the block.
      expect(ordered[0].payload?.chunkType).toBe("function");
    });

    it("should NOT penalize block chunks that have chunk-level data", () => {
      const blockWithChunkData = createResultWithChunkType(0.8, "block", {
        chunkCommitCount: 15,
        chunkChurnRatio: 0.8,
      });
      const bareFunction = createResultWithChunkType(0.8, "function", {});

      const ordered = rerankSemanticSearchResults([blockWithChunkData, bareFunction], "hotspots");

      // The block carries chunk-level data and a high chunkCommitCount, so it leads.
      expect(ordered[0].payload?.chunkType).toBe("block");
    });

    it("should NOT penalize function/class/interface chunks", () => {
      const candidates = ["function", "class", "interface"].map((chunkType) =>
        createResultWithChunkType(0.8, chunkType, {}),
      );

      const ordered = rerankSemanticSearchResults(candidates, "hotspots");

      // With no penalty applied, neighbouring scores are equal.
      expect(ordered[0].score).toBeCloseTo(ordered[1].score, 5);
      expect(ordered[1].score).toBeCloseTo(ordered[2].score, 5);
    });

    it("should apply blockPenalty in techDebt preset", () => {
      const sharedGit = { ageDays: 200 };
      const candidates = [
        createResultWithChunkType(0.8, "block", sharedGit),
        createResultWithChunkType(0.8, "function", sharedGit),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "techDebt");

      expect(ordered[0].payload?.chunkType).toBe("function");
    });

    it("should apply blockPenalty in codeReview preset", () => {
      const sharedGit = { changeDensity: 15 };
      const candidates = [
        createResultWithChunkType(0.8, "block", sharedGit),
        createResultWithChunkType(0.8, "function", sharedGit),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "codeReview");

      expect(ordered[0].payload?.chunkType).toBe("function");
    });

    it("should apply blockPenalty in refactoring preset", () => {
      const sharedGit = { relativeChurn: 3.0 };
      const candidates = [
        createResultWithChunkType(0.8, "block", sharedGit),
        createResultWithChunkType(0.8, "function", sharedGit),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "refactoring");

      expect(ordered[0].payload?.chunkType).toBe("function");
    });

    it("should support blockPenalty as custom negative weight", () => {
      const candidates = [
        createResultWithChunkType(0.8, "block", {}),
        createResultWithChunkType(0.7, "function", {}),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.5, churn: 0.3, blockPenalty: -0.3 },
      });

      // The function must lead despite its lower similarity score.
      expect(ordered[0].payload?.chunkType).toBe("function");
    });

    it("should not affect presets without blockPenalty (e.g., onboarding)", () => {
      const candidates = [
        createResultWithChunkType(0.9, "block", {}),
        createResultWithChunkType(0.7, "function", {}),
      ];

      const ordered = rerankSemanticSearchResults(candidates, "onboarding");

      // The block keeps first place on its higher similarity score.
      expect(ordered[0].payload?.chunkType).toBe("block");
    });
  });

  describe("confidence dampening for small sample sizes", () => {
    it("should dampen bugFixRate=100% on commitCount=1 vs reliable commitCount=10", () => {
      // Undampened the bugFix signal would be 100/100=1.0 vs 50/100=0.5, so the first entry wins.
      // Dampened it is expected to be 1.0*0.2=0.2 vs 0.5*1.0=0.5, so the second entry wins.
      const candidates = [
        createResult(0.8, 30, 1, false, { bugFixRate: 100 }),
        createResult(0.8, 30, 10, false, { bugFixRate: 50 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { bugFix: 1.0 },
      });

      expect(ordered[0].payload?.git?.commitCount).toBe(10);
    });

    it("should not dampen when commitCount >= 5", () => {
      const candidates = [
        createResult(0.8, 30, 10, false, { bugFixRate: 30 }),
        createResult(0.8, 30, 10, false, { bugFixRate: 80 }),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { bugFix: 1.0 },
      });

      expect(ordered[0].payload?.git?.bugFixRate).toBe(80);
    });

    it("should zero statistical signals when commitCount=0", () => {
      // Minimal payload with commitCount pinned to zero.
      const zeroCommitResult = (score: number, relativePath: string, bugFixRate: number): RerankableResult => ({
        score,
        payload: { relativePath, startLine: 1, endLine: 50, git: { commitCount: 0, bugFixRate } },
      });
      const candidates: RerankableResult[] = [
        zeroCommitResult(0.7, "a.ts", 100),
        zeroCommitResult(0.9, "b.ts", 0),
      ];

      const ordered = rerankSemanticSearchResults(candidates, {
        custom: { similarity: 0.5, bugFix: 0.5 },
      });

      // With bugFix zeroed out, the higher-similarity entry decides the order.
      expect(ordered[0].payload?.relativePath).toBe("b.ts");
    });

    it("should NOT dampen recency (factual signal)", () => {
      // Both entries have commitCount=1, and recency is a factual signal.
      // If it were dampened, both would score ~0 recency and tie on similarity.
      // Undampened, the recent entry (ageDays=5) has to come out on top.
      const staleEntry = createResult(0.8, 200, 1);
      const recentEntry = createResult(0.8, 5, 1);

      const ordered = rerankSemanticSearchResults([staleEntry, recentEntry], {
        custom: { recency: 1.0 },
      });

      expect(ordered[0].payload?.git?.ageDays).toBe(5);
    });

    it("should dampen ownership for single-commit chunks in hotspots", () => {
      // commitCount=1 gives an inflated bugFixRate=100% and trivially complete ownership.
      // commitCount=10 gives a moderate bugFixRate=40% backed by real history.
      // The hotspots signals built on these values are expected to be dampened.
      const singleCommitEntry = createResult(0.8, 10, 1, false, {
        chunkCommitCount: 1,
        chunkChurnRatio: 1.0,
        recencyWeightedFreq: 1.0,
        bugFixRate: 100,
        churnVolatility: 30,
      });
      const establishedEntry = createResult(0.8, 10, 10, false, {
        chunkCommitCount: 8,
        chunkChurnRatio: 0.8,
        recencyWeightedFreq: 5.0,
        bugFixRate: 40,
        churnVolatility: 20,
      });

      const ordered = rerankSemanticSearchResults([singleCommitEntry, establishedEntry], "hotspots");

      expect(ordered[0].payload?.git?.commitCount).toBe(10);
    });
  });

  describe("edge cases", () => {
    it("should handle empty results", () => {
      const ranked = rerankSemanticSearchResults([], "techDebt");

      expect(ranked).toEqual([]);
    });

    it("should handle single result", () => {
      const single = [createResult(0.9, 10, 5)];

      const ranked = rerankSemanticSearchResults(single, "techDebt");

      expect(ranked).toHaveLength(1);
    });

    it("should handle results with missing payload", () => {
      const noPayload: RerankableResult[] = [{ score: 0.9 }, { score: 0.8 }];

      const ranked = rerankSemanticSearchResults(noPayload, "techDebt");

      expect(ranked).toHaveLength(2);
    });

    it("should handle unknown preset gracefully", () => {
      // The cast forces a preset name the type would otherwise reject.
      const ranked = rerankSemanticSearchResults([createResult(0.9, 10, 5)], "unknownPreset" as any);

      // The call must not throw and must return the single input.
      // NOTE(review): presumably falls back to relevance; not verifiable from this file.
      expect(ranked).toHaveLength(1);
    });
  });
});

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/artk0de/TeaRAGs-MCP'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

reranker.test.ts•22.7 KiB