swift-patterns-mcp

search.ts•6.43 KiB

// src/utils/search.ts
// Advanced search utilities with fuzzy matching and smart stemming

import MiniSearch from 'minisearch';
import { stemmer } from 'stemmer';
import { normalizeTokens } from './search-terms.js';

/** Minimal shape a document must have to be indexed and searched. */
export interface SearchableDocument {
  id: string;
  title: string;
  content: string;
  topics: string[];
}

/** A single hit: the original document, its raw MiniSearch score, and the query terms found in it. */
interface SearchResult<T> {
  item: T;
  score: number;
  matches: string[];
}

interface SearchOptions {
  fuzzy?: number; // Fuzzy matching threshold (0-1, default 0.2)
  boost?: Record<string, number>; // Field boosting
  minScore?: number; // Minimum score threshold
}

/**
 * Custom tokenizer: delegates splitting/normalization to `normalizeTokens`
 * and stems every resulting token with `stemmer`.
 */
function tokenize(text: string): string[] {
  return normalizeTokens(text, (token) => stemmer(token));
}

/** Process a query with the same tokenization used for indexing, for consistent matching. */
function processQuery(query: string): string[] {
  return tokenize(query);
}

/**
 * Full-text index over a set of documents, backed by MiniSearch.
 *
 * Documents are tokenized with the stemming tokenizer above; the original
 * (unprocessed) documents are kept in a side map so results return them as-is.
 */
export class SearchIndex<T extends SearchableDocument> {
  private miniSearch: MiniSearch<T>;
  private documents: Map<string, T> = new Map();
  // Lazily computed stemmed token sets per document id, used by findMatches.
  private stemmedTokens: Map<string, Set<string>> = new Map();

  /**
   * @param fields Document fields to index.
   */
  constructor(fields: string[] = ['title', 'content', 'topics']) {
    this.miniSearch = new MiniSearch<T>({
      fields,
      storeFields: ['id'],
      tokenize, // Uses our smart tokenizer
      processTerm: (term) => term, // Already processed by tokenize
      searchOptions: {
        boost: { title: 2, topics: 1.5, content: 1 },
        fuzzy: 0.2,
        prefix: true,
      },
    });
  }

  /**
   * Replace the entire index content with `docs`.
   * Any previously indexed documents are discarded first.
   */
  addDocuments(docs: T[]): void {
    // Clear existing documents and every cache derived from them
    this.miniSearch.removeAll();
    this.documents.clear();
    this.stemmedTokens.clear();

    // Preprocess documents for indexing
    const processedDocs = docs.map((doc) => ({
      ...doc,
      // Join topics array into one string for indexing
      topics: Array.isArray(doc.topics) ? doc.topics.join(' ') : doc.topics,
    }));

    // Add to MiniSearch
    this.miniSearch.addAll(processedDocs);

    // Store original documents for retrieval
    for (const doc of docs) {
      this.documents.set(doc.id, doc);
    }
  }

  /**
   * Search the index.
   *
   * @param query Free-text query.
   * @param options Optional fuzzy threshold, field boosts and minimum score.
   * @returns Hits whose score is at least `minScore`, each paired with the
   *          query terms that were found in the document.
   */
  search(query: string, options: SearchOptions = {}): SearchResult<T>[] {
    const {
      fuzzy = 0.2,
      boost = { title: 2, topics: 1.5, content: 1 },
      minScore = 0,
    } = options;

    // Stemmed query terms, used to report which terms matched
    const queryTerms = processQuery(query);

    const hits = this.miniSearch.search(query, {
      fuzzy,
      prefix: true,
      boost,
      combineWith: 'OR',
    });

    // Map hits back to the original documents
    const results: SearchResult<T>[] = [];
    for (const hit of hits) {
      // Negated >= so a NaN score is excluded
      if (!(hit.score >= minScore)) continue;

      const doc = this.documents.get(hit.id);
      if (!doc) continue;

      results.push({
        item: doc,
        score: hit.score,
        matches: this.findMatches(doc, queryTerms),
      });
    }
    return results;
  }

  /**
   * Determine which (stemmed) query terms occur in `doc`.
   *
   * A term counts as matched when it is either a substring of the lowercased
   * document text, or equal to one of the document's stemmed tokens. The
   * second check matters because the index is built from stemmed tokens: a
   * stem that is not a literal substring of the word it came from would
   * otherwise never be reported as a match.
   *
   * @returns The distinct matched terms, in query order.
   */
  private findMatches(doc: T, queryTerms: string[]): string[] {
    // Guard against non-array topics, mirroring addDocuments
    const topicsText = Array.isArray(doc.topics)
      ? doc.topics.join(' ')
      : String(doc.topics ?? '');
    const searchText = `${doc.title} ${doc.content} ${topicsText}`.toLowerCase();

    const matched = new Set<string>();
    let docTokens: Set<string> | undefined;

    for (const term of queryTerms) {
      if (searchText.includes(term)) {
        matched.add(term);
        continue;
      }
      // Only tokenize the document when the cheap substring check fails
      if (docTokens === undefined) {
        docTokens = this.getStemmedTokens(doc, topicsText);
      }
      if (docTokens.has(term)) {
        matched.add(term);
      }
    }

    return [...matched];
  }

  /** Stemmed token set of a document's title, content and topics; cached per document id. */
  private getStemmedTokens(doc: T, topicsText: string): Set<string> {
    const cached = this.stemmedTokens.get(doc.id);
    if (cached) return cached;

    const tokens = new Set<string>([
      ...tokenize(doc.title),
      ...tokenize(doc.content),
      ...tokenize(topicsText),
    ]);
    this.stemmedTokens.set(doc.id, tokens);
    return tokens;
  }
}

/**
 * CachedSearchIndex - Manages a SearchIndex with automatic invalidation based on document changes.
 * Eliminates duplicated search caching logic across pattern sources.
 */
export class CachedSearchIndex<T extends SearchableDocument> {
  private searchIndex: SearchIndex<T> | null = null;
  private indexedPatternsHash: string | null = null;
  private fields: string[];

  /**
   * @param fields Document fields to index; forwarded to every SearchIndex built.
   */
  constructor(fields: string[] = ['title', 'content', 'topics']) {
    this.fields = fields;
  }

  /**
   * Search patterns with automatic index caching.
   * Index is rebuilt only when patterns change (detected via hash).
   *
   * The hash covers only the number of patterns and their ids, so a change to
   * a pattern's title/content/topics with unchanged ids is NOT detected; call
   * `invalidate()` in that case.
   *
   * @param patterns Documents to search.
   * @param query Free-text query.
   * @param options Optional fuzzy threshold, field boosts and minimum raw score.
   * @returns Copies of the matching patterns with `relevanceScore` replaced by a
   *          combined score (80% query-aware, 20% the pattern's own
   *          `relevanceScore`), sorted by that score in descending order.
   */
  search(patterns: T[], query: string, options: SearchOptions = {}): T[] {
    const {
      fuzzy = 0.2,
      boost = { title: 2.5, topics: 1.8, content: 1 },
      minScore = 0,
    } = options;

    // O(total id length) additive fingerprint — order-insensitive
    let hash = 0;
    for (const p of patterns) {
      for (let i = 0; i < p.id.length; i++) {
        hash = (hash + p.id.charCodeAt(i) * (i + 1)) | 0;
      }
    }
    const patternsHash = `${patterns.length}:${hash}`;

    // Rebuild index only if patterns changed
    if (!this.searchIndex || this.indexedPatternsHash !== patternsHash) {
      this.searchIndex = new SearchIndex<T>(this.fields);
      this.searchIndex.addDocuments(patterns);
      this.indexedPatternsHash = patternsHash;
    }

    // minScore is forwarded so callers can actually use the documented option
    const results = this.searchIndex.search(query, { fuzzy, boost, minScore });

    // Count DISTINCT query terms for the coverage penalty: matches are
    // de-duplicated, so the denominator must be too.
    const queryTermCount = new Set(processQuery(query)).size;

    // Normalize MiniSearch scores using relative ranking, absolute
    // confidence, and query term coverage.
    // reduce() instead of Math.max(...spread) to avoid the engine's argument
    // count limit on very large result sets.
    const maxSearchScore =
      results.length > 0
        ? results.reduce((max, r) => Math.max(max, r.score), -Infinity)
        : 1;

    // Absolute confidence: how strong is the best match overall?
    const confidenceFactor = Math.min(maxSearchScore / 10, 1);

    return results
      .map((result) => {
        // Relative score within this result set (0-100)
        const relativeScore =
          maxSearchScore > 0 ? (result.score / maxSearchScore) * 100 : 0;

        // Term coverage: what fraction of query terms matched?
        // If query is "Apple Books Hero Effect" (4 terms) but only "effect"
        // matched (1/4 = 0.25), the score drops significantly.
        const coverageFactor =
          queryTermCount > 0 ? result.matches.length / queryTermCount : 1;

        // Apply both confidence and coverage factors
        const normalizedSearch = relativeScore * confidenceFactor * coverageFactor;

        // Documents are not required to carry a relevanceScore; treat a missing
        // or non-finite value as 0 so the combined score never becomes NaN.
        const rawRelevance = (result.item as T & { relevanceScore?: unknown })
          .relevanceScore;
        const staticRelevance =
          typeof rawRelevance === 'number' && Number.isFinite(rawRelevance)
            ? rawRelevance
            : 0;

        // 80% query-aware search score, 20% static quality
        const combined = Math.round(normalizedSearch * 0.8 + staticRelevance * 0.2);

        return {
          ...result.item,
          relevanceScore: combined,
        };
      })
      .sort((a, b) => b.relevanceScore - a.relevanceScore);
  }

  /**
   * Invalidate the cached index (call after fetching new patterns)
   */
  invalidate(): void {
    this.searchIndex = null;
    this.indexedPatternsHash = null;
  }
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/efremidze/swift-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

search.ts•6.43 KiB