Enhanced Knowledge Graph Memory Server

tfidf.ts•2.71 KiB

/**
 * TF-IDF (Term Frequency-Inverse Document Frequency) Utilities
 *
 * Algorithms for calculating TF-IDF scores used in ranked search.
 * TF-IDF measures how important a term is to a document in a collection.
 *
 * All functions compare terms against the output of {@link tokenize}. Search
 * terms themselves are only lower-cased, not tokenized, so a term containing
 * whitespace or punctuation never matches any token and scores 0.
 *
 * @module utils/tfidf
 */

/**
 * Tokenize text into lowercase words.
 *
 * Every character that is not a Unicode letter, combining mark, digit,
 * underscore or whitespace is replaced by a space; the result is split on
 * whitespace and empty pieces are dropped.
 *
 * Unicode property escapes are used instead of `\w` because `\w` only covers
 * ASCII, which would split words such as "café" or "Zürich" at the accented
 * letter.
 *
 * @param text - Text to tokenize
 * @returns Array of lowercase tokens (empty when the text has no word characters)
 */
export function tokenize(text: string): string[] {
  return text
    .toLowerCase()
    .replace(/[^\p{L}\p{M}\p{N}_\s]/gu, ' ')
    .split(/\s+/)
    .filter(token => token.length > 0);
}

/**
 * Turn a raw occurrence count into a term frequency.
 * Returns 0 for an empty document so callers never divide by zero.
 */
function termFrequency(occurrences: number, totalTokens: number): number {
  return totalTokens === 0 ? 0 : occurrences / totalTokens;
}

/**
 * Turn a document-frequency count into an IDF value.
 * Returns 0 when the corpus is empty or no document contains the term.
 */
function inverseDocumentFrequency(docsWithTerm: number, totalDocs: number): number {
  if (totalDocs === 0 || docsWithTerm === 0) return 0;
  return Math.log(totalDocs / docsWithTerm);
}

/**
 * Calculate Term Frequency (TF) for a term in a document.
 *
 * TF = (Number of times term appears in document) / (Total terms in document)
 *
 * @param term - The search term (matched case-insensitively against whole tokens)
 * @param document - The document text
 * @returns Term frequency (0.0 to 1.0); 0 when the document has no tokens
 */
export function calculateTF(term: string, document: string): number {
  const termLower = term.toLowerCase();
  const tokens = tokenize(document);
  const occurrences = tokens.filter(t => t === termLower).length;
  return termFrequency(occurrences, tokens.length);
}

/**
 * Calculate Inverse Document Frequency (IDF) for a term across documents.
 *
 * IDF = log(Total documents / Documents containing term)
 *
 * @param term - The search term (matched case-insensitively against whole tokens)
 * @param documents - Array of document texts
 * @returns Inverse document frequency; 0 when the corpus is empty, when no
 *   document contains the term, or when every document contains it (log(1))
 */
export function calculateIDF(term: string, documents: readonly string[]): number {
  if (documents.length === 0) return 0;

  const termLower = term.toLowerCase();
  const docsWithTerm = documents.filter(doc =>
    tokenize(doc).includes(termLower)
  ).length;

  return inverseDocumentFrequency(docsWithTerm, documents.length);
}

/**
 * Calculate TF-IDF score for a term in a document.
 *
 * TF-IDF = TF * IDF
 *
 * Higher scores indicate more important/relevant terms.
 *
 * @param term - The search term
 * @param document - The document text
 * @param documents - Array of all documents
 * @returns TF-IDF score
 */
export function calculateTFIDF(
  term: string,
  document: string,
  documents: readonly string[]
): number {
  const tf = calculateTF(term, document);
  const idf = calculateIDF(term, documents);
  return tf * idf;
}

/**
 * Calculate TF-IDF scores for multiple search terms.
 *
 * Produces the same score per term as {@link calculateTFIDF}, but tokenizes
 * the target document and the corpus only once instead of once per term.
 *
 * @param terms - Array of search terms
 * @param document - The document text
 * @param documents - Array of all documents
 * @returns Map of term (as given, not lower-cased) to TF-IDF score
 */
export function calculateMultiTermTFIDF(
  terms: readonly string[],
  document: string,
  documents: readonly string[]
): Map<string, number> {
  // Tokenize once up front; this work does not depend on the term.
  const docTokens = tokenize(document);
  const tokenCounts = new Map<string, number>();
  for (const token of docTokens) {
    tokenCounts.set(token, (tokenCounts.get(token) ?? 0) + 1);
  }
  const corpusTokenSets = documents.map(doc => new Set(tokenize(doc)));

  const scores = new Map<string, number>();
  for (const term of terms) {
    const termLower = term.toLowerCase();

    const tf = termFrequency(tokenCounts.get(termLower) ?? 0, docTokens.length);

    let docsWithTerm = 0;
    for (const tokenSet of corpusTokenSets) {
      if (tokenSet.has(termLower)) docsWithTerm += 1;
    }
    const idf = inverseDocumentFrequency(docsWithTerm, corpusTokenSets.length);

    scores.set(term, tf * idf);
  }
  return scores;
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/danielsimonjr/memory-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

tfidf.ts•2.71 KiB