Flint Note

Overview Schema Related Servers Score Discussions

search.ts•27.8 KiB

/**
 * Search Manager
 *
 * Handles search operations across notes, including text search,
 * filtering by type, and maintaining search indices.
 */

import path from 'path';
import fs from 'fs/promises';
import { Workspace } from './workspace.js';
import { parseFrontmatter, parseNoteContent } from '../utils/yaml-parser.js';
import type { NoteMetadata } from '../types/index.js';

/** Shape of the JSON document stored at the workspace's search index path. */
interface SearchIndex {
  version: string;
  last_updated: string;
  /** Index entries keyed by the note path they were indexed under. */
  notes: Record<string, SearchIndexEntry>;
}

/** One indexed note. */
interface SearchIndexEntry {
  /** Searchable text: title, note body and tags joined with spaces. */
  content: string;
  title: string;
  type: string;
  tags: string[];
  /** ISO timestamp used for "most recent first" ordering. */
  updated: string;
  metadata: Record<string, unknown>;
}

interface SearchResult {
  id: string;
  title: string;
  type: string;
  tags: string[];
  score: number;
  snippet: string;
  lastUpdated: string;
  filename: string;
  path: string;
  created: string;
  modified: string;
  size: number;
  metadata: Record<string, unknown>;
}

interface TagSearchResult {
  id: string;
  title: string;
  type: string;
  tags: string[];
  lastUpdated: string;
}

interface TagInfo {
  tag: string;
  count: number;
}

interface SimilarNoteResult {
  id: string;
  title: string;
  type: string;
  tags: string[];
  similarity: number;
  lastUpdated: string;
}

interface ParsedNote {
  metadata: NoteMetadata;
  content: string;
}

interface RebuildResult {
  indexedNotes: number;
  timestamp: string;
}

/** A note that matched a search, before file stats and snippet are attached. */
interface RankedNote {
  notePath: string;
  noteData: SearchIndexEntry;
  score: number;
}

const INDEX_VERSION = '1.0.0';

/** Create a fresh, empty index stamped with the current time. */
function createEmptyIndex(): SearchIndex {
  return { version: INDEX_VERSION, last_updated: new Date().toISOString(), notes: {} };
}

/**
 * Parse the raw text of an index file.
 *
 * A blank file is treated as an empty index. Anything that is not a JSON
 * object with an object-valued `notes` property is rejected, so callers never
 * iterate over a malformed structure.
 *
 * @throws SyntaxError when the text is not valid JSON.
 * @throws Error when the JSON does not have the expected shape.
 */
function parseIndexFile(raw: string): SearchIndex {
  if (!raw.trim()) {
    return createEmptyIndex();
  }

  const parsed: unknown = JSON.parse(raw);
  if (typeof parsed !== 'object' || parsed === null) {
    throw new Error('Search index file is malformed');
  }

  const candidate = parsed as Partial<SearchIndex>;
  if (
    typeof candidate.notes !== 'object' ||
    candidate.notes === null ||
    Array.isArray(candidate.notes)
  ) {
    throw new Error('Search index file is malformed');
  }

  return candidate as SearchIndex;
}

/** True when `error` is an Error carrying the `ENOENT` code. */
function isMissingFileError(error: unknown): boolean {
  return error instanceof Error && 'code' in error && error.code === 'ENOENT';
}

/** Escape every regex metacharacter so `text` is matched literally. */
function escapeRegExp(text: string): string {
  return text.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
}

/**
 * Read a count from a frequency map, ignoring inherited properties so that
 * words such as "constructor" do not resolve to `Object.prototype` members.
 */
function ownCount(counts: Record<string, number>, word: string): number {
  return Object.prototype.hasOwnProperty.call(counts, word) ? (counts[word] ?? 0) : 0;
}

/**
 * Coerce a frontmatter `tags` value into a string array. A single string
 * becomes a one-element array; anything that is neither an array nor a
 * non-blank string becomes an empty array.
 */
function normalizeTags(rawTags: unknown): string[] {
  if (Array.isArray(rawTags)) {
    return rawTags.filter(tag => tag != null).map(tag => String(tag));
  }
  if (typeof rawTags === 'string' && rawTags.trim() !== '') {
    return [rawTags];
  }
  return [];
}

export class SearchManager {
  #workspace: Workspace;

  /** Tail of the promise chain that serialises index writes across all instances. */
  static #globalIndexLock: Promise<void> = Promise.resolve();

  constructor(workspace: Workspace) {
    this.#workspace = workspace;
  }

  /**
   * Search notes by content and/or type.
   *
   * @param query Whitespace-separated search terms, or a regex source when
   *   `useRegex` is true. Empty or undefined matches every note.
   * @param typeFilter When truthy, only notes whose indexed type equals it are returned.
   * @param limit Maximum number of results (applied with `Array.prototype.slice`).
   * @param useRegex Treat `query` as a case-insensitive regular expression.
   * @returns Matches ordered by score (highest first), or by last update
   *   (newest first) when the query is empty.
   * @throws Error prefixed with `Search failed:` for text-search failures, or
   *   `Regex search failed:` for regex-search failures.
   */
  async searchNotes(
    query: string | undefined,
    typeFilter: string | null = null,
    limit: number = 10,
    useRegex: boolean = false
  ): Promise<SearchResult[]> {
    try {
      const searchIndex = await this.loadSearchIndex();
      const safeQuery = query ?? '';

      if (useRegex) {
        // Deliberately not awaited here: regex failures keep their own
        // "Regex search failed" message instead of being re-wrapped below.
        return this.searchWithRegex(safeQuery, typeFilter, limit, searchIndex);
      }

      const searchTerms = safeQuery
        .toLowerCase()
        .split(/\s+/)
        .filter(term => term.length > 0);

      // No terms: every note matches.
      if (searchTerms.length === 0) {
        return await this.#listAllNotes(searchIndex, typeFilter, limit);
      }

      const ranked: RankedNote[] = [];
      for (const [notePath, noteData] of Object.entries(searchIndex.notes)) {
        if (typeFilter && noteData.type !== typeFilter) {
          continue;
        }

        const score = this.calculateRelevanceScore(noteData, searchTerms);
        if (score > 0) {
          ranked.push({ notePath, noteData, score });
        }
      }

      ranked.sort((a, b) => b.score - a.score);

      // Rank and limit first so only the returned notes are stat'ed.
      return await this.#toSearchResults(ranked.slice(0, limit), note =>
        this.generateSnippet(note.content, searchTerms)
      );
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : 'Unknown error';
      throw new Error(`Search failed: ${errorMessage}`);
    }
  }

  /**
   * Search notes using a regular expression, matched case-insensitively
   * against each note's content, title and tags.
   *
   * Scores: title match 10, content match 5, tag match 3 (summed).
   *
   * @throws Error prefixed with `Regex search failed:`; an uncompilable
   *   pattern yields `Regex search failed: Invalid regex pattern: ...`.
   */
  private async searchWithRegex(
    pattern: string,
    typeFilter: string | null,
    limit: number,
    searchIndex: SearchIndex
  ): Promise<SearchResult[]> {
    try {
      // Blank pattern: every note matches.
      if (!pattern || pattern.trim() === '') {
        return await this.#listAllNotes(searchIndex, typeFilter, limit);
      }

      let regex: RegExp;
      try {
        // No `g` flag: a global regex keeps `lastIndex` between `.test()`
        // calls, which made the title/tag tests start mid-string and miss.
        regex = new RegExp(pattern, 'i');
      } catch (regexError) {
        throw new Error(
          `Invalid regex pattern: ${regexError instanceof Error ? regexError.message : 'Unknown regex error'}`
        );
      }

      const ranked: RankedNote[] = [];
      for (const [notePath, noteData] of Object.entries(searchIndex.notes)) {
        if (typeFilter && noteData.type !== typeFilter) {
          continue;
        }

        const contentMatches = regex.test(noteData.content);
        const titleMatches = regex.test(noteData.title);
        const tagMatches = noteData.tags.some(tag => regex.test(tag));
        if (!contentMatches && !titleMatches && !tagMatches) {
          continue;
        }

        const score =
          (titleMatches ? 10 : 0) + (contentMatches ? 5 : 0) + (tagMatches ? 3 : 0);
        ranked.push({ notePath, noteData, score });
      }

      ranked.sort((a, b) => b.score - a.score);

      return await this.#toSearchResults(ranked.slice(0, limit), note =>
        this.generateRegexSnippet(note.content, regex)
      );
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : 'Unknown error';
      throw new Error(`Regex search failed: ${errorMessage}`);
    }
  }

  /**
   * List every note (respecting the type filter) with a score of 1, newest
   * `updated` timestamp first. Shared by the empty-query paths of both
   * text and regex search.
   */
  async #listAllNotes(
    searchIndex: SearchIndex,
    typeFilter: string | null,
    limit: number
  ): Promise<SearchResult[]> {
    const ranked: RankedNote[] = [];
    for (const [notePath, noteData] of Object.entries(searchIndex.notes)) {
      if (typeFilter && noteData.type !== typeFilter) {
        continue;
      }
      ranked.push({ notePath, noteData, score: 1 });
    }

    ranked.sort(
      (a, b) =>
        new Date(b.noteData.updated).getTime() - new Date(a.noteData.updated).getTime()
    );

    return this.#toSearchResults(ranked.slice(0, limit), note =>
      this.generateSnippet(note.content, [])
    );
  }

  /**
   * Turn ranked notes into full search results, preserving their order.
   * File stats are fetched in parallel.
   */
  async #toSearchResults(
    ranked: RankedNote[],
    makeSnippet: (note: SearchIndexEntry) => string
  ): Promise<SearchResult[]> {
    return Promise.all(
      ranked.map(async ({ notePath, noteData, score }): Promise<SearchResult> => {
        const stats = await this.getFileStats(notePath);
        return {
          id: this.pathToIdentifier(notePath),
          title: noteData.title,
          type: noteData.type,
          tags: noteData.tags,
          score,
          snippet: makeSnippet(noteData),
          lastUpdated: noteData.updated,
          filename: path.basename(notePath),
          path: notePath,
          created: stats.created,
          modified: stats.modified,
          size: stats.size,
          metadata: noteData.metadata
        };
      })
    );
  }

  /**
   * Generate a snippet around the first regex match: up to 50 characters of
   * context on each side, with `...` marking truncated ends. Falls back to
   * the first 200 characters when the regex does not match the content.
   */
  private generateRegexSnippet(content: string, regex: RegExp): string {
    const maxSnippetLength = 200;
    const contextLength = 50;

    // Harmless for non-global regexes; required if a global/sticky one is passed.
    regex.lastIndex = 0;
    const match = regex.exec(content);

    if (!match) {
      return (
        content.substring(0, maxSnippetLength) +
        (content.length > maxSnippetLength ? '...' : '')
      );
    }

    const matchStart = match.index;
    const matchEnd = matchStart + match[0].length;
    const snippetStart = Math.max(0, matchStart - contextLength);
    const snippetEnd = Math.min(content.length, matchEnd + contextLength);

    let snippet = content.substring(snippetStart, snippetEnd);
    if (snippetStart > 0) {
      snippet = '...' + snippet;
    }
    if (snippetEnd < content.length) {
      snippet = snippet + '...';
    }
    return snippet;
  }

  /**
   * Load the search index from disk.
   *
   * If the index file does not exist a rebuild is attempted; if that also
   * fails, an empty index is returned. A blank file is treated as an empty
   * index. Other read or parse failures are rethrown.
   */
  async loadSearchIndex(): Promise<SearchIndex> {
    try {
      const indexContent = await this.#readIndexFileWithRetry(
        this.#workspace.searchIndexPath
      );
      return parseIndexFile(indexContent);
    } catch (error) {
      if (isMissingFileError(error)) {
        try {
          console.log('Search index missing, attempting to rebuild...');
          await this.rebuildSearchIndex();
          const indexContent = await fs.readFile(
            this.#workspace.searchIndexPath,
            'utf-8'
          );
          return parseIndexFile(indexContent);
        } catch (rebuildError) {
          console.error('Failed to rebuild search index:', rebuildError);
          // Best-effort fallback so searches return nothing instead of failing.
          return createEmptyIndex();
        }
      }
      throw error;
    }
  }

  /**
   * Calculate a relevance score for a note.
   *
   * Per term: +10 per occurrence in the title, +8 per tag containing the
   * term, +2 per occurrence in the content, +15 if the term is a whole word
   * of the title and +3 if it is a whole word of the content.
   *
   * @param searchTerms Terms to score; expected to be lowercase, as the tag
   *   and whole-word comparisons run against lowercased note text. Empty
   *   strings are ignored.
   */
  calculateRelevanceScore(noteData: SearchIndexEntry, searchTerms: string[]): number {
    const content = noteData.content.toLowerCase();
    const title = noteData.title.toLowerCase();
    const tags = noteData.tags.map(tag => tag.toLowerCase());

    // Split once, not once per term.
    const titleWords = new Set(title.split(/\s+/));
    const contentWords = new Set(content.split(/\s+/));

    let score = 0;
    for (const term of searchTerms) {
      if (term === '') {
        continue;
      }

      score += this.countOccurrences(title, term) * 10;
      score += tags.filter(tag => tag.includes(term)).length * 8;
      score += this.countOccurrences(content, term) * 2;

      if (titleWords.has(term)) {
        score += 15;
      }
      if (contentWords.has(term)) {
        score += 3;
      }
    }

    return score;
  }

  /**
   * Count non-overlapping, case-insensitive occurrences of `term` in `text`.
   * The term is matched literally. An empty term yields 0.
   */
  countOccurrences(text: string, term: string): number {
    if (term === '') {
      // An empty pattern would otherwise "match" at every position.
      return 0;
    }
    const matches = text.match(new RegExp(escapeRegExp(term), 'gi'));
    return matches ? matches.length : 0;
  }

  /**
   * Generate a snippet showing search-term context.
   *
   * Windows of `maxLength` characters are examined every 50 characters, plus
   * one final window flush with the end of the content; the earliest window
   * containing the most terms wins, defaulting to the start of the content.
   * Terms are wrapped in `**` and `...` is appended when text follows the
   * chosen window.
   *
   * @param searchTerms Terms to look for; expected to be lowercase.
   */
  generateSnippet(
    content: string,
    searchTerms: string[],
    maxLength: number = 200
  ): string {
    const windowStep = 50;
    const lastStart = Math.max(0, content.length - maxLength);

    let bestStart = 0;
    let bestCount = 0;
    const consider = (start: number): void => {
      const slice = content.substring(start, start + maxLength).toLowerCase();
      const count = searchTerms.filter(term => slice.includes(term)).length;
      // Strictly greater, so the earliest of equally good windows is kept.
      if (count > bestCount) {
        bestCount = count;
        bestStart = start;
      }
    };

    if (searchTerms.length > 0) {
      for (let start = 0; start < lastStart; start += windowStep) {
        consider(start);
      }
      // The stepped scan can stop short of the end; cover the tail explicitly.
      consider(lastStart);
    }

    const windowEnd = bestStart + maxLength;
    let snippet = content.substring(bestStart, windowEnd).trim();

    // Highlight in one pass (longest term first) so inserted `**` markers and
    // already-highlighted text are never re-matched by a later term.
    const alternatives = [...new Set(searchTerms)]
      .filter(term => term.length > 0)
      .sort((a, b) => b.length - a.length)
      .map(escapeRegExp);
    if (alternatives.length > 0) {
      snippet = snippet.replace(new RegExp(`(${alternatives.join('|')})`, 'gi'), '**$1**');
    }

    if (windowEnd < content.length) {
      snippet += '...';
    }

    return snippet;
  }

  /**
   * Get creation time, modification time and size for a note file.
   * If `stat` fails, the current time and a size of 0 are returned instead
   * of throwing.
   */
  private async getFileStats(notePath: string): Promise<{
    created: string;
    modified: string;
    size: number;
  }> {
    try {
      const stats = await fs.stat(notePath);
      return {
        created: stats.birthtime.toISOString(),
        modified: stats.mtime.toISOString(),
        size: stats.size
      };
    } catch {
      const now = new Date().toISOString();
      return { created: now, modified: now, size: 0 };
    }
  }

  /**
   * Convert a file path to a note identifier of the form
   * `<first directory under the workspace root>/<filename>`. Paths with fewer
   * than two segments are returned relative to the workspace root.
   */
  private pathToIdentifier(notePath: string): string {
    const relativePath = path.relative(this.#workspace.rootPath, notePath);
    const parts = relativePath.split(path.sep);

    if (parts.length >= 2) {
      const type = parts[0];
      const filename = parts[parts.length - 1];
      return `${type}/${filename}`;
    }

    return relativePath;
  }

  /**
   * Search notes by tags (case-insensitive).
   *
   * @param tags Tags to look for.
   * @param matchAll When true every tag must be present; otherwise one suffices.
   * @returns Matching notes, most recently updated first.
   * @throws Error prefixed with `Tag search failed:`.
   */
  async searchByTags(
    tags: string[],
    matchAll: boolean = false
  ): Promise<TagSearchResult[]> {
    try {
      const searchIndex = await this.loadSearchIndex();
      const wantedTags = tags.map(tag => tag.toLowerCase());
      const results: TagSearchResult[] = [];

      for (const [notePath, noteData] of Object.entries(searchIndex.notes)) {
        const noteTags = noteData.tags.map(tag => tag.toLowerCase());
        const isPresent = (tag: string): boolean => noteTags.includes(tag);
        const matches = matchAll ? wantedTags.every(isPresent) : wantedTags.some(isPresent);

        if (matches) {
          results.push({
            id: this.pathToIdentifier(notePath),
            title: noteData.title,
            type: noteData.type,
            tags: noteData.tags,
            lastUpdated: noteData.updated
          });
        }
      }

      results.sort(
        (a, b) => new Date(b.lastUpdated).getTime() - new Date(a.lastUpdated).getTime()
      );

      return results;
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : 'Unknown error';
      throw new Error(`Tag search failed: ${errorMessage}`);
    }
  }

  /**
   * Get all unique tags with the number of notes using each, most frequent first.
   *
   * @throws Error prefixed with `Failed to get tags:`.
   */
  async getAllTags(): Promise<TagInfo[]> {
    try {
      const searchIndex = await this.loadSearchIndex();

      // A Map keeps tags such as "constructor" from colliding with
      // properties inherited from Object.prototype.
      const tagCounts = new Map<string, number>();
      for (const noteData of Object.values(searchIndex.notes)) {
        for (const tag of noteData.tags) {
          tagCounts.set(tag, (tagCounts.get(tag) ?? 0) + 1);
        }
      }

      return [...tagCounts]
        .map(([tag, count]) => ({ tag, count }))
        .sort((a, b) => b.count - a.count);
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : 'Unknown error';
      throw new Error(`Failed to get tags: ${errorMessage}`);
    }
  }

  /**
   * Find notes whose word-frequency profile is similar to the given note.
   * Only notes with similarity above 0.1 are returned, most similar first.
   *
   * @throws Error prefixed with `Similar notes search failed:`, including
   *   when the note is not present in the index.
   */
  async findSimilarNotes(
    noteIdentifier: string,
    limit: number = 5
  ): Promise<SimilarNoteResult[]> {
    try {
      const searchIndex = await this.loadSearchIndex();
      const targetPath = this.identifierToPath(noteIdentifier);
      const targetNote = searchIndex.notes[targetPath];

      if (!targetNote) {
        throw new Error(`Note '${noteIdentifier}' not found in search index`);
      }

      const targetWords = this.extractWords(targetNote.content);
      const results: SimilarNoteResult[] = [];

      for (const [notePath, noteData] of Object.entries(searchIndex.notes)) {
        if (notePath === targetPath) {
          continue; // never report the note as similar to itself
        }

        const similarity = this.calculateSimilarity(
          targetWords,
          this.extractWords(noteData.content)
        );

        if (similarity > 0.1) {
          results.push({
            id: this.pathToIdentifier(notePath),
            title: noteData.title,
            type: noteData.type,
            tags: noteData.tags,
            similarity,
            lastUpdated: noteData.updated
          });
        }
      }

      results.sort((a, b) => b.similarity - a.similarity);
      return results.slice(0, limit);
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : 'Unknown error';
      throw new Error(`Similar notes search failed: ${errorMessage}`);
    }
  }

  /**
   * Build a word-frequency map from content. Text is lowercased, characters
   * other than word characters and whitespace become spaces, and words of
   * two characters or fewer are dropped.
   */
  extractWords(content: string): Record<string, number> {
    // Count in a Map so words like "constructor" start from 0 rather than
    // from an inherited Object.prototype member.
    const counts = new Map<string, number>();
    const words = content
      .toLowerCase()
      .replace(/[^\w\s]/g, ' ')
      .split(/\s+/);

    for (const word of words) {
      if (word.length > 2) {
        counts.set(word, (counts.get(word) ?? 0) + 1);
      }
    }

    // fromEntries defines own data properties, so even "__proto__" is stored.
    return Object.fromEntries(counts);
  }

  /**
   * Cosine similarity between two word-frequency maps.
   * Returns 0 when either map has no words.
   */
  calculateSimilarity(
    words1: Record<string, number>,
    words2: Record<string, number>
  ): number {
    let dotProduct = 0;
    let norm1 = 0;
    let norm2 = 0;

    for (const word of Object.keys(words1)) {
      const freq1 = ownCount(words1, word);
      norm1 += freq1 * freq1;
      // Own-property read: a word missing from words2 must count as 0 even
      // if Object.prototype has a member of that name.
      dotProduct += freq1 * ownCount(words2, word);
    }

    for (const word of Object.keys(words2)) {
      const freq2 = ownCount(words2, word);
      norm2 += freq2 * freq2;
    }

    if (norm1 === 0 || norm2 === 0) {
      return 0;
    }

    return dotProduct / (Math.sqrt(norm1) * Math.sqrt(norm2));
  }

  /**
   * Convert a note identifier to a file path under the workspace root.
   *
   * `type/name` maps to `<root>/type/name`. A bare name is placed in the
   * configured `default_note_type` directory (falling back to `general`)
   * with `.md` appended when missing.
   */
  identifierToPath(identifier: string): string {
    if (identifier.includes('/')) {
      const [type = '', ...rest] = identifier.split('/');
      return path.join(this.#workspace.rootPath, type, rest.join('/'));
    }

    const config = this.#workspace.getConfig();
    const defaultType = config?.default_note_type || 'general';
    const filename = identifier.endsWith('.md') ? identifier : `${identifier}.md`;
    return path.join(this.#workspace.rootPath, defaultType, filename);
  }

  /**
   * Rebuild the entire search index from the `.md` files found one level
   * below the workspace root (hidden directories and `node_modules` are
   * skipped).
   *
   * Entries are built the same way as in `updateNoteInIndex`, and each
   * note's `updated` timestamp is taken from the file's modification time.
   * Files that cannot be read or parsed are skipped.
   *
   * @throws Error prefixed with `Failed to rebuild search index:`.
   */
  async rebuildSearchIndex(): Promise<RebuildResult> {
    return this.#withIndexLock(async () => {
      try {
        const index = createEmptyIndex();
        const workspaceRoot = this.#workspace.rootPath;
        const entries = await fs.readdir(workspaceRoot, { withFileTypes: true });

        for (const entry of entries) {
          if (
            !entry.isDirectory() ||
            entry.name.startsWith('.') ||
            entry.name === 'node_modules'
          ) {
            continue;
          }

          const typePath = path.join(workspaceRoot, entry.name);
          const typeEntries = await fs.readdir(typePath);

          for (const filename of typeEntries) {
            if (!filename.endsWith('.md') || filename.startsWith('.')) {
              continue;
            }

            const notePath = path.join(typePath, filename);
            try {
              const [content, stats] = await Promise.all([
                fs.readFile(notePath, 'utf-8'),
                fs.stat(notePath)
              ]);
              index.notes[notePath] = this.#buildIndexEntry(
                notePath,
                content,
                stats.mtime.toISOString()
              );
            } catch {
              // Skip files that can't be read or parsed.
              continue;
            }
          }
        }

        await this.#writeIndexFileWithRetry(this.#workspace.searchIndexPath, index);

        return {
          indexedNotes: Object.keys(index.notes).length,
          timestamp: index.last_updated
        };
      } catch (error) {
        const errorMessage = error instanceof Error ? error.message : 'Unknown error';
        throw new Error(`Failed to rebuild search index: ${errorMessage}`);
      }
    });
  }

  /**
   * Build the index entry for one note.
   *
   * The searchable content is the frontmatter title, the note body and the
   * tags joined by spaces. Title falls back to one derived from the
   * filename, and type falls back to the name of the containing directory.
   */
  #buildIndexEntry(notePath: string, content: string, updated: string): SearchIndexEntry {
    const parsed = this.parseNoteContent(content);
    const tags = normalizeTags(parsed.metadata.tags);

    return {
      content: [parsed.metadata.title || '', parsed.content, tags.join(' ')].join(' '),
      title:
        parsed.metadata.title || this.extractTitleFromFilename(path.basename(notePath)),
      type: parsed.metadata.type || path.basename(path.dirname(notePath)),
      tags,
      updated,
      metadata: parsed.metadata
    };
  }

  /**
   * Read the index file, retrying when it cannot be read or does not parse
   * as JSON. A missing file (`ENOENT`) is rethrown immediately; other errors
   * are retried after 10 ms, 20 ms, ... and rethrown on the last attempt.
   *
   * @returns The raw file content (possibly blank).
   */
  async #readIndexFileWithRetry(
    indexPath: string,
    maxRetries: number = 3
  ): Promise<string> {
    for (let attempt = 0; attempt < maxRetries; attempt++) {
      try {
        const content = await fs.readFile(indexPath, 'utf-8');
        // Validate JSON by parsing it; a blank file is passed through as-is.
        if (content.trim()) {
          JSON.parse(content);
        }
        return content;
      } catch (error) {
        if (isMissingFileError(error)) {
          throw error; // File doesn't exist, don't retry
        }
        if (attempt === maxRetries - 1) {
          throw error; // Last attempt, give up
        }
        await new Promise(resolve => setTimeout(resolve, 10 * (attempt + 1)));
      }
    }
    // Only reached when maxRetries <= 0.
    return '';
  }

  /**
   * Write the index by first writing a uniquely named temporary file next to
   * the target and then renaming it over the target, so readers never see a
   * partially written index. The temporary file is removed if anything fails.
   */
  async #writeIndexFileWithRetry(indexPath: string, index: SearchIndex): Promise<void> {
    const uniqueSuffix = `${Date.now()}.${Math.random().toString(36).slice(2, 11)}`;
    const tempPath = `${indexPath}.tmp.${uniqueSuffix}`;
    const content = JSON.stringify(index, null, 2);

    try {
      await fs.mkdir(path.dirname(indexPath), { recursive: true });
      await fs.writeFile(tempPath, content, 'utf-8');
      await fs.rename(tempPath, indexPath);
    } catch (error) {
      try {
        await fs.unlink(tempPath);
      } catch {
        // Ignore cleanup errors
      }
      throw error;
    }
  }

  /**
   * Run `fn` with exclusive access to the search index.
   *
   * Callers are queued on a static promise chain: each call waits for the
   * previous holder to finish and releases the next one in `finally`, so a
   * failing `fn` does not block later callers.
   */
  async #withIndexLock<T>(fn: () => Promise<T>): Promise<T> {
    const previousLock = SearchManager.#globalIndexLock;

    // The executor runs synchronously, so `release` is set before use.
    let release: () => void = () => undefined;
    SearchManager.#globalIndexLock = new Promise<void>(resolve => {
      release = resolve;
    });

    try {
      await previousLock;
      return await fn();
    } finally {
      release();
    }
  }

  /**
   * Add or replace a single note in the search index. Runs under the index
   * lock. If the existing index is missing or cannot be loaded, a fresh
   * index containing only this note is written.
   *
   * @throws Error prefixed with `Failed to update search index:`.
   */
  async updateNoteInIndex(notePath: string, content: string): Promise<void> {
    return this.#withIndexLock(async () => {
      try {
        const indexPath = this.#workspace.searchIndexPath;
        let index = createEmptyIndex();

        try {
          index = parseIndexFile(await this.#readIndexFileWithRetry(indexPath));
        } catch (error) {
          if (isMissingFileError(error)) {
            await fs.mkdir(path.dirname(indexPath), { recursive: true });
          } else {
            console.warn('Failed to load search index, using default:', error);
          }
        }

        const now = new Date().toISOString();
        index.notes[notePath] = this.#buildIndexEntry(notePath, content, now);
        index.last_updated = now;

        await this.#writeIndexFileWithRetry(indexPath, index);
      } catch (error) {
        const errorMessage = error instanceof Error ? error.message : 'Unknown error';
        throw new Error(`Failed to update search index: ${errorMessage}`);
      }
    });
  }

  /**
   * Remove a note from the search index. Runs under the index lock.
   * A missing or blank index file is left untouched.
   *
   * @throws Error prefixed with `Failed to remove from search index:`.
   */
  async removeNoteFromIndex(notePath: string): Promise<void> {
    return this.#withIndexLock(async () => {
      try {
        const indexPath = this.#workspace.searchIndexPath;

        let indexContent: string;
        try {
          indexContent = await this.#readIndexFileWithRetry(indexPath);
        } catch (error) {
          if (isMissingFileError(error)) {
            return; // Index doesn't exist, nothing to remove
          }
          throw error;
        }

        if (!indexContent.trim()) {
          return; // Empty index, nothing to remove
        }

        const index = parseIndexFile(indexContent);
        delete index.notes[notePath];
        index.last_updated = new Date().toISOString();

        await this.#writeIndexFileWithRetry(indexPath, index);
      } catch (error) {
        const errorMessage = error instanceof Error ? error.message : 'Unknown error';
        throw new Error(`Failed to remove from search index: ${errorMessage}`);
      }
    });
  }

  /**
   * Parse note content into metadata and body by delegating to the shared
   * yaml-parser utility (called with `false` as its second argument).
   */
  parseNoteContent(content: string): ParsedNote {
    return parseNoteContent(content, false);
  }

  /**
   * Parse a YAML frontmatter string by delegating to the shared yaml-parser
   * utility (called with `false` as its second argument).
   */
  parseFrontmatter(frontmatter: string): NoteMetadata {
    return parseFrontmatter(frontmatter, false);
  }

  /**
   * Derive a display title from a filename: strip a trailing `.md`, turn
   * hyphens into spaces and upper-case the first character of each
   * whitespace-separated word.
   */
  extractTitleFromFilename(filename: string): string {
    return (
      filename
        .replace(/\.md$/, '')
        .replace(/-/g, ' ')
        // Anchor on whitespace rather than `\b`, which also fires after
        // apostrophes and non-ASCII letters ("don't" -> "Don'T").
        .replace(
          /(^|\s)(\S)/g,
          (_match, lead: string, first: string) => lead + first.toUpperCase()
        )
    );
  }
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/disnet/flint-note'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

search.ts•27.8 KiB