search.ts•8.52 kB
import { spawn, ChildProcess } from 'child_process';
import path from 'path';
import fs from 'fs/promises';
import { validatePath } from './filesystem.js';
import { rgPath } from '@vscode/ripgrep';
import {capture} from "../utils/capture.js";
// Type definition for search results
export interface SearchResult {
  file: string;
  line: number;
  match: string;
}
// Function to search file contents using ripgrep
export async function searchCode(options: {
  rootPath: string,        // Directory to search in
  pattern: string,         // Text/regex pattern to search for
  filePattern?: string,    // Optional file pattern (e.g., "*.ts")
  ignoreCase?: boolean,    // Case insensitive search
  maxResults?: number,     // Limit number of results
  includeHidden?: boolean, // Whether to include hidden files
  contextLines?: number,   // Number of context lines before and after matches
}): Promise<SearchResult[]> {
  const { 
    rootPath, 
    pattern, 
    filePattern, 
    ignoreCase = true, 
    maxResults = 1000, 
    includeHidden = false,
    contextLines = 0
  } = options;
  
  // Validate path for security
  const validPath = await validatePath(rootPath);
  
  // Build command arguments
  const args = [
    '--json',  // Output in JSON format for easier parsing
    '--line-number', // Include line numbers
  ];
  
  if (ignoreCase) {
    args.push('-i');
  }
  
  if (maxResults) {
    args.push('-m', maxResults.toString());
  }
  
  if (includeHidden) {
    args.push('--hidden');
  }
  
  if (contextLines > 0) {
    args.push('-C', contextLines.toString());
  }
  
  if (filePattern) {
    const patterns = filePattern
      .split('|')
      .map(p => p.trim())      // remove surrounding spaces
      .filter(Boolean);        // drop empty tokens
    
    // If all patterns were empty, return no results
    if (patterns.length === 0) {
      return [];
    }
    
    patterns.forEach(p => args.push('-g', p));
  }
  
  // Add pattern and path
  args.push(pattern, validPath);
  
  // Run ripgrep command
  return new Promise((resolve, reject) => {
    const results: SearchResult[] = [];
    const rg = spawn(rgPath, args);
    let stdoutBuffer = '';
    
    // Store a reference to the child process for potential termination
    const childProcess: ChildProcess = rg;
    
    // Store in a process list - this could be expanded to a global registry
    // of running search processes if needed for management
    (globalThis as any).currentSearchProcess = childProcess;
    
    rg.stdout.on('data', (data) => {
      stdoutBuffer += data.toString();
    });
    
    rg.stderr.on('data', (data) => {
      console.error(`ripgrep error: ${data}`);
    });
    
    rg.on('close', (code) => {
      // Clean up the global reference
      if ((globalThis as any).currentSearchProcess === childProcess) {
        delete (globalThis as any).currentSearchProcess;
      }
      
      if (code === 0 || code === 1) {
        // Process the buffered output
        const lines = stdoutBuffer.trim().split('\n');
        for (const line of lines) {
          if (!line) continue;
          try {
            const result = JSON.parse(line);
            if (result.type === 'match') {
              result.data.submatches.forEach((submatch: any) => {
                results.push({
                  file: result.data.path.text,
                  line: result.data.line_number,
                  match: submatch.match.text
                });
              });
            }
            else if (result.type === 'context' && contextLines > 0) {
              results.push({
                file: result.data.path.text,
                line: result.data.line_number,
                match: result.data.lines.text.trim()
              });
            }
          } catch (error) {
            const errorMessage = error instanceof Error ? error.message : String(error);
            capture('server_request_error', {error: `Error parsing ripgrep output: ${errorMessage}`});
            console.error(`Error parsing ripgrep output: ${errorMessage}`);    
          }
        }
        resolve(results);
      } else {
        reject(new Error(`ripgrep process exited with code ${code}`));
      }
    });
  });
}
// Fallback implementation using Node.js for environments without ripgrep
export async function searchCodeFallback(options: {
  rootPath: string,
  pattern: string,
  filePattern?: string,
  ignoreCase?: boolean,
  maxResults?: number,
  excludeDirs?: string[],
  contextLines?: number,
}): Promise<SearchResult[]> {
  const { 
    rootPath, 
    pattern, 
    filePattern, 
    ignoreCase = true, 
    maxResults = 1000,
    excludeDirs = ['node_modules', '.git'],
    contextLines = 0
  } = options;
  
  const validPath = await validatePath(rootPath);
  const results: SearchResult[] = [];
  const regex = new RegExp(pattern, ignoreCase ? 'i' : '');
  
  // Handle filePattern similarly to main implementation
  let fileRegex: RegExp | null = null;
  if (filePattern) {
    const patterns = filePattern
      .split('|')
      .map(p => p.trim())
      .filter(Boolean);
    
    // If all patterns were empty, return no results
    if (patterns.length === 0) {
      return [];
    }
    
    // Create a regex that matches any of the patterns
    const combinedPattern = patterns.map(p => 
      p.replace(/\./g, '\\.').replace(/\*/g, '.*').replace(/\?/g, '.')
    ).join('|');
    fileRegex = new RegExp(`^(${combinedPattern})$`);
  }
  
  async function searchDir(dirPath: string) {
    if (results.length >= maxResults) return;
    
    try {
      const entries = await fs.readdir(dirPath, { withFileTypes: true });
      
      for (const entry of entries) {
        if (results.length >= maxResults) break;
        
        const fullPath = path.join(dirPath, entry.name);
        
        try {
          await validatePath(fullPath);
          
          if (entry.isDirectory()) {
            if (!excludeDirs.includes(entry.name)) {
              await searchDir(fullPath);
            }
          } else if (entry.isFile()) {
            if (!fileRegex || fileRegex.test(entry.name)) {
              const content = await fs.readFile(fullPath, 'utf-8');
              const lines = content.split('\n');
              
              for (let i = 0; i < lines.length; i++) {
                if (regex.test(lines[i])) {
                  // Add the matched line
                  results.push({
                    file: fullPath,
                    line: i + 1,
                    match: lines[i].trim()
                  });
                  
                  // Add context lines
                  if (contextLines > 0) {
                    const startIdx = Math.max(0, i - contextLines);
                    const endIdx = Math.min(lines.length - 1, i + contextLines);
                    
                    for (let j = startIdx; j <= endIdx; j++) {
                      if (j !== i) { // Skip the match line as it's already added
                        results.push({
                          file: fullPath,
                          line: j + 1,
                          match: lines[j].trim()
                        });
                      }
                    }
                  }
                  
                  if (results.length >= maxResults) break;
                }
              }
            }
          }
        } catch (error) {
          // Skip files/directories we can't access
          continue;
        }
      }
    } catch (error) {
      // Skip directories we can't read
    }
  }
  
  await searchDir(validPath);
  return results;
}
// Main function that tries ripgrep first, falls back to native implementation
export async function searchTextInFiles(options: {
  rootPath: string,
  pattern: string,
  filePattern?: string,
  ignoreCase?: boolean,
  maxResults?: number,
  includeHidden?: boolean,
  contextLines?: number,
}): Promise<SearchResult[]> {
  try {
    // For better performance and consistency, prefer the search session manager
    // when doing content search, but keep the original direct ripgrep approach as primary
    return await searchCode(options);
  } catch (error) {
    capture('searchTextInFiles_ripgrep_fallback', {
      error: error instanceof Error ? error.message : 'Unknown error'
    });
    // Use consistent exclusions - remove 'dist' to match ripgrep behavior
    return searchCodeFallback({
      ...options,
      excludeDirs: ['node_modules', '.git']
    });
  }
}