gerbil-mcp

Overview Schema Related Servers Score Discussions

lint.ts•47.2 KiB

import { McpServer } from '@modelcontextprotocol/sdk/server/mcp.js'; import { z } from 'zod'; import { readFile } from 'node:fs/promises'; import { runGxc } from '../gxi.js'; import { parseDefinitions, parseGxcErrors, extractModulePaths, type FileAnalysis, } from './parse-utils.js'; interface LintDiagnostic { line: number | null; severity: 'error' | 'warning' | 'info'; code: string; message: string; } const COMMON_STDLIB = new Set([ 'map', 'filter', 'fold', 'for-each', 'apply', 'append', 'cons', 'car', 'cdr', 'list', 'length', 'reverse', 'sort', 'display', 'displayln', 'write', 'read', 'string-append', 'number->string', 'string->number', 'not', 'error', 'raise', 'values', 'call-with-values', 'void', 'begin', 'hash', 'vector', 'string', 'number?', 'string?', 'pair?', 'null?', 'boolean?', 'symbol?', 'vector?', 'procedure?', 'equal?', 'eq?', 'eqv?', ]); export function registerLintTool(server: McpServer): void { server.registerTool( 'gerbil_lint', { title: 'Basic Linting', description: 'Static analysis for common Gerbil issues: unused imports, duplicate definitions, ' + 'style warnings (define vs def, missing transparent:), shadowed standard bindings, ' + 'hash literal symbol key warnings, channel anti-patterns (spinning try-get, ' + 'wg-wait visibility gaps), pitfall detection (unquote outside quasiquote, ' + 'dot in brackets, missing exported definitions, re-export awareness), ' + 'SRFI-19 time->seconds shadow, unsafe mutex-lock!/unlock! without unwind-protect, ' + 'byte/char port type mismatch (fdopen with char I/O), ' + 'pregexp inline flag detection ((?i)/(?m)/(?s) cause runtime crashes), ' + 'char/byte I/O mixing on same port (nonempty-input-port-character-buffer-exception), ' + 'macro suggestions (awhen, if-let, let-hash for verbose patterns), ' + 'and compilation errors via gxc.', annotations: { readOnlyHint: true, idempotentHint: true, }, inputSchema: { file_path: z .string() .describe('Absolute path to a Gerbil source file to lint'), }, }, async ({ file_path }) => { let content: string; try { content = await readFile(file_path, 'utf-8'); } catch (err) { const msg = err instanceof Error ? err.message : 'Unknown error'; return { content: [ { type: 'text' as const, text: `Failed to read file: ${msg}` }, ], isError: true, }; } const diagnostics: LintDiagnostic[] = []; const analysis = parseDefinitions(content); const lines = content.split('\n'); checkUnusedImports(content, analysis, diagnostics); checkDuplicateDefinitions(analysis, diagnostics); checkStyleIssues(lines, diagnostics); checkShadowedBindings(analysis, diagnostics); checkHashLiteralKeys(lines, diagnostics); checkChannelPatterns(lines, diagnostics); checkUnquoteOutsideQuasiquote(lines, diagnostics); checkDotInBrackets(lines, diagnostics); checkMissingExportedDefinitions(analysis, diagnostics); checkSrfi19TimeShadow(content, analysis, diagnostics); checkUnsafeMutexPattern(lines, diagnostics); checkPortTypeMismatch(lines, diagnostics); checkPregexpInlineFlags(lines, diagnostics); checkCharByteIOMixing(lines, diagnostics); checkMacroSuggestions(lines, diagnostics); checkKeywordPositionalMismatch(content, analysis, diagnostics); checkQtCallbackArity(lines, diagnostics); // Compile check via gxc const compileResult = await runGxc(file_path, { timeout: 30_000 }); if ( compileResult.exitCode !== 0 && compileResult.exitCode !== 127 && !compileResult.timedOut ) { const gxcDiags = parseGxcErrors(compileResult.stderr, file_path); for (const d of gxcDiags) { diagnostics.push({ line: d.line, severity: d.severity, code: 'compile-error', message: d.message, }); } } if (diagnostics.length === 0) { return { content: [ { type: 'text' as const, text: `No issues found in ${file_path}.`, }, ], }; } // Sort: errors first, then warnings, then info; within severity by line const sevOrder: Record<string, number> = { error: 0, warning: 1, info: 2, }; diagnostics.sort((a, b) => { const sa = sevOrder[a.severity] ?? 3; const sb = sevOrder[b.severity] ?? 3; if (sa !== sb) return sa - sb; return (a.line ?? 0) - (b.line ?? 0); }); const errors = diagnostics.filter((d) => d.severity === 'error'); const warnings = diagnostics.filter((d) => d.severity === 'warning'); const infos = diagnostics.filter((d) => d.severity === 'info'); const sections: string[] = [ `Lint: ${file_path}`, ` ${errors.length} error(s), ${warnings.length} warning(s), ${infos.length} info`, '', ]; for (const d of diagnostics) { const loc = d.line ? `L${d.line}` : '---'; sections.push( ` [${d.severity.toUpperCase()}] ${loc} (${d.code}): ${d.message}`, ); } return { content: [{ type: 'text' as const, text: sections.join('\n') }], isError: errors.length > 0, }; }, ); } function checkUnusedImports( content: string, analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { const contentLines = content.split('\n'); for (const imp of analysis.imports) { const modPaths = extractModulePaths(imp.raw); for (const modPath of modPaths) { // Skip relative imports — harder to check if (modPath.startsWith('./')) continue; const lastSeg = modPath.split('/').pop() || ''; if (!lastSeg) continue; // Check if the module's last segment or full path appears after the import line const afterImport = contentLines.slice(imp.line).join('\n'); if (!afterImport.includes(lastSeg) && !afterImport.includes(modPath)) { diagnostics.push({ line: imp.line, severity: 'warning', code: 'possibly-unused-import', message: `Import ${modPath} may be unused`, }); } } } } function checkDuplicateDefinitions( analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { const seen = new Map<string, number>(); for (const def of analysis.definitions) { if (seen.has(def.name)) { diagnostics.push({ line: def.line, severity: 'warning', code: 'duplicate-definition', message: `"${def.name}" already defined at line ${seen.get(def.name)}`, }); } else { seen.set(def.name, def.line); } } } function checkStyleIssues( lines: string[], diagnostics: LintDiagnostic[], ): void { for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; // Prefer def over define if (trimmed.startsWith('(define ') && !trimmed.startsWith('(define-')) { diagnostics.push({ line: lineNum, severity: 'info', code: 'style-prefer-def', message: 'Prefer "def" over "define" (supports optional/keyword args)', }); } // defstruct without transparent: if (trimmed.startsWith('(defstruct ') && !trimmed.includes('transparent:')) { const lookAhead = lines .slice(i, Math.min(i + 5, lines.length)) .join(' '); if (!lookAhead.includes('transparent:')) { diagnostics.push({ line: lineNum, severity: 'info', code: 'style-missing-transparent', message: 'Consider adding transparent: #t to defstruct for debugging/printing', }); } } } } function checkShadowedBindings( analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { for (const def of analysis.definitions) { if (COMMON_STDLIB.has(def.name)) { diagnostics.push({ line: def.line, severity: 'warning', code: 'shadowed-binding', message: `"${def.name}" shadows a common standard binding`, }); } } } function extractFormFromLines(lines: string[], startIdx: number): string { let depth = 0; let result = ''; for (let i = startIdx; i < lines.length; i++) { const line = lines[i]; result += (i > startIdx ? '\n' : '') + line; for (const ch of line) { if (ch === '(' || ch === '[') depth++; else if (ch === ')' || ch === ']') depth--; } if (depth <= 0 && result.includes('(')) break; } return result; } /** * Extract top-level entries from a (hash ...) form. * Returns the key token of each (key value) pair at depth 1. */ function extractHashEntries(form: string): string[] { const keys: string[] = []; // Skip past the opening "(hash" prefix const start = form.indexOf('(hash'); if (start === -1) return keys; let pos = start + 5; // skip "(hash" const len = form.length; while (pos < len) { const ch = form[pos]; // Skip whitespace if (/\s/.test(ch)) { pos++; continue; } // End of hash form if (ch === ')') break; // Start of an entry: (key value) if (ch === '(') { pos++; // skip '(' // Skip whitespace before key while (pos < len && /\s/.test(form[pos])) pos++; // Read the key token const keyStart = pos; while (pos < len && !/[\s()]/.test(form[pos])) pos++; const key = form.slice(keyStart, pos); if (key.length > 0) keys.push(key); // Skip the rest of this entry by tracking depth let depth = 1; while (pos < len && depth > 0) { if (form[pos] === '(' || form[pos] === '[') depth++; else if (form[pos] === ')' || form[pos] === ']') depth--; // Skip string literals to avoid counting parens inside them if (form[pos] === '"') { pos++; while (pos < len && form[pos] !== '"') { if (form[pos] === '\\') pos++; // skip escaped char pos++; } } pos++; } } else { // Skip any other token (shouldn't happen in well-formed hash) pos++; } } return keys; } /** * Check if a token looks like a bare identifier (symbol key) in a hash literal. * Returns false for strings, numbers, booleans, keywords, and characters. */ function isBareIdentifier(token: string): boolean { if (token.length === 0) return false; // String literal if (token.startsWith('"')) return false; // Number (including negative) if (/^-?[0-9]/.test(token)) return false; // Boolean if (token === '#t' || token === '#f') return false; // Keyword (ends with colon) if (token.endsWith(':')) return false; // Character literal if (token.startsWith('#\\')) return false; // Quoted symbol if (token.startsWith("'")) return false; return true; } function checkHashLiteralKeys( lines: string[], diagnostics: LintDiagnostic[], ): void { for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; // Match (hash ...) but not (hash-eq ...), (hash-eqv ...), (hash-ref ...), etc. if (!trimmed.match(/^\(hash[\s\n)]/)) continue; // Extract the full form spanning multiple lines const form = extractFormFromLines(lines, i); // Extract entry keys and check for bare identifiers const keys = extractHashEntries(form); for (const key of keys) { if (isBareIdentifier(key)) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'hash-symbol-key', message: `Hash literal uses bare symbol key '${key}' — this creates a symbol key, not a string. ` + `Use ("${key}" ...) for string keys, or hash-eq for intentional symbol keys.`, }); } } } } /** * Check if a line index is inside a loop construct by scanning backward. * Stops at top-level definition boundaries (def, def*, defmethod, etc.). */ function isInsideLoop(lines: string[], targetIdx: number): boolean { const loopPattern = /\(\s*(while|until|do|for|for\/collect|for\/fold)\s/; const namedLetPattern = /\(\s*let\s+\S+\s+\(/; const defBoundary = /^\s*\(\s*(def\b|def\*|defmethod|defclass|defstruct)/; for (let i = targetIdx; i >= 0; i--) { const line = lines[i]; // Stop scanning at top-level definition boundaries if (defBoundary.test(line) && i < targetIdx) return false; if (loopPattern.test(line)) return true; if (namedLetPattern.test(line)) return true; } return false; } function checkChannelPatterns( lines: string[], diagnostics: LintDiagnostic[], ): void { const defBoundary = /^\s*\(\s*(def\b|def\*|defmethod|defclass|defstruct)/; for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; // Rule 1: channel-try-get inside a loop if (trimmed.includes('channel-try-get')) { if (isInsideLoop(lines, i)) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'channel-try-get-in-loop', message: 'channel-try-get inside a loop spins the CPU. ' + 'Use channel-get (blocking) or add a sleep/timeout.', }); } } // Rule 2: wg-wait! followed by channel-try-get if (trimmed.includes('wg-wait!')) { const lookAheadEnd = Math.min(i + 15, lines.length); for (let j = i + 1; j < lookAheadEnd; j++) { // Stop at definition boundaries if (defBoundary.test(lines[j])) break; if (lines[j].includes('channel-try-get')) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'wg-wait-then-try-get', message: 'wg-wait! followed by channel-try-get may miss values. ' + 'Workers may not have put to the channel yet when wg signals. ' + 'Use channel-get (blocking) or collect results before wg-wait!.', }); break; } } } } } /** * Detect `,expr` or `,@expr` that appear outside quasiquote context. * Scans for unquote (comma) at Scheme word boundaries, not inside strings, * and checks whether a quasiquote (backtick) is active in preceding lines. */ function checkUnquoteOutsideQuasiquote( lines: string[], diagnostics: LintDiagnostic[], ): void { // Track quasiquote depth across lines (heuristic: look for backtick starts) let qqDepth = 0; for (let i = 0; i < lines.length; i++) { const line = lines[i]; const lineNum = i + 1; const trimmed = line.trimStart(); // Skip comments if (trimmed.startsWith(';')) continue; // Track quasiquote nesting (simple heuristic) let inString = false; for (let j = 0; j < line.length; j++) { const ch = line[j]; // Skip string contents if (ch === '"' && (j === 0 || line[j - 1] !== '\\')) { inString = !inString; continue; } if (inString) continue; // Skip after semicolon (comment) if (ch === ';') break; if (ch === '`') { qqDepth++; } else if (ch === ',' && qqDepth > 0) { qqDepth--; } } // Reset at top-level forms (heuristic: line starts with `(`) if (trimmed.startsWith('(') && !trimmed.startsWith('(`') && qqDepth > 0) { // Check if this looks like a top-level definition if ( /^\((def\b|defstruct|defclass|defmethod|defrules?|defsyntax|export|import)/.test( trimmed, ) ) { qqDepth = 0; } } // Now check for commas that aren't inside quasiquote inString = false; for (let j = 0; j < line.length; j++) { const ch = line[j]; if (ch === '"' && (j === 0 || line[j - 1] !== '\\')) { inString = !inString; continue; } if (inString) continue; if (ch === ';') break; if (ch === ',') { // Check if preceded by a Scheme delimiter or start of line const leftOk = j === 0 || /[\s([\]{}'`]/.test(line[j - 1]); if (!leftOk) continue; // Check that something follows (not just whitespace to EOL) const rest = line.slice(j + 1).trimStart(); if (!rest || rest.startsWith(';')) continue; // Skip if it looks like it's a comma in a hash literal key-value form // e.g., (hash ("key" , value)) — this is unusual but not unquote // Actually, in Scheme `,` is always unquote syntax // Check if we're inside a quasiquote context by scanning backward let inQQ = false; // Scan backward on this line for backtick for (let k = j - 1; k >= 0; k--) { if (line[k] === '`') { inQQ = true; break; } } // Also check if a previous line's quasiquote is still open if (!inQQ && qqDepth <= 0) { // Scan back a few lines for an open quasiquote let foundQQ = false; for (let back = i - 1; back >= Math.max(0, i - 20); back--) { const prevLine = lines[back].trimStart(); if (prevLine.startsWith(';')) continue; if ( /^\((def\b|defstruct|defclass|defmethod|defrules?|defsyntax|export|import)/.test( prevLine, ) ) { break; // Hit a top-level form boundary } if (prevLine.includes('`')) { foundQQ = true; break; } } if (!foundQQ) { const snippet = line.slice(j, Math.min(j + 20, line.length)); diagnostics.push({ line: lineNum, severity: 'warning', code: 'unquote-outside-quasiquote', message: `Unquote "${snippet.trim()}" appears outside quasiquote context. ` + 'Did you mean to use a backtick ` template?', }); } } } } } } /** * Detect `. ` (dot-space) inside `[...]` constructs. * Gerbil's `[]` is list sugar, so `[a . b]` is almost always a mistake — * the user likely meant `(cons a b)` or `(a . b)` with parentheses. */ function checkDotInBrackets( lines: string[], diagnostics: LintDiagnostic[], ): void { for (let i = 0; i < lines.length; i++) { const line = lines[i]; const lineNum = i + 1; const trimmed = line.trimStart(); // Skip comments if (trimmed.startsWith(';')) continue; // Quick check: does this line contain both `[` and `. `? if (!line.includes('[') || !line.includes('. ')) continue; // Scan character by character tracking bracket depth and string state let inString = false; let bracketDepth = 0; for (let j = 0; j < line.length; j++) { const ch = line[j]; if (ch === '"' && (j === 0 || line[j - 1] !== '\\')) { inString = !inString; continue; } if (inString) continue; if (ch === ';') break; // Rest is comment if (ch === '[') { bracketDepth++; } else if (ch === ']') { bracketDepth--; } else if ( ch === '.' && bracketDepth > 0 && j + 1 < line.length && line[j + 1] === ' ' ) { // Check it's at a word boundary (not part of a symbol like `foo.bar`) const leftOk = j === 0 || /[\s([\]{}]/.test(line[j - 1]); if (leftOk) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'dot-in-brackets', message: 'Dotted pair inside [...] brackets. ' + 'Gerbil [] is list sugar, not cons syntax. ' + 'Use (a . b) with parentheses for dotted pairs, or [a b] for a list.', }); break; // One warning per line is enough } } } } } /** * Detect time->seconds usage in files that import :std/srfi/19. * SRFI-19's current-time shadows Gambit's current-time, but time->seconds * remains Gambit's version. Passing an SRFI-19 time object to Gambit's * time->seconds causes a runtime type error. This is invisible at compile * time and can cause cascading deadlocks if inside a mutex-protected section. */ function checkSrfi19TimeShadow( content: string, analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { // Check if file imports :std/srfi/19 const hasSrfi19 = analysis.imports.some((imp) => imp.raw.includes(':std/srfi/19'), ); if (!hasSrfi19) return; const lines = content.split('\n'); for (let i = 0; i < lines.length; i++) { const line = lines[i]; const lineNum = i + 1; const trimmed = line.trimStart(); // Skip comments and import lines if (trimmed.startsWith(';')) continue; if (trimmed.startsWith('(import ')) continue; // Check for time->seconds usage let searchFrom = 0; while (true) { const idx = line.indexOf('time->seconds', searchFrom); if (idx === -1) break; // Word boundary check const leftOk = idx === 0 || /[\s([\]{}'`,;]/.test(line[idx - 1]); const rightIdx = idx + 'time->seconds'.length; const rightOk = rightIdx >= line.length || /[\s)[\]{}'`,;]/.test(line[rightIdx]); if (leftOk && rightOk) { // Check it's not inside a string or comment const before = line.slice(0, idx); const inComment = before.includes(';'); const quoteCount = (before.match(/"/g) || []).length; const inString = quoteCount % 2 !== 0; if (!inComment && !inString) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'srfi19-time-seconds-shadow', message: 'time->seconds with :std/srfi/19 import is likely a bug. ' + "SRFI-19's current-time shadows Gambit's, but time->seconds remains " + "Gambit's version and will fail on SRFI-19 time objects. " + 'Use time-second for SRFI-19, or ##current-time for Gambit timing.', }); } } searchFrom = idx + 1; } } } /** * Detect mutex-lock!/mutex-unlock! pairs not wrapped in unwind-protect * or dynamic-wind. If an exception occurs between lock and unlock, the * mutex stays permanently locked, causing deadlocks for all subsequent callers. */ function checkUnsafeMutexPattern( lines: string[], diagnostics: LintDiagnostic[], ): void { const defBoundary = /^\s*\(\s*(def\b|def\*|defmethod|defclass|defstruct)/; for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; if (!trimmed.includes('mutex-lock!')) continue; // Check it's not inside a string or comment const before = trimmed.slice(0, trimmed.indexOf('mutex-lock!')); if (before.includes(';')) continue; const quoteCount = (before.match(/"/g) || []).length; if (quoteCount % 2 !== 0) continue; // Scan backward to check if we're inside an unwind-protect or dynamic-wind let protected_ = false; for (let j = i - 1; j >= Math.max(0, i - 30); j--) { const prev = lines[j].trimStart(); // Stop at definition boundaries if (defBoundary.test(prev) && j < i) break; if (prev.includes('unwind-protect') || prev.includes('dynamic-wind')) { protected_ = true; break; } } if (protected_) continue; // Scan forward for a matching mutex-unlock! in the same scope let hasUnlock = false; for (let j = i + 1; j < Math.min(lines.length, i + 30); j++) { if (defBoundary.test(lines[j])) break; if (lines[j].includes('mutex-unlock!')) { hasUnlock = true; break; } // Also check if unwind-protect appears after the lock (wrapping the body) if (lines[j].includes('unwind-protect') || lines[j].includes('dynamic-wind')) { protected_ = true; break; } } if (protected_) continue; if (hasUnlock) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'unsafe-mutex-pattern', message: 'mutex-lock!/mutex-unlock! without unwind-protect. ' + 'If an exception occurs between lock and unlock, the mutex stays permanently locked. ' + 'Wrap the body in (unwind-protect body (mutex-unlock! mx)).', }); } } } /** * Detect character I/O functions used with fdopen byte ports. * fdopen returns a byte (binary) port, but functions like display, displayln, * write, read-line etc. expect character ports. This mismatch causes subtle * encoding bugs or runtime errors. */ function checkPortTypeMismatch( lines: string[], diagnostics: LintDiagnostic[], ): void { const CHAR_IO_FUNCTIONS = new Set([ 'display', 'displayln', 'write', 'write-char', 'read-char', 'read-line', 'newline', 'print', 'println', 'pretty-print', 'write-string', 'read', ]); const defBoundary = /^\s*\(\s*(def\b|def\*|defmethod|defclass|defstruct)/; for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; if (!trimmed.includes('fdopen')) continue; // Check it's not inside a string or comment const fdIdx = trimmed.indexOf('fdopen'); const before = trimmed.slice(0, fdIdx); if (before.includes(';')) continue; const quoteCount = (before.match(/"/g) || []).length; if (quoteCount % 2 !== 0) continue; // Check same line for char I/O functions for (const fn of CHAR_IO_FUNCTIONS) { if (trimmed.includes(fn)) { const fnIdx = trimmed.indexOf(fn); // Verify word boundary const leftOk = fnIdx === 0 || /[\s([\]{}'`,;]/.test(trimmed[fnIdx - 1]); const rightIdx = fnIdx + fn.length; const rightOk = rightIdx >= trimmed.length || /[\s)[\]{}'`,;]/.test(trimmed[rightIdx]); if (leftOk && rightOk) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'port-type-mismatch', message: `"${fn}" used with fdopen byte port on same line. ` + 'fdopen returns a byte port, but character I/O functions expect a character port. ' + 'Use open-input-file/open-output-file for character I/O, or wrap with open-buffered-reader.', }); break; } } } // Try to extract bound variable name from (let ((VAR (fdopen ...))) or (def VAR (fdopen ...)) const letMatch = trimmed.match(/\(\s*(\S+)\s+\(fdopen\b/); const defMatch = trimmed.match(/^\(def\s+(\S+)\s+\(fdopen\b/); const varName = letMatch?.[1] || defMatch?.[1]; if (varName) { // Scan forward for char I/O functions used with this variable const lookAheadEnd = Math.min(i + 30, lines.length); for (let j = i + 1; j < lookAheadEnd; j++) { if (defBoundary.test(lines[j])) break; const fwdLine = lines[j].trimStart(); if (fwdLine.startsWith(';')) continue; for (const fn of CHAR_IO_FUNCTIONS) { if (fwdLine.includes(fn) && fwdLine.includes(varName)) { diagnostics.push({ line: j + 1, severity: 'warning', code: 'port-type-mismatch', message: `"${fn}" used with "${varName}" which is bound to an fdopen byte port (line ${lineNum}). ` + 'fdopen returns a byte port, but character I/O functions expect a character port.', }); break; } } } } } } /** * Check that all symbols listed in (export ...) forms are actually * defined in the file. Catches typos and forgotten definitions. * Aware of re-exports: if a symbol appears in an import statement's text, * it is likely being re-exported and should not be flagged. */ function checkMissingExportedDefinitions( analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { const definedNames = new Set(analysis.definitions.map((d) => d.name)); // Build a set of tokens that appear in import statements for re-export detection const importTokens = new Set<string>(); // Also track whether there are any bare module imports (could re-export anything) let hasBareModuleImports = false; for (const imp of analysis.imports) { // Extract all symbol-like tokens from raw import text const tokens = imp.raw.match(/[a-zA-Z_!?<>=+\-*/][a-zA-Z0-9_!?<>=+\-*/.:~#]*/g); if (tokens) { for (const t of tokens) { // Skip keywords like import, only-in, except-out, rename-in, etc. if (!['import', 'only-in', 'except-out', 'rename-in', 'rename-out', 'prefix-in', 'prefix-out', 'struct-out', 'group-in'].includes(t)) { importTokens.add(t); } } } // Detect bare module imports: (import :foo/bar) without only-in/except-out filters const modPaths = extractModulePaths(imp.raw); if (modPaths.length > 0 && !imp.raw.includes('only-in')) { hasBareModuleImports = true; } } for (const exp of analysis.exports) { const raw = exp.raw; // (export #t) — export everything, skip if (raw.includes('#t')) continue; // Strip outer (export ...) const inner = raw .replace(/^\s*$export\s+/, '') .replace(/$\s*$/, '') .trim(); if (!inner) continue; // Extract plain symbol tokens (skip sub-forms like (struct-out ...) etc.) let pos = 0; while (pos < inner.length) { while (pos < inner.length && /\s/.test(inner[pos])) pos++; if (pos >= inner.length) break; if (inner[pos] === '(') { // Skip sub-form let depth = 1; pos++; while (pos < inner.length && depth > 0) { if (inner[pos] === '(') depth++; else if (inner[pos] === ')') depth--; pos++; } } else { // Read plain symbol const start = pos; while (pos < inner.length && !/[\s()[\]{}]/.test(inner[pos])) pos++; const sym = inner.slice(start, pos); // Skip comment tokens (;;), booleans, and defined names if (sym.startsWith(';')) continue; if (sym && sym !== '#t' && sym !== '#f' && !definedNames.has(sym)) { // Check if symbol appears explicitly in imports (e.g. only-in) if (importTokens.has(sym)) continue; // If file has bare module imports, the symbol could be a re-export if (hasBareModuleImports) continue; diagnostics.push({ line: exp.line, severity: 'warning', code: 'missing-exported-definition', message: `Exports "${sym}" but no definition found in this file`, }); } } } } } /** * Detect pregexp inline flags ((?i), (?m), (?s), (?x)) in string literals. * Gerbil's :std/pregexp does not support these Perl-style inline flags — * they cause a cryptic "BUG: pregexp internal error" at runtime from * pregexp-read-cluster-type. Suggest character classes or string-downcase instead. */ function checkPregexpInlineFlags( lines: string[], diagnostics: LintDiagnostic[], ): void { // Match (?i), (?m), (?s), (?x), (?I), etc. inside a string const INLINE_FLAG_RE = /$\?[imsxIMSX]$/; for (let i = 0; i < lines.length; i++) { const line = lines[i]; const lineNum = i + 1; const trimmed = line.trimStart(); // Skip pure comment lines if (trimmed.startsWith(';')) continue; // Quick bail: no inline flag pattern at all if (!INLINE_FLAG_RE.test(line)) continue; // Scan for string literals and check if they contain an inline flag let j = 0; let warned = false; while (j < line.length && !warned) { const ch = line[j]; // Skip line comments if (ch === ';') break; // Enter a string literal if (ch === '"') { const start = j; j++; while (j < line.length) { if (line[j] === '\\') { j += 2; // skip escaped character continue; } if (line[j] === '"') { j++; break; } j++; } const strContent = line.slice(start, j); const flagMatch = INLINE_FLAG_RE.exec(strContent); if (flagMatch) { diagnostics.push({ line: lineNum, severity: 'warning', code: 'pregexp-inline-flag', message: `String contains pregexp inline flag "${flagMatch[0]}". ` + "Gerbil's :std/pregexp does not support (?i)/(?m)/(?s)/(?x) — " + 'they cause a "BUG: pregexp internal error" at runtime. ' + 'Use character classes (e.g. [Aa][Bb] for case-insensitive "ab") ' + 'or string-downcase/string-upcase before matching.', }); warned = true; } continue; } j++; } } } /** * Detect when both character I/O and byte I/O functions are used on the same port. * Gambit raises nonempty-input-port-character-buffer-exception when byte I/O follows * char I/O on the same port, because read-line consumes bytes into the character buffer. * Common in HTTP/LSP Content-Length framed protocols where headers use read-line and * body uses read-subu8vector. */ function checkCharByteIOMixing( lines: string[], diagnostics: LintDiagnostic[], ): void { const CHAR_IO_FUNCTIONS = new Set([ 'display', 'displayln', 'write', 'write-char', 'read-char', 'read-line', 'newline', 'print', 'println', 'pretty-print', 'write-string', 'read-string', 'read', ]); const BYTE_IO_FUNCTIONS = new Set([ 'read-subu8vector', 'write-subu8vector', 'read-u8', 'write-u8', 'read-u8vector', 'write-u8vector', ]); const defBoundary = /^\s*\(\s*(def\b|def\*|defmethod|defclass|defstruct)/; // Track I/O usages per variable within each function scope // Map: function start line → Map of variable → usage array const scopes = new Map<number, Map<string, Array<{line: number; type: 'char' | 'byte'; fn: string}>>>(); let currentScopeStart = 0; for (let i = 0; i < lines.length; i++) { const trimmed = lines[i].trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; // Track function boundaries if (defBoundary.test(trimmed)) { currentScopeStart = i; scopes.set(currentScopeStart, new Map()); } // Get current scope map const scopeMap = scopes.get(currentScopeStart); if (!scopeMap) continue; // Check for char I/O functions on this line for (const fn of CHAR_IO_FUNCTIONS) { if (trimmed.includes(fn)) { const fnIdx = trimmed.indexOf(fn); // Verify word boundary const leftOk = fnIdx === 0 || /[\s([\]{}'`,;]/.test(trimmed[fnIdx - 1]); const rightIdx = fnIdx + fn.length; const rightOk = rightIdx >= trimmed.length || /[\s)[\]{}'`,;]/.test(trimmed[rightIdx]); if (leftOk && rightOk) { // Extract potential port variable names from the line const vars = trimmed.match(/\b[a-zA-Z_][-a-zA-Z0-9_]*/g) || []; for (const v of vars) { // Skip function names and common keywords if (v === fn || v === 'let' || v === 'def' || v === 'lambda') continue; if (!scopeMap.has(v)) { scopeMap.set(v, []); } scopeMap.get(v)!.push({line: lineNum, type: 'char', fn}); } break; } } } // Check for byte I/O functions on this line for (const fn of BYTE_IO_FUNCTIONS) { if (trimmed.includes(fn)) { const fnIdx = trimmed.indexOf(fn); // Verify word boundary const leftOk = fnIdx === 0 || /[\s([\]{}'`,;]/.test(trimmed[fnIdx - 1]); const rightIdx = fnIdx + fn.length; const rightOk = rightIdx >= trimmed.length || /[\s)[\]{}'`,;]/.test(trimmed[rightIdx]); if (leftOk && rightOk) { // Extract potential port variable names from the line const vars = trimmed.match(/\b[a-zA-Z_][-a-zA-Z0-9_]*/g) || []; for (const v of vars) { // Skip function names and common keywords if (v === fn || v === 'let' || v === 'def' || v === 'lambda') continue; if (!scopeMap.has(v)) { scopeMap.set(v, []); } scopeMap.get(v)!.push({line: lineNum, type: 'byte', fn}); } break; } } } } // Check each scope for mixed usage for (const [scopeLine, varMap] of scopes) { for (const [varName, usages] of varMap) { const charUsages = usages.filter(u => u.type === 'char'); const byteUsages = usages.filter(u => u.type === 'byte'); if (charUsages.length > 0 && byteUsages.length > 0) { const charUsage = charUsages[0]; const byteUsage = byteUsages[0]; diagnostics.push({ line: Math.min(charUsage.line, byteUsage.line), severity: 'error', code: 'char-byte-io-mixing', message: `Port variable "${varName}" uses both character I/O (${charUsage.fn} at L${charUsage.line}) ` + `and byte I/O (${byteUsage.fn} at L${byteUsage.line}). ` + 'Mixing char and byte I/O on the same port causes nonempty-input-port-character-buffer-exception. ' + 'Use only char I/O or only byte I/O, or create separate ports.', }); } } } } /** * Suggest stdlib sugar macros for verbose patterns. * Detects patterns that could be simplified using :std/sugar macros like * awhen, if-let, let-hash, etc. */ function checkMacroSuggestions( lines: string[], diagnostics: LintDiagnostic[], ): void { for (let i = 0; i < lines.length; i++) { const line = lines[i]; const trimmed = line.trimStart(); const lineNum = i + 1; // Skip comments if (trimmed.startsWith(';')) continue; // Pattern 1: (let (var expr) (when var ...)) → suggest awhen // Look for let followed by when using the same variable const letWhenMatch = trimmed.match(/\(let\s+\(\((\S+)\s+/); if (letWhenMatch) { const varName = letWhenMatch[1]; // Look ahead for (when varName ...) const lookAhead = lines.slice(i, Math.min(i + 5, lines.length)).join(' '); if (new RegExp(`\\(when\\s+${varName}\\b`).test(lookAhead)) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-awhen', message: `Consider using 'awhen' instead of let + when. awhen binds the result to 'it' if truthy: (awhen (${varName} expr) ...)`, }); } } // Pattern 2: (let (var expr) (if var ...)) → suggest if-let if (letWhenMatch) { const varName = letWhenMatch[1]; const lookAhead = lines.slice(i, Math.min(i + 5, lines.length)).join(' '); if (new RegExp(`\\(if\\s+${varName}\\b`).test(lookAhead)) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-if-let', message: `Consider using 'if-let' instead of let + if: (if-let (${varName} expr) then-branch else-branch)`, }); } } // Pattern 3: Multiple hash-ref calls in let bindings → suggest let-hash // (let ((a (hash-ref h "a")) (b (hash-ref h "b"))) ...) if (trimmed.includes('let') && trimmed.includes('hash-ref')) { const lookAhead = lines.slice(i, Math.min(i + 10, lines.length)).join('\n'); const hashRefCount = (lookAhead.match(/hash-ref\s+(\S+)/g) || []).length; if (hashRefCount >= 2) { // Extract the hash table variable name from first hash-ref const firstHashRef = lookAhead.match(/hash-ref\s+(\S+)\s+/); if (firstHashRef) { const hashVar = firstHashRef[1]; // Check if multiple hash-refs use the same hash variable const sameHashCount = (lookAhead.match(new RegExp(`hash-ref\\s+${hashVar}\\s+`, 'g')) || []).length; if (sameHashCount >= 2) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-let-hash', message: `Consider using 'let-hash' for multiple hash-ref from the same hash: (let-hash ${hashVar} ((key1 val1) (key2 val2) ...) ...)`, }); } } } } // Pattern 4: try with explicit cleanup → suggest with-destroy if (trimmed.includes('try') || trimmed.includes('with-catch')) { const lookAhead = lines.slice(i, Math.min(i + 15, lines.length)).join('\n'); if ((lookAhead.includes('finally') || lookAhead.includes('close')) && (lookAhead.includes('make-') || lookAhead.includes('open-'))) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-with-destroy', message: `Consider using 'with-destroy' for automatic resource cleanup: (with-destroy obj-expr obj-destructor body ...)`, }); } } // Pattern 5: Repeated hash-get on same object → suggest using // This is trickier - look for multiple hash-get calls with the same first argument const hashGetMatches = trimmed.match(/hash-get\s+(\S+)\s+/g); if (hashGetMatches && hashGetMatches.length >= 3) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-using', message: `Consider using 'using' macro for repeated access: (using (obj-expr :- accessor) (accessor \"field1\") (accessor \"field2\") ...)`, }); } // Pattern 6: Nested let expressions → suggest chain or let* if (trimmed.match(/\(let\s+\(\(/)) { const lookAhead = lines.slice(i, Math.min(i + 10, lines.length)).join('\n'); const nestedLetCount = (lookAhead.match(/\(let\s+\(\(/g) || []).length; if (nestedLetCount >= 2) { diagnostics.push({ line: lineNum, severity: 'info', code: 'suggest-let-star-or-chain', message: `Consider using 'let*' for sequential bindings or 'chain' for threading values: (let* ((a expr1) (b (use-a a))) ...) or (chain expr (fn1) (fn2))`, }); } } } } /** * Detect call sites using keyword syntax on functions defined with positional optionals. * e.g., (def (f a (prompt ">")) ...) called as (f x prompt: "hello") * The keyword symbol silently becomes a positional argument value. */ function checkKeywordPositionalMismatch( content: string, analysis: FileAnalysis, diagnostics: LintDiagnostic[], ): void { // Find function definitions with positional optionals (not keyword optionals) // Positional: (def (f a (prompt ">") (multi? #f))) // Keyword: (def (f a prompt: (prompt ">"))) const positionalOptFuncs = new Map<string, number>(); // name -> line for (const def of analysis.definitions) { if (def.kind !== 'procedure') continue; // Find the definition line to check for positional optionals const lines = content.split('\n'); const defLine = lines[def.line - 1] || ''; // Look for (def (name ... (opt default) ... ) pattern WITHOUT keyword: syntax const paramMatch = defLine.match( /\(\s*(?:def\*?|define)\s+\(\s*([a-zA-Z_!?<>=+\-*/][a-zA-Z0-9_!?<>=+\-*/.:#~]*)\s+(.*)/, ); if (!paramMatch) continue; const paramStr = paramMatch[2]; // Has positional optionals (parenthesized defaults) but NOT keyword: params if (paramStr.match(/\([a-zA-Z_!?<>=+\-*/]/) && !paramStr.match(/[a-zA-Z_!?<>=+\-*/]+:/)) { positionalOptFuncs.set(def.name, def.line); } } if (positionalOptFuncs.size === 0) return; // Scan for call sites that use keyword syntax on these functions const lines = content.split('\n'); for (let i = 0; i < lines.length; i++) { const line = lines[i]; const commentIdx = line.indexOf(';'); const effective = commentIdx >= 0 ? line.slice(0, commentIdx) : line; for (const [funcName, defLine] of positionalOptFuncs) { // Look for (funcName ... keyword: value) const escaped = funcName.replace(/[.*+?^${}()|[\]\\]/g, '\\$&'); const callPattern = new RegExp(`\\(\\s*${escaped}\\b.*\\s([a-zA-Z_!?<>=+\\-*/][a-zA-Z0-9_!?<>=+\\-*/.#~]*):\\s`); const callMatch = effective.match(callPattern); if (callMatch && i + 1 !== defLine) { diagnostics.push({ line: i + 1, severity: 'warning', code: 'keyword-positional-mismatch', message: `"${funcName}" uses positional optionals (line ${defLine}) but is called with keyword syntax "${callMatch[1]}:". ` + `The keyword symbol will be consumed as a positional arg value, shifting subsequent parameters. ` + `Either change the definition to use keyword args (e.g., ${callMatch[1]}: (${callMatch[1]} default)) or remove the keyword syntax from the call.`, }); } } } } /** * Qt callback arity checking. * Maps qt-on-*! functions to expected handler arities based on signal type. */ const QT_SIGNAL_ARITIES: Record<string, { arity: number; type: string }> = { 'qt-on-clicked!': { arity: 0, type: 'void' }, 'qt-on-toggled!': { arity: 1, type: 'bool' }, 'qt-on-text-changed!': { arity: 1, type: 'string' }, 'qt-on-text-edited!': { arity: 1, type: 'string' }, 'qt-on-value-changed!': { arity: 1, type: 'int' }, 'qt-on-index-changed!': { arity: 1, type: 'int' }, 'qt-on-current-index-changed!': { arity: 1, type: 'int' }, 'qt-on-return-pressed!': { arity: 0, type: 'void' }, 'qt-on-activated!': { arity: 1, type: 'int' }, 'qt-on-pressed!': { arity: 0, type: 'void' }, 'qt-on-released!': { arity: 0, type: 'void' }, 'qt-on-selection-changed!': { arity: 0, type: 'void' }, 'qt-on-current-changed!': { arity: 1, type: 'int' }, 'qt-on-item-clicked!': { arity: 1, type: 'int' }, 'qt-on-double-clicked!': { arity: 1, type: 'int' }, 'qt-on-state-changed!': { arity: 1, type: 'int' }, 'qt-on-timeout!': { arity: 0, type: 'void' }, 'qt-on-finished!': { arity: 1, type: 'int' }, 'qt-on-triggered!': { arity: 0, type: 'void' }, }; /** * Detect qt-on-*! signal handler calls with lambda arity mismatches. */ function checkQtCallbackArity( lines: string[], diagnostics: LintDiagnostic[], ): void { for (let i = 0; i < lines.length; i++) { const line = lines[i]; const commentIdx = line.indexOf(';'); const effective = commentIdx >= 0 ? line.slice(0, commentIdx) : line; for (const [funcName, info] of Object.entries(QT_SIGNAL_ARITIES)) { if (!effective.includes(funcName)) continue; // Look for (qt-on-*! widget (lambda (...) ...)) const escaped = funcName.replace(/[.*+?^${}()|[\]\\]/g, '\\$&'); const pattern = new RegExp(`${escaped}[^(]*\$\\s*lambda\\s+\\(([^)]*)\$`); // Check current and next few lines (lambda may be on next line) const context = lines.slice(i, Math.min(i + 5, lines.length)).join(' '); const match = context.match(pattern); if (match) { const params = match[1].trim(); const actualArity = params.length === 0 ? 0 : params.split(/\s+/).length; if (actualArity !== info.arity) { diagnostics.push({ line: i + 1, severity: 'warning', code: 'qt-callback-arity', message: `${funcName} expects a ${info.type} handler (${info.arity} arg${info.arity === 1 ? '' : 's'}) ` + `but lambda has ${actualArity} parameter${actualArity === 1 ? '' : 's'}. ` + `The arity exception will be silently caught by the FFI dispatch — the handler will never fire.`, }); } } } } }

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/ober/gerbil-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

lint.ts•47.2 KiB