CodeGraphContext

MIT License

138

Overview InspectNew Endpoints Schema Related Servers Reviews Score

watcher.py•7.71 kB

# src/codegraphcontext/core/watcher.py """ This module implements the live file-watching functionality using the `watchdog` library. It observes directories for changes and triggers updates to the code graph. """ import logging import threading from pathlib import Path import typing from watchdog.observers import Observer from watchdog.events import FileSystemEventHandler if typing.TYPE_CHECKING: from codegraphcontext.tools.graph_builder import GraphBuilder from codegraphcontext.core.jobs import JobManager logger = logging.getLogger(__name__) class RepositoryEventHandler(FileSystemEventHandler): """ A dedicated event handler for a single repository being watched. This handler is stateful. It performs an initial scan of the repository to build a baseline and then uses this cached state to perform efficient updates when files are changed, created, or deleted. """ def __init__(self, graph_builder: "GraphBuilder", repo_path: Path, debounce_interval=2.0): """ Initializes the event handler. Args: graph_builder: An instance of the GraphBuilder to perform graph operations. repo_path: The absolute path to the repository directory to watch. debounce_interval: The time in seconds to wait for more changes before processing an event. """ super().__init__() self.graph_builder = graph_builder self.repo_path = repo_path self.debounce_interval = debounce_interval self.timers = {} # A dictionary to manage debounce timers for file paths. # Caches for the repository's state. self.all_file_data = [] self.imports_map = {} # Perform the initial scan and linking when the watcher is created. self._initial_scan() def _initial_scan(self): """Scans the entire repository, parses all files, and builds the initial graph.""" logger.info(f"Performing initial scan for watcher: {self.repo_path}") all_files = list(self.repo_path.rglob("*.py")) # 1. Pre-scan all files to get a global map of where every symbol is defined. self.imports_map = self.graph_builder._pre_scan_for_imports(all_files) # 2. Parse all files in detail and cache the parsed data. for f in all_files: parsed_data = self.graph_builder.parse_python_file(self.repo_path, f, self.imports_map) if "error" not in parsed_data: self.all_file_data.append(parsed_data) # 3. After all files are parsed, create the relationships (e.g., function calls) between them. self.graph_builder._create_all_function_calls(self.all_file_data, self.imports_map) logger.info(f"Initial scan and graph linking complete for: {self.repo_path}") def _debounce(self, event_path, action): """ Schedules an action to run after a debounce interval. This prevents the handler from firing on every single file save event in rapid succession, which is common in IDEs. It waits for a quiet period before processing. """ # If a timer already exists for this path, cancel it. if event_path in self.timers: self.timers[event_path].cancel() # Create and start a new timer. timer = threading.Timer(self.debounce_interval, action) timer.start() self.timers[event_path] = timer def _handle_modification(self, event_path_str: str): """ Orchestrates the complete update cycle for a modified or created file. This involves updating the graph and then re-linking the relationships. """ logger.info(f"File change detected, starting full update for: {event_path_str}") modified_path = Path(event_path_str) # 1. Update the specific file in the graph (delete old nodes, create new ones). new_file_data = self.graph_builder.update_file_in_graph( modified_path, self.repo_path, self.imports_map ) if not new_file_data: logger.error(f"Update failed for {event_path_str}, skipping re-link.") return # 2. Update the in-memory cache of the repository's state. self.all_file_data = [d for d in self.all_file_data if d.get("file_path") != event_path_str] if not new_file_data.get("deleted"): self.all_file_data.append(new_file_data) # 3. CRITICAL: Re-link the entire graph's call relationships using the updated cache. # This is necessary because a change in one file can affect its relationship with any other file. logger.info("Re-linking the call graph with updated information...") self.graph_builder._create_all_function_calls(self.all_file_data, self.imports_map) logger.info(f"Graph update for {event_path_str} complete! ✅") # The following methods are called by the watchdog observer when a file event occurs. def on_created(self, event): if not event.is_directory and event.src_path.endswith('.py'): self._debounce(event.src_path, lambda: self._handle_modification(event.src_path)) def on_modified(self, event): if not event.is_directory and event.src_path.endswith('.py'): self._debounce(event.src_path, lambda: self._handle_modification(event.src_path)) def on_deleted(self, event): if not event.is_directory and event.src_path.endswith('.py'): self._debounce(event.src_path, lambda: self._handle_modification(event.src_path)) def on_moved(self, event): if not event.is_directory and event.src_path.endswith('.py'): # A move is treated as a deletion at the old path and a creation at the new path. self._debounce(event.src_path, lambda: self._handle_modification(event.src_path)) self._debounce(event.dest_path, lambda: self._handle_modification(event.dest_path)) class CodeWatcher: """ Manages the file system observer thread. It can watch multiple directories, assigning a separate `RepositoryEventHandler` to each one. """ def __init__(self, graph_builder: "GraphBuilder", job_manager= "JobManager"): self.graph_builder = graph_builder self.observer = Observer() self.watched_paths = set() # Keep track of paths already being watched. def watch_directory(self, path: str): """Schedules a directory to be watched for changes.""" path_obj = Path(path).resolve() path_str = str(path_obj) if path_str in self.watched_paths: logger.info(f"Path already being watched: {path_str}") return {"message": f"Path already being watched: {path_str}"} # Create a new, dedicated event handler for this specific repository path. event_handler = RepositoryEventHandler(self.graph_builder, path_obj) self.observer.schedule(event_handler, path_str, recursive=True) self.watched_paths.add(path_str) logger.info(f"Started watching for code changes in: {path_str}") return {"message": f"Started watching {path_str}. Initial scan is in progress."} def start(self): """Starts the observer thread.""" if not self.observer.is_alive(): self.observer.start() logger.info("Code watcher observer thread started.") def stop(self): """Stops the observer thread gracefully.""" if self.observer.is_alive(): self.observer.stop() self.observer.join() # Wait for the thread to terminate. logger.info("Code watcher observer thread stopped.")

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Shashankss1205/CodeGraphContext'

If you have feedback or need assistance with the MCP directory API, please join our Discord server