Claude Code MCP - Agent Orchestration Platform

mcp_tools.py•116 KiB

""" MCP Tools Implementation - Agent Orchestration Platform This module implements all 8 core MCP tools for the Agent Orchestration Platform with comprehensive validation, security enforcement, and monitoring integration. Architecture Integration: - Design Patterns: Facade pattern for MCP integration, Command pattern for agent operations - Security Model: Defense-in-depth with comprehensive input validation and audit logging - Performance Profile: O(1) tool operations with efficient async execution and monitoring Technical Decisions: - FastMCP Integration: Enhanced tool registration with automatic schema generation - Security-First Design: All operations validated with comprehensive security contracts - Comprehensive Monitoring: Real-time performance tracking and audit logging - Error Handling: Robust error recovery with automatic rollback capabilities Dependencies & Integration: - External: FastMCP framework, iTerm2 integration, Claude Code orchestration - Internal: Agent/Session managers, validation framework, rollback utilities Quality Assurance: - Test Coverage: Property-based testing for all tool operations - Error Handling: Comprehensive error recovery with secure failure modes - Contract Validation: All operations protected by security and business contracts Author: Adder_5 | Created: 2025-06-26 | Last Modified: 2025-06-26 """ import asyncio import time from datetime import datetime from pathlib import Path from typing import Any, Dict, List, Optional, Union # Import MCP framework from fastmcp import Context, FastMCP # Import boundary enforcement from src.boundaries.audit import AuditCategory, AuditLevel, get_audit_logger # Import security contracts from src.contracts.security import ( agent_creation_contract, set_security_context, validate_agent_operation, ) from src.contracts_compat import ensure, require # Import core managers (these will be injected via dependency injection) from src.interfaces.manager_protocols import ( AgentManagerProtocol, ClaudeManagerProtocol, ITermManagerProtocol, SessionManagerProtocol, ) from src.models.agent import AgentCreationRequest, AgentSpecialization, ClaudeConfig # Import type system from src.models.ids import AgentId, SessionId from src.models.mcp_results import ( AgentCreationResult, AgentDeletionResult, SessionCreationResult, SessionDeletionResult, ) from src.models.security import SecurityContext, SecurityLevel from src.models.session import SessionCreationRequest from src.models.validation import ValidationError from src.utils.errors import OperationError # Import rollback utilities from src.utils.rollback import AgentCreationRollback, RollbackContext, with_rollback # Import validation framework from src.validators.agent_creation import ( AgentCreationValidationError, AgentCreationValidator, ValidationContext, validate_agent_creation_request, ) # Import validation utilities from src.validators.input import sanitize_user_input, validate_file_path class AgentOrchestrationTools: """ Comprehensive MCP tools for agent orchestration platform. Implements all 8 core MCP tools with enhanced security, validation, and monitoring for sophisticated multi-agent Claude Code coordination. Contracts: Preconditions: - All managers are properly initialized and available - Security context is established for all operations - Audit logging is configured and operational Postconditions: - All operations maintain comprehensive audit trails - Resource cleanup occurs on all error paths - Security boundaries are enforced throughout Invariants: - Agent count never exceeds system limits - All operations are logged with security context - Resource allocations are tracked and cleaned up """ def __init__( self, agent_manager: AgentManagerProtocol, session_manager: SessionManagerProtocol, iterm_manager: ITermManagerProtocol, claude_manager: ClaudeManagerProtocol, ): """Initialize MCP tools with dependency injection.""" self.agent_manager = agent_manager self.session_manager = session_manager self.iterm_manager = iterm_manager self.claude_manager = claude_manager # Initialize validation and audit systems self.validator = AgentCreationValidator() self._audit_logger = None # Performance tracking self._tool_execution_stats: Dict[str, Dict[str, Any]] = {} async def initialize(self) -> None: """Initialize tools with audit logging and validation systems.""" try: await self.validator.initialize() self._audit_logger = get_audit_logger() # Initialize performance tracking for tool_name in [ "create_agent", "delete_agent", "create_session", "get_session_status", "delete_session", "send_message_to_agent", "clear_agent_conversation", "start_new_agent_conversation", ]: self._tool_execution_stats[tool_name] = { "total_executions": 0, "successful_executions": 0, "failed_executions": 0, "avg_duration_ms": 0.0, } except Exception as e: raise RuntimeError(f"Failed to initialize MCP tools: {e}") # Tool 1: create_agent - Core agent creation with comprehensive validation @agent_creation_contract async def create_agent( self, session_id: str, agent_name: str, specialization: Optional[str] = None, system_prompt_suffix: str = "", claude_config: Optional[Dict[str, Any]] = None, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Create new Claude Code agent with comprehensive validation and monitoring. Implements complete agent creation workflow with security validation, resource allocation, iTerm2 integration, and Claude Code orchestration. Contracts: Preconditions: - session_id corresponds to existing, accessible session - agent_name follows Agent_# format and is unique - System has capacity for new agent - All inputs pass security validation Postconditions: - Agent created with unique ID and active status - iTerm2 tab created and accessible - Claude Code process spawned and configured - ADDER+ prompt injected with agent name - Agent state persisted with encryption - Health monitoring initiated Invariants: - Agent count never exceeds session limits - All operations maintain audit trails - Resource cleanup occurs on failure - Security boundaries are enforced Security Implementation: - Input Validation: Comprehensive whitelist validation for all parameters - Agent Name Security: Strict pattern matching to prevent injection - Resource Limits: Enforced limits on memory, CPU, and process counts - Directory Boundaries: Agent operations confined to session root - Audit Trail: Complete logging of creation process and outcomes Args: session_id: Target session identifier (validated) agent_name: Agent name in Agent_# format (validated and sanitized) specialization: Optional agent specialization from allowed set system_prompt_suffix: Additional system prompt content (sanitized) claude_config: Claude Code configuration options (validated) ctx: FastMCP context for progress reporting and logging Returns: Dict[str, Any]: Agent creation result with comprehensive metadata Raises: ValidationError: Input validation or security check failure ResourceLimitError: Insufficient system resources or capacity OperationError: Agent creation process failure SecurityError: Security policy violation or unauthorized access """ execution_start = time.time() operation_id = f"create_agent_{int(execution_start * 1000)}" # Initialize rollback context for comprehensive cleanup rollback = AgentCreationRollback(operation_id) await rollback.initialize() try: # Phase 1: Progress Reporting and Initial Validation if ctx: await ctx.info(f"Creating agent {agent_name} in session {session_id}") await ctx.report_progress(5, 100, "Validating request parameters") # Phase 2: Comprehensive Input Validation session_state = await self.session_manager.get_session_state( SessionId(session_id), SecurityContext(), # TODO: Actual security context ) if not session_state: raise ValidationError(f"Session {session_id} not found or inaccessible") # Create validation context with current system state validation_context = ValidationContext( session_id=SessionId(session_id), security_level=session_state.security_level, max_agents_in_session=session_state.max_agents, current_agent_count=len(session_state.agents), available_memory_mb=2048, # TODO: Get from resource manager available_cpu_percent=75.0, # TODO: Get from resource manager ) if ctx: await ctx.report_progress(15, 100, "Performing security validation") # Comprehensive validation using validation framework validation_result = await self.validator.validate_agent_creation_request( session_id=SessionId(session_id), agent_name=agent_name, specialization=specialization, system_prompt_suffix=system_prompt_suffix, claude_config=claude_config, validation_context=validation_context, ) if not validation_result.is_valid: raise AgentCreationValidationError( f"Agent creation validation failed: {validation_result.get_failure_summary()}" ) # Use validated request for all subsequent operations validated_request = validation_result.validated_request if not validated_request: raise ValidationError( "Validation succeeded but no validated request created" ) # Phase 3: Agent Creation via AgentManager if ctx: await ctx.report_progress( 30, 100, "Creating agent with resource allocation" ) # Capture pre-operation state for rollback existing_agents = { aid: agent for aid, agent in session_state.agents.items() } rollback.capture_pre_operation_state( existing_agents=existing_agents, existing_sessions={session_state.session_id: session_state}, resource_allocations={}, # TODO: Get current allocations ) # Create agent through AgentManager agent_creation_result = await self.agent_manager.create_agent( request=validated_request, security_context=SecurityContext(), # TODO: Actual security context ) if not agent_creation_result.success: raise RuntimeError( f"Agent creation failed: {agent_creation_result.message}" ) agent_id = agent_creation_result.agent_id rollback.add_agent_cleanup(agent_id) # Phase 4: iTerm2 Tab Creation if ctx: await ctx.report_progress(50, 100, "Creating iTerm2 tab") try: tab_id = await self.iterm_manager.create_tab( agent_id=agent_id, session_id=SessionId(session_id), working_directory=session_state.root_path, security_context=SecurityContext(), ) rollback.add_iterm_tab_cleanup(tab_id, self.iterm_manager) except Exception as e: raise RuntimeError(f"Failed to create iTerm2 tab: {e}") # Phase 5: Claude Code Process Activation if ctx: await ctx.report_progress(70, 100, "Activating Claude Code process") try: # Navigate to session root and activate Claude Code activation_command = f"cd {session_state.root_path} && claude" if validated_request.claude_config.model != "sonnet-3.5": activation_command += ( f" --model {validated_request.claude_config.model}" ) if validated_request.claude_config.no_color: activation_command += " --no-color" # Send activation command to iTerm2 tab await self.iterm_manager.send_text( tab_id=tab_id, text=activation_command + "\\n", security_context=SecurityContext(), ) # Wait for Claude Code to initialize await asyncio.sleep(3) except Exception as e: raise RuntimeError(f"Failed to activate Claude Code: {e}") # Phase 6: ADDER+ Prompt Injection if ctx: await ctx.report_progress(85, 100, "Injecting ADDER+ system prompt") try: # Build ADDER+ prompt with agent name injection adder_prompt = self._build_adder_prompt( agent_name=validated_request.agent_name, specialization=validated_request.specialization, system_prompt_suffix=validated_request.system_prompt_suffix, session_root_path=session_state.root_path, ) # Send ADDER+ prompt to Claude Code await self.iterm_manager.send_text( tab_id=tab_id, text=adder_prompt + "\\n", security_context=SecurityContext(), ) # Wait for prompt processing await asyncio.sleep(2) except Exception as e: raise RuntimeError(f"Failed to inject ADDER+ prompt: {e}") # Phase 7: Final Status Update and Completion if ctx: await ctx.report_progress(100, 100, "Agent creation complete") await ctx.info( f"Successfully created agent {validated_request.agent_name}" ) # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Clear rollback on success rollback.clear() # Update performance statistics self._update_tool_performance( "create_agent", execution_duration, success=True ) # Log successful agent creation if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.AGENT_OPERATIONS, operation="agent_created", resource_type="agent", resource_id=str(agent_id), success=True, metadata={ "agent_name": validated_request.agent_name, "session_id": str(session_id), "specialization": ( validated_request.specialization.value if validated_request.specialization else None ), "execution_duration_ms": execution_duration, "iterm_tab_id": tab_id, "validation_warnings": len( validation_result.validation_warnings ), }, ) # Return comprehensive success result return { "success": True, "agent_id": str(agent_id), "agent_name": validated_request.agent_name, "session_id": session_id, "iterm_tab_id": tab_id, "specialization": ( validated_request.specialization.value if validated_request.specialization else None ), "claude_config": { "model": validated_request.claude_config.model, "no_color": validated_request.claude_config.no_color, "working_directory": str(session_state.root_path), }, "execution_duration_ms": execution_duration, "validation_warnings": validation_result.validation_warnings, "status": "ACTIVE", "created_at": datetime.utcnow().isoformat(), } except Exception as e: # Execute rollback on any failure try: await rollback.execute() except Exception as rollback_error: if ctx: await ctx.error(f"Rollback also failed: {rollback_error}") # Calculate execution time for failure execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics for failure self._update_tool_performance( "create_agent", execution_duration, success=False ) # Log agent creation failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.AGENT_OPERATIONS, operation="agent_creation_failed", resource_type="agent_creation_request", resource_id=operation_id, success=False, error_message=str(e), metadata={ "agent_name": agent_name, "session_id": session_id, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) # Report error to user if ctx: await ctx.error(f"Agent creation failed: {str(e)}") # Return failure result return { "success": False, "error": str(e), "error_type": type(e).__name__, "agent_name": agent_name, "session_id": session_id, "execution_duration_ms": execution_duration, "rollback_executed": True, } # Tool 2: delete_agent - Comprehensive agent removal with cleanup @require( lambda self, agent_name, *args, **kwargs: agent_name and isinstance(agent_name, str) ) @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def delete_agent( self, agent_name: str, force: bool = False, timeout_seconds: int = 30, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Delete agent with comprehensive cleanup and state persistence. Performs secure agent deletion with graceful termination, complete resource cleanup, and comprehensive audit logging. Ensures all agent resources are properly deallocated and state is securely removed. Contracts: Preconditions: - agent_name must be non-empty string in Agent_# format - Agent must exist and be accessible - Caller must have appropriate permissions - System must not be in critical operation state (unless force=True) Postconditions: - Agent process gracefully terminated or forcefully killed - iTerm2 tab closed and cleaned up - All agent state securely deleted - Resources deallocated and freed - Audit trail created for deletion - Session state updated to reflect removal Invariants: - No orphaned processes left after deletion - No state remnants in encrypted storage - Session agent count properly decremented - System capacity properly updated Security Implementation: - Permission Validation: Verifies caller can delete target agent - State Verification: Ensures agent is in deletable state - Secure Deletion: Uses cryptographic erasure for state removal - Audit Trail: Complete logging of deletion process - Resource Tracking: Ensures all resources are freed Args: agent_name: Name of agent to delete (Agent_# format) force: Whether to force deletion without graceful shutdown timeout_seconds: Maximum time to wait for graceful termination ctx: FastMCP context for progress reporting Returns: Dict[str, Any]: Deletion result with comprehensive status: - success: Whether deletion completed successfully - agent_id: ID of deleted agent - cleanup_summary: Details of cleanup operations - resources_freed: Summary of freed resources - execution_duration_ms: Total operation time Raises: ValidationError: Invalid agent name or format SecurityError: Insufficient permissions for deletion OperationError: Agent has critical operations (unless force=True) TimeoutError: Graceful termination exceeded timeout """ execution_start = time.time() operation_id = f"delete_agent_{int(execution_start * 1000)}" try: # Phase 1: Initial Validation and Progress Reporting if ctx: await ctx.info(f"Deleting agent {agent_name} (force={force})") await ctx.report_progress(5, 100, "Validating agent name format") # Validate agent name format import re agent_name_pattern = re.compile(r"^Agent_\d+$") if not agent_name_pattern.match(agent_name): raise ValidationError( f"Invalid agent name format. Expected 'Agent_#', got: {agent_name}" ) # Phase 2: Agent Location and Access Verification if ctx: await ctx.report_progress(15, 100, "Locating agent across sessions") # Find agent across all sessions agent_info = await self.agent_manager.find_agent_by_name( agent_name=agent_name, security_context=SecurityContext() ) if not agent_info: raise ValidationError(f"Agent {agent_name} not found in any session") agent_id = agent_info.agent_id session_id = agent_info.session_id # Verify permissions to delete this agent # TODO: Implement proper permission checking based on security context # Phase 3: Pre-deletion Safety Checks if ctx: await ctx.report_progress(25, 100, "Performing safety checks") # Check for active critical operations if not force: agent_state = await self.agent_manager.get_agent_state( agent_id=agent_id, security_context=SecurityContext() ) if agent_state and agent_state.has_critical_operations: critical_ops = agent_state.get_critical_operations() raise OperationError( f"Agent has {len(critical_ops)} critical operations in progress. " f"Use force=True to override. Operations: {critical_ops}" ) # Phase 4: Graceful Termination Process if ctx: await ctx.report_progress(40, 100, "Initiating graceful termination") # Send termination signal to Claude Code process termination_start = time.time() termination_success = False if not force: try: # Send graceful shutdown command await self.iterm_manager.send_text( tab_id=agent_info.iterm_tab_id, text="/exit\n", # Claude Code exit command security_context=SecurityContext(), ) # Wait for process termination with timeout elapsed = 0 while elapsed < timeout_seconds: if not await self._is_process_running(agent_info.process_id): termination_success = True break await asyncio.sleep(1) elapsed = time.time() - termination_start if ctx and elapsed % 5 == 0: await ctx.report_progress( 40 + int((elapsed / timeout_seconds) * 20), 100, f"Waiting for graceful shutdown ({elapsed}s/{timeout_seconds}s)", ) except Exception as e: if ctx: await ctx.warn(f"Graceful termination failed: {e}") # Phase 5: Force Termination if Needed if not termination_success: if ctx: await ctx.report_progress(60, 100, "Force terminating process") # Force kill the process await self._force_terminate_process(agent_info.process_id) # Verify process is terminated if await self._is_process_running(agent_info.process_id): raise OperationError( f"Failed to terminate agent process {agent_info.process_id}" ) # Phase 6: Resource Cleanup if ctx: await ctx.report_progress(70, 100, "Cleaning up resources") # Close iTerm2 tab try: await self.iterm_manager.close_tab( tab_id=agent_info.iterm_tab_id, security_context=SecurityContext() ) except Exception as e: if ctx: await ctx.warn(f"iTerm2 tab cleanup warning: {e}") # Phase 7: State Deletion if ctx: await ctx.report_progress(85, 100, "Deleting agent state") # Delete agent through AgentManager (handles all state cleanup) deletion_result = await self.agent_manager.delete_agent( agent_name=agent_name, force=force, security_context=SecurityContext() ) if not deletion_result: raise OperationError("Agent manager deletion failed") # Phase 8: Verification and Completion if ctx: await ctx.report_progress(95, 100, "Verifying deletion") # Verify agent is completely removed remaining_agent = await self.agent_manager.find_agent_by_name( agent_name=agent_name, security_context=SecurityContext() ) if remaining_agent: raise OperationError( "Agent deletion verification failed - agent still exists" ) if ctx: await ctx.report_progress(100, 100, "Agent deletion complete") await ctx.info(f"Successfully deleted agent {agent_name}") # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "delete_agent", execution_duration, success=True ) # Log successful deletion if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.AGENT_OPERATIONS, operation="agent_deleted", resource_type="agent", resource_id=str(agent_id), success=True, metadata={ "agent_name": agent_name, "session_id": str(session_id), "force": force, "graceful_termination": termination_success, "execution_duration_ms": execution_duration, "timeout_seconds": timeout_seconds, }, ) # Return comprehensive success result return { "success": True, "agent_id": str(agent_id), "agent_name": agent_name, "session_id": str(session_id), "cleanup_summary": { "graceful_termination": termination_success, "process_terminated": True, "iterm_tab_closed": True, "state_deleted": True, "resources_freed": True, }, "resources_freed": { "memory_mb": agent_info.allocated_memory_mb, "cpu_percent": agent_info.allocated_cpu_percent, }, "force": force, "execution_duration_ms": execution_duration, "deleted_at": datetime.utcnow().isoformat(), } except Exception as e: # Calculate execution time for failure execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics for failure self._update_tool_performance( "delete_agent", execution_duration, success=False ) # Log deletion failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.AGENT_OPERATIONS, operation="agent_deletion_failed", resource_type="agent_deletion_request", resource_id=operation_id, success=False, error_message=str(e), metadata={ "agent_name": agent_name, "force": force, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) # Report error to user if ctx: await ctx.error(f"Agent deletion failed: {str(e)}") # Return failure result return { "success": False, "error": str(e), "error_type": type(e).__name__, "agent_name": agent_name, "force": force, "execution_duration_ms": execution_duration, "partial_cleanup": self._assess_partial_cleanup(agent_name), } async def _is_process_running(self, process_id: int) -> bool: """Check if a process is still running.""" try: import psutil return psutil.pid_exists(process_id) except Exception: # Fallback to OS check import subprocess result = subprocess.run( ["ps", "-p", str(process_id)], capture_output=True, text=True ) return result.returncode == 0 async def _force_terminate_process(self, process_id: int) -> None: """Force terminate a process.""" try: import os import signal os.kill(process_id, signal.SIGKILL) except ProcessLookupError: # Process already terminated pass except Exception as e: raise OperationError(f"Failed to force terminate process: {e}") def _assess_partial_cleanup(self, agent_name: str) -> Dict[str, bool]: """Assess what cleanup operations may have partially completed.""" # This would check various cleanup states return { "process_check_attempted": True, "iterm_cleanup_attempted": True, "state_cleanup_attempted": True, "manual_cleanup_required": True, } # Additional tool implementations would follow similar patterns... # For brevity, I'll include placeholders for the remaining tools async def create_session( self, root_path: str, session_name: str, security_level: str = "HIGH", ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Create new development session tied to specific codebase. Creates a secure development session with filesystem boundaries, Git integration, and encrypted state storage. Establishes security context for all agents in session. Security: - Validates root_path accessibility and permissions - Establishes filesystem boundaries for session isolation - Creates encrypted state storage for persistence - Prevents path traversal and injection attacks - Enforces security level throughout session lifecycle Process: 1. Validate and sanitize all inputs 2. Check root_path exists and is accessible 3. Verify session name uniqueness 4. Create session directory structure if needed 5. Initialize Git integration and project analysis 6. Establish security context and file boundaries 7. Create encrypted session state storage 8. Initialize task file monitoring system 9. Register session in global state manager 10. Return comprehensive creation result Args: root_path: Absolute path to codebase root directory session_name: Human-readable session name (unique) security_level: Security level - HIGH (default), MEDIUM, or LOW ctx: FastMCP context for progress reporting Returns: Dict containing: - success: Whether session was created - session_id: Unique session identifier - session_name: Sanitized session name - root_path: Validated root path - git_integrated: Whether Git integration was enabled - task_monitoring_enabled: Whether task monitoring is active - security_fingerprint: Security context fingerprint - warnings: Any non-fatal issues encountered - error: Error message if creation failed Raises: No exceptions - all errors returned in response dict """ execution_start = time.time() warnings = [] try: # Progress reporting if ctx: await ctx.report_progress(0, 100, f"Creating session '{session_name}'") await ctx.info(f"Validating root path: {root_path}") # Phase 1: Input validation and sanitization if ctx: await ctx.report_progress(10, 100, "Validating inputs") # Validate root_path try: root_path_obj = Path(root_path).resolve() except Exception as e: return { "success": False, "error": f"Invalid root path: {str(e)}", "error_type": "VALIDATION_ERROR", } if not root_path_obj.is_absolute(): return { "success": False, "error": "Root path must be absolute", "error_type": "VALIDATION_ERROR", } if not root_path_obj.exists(): return { "success": False, "error": f"Root path does not exist: {root_path}", "error_type": "PATH_NOT_FOUND", } if not root_path_obj.is_dir(): return { "success": False, "error": f"Root path is not a directory: {root_path}", "error_type": "INVALID_PATH", } # Validate session name sanitized_name = sanitize_user_input(session_name) if not sanitized_name or len(sanitized_name.strip()) == 0: return { "success": False, "error": "Session name cannot be empty", "error_type": "VALIDATION_ERROR", } if len(sanitized_name) > 100: return { "success": False, "error": f"Session name too long: {len(sanitized_name)} > 100", "error_type": "VALIDATION_ERROR", } # Validate security level try: sec_level = SecurityLevel[security_level.upper()] except KeyError: return { "success": False, "error": f"Invalid security level: {security_level}. Must be HIGH, MEDIUM, or LOW", "error_type": "VALIDATION_ERROR", } # Phase 2: Check system capacity if ctx: await ctx.report_progress(20, 100, "Checking system capacity") current_session_count = len(self.session_manager.sessions) if current_session_count >= self.session_manager.max_sessions: return { "success": False, "error": f"Maximum session limit reached: {self.session_manager.max_sessions}", "error_type": "CAPACITY_ERROR", } # Phase 3: Check session name uniqueness if ctx: await ctx.report_progress(30, 100, "Verifying session uniqueness") if any( session.name == sanitized_name for session in self.session_manager.sessions.values() ): return { "success": False, "error": f"Session name already exists: {sanitized_name}", "error_type": "DUPLICATE_SESSION", } # Phase 4: Create session via SessionManager if ctx: await ctx.report_progress( 50, 100, "Creating session with security boundaries" ) await ctx.info("Initializing Git integration and task monitoring...") try: # Create session with comprehensive setup result = await self.session_manager.create_session( root_path=root_path_obj, session_name=sanitized_name, security_level=sec_level, max_agents=8, # Default max agents per session auto_git_integration=True, enable_task_monitoring=True, custom_config={ "created_via": "mcp_tool", "mcp_context": ctx is not None, }, ) if not result.success: return { "success": False, "error": result.message, "error_type": "SESSION_CREATION_ERROR", "warnings": result.warnings, } # Add any warnings from session creation warnings.extend(result.warnings) except Exception as e: error_msg = str(e) self.logger.error(f"Session creation failed: {error_msg}") return { "success": False, "error": f"Failed to create session: {error_msg}", "error_type": "INTERNAL_ERROR", } # Phase 5: Complete session setup if ctx: await ctx.report_progress(90, 100, "Finalizing session configuration") # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "create_session", execution_duration, success=True ) # Log successful session creation if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.SESSION_OPERATIONS, operation="session_created", resource_type="session", resource_id=str(result.session_id), success=True, metadata={ "session_name": sanitized_name, "root_path": str(root_path_obj), "security_level": security_level, "git_integrated": result.git_integrated, "task_monitoring_enabled": result.task_monitoring_enabled, "execution_duration_ms": execution_duration, "warnings_count": len(warnings), }, ) # Phase 6: Return success result if ctx: await ctx.report_progress(100, 100, "Session created successfully") await ctx.info(f"Session '{sanitized_name}' ready at {root_path_obj}") return { "success": True, "session_id": str(result.session_id), "session_name": sanitized_name, "root_path": str(root_path_obj), "git_integrated": result.git_integrated, "task_monitoring_enabled": result.task_monitoring_enabled, "security_fingerprint": result.security_fingerprint, "security_level": security_level, "max_agents": 8, "execution_duration_ms": execution_duration, "warnings": warnings, "message": f"Session '{sanitized_name}' created successfully", } except Exception as e: # Catch-all for unexpected errors error_msg = f"Unexpected error during session creation: {str(e)}" self.logger.error(error_msg, exc_info=True) # Update failure statistics self._update_tool_performance("create_session", 0, success=False) # Log failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.SESSION_OPERATIONS, operation="session_creation_failed", resource_type="session", success=False, metadata={ "session_name": session_name, "root_path": root_path, "error": error_msg, }, ) return { "success": False, "error": error_msg, "error_type": "UNEXPECTED_ERROR", } @require(lambda self, *args, **kwargs: True) # No preconditions for status queries @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def get_session_status( self, session_id: Optional[str] = None, include_metrics: bool = True, include_health: bool = True, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Get comprehensive status of session(s) and their agents. Provides real-time monitoring data for sessions and agents including resource usage, health status, and operational metrics. Contracts: Preconditions: - session_id must be valid if provided - Caller must have monitoring permissions Postconditions: - Returns complete status for requested session(s) - All agent statuses aggregated correctly - Resource metrics included if requested - Health status evaluated if requested Invariants: - Status data is consistent across all managers - No sensitive information exposed - Performance impact minimized Security Implementation: - Access Control: Verify monitoring permissions - Data Filtering: Only expose authorized information - Rate Limiting: Prevent status query abuse - Audit Trail: Log all status queries Args: session_id: Specific session ID to query (None for all sessions) include_metrics: Include resource usage metrics include_health: Include health check results ctx: FastMCP context for progress reporting Returns: Comprehensive status report with session and agent details Raises: ValidationError: Invalid session ID format SecurityError: Insufficient monitoring permissions OperationError: Status collection failed """ execution_start = time.time() try: if ctx: if session_id: await ctx.info(f"Getting status for session {session_id}") else: await ctx.info("Getting status for all sessions") await ctx.report_progress(5, 100, "Initializing status collection") # Phase 1: Input Validation if session_id: # Validate session ID format if provided try: validated_session_id = SessionId(session_id) except Exception as e: raise ValidationError(f"Invalid session ID format: {e}") else: validated_session_id = None # Phase 2: Session Discovery if ctx: await ctx.report_progress(15, 100, "Discovering sessions") if validated_session_id: # Get specific session session_state = await self.session_manager.get_session_state( validated_session_id, SecurityContext() ) if not session_state: raise ValidationError(f"Session {session_id} not found") sessions_to_query = [session_state] else: # Get all sessions all_sessions = await self.session_manager.get_all_sessions( SecurityContext() ) sessions_to_query = list(all_sessions.values()) # Phase 3: Status Collection if ctx: await ctx.report_progress( 30, 100, f"Collecting status for {len(sessions_to_query)} session(s)", ) session_statuses = [] total_agents = 0 for i, session in enumerate(sessions_to_query): if ctx: progress = 30 + int((i / len(sessions_to_query)) * 50) await ctx.report_progress( progress, 100, f"Processing session {session.name}" ) # Get agents for this session agents = await self.agent_manager.get_agents_by_session( session.session_id, SecurityContext() ) # Collect agent statuses agent_statuses = [] for agent in agents: agent_status = await self._collect_agent_status( agent=agent, include_metrics=include_metrics, include_health=include_health, ) agent_statuses.append(agent_status) total_agents += 1 # Aggregate session metrics session_metrics = None if include_metrics: session_metrics = await self._aggregate_session_metrics( agent_statuses ) # Evaluate session health session_health = None if include_health: session_health = self._evaluate_session_health(agent_statuses) # Build session status session_status = { "session_id": str(session.session_id), "session_name": session.name, "root_path": str(session.root_path), "security_level": session.security_level.value, "created_at": ( session.created_at.isoformat() if hasattr(session, "created_at") else None ), "agent_count": len(agent_statuses), "max_agents": getattr(session, "max_agents", 8), "agents": agent_statuses, "session_metrics": session_metrics, "session_health": session_health, } session_statuses.append(session_status) # Phase 4: Global Aggregation if ctx: await ctx.report_progress(85, 100, "Aggregating global statistics") # Calculate global metrics global_metrics = { "total_sessions": len(session_statuses), "total_agents": total_agents, "active_agents": sum( 1 for session in session_statuses for agent in session["agents"] if agent.get("status") == "ACTIVE" ), "degraded_agents": sum( 1 for session in session_statuses for agent in session["agents"] if agent.get("status") == "DEGRADED" ), "failed_agents": sum( 1 for session in session_statuses for agent in session["agents"] if agent.get("status") == "FAILED" ), } if include_metrics: global_metrics.update( { "total_cpu_percent": sum( session.get("session_metrics", {}).get( "total_cpu_percent", 0 ) for session in session_statuses ), "total_memory_mb": sum( session.get("session_metrics", {}).get("total_memory_mb", 0) for session in session_statuses ), "total_file_descriptors": sum( session.get("session_metrics", {}).get( "total_file_descriptors", 0 ) for session in session_statuses ), } ) # Phase 5: Completion if ctx: await ctx.report_progress(100, 100, "Status collection complete") await ctx.info( f"Collected status for {len(session_statuses)} session(s) with {total_agents} agents" ) # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "get_session_status", execution_duration, success=True ) # Log successful status query if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.SESSION_MONITORING, operation="session_status_retrieved", resource_type="session_status", resource_id=session_id or "all_sessions", success=True, metadata={ "session_count": len(session_statuses), "total_agents": total_agents, "include_metrics": include_metrics, "include_health": include_health, "execution_duration_ms": execution_duration, }, ) # Return comprehensive status result = { "success": True, "query_timestamp": datetime.utcnow().isoformat(), "query_type": "single_session" if session_id else "all_sessions", "sessions": session_statuses, "global_metrics": global_metrics, "execution_duration_ms": execution_duration, "metadata": { "include_metrics": include_metrics, "include_health": include_health, "query_session_id": session_id, }, } # Add single session shortcut for convenience if session_id and len(session_statuses) == 1: result["session"] = session_statuses[0] return result except Exception as e: # Error handling and logging execution_duration = (time.time() - execution_start) * 1000 self._update_tool_performance( "get_session_status", execution_duration, success=False ) # Log status query failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.SESSION_MONITORING, operation="session_status_failed", resource_type="session_status", resource_id=session_id or "all_sessions", success=False, error_message=str(e), metadata={ "include_metrics": include_metrics, "include_health": include_health, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) if ctx: await ctx.error(f"Status collection failed: {str(e)}") return { "success": False, "error": str(e), "error_type": type(e).__name__, "query_timestamp": datetime.utcnow().isoformat(), "execution_duration_ms": execution_duration, "query_session_id": session_id, } @require( lambda self, session_id, *args, **kwargs: session_id and isinstance(session_id, str) ) @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def delete_session( self, session_id: str, cleanup_agents: bool = True, preserve_work: bool = True, force: bool = False, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Delete session with comprehensive cleanup and work preservation. Implements secure session deletion with cascade agent cleanup, work preservation, and comprehensive audit logging. Contracts: Preconditions: - session_id corresponds to existing, accessible session - User has permission to delete the session - System is in consistent state for deletion Postconditions: - Session and all agents completely removed - Work preserved if requested and possible - All resources cleaned up (processes, tabs, state) - Complete audit trail created Invariants: - No partial deletion states remain - All operations are logged with security context - System remains in consistent state Security Implementation: - Permission Validation: Verify session ownership/access - Safe Deletion Order: Agents before session state - Work Preservation: Secure backup of uncommitted changes - Audit Logging: Complete trail of deletion operations - Rollback Support: Recovery from partial deletion failures Args: session_id: Session identifier to delete cleanup_agents: Whether to delete all agents in session preserve_work: Whether to preserve uncommitted work force: Force deletion even with active operations ctx: FastMCP context for progress reporting Returns: Dict[str, Any]: Deletion result with comprehensive status: - success: Whether deletion completed successfully - session_id: ID of deleted session - agents_deleted: Number of agents removed - work_preserved: Whether work was successfully preserved - preservation_path: Path to preserved work (if applicable) - cleanup_summary: Details of cleanup operations - execution_duration_ms: Total operation time Raises: ValidationError: Invalid session ID or format SecurityError: Insufficient permissions for deletion OperationError: Session has critical operations (unless force=True) """ execution_start = time.time() operation_id = f"delete_session_{int(execution_start * 1000)}" try: # Import required modules from src.utils.cascade_deletion import CascadeDeletionOrchestrator from src.utils.work_preservation import WorkPreservationHandler from src.validators.session_deletion import ( SessionDeletionContext, SessionDeletionValidator, ) # Phase 1: Initial Validation and Setup if ctx: await ctx.info( f"Deleting session {session_id} (cleanup_agents={cleanup_agents}, preserve_work={preserve_work})" ) await ctx.report_progress(5, 100, "Validating session deletion request") # Initialize deletion components validator = SessionDeletionValidator() cascade_orchestrator = CascadeDeletionOrchestrator() work_handler = WorkPreservationHandler() # Validate session exists and is accessible session_state = await self.session_manager.get_session_state( session_id=session_id, security_context=SecurityContext() ) if not session_state: raise ValidationError(f"Session {session_id} not found") # Phase 2: Deletion Validation if ctx: await ctx.report_progress(15, 100, "Performing deletion safety checks") deletion_context = SessionDeletionContext( session_id=session_id, cleanup_agents=cleanup_agents, preserve_work=preserve_work, force=force, initiated_by="mcp_tool", security_context=SecurityContext(), ) validation_result = await validator.validate_session_deletion( session_id=session_id, context=deletion_context, cleanup_agents=cleanup_agents, preserve_work=preserve_work, force=force, ) if not validation_result.valid: raise OperationError( f"Session deletion validation failed: {validation_result.error_message}" ) # Phase 3: Work Preservation (if requested) preservation_result = None if preserve_work: if ctx: await ctx.report_progress(25, 100, "Preserving uncommitted work") try: preservation_result = await work_handler.preserve_session_work( session_state=session_state, include_git=True, include_files=True, include_metadata=True, ) if ctx and preservation_result.success: await ctx.info( f"Work preserved: {preservation_result.preserved_count} items" ) except Exception as e: if not force: raise OperationError(f"Work preservation failed: {str(e)}") else: if ctx: await ctx.warning( f"Work preservation failed (continuing due to force=True): {str(e)}" ) # Phase 4: Agent Cascade Deletion agents_deleted = 0 if cleanup_agents and session_state.agents: if ctx: await ctx.report_progress( 40, 100, f"Deleting {len(session_state.agents)} agents" ) # Get agent states for deletion ordering agent_states = [] for agent_id in session_state.agents: agent_state = await self.agent_manager.get_agent_state( agent_id=agent_id, security_context=SecurityContext() ) if agent_state: agent_states.append(agent_state) # Prepare cascade deletion order deletion_order = await cascade_orchestrator.prepare_cascade_deletion( session_state=session_state, agents=agent_states ) # Execute cascade deletion deletion_results = await cascade_orchestrator.execute_cascade_deletion( agent_order=deletion_order, timeout_seconds=30, force_termination=force, ) agents_deleted = len([r for r in deletion_results if r.success]) if agents_deleted < len(session_state.agents) and not force: failed_agents = [ r.agent_id for r in deletion_results if not r.success ] raise OperationError( f"Failed to delete {len(failed_agents)} agents: {failed_agents}. " f"Use force=True to override." ) # Phase 5: Session State Cleanup if ctx: await ctx.report_progress(70, 100, "Cleaning up session state") # Remove session from manager await self.session_manager.delete_session( session_id=session_id, force=force, security_context=SecurityContext() ) # Phase 6: Resource Cleanup if ctx: await ctx.report_progress(85, 100, "Performing final resource cleanup") # Cleanup any orphaned resources cleanup_summary = await cascade_orchestrator.cleanup_orphaned_resources( session_id=session_id ) # Phase 7: Completion and Audit if ctx: await ctx.report_progress( 95, 100, "Finalizing deletion and creating audit trail" ) execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "delete_session", execution_duration, success=True ) # Create audit log if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.SESSION_MANAGEMENT, operation="delete_session", details={ "session_id": session_id, "agents_deleted": agents_deleted, "work_preserved": preserve_work and preservation_result and preservation_result.success, "preservation_path": ( str(preservation_result.preservation_path) if preservation_result else None ), "execution_duration_ms": execution_duration, "cleanup_summary": cleanup_summary, }, ) if ctx: await ctx.report_progress(100, 100, "Session deletion complete") await ctx.info(f"Successfully deleted session {session_id}") return { "success": True, "session_id": session_id, "agents_deleted": agents_deleted, "work_preserved": preserve_work and preservation_result and preservation_result.success, "preservation_path": ( str(preservation_result.preservation_path) if preservation_result and preservation_result.preservation_path else None ), "preserved_items": ( preservation_result.preserved_count if preservation_result else 0 ), "cleanup_summary": cleanup_summary, "execution_duration_ms": execution_duration, "operation_id": operation_id, } except ValidationError as e: error_msg = f"Session deletion validation failed: {str(e)}" if ctx: await ctx.error(error_msg) self._update_tool_performance("delete_session", 0, success=False) if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.SESSION_MANAGEMENT, operation="delete_session", details={ "session_id": session_id, "error": str(e), "error_type": "VALIDATION_ERROR", }, ) return { "success": False, "session_id": session_id, "error": error_msg, "error_type": "VALIDATION_ERROR", } except OperationError as e: error_msg = f"Session deletion operation failed: {str(e)}" if ctx: await ctx.error(error_msg) self._update_tool_performance("delete_session", 0, success=False) if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.SESSION_MANAGEMENT, operation="delete_session", details={ "session_id": session_id, "error": str(e), "error_type": "OPERATION_ERROR", }, ) return { "success": False, "session_id": session_id, "error": error_msg, "error_type": "OPERATION_ERROR", } except Exception as e: error_msg = f"Unexpected error during session deletion: {str(e)}" if ctx: await ctx.error(error_msg) self._update_tool_performance("delete_session", 0, success=False) if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.SESSION_MANAGEMENT, operation="delete_session", details={ "session_id": session_id, "error": str(e), "error_type": "UNEXPECTED_ERROR", }, ) return { "success": False, "session_id": session_id, "error": error_msg, "error_type": "UNEXPECTED_ERROR", } @require(lambda self, agent_name, message, *args, **kwargs: agent_name and message) @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def send_message_to_agent( self, agent_name: str, message: str, prepend_adder: bool = True, wait_for_response: bool = False, timeout_seconds: int = 30, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Send message to specific agent with optional ADDER+ prepending. Implements secure message routing to target agents with comprehensive sanitization, ADDER+ prompt integration, and delivery confirmation. Contracts: Preconditions: - agent_name must be valid and agent must exist - message must pass sanitization checks - Caller must have permission to message agent Postconditions: - Message delivered to agent's iTerm2 tab - ADDER+ prompt prepended if requested - Audit trail created for message - Response returned if wait_for_response=True Invariants: - No injection attacks possible through messages - All messages are logged with security context - Agent state remains consistent Security Implementation: - Input Sanitization: Comprehensive message cleaning - Injection Prevention: Escape sequences and command blocking - Access Control: Verify messaging permissions - Audit Trail: Complete logging of all messages Args: agent_name: Target agent name (Agent_# format) message: Message content to send (will be sanitized) prepend_adder: Whether to prepend ADDER+ prompt wait_for_response: Whether to wait for agent response timeout_seconds: Timeout for response waiting ctx: FastMCP context for progress reporting Returns: MessageResult with delivery status and optional response Raises: ValidationError: Invalid agent name or message SecurityError: Message contains forbidden content OperationError: Message delivery failed TimeoutError: Response timeout exceeded """ execution_start = time.time() try: if ctx: await ctx.info(f"Sending message to agent {agent_name}") await ctx.report_progress(5, 100, "Validating agent name format") # Phase 1: Agent Name Validation import re agent_name_pattern = re.compile(r"^Agent_\d+$") if not agent_name_pattern.match(agent_name): raise ValidationError( f"Invalid agent name format. Expected 'Agent_#', got: {agent_name}" ) # Phase 2: Agent Location if ctx: await ctx.report_progress(15, 100, "Locating agent") agent_info = await self.agent_manager.find_agent_by_name( agent_name=agent_name, security_context=SecurityContext() ) if not agent_info: raise ValidationError(f"Agent {agent_name} not found") # Check agent status if agent_info.status.value != "ACTIVE": raise OperationError( f"Agent {agent_name} is not active (status: {agent_info.status.value})" ) # Phase 3: Message Sanitization if ctx: await ctx.report_progress(30, 100, "Sanitizing message") # Import message sanitization utilities from src.utils.message_sanitization import ( SanitizationLevel, create_sanitizer_for_security_level, ) # Create sanitizer based on session security level session_state = await self.session_manager.get_session_state( agent_info.session_id, SecurityContext() ) sanitizer = create_sanitizer_for_security_level( session_state.security_level if session_state else SecurityLevel.HIGH ) sanitized_message = sanitizer.sanitize(message) # Phase 4: ADDER+ Prompt Construction final_message = sanitized_message if prepend_adder: if ctx: await ctx.report_progress(45, 100, "Building ADDER+ prompt") # Import ADDER+ prompt builder from src.utils.adder_prompt_builder import build_adder_task_prompt final_message = build_adder_task_prompt( agent_name=agent_name, message=sanitized_message, session_id=str(agent_info.session_id), session_root=( session_state.root_path if session_state else Path("/tmp") ), specialization=agent_info.specialization, priority="MEDIUM", use_minimal=False, ) # Phase 5: Message Delivery if ctx: await ctx.report_progress(65, 100, "Delivering message to iTerm2") try: delivery_result = await self.iterm_manager.send_text( tab_id=agent_info.iterm_tab_id, text=final_message + "\n", security_context=SecurityContext(), ) if not delivery_result: raise OperationError("Message delivery to iTerm2 failed") except Exception as e: raise OperationError(f"Failed to deliver message via iTerm2: {e}") # Phase 6: Response Waiting (Optional) response = None if wait_for_response: if ctx: await ctx.report_progress( 80, 100, f"Waiting for response (timeout: {timeout_seconds}s)" ) response = await self._wait_for_agent_response( agent_id=agent_info.agent_id, timeout_seconds=timeout_seconds ) if ctx: await ctx.report_progress(100, 100, "Message sent successfully") await ctx.info(f"Message delivered to {agent_name}") # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "send_message_to_agent", execution_duration, success=True ) # Log message operation if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.AGENT_COMMUNICATION, operation="message_sent", resource_type="agent_message", resource_id=str(agent_info.agent_id), success=True, metadata={ "agent_name": agent_name, "message_length": len(message), "sanitized_message_length": len(sanitized_message), "prepend_adder": prepend_adder, "wait_for_response": wait_for_response, "execution_duration_ms": execution_duration, "response_received": response is not None, }, ) return { "success": True, "agent_name": agent_name, "message_delivered": True, "delivery_timestamp": datetime.utcnow().isoformat(), "prepend_adder": prepend_adder, "message_length": len(message), "sanitized_message_length": len(sanitized_message), "response": response if wait_for_response else None, "execution_duration_ms": execution_duration, } except Exception as e: # Error handling and logging execution_duration = (time.time() - execution_start) * 1000 self._update_tool_performance( "send_message_to_agent", execution_duration, success=False ) # Log message failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.AGENT_COMMUNICATION, operation="message_send_failed", resource_type="agent_message", success=False, error_message=str(e), metadata={ "agent_name": agent_name, "message_length": len(message), "prepend_adder": prepend_adder, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) if ctx: await ctx.error(f"Message delivery failed: {str(e)}") return { "success": False, "error": str(e), "error_type": type(e).__name__, "agent_name": agent_name, "execution_duration_ms": execution_duration, } @require( lambda self, agent_name, *args, **kwargs: agent_name and isinstance(agent_name, str) ) @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def clear_agent_conversation( self, agent_name: str, preserve_state: bool = True, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Clear agent conversation by closing current iTerm2 tab. Provides clean conversation management by gracefully terminating the current Claude Code session and optionally preserving agent state for restoration. Contracts: Preconditions: - agent_name must be valid and agent must exist - Agent must have an active conversation (iTerm tab) - System must be in consistent state Postconditions: - Agent's iTerm2 tab is closed - Claude Code process is terminated gracefully - Agent state is preserved if requested - Agent status updated to reflect conversation state Invariants: - No orphaned processes remain after clearing - Agent state remains consistent - All operations are logged Security Implementation: - Agent Validation: Verify agent ownership and access - Process Safety: Graceful termination with timeout - State Protection: Secure state preservation - Audit Trail: Complete logging of conversation operations Args: agent_name: Name of agent whose conversation to clear (Agent_# format) preserve_state: Whether to save current agent state before clearing ctx: FastMCP context for progress reporting Returns: Dict[str, Any]: Clearing result with comprehensive status: - success: Whether clearing completed successfully - agent_name: Name of affected agent - conversation_cleared: Whether conversation was cleared - state_preserved: Whether state was successfully preserved - tab_closed: Whether iTerm2 tab was closed - process_terminated: Whether Claude Code process ended - execution_duration_ms: Total operation time Raises: ValidationError: Invalid agent name or agent not found OperationError: Conversation clearing failed """ execution_start = time.time() operation_id = f"clear_conversation_{int(execution_start * 1000)}" try: # Phase 1: Initial Validation if ctx: await ctx.info(f"Clearing conversation for agent {agent_name}") await ctx.report_progress(5, 100, "Validating agent name and status") # Validate agent name format import re agent_name_pattern = re.compile(r"^Agent_\d+$") if not agent_name_pattern.match(agent_name): raise ValidationError( f"Invalid agent name format. Expected 'Agent_#', got: {agent_name}" ) # Phase 2: Agent Location and Status Check if ctx: await ctx.report_progress(15, 100, "Locating agent and checking status") # Find agent across all sessions agent_info = await self.agent_manager.find_agent_by_name( agent_name=agent_name, security_context=SecurityContext() ) if not agent_info: raise ValidationError(f"Agent {agent_name} not found in any session") # Check if agent has an active conversation if not hasattr(agent_info, "iterm_tab_id") or not agent_info.iterm_tab_id: return { "success": True, "agent_name": agent_name, "conversation_cleared": False, "message": "Agent has no active conversation to clear", "already_cleared": True, "execution_duration_ms": (time.time() - execution_start) * 1000, } # Phase 3: State Preservation (if requested) state_preserved = False preservation_path = None if preserve_state: if ctx: await ctx.report_progress(30, 100, "Preserving agent state") try: # Get current agent state agent_state = await self.agent_manager.get_agent_state( agent_id=agent_info.agent_id, security_context=SecurityContext() ) if agent_state: # Import state preservation utilities from src.utils.work_preservation import WorkPreservationHandler preservation_handler = WorkPreservationHandler() # Preserve conversation context preservation_result = ( await preservation_handler.preserve_agent_conversation( agent_state=agent_state, include_conversation_history=True, include_working_context=True, ) ) state_preserved = preservation_result.success preservation_path = preservation_result.preservation_path if ctx and state_preserved: await ctx.info( f"Agent state preserved: {preservation_result.preserved_count} items" ) except Exception as e: if ctx: await ctx.warning(f"State preservation failed: {str(e)}") # Continue with clearing even if preservation fails # Phase 4: Process Termination if ctx: await ctx.report_progress(50, 100, "Terminating Claude Code process") process_terminated = False try: # Send graceful exit command to Claude Code await self.iterm_manager.send_text( tab_id=agent_info.iterm_tab_id, text="/exit\n", security_context=SecurityContext(), ) # Wait for graceful termination termination_timeout = 10 # seconds elapsed = 0 while elapsed < termination_timeout: if hasattr(agent_info, "process_id") and agent_info.process_id: if not await self._is_process_running(agent_info.process_id): process_terminated = True break await asyncio.sleep(1) elapsed += 1 # Force termination if needed if ( not process_terminated and hasattr(agent_info, "process_id") and agent_info.process_id ): await self._force_terminate_process(agent_info.process_id) process_terminated = True except Exception as e: if ctx: await ctx.warning(f"Process termination warning: {str(e)}") # Continue with tab closing # Phase 5: iTerm2 Tab Closure if ctx: await ctx.report_progress(70, 100, "Closing iTerm2 tab") tab_closed = False try: await self.iterm_manager.close_tab( tab_id=agent_info.iterm_tab_id, security_context=SecurityContext() ) tab_closed = True except Exception as e: if ctx: await ctx.warning(f"Tab closure warning: {str(e)}") # Phase 6: Agent State Update if ctx: await ctx.report_progress(85, 100, "Updating agent status") try: # Update agent to reflect conversation cleared await self.agent_manager.update_agent_conversation_status( agent_id=agent_info.agent_id, has_active_conversation=False, iterm_tab_id=None, security_context=SecurityContext(), ) except Exception as e: if ctx: await ctx.warning(f"Agent state update warning: {str(e)}") # Phase 7: Completion if ctx: await ctx.report_progress(100, 100, "Conversation clearing complete") await ctx.info(f"Successfully cleared conversation for {agent_name}") # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "clear_agent_conversation", execution_duration, success=True ) # Log successful conversation clearing if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.AGENT_COMMUNICATION, operation="conversation_cleared", resource_type="agent_conversation", resource_id=str(agent_info.agent_id), success=True, metadata={ "agent_name": agent_name, "state_preserved": state_preserved, "preservation_path": ( str(preservation_path) if preservation_path else None ), "tab_closed": tab_closed, "process_terminated": process_terminated, "execution_duration_ms": execution_duration, }, ) return { "success": True, "agent_name": agent_name, "conversation_cleared": True, "state_preserved": state_preserved, "preservation_path": ( str(preservation_path) if preservation_path else None ), "tab_closed": tab_closed, "process_terminated": process_terminated, "execution_duration_ms": execution_duration, "operation_id": operation_id, "cleared_at": datetime.utcnow().isoformat(), } except Exception as e: # Error handling and logging execution_duration = (time.time() - execution_start) * 1000 self._update_tool_performance( "clear_agent_conversation", execution_duration, success=False ) # Log conversation clearing failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.AGENT_COMMUNICATION, operation="conversation_clear_failed", resource_type="agent_conversation", success=False, error_message=str(e), metadata={ "agent_name": agent_name, "preserve_state": preserve_state, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) if ctx: await ctx.error(f"Conversation clearing failed: {str(e)}") return { "success": False, "error": str(e), "error_type": type(e).__name__, "agent_name": agent_name, "execution_duration_ms": execution_duration, "operation_id": operation_id, } @require( lambda self, agent_name, *args, **kwargs: agent_name and isinstance(agent_name, str) ) @ensure( lambda result, *args, **kwargs: isinstance(result, dict) and "success" in result ) async def start_new_agent_conversation( self, agent_name: str, restore_context: bool = True, ctx: Optional[Context] = None, ) -> Dict[str, Any]: """ Start new conversation for existing agent by creating new iTerm2 tab. Creates a fresh Claude Code session for an existing agent while optionally restoring previous context and state for seamless conversation continuation. Contracts: Preconditions: - agent_name must be valid and agent must exist - Agent must not have an active conversation - System must have capacity for new conversation Postconditions: - New iTerm2 tab created for agent - Claude Code process spawned and initialized - ADDER+ prompt injected with agent context - Agent state updated with new conversation details - Context restored if requested and available Invariants: - Only one conversation per agent at any time - All conversation resources properly tracked - Agent state remains consistent Security Implementation: - Agent Validation: Verify agent ownership and access - Resource Limits: Enforce conversation limits per session - Context Security: Secure restoration of previous state - Audit Trail: Complete logging of conversation operations Args: agent_name: Name of agent to start conversation for (Agent_# format) restore_context: Whether to restore previous conversation context ctx: FastMCP context for progress reporting Returns: Dict[str, Any]: Start result with comprehensive status: - success: Whether conversation start completed successfully - agent_name: Name of affected agent - conversation_started: Whether new conversation was created - tab_id: New iTerm2 tab identifier - process_id: New Claude Code process identifier - context_restored: Whether previous context was restored - adder_prompt_injected: Whether ADDER+ prompt was successful - execution_duration_ms: Total operation time Raises: ValidationError: Invalid agent name or agent not found OperationError: Conversation start failed or agent busy """ execution_start = time.time() operation_id = f"start_conversation_{int(execution_start * 1000)}" try: # Phase 1: Initial Validation if ctx: await ctx.info(f"Starting new conversation for agent {agent_name}") await ctx.report_progress(5, 100, "Validating agent name and status") # Validate agent name format import re agent_name_pattern = re.compile(r"^Agent_\d+$") if not agent_name_pattern.match(agent_name): raise ValidationError( f"Invalid agent name format. Expected 'Agent_#', got: {agent_name}" ) # Phase 2: Agent Location and Status Check if ctx: await ctx.report_progress( 15, 100, "Locating agent and checking availability" ) # Find agent across all sessions agent_info = await self.agent_manager.find_agent_by_name( agent_name=agent_name, security_context=SecurityContext() ) if not agent_info: raise ValidationError(f"Agent {agent_name} not found in any session") # Check if agent already has an active conversation if hasattr(agent_info, "iterm_tab_id") and agent_info.iterm_tab_id: raise OperationError( f"Agent {agent_name} already has an active conversation. " f"Clear existing conversation first." ) # Get session information for context session_state = await self.session_manager.get_session_state( agent_info.session_id, SecurityContext() ) if not session_state: raise OperationError(f"Session for agent {agent_name} not found") # Phase 3: Context Restoration Preparation restored_context = None context_restored = False if restore_context: if ctx: await ctx.report_progress(25, 100, "Preparing context restoration") try: # Import state preservation utilities from src.utils.work_preservation import WorkPreservationHandler preservation_handler = WorkPreservationHandler() # Look for preserved context restoration_result = ( await preservation_handler.restore_agent_conversation( agent_id=agent_info.agent_id, session_root=session_state.root_path, ) ) if restoration_result.success: restored_context = restoration_result.restored_context context_restored = True if ctx: await ctx.info( f"Context restored: {restoration_result.restored_count} items" ) except Exception as e: if ctx: await ctx.warning(f"Context restoration failed: {str(e)}") # Continue without context restoration # Phase 4: iTerm2 Tab Creation if ctx: await ctx.report_progress(40, 100, "Creating new iTerm2 tab") try: # Create new tab in session window new_tab_id = await self.iterm_manager.create_tab( agent_id=agent_info.agent_id, session_id=agent_info.session_id, working_directory=session_state.root_path, security_context=SecurityContext(), ) if not new_tab_id: raise OperationError("Failed to create new iTerm2 tab") except Exception as e: raise OperationError(f"iTerm2 tab creation failed: {str(e)}") # Phase 5: Claude Code Process Spawning if ctx: await ctx.report_progress(55, 100, "Spawning Claude Code process") try: # Get agent configuration for Claude Code agent_state = await self.agent_manager.get_agent_state( agent_id=agent_info.agent_id, security_context=SecurityContext() ) # Build Claude Code activation command claude_config = getattr(agent_state, "claude_config", None) activation_command = f"cd {session_state.root_path} && claude" if claude_config: if getattr(claude_config, "model", "sonnet-3.5") != "sonnet-3.5": activation_command += f" --model {claude_config.model}" if getattr(claude_config, "no_color", False): activation_command += " --no-color" # Send activation command to new tab await self.iterm_manager.send_text( tab_id=new_tab_id, text=activation_command + "\n", security_context=SecurityContext(), ) # Wait for Claude Code to initialize await asyncio.sleep(3) except Exception as e: # Cleanup tab on failure try: await self.iterm_manager.close_tab(new_tab_id, SecurityContext()) except: pass raise OperationError(f"Claude Code process spawn failed: {str(e)}") # Phase 6: Context and ADDER+ Prompt Injection if ctx: await ctx.report_progress( 70, 100, "Injecting ADDER+ prompt and context" ) adder_prompt_injected = False try: # Build ADDER+ prompt with agent context specialization = getattr(agent_state, "specialization", None) system_prompt_suffix = getattr(agent_state, "system_prompt_suffix", "") adder_prompt = self._build_adder_prompt( agent_name=agent_name, specialization=specialization, system_prompt_suffix=system_prompt_suffix, session_root_path=session_state.root_path, ) # Add restored context if available if restored_context: context_prompt = ( f"\n\n**Restored Context:**\n{restored_context}\n\n" ) adder_prompt += context_prompt # Send ADDER+ prompt to new conversation await self.iterm_manager.send_text( tab_id=new_tab_id, text=adder_prompt + "\n", security_context=SecurityContext(), ) adder_prompt_injected = True # Wait for prompt processing await asyncio.sleep(2) except Exception as e: if ctx: await ctx.warning(f"ADDER+ prompt injection warning: {str(e)}") # Continue - conversation can still be used manually # Phase 7: Agent State Update if ctx: await ctx.report_progress(85, 100, "Updating agent conversation status") new_process_id = None try: # Get new process ID (placeholder - would need iTerm2 process tracking) new_process_id = await self.iterm_manager.get_tab_process_id( new_tab_id, SecurityContext() ) # Update agent with new conversation details await self.agent_manager.update_agent_conversation_status( agent_id=agent_info.agent_id, has_active_conversation=True, iterm_tab_id=new_tab_id, process_id=new_process_id, security_context=SecurityContext(), ) except Exception as e: if ctx: await ctx.warning(f"Agent state update warning: {str(e)}") # Phase 8: Completion if ctx: await ctx.report_progress( 100, 100, "New conversation started successfully" ) await ctx.info(f"New conversation ready for {agent_name}") # Calculate execution time execution_duration = (time.time() - execution_start) * 1000 # Update performance statistics self._update_tool_performance( "start_new_agent_conversation", execution_duration, success=True ) # Log successful conversation start if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.INFO, category=AuditCategory.AGENT_COMMUNICATION, operation="conversation_started", resource_type="agent_conversation", resource_id=str(agent_info.agent_id), success=True, metadata={ "agent_name": agent_name, "new_tab_id": new_tab_id, "new_process_id": new_process_id, "context_restored": context_restored, "adder_prompt_injected": adder_prompt_injected, "execution_duration_ms": execution_duration, }, ) return { "success": True, "agent_name": agent_name, "conversation_started": True, "tab_id": new_tab_id, "process_id": new_process_id, "context_restored": context_restored, "adder_prompt_injected": adder_prompt_injected, "session_id": str(agent_info.session_id), "working_directory": str(session_state.root_path), "execution_duration_ms": execution_duration, "operation_id": operation_id, "started_at": datetime.utcnow().isoformat(), } except Exception as e: # Error handling and logging execution_duration = (time.time() - execution_start) * 1000 self._update_tool_performance( "start_new_agent_conversation", execution_duration, success=False ) # Log conversation start failure if self._audit_logger: await self._audit_logger.log_event( level=AuditLevel.ERROR, category=AuditCategory.AGENT_COMMUNICATION, operation="conversation_start_failed", resource_type="agent_conversation", success=False, error_message=str(e), metadata={ "agent_name": agent_name, "restore_context": restore_context, "execution_duration_ms": execution_duration, "error_type": type(e).__name__, }, ) if ctx: await ctx.error(f"Conversation start failed: {str(e)}") return { "success": False, "error": str(e), "error_type": type(e).__name__, "agent_name": agent_name, "execution_duration_ms": execution_duration, "operation_id": operation_id, } # Helper methods def _build_adder_prompt( self, agent_name: str, specialization: Optional[AgentSpecialization], system_prompt_suffix: str, session_root_path: Path, ) -> str: """ Build complete ADDER+ system prompt with agent name injection. Args: agent_name: Agent name to inject into prompt specialization: Agent specialization for context system_prompt_suffix: Additional prompt content session_root_path: Session root path for context Returns: str: Complete ADDER+ prompt with agent context """ # Build base ADDER+ prompt (this would load from actual prompt document) base_prompt = f"""You are {agent_name} # ELITE CODE AGENT: ADDER+ (Advanced Development, Documentation & Error Resolution) <role_specification> You are an elite AI development agent with 15+ years of enterprise software architecture experience, specializing in autonomous task management and advanced programming synthesis for multi-agent collaboration. Your agent name is {agent_name} - use this for all task assignments, progress tracking, and communication. **Core Expertise:** - **Enterprise Architecture**: Microservices, event-driven architectures, distributed systems with systematic design pattern application - **Autonomous Task Management**: TODO.md-driven execution with real-time progress tracking and dynamic task creation - **Advanced Programming Synthesis**: Design by Contract + defensive programming + type-driven development + property-based testing + functional programming - **Systematic Error Resolution**: Root Cause Analysis frameworks with automatic task generation and comprehensive tracking - **Documentation Excellence**: Real-time technical documentation with context-aware folder documentation and architectural decision recording </role_specification> **Session Context:** - **Session Root**: {session_root_path} - **Agent Name**: {agent_name} - **Specialization**: {specialization.value if specialization else "GENERAL"} {system_prompt_suffix} '{session_root_path}' """ return base_prompt def _update_tool_performance( self, tool_name: str, duration_ms: float, success: bool ) -> None: """Update performance statistics for tool execution.""" if tool_name in self._tool_execution_stats: stats = self._tool_execution_stats[tool_name] stats["total_executions"] += 1 if success: stats["successful_executions"] += 1 else: stats["failed_executions"] += 1 # Update average duration (exponential moving average) current_avg = stats["avg_duration_ms"] stats["avg_duration_ms"] = (current_avg * 0.9) + (duration_ms * 0.1) def get_tool_performance_summary(self) -> Dict[str, Any]: """Get performance summary for all tools.""" return { "tools": self._tool_execution_stats, "summary": { "total_tools": len(self._tool_execution_stats), "total_executions": sum( stats["total_executions"] for stats in self._tool_execution_stats.values() ), "overall_success_rate": self._calculate_overall_success_rate(), }, } def _calculate_overall_success_rate(self) -> float: """Calculate overall success rate across all tools.""" total_executions = sum( stats["total_executions"] for stats in self._tool_execution_stats.values() ) total_successes = sum( stats["successful_executions"] for stats in self._tool_execution_stats.values() ) return ( (total_successes / total_executions * 100) if total_executions > 0 else 0.0 ) async def _wait_for_agent_response( self, agent_id: AgentId, timeout_seconds: int ) -> Optional[str]: """ Wait for agent response with timeout. This is a placeholder implementation that would integrate with Claude Code output monitoring in a full implementation. Args: agent_id: Agent ID to wait for response from timeout_seconds: Maximum time to wait Returns: Agent response text if received, None if timeout """ # TODO: Implement actual response monitoring # This would integrate with iTerm2 output monitoring # and Claude Code response parsing await asyncio.sleep(min(2, timeout_seconds)) # Simulate waiting return None # Placeholder - no actual response monitoring yet async def _collect_agent_status( self, agent, include_metrics: bool, include_health: bool ) -> Dict[str, Any]: """ Collect comprehensive status for a single agent. Args: agent: Agent state object include_metrics: Whether to include resource metrics include_health: Whether to include health check results Returns: Dictionary with agent status information """ base_status = { "agent_id": str(agent.agent_id), "agent_name": getattr(agent, "name", "unknown"), "specialization": ( getattr(agent, "specialization", {}).get("value", "GENERAL") if hasattr(agent, "specialization") else "GENERAL" ), "status": ( getattr(agent, "status", {}).get("value", "UNKNOWN") if hasattr(agent, "status") else "UNKNOWN" ), "created_at": ( getattr(agent, "created_at", datetime.utcnow()).isoformat() if hasattr(agent, "created_at") else datetime.utcnow().isoformat() ), "iterm_tab_id": getattr(agent, "iterm_tab_id", "unknown"), "process_id": getattr(agent, "process_id", 0), } if include_metrics: try: # Get resource metrics (placeholder implementation) metrics = { "cpu_percent": 5.2, # TODO: Get real metrics "memory_mb": 128.5, # TODO: Get real metrics "file_descriptors": 25, # TODO: Get real metrics "thread_count": 12, # TODO: Get real metrics } base_status["metrics"] = metrics except Exception: # Fallback for metrics collection errors base_status["metrics"] = { "cpu_percent": 0.0, "memory_mb": 0.0, "file_descriptors": 0, "thread_count": 0, "metrics_error": "Unable to collect metrics", } if include_health: try: # Get health status (placeholder implementation) health = { "status": "HEALTHY", # TODO: Get real health status "last_check": datetime.utcnow().isoformat(), "check_results": { "process_running": True, "iterm_responsive": True, "claude_responsive": True, }, } base_status["health"] = health except Exception: # Fallback for health check errors base_status["health"] = { "status": "UNKNOWN", "last_check": datetime.utcnow().isoformat(), "check_results": {}, "health_error": "Unable to perform health check", } return base_status async def _aggregate_session_metrics( self, agent_statuses: List[Dict[str, Any]] ) -> Dict[str, Any]: """ Aggregate metrics across all agents in session. Args: agent_statuses: List of agent status dictionaries Returns: Dictionary with aggregated session metrics """ if not agent_statuses: return { "total_cpu_percent": 0.0, "total_memory_mb": 0.0, "total_file_descriptors": 0, "active_agents": 0, "degraded_agents": 0, "failed_agents": 0, "unknown_agents": 0, } metrics = { "total_cpu_percent": sum( agent.get("metrics", {}).get("cpu_percent", 0) for agent in agent_statuses ), "total_memory_mb": sum( agent.get("metrics", {}).get("memory_mb", 0) for agent in agent_statuses ), "total_file_descriptors": sum( agent.get("metrics", {}).get("file_descriptors", 0) for agent in agent_statuses ), "total_thread_count": sum( agent.get("metrics", {}).get("thread_count", 0) for agent in agent_statuses ), "active_agents": sum( 1 for agent in agent_statuses if agent.get("status") == "ACTIVE" ), "degraded_agents": sum( 1 for agent in agent_statuses if agent.get("status") == "DEGRADED" ), "failed_agents": sum( 1 for agent in agent_statuses if agent.get("status") == "FAILED" ), "unknown_agents": sum( 1 for agent in agent_statuses if agent.get("status") == "UNKNOWN" ), "average_cpu_percent": 0.0, "average_memory_mb": 0.0, } # Calculate averages if we have agents agent_count = len(agent_statuses) if agent_count > 0: metrics["average_cpu_percent"] = metrics["total_cpu_percent"] / agent_count metrics["average_memory_mb"] = metrics["total_memory_mb"] / agent_count return metrics def _evaluate_session_health(self, agent_statuses: List[Dict[str, Any]]) -> str: """ Evaluate overall session health based on agent statuses. Args: agent_statuses: List of agent status dictionaries Returns: String indicating overall session health """ if not agent_statuses: return "EMPTY" total_agents = len(agent_statuses) failed_count = sum( 1 for agent in agent_statuses if agent.get("status") == "FAILED" ) degraded_count = sum( 1 for agent in agent_statuses if agent.get("status") == "DEGRADED" ) active_count = sum( 1 for agent in agent_statuses if agent.get("status") == "ACTIVE" ) # Health evaluation logic if failed_count > total_agents * 0.5: return "CRITICAL" elif failed_count > 0 or degraded_count > total_agents * 0.3: return "DEGRADED" elif active_count == total_agents: return "HEALTHY" elif active_count > total_agents * 0.8: return "MOSTLY_HEALTHY" else: return "UNKNOWN" # Export MCP tools __all__ = ["AgentOrchestrationTools"]

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Nexus-Digital-Automations/Claude_Code_MCP_2'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

mcp_tools.py•116 KiB