Medical GraphRAG Assistant

streamlit_app.py•91.6 KiB

#!/usr/bin/env python3 """ Agentic Medical Chat with Tool Use Claude calls MCP tools autonomously based on user questions """ import streamlit as st import asyncio import json import subprocess import os import sys import plotly.graph_objects as go # Interactive graph visualization try: from streamlit_agraph import agraph, Node, Edge, Config AGRAPH_AVAILABLE = True except ImportError: AGRAPH_AVAILABLE = False print("Warning: streamlit-agraph not available, using static graphs", file=sys.stderr) # Load .env file if present try: from dotenv import load_dotenv # Look for .env in parent directory (project root) env_path = os.path.join(os.path.dirname(__file__), '..', '.env') if os.path.exists(env_path): load_dotenv(env_path) except ImportError: pass # python-dotenv not installed # OpenAI support try: from openai import OpenAI OPENAI_AVAILABLE = True except ImportError: OPENAI_AVAILABLE = False # DICOM support try: import pydicom from PIL import Image import numpy as np DICOM_AVAILABLE = True except ImportError: DICOM_AVAILABLE = False # Add parent directory to sys.path for src module imports parent_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), '..')) if parent_dir not in sys.path: sys.path.insert(0, parent_dir) from fhir_graphrag_mcp_server import call_tool # ============================================================================ # Data Models for GraphRAG Details Panel (Feature 005) # ============================================================================ from dataclasses import dataclass, field from typing import List, Optional, Any from enum import Enum from datetime import datetime class EntityType(Enum): """Category of medical entity.""" SYMPTOM = "symptom" CONDITION = "condition" MEDICATION = "medication" PROCEDURE = "procedure" ANATOMY = "anatomy" LAB_RESULT = "lab_result" VITAL_SIGN = "vital_sign" OTHER = "other" class ExecutionStatus(Enum): """Status of tool execution.""" SUCCESS = "success" FAILED = "failed" TIMEOUT = "timeout" SKIPPED = "skipped" @dataclass class SourceReference: """Reference to source document for an entity.""" document_id: str document_type: str = "" excerpt: str = "" @dataclass class DisplayEntity: """Represents a medical entity extracted from GraphRAG results for display.""" id: str name: str type: EntityType score: float = 0.0 sources: List[SourceReference] = field(default_factory=list) context: str = "" @dataclass class DisplayRelationship: """Represents a connection between two entities.""" id: str source_id: str target_id: str relationship_type: str strength: float = 0.5 @dataclass class ToolExecution: """Record of a tool invocation during response generation.""" id: str tool_name: str start_time: datetime duration_ms: int status: ExecutionStatus parameters: dict = field(default_factory=dict) result_summary: str = "" error_message: str = "" @dataclass class DetailsPanel: """Aggregate structure containing all details panel data.""" entities: List[DisplayEntity] = field(default_factory=list) relationships: List[DisplayRelationship] = field(default_factory=list) tool_executions: List[ToolExecution] = field(default_factory=list) total_entity_count: int = 0 is_truncated: bool = False query_text: str = "" response_time_ms: int = 0 # ============================================================================ # Data Extraction Functions for Details Panel # ============================================================================ def _map_entity_type(type_str: str) -> EntityType: """Map a string entity type to EntityType enum.""" type_lower = type_str.lower() if type_str else "other" type_mapping = { "symptom": EntityType.SYMPTOM, "condition": EntityType.CONDITION, "medication": EntityType.MEDICATION, "drug": EntityType.MEDICATION, "procedure": EntityType.PROCEDURE, "anatomy": EntityType.ANATOMY, "body_part": EntityType.ANATOMY, "lab_result": EntityType.LAB_RESULT, "lab": EntityType.LAB_RESULT, "vital_sign": EntityType.VITAL_SIGN, "vital": EntityType.VITAL_SIGN, } return type_mapping.get(type_lower, EntityType.OTHER) def extract_entities_from_results(tool_results: List[dict]) -> List[DisplayEntity]: """ Extract entities from tool results for display. Parses entities from search_knowledge_graph, hybrid_search, and visualize_graphrag_results tool outputs. NOTE: As of v2.16.0, the backend search_knowledge_graph tool now returns complete entity objects (including entities discovered via relationships). This function still handles legacy responses and other tools. Args: tool_results: List of tool call results from the AI response Returns: List of DisplayEntity objects sorted by score descending """ entities = [] seen_ids = set() for result in tool_results: tool_name = result.get("tool_name", "") result_data = result.get("result", {}) # Handle string result data (JSON) if isinstance(result_data, str): try: result_data = json.loads(result_data) except json.JSONDecodeError: continue # Extract from search_knowledge_graph if tool_name == "search_knowledge_graph": for entity_data in result_data.get("entities", []): # Handle both 'name' and 'text' field names entity_name = entity_data.get("name") or entity_data.get("text", "Unknown") entity_id = str(entity_data.get("id", hash(entity_name))) if entity_id in seen_ids: continue seen_ids.add(entity_id) # Handle both 'score', 'relevance', and 'confidence' field names score = entity_data.get("score") or entity_data.get("confidence") or entity_data.get("relevance", 0.0) # Check if this is a direct match or discovered via relationship (v2.16.0+) entity_source = entity_data.get("source", "direct_match") entities.append(DisplayEntity( id=entity_id, name=entity_name, type=_map_entity_type(entity_data.get("type", "other")), score=float(score) if score else 0.0, context=entity_data.get("context", "")[:500] if entity_data.get("context") else entity_source, sources=[SourceReference( document_id=src.get("doc_id", ""), document_type=src.get("doc_type", ""), excerpt=src.get("excerpt", "")[:200] ) for src in entity_data.get("sources", [])[:10]] )) # LEGACY FALLBACK: Extract entities from relationships if backend doesn't include them # This handles older backend versions that don't include related entities in the entities list for rel_data in result_data.get("relationships", []): # Extract source entity from relationship src_id = str(rel_data.get("source_id", "")) src_text = rel_data.get("source_text", "") if src_id and src_text and src_id not in seen_ids: seen_ids.add(src_id) entities.append(DisplayEntity( id=src_id, name=src_text, type=EntityType.OTHER, # Type not available in legacy relationship data score=0.4 # Lower score since it's a related entity, not a direct match )) # Extract target entity from relationship tgt_id = str(rel_data.get("target_id", "")) tgt_text = rel_data.get("target_text", "") if tgt_id and tgt_text and tgt_id not in seen_ids: seen_ids.add(tgt_id) entities.append(DisplayEntity( id=tgt_id, name=tgt_text, type=EntityType.OTHER, score=0.4 )) # Extract from hybrid_search elif tool_name == "hybrid_search": # Hybrid search may include entity matches for entity_data in result_data.get("entity_matches", []): entity_id = str(entity_data.get("id", hash(entity_data.get("name", "")))) if entity_id in seen_ids: continue seen_ids.add(entity_id) entities.append(DisplayEntity( id=entity_id, name=entity_data.get("name", "Unknown"), type=_map_entity_type(entity_data.get("type", "other")), score=float(entity_data.get("score", 0.0)), context=entity_data.get("context", "")[:500] )) # Extract from visualize_graphrag_results or plot_entity_network elif tool_name in ["visualize_graphrag_results", "plot_entity_network"]: nodes = result_data.get("data", {}).get("nodes", []) for idx, node in enumerate(nodes): node_type = node.get("type", "other") if node_type == "QUERY": continue # Skip query node entity_id = str(node.get("id", idx)) if entity_id in seen_ids: continue seen_ids.add(entity_id) entities.append(DisplayEntity( id=entity_id, name=node.get("name", "Unknown"), type=_map_entity_type(node_type), score=float(node.get("score", 0.5)) )) # Sort by score descending entities.sort(key=lambda e: e.score, reverse=True) return entities def extract_relationships_from_results(tool_results: List[dict], entities: List[DisplayEntity] = None) -> List[DisplayRelationship]: """ Extract relationships from tool results for graph display. Parses relationships from plot_entity_network and visualize_graphrag_results outputs. Also generates co-occurrence relationships from entities when no explicit relationships exist. Args: tool_results: List of tool call results from the AI response entities: Optional list of extracted entities for co-occurrence relationships Returns: List of DisplayRelationship objects """ relationships = [] seen_ids = set() for result in tool_results: tool_name = result.get("tool_name", "") result_data = result.get("result", {}) # Handle string result data (JSON) if isinstance(result_data, str): try: result_data = json.loads(result_data) except json.JSONDecodeError: continue # Extract from plot_entity_network or visualize_graphrag_results if tool_name in ["plot_entity_network", "visualize_graphrag_results"]: nodes = result_data.get("data", {}).get("nodes", []) edges = result_data.get("data", {}).get("edges", []) # Build index-to-entityID mapping (edges use array indices, but we need entity IDs) idx_to_entity_id = {} for idx, node in enumerate(nodes): # Use database entity ID if available, otherwise use index entity_id = str(node.get("id", idx)) idx_to_entity_id[idx] = entity_id for idx, edge in enumerate(edges): # Convert array indices to entity IDs source_idx = edge.get("source", idx) target_idx = edge.get("target", idx) source_id = idx_to_entity_id.get(source_idx, str(source_idx)) target_id = idx_to_entity_id.get(target_idx, str(target_idx)) rel_id = f"{min(source_id, target_id)}_{max(source_id, target_id)}" if rel_id in seen_ids: continue seen_ids.add(rel_id) relationships.append(DisplayRelationship( id=rel_id, source_id=source_id, target_id=target_id, relationship_type=edge.get("type", edge.get("label", "related")), strength=float(edge.get("weight", edge.get("strength", 0.5))) )) # Extract from search_knowledge_graph - use real relationships from EntityRelationships table elif tool_name == "search_knowledge_graph": # Extract real relationships returned by the tool for rel_data in result_data.get("relationships", []): src_id = str(rel_data.get("source_id", "")) tgt_id = str(rel_data.get("target_id", "")) rel_id = f"{min(src_id, tgt_id)}_{max(src_id, tgt_id)}" if rel_id in seen_ids: continue seen_ids.add(rel_id) relationships.append(DisplayRelationship( id=rel_id, source_id=src_id, target_id=tgt_id, relationship_type=rel_data.get("type", "related"), strength=0.7 )) # If still no relationships but we have entities, create relationships between them if len(relationships) == 0 and entities and len(entities) >= 2: # Create star graph from highest scored entity to others center = entities[0] for other in entities[1:min(8, len(entities))]: rel_id = f"{min(center.id, other.id)}_{max(center.id, other.id)}" if rel_id in seen_ids: continue seen_ids.add(rel_id) relationships.append(DisplayRelationship( id=rel_id, source_id=center.id, target_id=other.id, relationship_type="query-related", strength=0.3 )) return relationships def extract_tool_executions(execution_log: List[dict]) -> List[ToolExecution]: """ Extract tool execution records from the execution log. Args: execution_log: List of execution log entries from chat_with_tools Returns: List of ToolExecution objects in chronological order """ executions = [] for idx, log_entry in enumerate(execution_log): # Skip non-tool entries (thinking, memory_recall) if log_entry.get("type") in ["thinking", "memory_recall"]: continue tool_name = log_entry.get("tool_name") if not tool_name: continue # Determine status from result result_summary = log_entry.get("result_summary", "") status = ExecutionStatus.SUCCESS error_message = "" if "error" in result_summary.lower(): status = ExecutionStatus.FAILED error_message = result_summary elif "timeout" in result_summary.lower(): status = ExecutionStatus.TIMEOUT error_message = result_summary # Use iteration number for ordering; estimate timing iteration = log_entry.get("iteration", idx) executions.append(ToolExecution( id=f"tool_{idx}_{tool_name}", tool_name=tool_name, start_time=datetime.now(), # Placeholder - could enhance with actual timing duration_ms=log_entry.get("duration_ms", 0), status=status, parameters=log_entry.get("tool_input", {}), result_summary=result_summary[:200], error_message=error_message )) return executions # ============================================================================ # Details Panel Render Components (Feature 005) # ============================================================================ # Session state keys for panel collapse/expand states DETAILS_SESSION_KEYS = { "details_selected_entity": None, "details_entities_expanded": True, "details_graph_expanded": True, "details_tools_expanded": True, "details_show_all_entities": False, } # App Settings session state keys APP_SETTINGS_KEYS = { "show_tool_prompts": False, # Show full tool input/prompts in execution details "auto_expand_tool_details": False, # Auto-expand tool details in execution panel } MAX_DISPLAY_ENTITIES = 50 def _init_details_session_state(): """Initialize session state keys for details panel if not present.""" for key, default in DETAILS_SESSION_KEYS.items(): if key not in st.session_state: st.session_state[key] = default def _init_app_settings(): """Initialize app settings session state keys if not present.""" for key, default in APP_SETTINGS_KEYS.items(): if key not in st.session_state: st.session_state[key] = default def _get_entity_type_emoji(entity_type: EntityType) -> str: """Return emoji for entity type.""" emoji_map = { EntityType.SYMPTOM: "🤒", EntityType.CONDITION: "🩺", EntityType.MEDICATION: "💊", EntityType.PROCEDURE: "🔧", EntityType.ANATOMY: "🫀", EntityType.LAB_RESULT: "🔬", EntityType.VITAL_SIGN: "📊", EntityType.OTHER: "📋", } return emoji_map.get(entity_type, "📋") def render_entity_section(entities: List[DisplayEntity], total_count: int, msg_idx: int) -> Optional[str]: """ Render the entity list with tooltips and truncation. Args: entities: List of entities to display total_count: Total entity count before truncation msg_idx: Message index for unique keys Returns: Selected entity ID or None """ _init_details_session_state() with st.expander(f"📋 Entities Found ({total_count})", expanded=st.session_state.details_entities_expanded): if not entities: st.info("No entities found in this query") return None # Group entities by type by_type = {} for entity in entities: type_key = entity.type.value if type_key not in by_type: by_type[type_key] = [] by_type[type_key].append(entity) # Determine display limit show_all = st.session_state.details_show_all_entities display_entities = entities if show_all else entities[:MAX_DISPLAY_ENTITIES] # Render entities grouped by type selected_entity_id = None for entity_type, type_entities in by_type.items(): emoji = _get_entity_type_emoji(EntityType(entity_type)) st.markdown(f"**{emoji} {entity_type.replace('_', ' ').title()}** ({len(type_entities)})") # Limit per type for better UX display_type_entities = type_entities[:15] if not show_all else type_entities for entity in display_type_entities: # Create clickable entity button btn_key = f"entity_{msg_idx}_{entity.id}" score_display = f" ({entity.score:.2f})" if entity.score > 0 else "" col1, col2 = st.columns([4, 1]) with col1: if st.button(f"{entity.name}{score_display}", key=btn_key, use_container_width=True): st.session_state.details_selected_entity = entity.id selected_entity_id = entity.id # Show tooltip/details for selected entity if st.session_state.details_selected_entity == entity.id: with st.container(): st.info(f"**{entity.name}** ({entity.type.value})") if entity.context: st.caption(f"Context: {entity.context[:200]}...") if entity.sources: st.markdown("**Source Documents:**") for src in entity.sources[:3]: st.caption(f"• {src.document_type}: {src.document_id}") if src.excerpt: st.caption(f" \"{src.excerpt[:100]}...\"") # Show "Show all" button if truncated if total_count > MAX_DISPLAY_ENTITIES and not show_all: if st.button(f"Show all {total_count} entities", key=f"show_all_{msg_idx}"): st.session_state.details_show_all_entities = True st.rerun() return selected_entity_id def render_graph_section( entities: List[DisplayEntity], relationships: List[DisplayRelationship], selected_entity_id: Optional[str], msg_idx: int ) -> Optional[str]: """ Render a static relationship graph using Plotly (works in nested expanders). Args: entities: List of entities as nodes relationships: List of relationships as edges selected_entity_id: Currently selected entity to highlight msg_idx: Message index for unique keys Returns: None (static graph, no click handling) """ _init_details_session_state() with st.expander("🕸️ Entity Relationships", expanded=st.session_state.details_graph_expanded): # Minimum threshold check if len(relationships) < 1 or len(entities) < 2: st.info("Not enough relationships to display graph (need at least 2 entities with relationships)") return None # Build entity lookup and limit nodes for readability max_nodes = 25 display_entities = entities[:max_nodes] entity_ids = {e.id for e in display_entities} entity_names = {e.id: e.name for e in display_entities} entity_types = {e.id: e.type for e in display_entities} # Filter relationships to only include displayed entities display_rels = [r for r in relationships if r.source_id in entity_ids and r.target_id in entity_ids] if len(display_rels) < 1: st.info("No relationships between displayed entities") return None # Create circular layout for nodes import math n = len(display_entities) node_positions = {} for i, entity in enumerate(display_entities): angle = 2 * math.pi * i / n node_positions[entity.id] = (math.cos(angle), math.sin(angle)) # Color mapping for entity types type_colors = { EntityType.SYMPTOM: "#FF6B6B", # Red EntityType.CONDITION: "#4ECDC4", # Teal EntityType.MEDICATION: "#45B7D1", # Blue EntityType.PROCEDURE: "#96CEB4", # Green EntityType.ANATOMY: "#FFEAA7", # Yellow EntityType.LAB_RESULT: "#DDA0DD", # Plum EntityType.VITAL_SIGN: "#98D8C8", # Mint EntityType.OTHER: "#C0C0C0", # Gray } # Build edge traces edge_x = [] edge_y = [] for rel in display_rels: if rel.source_id in node_positions and rel.target_id in node_positions: x0, y0 = node_positions[rel.source_id] x1, y1 = node_positions[rel.target_id] edge_x.extend([x0, x1, None]) edge_y.extend([y0, y1, None]) edge_trace = go.Scatter( x=edge_x, y=edge_y, mode='lines', line=dict(width=1, color='#888888'), hoverinfo='none' ) # Build node traces (one per type for legend) node_traces = [] for entity_type in EntityType: type_entities = [e for e in display_entities if e.type == entity_type] if not type_entities: continue node_x = [node_positions[e.id][0] for e in type_entities] node_y = [node_positions[e.id][1] for e in type_entities] node_text = [e.name for e in type_entities] hover_text = [f"{e.name}<br>Type: {e.type.value}<br>Score: {e.score:.2f}" for e in type_entities] node_traces.append(go.Scatter( x=node_x, y=node_y, mode='markers+text', name=entity_type.value.replace('_', ' ').title(), text=node_text, textposition="top center", textfont=dict(size=8), hovertext=hover_text, hoverinfo='text', marker=dict( size=12, color=type_colors.get(entity_type, '#C0C0C0'), line=dict(width=1, color='white') ) )) # Create figure fig = go.Figure( data=[edge_trace] + node_traces, layout=go.Layout( title=dict( text=f"{len(display_rels)} relationships between {len(display_entities)} entities", font=dict(size=12) ), showlegend=True, legend=dict( orientation="h", yanchor="bottom", y=-0.2, xanchor="center", x=0.5, font=dict(size=9) ), hovermode='closest', margin=dict(b=60, l=5, r=5, t=30), xaxis=dict(showgrid=False, zeroline=False, showticklabels=False), yaxis=dict(showgrid=False, zeroline=False, showticklabels=False), height=350, paper_bgcolor='rgba(0,0,0,0)', plot_bgcolor='rgba(0,0,0,0)' ) ) # Render static Plotly chart st.plotly_chart(fig, key=f"details_graph_{msg_idx}", use_container_width=True) if len(entities) > max_nodes: st.caption(f"Showing top {max_nodes} of {len(entities)} entities. Full graph in main response area.") return None def render_tools_section(tool_executions: List[ToolExecution], msg_idx: int) -> None: """ Render the tool execution timeline. Args: tool_executions: List of tool executions in chronological order msg_idx: Message index for unique keys """ _init_details_session_state() _init_app_settings() # Calculate total duration total_duration_ms = sum(t.duration_ms for t in tool_executions) total_duration_s = total_duration_ms / 1000 if total_duration_ms > 0 else 0 header = f"⚙️ Tool Execution ({len(tool_executions)} tools" if total_duration_s > 0: header += f", {total_duration_s:.1f}s total" header += ")" with st.expander(header, expanded=st.session_state.details_tools_expanded): if not tool_executions: st.info("No tool executions recorded") return # Check if tool prompts should be shown (from app settings) show_prompts = st.session_state.get("show_tool_prompts", False) auto_expand = st.session_state.get("auto_expand_tool_details", False) for idx, tool in enumerate(tool_executions): # Status icon status_icons = { ExecutionStatus.SUCCESS: "✅", ExecutionStatus.FAILED: "❌", ExecutionStatus.TIMEOUT: "⏱️", ExecutionStatus.SKIPPED: "⏭️", } status_icon = status_icons.get(tool.status, "❓") # Duration badge duration_str = f"{tool.duration_ms}ms" if tool.duration_ms > 0 else "" if tool.duration_ms >= 1000: duration_str = f"{tool.duration_ms/1000:.1f}s" # Tool header st.markdown(f"{status_icon} **{tool.tool_name}** `{duration_str}`") # If show_prompts is enabled, show parameters inline (not in expander) if show_prompts and tool.parameters: st.markdown("**Tool Input/Prompt:**") st.code(json.dumps(tool.parameters, indent=2), language="json") # Expandable details for each tool (auto-expand if setting enabled) with st.expander(f"Details", expanded=auto_expand): if tool.parameters and not show_prompts: # Only show in expander if not already shown inline st.markdown("**Parameters:**") st.code(json.dumps(tool.parameters, indent=2), language="json") if tool.result_summary: st.markdown("**Result:**") st.caption(tool.result_summary) if tool.error_message and tool.status != ExecutionStatus.SUCCESS: st.error(tool.error_message) def render_details_panel( tool_results: List[dict], thinking_blocks: List[str], memory_recalls: List[str], execution_log: List[dict], response_time_ms: int, msg_idx: int ) -> None: """ Render the enhanced execution details panel with entities, graph, and tools. Args: tool_results: List of tool call results from the AI response thinking_blocks: List of thinking/reasoning text blocks memory_recalls: List of recalled memory items execution_log: Raw execution log from chat_with_tools response_time_ms: Total response generation time msg_idx: Message index for unique keys Returns: None (renders directly to Streamlit) Side Effects: - Updates st.session_state for collapse/selection state - Renders UI components to current Streamlit container """ _init_details_session_state() with st.expander("🔍 **Show Execution Details**", expanded=False): st.caption("Click sections below to expand/collapse") # Extract data for display entities = extract_entities_from_results(tool_results) relationships = extract_relationships_from_results(tool_results, entities) tool_executions = extract_tool_executions(execution_log) # Entity Section (User Story 1) selected_entity_id = render_entity_section( entities=entities, total_count=len(entities), msg_idx=msg_idx ) # Graph Section (User Story 2) render_graph_section( entities=entities, relationships=relationships, selected_entity_id=selected_entity_id, msg_idx=msg_idx ) # Tools Section (User Story 3) render_tools_section(tool_executions, msg_idx) # Legacy: Show thinking blocks if present if thinking_blocks: with st.expander("💭 Thinking", expanded=False): for block in thinking_blocks: st.info(block) # Legacy: Show memory recalls if present if memory_recalls: with st.expander("🧠 Memory Recall", expanded=False): for recall in memory_recalls: st.success(recall) # Import memory system for UI try: from src.memory import VectorMemory MEMORY_AVAILABLE = True except ImportError: MEMORY_AVAILABLE = False print("Warning: Memory system not available", file=sys.stderr) st.set_page_config(page_title="Agentic Medical Chat", page_icon="🤖", layout="wide") # Set AWS profile # Initialize if 'messages' not in st.session_state: st.session_state.messages = [] # Determine LLM provider priority: NIM (local) > OpenAI > Bedrock if 'llm_provider' not in st.session_state: st.session_state.llm_provider = None st.session_state.openai_client = None st.session_state.llm_model = None # 1. Check for local NIM LLM first (most secure - data never leaves instance) nim_llm_url = os.getenv('NIM_LLM_URL') # e.g., http://localhost:8003/v1 if nim_llm_url and OPENAI_AVAILABLE: try: client = OpenAI(base_url=nim_llm_url, api_key="not-needed") # NIM uses OpenAI-compatible API st.session_state.openai_client = client st.session_state.llm_provider = 'nim' st.session_state.llm_model = os.getenv('NIM_LLM_MODEL', 'meta/llama-3.1-8b-instruct') st.success(f"✅ Using local NIM LLM ({st.session_state.llm_model}) - data stays on instance") except Exception as e: pass # Try next option # 2. Check for OpenAI if st.session_state.llm_provider is None: openai_key = os.getenv('OPENAI_API_KEY') if openai_key and OPENAI_AVAILABLE: try: client = OpenAI(api_key=openai_key) st.session_state.openai_client = client st.session_state.llm_provider = 'openai' st.session_state.llm_model = os.getenv('OPENAI_MODEL', 'gpt-4o') st.success(f"✅ Using OpenAI ({st.session_state.llm_model}) for synthesis") except Exception as e: st.warning(f"⚠️ OpenAI initialization failed: {e}") # 3. Fall back to Bedrock if st.session_state.llm_provider is None: try: test_cmd = [ "aws", "bedrock-runtime", "converse", "--model-id", "global.anthropic.claude-sonnet-4-5-20250929-v1:0", "--messages", json.dumps([{"role": "user", "content": [{"text": "test"}]}]) ] result = subprocess.run(test_cmd, capture_output=True, text=True, env=os.environ.copy(), timeout=10) if result.returncode == 0: st.session_state.llm_provider = 'bedrock' st.session_state.llm_model = 'claude-sonnet-4.5' st.success("✅ Using AWS Bedrock Claude for synthesis") else: st.warning(f"⚠️ No LLM provider available. Running in demo mode without synthesis.") except Exception as e: st.warning(f"⚠️ No LLM provider available ({str(e)}). Running in demo mode without synthesis.") # Backward compatibility if 'bedrock_available' not in st.session_state: st.session_state.bedrock_available = (st.session_state.llm_provider is not None) # Define MCP tools for Claude MCP_TOOLS = [ { "name": "search_fhir_documents", "description": "Search FHIR clinical documents by text. Returns relevant medical records.", "input_schema": { "type": "object", "properties": { "query": {"type": "string", "description": "Search terms"}, "limit": {"type": "integer", "description": "Max results", "default": 5} }, "required": ["query"] } }, { "name": "search_knowledge_graph", "description": "Search medical knowledge graph for entities (symptoms, conditions, medications, etc.)", "input_schema": { "type": "object", "properties": { "query": {"type": "string", "description": "Entity search terms"}, "limit": {"type": "integer", "description": "Max entities", "default": 5} }, "required": ["query"] } }, { "name": "hybrid_search", "description": "Combined FHIR + Knowledge Graph search with ranking fusion. Best for complex queries.", "input_schema": { "type": "object", "properties": { "query": {"type": "string", "description": "Medical search query"}, "top_k": {"type": "integer", "description": "Number of results", "default": 5} }, "required": ["query"] } }, { "name": "get_document_details", "description": "Retrieve full clinical note from a FHIR document by ID", "input_schema": { "type": "object", "properties": { "fhir_id": {"type": "string", "description": "Document ID (e.g., '1474')"} }, "required": ["fhir_id"] } }, { "name": "get_entity_statistics", "description": "Get knowledge graph statistics - entity counts, types, distribution", "input_schema": {"type": "object", "properties": {}} }, { "name": "plot_symptom_frequency", "description": "Generate bar chart data showing most frequent symptoms", "input_schema": { "type": "object", "properties": { "top_n": {"type": "integer", "description": "Number of top symptoms", "default": 10} } } }, { "name": "plot_entity_distribution", "description": "Generate chart data showing distribution of entity types", "input_schema": { "type": "object", "properties": { "chart_type": {"type": "string", "enum": ["pie", "bar"], "default": "bar"} } } }, { "name": "plot_patient_timeline", "description": "Generate timeline chart data of patient encounters over time", "input_schema": {"type": "object", "properties": {}} }, { "name": "plot_entity_network", "description": "Generate network graph visualization of entity relationships", "input_schema": { "type": "object", "properties": { "entity": {"type": "string", "description": "Entity to center the network around (optional)"}, "max_nodes": {"type": "integer", "description": "Maximum number of nodes", "default": 50} } } }, { "name": "visualize_graphrag_results", "description": "Visualize GraphRAG search results showing query, entities found, and their relationships", "input_schema": { "type": "object", "properties": { "query": {"type": "string", "description": "The search query used"}, "limit": {"type": "integer", "description": "Number of results to visualize", "default": 10} }, "required": ["query"] } }, { "name": "search_medical_images", "description": "Search for medical images (X-rays) using text query or metadata.", "input_schema": { "type": "object", "properties": { "query": {"type": "string", "description": "Search query (e.g., 'chest X-ray of pneumonia')"}, "limit": {"type": "integer", "description": "Max images", "default": 5} }, "required": ["query"] } } ] def execute_mcp_tool(tool_name: str, tool_input: dict): """Execute an MCP tool and return results""" try: result = asyncio.run(call_tool(tool_name, tool_input)) return json.loads(result[0].text) except Exception as e: return {"error": str(e)} def load_dicom_image(dicom_path): """Load DICOM file and convert to PIL Image for display.""" if not DICOM_AVAILABLE: return None try: dcm = pydicom.dcmread(dicom_path) pixel_array = dcm.pixel_array # Normalize to 0-255 if pixel_array.max() > 0: pixel_array = ((pixel_array - pixel_array.min()) / (pixel_array.max() - pixel_array.min()) * 255).astype(np.uint8) # Convert to PIL Image img = Image.fromarray(pixel_array) # Convert to RGB if grayscale if img.mode != 'RGB': img = img.convert('RGB') return img except Exception as e: print(f"Error loading DICOM {dicom_path}: {e}", file=sys.stderr) return None def render_chart(tool_name: str, data, unique_id: str = None): """Render visualization if tool returns chart data""" # Debug logging import sys import traceback import time # Generate unique key for this chart instance if unique_id is None: unique_id = f"{tool_name}_{int(time.time() * 1000000)}" print(f"DEBUG render_chart: tool_name={tool_name}, data type={type(data)}, unique_id={unique_id}", file=sys.stderr) if isinstance(data, str): print(f"DEBUG: data is string, first 200 chars: {data[:200]}", file=sys.stderr) elif isinstance(data, dict): print(f"DEBUG: data is dict, keys: {data.keys()}", file=sys.stderr) try: # Handle case where data might be a string (JSON) if isinstance(data, str): try: data = json.loads(data) except json.JSONDecodeError as e: st.error(f"Failed to parse chart data: {e}") st.code(data[:500], language="text") print(f"ERROR: JSON decode failed: {e}", file=sys.stderr) print(f"ERROR: Full traceback:\n{traceback.format_exc()}", file=sys.stderr) return False # Check if data is a dict if not isinstance(data, dict): st.error(f"Chart data is not a dict: {type(data)}") print(f"ERROR: Data is not dict: {type(data)}", file=sys.stderr) return False if tool_name == "plot_symptom_frequency": fig = go.Figure(data=[go.Bar( x=data["data"]["symptoms"], y=data["data"]["frequencies"], marker_color='lightcoral' )]) fig.update_layout(title="Most Frequent Symptoms", height=400) st.plotly_chart(fig, key=unique_id, use_container_width=True) return True elif tool_name == "plot_entity_distribution": if data.get("chart_type") == "pie": fig = go.Figure(data=[go.Pie( labels=data["data"]["labels"], values=data["data"]["values"] )]) else: fig = go.Figure(data=[go.Bar( x=data["data"]["labels"], y=data["data"]["values"], marker_color='steelblue' )]) fig.update_layout(title="Entity Type Distribution", height=400) st.plotly_chart(fig, key=unique_id, use_container_width=True) return True elif tool_name == "plot_patient_timeline": fig = go.Figure(data=[go.Scatter( x=data["data"]["dates"], y=data["data"]["counts"], mode='lines+markers', line=dict(color='green', width=2) )]) fig.update_layout(title="Patient Timeline", height=400) st.plotly_chart(fig, key=unique_id, use_container_width=True) return True elif tool_name == "plot_entity_network": # Create interactive network graph using streamlit-agraph nodes_data = data["data"]["nodes"] edges_data = data["data"]["edges"] if AGRAPH_AVAILABLE: # Build agraph nodes and edges agraph_nodes = [] agraph_edges = [] for i, n in enumerate(nodes_data): agraph_nodes.append(Node( id=str(i), label=n["name"], size=25, color=n.get("color", "#97c2fc"), title=f"{n['name']}\nType: {n['type']}" )) for edge in edges_data: agraph_edges.append(Edge( source=str(edge["source"]), target=str(edge["target"]), # No label on main graph to reduce clutter (hover shows relationship) color="#888888" )) st.subheader("Entity Relationship Network (Interactive)") # Physics controls - initialize session state if "graph_physics_enabled" not in st.session_state: st.session_state.graph_physics_enabled = True # Control panel for graph settings ctrl_cols = st.columns([2, 3, 2]) with ctrl_cols[0]: physics_enabled = st.checkbox( "Physics Animation", value=st.session_state.graph_physics_enabled, key=f"physics_toggle_{unique_id}", help="Toggle force-directed layout animation" ) st.session_state.graph_physics_enabled = physics_enabled with ctrl_cols[1]: st.caption("Drag nodes to rearrange. Scroll to zoom.") # Configure the graph - physics enables force-directed animation # Using vis.js-compatible options only config = Config( width=800, height=600, directed=False, physics=physics_enabled, hierarchical=False ) agraph(nodes=agraph_nodes, edges=agraph_edges, config=config) return True else: # Fallback to static Plotly if agraph not available node_x = [n["x"] for n in nodes_data] node_y = [n["y"] for n in nodes_data] node_text = [f"{n['name']}<br>Type: {n['type']}" for n in nodes_data] edge_traces = [] for edge in edges_data: x0, y0 = nodes_data[edge["source"]]["x"], nodes_data[edge["source"]]["y"] x1, y1 = nodes_data[edge["target"]]["x"], nodes_data[edge["target"]]["y"] edge_traces.append(go.Scatter( x=[x0, x1, None], y=[y0, y1, None], mode='lines', line=dict(width=0.5, color='#888'), hoverinfo='none', showlegend=False )) node_trace = go.Scatter( x=node_x, y=node_y, mode='markers+text', text=[n["name"] for n in nodes_data], textposition="top center", hovertext=node_text, hoverinfo='text', marker=dict(size=10, color=[n.get("color", "lightblue") for n in nodes_data], line=dict(width=2, color='white')) ) fig = go.Figure(data=edge_traces + [node_trace]) fig.update_layout( title="Entity Relationship Network", showlegend=False, hovermode='closest', margin=dict(b=0, l=0, r=0, t=40), height=600, xaxis=dict(showgrid=False, zeroline=False, showticklabels=False), yaxis=dict(showgrid=False, zeroline=False, showticklabels=False) ) st.plotly_chart(fig, key=unique_id, use_container_width=True) return True elif tool_name == "visualize_graphrag_results": # Create interactive GraphRAG results visualization nodes_data = data["data"]["nodes"] edges_data = data["data"]["edges"] if AGRAPH_AVAILABLE: # Build agraph nodes and edges agraph_nodes = [] agraph_edges = [] for i, n in enumerate(nodes_data): # Query node is larger size = 35 if n.get("type") == "QUERY" else 25 agraph_nodes.append(Node( id=str(i), label=n["name"], size=size, color=n.get("color", "#97c2fc"), title=f"{n['name']}\nType: {n['type']}" )) for edge in edges_data: # MATCHES edges are thicker width = 3 if edge.get("type") == "MATCHES" else 1 color = "#444444" if edge.get("type") == "MATCHES" else "#888888" agraph_edges.append(Edge( source=str(edge["source"]), target=str(edge["target"]), # No label to reduce clutter (hover shows relationship) color=color, width=width )) st.subheader(f"GraphRAG Results: {data.get('query', '')} ({data.get('entities_found', 0)} entities)") # Physics controls - initialize session state if "graph_physics_enabled" not in st.session_state: st.session_state.graph_physics_enabled = True # Control panel for graph settings ctrl_cols = st.columns([2, 3, 2]) with ctrl_cols[0]: physics_enabled = st.checkbox( "Physics Animation", value=st.session_state.graph_physics_enabled, key=f"physics_toggle_{unique_id}", help="Toggle force-directed layout animation" ) st.session_state.graph_physics_enabled = physics_enabled with ctrl_cols[1]: st.caption("Drag nodes to rearrange. Scroll to zoom.") # Configure the graph with physics for animation # Using vis.js-compatible options only config = Config( width=800, height=600, directed=False, physics=physics_enabled, hierarchical=False ) agraph(nodes=agraph_nodes, edges=agraph_edges, config=config) return True else: # Fallback to static Plotly node_x = [n["x"] for n in nodes_data] node_y = [n["y"] for n in nodes_data] node_text = [f"{n['name']}<br>Type: {n['type']}" for n in nodes_data] node_sizes = [20 if n.get("type") == "QUERY" else 12 for n in nodes_data] edge_traces = [] for edge in edges_data: x0, y0 = nodes_data[edge["source"]]["x"], nodes_data[edge["source"]]["y"] x1, y1 = nodes_data[edge["target"]]["x"], nodes_data[edge["target"]]["y"] width = 1.5 if edge.get("type") == "MATCHES" else 0.5 color = '#444' if edge.get("type") == "MATCHES" else '#888' edge_traces.append(go.Scatter( x=[x0, x1, None], y=[y0, y1, None], mode='lines', line=dict(width=width, color=color), hoverinfo='none', showlegend=False )) node_trace = go.Scatter( x=node_x, y=node_y, mode='markers+text', text=[n["name"] for n in nodes_data], textposition="top center", hovertext=node_text, hoverinfo='text', marker=dict(size=node_sizes, color=[n.get("color", "lightblue") for n in nodes_data], line=dict(width=2, color='white')) ) fig = go.Figure(data=edge_traces + [node_trace]) fig.update_layout( title=f"GraphRAG Search Results: {data.get('query', '')} ({data.get('entities_found', 0)} entities found)", showlegend=False, hovermode='closest', margin=dict(b=0, l=0, r=0, t=40), height=600, xaxis=dict(showgrid=False, zeroline=False, showticklabels=False), yaxis=dict(showgrid=False, zeroline=False, showticklabels=False) ) st.plotly_chart(fig, key=unique_id, use_container_width=True) return True elif tool_name == "search_medical_images": # T020: Enhanced UX for embedder initialization search_mode = data.get("search_mode", "unknown") fallback_reason = data.get("fallback_reason") if search_mode == "keyword" and fallback_reason: # Check if it's a connection issue vs embedder not initialized if "not available" in fallback_reason.lower() or "not initialized" in fallback_reason.lower(): # Show friendly info box instead of warning st.info(f"🔄 **First search** - Initializing semantic search engine (NV-CLIP). Using keyword search for this query.") st.caption("Subsequent searches will use AI-powered semantic search automatically.") else: # Real error - show as warning st.warning(f"⚠️ Semantic search temporarily unavailable. Using keyword search.") with st.expander("Technical details"): st.code(fallback_reason) # Show search statistics exec_time = data.get("execution_time_ms", 0) cache_hit = data.get("cache_hit", False) avg_score = data.get("avg_score") # Display search metadata with improved UX meta_cols = st.columns(4) with meta_cols[0]: # Show search mode with emoji indicator if search_mode == "semantic": st.metric("Search Mode", "🤖 Semantic", help="AI-powered vector search using NV-CLIP") else: st.metric("Search Mode", "🔤 Keyword", help="Text-based keyword matching") with meta_cols[1]: st.metric("Execution Time", f"{exec_time}ms") if search_mode == "semantic": with meta_cols[2]: st.metric("Cache", "⚡ Hit" if cache_hit else "🔄 Miss") if avg_score is not None: with meta_cols[3]: st.metric("Avg Score", f"{avg_score:.2f}", help="Average similarity score (0-1)") # Render images grid images = data.get("images", []) if not images: st.warning("No images found matching your query.") return False st.subheader(f"Found {len(images)} Images for '{data.get('query', '')}'") # T019: Create columns for grid layout with score badges cols = st.columns(3) for idx, img in enumerate(images): with cols[idx % 3]: # Get scoring metadata similarity_score = img.get("similarity_score") score_color = img.get("score_color", "gray") confidence_level = img.get("confidence_level", "unknown") # Map color names to hex color_map = { "green": "#28a745", "yellow": "#ffc107", "gray": "#6c757d" } hex_color = color_map.get(score_color, "#6c757d") # Use image path if available, or placeholder img_path = img.get("image_path") study_type = img.get('study_type', 'Unknown Study') image_id = img.get('image_id', 'Unknown ID') # T017: Use patient_display from radiology integration (linked patient name or unlinked fallback) patient_display = img.get('patient_display', img.get('patient_name', 'Unknown Patient')) patient_linked = img.get('patient_linked', False) # Build caption with score badge - style patient differently if linked vs unlinked patient_style = "color: #28a745;" if patient_linked else "color: #dc3545; font-style: italic;" caption_html = f""" <div style='text-align: center; margin-bottom: 8px;'> <strong>{study_type}</strong><br/> <small style='{patient_style}'>{patient_display}</small><br/> <small style='color: #666;'>ID: {image_id[:8]}...</small> </div> """ # Add score badge if available if similarity_score is not None: caption_html += f""" <div style=' background-color: {hex_color}; color: white; padding: 6px 12px; border-radius: 4px; text-align: center; font-weight: bold; margin-top: 4px; '> Score: {similarity_score:.2f} ({confidence_level}) </div> """ # Display caption with HTML st.markdown(caption_html, unsafe_allow_html=True) try: # Convert relative path to absolute (relative to project root) if img_path: if not os.path.isabs(img_path): # Path is relative, resolve from parent directory img_path = os.path.abspath(os.path.join(parent_dir, img_path)) if img_path and os.path.exists(img_path): # Check if DICOM file if img_path.lower().endswith('.dcm'): dicom_img = load_dicom_image(img_path) if dicom_img: st.image(dicom_img, use_container_width=True) else: st.warning(f"Could not load DICOM: {os.path.basename(img_path)}") st.info(f"{study_type} - {patient_display}") else: # Regular image file (PNG, JPG, etc.) st.image(img_path, use_container_width=True) else: # Fallback if local path not found st.warning(f"Image not found: {os.path.basename(img_path) if img_path else 'N/A'}") st.info(f"{study_type} - Patient {patient_id}") except Exception as e: st.error(f"Error loading image: {e}") return True return False except Exception as e: error_msg = f"❌ RENDER ERROR: {str(e)}" st.error(error_msg) print(f"\n{'='*60}", file=sys.stderr) print(f"FATAL ERROR in render_chart:", file=sys.stderr) print(f"Tool: {tool_name}", file=sys.stderr) print(f"Error: {e}", file=sys.stderr) print(f"Full traceback:\n{traceback.format_exc()}", file=sys.stderr) print(f"{'='*60}\n", file=sys.stderr) return False def demo_mode_search(user_message: str): """Demo mode without Claude - directly execute MCP tools based on keywords""" query_lower = user_message.lower() status = st.empty() status.write("🔍 Running in demo mode (no Claude) - executing direct search...") try: # Check for visualization requests if "plot" in query_lower or "chart" in query_lower or "visualize" in query_lower: if "symptom" in query_lower and ("frequency" in query_lower or "common" in query_lower): result = asyncio.run(call_tool("plot_symptom_frequency", {"top_n": 10})) data = json.loads(result[0].text) fig = go.Figure(data=[go.Bar( x=data["data"]["symptoms"], y=data["data"]["frequencies"], marker_color='lightcoral' )]) fig.update_layout(title="Most Frequent Symptoms", height=400) st.plotly_chart(fig, use_container_width=True) status.empty() return "Chart displayed above showing top 10 symptoms." elif "entity" in query_lower or "distribution" in query_lower: result = asyncio.run(call_tool("plot_entity_distribution", {"chart_type": "bar"})) data = json.loads(result[0].text) fig = go.Figure(data=[go.Bar( x=data["data"]["labels"], y=data["data"]["values"], marker_color='steelblue' )]) fig.update_layout(title="Entity Type Distribution", height=400) st.plotly_chart(fig, use_container_width=True) status.empty() return "Chart displayed above showing entity distribution." # Check for image search if "image" in query_lower or "x-ray" in query_lower or "scan" in query_lower: result = asyncio.run(call_tool("search_medical_images", {"query": user_message, "limit": 3})) data = json.loads(result[0].text) # Render images manually for demo mode since we return text here # But wait, chat_with_tools expects text return from demo_mode_search # And it doesn't render charts/images from the return value of demo_mode_search # demo_mode_search renders charts directly using st.plotly_chart # So we should render images directly here too images = data.get("images", []) if images: st.subheader(f"Found {len(images)} Images (Demo Mode)") cols = st.columns(3) for idx, img in enumerate(images): with cols[idx % 3]: img_path = img.get("image_path") # Convert relative path to absolute (relative to project root) if img_path and not os.path.isabs(img_path): img_path = os.path.abspath(os.path.join(parent_dir, img_path)) study_type = img.get('study_type', 'Unknown Study') patient_id = img.get('patient_id', 'Unknown Patient') caption = f"{study_type} - Patient {patient_id}" if img_path and os.path.exists(img_path): # Check if DICOM file if img_path.lower().endswith('.dcm'): dicom_img = load_dicom_image(img_path) if dicom_img: st.image(dicom_img, caption=caption, use_container_width=True) else: st.info(f"Image: {caption}") else: # Regular image file st.image(img_path, caption=caption, use_container_width=True) else: st.info(f"Image: {caption}") status.empty() return f"Found {len(images)} images for your query." else: return "No images found matching your query." # Otherwise do hybrid search result = asyncio.run(call_tool("hybrid_search", {"query": user_message, "top_k": 5})) data = json.loads(result[0].text) status.empty() response = f"**Search Results** (Demo Mode)\n\n" response += f"- FHIR results: {data['fhir_results']}\n" response += f"- GraphRAG results: {data['graphrag_results']}\n" response += f"- Fused results: {data['fused_results']}\n\n" if data['top_documents']: response += "**Top Documents:**\n" for doc in data['top_documents']: sources = ", ".join(doc['sources']) response += f"- Document {doc['fhir_id']} (score: {doc['rrf_score']:.4f}, sources: {sources})\n" return response except Exception as e: status.empty() return f"❌ Error in demo mode: {str(e)}" def call_openai_compatible(messages, tools=None): """Call OpenAI or NIM LLM (both use OpenAI-compatible API)""" client = st.session_state.openai_client model = st.session_state.llm_model # Convert MCP tools to OpenAI function format openai_tools = [] if tools: for tool in tools: openai_tools.append({ "type": "function", "function": { "name": tool["toolSpec"]["name"], "description": tool["toolSpec"]["description"], "parameters": tool["toolSpec"]["inputSchema"]["json"] } }) # Build OpenAI messages openai_messages = [] for msg in messages: if msg["role"] == "user": if isinstance(msg["content"], str): openai_messages.append({"role": "user", "content": msg["content"]}) elif isinstance(msg["content"], list): # Handle tool results for block in msg["content"]: if block.get("type") == "tool_result": openai_messages.append({ "role": "tool", "tool_call_id": block["tool_use_id"], "content": block["content"] }) elif msg["role"] == "assistant": if isinstance(msg["content"], str): openai_messages.append({"role": "assistant", "content": msg["content"]}) elif isinstance(msg["content"], list): # Handle assistant messages with tool calls text_content = "" tool_calls = [] for block in msg["content"]: if isinstance(block, dict): if block.get("type") == "text": text_content += block.get("text", "") elif block.get("type") == "tool_use": tool_calls.append({ "id": block.get("id"), "type": "function", "function": { "name": block.get("name"), "arguments": json.dumps(block.get("input", {})) } }) assistant_msg = {"role": "assistant", "content": text_content or None} if tool_calls: assistant_msg["tool_calls"] = tool_calls openai_messages.append(assistant_msg) # Call OpenAI/NIM kwargs = { "model": model, "messages": openai_messages, "max_tokens": 4000 } if openai_tools: kwargs["tools"] = openai_tools kwargs["tool_choice"] = "auto" response = client.chat.completions.create(**kwargs) # Convert response to Bedrock-like format for compatibility choice = response.choices[0] result = {"output": {"message": {"role": "assistant", "content": []}}} if choice.message.content: result["output"]["message"]["content"].append({"text": choice.message.content}) if choice.message.tool_calls: for tc in choice.message.tool_calls: result["output"]["message"]["content"].append({ "toolUse": { "toolUseId": tc.id, "name": tc.function.name, "input": json.loads(tc.function.arguments) } }) # Set stop reason if choice.finish_reason == "tool_calls": result["stopReason"] = "tool_use" else: result["stopReason"] = "end_turn" return result def call_claude_via_cli(messages, tools=None): """Call Claude via AWS CLI instead of boto3""" # Convert to Converse API format converse_messages = [] for msg in messages: if msg["role"] == "user": if isinstance(msg["content"], str): converse_messages.append({ "role": "user", "content": [{"text": msg["content"]}] }) elif isinstance(msg["content"], list): # Tool results content_blocks = [] for block in msg["content"]: if block.get("type") == "tool_result": content_blocks.append({ "toolResult": { "toolUseId": block["tool_use_id"], "content": [{"text": block["content"]}] } }) if content_blocks: converse_messages.append({"role": "user", "content": content_blocks}) elif msg["role"] == "assistant": # Convert assistant content content_blocks = [] # Handle case where content is a string (error messages or simple text) if isinstance(msg["content"], str): content_blocks.append({"text": msg["content"]}) elif isinstance(msg["content"], dict) and "text" in msg["content"]: # Handle dict with text key (from our chart responses) content_blocks.append({"text": msg["content"]["text"]}) elif isinstance(msg["content"], list): # Handle list of content blocks (standard Messages API format) for block in msg["content"]: # Type check first before any dict operations if isinstance(block, str): # Handle string content blocks content_blocks.append({"text": block}) elif isinstance(block, dict): # Safe to use .get() now that we've confirmed it's a dict block_type = block.get("type") if block_type == "text": content_blocks.append({"text": block.get("text", "")}) elif block_type == "tool_use": content_blocks.append({ "toolUse": { "toolUseId": block.get("id", ""), "name": block.get("name", ""), "input": block.get("input", {}) } }) else: # Log unexpected block type and skip print(f"Warning: Unexpected block type in assistant message: {type(block)}", file=sys.stderr) if content_blocks: converse_messages.append({"role": "assistant", "content": content_blocks}) cmd = [ "aws", "bedrock-runtime", "converse", "--model-id", "global.anthropic.claude-sonnet-4-5-20250929-v1:0", "--messages", json.dumps(converse_messages) ] if tools: cmd.extend(["--tool-config", json.dumps({"tools": tools})]) cmd.extend(["--inference-config", json.dumps({"maxTokens": 4000})]) result = subprocess.run( cmd, capture_output=True, text=True, env=os.environ.copy(), timeout=30 ) if result.returncode != 0: raise Exception(f"AWS CLI error: {result.stderr}") return json.loads(result.stdout) def recall_relevant_memories(query: str, top_k: int = 3) -> str: """Recall relevant memories for a query and format them as context.""" if not MEMORY_AVAILABLE: return "" try: memory = VectorMemory() memories = memory.recall(query, memory_type=None, top_k=top_k) if not memories: return "" # Format memories as context for the LLM memory_context = "\n[AGENT MEMORY - User preferences and past corrections to consider:]\n" for mem in memories: if mem['similarity'] > 0.3: # Only include reasonably relevant memories memory_context += f"- [{mem['memory_type'].upper()}] {mem['text']}\n" if memory_context == "\n[AGENT MEMORY - User preferences and past corrections to consider:]\n": return "" # No relevant memories above threshold memory_context += "[END MEMORY]\n\n" return memory_context except Exception as e: print(f"Error recalling memories: {e}", file=sys.stderr) return "" def chat_with_tools(user_message: str): """Chat with Claude using tool use""" # If no Claude, run in demo mode if not st.session_state.bedrock_available: return demo_mode_search(user_message) # AUTOMATIC MEMORY RECALL: Inject relevant user preferences/corrections memory_context = recall_relevant_memories(user_message) if memory_context: print(f"DEBUG: Injecting memory context:\n{memory_context}", file=sys.stderr) # Enhance user message if it's asking for visualization viz_keywords = ['plot', 'chart', 'graph', 'visualize', 'show me', 'display'] if any(keyword in user_message.lower() for keyword in viz_keywords): # Add explicit instruction to use visualization tools user_message = user_message + "\n\n[IMPORTANT: Use the appropriate plot_* tool to create a visualization. Available: plot_entity_network, plot_symptom_frequency, plot_entity_distribution, plot_patient_timeline]" # Prepend memory context to user message so LLM sees user preferences if memory_context: user_message = memory_context + user_message # Build conversation history from session state, converting to simple format for API messages = [] for msg in st.session_state.messages: # Skip malformed messages if not isinstance(msg, dict) or "role" not in msg: continue # Extract just the text content for conversation history if msg["role"] == "user": messages.append({"role": "user", "content": msg["content"]}) elif msg["role"] == "assistant": # Extract text from assistant messages if isinstance(msg["content"], dict) and "text" in msg["content"]: messages.append({"role": "assistant", "content": msg["content"]["text"]}) else: messages.append({"role": "assistant", "content": msg["content"]}) # Add the new user message messages.append({"role": "user", "content": user_message}) status = st.empty() chart_container = st.container() text_container = st.container() # Track charts rendered in this conversation rendered_charts = [] # Track tool execution details for transparency tool_execution_log = [] # Log memory recall if it happened if memory_context: tool_execution_log.append({ "iteration": 0, "type": "memory_recall", "content": memory_context.strip() }) max_iterations = 10 # Increased from 5 to handle complex multi-tool queries iteration = 0 while iteration < max_iterations: iteration += 1 try: # Convert MCP tools to Converse API format converse_tools = [] for tool in MCP_TOOLS: converse_tools.append({ "toolSpec": { "name": tool["name"], "description": tool["description"], "inputSchema": {"json": tool["input_schema"]} } }) # Call LLM based on provider if st.session_state.llm_provider in ('openai', 'nim'): response = call_openai_compatible(messages, converse_tools if converse_tools else None) else: response = call_claude_via_cli(messages, converse_tools if converse_tools else None) # Process response stop_reason = response.get('stopReason') output_message = response.get('output', {}).get('message', {}) content = output_message.get('content', []) # Add assistant response to messages messages.append({"role": "assistant", "content": content}) # Handle tool use if stop_reason == "tool_use": status.write(f"🔧 Claude is calling tools... (iteration {iteration})") # Convert Converse API format back to Messages API format for internal processing messages_api_content = [] tool_results = [] for block in content: if 'toolUse' in block: tool_use_block = block['toolUse'] tool_name = tool_use_block['name'] tool_input = tool_use_block['input'] tool_use_id = tool_use_block['toolUseId'] status.write(f"⚙️ Executing: {tool_name}") # Execute the MCP tool result = execute_mcp_tool(tool_name, tool_input) # Log tool execution tool_execution_log.append({ "iteration": iteration, "tool_name": tool_name, "tool_input": tool_input, "result_summary": str(result)[:200] + "..." if len(str(result)) > 200 else str(result), "full_result": result # Store full result for entity extraction }) # Render chart if applicable and track it (only for visualization tools) visualization_tools = ["plot_symptom_frequency", "plot_entity_distribution", "plot_patient_timeline", "plot_entity_network", "visualize_graphrag_results", "search_medical_images"] if tool_name in visualization_tools: with chart_container: was_chart = render_chart(tool_name, result) if was_chart: # Save chart data for re-rendering rendered_charts.append({ "tool_name": tool_name, "data": result }) # Store in Messages API format for next iteration messages_api_content.append({ "type": "tool_use", "id": tool_use_id, "name": tool_name, "input": tool_input }) # Add tool result tool_results.append({ "type": "tool_result", "tool_use_id": tool_use_id, "content": json.dumps(result) }) elif 'text' in block: # Capture thinking/reasoning text thinking_text = block['text'] if thinking_text.strip(): tool_execution_log.append({ "iteration": iteration, "type": "thinking", "content": thinking_text }) messages_api_content.append({ "type": "text", "text": thinking_text }) # Update last assistant message with Messages API format if messages and messages[-1]["role"] == "assistant": messages[-1]["content"] = messages_api_content # Add tool results to conversation messages.append({"role": "user", "content": tool_results}) elif stop_reason == "end_turn": # Claude is done - extract final text status.empty() final_text = "" for block in content: if 'text' in block: final_text += block['text'] with text_container: st.write(final_text) # Return text with chart data and execution log result = {"text": final_text} if rendered_charts: result["chart_data"] = rendered_charts[0] if len(rendered_charts) == 1 else rendered_charts if tool_execution_log: result["execution_log"] = tool_execution_log return result if len(result) > 1 else final_text else: status.empty() return "Unexpected stop reason: " + stop_reason except Exception as e: status.empty() import traceback error_msg = f"❌ Error: {str(e)}" st.error(error_msg) print(f"\n{'='*60}", file=sys.stderr) print(f"EXCEPTION in chat_with_tools:", file=sys.stderr) print(f"Error: {e}", file=sys.stderr) print(f"Full traceback:\n{traceback.format_exc()}", file=sys.stderr) print(f"{'='*60}\n", file=sys.stderr) return error_msg # Max iterations reached - return what we have so far status.empty() error_msg = f"⚠️ Query exceeded maximum iterations ({max_iterations}). Claude called too many tools without completing. This may indicate the query is too complex or ambiguous." result = {"text": error_msg} if tool_execution_log: result["execution_log"] = tool_execution_log return result # UI st.title("🤖 Agentic Medical Chat") st.caption("Claude autonomously calls MCP tools to answer your questions") st.caption("🔧 **Build: v2.16.0** - Backend returns complete entity objects (best practice)") # Sidebar with st.sidebar: st.header("🔧 Available Tools") for tool in MCP_TOOLS: st.write(f"• {tool['name']}") st.divider() if st.button("🗑️ Clear"): st.session_state.messages = [] st.rerun() # Memory Editor UI if MEMORY_AVAILABLE: st.divider() st.header("🧠 Agent Memory") try: memory = VectorMemory() # Show statistics with st.expander("📊 Memory Statistics", expanded=False): stats = memory.get_stats() st.metric("Total Memories", stats['total_memories']) if stats['type_breakdown']: st.write("**By Type:**") for mtype, count in stats['type_breakdown'].items(): st.write(f"- {mtype.title()}: {count}") if stats['most_used_memories']: st.write("**Most Used:**") for mem in stats['most_used_memories'][:3]: st.caption(f"• {mem['text'][:50]}... ({mem['count']}x)") # Browse/Search memories with st.expander("📚 Browse Memories", expanded=False): memory_type_filter = st.selectbox( "Filter by type", ["all", "correction", "knowledge", "preference", "feedback"], key="memory_type_filter" ) # Search interface search_query = st.text_input("Search memories", placeholder="e.g., 'pneumonia' or leave empty to browse all", key="memory_search") # Initialize search results in session state if 'memory_search_results' not in st.session_state: st.session_state.memory_search_results = None if st.button("🔍 Search", key="memory_search_btn"): filter_type = None if memory_type_filter == "all" else memory_type_filter # Empty query returns all memories sorted by use count st.session_state.memory_search_results = memory.recall(search_query or "", memory_type=filter_type, top_k=10) # Display results from session state if st.session_state.memory_search_results is not None: results = st.session_state.memory_search_results if results: st.write(f"Found {len(results)} memories:") for idx, mem in enumerate(results): with st.container(): col1, col2 = st.columns([4, 1]) with col1: st.markdown(f"**{mem['memory_type'].title()}** (Similarity: {mem['similarity']:.2f})") st.text(mem['text'][:200] + "..." if len(mem['text']) > 200 else mem['text']) st.caption(f"Used {mem['use_count']}x • ID: {mem['memory_id'][:8]}") with col2: if st.button("🗑️", key=f"del_{idx}_{mem['memory_id'][:8]}"): memory.forget(memory_id=mem['memory_id']) st.session_state.memory_search_results = None # Clear results st.success("Deleted!") st.rerun() else: st.info("No memories found matching your query.") # Add new memory with st.expander("➕ Add Memory", expanded=False): new_type = st.selectbox("Type", ["correction", "knowledge", "preference", "feedback"], key="new_memory_type") new_text = st.text_area("Memory text", placeholder="Enter information to remember...", key="new_memory_text") if st.button("💾 Save Memory", key="save_memory_btn") and new_text: memory.remember(new_type, new_text, context={"source": "manual_ui"}) st.success(f"✅ Saved {new_type} memory!") st.rerun() except Exception as e: st.error(f"Memory system error: {e}") # App Settings UI st.divider() st.header("Settings") _init_app_settings() with st.expander("Debug & Transparency", expanded=False): show_tool_prompts = st.checkbox( "Show tool prompts/inputs", value=st.session_state.get("show_tool_prompts", False), key="show_tool_prompts_toggle", help="Display the full input/prompt sent to each tool in the execution details" ) st.session_state.show_tool_prompts = show_tool_prompts auto_expand = st.checkbox( "Auto-expand tool details", value=st.session_state.get("auto_expand_tool_details", False), key="auto_expand_toggle", help="Automatically expand the Details section for each tool execution" ) st.session_state.auto_expand_tool_details = auto_expand st.caption("These settings affect the 'Tool Execution' section in response details.") # Display chat for idx, msg in enumerate(st.session_state.messages): # Debug logging import sys print(f"\n=== MESSAGE {idx} ===", file=sys.stderr) print(f"Type: {type(msg)}", file=sys.stderr) print(f"Value: {msg}", file=sys.stderr) # Skip malformed messages if not isinstance(msg, dict) or "role" not in msg: print(f"SKIPPING malformed message {idx}", file=sys.stderr) continue with st.chat_message(msg["role"]): # Check if message has chart data - need to safely handle old message formats content = msg.get("content") if isinstance(msg, dict) else None if isinstance(content, dict) and "chart_data" in content: chart_data = content["chart_data"] # Handle single or multiple charts if isinstance(chart_data, list): for i, chart_info in enumerate(chart_data): unique_id = f"{chart_info['tool_name']}_msg{idx}_chart{i}" render_chart(chart_info["tool_name"], chart_info["data"], unique_id) else: unique_id = f"{chart_data['tool_name']}_msg{idx}" render_chart(chart_data["tool_name"], chart_data["data"], unique_id) # Also show the text if present if "text" in content: st.write(content["text"]) # Show execution details using new enhanced panel if "execution_log" in content: execution_log = content.get("execution_log", []) # Extract tool results for entity/relationship extraction tool_results = [] thinking_blocks = [] memory_recalls = [] for log_entry in execution_log: if log_entry.get("type") == "memory_recall": memory_recalls.append(log_entry.get("content", "")) elif log_entry.get("type") == "thinking": thinking_blocks.append(log_entry.get("content", "")) elif log_entry.get("tool_name"): # Convert log entry to tool result format for extraction # Use full_result if available, otherwise fall back to result_summary tool_results.append({ "tool_name": log_entry.get("tool_name", ""), "result": log_entry.get("full_result", log_entry.get("result_summary", "")) }) # Render enhanced details panel render_details_panel( tool_results=tool_results, thinking_blocks=thinking_blocks, memory_recalls=memory_recalls, execution_log=execution_log, response_time_ms=0, msg_idx=idx ) elif isinstance(content, dict) and "execution_log" in content: # Handle responses with execution_log but no chart_data # Display text content first if "text" in content: st.write(content["text"]) # Extract and render execution details execution_log = content.get("execution_log", []) tool_results = [] thinking_blocks = [] memory_recalls = [] for log_entry in execution_log: if log_entry.get("type") == "memory_recall": memory_recalls.append(log_entry.get("content", "")) elif log_entry.get("type") == "thinking": thinking_blocks.append(log_entry.get("content", "")) elif log_entry.get("tool_name"): # Use full_result if available, otherwise fall back to result_summary tool_results.append({ "tool_name": log_entry.get("tool_name", ""), "result": log_entry.get("full_result", log_entry.get("result_summary", "")) }) # Render enhanced details panel render_details_panel( tool_results=tool_results, thinking_blocks=thinking_blocks, memory_recalls=memory_recalls, execution_log=execution_log, response_time_ms=0, msg_idx=idx ) else: # Display content safely - it might be a string or None if content is not None: st.write(content) # Examples - organized in 3 columns with short labels st.write("**💡 Try these:**") examples = [ ("🔍 Common Symptoms", "What are the most common symptoms?"), ("📊 Symptom Chart", "Show me a chart of symptom frequency"), ("💔 Chest Pain", "Search for chest pain cases"), ("🕸️ Knowledge Graph", "What's in the knowledge graph?"), ("📈 Entity Stats", "Plot entity distribution"), ("🩻 Pneumonia X-rays", "Show me chest X-rays of pneumonia") ] # Use 3 columns with 2 rows for better visibility col1, col2, col3 = st.columns(3) for idx, (label, query) in enumerate(examples): col = [col1, col2, col3][idx % 3] with col: if st.button(label, key=f"ex_{idx}", use_container_width=True): st.session_state.messages.append({"role": "user", "content": query}) st.rerun() st.divider() # Process last user message if not yet answered if st.session_state.messages and isinstance(st.session_state.messages[-1], dict) and st.session_state.messages[-1].get("role") == "user": last_msg = st.session_state.messages[-1]["content"] with st.chat_message("user"): st.write(last_msg) with st.chat_message("assistant"): answer = chat_with_tools(last_msg) st.session_state.messages.append({"role": "assistant", "content": answer}) st.rerun() # Chat input if prompt := st.chat_input("Ask anything..."): st.session_state.messages.append({"role": "user", "content": prompt}) st.rerun()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/isc-tdyar/medical-graphrag-assistant'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

streamlit_app.py•91.6 KiB