#!/usr/bin/env python3
"""
Common ConversationMemoryServer implementation
This module contains the core conversation memory functionality
shared between the FastMCP server and standalone implementations.
"""
import json
import logging
import re
from datetime import datetime, timedelta
from pathlib import Path
from typing import Any, Dict, List, Optional
import aiofiles
try:
from .search_database import SearchDatabase
SQLITE_AVAILABLE = True
except ImportError:
try:
from search_database import SearchDatabase
SQLITE_AVAILABLE = True
except ImportError:
SQLITE_AVAILABLE = False
class ConversationMemoryServer:
    """Store and search conversation records on disk.

    Conversations are persisted as JSON files under a storage directory,
    tracked in JSON index/topic files, and (optionally) indexed in a SQLite
    FTS database for faster search.
    """
def __init__(
self,
storage_path: str = "~/claude-memory",
use_data_dir: Optional[bool] = None,
enable_sqlite: bool = True,
):
self.storage_path = Path(storage_path).expanduser()
# Auto-detect directory structure if not specified
if use_data_dir is None:
use_data_dir = self._detect_data_directory_structure()
# Configure paths based on structure
if use_data_dir:
# New consolidated structure: data/conversations, data/summaries
self.conversations_path = self.storage_path / "data" / "conversations"
self.summaries_path = self.storage_path / "data" / "summaries"
else:
# Legacy structure: conversations/, summaries/ in storage root
self.conversations_path = self.storage_path / "conversations"
self.summaries_path = self.storage_path / "summaries"
self.index_file = self.conversations_path / "index.json"
self.topics_file = self.conversations_path / "topics.json"
# Initialize logger
self.logger = logging.getLogger(__name__)
        # Ensure directories exist before anything tries to write into them
        self.conversations_path.mkdir(parents=True, exist_ok=True)
        self.summaries_path.mkdir(parents=True, exist_ok=True)
        (self.summaries_path / "weekly").mkdir(exist_ok=True)
        # Initialize SQLite search database if available and enabled
        # (the directories above must already exist so search.db can be created)
        self.search_db = None
        self.use_sqlite_search = False
        if enable_sqlite and SQLITE_AVAILABLE:
            try:
                db_path = self.conversations_path / "search.db"
                self.search_db = SearchDatabase(str(db_path))
                self.use_sqlite_search = True
                self.logger.info("SQLite FTS search enabled")
            except Exception as e:
                self.logger.warning(f"Failed to initialize SQLite search: {e}")
                self.use_sqlite_search = False
        # Initialize index files if they don't exist
        self._init_index_files()
def _detect_data_directory_structure(self) -> bool:
"""
Auto-detect whether to use new data/ structure or legacy structure.
Returns:
True if data/ directory exists and contains conversations/
False for legacy structure (conversations/ in storage root)
"""
data_conversations = self.storage_path / "data" / "conversations"
legacy_conversations = self.storage_path / "conversations"
# If data/conversations exists, use new structure
if data_conversations.exists():
return True
# If conversations exists in root, use legacy structure
if legacy_conversations.exists():
return False
# If neither exists, default to new structure for new installations
return True
def _init_index_files(self):
"""Initialize index and topics files if they don't exist"""
if not self.index_file.exists():
with open(self.index_file, "w") as f:
json.dump(
{"conversations": [], "last_updated": datetime.now().isoformat()}, f
)
if not self.topics_file.exists():
with open(self.topics_file, "w") as f:
json.dump({"topics": {}, "last_updated": datetime.now().isoformat()}, f)
def _get_date_folder(self, date: datetime) -> Path:
"""Get the folder path for a given date"""
year_folder = self.conversations_path / str(date.year)
month_folder = year_folder / f"{date.month:02d}-{date.strftime('%B').lower()}"
month_folder.mkdir(parents=True, exist_ok=True)
return month_folder
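    # Illustrative on-disk layout produced by the path helpers above (assuming the
    # new data/ structure and a conversation saved in March 2024; names are examples):
    #
    #   ~/claude-memory/data/conversations/index.json
    #   ~/claude-memory/data/conversations/topics.json
    #   ~/claude-memory/data/conversations/search.db          (when SQLite is enabled)
    #   ~/claude-memory/data/conversations/2024/03-march/conv_20240315_101500_1234.json
    #   ~/claude-memory/data/summaries/weekly/week-2024-03-11.md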
def _extract_topics(self, content: str) -> List[str]:
"""Extract topics from conversation content using simple keyword extraction"""
common_tech_terms = [
"python",
"javascript",
"java",
"css",
"html",
"react",
"vue",
"angular",
"django",
"flask",
"nodejs",
"express",
"api",
"database",
"sql",
"mongodb",
"docker",
"kubernetes",
"aws",
"azure",
"gcp",
"git",
"github",
"gitlab",
"testing",
"debugging",
"deployment",
"authentication",
"security",
"encryption",
"machine learning",
"ai",
"neural network",
"data science",
"analytics",
"frontend",
"backend",
"fullstack",
"devops",
"cicd",
"microservices",
"rest",
"graphql",
"websocket",
"json",
"xml",
"yaml",
"markdown",
"linux",
"windows",
"macos",
"bash",
"powershell",
"terminal",
"cli",
"performance",
"optimization",
"scalability",
"architecture",
"design patterns",
"agile",
"scrum",
"kanban",
"project management",
"code review",
]
# Convert to lowercase for matching
content_lower = content.lower()
# Find quoted terms (likely important concepts)
quoted_terms = re.findall(r'"([^"]+)"', content)
quoted_terms.extend(re.findall(r"'([^']+)'", content))
# Find technical terms
found_topics = []
for term in common_tech_terms:
if term in content_lower:
found_topics.append(term)
# Add quoted terms (filtered for reasonable length)
for term in quoted_terms:
if len(term) > 2 and len(term) < 50 and term.lower() not in found_topics:
found_topics.append(term.lower())
# Find capitalized words that might be technologies/frameworks
tech_pattern = r"\b[A-Z][a-zA-Z]*(?:[A-Z][a-zA-Z]*)*\b"
capitalized_words = re.findall(tech_pattern, content)
for word in capitalized_words:
if (
len(word) > 2
and word.lower() not in found_topics
and word
not in ["The", "This", "That", "When", "Where", "How", "What", "Why"]
):
found_topics.append(word.lower())
return found_topics[:10] # Limit to top 10 topics
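    # Illustrative example of the heuristics above:
    #
    #     _extract_topics('We migrated the "payment service" from Flask to Django')
    #
    # returns ["django", "flask", "payment service"]: known tech terms first (in
    # list order), then quoted phrases, then any remaining capitalized words.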
async def add_conversation(
self,
content: str,
title: Optional[str] = None,
conversation_date: Optional[str] = None,
) -> Dict[str, Any]:
"""Add a new conversation to storage"""
try:
# Parse date or use current
if conversation_date:
try:
date = datetime.fromisoformat(
conversation_date.replace("Z", "+00:00")
)
except ValueError:
date = datetime.now()
else:
date = datetime.now()
# Generate title if not provided
if not title:
# Extract first line or first 50 characters as title
lines = content.strip().split("\n")
first_line = lines[0] if lines else content
title = first_line[:50] + "..." if len(first_line) > 50 else first_line
            # Create conversation record; hash() is salted per process, so the
            # numeric suffix is only a collision-avoidance nonce, not a stable
            # content fingerprint
            conversation_id = (
                f"conv_{date.strftime('%Y%m%d_%H%M%S')}_{hash(content) % 10000:04d}"
            )
date_folder = self._get_date_folder(date)
file_path = date_folder / f"{conversation_id}.json"
# Extract topics
topics = self._extract_topics(content)
conversation_data = {
"id": conversation_id,
"title": title,
"content": content,
"date": date.isoformat(),
"topics": topics,
"created_at": datetime.now().isoformat(),
}
# Save conversation file
async with aiofiles.open(file_path, "w", encoding="utf-8") as f:
await f.write(
json.dumps(conversation_data, indent=2, ensure_ascii=False)
)
# Update index
self._update_index(conversation_data, file_path)
# Update topics index
self._update_topics_index(topics, conversation_id)
# Add to SQLite search database if available
if self.use_sqlite_search and self.search_db:
relative_path = str(file_path.relative_to(self.storage_path))
self.search_db.add_conversation(conversation_data, relative_path)
return {
"status": "success",
"file_path": str(file_path),
"topics": topics,
"message": f"Conversation saved successfully with ID: {conversation_id}",
}
except (OSError, ValueError, TypeError) as e:
return {
"status": "error",
"message": f"Failed to save conversation: {str(e)}",
}
def _calculate_search_score(
self, query_terms: List[str], content: str, title: str, topics: List[str]
) -> int:
"""Calculate relevance score for a conversation based on query terms"""
score = 0
for term in query_terms:
score += content.count(term) * 1
score += title.count(term) * 3
if term in topics:
score += 5
return score
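    # Worked example of the weighting above: for query_terms ["docker"], a
    # conversation whose (lowercased) content contains "docker" twice, whose title
    # contains it once, and which lists "docker" as a topic scores
    # 2 * 1 + 1 * 3 + 5 = 10.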
async def _process_conversation_for_search(
self, conv_info: dict, query_terms: List[str]
) -> Optional[dict]:
"""Process a single conversation for search results"""
try:
file_path = self.storage_path / conv_info["file_path"]
if not file_path.exists():
return None
            async with aiofiles.open(file_path, "r", encoding="utf-8") as f:
                raw = await f.read()
            conv_data = json.loads(raw)
            # Score against lowercased fields, but keep the original-case content
            # for the preview
            content = conv_data.get("content", "")
            title = conv_data.get("title", "")
            topics = [t.lower() for t in conv_data.get("topics", [])]
            score = self._calculate_search_score(
                query_terms, content.lower(), title.lower(), topics
            )
            if score > 0:
                return {
                    "id": conv_data["id"],
                    "title": conv_data["title"],
                    "date": conv_data["date"],
                    "topics": conv_data["topics"],
                    "score": score,
                    "preview": content[:200] + "..." if len(content) > 200 else content,
}
return None
except (OSError, ValueError, KeyError, TypeError):
return None
async def search_conversations(
self, query: str, limit: int = 10
) -> List[Dict[str, Any]]:
"""Search conversations by content and topics"""
# Use SQLite FTS search if available and enabled
if self.use_sqlite_search and self.search_db:
try:
return self.search_db.search_conversations(query, limit)
except Exception as e:
self.logger.warning(
f"SQLite search failed, falling back to linear search: {e}"
)
# Fall through to linear search
# Fallback to linear search through JSON files
try:
# Load index
async with aiofiles.open(self.index_file, "r") as f:
content = await f.read()
index_data = json.loads(content)
conversations = index_data.get("conversations", [])
query_terms = query.lower().split()
results = []
for conv_info in conversations:
result = await self._process_conversation_for_search(
conv_info, query_terms
)
if result:
results.append(result)
# Sort by score and return top results
results.sort(key=lambda x: x["score"], reverse=True)
return results[:limit]
except (OSError, ValueError, KeyError, TypeError) as e:
return [{"error": f"Search failed: {str(e)}"}]
def _get_preview(self, file_path: Path, query_terms: List[str]) -> str:
"""Get a preview of the conversation around the search terms"""
try:
with open(file_path, "r", encoding="utf-8") as f:
content = f.read()
lines = content.split("\n")
preview_lines = []
for i, line in enumerate(lines):
line_lower = line.lower()
if any(term in line_lower for term in query_terms):
# Include context lines around the match
start = max(0, i - 2)
end = min(len(lines), i + 3)
context = lines[start:end]
preview_lines.extend(context)
break
preview = "\n".join(preview_lines[:10]) # Limit preview length
return preview[:500] + "..." if len(preview) > 500 else preview
except (OSError, ValueError, KeyError, TypeError):
return "Preview unavailable"
def get_preview(self, conversation_id: str) -> str:
"""Get a preview of a specific conversation"""
try:
# Load index to find the conversation
with open(self.index_file, "r") as f:
index_data = json.load(f)
conversations = index_data.get("conversations", [])
for conv_info in conversations:
if conv_info["id"] == conversation_id:
file_path = self.storage_path / conv_info["file_path"]
if file_path.exists():
with open(file_path, "r", encoding="utf-8") as f:
conv_data = json.load(f)
content = conv_data.get("content", "")
return content[:500] + "..." if len(content) > 500 else content
else:
return "Conversation file not found"
return "Conversation not found"
except (OSError, ValueError, KeyError, TypeError) as e:
return f"Error retrieving conversation: {str(e)}"
def _update_index(self, conversation_data: Dict, file_path: Path):
"""Update the main index with new conversation"""
try:
# Load existing index
with open(self.index_file, "r") as f:
index_data = json.load(f)
# Add new conversation to index
relative_path = file_path.relative_to(self.storage_path)
conv_entry = {
"id": conversation_data["id"],
"title": conversation_data["title"],
"date": conversation_data["date"],
"topics": conversation_data["topics"],
"file_path": str(relative_path),
"added_at": datetime.now().isoformat(),
}
index_data["conversations"].append(conv_entry)
index_data["last_updated"] = datetime.now().isoformat()
# Save updated index
with open(self.index_file, "w") as f:
json.dump(index_data, f, indent=2)
except (OSError, ValueError, KeyError, TypeError) as e:
self.logger.error(f"Error updating index: {e}")
def _update_topics_index(self, topics: List[str], conversation_id: str):
"""Update the topics index with new conversation topics"""
try:
# Load existing topics index
with open(self.topics_file, "r") as f:
topics_data = json.load(f)
topics_index = topics_data.get("topics", {})
# Add conversation to each topic
for topic in topics:
if topic not in topics_index or isinstance(topics_index[topic], int):
# Initialize new topics or handle legacy format where topics were stored
# as counts
topics_index[topic] = []
topics_index[topic].append(
{
"conversation_id": conversation_id,
"added_at": datetime.now().isoformat(),
}
)
topics_data["topics"] = topics_index
topics_data["last_updated"] = datetime.now().isoformat()
# Save updated topics index
with open(self.topics_file, "w") as f:
json.dump(topics_data, f, indent=2)
except (OSError, ValueError, KeyError, TypeError) as e:
self.logger.error(f"Error updating topics index: {e}")
async def generate_weekly_summary(self, week_offset: int = 0) -> str:
"""Generate a weekly summary of conversations"""
try:
today = datetime.now()
start_of_week = today - timedelta(days=today.weekday() + (week_offset * 7))
end_of_week = start_of_week + timedelta(days=6)
week_conversations = self._get_week_conversations(
start_of_week, end_of_week
)
if not week_conversations:
if week_offset == 0:
return (
f"No conversations found for current week "
f"({start_of_week.strftime('%Y-%m-%d')})"
)
else:
return (
f"No conversations found for week of "
f"{start_of_week.strftime('%Y-%m-%d')} ({week_offset} week(s) ago)"
)
summary_text = self._build_weekly_summary_text(
start_of_week, end_of_week, week_conversations
)
summary_filename = f"week-{start_of_week.strftime('%Y-%m-%d')}.md"
summary_file = self.summaries_path / "weekly" / summary_filename
async with aiofiles.open(summary_file, "w", encoding="utf-8") as f:
await f.write(summary_text)
summary_text += f"\n---\n*Summary saved to {summary_file}*"
return summary_text
except (OSError, ValueError, KeyError, TypeError) as e:
return f"Failed to generate weekly summary: {str(e)}"
def _get_week_conversations(
self, start_of_week: datetime, end_of_week: datetime
) -> List[dict]:
"""Return conversations for the given week range"""
try:
with open(self.index_file, "r") as f:
index_data = json.load(f)
conversations = index_data.get("conversations", [])
except (OSError, ValueError, KeyError, TypeError):
return []
week_conversations = []
for conv_info in conversations:
try:
conv_date = datetime.fromisoformat(
conv_info["date"].replace("Z", "+00:00")
)
if start_of_week.date() <= conv_date.date() <= end_of_week.date():
file_path = self.storage_path / conv_info["file_path"]
if file_path.exists():
try:
with open(file_path, "r", encoding="utf-8") as f:
conv_data = json.load(f)
week_conversations.append(conv_data)
except (OSError, ValueError, KeyError, TypeError):
week_conversations.append(
{
"title": conv_info.get("title", "Untitled"),
"date": conv_info["date"],
"topics": conv_info.get("topics", []),
}
)
except (ValueError, KeyError, TypeError):
continue
return week_conversations
def _build_weekly_summary_text(
self,
start_of_week: datetime,
end_of_week: datetime,
week_conversations: List[dict],
) -> str:
"""Build the markdown summary text for the week"""
summary_parts = []
summary_parts.append(
f"# Weekly Summary: {start_of_week.strftime('%Y-%m-%d')} "
f"to {end_of_week.strftime('%Y-%m-%d')}"
)
summary_parts.append(
f"\n## Overview\n- Total conversations: {len(week_conversations)}"
)
all_topics = []
for conv in week_conversations:
all_topics.extend(conv.get("topics", []))
topic_counts: Dict[str, int] = {}
for topic in all_topics:
topic_counts[topic] = topic_counts.get(topic, 0) + 1
if topic_counts:
summary_parts.append("\n## Popular Topics")
sorted_topics = sorted(
topic_counts.items(), key=lambda x: x[1], reverse=True
)
for topic, count in sorted_topics[:10]:
summary_parts.append(f"- {topic}: {count} conversations")
summary_parts.append("\n## Conversations")
for conv in week_conversations:
date_str = conv.get("date", "").split("T")[0]
topics_str = ", ".join(conv.get("topics", [])[:3])
if len(conv.get("topics", [])) > 3:
topics_str += "..."
conv_line = f"- [{date_str}] {conv.get('title', 'Untitled')}"
if topics_str:
conv_line += f" *Topics: {topics_str}*"
summary_parts.append(conv_line)
return "\n".join(summary_parts)
async def get_search_stats(self) -> Dict[str, Any]:
"""Get search engine statistics and status."""
stats = {
"sqlite_available": SQLITE_AVAILABLE,
"sqlite_enabled": self.use_sqlite_search,
"search_engine": "sqlite_fts" if self.use_sqlite_search else "linear_json",
}
if self.use_sqlite_search and self.search_db:
try:
db_stats = self.search_db.get_conversation_stats()
stats.update(db_stats)
except Exception as e:
stats["sqlite_error"] = str(e)
return stats
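    # Example return value (the first three keys are always present; any further
    # keys come from SearchDatabase.get_conversation_stats() and are assumptions
    # about that payload):
    #
    #   {"sqlite_available": True, "sqlite_enabled": True, "search_engine": "sqlite_fts"}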
async def migrate_to_sqlite(self) -> Dict[str, Any]:
"""Migrate existing conversations to SQLite database."""
if not SQLITE_AVAILABLE:
return {"error": "SQLite not available"}
if not self.use_sqlite_search:
return {"error": "SQLite search not enabled"}
try:
            # Mirror the dual import used for SearchDatabase so standalone
            # (non-package) usage also works
            try:
                from .migrate_to_sqlite import ConversationMigrator
            except ImportError:
                from migrate_to_sqlite import ConversationMigrator
# Determine directory structure
use_data_dir = self.conversations_path.parent.name == "data"
migrator = ConversationMigrator(str(self.storage_path), use_data_dir)
migration_stats = migrator.migrate_all_conversations()
return migration_stats
except ImportError:
return {"error": "Migration module not available"}
except Exception as e:
return {"error": f"Migration failed: {str(e)}"}
async def search_by_topic(
self, topic: str, limit: int = 10
) -> List[Dict[str, Any]]:
"""Search conversations by specific topic."""
if self.use_sqlite_search and self.search_db:
try:
return self.search_db.search_by_topic(topic, limit)
except Exception as e:
self.logger.warning(f"SQLite topic search failed: {e}")
# Fallback to JSON-based topic search
return await self._search_topic_json(topic, limit)
async def _search_topic_json(self, topic: str, limit: int) -> List[Dict[str, Any]]:
"""Helper method for JSON-based topic search."""
try:
async with aiofiles.open(self.topics_file, "r") as f:
content = await f.read()
topics_data = json.loads(content)
topics_index = topics_data.get("topics", {})
if topic not in topics_index:
return []
# Get conversation IDs for this topic
topic_convs = topics_index[topic]
# Load conversation details
results = []
for topic_conv in topic_convs[:limit]:
conv_id = topic_conv.get("conversation_id")
if conv_id:
preview = self.get_preview(conv_id)
if preview and "not found" not in preview.lower():
results.append(
{
"id": conv_id,
"preview": (
preview[:200] + "..."
if len(preview) > 200
else preview
),
}
)
return results
except (OSError, ValueError, KeyError, TypeError) as e:
return [{"error": f"Topic search failed: {str(e)}"}]
def _analyze_conversations(self, conversations: List[dict]) -> List[dict]:
"""Legacy method for test compatibility - analyze conversation data"""
results = []
for conv in conversations:
try:
file_path = self.storage_path / conv.get("file_path", "")
if not file_path.exists():
results.append({"error": "Conversation file not found"})
continue
results.append({"title": conv.get("title", "Unknown")})
except Exception as e:
results.append({"error": str(e)})
return results
@classmethod
def _validate_storage_path(cls, path: str) -> bool:
"""Legacy method for test compatibility - validate storage path"""
try:
p = Path(path)
return p.is_dir() or not p.exists()
except Exception:
return False