"""SQLite-based graph store with JSON support for memory atoms"""
import json
from datetime import datetime
from pathlib import Path
from typing import Optional, Union, List, Dict, Any
from uuid import UUID
import aiosqlite
from loguru import logger
from src.core.models import GraphType, MemoryAtom, Provenance
class SQLiteGraphStore:
    """
    SQLite with JSON support for graph-like operations.

    Features:
    - JSON metadata storage for complex fields (see ``insert_atom``)
    - FTS5 full-text search on the ``object`` field
    - Indexes for conflict detection (subject + predicate)
    - Graph-ready schema for future Neo4j migration
    """

    def __init__(self, db_path: Union[Path, str]) -> None:
        # Nothing is opened here; connect() creates the directory and
        # the actual aiosqlite connection.
        self.db_path = Path(db_path)
        # Lazily initialised in connect(); every query method guards on
        # this and raises RuntimeError when it is still None.
        self._conn: Optional[aiosqlite.Connection] = None
    async def connect(self) -> None:
        """Establish database connection.

        Creates the parent directory if missing, opens the aiosqlite
        connection with Row factory, enables WAL journaling plus FULL
        synchronous writes, and (re-)creates the schema idempotently.
        """
        # Create parent directory if needed
        self.db_path.parent.mkdir(parents=True, exist_ok=True)
        self._conn = await aiosqlite.connect(str(self.db_path))
        # Row factory lets query code address columns by name.
        self._conn.row_factory = aiosqlite.Row
        # Enable WAL mode for better concurrency and durability
        await self._conn.execute("PRAGMA journal_mode=WAL")
        # Ensure data is written to disk immediately
        await self._conn.execute("PRAGMA synchronous=FULL")
        # NOTE(review): the schema declares a FOREIGN KEY (provenance ->
        # atoms), but SQLite only enforces it when "PRAGMA foreign_keys=ON"
        # is issued per-connection — confirm whether enforcement is wanted.
        await self._setup_schema()
        await self._conn.commit()  # Ensure schema is committed
        logger.info(f"Connected to database: {self.db_path}")
async def close(self) -> None:
"""Close database connection"""
if self._conn:
await self._conn.close()
logger.info("Database connection closed")
    async def _setup_schema(self) -> None:
        """Create tables with JSON support and graph-ready structure.

        Idempotent: every statement uses IF NOT EXISTS, so this is safe
        to run on every connect().
        """
        if not self._conn:
            raise RuntimeError("Database not connected")
        # Main atoms table: flat columns for hot filters/sorts, plus a
        # JSON `metadata` document for everything else (see insert_atom).
        await self._conn.execute("""
            CREATE TABLE IF NOT EXISTS atoms (
                id TEXT PRIMARY KEY,
                atom_type TEXT NOT NULL,
                graph TEXT NOT NULL,
                subject TEXT NOT NULL,
                predicate TEXT NOT NULL,
                object TEXT NOT NULL,
                -- Store complex fields as JSON
                metadata TEXT NOT NULL,
                -- For fast queries (denormalized from metadata)
                confidence REAL DEFAULT 0.5,
                first_observed INTEGER DEFAULT 0,
                last_accessed INTEGER DEFAULT 0,
                UNIQUE(subject, predicate, object, graph)
            )
        """)
        # Provenance table - every claim must be traceable.
        # NOTE(review): the FOREIGN KEY below is only enforced if
        # "PRAGMA foreign_keys=ON" is set on the connection (it is not,
        # in connect()) — confirm intended behaviour.
        await self._conn.execute("""
            CREATE TABLE IF NOT EXISTS provenance (
                id TEXT PRIMARY KEY,
                claim_id TEXT NOT NULL,
                source_type TEXT NOT NULL,
                source_url TEXT NOT NULL,
                source_title TEXT,
                quoted_span TEXT NOT NULL,
                page_or_section TEXT,
                accessed_at INTEGER NOT NULL,
                content_hash TEXT NOT NULL,
                confidence REAL DEFAULT 0.5,
                authors TEXT,
                arxiv_id TEXT,
                doi TEXT,
                commit_sha TEXT,
                file_path TEXT,
                line_range TEXT,
                FOREIGN KEY (claim_id) REFERENCES atoms(id)
            )
        """)
        # Index for get_provenance_for_claim lookups.
        await self._conn.execute("""
            CREATE INDEX IF NOT EXISTS idx_provenance_claim
            ON provenance(claim_id)
        """)
        # Index for get_provenance_stats / unverified-claim queries.
        await self._conn.execute("""
            CREATE INDEX IF NOT EXISTS idx_provenance_type
            ON provenance(source_type)
        """)
        # Create indexes for common queries (find_by_triple).
        await self._conn.execute("""
            CREATE INDEX IF NOT EXISTS idx_atoms_subject_predicate
            ON atoms(subject, predicate)
        """)
        # Partial index: only rows in the 'substantiated' graph.
        await self._conn.execute("""
            CREATE INDEX IF NOT EXISTS idx_atoms_graph
            ON atoms(graph) WHERE graph = 'substantiated'
        """)
        await self._conn.execute("""
            CREATE INDEX IF NOT EXISTS idx_atoms_confidence
            ON atoms(confidence DESC)
        """)
        # Full-text search for object field. External-content FTS5 table
        # keyed by atoms.rowid; only `object` is indexed, `id` is stored
        # unindexed for joining back to atoms.
        await self._conn.execute("""
            CREATE VIRTUAL TABLE IF NOT EXISTS atoms_fts
            USING fts5(id UNINDEXED, object, content=atoms, content_rowid=rowid)
        """)
        # Triggers to keep FTS in sync with inserts/deletes/updates.
        await self._conn.execute("""
            CREATE TRIGGER IF NOT EXISTS atoms_fts_insert AFTER INSERT ON atoms BEGIN
                INSERT INTO atoms_fts(rowid, id, object) VALUES (new.rowid, new.id, new.object);
            END
        """)
        await self._conn.execute("""
            CREATE TRIGGER IF NOT EXISTS atoms_fts_delete AFTER DELETE ON atoms BEGIN
                DELETE FROM atoms_fts WHERE rowid = old.rowid;
            END
        """)
        # Update is modelled as delete + re-insert of the FTS row.
        await self._conn.execute("""
            CREATE TRIGGER IF NOT EXISTS atoms_fts_update AFTER UPDATE ON atoms BEGIN
                DELETE FROM atoms_fts WHERE rowid = old.rowid;
                INSERT INTO atoms_fts(rowid, id, object) VALUES (new.rowid, new.id, new.object);
            END
        """)
        await self._conn.commit()
        logger.debug("Database schema initialized")
async def insert_atom(self, atom: MemoryAtom) -> None:
"""Insert or update atom with JSON serialization"""
if not self._conn:
raise RuntimeError("Database not connected")
# Serialize complex fields to JSON
metadata = {
"provenance": atom.provenance.value,
"assertion_count": atom.assertion_count,
"explicit_confirms": [dt.isoformat() for dt in atom.explicit_confirms],
"last_contradicted": (
atom.last_contradicted.isoformat() if atom.last_contradicted else None
),
"strength": atom.strength,
"jury_history": [j.model_dump(mode='json') for j in atom.jury_history],
"contexts": atom.contexts,
"flags": atom.flags,
"related_atoms": [str(aid) for aid in atom.related_atoms],
"supersedes": str(atom.supersedes) if atom.supersedes else None,
"superseded_by": str(atom.superseded_by) if atom.superseded_by else None,
"session_id": atom.session_id,
"topic_cluster": atom.topic_cluster,
"object_metadata": atom.object_metadata,
"temporal_validity": atom.temporal_validity,
"access_count": atom.access_count,
}
await self._conn.execute(
"""
INSERT OR REPLACE INTO atoms
(id, atom_type, graph, subject, predicate, object, metadata,
confidence, first_observed, last_accessed)
VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
""",
(
str(atom.id),
atom.atom_type.value,
atom.graph.value,
atom.subject,
atom.predicate,
atom.object,
json.dumps(metadata),
atom.confidence,
int(atom.first_observed.timestamp()),
int(atom.last_accessed.timestamp()),
),
)
await self._conn.commit()
logger.debug(f"Inserted atom {atom.id}: [{atom.subject}] [{atom.predicate}] [{atom.object}]")
    async def insert_provenance(
        self,
        provenance_id: str,
        claim_id: str,
        source_type: str,
        source_url: str,
        source_title: str,
        quoted_span: str,
        page_or_section: Optional[str],
        accessed_at: int,
        content_hash: str,
        confidence: float,
        authors: Optional[str] = None,
        arxiv_id: Optional[str] = None,
        doi: Optional[str] = None,
        commit_sha: Optional[str] = None,
        file_path: Optional[str] = None,
        line_range: Optional[str] = None
    ) -> None:
        """Insert provenance record for a claim.

        Uses INSERT OR REPLACE, so re-using an existing ``provenance_id``
        overwrites that row (upsert semantics).

        Args:
            provenance_id: primary key of the provenance row
            claim_id: id of the atom this evidence supports (references
                atoms.id; see _setup_schema for the FK caveat)
            source_type: source category, e.g. 'internal' (treated as
                unverified by get_unverified_claims) vs. external types
            source_url: location the evidence was retrieved from
            source_title: human-readable source title
            quoted_span: verbatim excerpt backing the claim
            page_or_section: locator inside the source, if any
            accessed_at: unix timestamp of retrieval
            content_hash: hash of the source content at access time
            confidence: evidence confidence score
            authors, arxiv_id, doi: optional bibliographic fields
            commit_sha, file_path, line_range: optional code-source fields
        """
        if not self._conn:
            raise RuntimeError("Database not connected")
        await self._conn.execute(
            """
            INSERT OR REPLACE INTO provenance
            (id, claim_id, source_type, source_url, source_title, quoted_span,
             page_or_section, accessed_at, content_hash, confidence,
             authors, arxiv_id, doi, commit_sha, file_path, line_range)
            VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
            """,
            (provenance_id, claim_id, source_type, source_url, source_title,
             quoted_span, page_or_section, accessed_at, content_hash, confidence,
             authors, arxiv_id, doi, commit_sha, file_path, line_range)
        )
        await self._conn.commit()
        logger.debug(f"Inserted provenance {provenance_id} for claim {claim_id}")
async def get_provenance_for_claim(self, claim_id: str) -> List[Dict[str, Any]]:
"""Get all provenance records for a claim"""
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute(
"SELECT * FROM provenance WHERE claim_id = ?",
(claim_id,)
)
rows = await cursor.fetchall()
result = []
for row in rows:
result.append({
"id": row[0],
"claim_id": row[1],
"source_type": row[2],
"source_url": row[3],
"source_title": row[4],
"quoted_span": row[5],
"page_or_section": row[6],
"accessed_at": row[7],
"content_hash": row[8],
"confidence": row[9],
"arxiv_id": row[11],
"doi": row[12],
"commit_sha": row[13]
})
return result
async def get_unverified_claims(self) -> List[str]:
"""Get claim IDs that only have internal provenance"""
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute("""
SELECT DISTINCT a.id FROM atoms a
LEFT JOIN provenance p ON a.id = p.claim_id
WHERE p.id IS NULL OR p.source_type = 'internal'
""")
rows = await cursor.fetchall()
return [row[0] for row in rows]
async def get_provenance_stats(self) -> Dict[str, Any]:
"""Get provenance statistics"""
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute(
"SELECT source_type, COUNT(*) FROM provenance GROUP BY source_type"
)
rows = await cursor.fetchall()
by_type = {row[0]: row[1] for row in rows}
cursor = await self._conn.execute("SELECT COUNT(*) FROM provenance")
total = (await cursor.fetchone())[0]
unverified = len(await self.get_unverified_claims())
return {"total": total, "by_type": by_type, "unverified": unverified}
async def get_atom(self, atom_id: UUID) -> Optional[MemoryAtom]:
"""Retrieve atom by ID"""
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute(
"SELECT * FROM atoms WHERE id = ?",
(str(atom_id),)
)
row = await cursor.fetchone()
if not row:
return None
return self._row_to_atom(row)
async def find_by_triple(
self,
subject: str,
predicate: str,
exclude_historical: bool = True
) -> list[MemoryAtom]:
"""
Find atoms matching subject + predicate (for conflict detection).
This is the critical query for conflict detection.
"""
if not self._conn:
raise RuntimeError("Database not connected")
if exclude_historical:
query = """
SELECT * FROM atoms
WHERE subject = ? AND predicate = ?
AND graph != 'historical'
ORDER BY confidence DESC
"""
else:
query = """
SELECT * FROM atoms
WHERE subject = ? AND predicate = ?
ORDER BY confidence DESC
"""
cursor = await self._conn.execute(query, (subject, predicate))
rows = await cursor.fetchall()
return [self._row_to_atom(row) for row in rows]
async def get_substantiated_atoms(
self,
subject: Optional[str] = None,
limit: Optional[int] = None
) -> list[MemoryAtom]:
"""
Get substantiated knowledge (for prompt context).
Ordered by confidence and recency.
"""
if not self._conn:
raise RuntimeError("Database not connected")
if subject:
query = """
SELECT * FROM atoms
WHERE graph = 'substantiated' AND subject = ?
ORDER BY confidence DESC, last_accessed DESC
"""
params = (subject,)
else:
query = """
SELECT * FROM atoms
WHERE graph = 'substantiated'
ORDER BY confidence DESC, last_accessed DESC
"""
params = ()
if limit:
query += f" LIMIT {limit}"
cursor = await self._conn.execute(query, params)
rows = await cursor.fetchall()
return [self._row_to_atom(row) for row in rows]
async def get_unsubstantiated_atoms(
self,
subject: Optional[str] = None,
min_confidence: float = 0.0
) -> list[MemoryAtom]:
"""Get unsubstantiated atoms (shadow buffer)"""
if not self._conn:
raise RuntimeError("Database not connected")
if subject:
query = """
SELECT * FROM atoms
WHERE graph = 'unsubstantiated'
AND subject = ?
AND confidence >= ?
ORDER BY confidence DESC
"""
params = (subject, min_confidence)
else:
query = """
SELECT * FROM atoms
WHERE graph = 'unsubstantiated'
AND confidence >= ?
ORDER BY confidence DESC
"""
params = (min_confidence,)
cursor = await self._conn.execute(query, params)
rows = await cursor.fetchall()
return [self._row_to_atom(row) for row in rows]
async def promote_atom(self, atom_id: UUID) -> None:
"""Move atom to substantiated graph"""
if not self._conn:
raise RuntimeError("Database not connected")
await self._conn.execute(
"""
UPDATE atoms
SET graph = 'substantiated',
confidence = 1.0
WHERE id = ?
""",
(str(atom_id),)
)
await self._conn.commit()
logger.info(f"Promoted atom {atom_id} to substantiated graph")
async def archive_atom(self, atom_id: UUID) -> None:
"""Move atom to historical archive"""
if not self._conn:
raise RuntimeError("Database not connected")
await self._conn.execute(
"UPDATE atoms SET graph = 'historical' WHERE id = ?",
(str(atom_id),)
)
await self._conn.commit()
logger.info(f"Archived atom {atom_id}")
async def delete_atom(self, atom_id: UUID) -> None:
"""Permanently delete atom (use sparingly)"""
if not self._conn:
raise RuntimeError("Database not connected")
await self._conn.execute(
"DELETE FROM atoms WHERE id = ?",
(str(atom_id),)
)
await self._conn.commit()
logger.warning(f"Deleted atom {atom_id}")
    async def link_atoms(
        self,
        source_id: UUID,
        target_id: UUID
    ) -> None:
        """
        Create bidirectional relationship (cached in metadata).

        Appends ``target_id`` to the source atom's '$.related_atoms'
        JSON array and vice versa, entirely in SQL via SQLite's JSON1
        functions. Both updates commit together.

        NOTE(review): there is no de-duplication — linking the same pair
        twice appends duplicate IDs to both arrays. Confirm whether
        callers guard against repeated links.
        """
        if not self._conn:
            raise RuntimeError("Database not connected")
        # Update source atom: json_insert(..., '$[#]', ?) appends to the
        # end of the array; COALESCE substitutes '[]' when the key is
        # missing or null.
        await self._conn.execute(
            """
            UPDATE atoms
            SET metadata = json_set(
                metadata,
                '$.related_atoms',
                json_insert(
                    COALESCE(json_extract(metadata, '$.related_atoms'), '[]'),
                    '$[#]',
                    ?
                )
            )
            WHERE id = ?
            """,
            (str(target_id), str(source_id))
        )
        # Update target atom (mirror of the statement above)
        await self._conn.execute(
            """
            UPDATE atoms
            SET metadata = json_set(
                metadata,
                '$.related_atoms',
                json_insert(
                    COALESCE(json_extract(metadata, '$.related_atoms'), '[]'),
                    '$[#]',
                    ?
                )
            )
            WHERE id = ?
            """,
            (str(source_id), str(target_id))
        )
        await self._conn.commit()
        logger.debug(f"Linked atoms {source_id} <-> {target_id}")
    async def get_related_atoms(
        self,
        atom_id: UUID,
        depth: int = 1
    ) -> list[MemoryAtom]:
        """
        Get atoms related to this atom (using cached related_atoms).

        For MVP: depth=1 only (direct relationships).
        For full version: Use recursive CTE for depth>1.

        Args:
            atom_id: atom whose neighbours to fetch
            depth: traversal depth; values > 1 are downgraded to 1 with
                a warning in this MVP

        Returns:
            Atoms whose IDs appear in this atom's '$.related_atoms'
            JSON array.
        """
        if not self._conn:
            raise RuntimeError("Database not connected")
        if depth > 1:
            logger.warning("Depth > 1 not implemented in MVP, using depth=1")
        # json_each() expands the cached JSON array of IDs into rows, so
        # the outer query reduces to an IN (...) membership test.
        query = """
            SELECT a.*
            FROM atoms a
            WHERE a.id IN (
                SELECT value
                FROM json_each(
                    (SELECT json_extract(metadata, '$.related_atoms')
                     FROM atoms WHERE id = ?)
                )
            )
        """
        cursor = await self._conn.execute(query, (str(atom_id),))
        rows = await cursor.fetchall()
        return [self._row_to_atom(row) for row in rows]
    async def search_objects(self, query: str, limit: int = 10) -> list[MemoryAtom]:
        """Full-text search on object field using FTS5.

        Args:
            query: FTS5 MATCH expression, passed verbatim — FTS query
                syntax (AND/OR/NEAR, quotes, prefix*) is honoured.
                NOTE(review): malformed input can raise an FTS5 syntax
                error; confirm callers sanitise or handle this.
            limit: maximum number of results

        Returns:
            Matching atoms ordered by FTS5 relevance (``rank``).
        """
        if not self._conn:
            raise RuntimeError("Database not connected")
        cursor = await self._conn.execute(
            """
            SELECT a.*
            FROM atoms a
            JOIN atoms_fts fts ON a.id = fts.id
            WHERE atoms_fts MATCH ?
            ORDER BY rank
            LIMIT ?
            """,
            (query, limit)
        )
        rows = await cursor.fetchall()
        return [self._row_to_atom(row) for row in rows]
async def get_stats(self) -> dict[str, int]:
"""Get database statistics"""
if not self._conn:
raise RuntimeError("Database not connected")
stats = {}
# Count by graph type
for graph_type in ["substantiated", "unsubstantiated", "historical"]:
cursor = await self._conn.execute(
"SELECT COUNT(*) FROM atoms WHERE graph = ?",
(graph_type,)
)
row = await cursor.fetchone()
stats[f"{graph_type}_count"] = row[0] if row else 0
# Total atoms
cursor = await self._conn.execute("SELECT COUNT(*) FROM atoms")
row = await cursor.fetchone()
stats["total_atoms"] = row[0] if row else 0
return stats
    def _row_to_atom(self, row: aiosqlite.Row) -> MemoryAtom:
        """Convert database row to MemoryAtom.

        Inverse of insert_atom(): flat columns come straight from the
        row; everything else is rehydrated from the JSON ``metadata``
        blob, with defaults for keys absent in older rows.
        """
        metadata = json.loads(row["metadata"])
        # Parse datetime fields
        # NOTE(review): datetime.fromtimestamp() below yields naive
        # local-time datetimes, mirroring the naive .timestamp() calls in
        # insert_atom() — confirm the models expect naive datetimes.
        explicit_confirms = [
            datetime.fromisoformat(dt) for dt in metadata.get("explicit_confirms", [])
        ]
        last_contradicted = (
            datetime.fromisoformat(metadata["last_contradicted"])
            if metadata.get("last_contradicted")
            else None
        )
        # Parse UUIDs
        related_atoms = [UUID(aid) for aid in metadata.get("related_atoms", [])]
        supersedes = UUID(metadata["supersedes"]) if metadata.get("supersedes") else None
        superseded_by = UUID(metadata["superseded_by"]) if metadata.get("superseded_by") else None
        # Parse jury history
        # Imported locally — presumably to avoid a circular import at
        # module load time; TODO confirm.
        from src.core.models import JuryDecision
        jury_history = [JuryDecision(**jd) for jd in metadata.get("jury_history", [])]
        return MemoryAtom(
            id=UUID(row["id"]),
            atom_type=row["atom_type"],
            graph=row["graph"],
            subject=row["subject"],
            predicate=row["predicate"],
            object=row["object"],
            object_metadata=metadata.get("object_metadata"),
            contexts=metadata.get("contexts", []),
            temporal_validity=metadata.get("temporal_validity"),
            provenance=Provenance(metadata["provenance"]),
            assertion_count=metadata.get("assertion_count", 1),
            explicit_confirms=explicit_confirms,
            first_observed=datetime.fromtimestamp(row["first_observed"]),
            last_contradicted=last_contradicted,
            strength=metadata.get("strength", 0.5),
            last_accessed=datetime.fromtimestamp(row["last_accessed"]),
            access_count=metadata.get("access_count", 0),
            supersedes=supersedes,
            superseded_by=superseded_by,
            related_atoms=related_atoms,
            confidence=row["confidence"],
            jury_history=jury_history,
            flags=metadata.get("flags", []),
            session_id=metadata.get("session_id", ""),
            topic_cluster=metadata.get("topic_cluster"),
        )
# ========================================================================
# Convenience API Methods for Experiments
# ========================================================================
async def get_atoms_by_subject(
self,
subject: str,
graph: Optional[GraphType] = None
) -> list[MemoryAtom]:
"""
Get all atoms for a subject (user).
This is a convenience method for experiments.
Args:
subject: Subject identifier (usually user_id)
graph: Optional graph filter (SUBSTANTIATED, UNSUBSTANTIATED, HISTORICAL)
Returns:
List of matching atoms
"""
if graph is None:
# Get from both substantiated and unsubstantiated
substantiated = await self.get_substantiated_atoms(subject=subject)
unsubstantiated = await self.get_unsubstantiated_atoms(subject=subject)
return substantiated + unsubstantiated
elif graph == GraphType.SUBSTANTIATED:
return await self.get_substantiated_atoms(subject=subject)
elif graph == GraphType.UNSUBSTANTIATED:
return await self.get_unsubstantiated_atoms(subject=subject)
elif graph == GraphType.HISTORICAL:
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute(
"SELECT * FROM atoms WHERE subject = ? AND graph = 'historical'",
(subject,)
)
rows = await cursor.fetchall()
return [self._row_to_atom(row) for row in rows]
else:
return []
async def get_atoms_by_predicate(
self,
subject: str,
predicates: list[str],
graph: Optional[GraphType] = None
) -> list[MemoryAtom]:
"""
Get atoms matching specific predicates.
Example: get_atoms_by_predicate("user_001", ["likes", "dislikes"])
Args:
subject: Subject identifier
predicates: List of predicates to match
graph: Optional graph filter
Returns:
List of matching atoms
"""
all_atoms = await self.get_atoms_by_subject(subject, graph)
return [
atom for atom in all_atoms
if atom.predicate in predicates
]
async def get_atoms_by_type(
self,
subject: str,
atom_type: str,
graph: Optional[GraphType] = None
) -> list[MemoryAtom]:
"""
Get atoms of specific type.
Example: get_atoms_by_type("user_001", AtomType.PREFERENCE)
Args:
subject: Subject identifier
atom_type: Atom type to match (from AtomType enum)
graph: Optional graph filter
Returns:
List of matching atoms
"""
all_atoms = await self.get_atoms_by_subject(subject, graph)
return [
atom for atom in all_atoms
if atom.atom_type == atom_type
]
async def get_atoms_by_object_contains(
self,
subject: str,
object_substring: str,
graph: Optional[GraphType] = None
) -> list[MemoryAtom]:
"""
Get atoms where object contains substring.
Example: get_atoms_by_object_contains("user_001", "Python")
Args:
subject: Subject identifier
object_substring: Substring to search for in object field
graph: Optional graph filter
Returns:
List of matching atoms
"""
all_atoms = await self.get_atoms_by_subject(subject, graph)
return [
atom for atom in all_atoms
if object_substring.lower() in atom.object.lower()
]
async def get_all_atoms(
self,
subject: Optional[str] = None,
graph: Optional[GraphType] = None
) -> list[MemoryAtom]:
"""
Get all atoms (optionally filtered by subject/graph).
Args:
subject: Optional subject filter
graph: Optional graph filter
Returns:
List of all matching atoms
"""
if subject:
return await self.get_atoms_by_subject(subject, graph)
# Get everything
if graph == GraphType.SUBSTANTIATED:
return await self._get_all_from_graph("substantiated")
elif graph == GraphType.UNSUBSTANTIATED:
return await self._get_all_from_graph("unsubstantiated")
elif graph == GraphType.HISTORICAL:
return await self._get_all_from_graph("historical")
else:
sub = await self._get_all_from_graph("substantiated")
unsub = await self._get_all_from_graph("unsubstantiated")
return sub + unsub
async def _get_all_from_graph(self, graph_name: str) -> list[MemoryAtom]:
"""Helper: Get all atoms from a specific graph."""
if not self._conn:
raise RuntimeError("Database not connected")
cursor = await self._conn.execute(
f"SELECT * FROM atoms WHERE graph = ?",
(graph_name,)
)
rows = await cursor.fetchall()
return [self._row_to_atom(row) for row in rows]
    # Alias for MCP server compatibility
    async def add_atom(self, atom: MemoryAtom) -> None:
        """Alias for insert_atom (kept for MCP server compatibility)."""
        await self.insert_atom(atom)