"""Async database engine and session management utilities."""
from __future__ import annotations
import asyncio
import contextvars
import logging
import random
import re
import time
from collections.abc import AsyncIterator, Callable, Iterator
from contextlib import asynccontextmanager, contextmanager, suppress
from dataclasses import dataclass, field
from functools import wraps
from pathlib import Path
from typing import Any, TypeVar
from sqlalchemy.exc import OperationalError
from sqlalchemy.ext.asyncio import AsyncEngine, AsyncSession, async_sessionmaker, create_async_engine
from sqlmodel import SQLModel
from .config import DatabaseSettings, Settings, clear_settings_cache, get_settings
logger = logging.getLogger(__name__)
T = TypeVar("T")
_engine: AsyncEngine | None = None
_session_factory: async_sessionmaker[AsyncSession] | None = None
_schema_ready = False
_schema_lock: asyncio.Lock | None = None
_QUERY_TRACKER: contextvars.ContextVar["QueryTracker | None"] = contextvars.ContextVar("query_tracker", default=None)
_QUERY_HOOKS_INSTALLED = False
_SLOW_QUERY_LIMIT = 50
_SQL_TABLE_RE = re.compile(r"\bfrom\s+([\w\.\"`\[\]]+)", re.IGNORECASE)
_SQL_UPDATE_RE = re.compile(r"\bupdate\s+([\w\.\"`\[\]]+)", re.IGNORECASE)
_SQL_INSERT_RE = re.compile(r"\binsert\s+into\s+([\w\.\"`\[\]]+)", re.IGNORECASE)
@dataclass(slots=True)
class QueryTracker:
    """Per-context accumulator of query counts, total time, and slow queries."""
total: int = 0
total_time_ms: float = 0.0
per_table: dict[str, int] = field(default_factory=dict)
slow_query_ms: float | None = None
slow_queries: list[dict[str, Any]] = field(default_factory=list)
def record(self, statement: str, duration_ms: float) -> None:
self.total += 1
self.total_time_ms += duration_ms
table = _extract_table_name(statement)
if table:
self.per_table[table] = self.per_table.get(table, 0) + 1
if (
self.slow_query_ms is not None
and duration_ms >= self.slow_query_ms
and len(self.slow_queries) < _SLOW_QUERY_LIMIT
):
self.slow_queries.append(
{
"table": table,
"duration_ms": round(duration_ms, 2),
}
)
def to_dict(self) -> dict[str, Any]:
return {
"total": self.total,
"total_time_ms": round(self.total_time_ms, 2),
"per_table": dict(sorted(self.per_table.items(), key=lambda item: (-item[1], item[0]))),
"slow_query_ms": self.slow_query_ms,
"slow_queries": list(self.slow_queries),
}
def _clean_table_name(raw: str) -> str:
cleaned = raw.strip()
if "." in cleaned:
cleaned = cleaned.split(".")[-1]
return cleaned.strip("`\"[]")
def _extract_table_name(statement: str) -> str | None:
for pattern in (_SQL_INSERT_RE, _SQL_UPDATE_RE, _SQL_TABLE_RE):
match = pattern.search(statement)
if match:
return _clean_table_name(match.group(1))
return None
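# Examples: _extract_table_name('SELECT * FROM "messages" WHERE id = 1') yields
# "messages", while statements with no recognizable target table (e.g.
# "PRAGMA busy_timeout") yield None.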
def get_query_tracker() -> QueryTracker | None:
return _QUERY_TRACKER.get()
def start_query_tracking(*, slow_ms: float | None = None) -> tuple[QueryTracker, contextvars.Token]:
tracker = QueryTracker(slow_query_ms=slow_ms)
token = _QUERY_TRACKER.set(tracker)
return tracker, token
def stop_query_tracking(token: contextvars.Token) -> None:
_QUERY_TRACKER.reset(token)
@contextmanager
def track_queries(*, slow_ms: float | None = None) -> Iterator[QueryTracker]:
    """Activate query tracking for the current context; optionally flag slow queries."""
    tracker, token = start_query_tracking(slow_ms=slow_ms)
try:
yield tracker
finally:
stop_query_tracking(token)
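# Example: wrap a unit of work to capture per-table query counts (a usage sketch;
# ``handle_request`` stands in for any coroutine that issues queries):
#
#     with track_queries(slow_ms=100.0) as tracker:
#         await handle_request()
#     stats = tracker.to_dict()  # {"total": ..., "per_table": {...}, ...}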
def retry_on_db_lock(max_retries: int = 5, base_delay: float = 0.1, max_delay: float = 5.0) -> Callable[..., Any]:
"""Decorator to retry async functions on SQLite database lock errors with exponential backoff + jitter.
Args:
max_retries: Maximum number of retry attempts
base_delay: Initial delay in seconds (will be exponentially increased)
max_delay: Maximum delay between retries in seconds
This handles transient "database is locked" errors from SQLite by:
1. Catching OperationalError with lock-related messages
2. Waiting with exponential backoff: base_delay * (2 ** attempt)
3. Adding jitter to prevent thundering herd: random ±25% of delay
4. Giving up after max_retries and re-raising the error
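
    With the defaults, the nominal delays before jitter are 0.1, 0.2, 0.4,
    0.8, and 1.6 seconds. Example (a sketch; ``save_message`` is a
    hypothetical coroutine):

        @retry_on_db_lock(max_retries=3, base_delay=0.05)
        async def save_message(session: AsyncSession, message: Any) -> None:
            session.add(message)
            await session.commit()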
"""
def decorator(func: Callable[..., Any]) -> Callable[..., Any]:
@wraps(func)
async def wrapper(*args: Any, **kwargs: Any) -> Any:
last_exception = None
for attempt in range(max_retries + 1):
try:
return await func(*args, **kwargs)
except OperationalError as e:
# Check if it's a lock-related error
error_msg = str(e).lower()
is_lock_error = any(
phrase in error_msg
for phrase in ["database is locked", "database is busy", "locked"]
)
if not is_lock_error or attempt >= max_retries:
# Not a lock error, or we've exhausted retries - raise it
raise
last_exception = e
# Calculate exponential backoff with jitter
delay = min(base_delay * (2**attempt), max_delay)
jitter = delay * 0.25 * (2 * random.random() - 1) # ±25% jitter
total_delay = delay + jitter
                    # Log the retry so lock contention shows up in application logs.
                    func_name = getattr(func, "__name__", getattr(func, "__qualname__", "<callable>"))
                    logger.warning(
                        "Database locked, retrying %s (attempt %d/%d) after %.2fs",
                        func_name,
                        attempt + 1,
                        max_retries,
                        total_delay,
                    )
await asyncio.sleep(total_delay)
# Should never reach here, but just in case
if last_exception:
raise last_exception
raise RuntimeError("Unexpected retry loop exit")
return wrapper
return decorator
def _build_engine(settings: DatabaseSettings) -> AsyncEngine:
"""Build async SQLAlchemy engine with SQLite-optimized settings for concurrency."""
from sqlalchemy import event
from sqlalchemy.engine import make_url
# For SQLite, enable WAL mode and set timeout for better concurrent access
connect_args = {}
is_sqlite = "sqlite" in settings.url.lower()
if is_sqlite:
# Ensure parent directory exists for file-backed SQLite URLs.
# SQLite returns "unable to open database file" when the directory is missing.
try:
parsed = make_url(settings.url)
if parsed.database and parsed.database != ":memory:":
Path(parsed.database).expanduser().resolve().parent.mkdir(parents=True, exist_ok=True)
except Exception:
pass
# Register datetime adapters ONCE globally for Python 3.12+ compatibility
# These are module-level registrations, not per-connection
import datetime as dt_module
import sqlite3
        def adapt_datetime_iso(val: Any) -> str:
            """Adapt datetime.datetime to an ISO 8601 string."""
            return val.isoformat()
def convert_datetime(val: bytes | str) -> dt_module.datetime | None:
"""Convert ISO 8601 datetime to datetime.datetime object.
Returns None for any conversion errors (invalid format, wrong type,
corrupted data, etc.) to allow graceful degradation rather than crashing.
"""
try:
# Handle both bytes and str (SQLite can return either)
if isinstance(val, bytes):
val = val.decode('utf-8')
return dt_module.datetime.fromisoformat(val)
except (ValueError, AttributeError, TypeError, UnicodeDecodeError, OverflowError):
# Return None for any conversion failure:
# - ValueError: invalid ISO format string
# - TypeError: unexpected type (shouldn't happen but defensive)
# - AttributeError: val has no expected attributes (defensive)
# - UnicodeDecodeError: corrupted bytes (extreme edge case)
# - OverflowError: datetime value out of valid range (year outside 1-9999)
return None
# Register adapters globally (safe to call multiple times - last registration wins)
sqlite3.register_adapter(dt_module.datetime, adapt_datetime_iso)
sqlite3.register_converter("timestamp", convert_datetime)
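        # Round-trip sketch: adapt_datetime_iso(datetime(2024, 1, 2, 3, 4, 5))
        # yields "2024-01-02T03:04:05"; convert_datetime(b"2024-01-02T03:04:05")
        # yields the datetime back; convert_datetime(b"garbage") yields None.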
connect_args = {
"timeout": 30.0, # Wait up to 30 seconds for lock (default is 5)
"check_same_thread": False, # Required for async SQLite
}
# SQLite has low write concurrency; large pools can exhaust FDs under stress tests.
pool_size = 5 if is_sqlite else 25
max_overflow = 5 if is_sqlite else 25
engine = create_async_engine(
settings.url,
echo=settings.echo,
future=True,
pool_pre_ping=True,
pool_size=pool_size,
max_overflow=max_overflow,
pool_timeout=30, # Fail fast with clear error instead of hanging indefinitely
pool_recycle=3600, # Recycle connections after 1 hour to prevent stale handles
connect_args=connect_args,
)
# For SQLite: Set up event listener to configure each connection with WAL mode
if is_sqlite:
@event.listens_for(engine.sync_engine, "connect")
def set_sqlite_pragma(dbapi_conn: Any, connection_record: Any) -> None:
"""Set SQLite PRAGMAs for better concurrent performance on each connection."""
cursor = dbapi_conn.cursor()
# Enable WAL mode for concurrent reads/writes
cursor.execute("PRAGMA journal_mode=WAL")
# Use NORMAL synchronous mode (safer than OFF, faster than FULL)
cursor.execute("PRAGMA synchronous=NORMAL")
# Set busy timeout (wait up to 30 seconds for locks)
cursor.execute("PRAGMA busy_timeout=30000")
cursor.close()
return engine
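# Example: verifying that the per-connection PRAGMAs took effect (a debugging
# sketch; works against any SQLite engine returned by _build_engine):
#
#     async with engine.connect() as conn:
#         result = await conn.exec_driver_sql("PRAGMA journal_mode")
#         assert result.scalar() == "wal"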
def install_query_hooks(engine: AsyncEngine) -> None:
"""Install lightweight query counting hooks on the engine (idempotent)."""
global _QUERY_HOOKS_INSTALLED
if _QUERY_HOOKS_INSTALLED:
return
from sqlalchemy import event
@event.listens_for(engine.sync_engine, "before_cursor_execute")
def before_cursor_execute(
conn: Any,
cursor: Any,
statement: str,
parameters: Any,
context: Any,
executemany: bool,
) -> None:
tracker = _QUERY_TRACKER.get()
if tracker is None:
return
timings = conn.info.setdefault("query_start_time", [])
timings.append(time.perf_counter())
@event.listens_for(engine.sync_engine, "after_cursor_execute")
def after_cursor_execute(
conn: Any,
cursor: Any,
statement: str,
parameters: Any,
context: Any,
executemany: bool,
) -> None:
tracker = _QUERY_TRACKER.get()
if tracker is None:
return
timings = conn.info.get("query_start_time")
if not timings:
return
start_time = timings.pop()
duration_ms = (time.perf_counter() - start_time) * 1000.0
tracker.record(statement, duration_ms)
_QUERY_HOOKS_INSTALLED = True
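    # Both hooks are no-ops unless a QueryTracker is active in the current
    # context (see track_queries above), so untracked statements pay only the
    # cost of a ContextVar lookup in each hook.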
def init_engine(settings: Settings | None = None) -> None:
"""Initialise global engine and session factory once."""
global _engine, _session_factory
if _engine is not None and _session_factory is not None:
return
resolved_settings = settings or get_settings()
engine = _build_engine(resolved_settings.database)
install_query_hooks(engine)
_engine = engine
_session_factory = async_sessionmaker(engine, expire_on_commit=False, class_=AsyncSession)
def get_engine() -> AsyncEngine:
if _engine is None:
init_engine()
assert _engine is not None
return _engine
def get_session_factory() -> async_sessionmaker[AsyncSession]:
if _session_factory is None:
init_engine()
assert _session_factory is not None
return _session_factory
@asynccontextmanager
async def get_session() -> AsyncIterator[AsyncSession]:
factory = get_session_factory()
session = factory()
try:
yield session
finally:
        # Ensure session close completes even under cancellation (anyio cancel
        # scopes raise asyncio.CancelledError, which derives from BaseException
        # on Python 3.8+).
close_task = asyncio.create_task(session.close())
try:
await asyncio.shield(close_task)
except BaseException:
with suppress(BaseException):
await close_task
raise
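# Example: typical request-scoped usage (a sketch; ``Message`` is a hypothetical
# SQLModel table and ``select`` comes from sqlmodel/sqlalchemy):
#
#     async with get_session() as session:
#         result = await session.execute(select(Message).limit(10))
#         messages = result.scalars().all()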
@retry_on_db_lock(max_retries=5, base_delay=0.1, max_delay=5.0)
async def ensure_schema(settings: Settings | None = None) -> None:
"""Ensure database schema exists (creates tables from SQLModel definitions).
This is the pure SQLModel approach:
- Models define the schema
- create_all() creates tables that don't exist yet
- For schema changes: delete the DB and regenerate (dev) or use Alembic (prod)
Also enables SQLite WAL mode for better concurrent access.
"""
global _schema_ready, _schema_lock
if _schema_ready:
return
if _schema_lock is None:
_schema_lock = asyncio.Lock()
async with _schema_lock:
if _schema_ready:
return
init_engine(settings)
engine = get_engine()
async with engine.begin() as conn:
# Pure SQLModel: create tables from metadata
# (WAL mode is set automatically via event listener in _build_engine)
await conn.run_sync(SQLModel.metadata.create_all)
# Setup FTS and custom indexes
await conn.run_sync(_setup_fts)
_schema_ready = True
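# Example: calling ensure_schema once at application startup (a sketch; the
# double-checked lock above makes concurrent calls within one event loop safe):
#
#     async def on_startup() -> None:
#         await ensure_schema()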
def reset_database_state() -> None:
"""Test helper to reset global engine/session state."""
    global _engine, _session_factory, _schema_ready, _schema_lock, _QUERY_HOOKS_INSTALLED
# Dispose any existing engine/pool first to avoid leaking file descriptors across tests.
if _engine is not None:
engine = _engine
try:
# Prefer a full async dispose when possible (aiosqlite uses background threads).
try:
running = asyncio.get_running_loop()
except RuntimeError:
running = None
if running is not None and running.is_running():
# Can't block; fall back to sync pool disposal (best effort).
engine.sync_engine.dispose()
else:
try:
loop = asyncio.get_event_loop()
except RuntimeError:
loop = None
if loop is not None and not loop.is_running() and not loop.is_closed():
loop.run_until_complete(engine.dispose())
else:
asyncio.run(engine.dispose())
except Exception:
# Last resort: sync pool disposal.
with suppress(Exception):
engine.sync_engine.dispose()
_engine = None
_session_factory = None
_schema_ready = False
    _schema_lock = None
    # Allow hooks to be reinstalled on the next engine build; otherwise a
    # rebuilt engine would silently skip query tracking.
    _QUERY_HOOKS_INSTALLED = False
# Tests frequently mutate env vars; keep settings cache in sync with DB resets.
clear_settings_cache()
def _setup_fts(connection: Any) -> None:
connection.exec_driver_sql(
"CREATE VIRTUAL TABLE IF NOT EXISTS fts_messages USING fts5(message_id UNINDEXED, subject, body)"
)
connection.exec_driver_sql(
"""
CREATE TRIGGER IF NOT EXISTS fts_messages_ai
AFTER INSERT ON messages
BEGIN
INSERT INTO fts_messages(rowid, message_id, subject, body)
VALUES (new.id, new.id, new.subject, new.body_md);
END;
"""
)
connection.exec_driver_sql(
"""
CREATE TRIGGER IF NOT EXISTS fts_messages_ad
AFTER DELETE ON messages
BEGIN
DELETE FROM fts_messages WHERE rowid = old.id;
END;
"""
)
connection.exec_driver_sql(
"""
CREATE TRIGGER IF NOT EXISTS fts_messages_au
AFTER UPDATE ON messages
BEGIN
DELETE FROM fts_messages WHERE rowid = old.id;
INSERT INTO fts_messages(rowid, message_id, subject, body)
VALUES (new.id, new.id, new.subject, new.body_md);
END;
"""
)
    # Additional performance indexes for common access patterns, including the
    # AgentLink indexes used for efficient contact lookups.
    for ddl in (
        "CREATE INDEX IF NOT EXISTS idx_messages_created_ts ON messages(created_ts)",
        "CREATE INDEX IF NOT EXISTS idx_messages_thread_id ON messages(thread_id)",
        "CREATE INDEX IF NOT EXISTS idx_messages_importance ON messages(importance)",
        "CREATE INDEX IF NOT EXISTS idx_messages_sender_created ON messages(sender_id, created_ts DESC)",
        "CREATE INDEX IF NOT EXISTS idx_messages_project_created ON messages(project_id, created_ts DESC)",
        "CREATE INDEX IF NOT EXISTS idx_file_reservations_expires_ts ON file_reservations(expires_ts)",
        "CREATE INDEX IF NOT EXISTS idx_message_recipients_agent ON message_recipients(agent_id)",
        "CREATE INDEX IF NOT EXISTS idx_message_recipients_agent_message "
        "ON message_recipients(agent_id, message_id)",
        "CREATE INDEX IF NOT EXISTS idx_messages_project_sender_created "
        "ON messages(project_id, sender_id, created_ts DESC)",
        "CREATE INDEX IF NOT EXISTS idx_file_reservations_project_released_expires "
        "ON file_reservations(project_id, released_ts, expires_ts)",
        "CREATE INDEX IF NOT EXISTS idx_file_reservations_project_agent_released "
        "ON file_reservations(project_id, agent_id, released_ts)",
        "CREATE INDEX IF NOT EXISTS idx_product_project "
        "ON product_project_links(product_id, project_id)",
        "CREATE INDEX IF NOT EXISTS idx_agent_links_a_project ON agent_links(a_project_id)",
        "CREATE INDEX IF NOT EXISTS idx_agent_links_b_project ON agent_links(b_project_id)",
        "CREATE INDEX IF NOT EXISTS idx_agent_links_b_project_agent "
        "ON agent_links(b_project_id, b_agent_id)",
        "CREATE INDEX IF NOT EXISTS idx_agent_links_status ON agent_links(status)",
    ):
        connection.exec_driver_sql(ddl)
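    # Example FTS5 lookup against the index maintained by the triggers above
    # (a sketch; run it via exec_driver_sql or a text() query):
    #
    #     SELECT m.* FROM messages m
    #     JOIN fts_messages ON fts_messages.rowid = m.id
    #     WHERE fts_messages MATCH 'release notes'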
def get_database_path(settings: Settings | None = None) -> Path | None:
"""Extract the filesystem path to the SQLite database file from settings.
Args:
settings: Application settings, or None to use global settings
Returns:
Path to the database file, or None if not using SQLite or path cannot be determined
"""
resolved = settings or get_settings()
url_raw = resolved.database.url
try:
from sqlalchemy.engine import make_url
parsed = make_url(url_raw)
except Exception:
return None
if parsed.get_backend_name() != "sqlite":
return None
db_path = parsed.database
if not db_path or db_path == ":memory:":
return None
return Path(db_path)
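# Example (a sketch): with a database URL of "sqlite+aiosqlite:///./storage/app.db",
# get_database_path() returns Path("./storage/app.db"); PostgreSQL URLs and
# in-memory SQLite databases return None.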