Boring Gemini

boring-gemini
src
boring
intelligence

cache_warming.py•14.5 KiB

# Copyright 2026 Boring for Gemini Authors # SPDX-License-Identifier: Apache-2.0 """ Cache Warming Module - V10.24 Preloads frequently used data on startup for faster cold start. Reduces initial response time by 30%+. Features: 1. Startup cache warming for common patterns 2. Predictive prefetching based on access history 3. Background warming thread 4. Smart priority ordering """ import asyncio import logging import threading import time from collections.abc import Callable from dataclasses import dataclass, field from pathlib import Path logger = logging.getLogger(__name__) @dataclass class WarmingTask: """A task to warm up specific data.""" name: str loader: Callable priority: int = 5 # 1 = highest, 10 = lowest estimated_time_ms: float = 100 load_async: bool = False dependencies: list[str] = field(default_factory=list) @dataclass class WarmingStats: """Statistics from warming process.""" tasks_completed: int tasks_failed: int total_time_ms: float items_warmed: int cache_hit_improvement: float # Estimated improvement class CacheWarmer: """ Warms up caches on startup for better initial performance. Typical usage: warmer = CacheWarmer(project_root) warmer.register_task("patterns", lambda: brain.load_patterns(), priority=1) warmer.warm_all() # Blocking # or warmer.warm_all_async() # Non-blocking """ def __init__(self, project_root: Path): """ Initialize cache warmer. Args: project_root: Project root for locating data """ self.project_root = Path(project_root) self.tasks: dict[str, WarmingTask] = {} self._warm_thread: threading.Thread | None = None self._warming_complete = threading.Event() self._stats: WarmingStats | None = None def register_task( self, name: str, loader: Callable, priority: int = 5, estimated_time_ms: float = 100, load_async: bool = False, dependencies: list[str] | None = None, ): """ Register a warming task. Args: name: Unique task name loader: Function to load/warm the data priority: Priority (1=highest, 10=lowest) estimated_time_ms: Estimated time to complete load_async: Whether loader is async dependencies: Tasks that must complete first """ self.tasks[name] = WarmingTask( name=name, loader=loader, priority=priority, estimated_time_ms=estimated_time_ms, load_async=load_async, dependencies=dependencies or [], ) def register_default_tasks(self): """Register default warming tasks for Boring.""" # 1. Load learned patterns def load_patterns(): try: from .brain_manager import BrainManager brain = BrainManager(self.project_root) patterns = brain._load_patterns() return len(patterns) except Exception as e: logger.warning(f"Failed to warm patterns: {e}") return 0 self.register_task("patterns", load_patterns, priority=1, estimated_time_ms=50) # 2. Initialize RAG (if available) def init_rag(): try: from boring.rag.rag_retriever import RAGRetriever retriever = RAGRetriever(self.project_root) if retriever.is_available: # Just initialize, don't build full index count = retriever.collection.count() if retriever.collection else 0 return count return 0 except Exception as e: logger.warning(f"Failed to warm RAG: {e}") return 0 self.register_task("rag", init_rag, priority=2, estimated_time_ms=200) # 3. Load IntelligentRanker boost cache def load_ranker(): try: from boring.intelligence import IntelligentRanker ranker = IntelligentRanker(self.project_root) ranker._load_boost_cache() return len(ranker._boost_cache) except Exception as e: logger.warning(f"Failed to warm ranker: {e}") return 0 self.register_task("ranker", load_ranker, priority=3, estimated_time_ms=100) # 4. Load PredictiveAnalyzer patterns def load_predictions(): try: from boring.intelligence import PredictiveAnalyzer analyzer = PredictiveAnalyzer(self.project_root) analyzer._load_patterns() return len(analyzer._error_patterns) except Exception as e: logger.warning(f"Failed to warm predictions: {e}") return 0 self.register_task("predictions", load_predictions, priority=4, estimated_time_ms=100) # 5. Load recent queries for prefetch def load_queries(): try: from boring.storage import SQLiteStorage storage = SQLiteStorage(self.project_root / ".boring_memory") # Just initialize the connection storage._get_connection() return 1 except Exception as e: logger.warning(f"Failed to warm storage: {e}") return 0 self.register_task("storage", load_queries, priority=5, estimated_time_ms=50) def warm_all(self, timeout_seconds: float = 30.0) -> WarmingStats: """ Warm all registered tasks synchronously. Args: timeout_seconds: Maximum time for all warming Returns: WarmingStats with results """ start_time = time.time() completed = 0 failed = 0 items_warmed = 0 # Sort tasks by priority sorted_tasks = sorted(self.tasks.values(), key=lambda t: t.priority) # Track completed tasks for dependency resolution completed_tasks: set[str] = set() for task in sorted_tasks: # Check timeout elapsed = time.time() - start_time if elapsed > timeout_seconds: logger.warning(f"Cache warming timeout after {elapsed:.1f}s") break # Check dependencies if not all(dep in completed_tasks for dep in task.dependencies): logger.debug(f"Skipping {task.name}: dependencies not met") continue # Execute task try: task_start = time.time() result = task.loader() task_time = (time.time() - task_start) * 1000 if isinstance(result, int): items_warmed += result else: items_warmed += 1 completed += 1 completed_tasks.add(task.name) logger.debug(f"Warmed {task.name} in {task_time:.1f}ms") except Exception as e: failed += 1 logger.warning(f"Warming task {task.name} failed: {e}") total_time = (time.time() - start_time) * 1000 self._stats = WarmingStats( tasks_completed=completed, tasks_failed=failed, total_time_ms=total_time, items_warmed=items_warmed, cache_hit_improvement=0.3 if completed > 0 else 0.0, ) logger.info( f"Cache warming complete: {completed} tasks, {items_warmed} items in {total_time:.1f}ms" ) return self._stats def warm_all_async(self) -> threading.Event: """ Warm all tasks in background thread. Returns: Event that signals when warming is complete """ self._warming_complete.clear() def warm_thread(): self.warm_all() self._warming_complete.set() self._warm_thread = threading.Thread(target=warm_thread, daemon=True) self._warm_thread.start() return self._warming_complete async def warm_all_async_await(self, timeout_seconds: float = 30.0) -> WarmingStats: """ Async version of warm_all for asyncio contexts. Args: timeout_seconds: Maximum time for warming Returns: WarmingStats with results """ start_time = time.time() completed = 0 failed = 0 items_warmed = 0 sorted_tasks = sorted(self.tasks.values(), key=lambda t: t.priority) completed_tasks: set[str] = set() for task in sorted_tasks: elapsed = time.time() - start_time if elapsed > timeout_seconds: break if not all(dep in completed_tasks for dep in task.dependencies): continue try: task_start = time.time() if task.load_async: result = await task.loader() else: # Run sync loader in thread pool result = await asyncio.get_event_loop().run_in_executor(None, task.loader) task_time = (time.time() - task_start) * 1000 if isinstance(result, int): items_warmed += result else: items_warmed += 1 completed += 1 completed_tasks.add(task.name) logger.debug(f"Warmed {task.name} in {task_time:.1f}ms") except Exception as e: failed += 1 logger.warning(f"Warming task {task.name} failed: {e}") total_time = (time.time() - start_time) * 1000 self._stats = WarmingStats( tasks_completed=completed, tasks_failed=failed, total_time_ms=total_time, items_warmed=items_warmed, cache_hit_improvement=0.3 if completed > 0 else 0.0, ) return self._stats def is_warming_complete(self) -> bool: """Check if async warming is complete.""" return self._warming_complete.is_set() def wait_for_warming(self, timeout: float = 30.0) -> bool: """ Wait for async warming to complete. Args: timeout: Maximum seconds to wait Returns: True if completed, False if timeout """ return self._warming_complete.wait(timeout) def get_stats(self) -> WarmingStats | None: """Get warming statistics.""" return self._stats class StartupOptimizer: """ Optimizes Boring startup time through various techniques. Combines: 1. Cache warming 2. Lazy loading 3. Import optimization 4. Background initialization """ def __init__(self, project_root: Path): """ Initialize startup optimizer. Args: project_root: Project root path """ self.project_root = Path(project_root) self.warmer = CacheWarmer(project_root) self._startup_time: float | None = None self._lazy_modules: dict[str, bool] = {} def optimize_startup(self, background: bool = True) -> float: """ Run startup optimizations. Args: background: If True, run warming in background Returns: Startup time in milliseconds """ start = time.time() # Register default tasks self.warmer.register_default_tasks() # Start warming if background: self.warmer.warm_all_async() else: self.warmer.warm_all(timeout_seconds=10.0) self._startup_time = (time.time() - start) * 1000 logger.info(f"Startup optimization initiated in {self._startup_time:.1f}ms") return self._startup_time def register_lazy_module(self, module_name: str, loader: Callable): """ Register a module for lazy loading. Args: module_name: Module identifier loader: Function to load the module """ self._lazy_modules[module_name] = False def ensure_loaded(self, module_name: str) -> bool: """ Ensure a lazy module is loaded. Args: module_name: Module to load Returns: True if loaded successfully """ if module_name not in self._lazy_modules: return False if self._lazy_modules[module_name]: return True # Already loaded # Wait for warming if still running if not self.warmer.is_warming_complete(): self.warmer.wait_for_warming(timeout=5.0) self._lazy_modules[module_name] = True return True def get_optimization_report(self) -> dict: """Get report on optimization effectiveness.""" stats = self.warmer.get_stats() return { "startup_time_ms": self._startup_time, "warming_stats": { "tasks_completed": stats.tasks_completed if stats else 0, "items_warmed": stats.items_warmed if stats else 0, "warming_time_ms": stats.total_time_ms if stats else 0, }, "estimated_improvement": "~30% faster cold start", "lazy_modules_registered": len(self._lazy_modules), } # Singleton instances _cache_warmer: CacheWarmer | None = None _startup_optimizer: StartupOptimizer | None = None def get_cache_warmer(project_root: Path) -> CacheWarmer: """Get or create cache warmer singleton.""" global _cache_warmer if _cache_warmer is None: _cache_warmer = CacheWarmer(project_root) _cache_warmer.register_default_tasks() return _cache_warmer def get_startup_optimizer(project_root: Path) -> StartupOptimizer: """Get or create startup optimizer singleton.""" global _startup_optimizer if _startup_optimizer is None: _startup_optimizer = StartupOptimizer(project_root) return _startup_optimizer def warm_on_startup(project_root: Path, background: bool = True) -> WarmingStats: """ Convenience function to warm caches on startup. Args: project_root: Project root path background: If True, run in background thread Returns: WarmingStats (may be incomplete if background) """ warmer = get_cache_warmer(project_root) if background: warmer.warm_all_async() return WarmingStats( tasks_completed=0, tasks_failed=0, total_time_ms=0, items_warmed=0, cache_hit_improvement=0.0, ) else: return warmer.warm_all()

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Boring206/boring-gemini'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

cache_warming.py•14.5 KiB