M.I.M.I.R - Multi-agent Intelligent Memory & Insight Repository

Overview Schema Related Servers Score Discussions

Mimir
nornicdb
pkg
inference

inference.go•32.1 KiB

// Package inference provides automatic relationship detection for NornicDB.
//
// This package implements multiple methods for detecting implicit relationships
// between nodes in the graph:
//   - Similarity-based: Nodes with similar embeddings are likely related
//   - Co-access patterns: Nodes accessed together frequently are likely related
//   - Temporal proximity: Nodes accessed in the same session are likely related
//   - Transitive inference: If A→B and B→C, then A→C (with confidence)
//
// Example Usage:
//
//	// Create inference engine
//	config := inference.DefaultConfig()
//	config.SimilarityThreshold = 0.85 // Higher threshold = more confidence
//	engine := inference.New(config)
//
//	// Hook up vector search
//	engine.SetSimilaritySearch(func(ctx context.Context, embedding []float32, k int) ([]inference.SimilarityResult, error) {
//		return vectorIndex.Search(ctx, embedding, k)
//	})
//
//	// When storing a new memory
//	node := createMemoryNode("Remember to buy milk")
//	suggestions, _ := engine.OnStore(ctx, node.ID, node.Embedding)
//
//	fmt.Printf("Found %d suggested relationships:\n", len(suggestions))
//	for _, sug := range suggestions {
//		fmt.Printf("  %s -> %s (%.2f confidence): %s\n",
//			sug.SourceID, sug.TargetID, sug.Confidence, sug.Reason)
//
//		if sug.Confidence > 0.7 {
//			// High confidence - auto-create the edge
//			createEdge(sug.SourceID, sug.TargetID, sug.Type)
//		}
//	}
//
//	// When accessing a memory
//	suggestions = engine.OnAccess(ctx, "memory-123")
//	for _, sug := range suggestions {
//		if sug.Method == "co_access" {
//			fmt.Printf("Frequently accessed with: %s\n", sug.TargetID)
//		}
//	}
//
// How Each Method Works:
//
//  1. Similarity-Based Linking:
//     Uses vector embeddings to find semantically similar nodes.
//     Example: "Buy milk" and "Purchase dairy products" have similar embeddings.
//
//  2. Co-Access Patterns:
//     Tracks which nodes are accessed within a short time window.
//     Example: If you always access "Project Plan" and "Budget" together,
//     they're probably related.
//
//  3. Temporal Proximity:
//     Nodes accessed in the same session (within 30 minutes) are linked.
//     Example: All memories from a single conversation thread.
//
//  4. Transitive Inference:
//     If A relates to B and B relates to C, then A might relate to C.
//     Example: "Python" → "Programming" → "Computers" suggests "Python" → "Computers"
//
// ELI12 (Explain Like I'm 12):
//
// Imagine you're organizing your school notebooks:
//
//  1. **Similarity**: Your math and science notebooks go together because they're
//     both about numbers and formulas (similar content).
//
//  2. **Co-access**: Your English notebook and dictionary always get used together,
//     so they should be near each other on your shelf.
//
//  3. **Temporal**: All homework from Monday night was done at the same time,
//     so those papers are related.
//
//  4. **Transitive**: If Math relates to Science, and Science relates to Biology,
//     then Math probably relates to Biology too (they're all STEM subjects).
//
// The inference engine is like a smart librarian who notices these patterns
// and suggests: "Hey, these two things seem related - want me to connect them?"
package inference

import (
	"context"
	"sync"
	"time"

	"github.com/orneryd/nornicdb/pkg/config"
	"github.com/orneryd/nornicdb/pkg/storage"
)

// EdgeSuggestion represents a suggested edge.
type EdgeSuggestion struct {
	SourceID   string
	TargetID   string
	Type       string
	Confidence float64
	Reason     string
	Method     string // similarity, co_access, temporal, transitive
}

// Config holds inference engine configuration options.
//
// All thresholds and parameters can be tuned based on your use case:
//   - Higher thresholds = fewer but more confident suggestions
//   - Lower thresholds = more suggestions but potentially noisier
//
// Example:
//
//	// Conservative: Only suggest very confident relationships
//	config := &inference.Config{
//		SimilarityThreshold: 0.90, // Very high bar
//		SimilarityTopK:      5,    // Only check top 5
//		CoAccessMinCount:    5,    // Need 5 co-accesses
//		TransitiveMinConf:   0.7,  // High confidence for transitive
//	}
//
//	// Aggressive: Suggest many potential relationships
//	config = &inference.Config{
//		SimilarityThreshold: 0.75, // Lower bar
//		SimilarityTopK:      20,   // Check top 20
//		CoAccessMinCount:    2,    // Just 2 co-accesses
//		TransitiveMinConf:   0.3,  // Lower confidence OK
//	}
type Config struct {
	// Similarity-based linking
	SimilarityThreshold float64 // Default: 0.82
	SimilarityTopK      int     // How many similar nodes to check

	// Co-access pattern detection
	CoAccessEnabled  bool
	CoAccessWindow   time.Duration // Time window for co-access
	CoAccessMinCount int           // Minimum co-accesses to suggest edge

	// Temporal proximity
	TemporalEnabled bool
	TemporalWindow  time.Duration // Window for "same session"

	// Transitive inference
	TransitiveEnabled bool
	TransitiveMinConf float64 // Minimum confidence for transitive edges
}

// DefaultConfig returns balanced default configuration suitable for most use cases.
//
// Defaults:
//   - SimilarityThreshold: 0.82 (fairly confident)
//   - SimilarityTopK: 10 (check 10 most similar)
//   - CoAccessWindow: 30 seconds
//   - CoAccessMinCount: 3 (need 3 co-accesses before suggesting)
//   - TemporalWindow: 30 minutes (same "session")
//   - TransitiveMinConf: 0.5 (moderate confidence)
//
// Example:
//
//	config := inference.DefaultConfig()
//	engine := inference.New(config)
//
//	// Or customize
//	config = inference.DefaultConfig()
//	config.SimilarityThreshold = 0.90 // Stricter
//	engine = inference.New(config)
func DefaultConfig() *Config {
	return &Config{
		SimilarityThreshold: 0.82,
		SimilarityTopK:      10,
		CoAccessEnabled:     true,
		CoAccessWindow:      30 * time.Second,
		CoAccessMinCount:    3,
		TemporalEnabled:     true,
		TemporalWindow:      30 * time.Minute,
		TransitiveEnabled:   true,
		TransitiveMinConf:   0.5,
	}
}

// Engine handles automatic relationship inference using multiple detection methods.
//
// The Engine is thread-safe and can be used concurrently. It maintains
// internal state for co-access tracking and temporal pattern detection.
//
// Lifecycle:
//  1. Create with New()
//  2. Configure similarity search with SetSimilaritySearch()
//  3. Call OnStore() when creating nodes
//  4. Call OnAccess() when accessing nodes
//  5. Periodically call SuggestTransitive() to find indirect relationships
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Connect to vector index
//	engine.SetSimilaritySearch(vectorIndex.Search)
//
//	// Use in your storage layer
//	func StoreMemory(mem *Memory) error {
//		// Store the memory
//		if err := db.Store(mem); err != nil {
//			return err
//		}
//
//		// Get relationship suggestions
//		suggestions, _ := engine.OnStore(ctx, mem.ID, mem.Embedding)
//
//		// Auto-create high-confidence edges
//		for _, sug := range suggestions {
//			if sug.Confidence >= 0.7 {
//				db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type, sug.Confidence)
//			}
//		}
//
//		return nil
//	}
type Engine struct {
	config *Config
	mu     sync.RWMutex

	// Co-access tracking
	accessHistory  []accessRecord
	coAccessCounts map[coAccessKey]int

	// For similarity lookups (injected dependency)
	similaritySearch func(ctx context.Context, embedding []float32, k int) ([]SimilarityResult, error)

	// Optional topology integration (NEW)
	topologyIntegration *TopologyIntegration

	// Optional cluster integration for GPU-accelerated search
	clusterIntegration *ClusterIntegration

	// Optional Kalman adapter for smoothed confidence and temporal patterns
	// Enabled via NORNICDB_KALMAN_ENABLED=true
	kalmanAdapter *KalmanAdapter

	// Tier 1 features - enabled by default for production safety
	cooldownTable   *CooldownTable           // Prevents rapid re-materialization
	evidenceBuffer  *EvidenceBuffer          // Requires multiple signals before materializing
	edgeMetaStore   *storage.EdgeMetaStore   // Logs edge provenance for audit trails
	nodeConfigStore *storage.NodeConfigStore // Per-node edge creation rules

	// Heimdall SLM quality control - validates edges before creation
	// Enabled via NORNICDB_AUTO_TLP_LLM_QC_ENABLED=true
	heimdallQC *HeimdallQC
}

type accessRecord struct {
	NodeID    string
	Timestamp time.Time
}

type coAccessKey struct {
	NodeA string
	NodeB string
}

// SimilarityResult from vector search.
type SimilarityResult struct {
	ID    string
	Score float64
}

// New creates a new inference Engine with the given configuration.
//
// If config is nil, DefaultConfig() is used.
//
// The engine starts with empty co-access tracking. Call SetSimilaritySearch()
// to enable similarity-based inference.
//
// Example:
//
//	// With defaults
//	engine := inference.New(nil)
//
//	// With custom config
//	config := &inference.Config{
//		SimilarityThreshold: 0.85,
//		SimilarityTopK:      15,
//		CoAccessEnabled:     true,
//	}
//	engine = inference.New(config)
//
// Returns a new Engine ready for use.
func New(config *Config) *Engine {
	if config == nil {
		config = DefaultConfig()
	}

	return &Engine{
		config:          config,
		accessHistory:   make([]accessRecord, 0),
		coAccessCounts:  make(map[coAccessKey]int),
		cooldownTable:   NewCooldownTable(),
		evidenceBuffer:  NewEvidenceBuffer(),
		edgeMetaStore:   storage.NewEdgeMetaStore(),
		nodeConfigStore: storage.NewNodeConfigStore(),
	}
}

// SetSimilaritySearch sets the similarity search function.
func (e *Engine) SetSimilaritySearch(fn func(ctx context.Context, embedding []float32, k int) ([]SimilarityResult, error)) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.similaritySearch = fn
}

// SetTopologyIntegration enables topological link prediction.
//
// This adds graph structure analysis to edge suggestions, combining topology
// with semantic/behavioral signals for more robust predictions.
//
// Parameters:
//   - integration: TopologyIntegration instance (nil to disable)
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Enable topology
//	topoConfig := inference.DefaultTopologyConfig()
//	topoConfig.Enabled = true
//	topoConfig.Weight = 0.4  // 40% topology, 60% semantic
//
//	topo := inference.NewTopologyIntegration(storage, topoConfig)
//	engine.SetTopologyIntegration(topo)
//
//	// Now suggestions include topology signals
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
func (e *Engine) SetTopologyIntegration(integration *TopologyIntegration) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.topologyIntegration = integration
}

// GetTopologyIntegration returns the current topology integration (or nil).
func (e *Engine) GetTopologyIntegration() *TopologyIntegration {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.topologyIntegration
}

// SetClusterIntegration enables GPU-accelerated k-means clustering for similarity search.
//
// When enabled, similarity searches are accelerated using cluster-based
// approximate nearest neighbor search. This provides significant speedup
// for large embedding indices (10K+ embeddings).
//
// Parameters:
//   - integration: ClusterIntegration instance (nil to disable)
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Enable clustering
//	gpuManager, _ := gpu.NewManager(&gpu.Config{Enabled: true})
//	clusterConfig := inference.DefaultClusterConfig()
//	clusterConfig.Enabled = true
//	clusterConfig.NumClustersSearch = 5
//
//	ci := inference.NewClusterIntegration(gpuManager, clusterConfig, nil, nil)
//	engine.SetClusterIntegration(ci)
//
//	// Add embeddings during indexing
//	ci.AddEmbedding(nodeID, embedding)
//
//	// Trigger clustering after bulk load
//	ci.OnIndexComplete()
//
//	// Searches now use cluster acceleration
//	results, _ := ci.Search(ctx, queryEmbedding, 10)
func (e *Engine) SetClusterIntegration(integration *ClusterIntegration) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.clusterIntegration = integration
}

// GetClusterIntegration returns the current cluster integration (or nil).
func (e *Engine) GetClusterIntegration() *ClusterIntegration {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.clusterIntegration
}

// SetKalmanAdapter configures the Kalman-enhanced inference adapter.
//
// The KalmanAdapter provides:
//   - Smoothed confidence scores using Kalman filtering
//   - Temporal access pattern tracking
//   - Session-aware co-access detection
//   - Relationship strength trend analysis
//
// This is an OPTIONAL enhancement - if not set, base inference works normally.
// Enable via NORNICDB_KALMAN_ENABLED=true environment variable.
//
// Example:
//
//	if config.IsKalmanEnabled() {
//		adapter := inference.NewKalmanAdapter(engine, inference.DefaultKalmanAdapterConfig())
//		tracker := temporal.NewTracker(temporal.DefaultConfig())
//		adapter.SetTracker(tracker)
//		engine.SetKalmanAdapter(adapter)
//	}
func (e *Engine) SetKalmanAdapter(adapter *KalmanAdapter) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.kalmanAdapter = adapter
}

// GetKalmanAdapter returns the current Kalman adapter (or nil if not configured).
func (e *Engine) GetKalmanAdapter() *KalmanAdapter {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.kalmanAdapter
}

// SetHeimdallQC sets the Heimdall SLM quality control for edge validation.
//
// When set and enabled (via NORNICDB_AUTO_TLP_LLM_QC_ENABLED=true), each
// edge suggestion from OnStore() and OnAccess() will be validated by
// the Heimdall SLM before being returned. The SLM can approve, reject,
// or modify the suggested relationship type.
//
// Example:
//
//	// Create Heimdall QC with your SLM function
//	qc := inference.NewHeimdallQC(func(ctx context.Context, prompt string) (string, error) {
//		return myOllamaClient.Complete(ctx, prompt)
//	}, nil)
//
//	engine.SetHeimdallQC(qc)
//
//	// Now suggestions are validated by Heimdall
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
//	// Only returns approved suggestions
func (e *Engine) SetHeimdallQC(qc *HeimdallQC) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.heimdallQC = qc
}

// GetHeimdallQC returns the current Heimdall QC (or nil if not configured).
func (e *Engine) GetHeimdallQC() *HeimdallQC {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.heimdallQC
}

// OnStore is called when a new node is stored in the graph.
//
// This method analyzes the new node and suggests relationships based on
// vector similarity. High-confidence suggestions can be automatically
// created as edges.
//
// Parameters:
//   - ctx: Context for cancellation
//   - nodeID: ID of the newly created node
//   - embedding: Vector embedding of the node's content
//
// Returns:
//   - Slice of EdgeSuggestion with confidence scores and reasons
//   - Error if similarity search fails
//
// Example:
//
//	// User creates a new note
//	note := &Note{
//		ID:      "note-456",
//		Content: "Machine learning algorithms",
//		Embedding: embedder.Embed("Machine learning algorithms"),
//	}
//
//	// Get suggestions
//	suggestions, err := engine.OnStore(ctx, note.ID, note.Embedding)
//	if err != nil {
//		return err
//	}
//
//	fmt.Printf("Found %d related notes:\n", len(suggestions))
//	for _, sug := range suggestions {
//		relatedNote := getNote(sug.TargetID)
//		fmt.Printf("  - %s (%.0f%% confident): %s\n",
//			relatedNote.Title, sug.Confidence*100, sug.Reason)
//
//		// Auto-link if very confident
//		if sug.Confidence >= 0.8 {
//			createEdge(sug)
//			log.Printf("Auto-linked: %s -> %s", note.ID, relatedNote.ID)
//		}
//	}
//
// Typical confidence levels:
//   - 0.9+: Very confident, safe to auto-create
//   - 0.7-0.9: Confident, suggest to user
//   - 0.5-0.7: Possible, show as "related"
//   - <0.5: Weak, ignore
func (e *Engine) OnStore(ctx context.Context, nodeID string, embedding []float32) ([]EdgeSuggestion, error) {
	e.mu.Lock()
	defer e.mu.Unlock()

	suggestions := make([]EdgeSuggestion, 0)

	// 1. Similarity-based suggestions (semantic)
	if e.similaritySearch != nil && len(embedding) > 0 {
		similar, err := e.similaritySearch(ctx, embedding, e.config.SimilarityTopK)
		if err == nil {
			for _, result := range similar {
				if result.ID == nodeID {
					continue // Skip self
				}
				if result.Score >= e.config.SimilarityThreshold {
					conf := e.scoreToConfidence(result.Score)
					suggestions = append(suggestions, EdgeSuggestion{
						SourceID:   nodeID,
						TargetID:   result.ID,
						Type:       "RELATES_TO",
						Confidence: conf,
						Reason:     "High embedding similarity",
						Method:     "similarity",
					})
				}
			}
		}
	}

	// 2. Topological suggestions (NEW - feature flagged for AUTOMATIC integration)
	// Note: Cypher procedures (CALL gds.linkPrediction.*) are always available
	// This flag only controls automatic use in OnStore()
	if e.topologyIntegration != nil {
		// Check feature flag via config (automatic integration)
		topoConfig := e.topologyIntegration.config
		if topoConfig != nil && topoConfig.Enabled {
			topoSuggestions, err := e.topologyIntegration.SuggestTopological(ctx, nodeID)
			if err == nil && len(topoSuggestions) > 0 {
				// Combine semantic and topological suggestions
				suggestions = e.topologyIntegration.CombinedSuggestions(suggestions, topoSuggestions)
			}
		}
	}

	// 3. Heimdall QC validation (if enabled)
	// Each suggestion is sent to the SLM for approval before returning
	if e.heimdallQC != nil && config.IsAutoTLPLLMQCEnabled() {
		suggestions = e.validateSuggestionsWithHeimdall(ctx, nodeID, suggestions)
	}

	return suggestions, nil
}

// validateSuggestionsWithHeimdall filters suggestions through Heimdall SLM batch review.
// Returns approved suggestions + any augmented suggestions from Heimdall.
func (e *Engine) validateSuggestionsWithHeimdall(ctx context.Context, sourceNodeID string, suggestions []EdgeSuggestion) []EdgeSuggestion {
	if len(suggestions) == 0 || e.heimdallQC == nil {
		return suggestions
	}

	// Build source node summary
	// Note: In a full implementation, we'd look up the node from storage
	sourceNode := NodeSummary{
		ID:     sourceNodeID,
		Labels: []string{}, // Would be populated from storage
		Props:  make(map[string]string),
	}

	// Build candidate pool for augmentation (empty for now - could be populated from similarity search)
	var candidatePool []NodeSummary

	// Call Heimdall batch review
	approved, augmented, err := e.heimdallQC.ReviewBatch(ctx, sourceNode, suggestions, candidatePool)
	if err != nil {
		// On error, return original suggestions (fail-open)
		return suggestions
	}

	// Set source ID on augmented edges
	for i := range augmented {
		augmented[i].SourceID = sourceNodeID
	}

	// Combine approved + augmented
	result := append(approved, augmented...)
	return result
}

// OnAccess is called when a node is accessed (read).
//
// This method tracks co-access patterns - nodes that are accessed close together
// in time are likely related. After seeing the same pair accessed together
// multiple times, it suggests creating a relationship.
//
// Parameters:
//   - ctx: Context (currently unused, reserved for future)
//   - nodeID: ID of the accessed node
//
// Returns:
//   - Slice of EdgeSuggestion based on co-access patterns
//
// Example:
//
//	func GetMemory(id string) (*Memory, error) {
//		// Retrieve memory
//		mem, err := db.Get(id)
//		if err != nil {
//			return nil, err
//		}
//
//		// Track access for inference
//		suggestions := engine.OnAccess(ctx, id)
//
//		// Log co-access patterns
//		for _, sug := range suggestions {
//			if sug.Method == "co_access" {
//				log.Printf("Co-accessed with %s (%d times)",
//					sug.TargetID, sug.Confidence*10)
//
//				// Create edge if frequently co-accessed
//				if sug.Confidence >= 0.6 {
//					createEdge(sug)
//				}
//			}
//		}
//
//		return mem, nil
//	}
//
// How It Works:
//
//	The engine maintains a sliding window of recent accesses.
//	When you access node A, it checks what other nodes were accessed
//	in the last 30 seconds (configurable). If the same pair appears
//	multiple times, it suggests they're related.
//
// Use Case:
//
//	In a note-taking app, if you always view "Project Plan" and "Budget"
//	together, the engine suggests: "These seem related - want to link them?"
func (e *Engine) OnAccess(ctx context.Context, nodeID string) []EdgeSuggestion {
	e.mu.Lock()
	defer e.mu.Unlock()

	now := time.Now()
	suggestions := make([]EdgeSuggestion, 0)

	if !e.config.CoAccessEnabled {
		return suggestions
	}

	// Find recent accesses within the window
	windowStart := now.Add(-e.config.CoAccessWindow)
	recentNodes := make([]string, 0)

	for _, record := range e.accessHistory {
		if record.Timestamp.After(windowStart) && record.NodeID != nodeID {
			recentNodes = append(recentNodes, record.NodeID)
		}
	}

	// Update co-access counts
	for _, otherID := range recentNodes {
		key := e.makeCoAccessKey(nodeID, otherID)
		e.coAccessCounts[key]++

		// Check if we should suggest an edge
		if e.coAccessCounts[key] >= e.config.CoAccessMinCount {
			conf := float64(e.coAccessCounts[key]) / 10.0
			if conf > 0.8 {
				conf = 0.8 // Cap at 0.8 for co-access
			}
			suggestions = append(suggestions, EdgeSuggestion{
				SourceID:   nodeID,
				TargetID:   otherID,
				Type:       "RELATES_TO",
				Confidence: conf,
				Reason:     "Frequently accessed together",
				Method:     "co_access",
			})
		}
	}

	// Add to history
	e.accessHistory = append(e.accessHistory, accessRecord{
		NodeID:    nodeID,
		Timestamp: now,
	})

	// Prune old history
	e.pruneHistory(windowStart)

	return suggestions
}

// SuggestTransitive suggests edges based on transitive relationships.
// If A->B and B->C with sufficient confidence, suggest A->C.
func (e *Engine) SuggestTransitive(ctx context.Context, edges []ExistingEdge) []EdgeSuggestion {
	e.mu.RLock()
	defer e.mu.RUnlock()

	if !e.config.TransitiveEnabled {
		return nil
	}

	suggestions := make([]EdgeSuggestion, 0)

	// Build adjacency map
	outgoing := make(map[string][]ExistingEdge)
	for _, edge := range edges {
		outgoing[edge.SourceID] = append(outgoing[edge.SourceID], edge)
	}

	// For each A->B, look for B->C
	for _, ab := range edges {
		for _, bc := range outgoing[ab.TargetID] {
			if ab.SourceID == bc.TargetID {
				continue // Skip cycles back to origin
			}

			// Calculate transitive confidence
			conf := ab.Confidence * bc.Confidence
			if conf >= e.config.TransitiveMinConf {
				suggestions = append(suggestions, EdgeSuggestion{
					SourceID:   ab.SourceID,
					TargetID:   bc.TargetID,
					Type:       "RELATES_TO",
					Confidence: conf,
					Reason:     "Transitive via " + ab.TargetID,
					Method:     "transitive",
				})
			}
		}
	}

	return suggestions
}

// ExistingEdge represents an edge in the graph.
type ExistingEdge struct {
	SourceID   string
	TargetID   string
	Confidence float64
}

// scoreToConfidence converts similarity score to edge confidence.
func (e *Engine) scoreToConfidence(score float64) float64 {
	// Map similarity score ranges to confidence levels
	switch {
	case score >= 0.95:
		return 0.9
	case score >= 0.90:
		return 0.7
	case score >= 0.85:
		return 0.5
	default:
		return 0.3
	}
}

// makeCoAccessKey creates a consistent key for co-access tracking.
func (e *Engine) makeCoAccessKey(a, b string) coAccessKey {
	// Ensure consistent ordering
	if a < b {
		return coAccessKey{NodeA: a, NodeB: b}
	}
	return coAccessKey{NodeA: b, NodeB: a}
}

// pruneHistory removes old access records.
func (e *Engine) pruneHistory(before time.Time) {
	// Keep records newer than 'before'
	newHistory := make([]accessRecord, 0, len(e.accessHistory))
	for _, record := range e.accessHistory {
		if record.Timestamp.After(before) {
			newHistory = append(newHistory, record)
		}
	}
	e.accessHistory = newHistory
}

// Stats returns inference statistics.
type Stats struct {
	TotalSuggestions  int64
	BySimilarity      int64
	ByCoAccess        int64
	ByTransitive      int64
	TrackedCoAccesses int
}

// GetStats returns current inference statistics.
func (e *Engine) GetStats() Stats {
	e.mu.RLock()
	defer e.mu.RUnlock()

	return Stats{
		TrackedCoAccesses: len(e.coAccessCounts),
	}
}

// ProcessSuggestionResult contains the result of processing a suggestion.
type ProcessSuggestionResult struct {
	ShouldMaterialize bool   // True if edge should be created
	Reason            string // Why or why not
	CooldownBlocked   bool   // True if blocked by cooldown
	EvidencePending   bool   // True if waiting for more evidence
	NodeConfigBlocked bool   // True if blocked by per-node config (deny list, caps, etc.)
}

// ProcessSuggestion processes an edge suggestion through cooldown and evidence buffering.
//
// This method applies Tier 1 safety features (when auto-integration is enabled):
//   - Cooldown: Prevents rapid re-materialization of the same edge pair
//   - Evidence Buffering: Requires multiple signals before materializing
//
// Feature flags:
//   - NORNICDB_COOLDOWN_AUTO_INTEGRATION_ENABLED (default: true)
//   - NORNICDB_EVIDENCE_AUTO_INTEGRATION_ENABLED (default: true)
//
// Parameters:
//   - suggestion: The edge suggestion to process
//   - sessionID: Current session ID for evidence tracking
//
// Returns ProcessSuggestionResult indicating whether to create the edge.
//
// Example:
//
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
//	for _, sug := range suggestions {
//	    result := engine.ProcessSuggestion(sug, "session-123")
//	    if result.ShouldMaterialize {
//	        db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type)
//	        engine.RecordMaterialization(sug.SourceID, sug.TargetID, sug.Type)
//	    }
//	}
func (e *Engine) ProcessSuggestion(suggestion EdgeSuggestion, sessionID string) ProcessSuggestionResult {
	ctx := context.Background()
	result := ProcessSuggestionResult{
		ShouldMaterialize: true,
		Reason:            "passed all checks",
	}

	// Log provenance for this suggestion (if auto-integration enabled)
	if config.IsEdgeProvenanceAutoIntegrationEnabled() && e.edgeMetaStore != nil {
		e.edgeMetaStore.AppendFromSuggestion(
			ctx,
			suggestion.SourceID, suggestion.TargetID, suggestion.Type,
			suggestion.Confidence,
			suggestion.Method, suggestion.Method, suggestion.Reason,
			sessionID, "inference-engine",
			false, // Not materialized yet
		)
	}

	// Check cooldown (if auto-integration enabled)
	if config.IsCooldownAutoIntegrationEnabled() {
		if !e.cooldownTable.CanMaterialize(suggestion.SourceID, suggestion.TargetID, suggestion.Type) {
			result.ShouldMaterialize = false
			result.CooldownBlocked = true
			_, reason := e.cooldownTable.CanMaterializeWithReason(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
			result.Reason = "cooldown: " + reason
			return result
		}
	}

	// Check per-node config (if auto-integration enabled)
	if config.IsPerNodeConfigAutoIntegrationEnabled() && e.nodeConfigStore != nil {
		allowed, reason := e.nodeConfigStore.IsEdgeAllowedWithReason(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
		if !allowed {
			result.ShouldMaterialize = false
			result.NodeConfigBlocked = true
			result.Reason = "node-config: " + reason
			return result
		}
	}

	// Check evidence buffering (if auto-integration enabled)
	if config.IsEvidenceAutoIntegrationEnabled() {
		shouldMaterialize := e.evidenceBuffer.AddEvidence(
			suggestion.SourceID,
			suggestion.TargetID,
			suggestion.Type,
			suggestion.Confidence,
			suggestion.Method,
			sessionID,
		)

		if !shouldMaterialize {
			result.ShouldMaterialize = false
			result.EvidencePending = true
			_, reason := e.evidenceBuffer.CheckThreshold(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
			result.Reason = "evidence: " + reason
			return result
		}
	}

	return result
}

// RecordMaterialization records that an edge was materialized.
//
// Call this after successfully creating an edge to update:
//   - Cooldown tracking (prevents immediate re-creation)
//   - Provenance logs (audit trail of why edge was created)
//   - Node config edge counts (enforces per-node limits)
//
// This is the "clean up after yourself" function - ALWAYS call it after
// creating an edge to keep internal state synchronized.
//
// Example 1: Basic usage after edge creation
//
//	result := engine.ProcessSuggestion(suggestion, "session-123")
//	if result.ShouldMaterialize {
//	    db.CreateEdge(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
//	    engine.RecordMaterialization(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
//	}
//
// Example 2: Batch edge creation
//
//	for _, sug := range suggestions {
//	    if sug.Confidence > 0.8 {
//	        db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type)
//	        engine.RecordMaterialization(sug.SourceID, sug.TargetID, sug.Type)
//	    }
//	}
//
// Example 3: Manual edge creation (bypassing ProcessSuggestion)
//
//	// User explicitly creates an edge
//	db.CreateEdge("user-123", "doc-456", "bookmarked")
//	// Still record it to prevent suggestions for same edge
//	engine.RecordMaterialization("user-123", "doc-456", "bookmarked")
//
// ELI12 (Explain Like I'm 12):
//
// Think of this like checking out a library book. When you return it:
//   - Cooldown: "You just returned this book, wait 5 minutes before checking it out again"
//   - Provenance: "Record that you borrowed this book on June 15th"
//   - Node Config: "Update your total books borrowed count (you're at 9/10 limit now)"
//
// If you forget to call this, it's like never returning the book - the library
// thinks you still have it and might suggest you borrow it again (duplicate!).
func (e *Engine) RecordMaterialization(sourceID, targetID, edgeType string) {
	ctx := context.Background()

	// Update cooldown tracking
	if config.IsCooldownAutoIntegrationEnabled() {
		e.cooldownTable.RecordMaterialization(sourceID, targetID, edgeType)
	}

	// Log materialization in provenance
	if config.IsEdgeProvenanceAutoIntegrationEnabled() && e.edgeMetaStore != nil {
		e.edgeMetaStore.MarkMaterialized(ctx, sourceID, targetID, edgeType, "inference-engine")
	}

	// Update per-node edge counts
	if config.IsPerNodeConfigAutoIntegrationEnabled() && e.nodeConfigStore != nil {
		e.nodeConfigStore.RecordEdgeCreation(sourceID, targetID)
	}
}

// GetCooldownTable returns the cooldown table for direct access.
// The table is always available regardless of auto-integration setting.
func (e *Engine) GetCooldownTable() *CooldownTable {
	return e.cooldownTable
}

// GetEvidenceBuffer returns the evidence buffer for direct access.
// The buffer is always available regardless of auto-integration setting.
func (e *Engine) GetEvidenceBuffer() *EvidenceBuffer {
	return e.evidenceBuffer
}

// SetCooldownTable sets a custom cooldown table.
func (e *Engine) SetCooldownTable(table *CooldownTable) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.cooldownTable = table
}

// SetEvidenceBuffer sets a custom evidence buffer.
func (e *Engine) SetEvidenceBuffer(buffer *EvidenceBuffer) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.evidenceBuffer = buffer
}

// GetEdgeMetaStore returns the edge meta store for direct access.
// The store is always available regardless of auto-integration setting.
func (e *Engine) GetEdgeMetaStore() *storage.EdgeMetaStore {
	return e.edgeMetaStore
}

// SetEdgeMetaStore sets a custom edge meta store.
func (e *Engine) SetEdgeMetaStore(store *storage.EdgeMetaStore) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.edgeMetaStore = store
}

// GetNodeConfigStore returns the node config store for direct access.
// The store is always available regardless of auto-integration setting.
func (e *Engine) GetNodeConfigStore() *storage.NodeConfigStore {
	return e.nodeConfigStore
}

// SetNodeConfigStore sets a custom node config store.
func (e *Engine) SetNodeConfigStore(store *storage.NodeConfigStore) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.nodeConfigStore = store
}

// CleanupTier1 runs cleanup on Tier 1 data structures.
// Should be called periodically (e.g., every 10 minutes).
// provenanceMaxAge specifies the max age for provenance records (0 = don't cleanup).
func (e *Engine) CleanupTier1() (cooldownRemoved, evidenceRemoved int) {
	if e.cooldownTable != nil {
		cooldownRemoved = e.cooldownTable.Cleanup()
	}
	if e.evidenceBuffer != nil {
		evidenceRemoved = e.evidenceBuffer.Cleanup()
	}
	return
}

// CleanupTier1WithProvenance runs cleanup including provenance records.
// provenanceMaxAge specifies the max age for provenance records.
func (e *Engine) CleanupTier1WithProvenance(provenanceMaxAge time.Duration) (cooldownRemoved, evidenceRemoved, provenanceRemoved int) {
	cooldownRemoved, evidenceRemoved = e.CleanupTier1()
	if e.edgeMetaStore != nil && provenanceMaxAge > 0 {
		provenanceRemoved = e.edgeMetaStore.Cleanup(provenanceMaxAge)
	}
	return
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/orneryd/Mimir'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

inference.go•32.1 KiB

// Package inference provides automatic relationship detection for NornicDB.
//
// This package implements multiple methods for detecting implicit relationships
// between nodes in the graph:
//   - Similarity-based: Nodes with similar embeddings are likely related
//   - Co-access patterns: Nodes accessed together frequently are likely related
//   - Temporal proximity: Nodes accessed in the same session are likely related
//   - Transitive inference: If A→B and B→C, then A→C (with confidence)
//
// Example Usage:
//
//	// Create inference engine
//	config := inference.DefaultConfig()
//	config.SimilarityThreshold = 0.85 // Higher threshold = more confidence
//	engine := inference.New(config)
//
//	// Hook up vector search
//	engine.SetSimilaritySearch(func(ctx context.Context, embedding []float32, k int) ([]inference.SimilarityResult, error) {
//		return vectorIndex.Search(ctx, embedding, k)
//	})
//
//	// When storing a new memory
//	node := createMemoryNode("Remember to buy milk")
//	suggestions, _ := engine.OnStore(ctx, node.ID, node.Embedding)
//
//	fmt.Printf("Found %d suggested relationships:\n", len(suggestions))
//	for _, sug := range suggestions {
//		fmt.Printf("  %s -> %s (%.2f confidence): %s\n",
//			sug.SourceID, sug.TargetID, sug.Confidence, sug.Reason)
//
//		if sug.Confidence > 0.7 {
//			// High confidence - auto-create the edge
//			createEdge(sug.SourceID, sug.TargetID, sug.Type)
//		}
//	}
//
//	// When accessing a memory
//	suggestions = engine.OnAccess(ctx, "memory-123")
//	for _, sug := range suggestions {
//		if sug.Method == "co_access" {
//			fmt.Printf("Frequently accessed with: %s\n", sug.TargetID)
//		}
//	}
//
// How Each Method Works:
//
//  1. Similarity-Based Linking:
//     Uses vector embeddings to find semantically similar nodes.
//     Example: "Buy milk" and "Purchase dairy products" have similar embeddings.
//
//  2. Co-Access Patterns:
//     Tracks which nodes are accessed within a short time window.
//     Example: If you always access "Project Plan" and "Budget" together,
//     they're probably related.
//
//  3. Temporal Proximity:
//     Nodes accessed in the same session (within 30 minutes) are linked.
//     Example: All memories from a single conversation thread.
//
//  4. Transitive Inference:
//     If A relates to B and B relates to C, then A might relate to C.
//     Example: "Python" → "Programming" → "Computers" suggests "Python" → "Computers"
//
// ELI12 (Explain Like I'm 12):
//
// Imagine you're organizing your school notebooks:
//
//  1. **Similarity**: Your math and science notebooks go together because they're
//     both about numbers and formulas (similar content).
//
//  2. **Co-access**: Your English notebook and dictionary always get used together,
//     so they should be near each other on your shelf.
//
//  3. **Temporal**: All homework from Monday night was done at the same time,
//     so those papers are related.
//
//  4. **Transitive**: If Math relates to Science, and Science relates to Biology,
//     then Math probably relates to Biology too (they're all STEM subjects).
//
// The inference engine is like a smart librarian who notices these patterns
// and suggests: "Hey, these two things seem related - want me to connect them?"
package inference

import (
	"context"
	"sync"
	"time"

	"github.com/orneryd/nornicdb/pkg/config"
	"github.com/orneryd/nornicdb/pkg/storage"
)

// EdgeSuggestion represents a suggested edge.
type EdgeSuggestion struct {
	SourceID   string
	TargetID   string
	Type       string
	Confidence float64
	Reason     string
	Method     string // similarity, co_access, temporal, transitive
}

// Config holds inference engine configuration options.
//
// All thresholds and parameters can be tuned based on your use case:
//   - Higher thresholds = fewer but more confident suggestions
//   - Lower thresholds = more suggestions but potentially noisier
//
// Example:
//
//	// Conservative: Only suggest very confident relationships
//	config := &inference.Config{
//		SimilarityThreshold: 0.90, // Very high bar
//		SimilarityTopK:      5,    // Only check top 5
//		CoAccessMinCount:    5,    // Need 5 co-accesses
//		TransitiveMinConf:   0.7,  // High confidence for transitive
//	}
//
//	// Aggressive: Suggest many potential relationships
//	config = &inference.Config{
//		SimilarityThreshold: 0.75, // Lower bar
//		SimilarityTopK:      20,   // Check top 20
//		CoAccessMinCount:    2,    // Just 2 co-accesses
//		TransitiveMinConf:   0.3,  // Lower confidence OK
//	}
type Config struct {
	// Similarity-based linking
	SimilarityThreshold float64 // Default: 0.82
	SimilarityTopK      int     // How many similar nodes to check

	// Co-access pattern detection
	CoAccessEnabled  bool
	CoAccessWindow   time.Duration // Time window for co-access
	CoAccessMinCount int           // Minimum co-accesses to suggest edge

	// Temporal proximity
	TemporalEnabled bool
	TemporalWindow  time.Duration // Window for "same session"

	// Transitive inference
	TransitiveEnabled bool
	TransitiveMinConf float64 // Minimum confidence for transitive edges
}

// DefaultConfig returns balanced default configuration suitable for most use cases.
//
// Defaults:
//   - SimilarityThreshold: 0.82 (fairly confident)
//   - SimilarityTopK: 10 (check 10 most similar)
//   - CoAccessWindow: 30 seconds
//   - CoAccessMinCount: 3 (need 3 co-accesses before suggesting)
//   - TemporalWindow: 30 minutes (same "session")
//   - TransitiveMinConf: 0.5 (moderate confidence)
//
// Example:
//
//	config := inference.DefaultConfig()
//	engine := inference.New(config)
//
//	// Or customize
//	config = inference.DefaultConfig()
//	config.SimilarityThreshold = 0.90 // Stricter
//	engine = inference.New(config)
func DefaultConfig() *Config {
	return &Config{
		SimilarityThreshold: 0.82,
		SimilarityTopK:      10,
		CoAccessEnabled:     true,
		CoAccessWindow:      30 * time.Second,
		CoAccessMinCount:    3,
		TemporalEnabled:     true,
		TemporalWindow:      30 * time.Minute,
		TransitiveEnabled:   true,
		TransitiveMinConf:   0.5,
	}
}

// Engine handles automatic relationship inference using multiple detection methods.
//
// The Engine is thread-safe and can be used concurrently. It maintains
// internal state for co-access tracking and temporal pattern detection.
//
// Lifecycle:
//  1. Create with New()
//  2. Configure similarity search with SetSimilaritySearch()
//  3. Call OnStore() when creating nodes
//  4. Call OnAccess() when accessing nodes
//  5. Periodically call SuggestTransitive() to find indirect relationships
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Connect to vector index
//	engine.SetSimilaritySearch(vectorIndex.Search)
//
//	// Use in your storage layer
//	func StoreMemory(mem *Memory) error {
//		// Store the memory
//		if err := db.Store(mem); err != nil {
//			return err
//		}
//
//		// Get relationship suggestions
//		suggestions, _ := engine.OnStore(ctx, mem.ID, mem.Embedding)
//
//		// Auto-create high-confidence edges
//		for _, sug := range suggestions {
//			if sug.Confidence >= 0.7 {
//				db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type, sug.Confidence)
//			}
//		}
//
//		return nil
//	}
type Engine struct {
	config *Config
	mu     sync.RWMutex

	// Co-access tracking
	accessHistory  []accessRecord
	coAccessCounts map[coAccessKey]int

	// For similarity lookups (injected dependency)
	similaritySearch func(ctx context.Context, embedding []float32, k int) ([]SimilarityResult, error)

	// Optional topology integration (NEW)
	topologyIntegration *TopologyIntegration

	// Optional cluster integration for GPU-accelerated search
	clusterIntegration *ClusterIntegration

	// Optional Kalman adapter for smoothed confidence and temporal patterns
	// Enabled via NORNICDB_KALMAN_ENABLED=true
	kalmanAdapter *KalmanAdapter

	// Tier 1 features - enabled by default for production safety
	cooldownTable   *CooldownTable           // Prevents rapid re-materialization
	evidenceBuffer  *EvidenceBuffer          // Requires multiple signals before materializing
	edgeMetaStore   *storage.EdgeMetaStore   // Logs edge provenance for audit trails
	nodeConfigStore *storage.NodeConfigStore // Per-node edge creation rules

	// Heimdall SLM quality control - validates edges before creation
	// Enabled via NORNICDB_AUTO_TLP_LLM_QC_ENABLED=true
	heimdallQC *HeimdallQC
}

type accessRecord struct {
	NodeID    string
	Timestamp time.Time
}

type coAccessKey struct {
	NodeA string
	NodeB string
}

// SimilarityResult from vector search.
type SimilarityResult struct {
	ID    string
	Score float64
}

// New creates a new inference Engine with the given configuration.
//
// If config is nil, DefaultConfig() is used.
//
// The engine starts with empty co-access tracking. Call SetSimilaritySearch()
// to enable similarity-based inference.
//
// Example:
//
//	// With defaults
//	engine := inference.New(nil)
//
//	// With custom config
//	config := &inference.Config{
//		SimilarityThreshold: 0.85,
//		SimilarityTopK:      15,
//		CoAccessEnabled:     true,
//	}
//	engine = inference.New(config)
//
// Returns a new Engine ready for use.
func New(config *Config) *Engine {
	if config == nil {
		config = DefaultConfig()
	}

	return &Engine{
		config:          config,
		accessHistory:   make([]accessRecord, 0),
		coAccessCounts:  make(map[coAccessKey]int),
		cooldownTable:   NewCooldownTable(),
		evidenceBuffer:  NewEvidenceBuffer(),
		edgeMetaStore:   storage.NewEdgeMetaStore(),
		nodeConfigStore: storage.NewNodeConfigStore(),
	}
}

// SetSimilaritySearch sets the similarity search function.
func (e *Engine) SetSimilaritySearch(fn func(ctx context.Context, embedding []float32, k int) ([]SimilarityResult, error)) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.similaritySearch = fn
}

// SetTopologyIntegration enables topological link prediction.
//
// This adds graph structure analysis to edge suggestions, combining topology
// with semantic/behavioral signals for more robust predictions.
//
// Parameters:
//   - integration: TopologyIntegration instance (nil to disable)
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Enable topology
//	topoConfig := inference.DefaultTopologyConfig()
//	topoConfig.Enabled = true
//	topoConfig.Weight = 0.4  // 40% topology, 60% semantic
//
//	topo := inference.NewTopologyIntegration(storage, topoConfig)
//	engine.SetTopologyIntegration(topo)
//
//	// Now suggestions include topology signals
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
func (e *Engine) SetTopologyIntegration(integration *TopologyIntegration) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.topologyIntegration = integration
}

// GetTopologyIntegration returns the current topology integration (or nil).
func (e *Engine) GetTopologyIntegration() *TopologyIntegration {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.topologyIntegration
}

// SetClusterIntegration enables GPU-accelerated k-means clustering for similarity search.
//
// When enabled, similarity searches are accelerated using cluster-based
// approximate nearest neighbor search. This provides significant speedup
// for large embedding indices (10K+ embeddings).
//
// Parameters:
//   - integration: ClusterIntegration instance (nil to disable)
//
// Example:
//
//	engine := inference.New(inference.DefaultConfig())
//
//	// Enable clustering
//	gpuManager, _ := gpu.NewManager(&gpu.Config{Enabled: true})
//	clusterConfig := inference.DefaultClusterConfig()
//	clusterConfig.Enabled = true
//	clusterConfig.NumClustersSearch = 5
//
//	ci := inference.NewClusterIntegration(gpuManager, clusterConfig, nil, nil)
//	engine.SetClusterIntegration(ci)
//
//	// Add embeddings during indexing
//	ci.AddEmbedding(nodeID, embedding)
//
//	// Trigger clustering after bulk load
//	ci.OnIndexComplete()
//
//	// Searches now use cluster acceleration
//	results, _ := ci.Search(ctx, queryEmbedding, 10)
func (e *Engine) SetClusterIntegration(integration *ClusterIntegration) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.clusterIntegration = integration
}

// GetClusterIntegration returns the current cluster integration (or nil).
func (e *Engine) GetClusterIntegration() *ClusterIntegration {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.clusterIntegration
}

// SetKalmanAdapter configures the Kalman-enhanced inference adapter.
//
// The KalmanAdapter provides:
//   - Smoothed confidence scores using Kalman filtering
//   - Temporal access pattern tracking
//   - Session-aware co-access detection
//   - Relationship strength trend analysis
//
// This is an OPTIONAL enhancement - if not set, base inference works normally.
// Enable via NORNICDB_KALMAN_ENABLED=true environment variable.
//
// Example:
//
//	if config.IsKalmanEnabled() {
//		adapter := inference.NewKalmanAdapter(engine, inference.DefaultKalmanAdapterConfig())
//		tracker := temporal.NewTracker(temporal.DefaultConfig())
//		adapter.SetTracker(tracker)
//		engine.SetKalmanAdapter(adapter)
//	}
func (e *Engine) SetKalmanAdapter(adapter *KalmanAdapter) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.kalmanAdapter = adapter
}

// GetKalmanAdapter returns the current Kalman adapter (or nil if not configured).
func (e *Engine) GetKalmanAdapter() *KalmanAdapter {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.kalmanAdapter
}

// SetHeimdallQC sets the Heimdall SLM quality control for edge validation.
//
// When set and enabled (via NORNICDB_AUTO_TLP_LLM_QC_ENABLED=true), each
// edge suggestion from OnStore() and OnAccess() will be validated by
// the Heimdall SLM before being returned. The SLM can approve, reject,
// or modify the suggested relationship type.
//
// Example:
//
//	// Create Heimdall QC with your SLM function
//	qc := inference.NewHeimdallQC(func(ctx context.Context, prompt string) (string, error) {
//		return myOllamaClient.Complete(ctx, prompt)
//	}, nil)
//
//	engine.SetHeimdallQC(qc)
//
//	// Now suggestions are validated by Heimdall
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
//	// Only returns approved suggestions
func (e *Engine) SetHeimdallQC(qc *HeimdallQC) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.heimdallQC = qc
}

// GetHeimdallQC returns the current Heimdall QC (or nil if not configured).
func (e *Engine) GetHeimdallQC() *HeimdallQC {
	e.mu.RLock()
	defer e.mu.RUnlock()
	return e.heimdallQC
}

// OnStore is called when a new node is stored in the graph.
//
// This method analyzes the new node and suggests relationships based on
// vector similarity. High-confidence suggestions can be automatically
// created as edges.
//
// Parameters:
//   - ctx: Context for cancellation
//   - nodeID: ID of the newly created node
//   - embedding: Vector embedding of the node's content
//
// Returns:
//   - Slice of EdgeSuggestion with confidence scores and reasons
//   - Error if similarity search fails
//
// Example:
//
//	// User creates a new note
//	note := &Note{
//		ID:      "note-456",
//		Content: "Machine learning algorithms",
//		Embedding: embedder.Embed("Machine learning algorithms"),
//	}
//
//	// Get suggestions
//	suggestions, err := engine.OnStore(ctx, note.ID, note.Embedding)
//	if err != nil {
//		return err
//	}
//
//	fmt.Printf("Found %d related notes:\n", len(suggestions))
//	for _, sug := range suggestions {
//		relatedNote := getNote(sug.TargetID)
//		fmt.Printf("  - %s (%.0f%% confident): %s\n",
//			relatedNote.Title, sug.Confidence*100, sug.Reason)
//
//		// Auto-link if very confident
//		if sug.Confidence >= 0.8 {
//			createEdge(sug)
//			log.Printf("Auto-linked: %s -> %s", note.ID, relatedNote.ID)
//		}
//	}
//
// Typical confidence levels:
//   - 0.9+: Very confident, safe to auto-create
//   - 0.7-0.9: Confident, suggest to user
//   - 0.5-0.7: Possible, show as "related"
//   - <0.5: Weak, ignore
func (e *Engine) OnStore(ctx context.Context, nodeID string, embedding []float32) ([]EdgeSuggestion, error) {
	e.mu.Lock()
	defer e.mu.Unlock()

	suggestions := make([]EdgeSuggestion, 0)

	// 1. Similarity-based suggestions (semantic)
	if e.similaritySearch != nil && len(embedding) > 0 {
		similar, err := e.similaritySearch(ctx, embedding, e.config.SimilarityTopK)
		if err == nil {
			for _, result := range similar {
				if result.ID == nodeID {
					continue // Skip self
				}
				if result.Score >= e.config.SimilarityThreshold {
					conf := e.scoreToConfidence(result.Score)
					suggestions = append(suggestions, EdgeSuggestion{
						SourceID:   nodeID,
						TargetID:   result.ID,
						Type:       "RELATES_TO",
						Confidence: conf,
						Reason:     "High embedding similarity",
						Method:     "similarity",
					})
				}
			}
		}
	}

	// 2. Topological suggestions (NEW - feature flagged for AUTOMATIC integration)
	// Note: Cypher procedures (CALL gds.linkPrediction.*) are always available
	// This flag only controls automatic use in OnStore()
	if e.topologyIntegration != nil {
		// Check feature flag via config (automatic integration)
		topoConfig := e.topologyIntegration.config
		if topoConfig != nil && topoConfig.Enabled {
			topoSuggestions, err := e.topologyIntegration.SuggestTopological(ctx, nodeID)
			if err == nil && len(topoSuggestions) > 0 {
				// Combine semantic and topological suggestions
				suggestions = e.topologyIntegration.CombinedSuggestions(suggestions, topoSuggestions)
			}
		}
	}

	// 3. Heimdall QC validation (if enabled)
	// Each suggestion is sent to the SLM for approval before returning
	if e.heimdallQC != nil && config.IsAutoTLPLLMQCEnabled() {
		suggestions = e.validateSuggestionsWithHeimdall(ctx, nodeID, suggestions)
	}

	return suggestions, nil
}

// validateSuggestionsWithHeimdall filters suggestions through Heimdall SLM batch review.
// Returns approved suggestions + any augmented suggestions from Heimdall.
func (e *Engine) validateSuggestionsWithHeimdall(ctx context.Context, sourceNodeID string, suggestions []EdgeSuggestion) []EdgeSuggestion {
	if len(suggestions) == 0 || e.heimdallQC == nil {
		return suggestions
	}

	// Build source node summary
	// Note: In a full implementation, we'd look up the node from storage
	sourceNode := NodeSummary{
		ID:     sourceNodeID,
		Labels: []string{}, // Would be populated from storage
		Props:  make(map[string]string),
	}

	// Build candidate pool for augmentation (empty for now - could be populated from similarity search)
	var candidatePool []NodeSummary

	// Call Heimdall batch review
	approved, augmented, err := e.heimdallQC.ReviewBatch(ctx, sourceNode, suggestions, candidatePool)
	if err != nil {
		// On error, return original suggestions (fail-open)
		return suggestions
	}

	// Set source ID on augmented edges
	for i := range augmented {
		augmented[i].SourceID = sourceNodeID
	}

	// Combine approved + augmented
	result := append(approved, augmented...)
	return result
}

// OnAccess is called when a node is accessed (read).
//
// This method tracks co-access patterns - nodes that are accessed close together
// in time are likely related. After seeing the same pair accessed together
// multiple times, it suggests creating a relationship.
//
// Parameters:
//   - ctx: Context (currently unused, reserved for future)
//   - nodeID: ID of the accessed node
//
// Returns:
//   - Slice of EdgeSuggestion based on co-access patterns
//
// Example:
//
//	func GetMemory(id string) (*Memory, error) {
//		// Retrieve memory
//		mem, err := db.Get(id)
//		if err != nil {
//			return nil, err
//		}
//
//		// Track access for inference
//		suggestions := engine.OnAccess(ctx, id)
//
//		// Log co-access patterns
//		for _, sug := range suggestions {
//			if sug.Method == "co_access" {
//				log.Printf("Co-accessed with %s (%d times)",
//					sug.TargetID, sug.Confidence*10)
//
//				// Create edge if frequently co-accessed
//				if sug.Confidence >= 0.6 {
//					createEdge(sug)
//				}
//			}
//		}
//
//		return mem, nil
//	}
//
// How It Works:
//
//	The engine maintains a sliding window of recent accesses.
//	When you access node A, it checks what other nodes were accessed
//	in the last 30 seconds (configurable). If the same pair appears
//	multiple times, it suggests they're related.
//
// Use Case:
//
//	In a note-taking app, if you always view "Project Plan" and "Budget"
//	together, the engine suggests: "These seem related - want to link them?"
func (e *Engine) OnAccess(ctx context.Context, nodeID string) []EdgeSuggestion {
	e.mu.Lock()
	defer e.mu.Unlock()

	now := time.Now()
	suggestions := make([]EdgeSuggestion, 0)

	if !e.config.CoAccessEnabled {
		return suggestions
	}

	// Find recent accesses within the window
	windowStart := now.Add(-e.config.CoAccessWindow)
	recentNodes := make([]string, 0)

	for _, record := range e.accessHistory {
		if record.Timestamp.After(windowStart) && record.NodeID != nodeID {
			recentNodes = append(recentNodes, record.NodeID)
		}
	}

	// Update co-access counts
	for _, otherID := range recentNodes {
		key := e.makeCoAccessKey(nodeID, otherID)
		e.coAccessCounts[key]++

		// Check if we should suggest an edge
		if e.coAccessCounts[key] >= e.config.CoAccessMinCount {
			conf := float64(e.coAccessCounts[key]) / 10.0
			if conf > 0.8 {
				conf = 0.8 // Cap at 0.8 for co-access
			}
			suggestions = append(suggestions, EdgeSuggestion{
				SourceID:   nodeID,
				TargetID:   otherID,
				Type:       "RELATES_TO",
				Confidence: conf,
				Reason:     "Frequently accessed together",
				Method:     "co_access",
			})
		}
	}

	// Add to history
	e.accessHistory = append(e.accessHistory, accessRecord{
		NodeID:    nodeID,
		Timestamp: now,
	})

	// Prune old history
	e.pruneHistory(windowStart)

	return suggestions
}

// SuggestTransitive suggests edges based on transitive relationships.
// If A->B and B->C with sufficient confidence, suggest A->C.
func (e *Engine) SuggestTransitive(ctx context.Context, edges []ExistingEdge) []EdgeSuggestion {
	e.mu.RLock()
	defer e.mu.RUnlock()

	if !e.config.TransitiveEnabled {
		return nil
	}

	suggestions := make([]EdgeSuggestion, 0)

	// Build adjacency map
	outgoing := make(map[string][]ExistingEdge)
	for _, edge := range edges {
		outgoing[edge.SourceID] = append(outgoing[edge.SourceID], edge)
	}

	// For each A->B, look for B->C
	for _, ab := range edges {
		for _, bc := range outgoing[ab.TargetID] {
			if ab.SourceID == bc.TargetID {
				continue // Skip cycles back to origin
			}

			// Calculate transitive confidence
			conf := ab.Confidence * bc.Confidence
			if conf >= e.config.TransitiveMinConf {
				suggestions = append(suggestions, EdgeSuggestion{
					SourceID:   ab.SourceID,
					TargetID:   bc.TargetID,
					Type:       "RELATES_TO",
					Confidence: conf,
					Reason:     "Transitive via " + ab.TargetID,
					Method:     "transitive",
				})
			}
		}
	}

	return suggestions
}

// ExistingEdge represents an edge in the graph.
type ExistingEdge struct {
	SourceID   string
	TargetID   string
	Confidence float64
}

// scoreToConfidence converts similarity score to edge confidence.
func (e *Engine) scoreToConfidence(score float64) float64 {
	// Map similarity score ranges to confidence levels
	switch {
	case score >= 0.95:
		return 0.9
	case score >= 0.90:
		return 0.7
	case score >= 0.85:
		return 0.5
	default:
		return 0.3
	}
}

// makeCoAccessKey creates a consistent key for co-access tracking.
func (e *Engine) makeCoAccessKey(a, b string) coAccessKey {
	// Ensure consistent ordering
	if a < b {
		return coAccessKey{NodeA: a, NodeB: b}
	}
	return coAccessKey{NodeA: b, NodeB: a}
}

// pruneHistory removes old access records.
func (e *Engine) pruneHistory(before time.Time) {
	// Keep records newer than 'before'
	newHistory := make([]accessRecord, 0, len(e.accessHistory))
	for _, record := range e.accessHistory {
		if record.Timestamp.After(before) {
			newHistory = append(newHistory, record)
		}
	}
	e.accessHistory = newHistory
}

// Stats returns inference statistics.
type Stats struct {
	TotalSuggestions  int64
	BySimilarity      int64
	ByCoAccess        int64
	ByTransitive      int64
	TrackedCoAccesses int
}

// GetStats returns current inference statistics.
func (e *Engine) GetStats() Stats {
	e.mu.RLock()
	defer e.mu.RUnlock()

	return Stats{
		TrackedCoAccesses: len(e.coAccessCounts),
	}
}

// ProcessSuggestionResult contains the result of processing a suggestion.
type ProcessSuggestionResult struct {
	ShouldMaterialize bool   // True if edge should be created
	Reason            string // Why or why not
	CooldownBlocked   bool   // True if blocked by cooldown
	EvidencePending   bool   // True if waiting for more evidence
	NodeConfigBlocked bool   // True if blocked by per-node config (deny list, caps, etc.)
}

// ProcessSuggestion processes an edge suggestion through cooldown and evidence buffering.
//
// This method applies Tier 1 safety features (when auto-integration is enabled):
//   - Cooldown: Prevents rapid re-materialization of the same edge pair
//   - Evidence Buffering: Requires multiple signals before materializing
//
// Feature flags:
//   - NORNICDB_COOLDOWN_AUTO_INTEGRATION_ENABLED (default: true)
//   - NORNICDB_EVIDENCE_AUTO_INTEGRATION_ENABLED (default: true)
//
// Parameters:
//   - suggestion: The edge suggestion to process
//   - sessionID: Current session ID for evidence tracking
//
// Returns ProcessSuggestionResult indicating whether to create the edge.
//
// Example:
//
//	suggestions, _ := engine.OnStore(ctx, nodeID, embedding)
//	for _, sug := range suggestions {
//	    result := engine.ProcessSuggestion(sug, "session-123")
//	    if result.ShouldMaterialize {
//	        db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type)
//	        engine.RecordMaterialization(sug.SourceID, sug.TargetID, sug.Type)
//	    }
//	}
func (e *Engine) ProcessSuggestion(suggestion EdgeSuggestion, sessionID string) ProcessSuggestionResult {
	ctx := context.Background()
	result := ProcessSuggestionResult{
		ShouldMaterialize: true,
		Reason:            "passed all checks",
	}

	// Log provenance for this suggestion (if auto-integration enabled)
	if config.IsEdgeProvenanceAutoIntegrationEnabled() && e.edgeMetaStore != nil {
		e.edgeMetaStore.AppendFromSuggestion(
			ctx,
			suggestion.SourceID, suggestion.TargetID, suggestion.Type,
			suggestion.Confidence,
			suggestion.Method, suggestion.Method, suggestion.Reason,
			sessionID, "inference-engine",
			false, // Not materialized yet
		)
	}

	// Check cooldown (if auto-integration enabled)
	if config.IsCooldownAutoIntegrationEnabled() {
		if !e.cooldownTable.CanMaterialize(suggestion.SourceID, suggestion.TargetID, suggestion.Type) {
			result.ShouldMaterialize = false
			result.CooldownBlocked = true
			_, reason := e.cooldownTable.CanMaterializeWithReason(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
			result.Reason = "cooldown: " + reason
			return result
		}
	}

	// Check per-node config (if auto-integration enabled)
	if config.IsPerNodeConfigAutoIntegrationEnabled() && e.nodeConfigStore != nil {
		allowed, reason := e.nodeConfigStore.IsEdgeAllowedWithReason(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
		if !allowed {
			result.ShouldMaterialize = false
			result.NodeConfigBlocked = true
			result.Reason = "node-config: " + reason
			return result
		}
	}

	// Check evidence buffering (if auto-integration enabled)
	if config.IsEvidenceAutoIntegrationEnabled() {
		shouldMaterialize := e.evidenceBuffer.AddEvidence(
			suggestion.SourceID,
			suggestion.TargetID,
			suggestion.Type,
			suggestion.Confidence,
			suggestion.Method,
			sessionID,
		)

		if !shouldMaterialize {
			result.ShouldMaterialize = false
			result.EvidencePending = true
			_, reason := e.evidenceBuffer.CheckThreshold(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
			result.Reason = "evidence: " + reason
			return result
		}
	}

	return result
}

// RecordMaterialization records that an edge was materialized.
//
// Call this after successfully creating an edge to update:
//   - Cooldown tracking (prevents immediate re-creation)
//   - Provenance logs (audit trail of why edge was created)
//   - Node config edge counts (enforces per-node limits)
//
// This is the "clean up after yourself" function - ALWAYS call it after
// creating an edge to keep internal state synchronized.
//
// Example 1: Basic usage after edge creation
//
//	result := engine.ProcessSuggestion(suggestion, "session-123")
//	if result.ShouldMaterialize {
//	    db.CreateEdge(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
//	    engine.RecordMaterialization(suggestion.SourceID, suggestion.TargetID, suggestion.Type)
//	}
//
// Example 2: Batch edge creation
//
//	for _, sug := range suggestions {
//	    if sug.Confidence > 0.8 {
//	        db.CreateEdge(sug.SourceID, sug.TargetID, sug.Type)
//	        engine.RecordMaterialization(sug.SourceID, sug.TargetID, sug.Type)
//	    }
//	}
//
// Example 3: Manual edge creation (bypassing ProcessSuggestion)
//
//	// User explicitly creates an edge
//	db.CreateEdge("user-123", "doc-456", "bookmarked")
//	// Still record it to prevent suggestions for same edge
//	engine.RecordMaterialization("user-123", "doc-456", "bookmarked")
//
// ELI12 (Explain Like I'm 12):
//
// Think of this like checking out a library book. When you return it:
//   - Cooldown: "You just returned this book, wait 5 minutes before checking it out again"
//   - Provenance: "Record that you borrowed this book on June 15th"
//   - Node Config: "Update your total books borrowed count (you're at 9/10 limit now)"
//
// If you forget to call this, it's like never returning the book - the library
// thinks you still have it and might suggest you borrow it again (duplicate!).
func (e *Engine) RecordMaterialization(sourceID, targetID, edgeType string) {
	ctx := context.Background()

	// Update cooldown tracking
	if config.IsCooldownAutoIntegrationEnabled() {
		e.cooldownTable.RecordMaterialization(sourceID, targetID, edgeType)
	}

	// Log materialization in provenance
	if config.IsEdgeProvenanceAutoIntegrationEnabled() && e.edgeMetaStore != nil {
		e.edgeMetaStore.MarkMaterialized(ctx, sourceID, targetID, edgeType, "inference-engine")
	}

	// Update per-node edge counts
	if config.IsPerNodeConfigAutoIntegrationEnabled() && e.nodeConfigStore != nil {
		e.nodeConfigStore.RecordEdgeCreation(sourceID, targetID)
	}
}

// GetCooldownTable returns the cooldown table for direct access.
// The table is always available regardless of auto-integration setting.
func (e *Engine) GetCooldownTable() *CooldownTable {
	return e.cooldownTable
}

// GetEvidenceBuffer returns the evidence buffer for direct access.
// The buffer is always available regardless of auto-integration setting.
func (e *Engine) GetEvidenceBuffer() *EvidenceBuffer {
	return e.evidenceBuffer
}

// SetCooldownTable sets a custom cooldown table.
func (e *Engine) SetCooldownTable(table *CooldownTable) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.cooldownTable = table
}

// SetEvidenceBuffer sets a custom evidence buffer.
func (e *Engine) SetEvidenceBuffer(buffer *EvidenceBuffer) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.evidenceBuffer = buffer
}

// GetEdgeMetaStore returns the edge meta store for direct access.
// The store is always available regardless of auto-integration setting.
func (e *Engine) GetEdgeMetaStore() *storage.EdgeMetaStore {
	return e.edgeMetaStore
}

// SetEdgeMetaStore sets a custom edge meta store.
func (e *Engine) SetEdgeMetaStore(store *storage.EdgeMetaStore) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.edgeMetaStore = store
}

// GetNodeConfigStore returns the node config store for direct access.
// The store is always available regardless of auto-integration setting.
func (e *Engine) GetNodeConfigStore() *storage.NodeConfigStore {
	return e.nodeConfigStore
}

// SetNodeConfigStore sets a custom node config store.
func (e *Engine) SetNodeConfigStore(store *storage.NodeConfigStore) {
	e.mu.Lock()
	defer e.mu.Unlock()
	e.nodeConfigStore = store
}

// CleanupTier1 runs cleanup on Tier 1 data structures.
// Should be called periodically (e.g., every 10 minutes).
// provenanceMaxAge specifies the max age for provenance records (0 = don't cleanup).
func (e *Engine) CleanupTier1() (cooldownRemoved, evidenceRemoved int) {
	if e.cooldownTable != nil {
		cooldownRemoved = e.cooldownTable.Cleanup()
	}
	if e.evidenceBuffer != nil {
		evidenceRemoved = e.evidenceBuffer.Cleanup()
	}
	return
}

// CleanupTier1WithProvenance runs cleanup including provenance records.
// provenanceMaxAge specifies the max age for provenance records.
func (e *Engine) CleanupTier1WithProvenance(provenanceMaxAge time.Duration) (cooldownRemoved, evidenceRemoved, provenanceRemoved int) {
	cooldownRemoved, evidenceRemoved = e.CleanupTier1()
	if e.edgeMetaStore != nil && provenanceMaxAge > 0 {
		provenanceRemoved = e.edgeMetaStore.Cleanup(provenanceMaxAge)
	}
	return
}