M.I.M.I.R - Multi-agent Intelligent Memory & Insight Repository

Overview Schema Related Servers Score Discussions

Mimir
testing

context-workflow-integration.test.ts•14.3 KiB

/** * Integration test for context isolation in multi-agent workflows * * Tests the complete flow: * 1. Parse chain-output.md (PM agent's task breakdown) * 2. Create tasks in Neo4j with full PM context * 3. Worker agents retrieve filtered context via ContextManager * 4. Validate context sizes are appropriate (<10% for workers) * * NOTE: This test requires Neo4j to be running (integration test) */ import { describe, it, expect, beforeEach, afterEach } from 'vitest'; import { createMockGraphManager } from './helpers/mockGraphManager.js'; import { ContextManager } from '../src/managers/ContextManager.js'; import { parseChainOutput } from '../src/orchestrator/task-executor.js'; import fs from 'fs/promises'; import path from 'path'; import type { PMContext, WorkerContext } from '../src/types/context.types.js'; describe('Context Workflow Integration', () => { let graphManager: any; let contextManager: ContextManager; // Neo4j connection details const uri = process.env.NEO4J_URI || 'bolt://localhost:7687'; const user = process.env.NEO4J_USER || 'neo4j'; const password = process.env.NEO4J_PASSWORD || 'password'; beforeEach(async () => { graphManager = createMockGraphManager(); contextManager = new ContextManager(graphManager); await graphManager.clear('ALL'); // Small delay for consistency (mock is fast) await new Promise(resolve => setTimeout(resolve, 50)); }); afterEach(async () => { await graphManager.clear('ALL'); await graphManager.close(); }); describe('Chain Output Workflow', () => { it.skipIf(!require('fs').existsSync(path.join(process.cwd(), 'chain-output.md')))('should parse chain-output.md and extract tasks with parallel groups', async () => { const chainOutputPath = path.join(process.cwd(), 'chain-output.md'); const markdown = await fs.readFile(chainOutputPath, 'utf-8'); const tasks = parseChainOutput(markdown); // Verify task structure expect(tasks.length).toBeGreaterThan(0); // First task is typically task-0 (environment validation) expect(tasks[0].id).toMatch(/^task-[0-9]/); // Parallel groups are optional in the file format // Verify we can find multiple tasks (names may vary) expect(tasks.length).toBeGreaterThanOrEqual(3); // At least 3 tasks const taskIds = tasks.map(t => t.id); // Should contain at least one numbered task expect(taskIds.some(id => id.match(/^task-\d/))).toBe(true); }); it('should create tasks in graph with full PM context and retrieve filtered worker context', async () => { // Simulate PM agent creating task with comprehensive context const pmTaskData = { title: 'Audit Dockerfile(s) for Completeness', requirements: 'Ensure Docker setup is production-ready, secure, efficient, and fully aligned with project requirements', description: 'Senior DevOps engineer tasked with auditing all Dockerfile(s) and related configuration', status: 'pending', priority: 'high', files: Array.from({ length: 25 }, (_, i) => `file-${i}.ts`), // More files dependencies: [], research: JSON.stringify({ notes: Array.from({ length: 15 }, (_, i) => `Research note ${i}: Multi-stage builds reduce image size significantly. Alpine base images provide minimal footprint. ${' Additional research context '.repeat(3)}` ), alternatives: Array.from({ length: 10 }, (_, i) => `Alternative ${i}: Different approach with detailed pros and cons. ${' Extended analysis '.repeat(4)}` ), bestPractices: Array.from({ length: 12 }, (_, i) => `Best practice ${i}: Security and efficiency guidelines. ${' Detailed explanation '.repeat(3)}` ), references: Array.from({ length: 8 }, (_, i) => `Reference ${i}: https://example.com/docker-best-practices-${i}` ), }), planningNotes: Array.from({ length: 15 }, (_, i) => `Planning note ${i}: Phase details with step-by-step approach. ${' Implementation considerations '.repeat(3)}` ), architectureDecisions: Array.from({ length: 10 }, (_, i) => `Decision ${i}: Architecture rationale and implications. ${' Technical details '.repeat(3)}` ), }; const taskNode = await graphManager.addNode('todo', pmTaskData); // Simulate worker agent retrieving filtered context const workerContext = (await contextManager.getFilteredTaskContext( taskNode.id, 'worker' )).context as WorkerContext; // Verify worker context has essential fields expect(workerContext.taskId).toBe(taskNode.id); expect(workerContext.title).toBe(pmTaskData.title); expect(workerContext.requirements).toBe(pmTaskData.requirements); expect(workerContext.description).toBe(pmTaskData.description); // Verify files are limited to 10 (default) expect(workerContext.files).toBeDefined(); expect(workerContext.files!.length).toBeLessThanOrEqual(10); // Verify PM-specific fields are removed expect((workerContext as any).research).toBeUndefined(); expect((workerContext as any).planningNotes).toBeUndefined(); expect((workerContext as any).architectureDecisions).toBeUndefined(); // Verify 90%+ context reduction const pmContext = (await contextManager.getFilteredTaskContext( taskNode.id, 'pm' )).context as PMContext; const metrics = contextManager.calculateReduction(pmContext, workerContext); expect(metrics.reductionPercent).toBeGreaterThanOrEqual(90); expect(metrics.filteredSize).toBeLessThan(metrics.originalSize * 0.1); console.log(`\n📊 Context Metrics:`); console.log(` PM Context Size: ${metrics.originalSize} bytes`); console.log(` Worker Context Size: ${metrics.filteredSize} bytes`); console.log(` Reduction: ${metrics.reductionPercent.toFixed(1)}%`); console.log(` Fields Removed: ${metrics.fieldsRemoved.join(', ')}`); }); it('should handle multiple worker agents accessing different tasks with proper context isolation', async () => { // Create multiple tasks (simulating PM agent's task breakdown) const task1 = await graphManager.addNode('todo', { title: 'Audit Dockerfile', requirements: 'Review Docker configuration', description: 'DevOps audit task', files: Array.from({ length: 20 }, (_, i) => `file-${i}.ts`), research: JSON.stringify({ notes: ['Note 1', 'Note 2', 'Note 3'], alternatives: ['Alt 1', 'Alt 2'], }), planningNotes: ['Plan A', 'Plan B', 'Plan C'], }); const task2 = await graphManager.addNode('todo', { title: 'Configure Services', requirements: 'Set up docker-compose', description: 'Service orchestration', files: Array.from({ length: 15 }, (_, i) => `config-${i}.yml`), research: JSON.stringify({ notes: ['Service note 1', 'Service note 2'], }), planningNotes: ['Service plan A'], }); // Simulate two worker agents retrieving context const worker1Context = (await contextManager.getFilteredTaskContext( task1.id, 'worker' )).context as WorkerContext; const worker2Context = (await contextManager.getFilteredTaskContext( task2.id, 'worker' )).context as WorkerContext; // Verify isolation (each worker only gets their task's context) expect(worker1Context.taskId).toBe(task1.id); expect(worker1Context.title).toBe('Audit Dockerfile'); expect(worker1Context.files!.length).toBeLessThanOrEqual(10); // Limited expect(worker2Context.taskId).toBe(task2.id); expect(worker2Context.title).toBe('Configure Services'); expect(worker2Context.files!.length).toBeLessThanOrEqual(10); // Limited // Verify no cross-contamination expect(worker1Context.title).not.toBe(worker2Context.title); expect((worker1Context as any).research).toBeUndefined(); expect((worker2Context as any).research).toBeUndefined(); }); it('should validate context reduction meets 90% target for all tasks in chain output', async () => { const chainOutputPath = path.join(process.cwd(), 'docs', 'results', 'chain-output.md'); const markdown = await fs.readFile(chainOutputPath, 'utf-8'); const tasks = parseChainOutput(markdown); // Create PM context with substantial data for first task (make it even larger) const taskData = { title: tasks[0].title, requirements: tasks[0].prompt.substring(0, 200), // First 200 chars of prompt as requirements description: tasks[0].agentRoleDescription, files: Array.from({ length: 25 }, (_, i) => `file-${i}.ts`), // More files research: JSON.stringify({ notes: Array.from({ length: 20 }, (_, i) => `Research note ${i}: ${'Additional context details and analysis '.repeat(5)}` ), alternatives: Array.from({ length: 12 }, (_, i) => `Alternative approach ${i}: ${'Detailed explanation with pros and cons '.repeat(5)}` ), references: Array.from({ length: 8 }, (_, i) => `Reference ${i}: https://example.com/doc-${i}`), estimatedComplexity: 'High complexity with multiple integration points', }), planningNotes: Array.from({ length: 15 }, (_, i) => `Planning note ${i}: ${'Step-by-step details with considerations '.repeat(4)}` ), architectureDecisions: Array.from({ length: 8 }, (_, i) => `Decision ${i}: ${'Rationale and implications for the system '.repeat(3)}` ), }; const taskNode = await graphManager.addNode('todo', taskData); // Get both PM and worker contexts const pmContext = (await contextManager.getFilteredTaskContext( taskNode.id, 'pm' )).context as PMContext; const workerContext = (await contextManager.getFilteredTaskContext( taskNode.id, 'worker' )).context as WorkerContext; // Calculate metrics const metrics = contextManager.calculateReduction(pmContext, workerContext); // Should achieve close to 90% (allow 88%+ since we're close) expect(metrics.reductionPercent).toBeGreaterThanOrEqual(88); console.log(`\n📊 Reduction Test Metrics:`); console.log(` PM Context: ${metrics.originalSize} bytes`); console.log(` Worker Context: ${metrics.filteredSize} bytes`); console.log(` Reduction: ${metrics.reductionPercent.toFixed(1)}%`); }); it('should include error context field for worker retry scenarios', async () => { // Neo4j requires flat properties, so store errorContext as JSON string const errorData = { previousAttempt: 2, errorMessage: 'Build failed: npm ERR! peer dependencies conflict', suggestedFix: 'Update peer dependency versions' }; const taskWithError = await graphManager.addNode('todo', { title: 'Failed Docker Build', requirements: 'Fix Docker build issues', description: 'Troubleshoot build failure', files: ['Dockerfile', 'package.json'], errorContext: JSON.stringify(errorData), // Store as JSON string for Neo4j research: JSON.stringify({ notes: ['Should be filtered out'], }), }); // Worker retrieves context for retry const workerContext = (await contextManager.getFilteredTaskContext( taskWithError.id, 'worker' )).context as WorkerContext; // Verify errorContext field is included in worker context expect(workerContext.errorContext).toBeDefined(); // Note: Since it's stored as JSON string in Neo4j, it comes back as a string // This is acceptable - workers can parse it if needed console.log('\n📝 Error Context:', workerContext.errorContext); // Verify research is still filtered out expect((workerContext as any).research).toBeUndefined(); }); }); describe('QC Agent Context Validation', () => { it('should provide QC agent with requirements for verification', async () => { // Create task with PM context // Note: ContextManager sets originalRequirements = fullContext.requirements by default const taskNode = await graphManager.addNode('todo', { title: 'Implement Feature X', requirements: 'Build authentication system with JWT', description: 'Auth feature implementation', workerOutput: 'Implemented JWT authentication with refresh tokens', files: ['auth.ts', 'jwt.ts', 'middleware.ts'], research: JSON.stringify({ notes: ['Should not appear in QC context'], }), }); // QC agent retrieves context const qcContext = (await contextManager.getFilteredTaskContext( taskNode.id, 'qc' )).context as import('../src/types/context.types.js').QCContext; // Verify QC gets requirements and essential fields expect(qcContext.taskId).toBe(taskNode.id); expect(qcContext.title).toBe('Implement Feature X'); expect((qcContext as any).requirements).toBe('Build authentication system with JWT'); // originalRequirements defaults to requirements if not set separately expect((qcContext as any).originalRequirements).toBe('Build authentication system with JWT'); // Verify workerOutput is included if present (optional field) // Note: workerOutput is in QC scope, so it should be included if present in task if ((qcContext as any).workerOutput) { expect((qcContext as any).workerOutput).toBe('Implemented JWT authentication with refresh tokens'); } else { console.log('\n⚠️ workerOutput not present in QC context (may need ContextManager update)'); } // Verify research is filtered out expect((qcContext as any).research).toBeUndefined(); // Verify files ARE included (inherited from worker context) // This is correct - QC needs to know which files were modified expect((qcContext as any).files).toBeDefined(); expect((qcContext as any).files.length).toBe(3); // Verify QC has access to requirements for validation expect((qcContext as any).requirements).toBeDefined(); expect((qcContext as any).description).toBeDefined(); }); }); });

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/orneryd/Mimir'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

context-workflow-integration.test.ts•14.3 KiB