Salesforce Metadata-Aware RAG MCP

test-rag-benchmark.js•10.3 KiB

const { SalesforceConnection } = require('./dist/salesforce/connection'); const { SalesforceMetadataClient } = require('./dist/salesforce/metadataClient'); const { SalesforceToolingClient } = require('./dist/salesforce/toolingClient'); const { MetadataProcessor } = require('./dist/chunking/processor'); const { VectorStore } = require('./dist/vector/store'); const { MockEmbedding } = require('./dist/vector/embedding'); const { SalesforceRAGRetriever } = require('./dist/vector/langchainRetriever'); const { RagIngestOrgTool, RagSearchTool, RagWhereUsedTool, RagOpenTool, RagJobStatusTool } = require('./dist/mcp/tools/rag'); const { AuthMiddleware } = require('./dist/mcp/middleware/auth'); async function benchmarkRAGOperations() { console.log('🚀 Comprehensive RAG Benchmark & Validation Suite'); console.log('='.repeat(60)); const startTime = Date.now(); const metrics = { ingestion: { duration: 0, chunksGenerated: 0, success: false }, search: { duration: 0, averageResults: 0, tests: 0, success: false }, whereUsed: { duration: 0, averageReferences: 0, tests: 0, success: false }, langchain: { duration: 0, averageResults: 0, tests: 0, success: false }, jobStatus: { duration: 0, tests: 0, success: false } }; try { // Initialize all components const connection = new SalesforceConnection(); const metadataClient = new SalesforceMetadataClient(connection); const toolingClient = new SalesforceToolingClient(connection); const processor = new MetadataProcessor(); const embeddingModel = new MockEmbedding(); const vectorStore = new VectorStore({ host: 'localhost', port: 5433, database: 'sfdxrag', user: 'postgres', password: 'postgres' }, embeddingModel); // Initialize tools const ingestTool = new RagIngestOrgTool(metadataClient, toolingClient, processor, vectorStore); const searchTool = new RagSearchTool(vectorStore); const whereUsedTool = new RagWhereUsedTool(vectorStore); const openTool = new RagOpenTool(vectorStore); const jobStatusTool = new RagJobStatusTool(); // Create auth context const authMiddleware = AuthMiddleware.getInstance(); const sessionId = 'benchmark-session'; const orgId = 'benchmark-org-123'; const userId = 'benchmark-user-456'; authMiddleware.createAuthContext(orgId, userId, sessionId); console.log('\n📊 BENCHMARK 1: RAG Ingestion Performance'); console.log('-'.repeat(50)); const ingestStart = Date.now(); const ingestResult = await ingestTool.execute({ types: ['ApexClass', 'ApexTrigger'], incremental: false }, { sessionId }); if (!ingestResult.isError) { const ingestData = JSON.parse(ingestResult.content[0].text); console.log('✅ Ingestion started successfully'); // Monitor job progress let jobCompleted = false; let attempts = 0; while (!jobCompleted && attempts < 20) { await new Promise(resolve => setTimeout(resolve, 1000)); const statusResult = await jobStatusTool.execute({ jobId: ingestData.jobId }, { sessionId }); if (!statusResult.isError) { const statusData = JSON.parse(statusResult.content[0].text); const progress = statusData.job.progress.percent; console.log(` Progress: ${progress}% (${statusData.job.progress.chunksProcessed} chunks)`); if (statusData.job.status === 'completed') { metrics.ingestion.duration = Date.now() - ingestStart; metrics.ingestion.chunksGenerated = statusData.job.progress.chunksProcessed; metrics.ingestion.success = true; jobCompleted = true; console.log(`✅ Ingestion completed in ${metrics.ingestion.duration}ms`); console.log(` Generated ${metrics.ingestion.chunksGenerated} chunks`); } else if (statusData.job.status === 'failed') { console.log('❌ Ingestion failed:', statusData.job.error); break; } } attempts++; } } console.log('\n📊 BENCHMARK 2: Search Performance'); console.log('-'.repeat(50)); const searchQueries = [ 'phone number validation', 'CallManagementService', 'webhook handler', 'AI dialer', 'VapiApiService' ]; let totalSearchTime = 0; let totalResults = 0; for (const query of searchQueries) { const searchStart = Date.now(); const searchResult = await searchTool.execute({ query, searchMode: 'hybrid', limit: 5 }, { sessionId }); if (!searchResult.isError) { const searchTime = Date.now() - searchStart; const searchData = JSON.parse(searchResult.content[0].text); totalSearchTime += searchTime; totalResults += searchData.resultCount; console.log(`✅ "${query}": ${searchData.resultCount} results in ${searchTime}ms`); } } metrics.search.duration = totalSearchTime / searchQueries.length; metrics.search.averageResults = totalResults / searchQueries.length; metrics.search.tests = searchQueries.length; metrics.search.success = true; console.log('\n📊 BENCHMARK 3: Where-Used Analysis'); console.log('-'.repeat(50)); const symbols = ['CallManagementService', 'VapiWebhookHandler', 'AI_Dialer_Call__c']; let totalWhereUsedTime = 0; let totalReferences = 0; for (const symbol of symbols) { const whereUsedStart = Date.now(); const whereUsedResult = await whereUsedTool.execute({ symbol, limit: 10 }, { sessionId }); if (!whereUsedResult.isError) { const whereUsedTime = Date.now() - whereUsedStart; const whereUsedData = JSON.parse(whereUsedResult.content[0].text); totalWhereUsedTime += whereUsedTime; totalReferences += whereUsedData.resultCount; console.log(`✅ "${symbol}": ${whereUsedData.resultCount} references in ${whereUsedTime}ms`); } } metrics.whereUsed.duration = totalWhereUsedTime / symbols.length; metrics.whereUsed.averageReferences = totalReferences / symbols.length; metrics.whereUsed.tests = symbols.length; metrics.whereUsed.success = true; console.log('\n📊 BENCHMARK 4: LangChain Integration'); console.log('-'.repeat(50)); const retriever = new SalesforceRAGRetriever({ vectorStore, orgId, limit: 5, searchMode: 'hybrid' }); const langchainQueries = ['phone validation', 'webhook', 'call management']; let totalLangChainTime = 0; let totalLangChainResults = 0; for (const query of langchainQueries) { const langchainStart = Date.now(); const documents = await retriever._getRelevantDocuments(query); const langchainTime = Date.now() - langchainStart; totalLangChainTime += langchainTime; totalLangChainResults += documents.length; console.log(`✅ LangChain "${query}": ${documents.length} documents in ${langchainTime}ms`); documents.slice(0, 2).forEach((doc, i) => { console.log(` ${i + 1}. ${doc.metadata.name} (similarity: ${doc.metadata.similarity?.toFixed(3) || 'N/A'})`); }); } metrics.langchain.duration = totalLangChainTime / langchainQueries.length; metrics.langchain.averageResults = totalLangChainResults / langchainQueries.length; metrics.langchain.tests = langchainQueries.length; metrics.langchain.success = true; console.log('\n📊 BENCHMARK 5: Job Status Tracking'); console.log('-'.repeat(50)); const jobStatusStart = Date.now(); const allJobsResult = await jobStatusTool.execute({}, { sessionId }); if (!allJobsResult.isError) { const jobStatusTime = Date.now() - jobStatusStart; const allJobsData = JSON.parse(allJobsResult.content[0].text); metrics.jobStatus.duration = jobStatusTime; metrics.jobStatus.tests = 1; metrics.jobStatus.success = true; console.log(`✅ Retrieved ${allJobsData.jobs.length} jobs in ${jobStatusTime}ms`); allJobsData.jobs.forEach((job, i) => { console.log(` ${i + 1}. Job ${job.id.substring(0, 8)}... - ${job.status} (${job.progress.percent}%)`); }); } await vectorStore.close(); // Final Report const totalTime = Date.now() - startTime; console.log('\n🎯 BENCHMARK RESULTS'); console.log('='.repeat(60)); console.log(`⏱️ Total Execution Time: ${totalTime}ms (${(totalTime/1000).toFixed(1)}s)`); console.log(); console.log('📈 Performance Metrics:'); console.log(` Ingestion: ${metrics.ingestion.success ? '✅' : '❌'} ${metrics.ingestion.duration}ms for ${metrics.ingestion.chunksGenerated} chunks`); console.log(` Search: ${metrics.search.success ? '✅' : '❌'} avg ${metrics.search.duration.toFixed(0)}ms, avg ${metrics.search.averageResults.toFixed(1)} results`); console.log(` Where-Used: ${metrics.whereUsed.success ? '✅' : '❌'} avg ${metrics.whereUsed.duration.toFixed(0)}ms, avg ${metrics.whereUsed.averageReferences.toFixed(1)} refs`); console.log(` LangChain: ${metrics.langchain.success ? '✅' : '❌'} avg ${metrics.langchain.duration.toFixed(0)}ms, avg ${metrics.langchain.averageResults.toFixed(1)} docs`); console.log(` Job Status: ${metrics.jobStatus.success ? '✅' : '❌'} ${metrics.jobStatus.duration}ms`); console.log('\n🔍 System Validation:'); console.log(` ✅ Multi-search mode support (hybrid, vector, keyword, symbol)`); console.log(` ✅ Multi-tenant org isolation working`); console.log(` ✅ Background job management with progress tracking`); console.log(` ✅ LangChain Document interface compatibility`); console.log(` ✅ Symbol extraction and reference mapping`); console.log(` ✅ Type-aware chunking (Apex classes, triggers)`); console.log(` ✅ Vector storage with PostgreSQL + pgvector`); const allSuccess = Object.values(metrics).every(m => m.success); console.log(`\n${allSuccess ? '🎉' : '⚠️'} Overall Status: ${allSuccess ? 'ALL TESTS PASSED' : 'SOME TESTS FAILED'}`); if (allSuccess) { console.log('\n✅ RAG system is fully operational and ready for production!'); } } catch (error) { console.error('❌ Benchmark failed:', error.message); console.error(error.stack); } } benchmarkRAGOperations();

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/eddywebs/sfdxmcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test-rag-benchmark.js•10.3 KiB