Math MCP Server

math-mcp
src
workers

parallel-matrix.ts•11.6 KiB

/** * @file parallel-matrix.ts * @description Parallel matrix operations using WebWorkers * * This module provides high-level functions for parallel matrix operations * that automatically chunk data and distribute work across worker threads. * * @module workers/parallel-matrix * @since 3.0.0 */ import { WorkerPool } from './worker-pool.js'; import { OperationType, DataChunk } from './worker-types.js'; import { chunkMatrixByRows, getOptimalChunkCount, } from './chunk-utils.js'; import { logger } from '../utils.js'; /** * Thresholds for when to use parallel processing. * Below these sizes, single-threaded WASM is faster due to overhead. * * @constant */ export const PARALLEL_THRESHOLDS = { /** Use parallel processing for matrix multiply when size >= 100×100 */ MATRIX_MULTIPLY: 100, /** Use parallel processing for matrix transpose when size >= 200×200 */ MATRIX_TRANSPOSE: 200, /** Use parallel processing for matrix add/subtract when size >= 200×200 */ MATRIX_ADD_SUB: 200, } as const; /** * Parallel matrix multiplication using worker pool. * * **Algorithm:** * 1. Split matrix A into row chunks * 2. Each worker multiplies its chunk of A with entire B * 3. Combine result chunks * * **Example:** * Matrix A (1000×1000) split into 4 chunks of 250 rows each * Worker 1: Rows 0-249 × B * Worker 2: Rows 250-499 × B * Worker 3: Rows 500-749 × B * Worker 4: Rows 750-999 × B * * @param {number[][]} a - First matrix (m×n) * @param {number[][]} b - Second matrix (n×p) * @param {WorkerPool} pool - Worker pool instance * @returns {Promise<number[][]>} Result matrix (m×p) * * @example * ```typescript * const a = create2DArray(1000, 1000); * const b = create2DArray(1000, 1000); * const result = await parallelMatrixMultiply(a, b, workerPool); * ``` */ export async function parallelMatrixMultiply( a: number[][], b: number[][], pool: WorkerPool ): Promise<number[][]> { const startTime = performance.now(); const size = a.length; logger.debug('Starting parallel matrix multiply', { sizeA: `${a.length}×${a[0]?.length || 0}`, sizeB: `${b.length}×${b[0]?.length || 0}`, }); // Determine optimal chunk count const numChunks = getOptimalChunkCount( size, pool.getAvailableWorkerCount(), 50 // Min 50 rows per chunk ); // Chunk matrix A by rows const chunks = chunkMatrixByRows(a, { numChunks }); // Process chunks in parallel const chunkPromises = chunks.map((chunk) => { return pool.execute<number[][]>({ operation: OperationType.MATRIX_MULTIPLY, data: { matrixA: chunk.data, matrixB: b, startRow: chunk.startIndex, endRow: chunk.endIndex, }, }); }); // Wait for all chunks const results = await Promise.all(chunkPromises); // Merge results const finalResult: number[][] = []; for (const result of results) { finalResult.push(...result); } const duration = performance.now() - startTime; logger.debug('Parallel matrix multiply completed', { duration: `${duration.toFixed(2)}ms`, chunks: chunks.length, resultSize: `${finalResult.length}×${finalResult[0]?.length || 0}`, }); return finalResult; } /** * Merges transposed matrix chunks into final result. * * **Optimized Algorithm (O(n²) instead of O(n³)):** * - Pre-allocates result array with correct dimensions * - Uses cache-friendly row-by-row copying instead of element-by-element * - Avoids triple nested loops * * **How it works:** * When we chunk a matrix by rows and transpose each chunk: * - Original matrix (rows×cols) split into chunks of chunkRows×cols * - Each transposed chunk is cols×chunkRows * - Final result needs to be cols×rows * * We merge by placing each transposed chunk's rows into the correct * columns of the result matrix. * * @param {number[][][]} transposedChunks - Array of transposed matrix chunks * @param {DataChunk<number[][]>[]} originalChunks - Original chunk metadata * @param {number} rows - Original matrix row count * @param {number} cols - Original matrix column count * @returns {number[][]} Merged transposed matrix (cols×rows) * * @private */ function mergeTransposedChunks( transposedChunks: number[][][], originalChunks: DataChunk<number[][]>[], rows: number, cols: number ): number[][] { // Pre-allocate result with correct dimensions: cols×rows const result = new Array<number[]>(cols); for (let i = 0; i < cols; i++) { result[i] = new Array<number>(rows); } // Merge chunks: each transposed chunk is cols×chunkRows // We need to place these columns into the correct positions for (let chunkIdx = 0; chunkIdx < transposedChunks.length; chunkIdx++) { const chunk = transposedChunks[chunkIdx]; const chunkMeta = originalChunks[chunkIdx]; const startCol = chunkMeta.startIndex; // Original row becomes column in transpose // Each row in the transposed chunk becomes part of a row in the final result // transposed chunk is cols×chunkRows for (let i = 0; i < chunk.length; i++) { // Copy this row (which is chunkRows long) into the correct position for (let j = 0; j < chunk[i].length; j++) { result[i][startCol + j] = chunk[i][j]; } } } return result; } /** * Parallel matrix transpose using worker pool. * * **Algorithm:** * 1. Split matrix into row chunks * 2. Each worker transposes its chunk * 3. Merge transposed chunks efficiently (O(n²) instead of O(n³)) * * @param {number[][]} matrix - Matrix to transpose (m×n) * @param {WorkerPool} pool - Worker pool instance * @returns {Promise<number[][]>} Transposed matrix (n×m) * * @example * ```typescript * const matrix = create2DArray(1000, 1000); * const transposed = await parallelMatrixTranspose(matrix, workerPool); * ``` */ export async function parallelMatrixTranspose( matrix: number[][], pool: WorkerPool ): Promise<number[][]> { const startTime = performance.now(); const rows = matrix.length; const cols = matrix[0]?.length || 0; logger.debug('Starting parallel matrix transpose', { size: `${rows}×${cols}`, }); // Determine optimal chunk count const numChunks = getOptimalChunkCount( rows, pool.getAvailableWorkerCount(), 100 // Min 100 rows per chunk ); // Chunk matrix by rows const chunks = chunkMatrixByRows(matrix, { numChunks }); // Process chunks in parallel const chunkPromises = chunks.map((chunk) => { return pool.execute<number[][]>({ operation: OperationType.MATRIX_TRANSPOSE, data: { matrixA: chunk.data, startRow: chunk.startIndex, endRow: chunk.endIndex, }, }); }); // Wait for all chunks const results = await Promise.all(chunkPromises); // Merge transposed chunks using optimized O(n²) algorithm const transposed = mergeTransposedChunks(results, chunks, rows, cols); const duration = performance.now() - startTime; logger.debug('Parallel matrix transpose completed', { duration: `${duration.toFixed(2)}ms`, chunks: chunks.length, resultSize: `${transposed.length}×${transposed[0]?.length || 0}`, }); return transposed; } /** * Parallel matrix addition using worker pool. * * **Algorithm:** * 1. Split both matrices into corresponding row chunks * 2. Each worker adds its pair of chunks * 3. Combine result chunks * * @param {number[][]} a - First matrix * @param {number[][]} b - Second matrix (same dimensions as a) * @param {WorkerPool} pool - Worker pool instance * @returns {Promise<number[][]>} Result matrix (a + b) * * @example * ```typescript * const a = create2DArray(1000, 1000); * const b = create2DArray(1000, 1000); * const sum = await parallelMatrixAdd(a, b, workerPool); * ``` */ export async function parallelMatrixAdd( a: number[][], b: number[][], pool: WorkerPool ): Promise<number[][]> { const startTime = performance.now(); const rows = a.length; logger.debug('Starting parallel matrix add', { size: `${a.length}×${a[0]?.length || 0}`, }); // Determine optimal chunk count const numChunks = getOptimalChunkCount( rows, pool.getAvailableWorkerCount(), 100 // Min 100 rows per chunk ); // Chunk both matrices by rows const chunksA = chunkMatrixByRows(a, { numChunks }); const chunksB = chunkMatrixByRows(b, { numChunks }); // Process chunks in parallel const chunkPromises = chunksA.map((chunkA, index) => { const chunkB = chunksB[index]; return pool.execute<number[][]>({ operation: OperationType.MATRIX_ADD, data: { matrixA: chunkA.data, matrixB: chunkB.data, startRow: chunkA.startIndex, endRow: chunkA.endIndex, }, }); }); // Wait for all chunks const results = await Promise.all(chunkPromises); // Merge results const finalResult: number[][] = []; for (const result of results) { finalResult.push(...result); } const duration = performance.now() - startTime; logger.debug('Parallel matrix add completed', { duration: `${duration.toFixed(2)}ms`, chunks: chunksA.length, }); return finalResult; } /** * Parallel matrix subtraction using worker pool. * * **Algorithm:** * 1. Split both matrices into corresponding row chunks * 2. Each worker subtracts its pair of chunks * 3. Combine result chunks * * @param {number[][]} a - First matrix * @param {number[][]} b - Second matrix (same dimensions as a) * @param {WorkerPool} pool - Worker pool instance * @returns {Promise<number[][]>} Result matrix (a - b) * * @example * ```typescript * const a = create2DArray(1000, 1000); * const b = create2DArray(1000, 1000); * const diff = await parallelMatrixSubtract(a, b, workerPool); * ``` */ export async function parallelMatrixSubtract( a: number[][], b: number[][], pool: WorkerPool ): Promise<number[][]> { const startTime = performance.now(); const rows = a.length; logger.debug('Starting parallel matrix subtract', { size: `${a.length}×${a[0]?.length || 0}`, }); // Determine optimal chunk count const numChunks = getOptimalChunkCount( rows, pool.getAvailableWorkerCount(), 100 // Min 100 rows per chunk ); // Chunk both matrices by rows const chunksA = chunkMatrixByRows(a, { numChunks }); const chunksB = chunkMatrixByRows(b, { numChunks }); // Process chunks in parallel const chunkPromises = chunksA.map((chunkA, index) => { const chunkB = chunksB[index]; return pool.execute<number[][]>({ operation: OperationType.MATRIX_SUBTRACT, data: { matrixA: chunkA.data, matrixB: chunkB.data, startRow: chunkA.startIndex, endRow: chunkA.endIndex, }, }); }); // Wait for all chunks const results = await Promise.all(chunkPromises); // Merge results const finalResult: number[][] = []; for (const result of results) { finalResult.push(...result); } const duration = performance.now() - startTime; logger.debug('Parallel matrix subtract completed', { duration: `${duration.toFixed(2)}ms`, chunks: chunksA.length, }); return finalResult; } /** * Determines if an operation should use parallel processing. * * @param {number} size - Matrix dimension (number of rows) * @param {'multiply' | 'transpose' | 'add' | 'subtract'} operation - Operation type * @returns {boolean} True if parallel processing is beneficial */ export function shouldUseParallel( size: number, operation: 'multiply' | 'transpose' | 'add' | 'subtract' ): boolean { switch (operation) { case 'multiply': return size >= PARALLEL_THRESHOLDS.MATRIX_MULTIPLY; case 'transpose': return size >= PARALLEL_THRESHOLDS.MATRIX_TRANSPOSE; case 'add': case 'subtract': return size >= PARALLEL_THRESHOLDS.MATRIX_ADD_SUB; default: return false; } }

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/danielsimonjr/math-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

parallel-matrix.ts•11.6 KiB