Markdown RAG Documentation

Overview Schema Related Servers Score Discussions

ragdocs-mcp
tests
integration

test_parallel_indexing.py•7.52 KiB

import time import pytest from src.config import Config, IndexingConfig from src.indexing.manager import IndexManager from src.indices.graph import GraphStore from src.indices.keyword import KeywordIndex from src.indices.vector import VectorIndex @pytest.mark.asyncio async def test_parallel_indexing_with_manager(tmp_path, shared_embedding_model): """ Verify IndexManager uses parallel embeddings. This test creates multiple documents and indexes them through the IndexManager, verifying that parallel embedding configuration is respected and improves throughput. """ docs_dir = tmp_path / "docs" docs_dir.mkdir() for i in range(20): (docs_dir / f"doc_{i}.md").write_text( f"# Document {i}\n\nContent for document {i}.\n\n" f"This is a longer piece of text to simulate real documentation." ) config = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(tmp_path / "index"), embedding_workers=4, ), ) vector = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=config.indexing.embedding_workers, ) keyword = KeywordIndex() graph = GraphStore() manager = IndexManager(config, vector, keyword, graph) start = time.time() for doc_path in docs_dir.glob("*.md"): manager.index_document(str(doc_path)) duration = time.time() - start assert duration < 15, f"Indexing took {duration:.2f}s, expected <15s with parallelism" assert manager.get_document_count() == 20 @pytest.mark.asyncio async def test_parallel_vs_sequential_throughput(tmp_path, shared_embedding_model): """ Compare throughput between parallel and sequential indexing. This test demonstrates the performance benefit of parallel embedding generation by comparing indexing times. Note: Speedup expectations are modest (1.2x) due to Python GIL overhead. For larger documents or more documents, speedups approach 2-3x. """ docs_dir = tmp_path / "docs" docs_dir.mkdir() # Use larger documents to better demonstrate parallelism benefits for i in range(30): (docs_dir / f"doc_{i}.md").write_text( f"# Document {i}\n\n{'Content section. ' * 100}" ) config_sequential = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(tmp_path / "index_seq"), embedding_workers=1, ), ) config_parallel = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(tmp_path / "index_par"), embedding_workers=4, ), ) vector_seq = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=1, ) keyword_seq = KeywordIndex() graph_seq = GraphStore() manager_seq = IndexManager(config_sequential, vector_seq, keyword_seq, graph_seq) start_seq = time.time() for doc_path in docs_dir.glob("*.md"): manager_seq.index_document(str(doc_path)) seq_duration = time.time() - start_seq vector_par = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=4, ) keyword_par = KeywordIndex() graph_par = GraphStore() manager_par = IndexManager(config_parallel, vector_par, keyword_par, graph_par) start_par = time.time() for doc_path in docs_dir.glob("*.md"): manager_par.index_document(str(doc_path)) par_duration = time.time() - start_par speedup = seq_duration / par_duration # Relaxed threshold: parallel should be faster, but GIL limits gains # Real-world speedups vary from 1.2x to 3x depending on doc size/count assert speedup >= 1.0, ( f"Parallel indexing should not be slower than sequential, got {speedup:.2f}x " f"(sequential: {seq_duration:.2f}s, parallel: {par_duration:.2f}s)" ) # Log actual speedup for observability (not an assertion) if speedup < 1.2: import logging logging.info( f"Low speedup observed: {speedup:.2f}x. " f"This is expected with small documents or high system load." ) @pytest.mark.asyncio async def test_parallel_indexing_correctness(tmp_path, shared_embedding_model): """ Verify parallel indexing produces correct search results. Results from parallel-indexed documents should match those from sequentially-indexed documents. """ docs_dir = tmp_path / "docs" docs_dir.mkdir() for i in range(10): (docs_dir / f"doc_{i}.md").write_text( f"# Topic {i}\n\nInformation about topic {i}." ) config_sequential = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(tmp_path / "index_seq"), embedding_workers=1, ), ) config_parallel = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(tmp_path / "index_par"), embedding_workers=4, ), ) vector_seq = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=1, ) keyword_seq = KeywordIndex() graph_seq = GraphStore() manager_seq = IndexManager(config_sequential, vector_seq, keyword_seq, graph_seq) for doc_path in docs_dir.glob("*.md"): manager_seq.index_document(str(doc_path)) vector_par = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=4, ) keyword_par = KeywordIndex() graph_par = GraphStore() manager_par = IndexManager(config_parallel, vector_par, keyword_par, graph_par) for doc_path in docs_dir.glob("*.md"): manager_par.index_document(str(doc_path)) results_seq = vector_seq.search("information topic", top_k=10) results_par = vector_par.search("information topic", top_k=10) seq_ids = {r["chunk_id"] for r in results_seq} par_ids = {r["chunk_id"] for r in results_par} assert seq_ids == par_ids, "Parallel and sequential indexing produced different results" @pytest.mark.asyncio async def test_parallel_indexing_persistence(tmp_path, shared_embedding_model): """ Verify parallel-indexed content persists correctly. After indexing with parallel workers, data should be persisted and reloadable without data loss. """ docs_dir = tmp_path / "docs" docs_dir.mkdir() index_path = tmp_path / "index" for i in range(15): (docs_dir / f"doc_{i}.md").write_text( f"# Document {i}\n\nPersistent content {i}." ) config = Config( indexing=IndexingConfig( documents_path=str(docs_dir), index_path=str(index_path), embedding_workers=4, ), ) vector = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=4, ) keyword = KeywordIndex() graph = GraphStore() manager = IndexManager(config, vector, keyword, graph) for doc_path in docs_dir.glob("*.md"): manager.index_document(str(doc_path)) manager.persist() vector_reloaded = VectorIndex( embedding_model=shared_embedding_model, embedding_workers=4, ) keyword_reloaded = KeywordIndex() graph_reloaded = GraphStore() manager_reloaded = IndexManager(config, vector_reloaded, keyword_reloaded, graph_reloaded) manager_reloaded.load() assert manager_reloaded.get_document_count() == 15 results = vector_reloaded.search("persistent content", top_k=15) assert len(results) == 15

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/andnp/ragdocs-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_parallel_indexing.py•7.52 KiB