"""MCP server implementation for Obsidian vault search."""
import asyncio
import logging
from pathlib import Path
from typing import Any, Dict, List, Optional, Union
import click
from mcp import McpError
from mcp.server import Server
from mcp.server.models import InitializationOptions
from mcp.server.stdio import stdio_server
from mcp.types import (
    INTERNAL_ERROR,
    METHOD_NOT_FOUND,
    ErrorData,
    ServerCapabilities,
    TextContent,
    Tool,
)
from .config import ServerConfig, load_config_from_env
from .parser import ObsidianParser
from .search import HybridSearchEngine
from .startup_coordination import StartupCoordinator
from .watcher import VaultWatcherManager
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
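
# Typical embedding (a minimal sketch; assumes configuration is supplied via
# the environment variables read by load_config_from_env):
#
#   config = load_config_from_env()
#   server = ObsidianMCPServer(config)
#   asyncio.run(server.run())
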
class ObsidianMCPServer:
"""MCP Server for Obsidian vault search."""
def __init__(self, config: ServerConfig):
"""Initialize the server with configuration."""
self.config = config
self.parser = ObsidianParser(config.vault_path)
logger.info(f"Initializing search index at: {config.index_path}")
logger.info(f"Vault path: {config.vault_path}")
self.search_index = HybridSearchEngine(config)
self.watcher = VaultWatcherManager(
vault_path=config.vault_path,
parser=self.parser,
search_index=self.search_index,
enabled=config.watch_for_changes,
use_polling=config.use_polling_observer,
)
self.server: Server[Any, Any] = Server("obsidian-mcp-server")
self._setup_tools()
# Store flag to initialize index later in async context
self._should_initialize_index = config.auto_rebuild_index
def _setup_tools(self) -> None:
"""Setup MCP tools."""
@self.server.list_tools() # type: ignore[no-untyped-call]
async def list_tools() -> List[Tool]:
"""List available tools."""
return [
Tool(
name="search_notes",
description="Search through Obsidian notes using full-text search",
inputSchema={
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "Search query string",
},
"tags": {
"type": "array",
"items": {"type": "string"},
"description": "Filter by specific tags (optional)",
},
"limit": {
"type": "integer",
"description": "Maximum number of results (default: 10)",
"default": 10,
},
},
"required": ["query"],
},
),
Tool(
name="get_note",
description="Get the full content of a specific note by path or title",
inputSchema={
"type": "object",
"properties": {
"identifier": {
"type": "string",
"description": "Note path (relative to vault) or note title",
}
},
"required": ["identifier"],
},
),
Tool(
name="list_recent_notes",
description="Get recently modified notes",
inputSchema={
"type": "object",
"properties": {
"limit": {
"type": "integer",
"description": "Maximum number of notes to return (default: 10)",
"default": 10,
}
},
},
),
Tool(
name="get_all_tags",
description="Get all available tags in the vault",
inputSchema={"type": "object", "properties": {}},
),
Tool(
name="search_by_tag",
description="Find all notes with specific tags",
inputSchema={
"type": "object",
"properties": {
"tags": {
"type": "array",
"items": {"type": "string"},
"description": "Tags to search for",
},
"limit": {
"type": "integer",
"description": "Maximum number of results (default: 20)",
"default": 20,
},
},
"required": ["tags"],
},
),
Tool(
name="get_vault_stats",
description="Get statistics about the vault and search index",
inputSchema={"type": "object", "properties": {}},
),
Tool(
name="semantic_search",
description="Search notes using semantic/vector similarity",
inputSchema={
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "Search query string",
},
"limit": {
"type": "integer",
"description": "Maximum number of results (default: 10)",
"default": 10,
},
},
"required": ["query"],
},
),
Tool(
name="find_similar_notes",
description="Find notes similar to a given note",
inputSchema={
"type": "object",
"properties": {
"note_path": {
"type": "string",
"description": "Path to the reference note (relative to vault)",
},
"limit": {
"type": "integer",
"description": "Maximum number of results (default: 10)",
"default": 10,
},
},
"required": ["note_path"],
},
),
]
@self.server.call_tool()
async def call_tool(name: str, arguments: Dict[str, Any]) -> List[TextContent]:
"""Handle tool calls."""
            handlers = {
                "search_notes": self._search_notes,
                "get_note": self._get_note,
                "list_recent_notes": self._list_recent_notes,
                "get_all_tags": self._get_all_tags,
                "search_by_tag": self._search_by_tag,
                "get_vault_stats": self._get_vault_stats,
                "semantic_search": self._semantic_search,
                "find_similar_notes": self._find_similar_notes,
            }
            handler = handlers.get(name)
            if handler is None:
                raise McpError(
                    ErrorData(code=METHOD_NOT_FOUND, message=f"Unknown tool: {name}")
                )
            try:
                return await handler(arguments)
            except McpError:
                # Protocol-level errors already carry their own codes; propagate unchanged.
                raise
            except Exception as e:
                logger.error(f"Error in tool {name}: {e}")
                raise McpError(
                    ErrorData(code=INTERNAL_ERROR, message=f"Tool execution failed: {e}")
                ) from e
async def _search_notes(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Search notes using full-text search."""
query = arguments.get("query", "")
tags = set(arguments.get("tags", []))
limit = min(arguments.get("limit", 10), self.config.max_results)
if not query.strip():
return [TextContent(type="text", text="Empty search query")]
results = self.search_index.search(
query=query, limit=limit, tags=tags if tags else None
)
if not results:
return [
TextContent(type="text", text=f"No results found for query: {query}")
]
# Format results
response_parts = [f"Found {len(results)} results for '{query}':\n"]
for i, result in enumerate(results, 1):
response_parts.append(f"{i}. **{result['title']}**")
response_parts.append(f" Path: {result['path']}")
if result["tags"]:
response_parts.append(f" Tags: {', '.join(result['tags'])}")
response_parts.append(f" Score: {result['score']:.2f}")
# Add content preview
content_preview = result["content"][:300]
if len(result["content"]) > 300:
content_preview += "..."
response_parts.append(f" Preview: {content_preview}")
response_parts.append("")
return [TextContent(type="text", text="\n".join(response_parts))]
async def _semantic_search(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Perform pure semantic/vector search."""
query = arguments.get("query", "")
limit = min(arguments.get("limit", 10), self.config.max_results)
if not query.strip():
return [TextContent(type="text", text="Empty search query")]
results = self.search_index.semantic_search(query, limit)
if not results:
return [
TextContent(
type="text",
text=f"No semantically similar results found for: {query}",
)
]
response_parts = [
f"Found {len(results)} semantically similar results for '{query}':\n"
]
for i, result in enumerate(results, 1):
response_parts.append(f"{i}. **{result['title']}**")
response_parts.append(f" Path: {result['path']}")
if result["tags"]:
response_parts.append(f" Tags: {', '.join(result['tags'])}")
response_parts.append(
f" Similarity: {result.get('similarity_score', 0):.3f}"
)
# Add content preview
content_preview = result["content"][:300]
if len(result["content"]) > 300:
content_preview += "..."
response_parts.append(f" Preview: {content_preview}")
response_parts.append("")
return [TextContent(type="text", text="\n".join(response_parts))]
async def _find_similar_notes(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Find notes similar to a given note."""
note_path = arguments.get("note_path", "")
limit = min(arguments.get("limit", 10), self.config.max_results)
if not note_path:
return [TextContent(type="text", text="Note path is required")]
# Convert to absolute path if needed
if not note_path.startswith(str(self.config.vault_path)):
full_path = str(self.config.vault_path / note_path)
else:
full_path = note_path
results = self.search_index.find_similar_notes(full_path, limit)
if not results:
return [
TextContent(
type="text", text=f"No similar notes found for: {note_path}"
)
]
response_parts = [f"Found {len(results)} notes similar to '{note_path}':\n"]
for i, result in enumerate(results, 1):
response_parts.append(f"{i}. **{result['title']}**")
response_parts.append(f" Path: {result['path']}")
if result["tags"]:
response_parts.append(f" Tags: {', '.join(result['tags'])}")
response_parts.append(
f" Similarity: {result.get('similarity_score', 0):.3f}"
)
# Add content preview
content_preview = result["content"][:300]
if len(result["content"]) > 300:
content_preview += "..."
response_parts.append(f" Preview: {content_preview}")
response_parts.append("")
return [TextContent(type="text", text="\n".join(response_parts))]
async def _get_note(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Get full content of a specific note."""
identifier = arguments.get("identifier", "")
if not identifier:
return [TextContent(type="text", text="Note identifier is required")]
# Try to find by path first
note_path = self.config.vault_path / identifier
if not note_path.exists():
# Try with .md extension
note_path = self.config.vault_path / f"{identifier}.md"
result = None
if note_path.exists():
result = self.search_index.get_note_by_path(note_path)
if not result:
# Try to find by title through search
search_results = self.search_index.search(f'title:"{identifier}"', limit=1)
if search_results:
result = search_results[0]
if not result:
return [TextContent(type="text", text=f"Note not found: {identifier}")]
# Format note content
response_parts = [
f"# {result['title']}",
f"**Path:** {result['path']}",
]
if result["tags"]:
response_parts.append(f"**Tags:** {', '.join(result['tags'])}")
if result["modified_date"]:
response_parts.append(f"**Modified:** {result['modified_date']}")
response_parts.extend(["", "## Content", result["content"]])
return [TextContent(type="text", text="\n".join(response_parts))]
async def _list_recent_notes(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""List recently modified notes."""
limit = min(arguments.get("limit", 10), self.config.max_results)
recent_notes = self.search_index.get_recent_notes(limit=limit)
if not recent_notes:
return [TextContent(type="text", text="No notes found")]
response_parts = [f"Recently modified notes (showing {len(recent_notes)}):\n"]
for i, note in enumerate(recent_notes, 1):
response_parts.append(f"{i}. **{note['title']}**")
response_parts.append(f" Path: {note['path']}")
if note["modified_date"]:
response_parts.append(f" Modified: {note['modified_date']}")
if note["tags"]:
response_parts.append(f" Tags: {', '.join(note['tags'])}")
            # Add content preview (truncated so long notes don't flood the output)
            preview = note["content"][:300]
            if len(note["content"]) > 300:
                preview += "..."
            response_parts.append(f" Preview: {preview}")
response_parts.append("")
return [TextContent(type="text", text="\n".join(response_parts))]
async def _get_all_tags(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Get all available tags."""
tags = self.search_index.list_all_tags()
if not tags:
return [TextContent(type="text", text="No tags found in the vault")]
response = f"Found {len(tags)} tags:\n\n" + "\n".join(
f"- {tag}" for tag in tags
)
return [TextContent(type="text", text=response)]
async def _search_by_tag(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Search notes by specific tags."""
tags = arguments.get("tags", [])
limit = min(arguments.get("limit", 20), self.config.max_results)
if not tags:
return [TextContent(type="text", text="No tags specified")]
        # Build an OR query over the tags field, e.g. "tags:project OR tags:idea"
        tag_query = " OR ".join(f"tags:{tag}" for tag in tags)
results = self.search_index.search(query=tag_query, limit=limit)
if not results:
return [
TextContent(
type="text", text=f"No notes found with tags: {', '.join(tags)}"
)
]
response_parts = [f"Found {len(results)} notes with tags {', '.join(tags)}:\n"]
        for i, result in enumerate(results, 1):
            response_parts.append(f"{i}. **{result['title']}**")
            response_parts.append(f" Path: {result['path']}")
            if result["tags"]:
                response_parts.append(f" Tags: {', '.join(result['tags'])}")
            # Truncate the preview; only add an ellipsis when content was cut
            preview = result["content"][:200]
            if len(result["content"]) > 200:
                preview += "..."
            response_parts.append(f" Preview: {preview}")
            response_parts.append("")
return [TextContent(type="text", text="\n".join(response_parts))]
async def _get_vault_stats(self, arguments: Dict[str, Any]) -> List[TextContent]:
"""Get vault and index statistics."""
try:
# Get index stats
index_stats = self.search_index.get_stats()
# Get watcher stats
watcher_stats = self.watcher.get_stats()
# Get vault info
vault_notes = self.parser.discover_notes()
# Show first few files for debugging
file_list = ""
if vault_notes:
                def format_note_path(note: Union[Path, str]) -> str:
                    """Render a note location relative to the vault when possible."""
                    if isinstance(note, Path):
                        return str(note.relative_to(self.config.vault_path))
                    return str(note)
file_list = "\n" + "\n".join(
f" - {format_note_path(note)}" for note in vault_notes[:5]
)
if len(vault_notes) > 5:
file_list += f"\n - ... and {len(vault_notes) - 5} more"
else:
file_list = "\n - No .md files found"
response_parts = [
"# Vault Statistics",
"",
"## Vault Information",
f"- **Path:** {self.config.vault_path}",
f"- **Path exists:** {self.config.vault_path.exists()}",
f"- **Total markdown files:** {len(vault_notes)}{file_list}",
"",
"## Search Index",
f"- **Indexed documents:** {index_stats.get('doc_count', 0)}",
f"- **Index path:** {index_stats.get('index_path', 'Unknown')}",
f"- **Fields:** {', '.join(index_stats.get('field_names', []))}",
"",
"## File Watcher",
f"- **Enabled:** {watcher_stats.get('enabled', False)}",
f"- **Running:** {watcher_stats.get('running', False)}",
f"- **Files updated:** {watcher_stats.get('files_updated', 0)}",
f"- **Files deleted:** {watcher_stats.get('files_deleted', 0)}",
f"- **Files moved:** {watcher_stats.get('files_moved', 0)}",
"",
"## Configuration",
f"- **Max results:** {self.config.max_results}",
f"- **Auto rebuild index:** {self.config.auto_rebuild_index}",
f"- **Watch for changes:** {self.config.watch_for_changes}",
f"- **Include content in search:** {self.config.include_content_in_search}",
]
return [TextContent(type="text", text="\n".join(response_parts))]
except Exception as e:
logger.error(f"Error getting vault stats: {e}")
return [TextContent(type="text", text=f"Error retrieving stats: {str(e)}")]
async def _initialize_index(self) -> None:
"""Initialize the search index with process coordination to prevent conflicts."""
logger.info("Initializing search index...")
try:
# First check how many notes exist in vault
note_paths = self.parser.discover_notes()
logger.info(f"Discovered {len(note_paths)} notes in vault")
# Use startup coordination to prevent multiple processes from initializing simultaneously
if self.config.index_path is None:
raise ValueError("index_path cannot be None")
coordinator = StartupCoordinator(self.config.index_path, timeout=90.0)
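            # Coordination protocol: the fast path below skips work when the
            # index already matches the vault; otherwise exactly one process
            # acquires the lock and rebuilds while the others block in
            # wait_for_initialization() and then verify the result.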
# Fast path: check if index is already properly initialized
if self.search_index.is_properly_initialized(len(note_paths)):
logger.info(
"Index is already properly initialized, skipping initialization"
)
return
# Try to acquire coordination lock
if coordinator.acquire_coordination_lock():
# This process is the coordinator - perform initialization
logger.info("Acquired startup coordination lock, initializing index...")
await self._perform_index_initialization(note_paths)
# Release the lock to signal completion
coordinator.release_coordination_lock()
logger.info("Index initialization completed, lock released")
else:
# Another process is coordinating - wait for completion
logger.info(
"Another process is initializing the index, waiting for completion..."
)
if coordinator.wait_for_initialization():
logger.info("Index initialization completed by another process")
# Verify the index is now properly initialized
if self.search_index.is_properly_initialized(len(note_paths)):
logger.info("Verified: Index is properly initialized")
else:
logger.warning(
"Index initialization by another process may have failed, attempting fallback"
)
await self._perform_index_initialization(note_paths)
else:
logger.error(
"Timeout waiting for another process to complete initialization"
)
raise RuntimeError(
"Failed to coordinate index initialization with other processes. "
"This may indicate multiple server instances are stuck or there's a stale lock file."
)
except Exception as e:
logger.error(f"Failed to initialize index: {e}")
raise
async def _perform_index_initialization(self, note_paths: List[Path]) -> None:
"""Perform the actual index initialization work.
Args:
note_paths: List of paths to markdown notes discovered in the vault.
"""
try:
# Check current index stats
current_stats = self.search_index.get_stats()
logger.info(
f"Current index has {current_stats.get('doc_count', 0)} documents"
)
# If we have notes but no index, or index needs update
if note_paths and (
current_stats.get("doc_count", 0) == 0
or self.search_index.needs_update(self.config.vault_path)
):
logger.info("Index needs updating...")
# Try incremental update first if index exists
if current_stats.get("doc_count", 0) > 0:
logger.info("Attempting incremental update...")
stats = self.search_index.incremental_update(
self.config.vault_path, self.parser
)
if stats["updated"] > 0 or stats["added"] > 0:
logger.info(f"Incremental update completed: {stats}")
return
logger.info("Performing full index rebuild...")
elif not note_paths:
logger.warning("No markdown notes found in vault")
return
else:
logger.info("Index is up to date")
return
# Full rebuild if incremental update wasn't sufficient
logger.info(f"Rebuilding index with {len(note_paths)} notes")
# Parse all notes
notes = []
for note_path in note_paths:
note = self.parser.parse_note(note_path)
if note:
notes.append(note)
logger.info(f"Successfully parsed {len(notes)} notes")
# Compute backlinks
self.parser.compute_backlinks(notes)
# Rebuild search index
self.search_index.rebuild_index(notes)
logger.info("Search index initialization completed successfully")
except Exception as e:
logger.error(f"Error during index initialization: {e}")
raise
async def run(self) -> None:
"""Run the MCP server."""
try:
# Initialize index if needed
if self._should_initialize_index:
await self._initialize_index()
# Start file watcher
self.watcher.start()
# Run MCP server
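            # stdio_server wires the MCP transport to this process's
            # stdin/stdout, so diagnostics must stay on stderr (the default
            # stream for logging.basicConfig).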
async with stdio_server() as (read_stream, write_stream):
initialization_options = InitializationOptions(
server_name="obsidian-mcp-server",
server_version="0.1.0",
capabilities=ServerCapabilities(),
)
await self.server.run(read_stream, write_stream, initialization_options)
finally:
# Clean up
self.watcher.stop()
@click.command()
@click.option(
    "--vault-path",
    type=click.Path(exists=True, file_okay=False, dir_okay=True, path_type=Path),
    help="Path to Obsidian vault directory",
)
@click.option(
    "--index-path",
    type=click.Path(path_type=Path),
    help="Path to store search index",
)
@click.option(
    "--max-results", type=int, default=50, help="Maximum number of search results"
)
def main(
vault_path: Optional[Path] = None,
index_path: Optional[Path] = None,
max_results: int = 50,
) -> None:
"""Run the Obsidian MCP Server."""
try:
# Load configuration
if vault_path:
config = ServerConfig(
vault_path=vault_path, index_path=index_path, max_results=max_results
)
else:
config = load_config_from_env()
# Create and run server
server = ObsidianMCPServer(config)
asyncio.run(server.run())
except Exception as e:
logger.error(f"Server failed: {e}")
raise
if __name__ == "__main__":
main()
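
# Example invocation (illustrative; assumes the package installs a console
# script named obsidian-mcp-server for main()):
#   obsidian-mcp-server --vault-path ~/Notes --index-path ~/.obsidian-index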