mcp-dbutils

MIT License
OverviewInspectSchema Related Servers Reviews Score
src
mcp_dbutils
"""Connection server base class"""

import json
from abc import ABC, abstractmethod
from contextlib import asynccontextmanager
from datetime import datetime
from importlib.metadata import metadata
from typing import Any, AsyncContextManager, Dict

import mcp.server.stdio
import mcp.types as types
import yaml
from mcp.server import Server

from .log import create_logger
from .stats import ResourceStats


class ConnectionHandlerError(Exception):
    """Base exception for connection errors"""


class ConfigurationError(ConnectionHandlerError):
    """Configuration related errors"""


class ConnectionError(ConnectionHandlerError):
    """Connection related errors"""



DATABASE_CONNECTION_NAME = "Database connection name"
EMPTY_QUERY_ERROR = "SQL query cannot be empty"
SQL_QUERY_REQUIRED_ERROR = "SQL query required for explain-query tool"
EMPTY_TABLE_NAME_ERROR = "Table name cannot be empty"
CONNECTION_NAME_REQUIRED_ERROR = "Connection name must be specified"
SELECT_ONLY_ERROR = "Only SELECT queries are supported for security reasons"
INVALID_URI_FORMAT_ERROR = "Invalid resource URI format"

# 获取包信息用于日志命名
pkg_meta = metadata("mcp-dbutils")


LOG_NAME = "dbutils"

# MCP日志级别常量
LOG_LEVEL_DEBUG = "debug"       # 0
LOG_LEVEL_INFO = "info"        # 1
LOG_LEVEL_NOTICE = "notice"    # 2
LOG_LEVEL_WARNING = "warning"  # 3
LOG_LEVEL_ERROR = "error"      # 4
LOG_LEVEL_CRITICAL = "critical" # 5
LOG_LEVEL_ALERT = "alert"      # 6
LOG_LEVEL_EMERGENCY = "emergency" # 7

class ConnectionHandler(ABC):
    """Abstract base class defining common interface for connection handlers"""

    def __init__(self, config_path: str, connection: str, debug: bool = False):
        """Initialize connection handler

        Args:
            config_path: Path to configuration file
            connection: str = DATABASE_CONNECTION_NAME
            debug: Enable debug mode
        """
        self.config_path = config_path
        self.connection = connection
        self.debug = debug
        # 创建stderr日志记录器用于本地调试
        self.log = create_logger(f"{LOG_NAME}.handler.{connection}", debug)
        self.stats = ResourceStats()
        self._session = None

    def send_log(self, level: str, message: str):
        """通过MCP发送日志消息和写入stderr

        Args:
            level: 日志级别 (debug/info/notice/warning/error/critical/alert/emergency)
            message: 日志内容
        """
        # 本地stderr日志
        self.log(level, message)

        # MCP日志通知
        if self._session and hasattr(self._session, 'request_context'):
            self._session.request_context.session.send_log_message(
                level=level,
                data=message


    @property
    @abstractmethod
    def db_type(self) -> str:
        """Return database type"""
        pass

    @abstractmethod
    async def get_tables(self) -> list[types.Resource]:
        """Get list of table resources from database connection"""
        pass

    @abstractmethod
    async def get_schema(self, table_name: str) -> str:
        """Get schema information for specified table"""
        pass

    @abstractmethod
    async def _execute_query(self, sql: str) -> str:
        """Internal query execution method to be implemented by subclasses"""
        pass

    async def execute_query(self, sql: str) -> str:
        """Execute SQL query with performance tracking"""
        start_time = datetime.now()
        try:
            self.stats.record_query()
            result = await self._execute_query(sql)
            duration = (datetime.now() - start_time).total_seconds()
            self.stats.record_query_duration(sql, duration)
            self.stats.update_memory_usage(result)
            self.send_log(LOG_LEVEL_INFO, f"Query executed in {duration*1000:.2f}ms. Resource stats: {json.dumps(self.stats.to_dict())}")
            return result
        except Exception as e:
            duration = (datetime.now() - start_time).total_seconds()
            self.stats.record_error(e.__class__.__name__)
            self.send_log(LOG_LEVEL_ERROR, f"Query error after {duration*1000:.2f}ms - {str(e)}\nResource stats: {json.dumps(self.stats.to_dict())}")
            raise

    @abstractmethod
    async def get_table_description(self, table_name: str) -> str:
        """Get detailed table description including columns, types, and comments

        Args:
            table_name: Name of the table to describe

        Returns:
            Formatted table description
        """
        pass

    @abstractmethod
    async def get_table_ddl(self, table_name: str) -> str:
        """Get DDL statement for table including columns, constraints and indexes

        Args:
            table_name: Name of the table to get DDL for

        Returns:
            DDL statement as string
        """
        pass

    @abstractmethod
    async def get_table_indexes(self, table_name: str) -> str:
        """Get index information for table

        Args:
            table_name: Name of the table to get indexes for

        Returns:
            Formatted index information
        """
        pass

    @abstractmethod
    async def get_table_stats(self, table_name: str) -> str:
        """Get table statistics information

        Args:
            table_name: Name of the table to get statistics for

        Returns:
            Formatted statistics information including row count, size, etc.
        """
        pass

    @abstractmethod
    async def get_table_constraints(self, table_name: str) -> str:
        """Get constraint information for table

        Args:
            table_name: Name of the table to get constraints for

        Returns:
            Formatted constraint information including primary keys, foreign keys, etc.
        """
        pass

    @abstractmethod
    async def explain_query(self, sql: str) -> str:
        """Get query execution plan

        Args:
            sql: SQL query to explain

        Returns:
            Formatted query execution plan with cost estimates
        """
        pass

    @abstractmethod
    async def cleanup(self):
        """Cleanup resources"""
        pass

    async def execute_tool_query(self, tool_name: str, table_name: str = "", sql: str = "") -> str:
        """Execute a tool query and return formatted result

        Args:
            tool_name: Name of the tool to execute
            table_name: Name of the table to query (for table-related tools)
            sql: SQL query (for query-related tools)

        Returns:
            Formatted query result
        """
        try:
            self.stats.record_query()

            if tool_name == "dbutils-describe-table":
                result = await self.get_table_description(table_name)
            elif tool_name == "dbutils-get-ddl":
                result = await self.get_table_ddl(table_name)
            elif tool_name == "dbutils-list-indexes":
                result = await self.get_table_indexes(table_name)
            elif tool_name == "dbutils-get-stats":
                result = await self.get_table_stats(table_name)
            elif tool_name == "dbutils-list-constraints":
                result = await self.get_table_constraints(table_name)
            elif tool_name == "dbutils-explain-query":
                if not sql:
                    raise ValueError(SQL_QUERY_REQUIRED_ERROR)
                result = await self.explain_query(sql)
            else:
                raise ValueError(f"Unknown tool: {tool_name}")

            self.stats.update_memory_usage(result)
            self.send_log(LOG_LEVEL_INFO, f"Resource stats: {json.dumps(self.stats.to_dict())}")
            return f"[{self.db_type}]\n{result}"

        except Exception as e:
            self.stats.record_error(e.__class__.__name__)
            self.send_log(LOG_LEVEL_ERROR, f"Tool error - {str(e)}\nResource stats: {json.dumps(self.stats.to_dict())}")
            raise

class ConnectionServer:
    """Unified connection server class"""

    def __init__(self, config_path: str, debug: bool = False):
        """Initialize connection server

        Args:
            config_path: Path to configuration file
            debug: Enable debug mode
        """
        self.config_path = config_path
        self.debug = debug
        # 获取包信息用于服务器配置
        pkg_meta = metadata("mcp-dbutils")
        self.logger = create_logger(f"{LOG_NAME}.server", debug)
        self.server = Server(
            name=LOG_NAME,
            version=pkg_meta["Version"]

        self._session = None
        self._setup_handlers()
        self._setup_prompts()

    def send_log(self, level: str, message: str):
        """通过MCP发送日志消息和写入stderr

        Args:
            level: 日志级别 (debug/info/notice/warning/error/critical/alert/emergency)
            message: 日志内容
        """
        # 本地stderr日志
        self.logger(level, message)

        # MCP日志通知
        if hasattr(self.server, 'session') and self.server.session:
            try:
                self.server.session.send_log_message(
                    level=level,
                    data=message

            except Exception as e:
                self.logger("error", f"Failed to send MCP log message: {str(e)}")

    def _setup_prompts(self):
        """Setup prompts handlers"""
        @self.server.list_prompts()
        async def handle_list_prompts() -> list[types.Prompt]:
            """Handle prompts/list request"""
            try:
                self.send_log(LOG_LEVEL_DEBUG, "Handling list_prompts request")
                return []
            except Exception as e:
                self.send_log(LOG_LEVEL_ERROR, f"Error in list_prompts: {str(e)}")
                raise

    def _get_config_or_raise(self, connection: str) -> dict:
        """读取配置文件并验证连接配置

        Args:
            connection: 连接名称

        Returns:
            dict: 连接配置

        Raises:
            ConfigurationError: 如果配置文件格式不正确或连接不存在
        """
        with open(self.config_path, 'r') as f:
            config = yaml.safe_load(f)
            if not config or 'connections' not in config:
                raise ConfigurationError("Configuration file must contain 'connections' section")
            if connection not in config['connections']:
                available_connections = list(config['connections'].keys())
                raise ConfigurationError(f"Connection not found: {connection}. Available connections: {available_connections}")

            db_config = config['connections'][connection]

            if 'type' not in db_config:
                raise ConfigurationError("Database configuration must include 'type' field")

            return db_config

    def _create_handler_for_type(self, db_type: str, connection: str) -> ConnectionHandler:
        """基于数据库类型创建相应的处理器

        Args:
            db_type: 数据库类型
            connection: 连接名称

        Returns:
            ConnectionHandler: 数据库连接处理器

        Raises:
            ConfigurationError: 如果数据库类型不支持或导入失败
        """
        self.send_log(LOG_LEVEL_DEBUG, f"Creating handler for database type: {db_type}")

        try:
            if db_type == 'sqlite':
                from .sqlite.handler import SQLiteHandler
                return SQLiteHandler(self.config_path, connection, self.debug)
            elif db_type == 'postgres':
                from .postgres.handler import PostgreSQLHandler
                return PostgreSQLHandler(self.config_path, connection, self.debug)
            elif db_type == 'mysql':
                from .mysql.handler import MySQLHandler
                return MySQLHandler(self.config_path, connection, self.debug)
            else:
                raise ConfigurationError(f"Unsupported database type: {db_type}")
        except ImportError as e:
            # 捕获导入错误并转换为ConfigurationError，以保持与现有测试兼容
            raise ConfigurationError(f"Failed to import handler for {db_type}: {str(e)}")

    @asynccontextmanager
    async def get_handler(self, connection: str) -> AsyncContextManager[ConnectionHandler]:
        """Get connection handler

        Get appropriate connection handler based on connection name

        Args:
            connection: str = DATABASE_CONNECTION_NAME

        Returns:
            AsyncContextManager[ConnectionHandler]: Context manager for connection handler
        """
        # Read configuration file and validate connection
        db_config = self._get_config_or_raise(connection)

        # Create appropriate handler based on database type
        handler = None
        try:
            db_type = db_config['type']
            handler = self._create_handler_for_type(db_type, connection)

            # Set session for MCP logging
            if hasattr(self.server, 'session'):
                handler._session = self.server.session

            handler.stats.record_connection_start()
            self.send_log(LOG_LEVEL_DEBUG, f"Handler created successfully for {connection}")

            yield handler
        finally:
            if handler:
                self.send_log(LOG_LEVEL_DEBUG, f"Cleaning up handler for {connection}")
                handler.stats.record_connection_end()

                if hasattr(handler, 'cleanup') and callable(handler.cleanup):
                    await handler.cleanup()

    def _get_available_tools(self) -> list[types.Tool]:
        """返回所有可用的数据库工具列表

        Returns:
            list[types.Tool]: 工具列表
        """
        return [
            types.Tool(
                name="dbutils-run-query",
                description="Execute read-only SQL query on database connection",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "sql": {
                            "type": "string",
                            "description": "SQL query (SELECT only)"


                    "required": ["connection", "sql"]


            types.Tool(
                name="dbutils-list-tables",
                description="List all available tables in the specified database connection",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME


                    "required": ["connection"]


            types.Tool(
                name="dbutils-describe-table",
                description="Get detailed information about a table's structure",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "table": {
                            "type": "string",
                            "description": "Table name to describe"


                    "required": ["connection", "table"]


            types.Tool(
                name="dbutils-get-ddl",
                description="Get DDL statement for creating the table",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "table": {
                            "type": "string",
                            "description": "Table name to get DDL for"


                    "required": ["connection", "table"]


            types.Tool(
                name="dbutils-list-indexes",
                description="List all indexes on the specified table",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "table": {
                            "type": "string",
                            "description": "Table name to list indexes for"


                    "required": ["connection", "table"]


            types.Tool(
                name="dbutils-get-stats",
                description="Get table statistics like row count and size",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "table": {
                            "type": "string",
                            "description": "Table name to get statistics for"


                    "required": ["connection", "table"]


            types.Tool(
                name="dbutils-list-constraints",
                description="List all constraints (primary key, foreign keys, etc) on the table",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "table": {
                            "type": "string",
                            "description": "Table name to list constraints for"


                    "required": ["connection", "table"]


            types.Tool(
                name="dbutils-explain-query",
                description="Get execution plan for a SQL query",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "sql": {
                            "type": "string",
                            "description": "SQL query to explain"


                    "required": ["connection", "sql"]


            types.Tool(
                name="dbutils-get-performance",
                description="Get database performance statistics",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME


                    "required": ["connection"]


            types.Tool(
                name="dbutils-analyze-query",
                description="Analyze a SQL query for performance",
                inputSchema={
                    "type": "object",
                    "properties": {
                        "connection": {
                            "type": "string",
                            "description": DATABASE_CONNECTION_NAME

                        "sql": {
                            "type": "string",
                            "description": "SQL query to analyze"


                    "required": ["connection", "sql"]




    async def _handle_list_tables(self, connection: str) -> list[types.TextContent]:
        """处理列表表格工具调用

        Args:
            connection: 数据库连接名称

        Returns:
            list[types.TextContent]: 表格列表
        """
        async with self.get_handler(connection) as handler:
            tables = await handler.get_tables()
            if not tables:
                # 空表列表的情况也返回数据库类型
                return [types.TextContent(type="text", text=f"[{handler.db_type}] No tables found")]

            formatted_tables = "\n".join([
                f"Table: {table.name}\n" +
                f"URI: {table.uri}\n" +
                (f"Description: {table.description}\n" if table.description else "") +
                "---"
                for table in tables

            # 添加数据库类型前缀
            return [types.TextContent(type="text", text=f"[{handler.db_type}]\n{formatted_tables}")]

    async def _handle_run_query(self, connection: str, sql: str) -> list[types.TextContent]:
        """处理运行查询工具调用

        Args:
            connection: 数据库连接名称
            sql: SQL查询语句

        Returns:
            list[types.TextContent]: 查询结果

        Raises:
            ConfigurationError: 如果SQL为空或非SELECT语句
        """
        if not sql:
            raise ConfigurationError(EMPTY_QUERY_ERROR)

        # Only allow SELECT statements
        if not sql.lower().startswith("select"):
            raise ConfigurationError(SELECT_ONLY_ERROR)

        async with self.get_handler(connection) as handler:
            result = await handler.execute_query(sql)
            return [types.TextContent(type="text", text=result)]

    async def _handle_table_tools(self, name: str, connection: str, table: str) -> list[types.TextContent]:
        """处理表相关工具调用

        Args:
            name: 工具名称
            connection: 数据库连接名称
            table: 表名

        Returns:
            list[types.TextContent]: 工具执行结果

        Raises:
            ConfigurationError: 如果表名为空
        """
        if not table:
            raise ConfigurationError(EMPTY_TABLE_NAME_ERROR)

        async with self.get_handler(connection) as handler:
            result = await handler.execute_tool_query(name, table_name=table)
            return [types.TextContent(type="text", text=result)]

    async def _handle_explain_query(self, connection: str, sql: str) -> list[types.TextContent]:
        """处理解释查询工具调用

        Args:
            connection: 数据库连接名称
            sql: SQL查询语句

        Returns:
            list[types.TextContent]: 查询解释

        Raises:
            ConfigurationError: 如果SQL为空
        """
        if not sql:
            raise ConfigurationError(EMPTY_QUERY_ERROR)

        async with self.get_handler(connection) as handler:
            result = await handler.execute_tool_query("dbutils-explain-query", sql=sql)
            return [types.TextContent(type="text", text=result)]

    async def _handle_performance(self, connection: str) -> list[types.TextContent]:
        """处理性能统计工具调用

        Args:
            connection: 数据库连接名称

        Returns:
            list[types.TextContent]: 性能统计
        """
        async with self.get_handler(connection) as handler:
            performance_stats = handler.stats.get_performance_stats()
            return [types.TextContent(type="text", text=f"[{handler.db_type}]\n{performance_stats}")]

    async def _handle_analyze_query(self, connection: str, sql: str) -> list[types.TextContent]:
        """处理查询分析工具调用

        Args:
            connection: 数据库连接名称
            sql: SQL查询语句

        Returns:
            list[types.TextContent]: 查询分析结果

        Raises:
            ConfigurationError: 如果SQL为空
        """
        if not sql:
            raise ConfigurationError(EMPTY_QUERY_ERROR)

        async with self.get_handler(connection) as handler:
            # First get the execution plan
            explain_result = await handler.explain_query(sql)

            # Then execute the actual query to measure performance
            start_time = datetime.now()
            if sql.lower().startswith("select"):

                    await handler.execute_query(sql)
                except Exception as e:
                    # If query fails, we still provide the execution plan
                    self.send_log(LOG_LEVEL_ERROR, f"Query execution failed during analysis: {str(e)}")
            duration = (datetime.now() - start_time).total_seconds()

            # Combine analysis results
            analysis = [
                f"[{handler.db_type}] Query Analysis",
                f"SQL: {sql}",

                f"Execution Time: {duration*1000:.2f}ms",

                "Execution Plan:",
                explain_result


            # Add optimization suggestions
            suggestions = self._get_optimization_suggestions(explain_result, duration)
            if suggestions:
                analysis.append("\nOptimization Suggestions:")
                analysis.extend(suggestions)

            return [types.TextContent(type="text", text="\n".join(analysis))]

    def _get_optimization_suggestions(self, explain_result: str, duration: float) -> list[str]:
        """根据执行计划和耗时获取优化建议

        Args:
            explain_result: 执行计划
            duration: 查询耗时（秒）

        Returns:
            list[str]: 优化建议列表
        """
        suggestions = []
        if "seq scan" in explain_result.lower() and duration > 0.1:
            suggestions.append("- Consider adding an index to avoid sequential scan")
        if "hash join" in explain_result.lower() and duration > 0.5:
            suggestions.append("- Consider optimizing join conditions")
        if duration > 0.5:  # 500ms
            suggestions.append("- Query is slow, consider optimizing or adding caching")
        if "temporary" in explain_result.lower():
            suggestions.append("- Query creates temporary tables, consider restructuring")

        return suggestions

    def _setup_handlers(self):
        """Setup MCP handlers"""
        @self.server.list_resources()
        async def handle_list_resources(arguments: dict | None = None) -> list[types.Resource]:
            if not arguments or 'connection' not in arguments:
                # Return empty list when no connection specified
                return []

            connection = arguments['connection']
            async with self.get_handler(connection) as handler:
                return await handler.get_tables()

        @self.server.read_resource()
        async def handle_read_resource(uri: str, arguments: dict | None = None) -> str:
            if not arguments or 'connection' not in arguments:
                raise ConfigurationError(CONNECTION_NAME_REQUIRED_ERROR)

            parts = uri.split('/')
            if len(parts) < 3:
                raise ConfigurationError(INVALID_URI_FORMAT_ERROR)

            connection = arguments['connection']
            table_name = parts[-2]  # URI format: xxx/table_name/schema

            async with self.get_handler(connection) as handler:
                return await handler.get_schema(table_name)

        @self.server.list_tools()
        async def handle_list_tools() -> list[types.Tool]:
            return self._get_available_tools()

        @self.server.call_tool()
        async def handle_call_tool(name: str, arguments: dict) -> list[types.TextContent]:
            if "connection" not in arguments:
                raise ConfigurationError(CONNECTION_NAME_REQUIRED_ERROR)

            connection = arguments["connection"]

            if name == "dbutils-list-tables":
                return await self._handle_list_tables(connection)
            elif name == "dbutils-run-query":
                sql = arguments.get("sql", "").strip()
                return await self._handle_run_query(connection, sql)
            elif name in ["dbutils-describe-table", "dbutils-get-ddl", "dbutils-list-indexes",
                         "dbutils-get-stats", "dbutils-list-constraints"]:
                table = arguments.get("table", "").strip()
                return await self._handle_table_tools(name, connection, table)
            elif name == "dbutils-explain-query":
                sql = arguments.get("sql", "").strip()
                return await self._handle_explain_query(connection, sql)
            elif name == "dbutils-get-performance":
                return await self._handle_performance(connection)
            elif name == "dbutils-analyze-query":
                sql = arguments.get("sql", "").strip()
                return await self._handle_analyze_query(connection, sql)
            else:
                raise ConfigurationError(f"Unknown tool: {name}")

    async def run(self):
        """Run server"""
        async with mcp.server.stdio.stdio_server() as streams:
            await self.server.run(
                streams[0],
                streams[1],
                self.server.create_initialization_options()