# Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information # regarding copyright ownership. The ASF licenses this file # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, # software distributed under the License is distributed on an # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY # KIND, either express or implied. See the License for the # specific language governing permissions and limitations # under the License. """ Apache Doris MCP Server - Enterprise Database Service Implementation Based on Apache Doris official MCP Server architecture design, providing complete MCP protocol support Supports independent encapsulation implementation of Resources, Tools, and Prompts Supports both stdio and streamable HTTP startup modes """ import argparse import asyncio import json import logging from typing import Any from mcp.server import Server from mcp.server.models import InitializationOptions from mcp.types import ( Prompt, Resource, TextContent, Tool, ) from .tools.tools_manager import DorisToolsManager from .tools.prompts_manager import DorisPromptsManager from .tools.resources_manager import DorisResourcesManager from .utils.config import DorisConfig from .utils.db import DorisConnectionManager from .utils.security import DorisSecurityManager import os # Configure logging logging.basicConfig(level=logging.INFO) logger = logging.getLogger(__name__) # Create a default config instance for getting default values _default_config = DorisConfig() class DorisServer: """Apache Doris MCP Server main class""" def __init__(self, config: DorisConfig): self.config = config self.server = Server("doris-mcp-server") # Initialize security manager self.security_manager = DorisSecurityManager(config) # Initialize connection manager, pass in security manager self.connection_manager = DorisConnectionManager(config, self.security_manager) # Initialize independent managers self.resources_manager = DorisResourcesManager(self.connection_manager) self.tools_manager = DorisToolsManager(self.connection_manager) self.prompts_manager = DorisPromptsManager(self.connection_manager) self.logger = logging.getLogger(f"{__name__}.DorisServer") self._setup_handlers() def _setup_handlers(self): """Setup MCP protocol handlers""" @self.server.list_resources() async def handle_list_resources() -> list[Resource]: """Handle resource list request""" try: self.logger.info("Handling resource list request") resources = await self.resources_manager.list_resources() self.logger.info(f"Returning {len(resources)} resources") return resources except Exception as e: self.logger.error(f"Failed to handle resource list request: {e}") return [] @self.server.read_resource() async def handle_read_resource(uri: str) -> str: """Handle resource read request""" try: self.logger.info(f"Handling resource read request: {uri}") content = await self.resources_manager.read_resource(uri) return content except Exception as e: self.logger.error(f"Failed to handle resource read request: {e}") return json.dumps( {"error": f"Failed to read resource: {str(e)}", "uri": uri}, ensure_ascii=False, indent=2, ) @self.server.list_tools() async def handle_list_tools() -> list[Tool]: """Handle tool list request""" try: self.logger.info("Handling tool list request") tools = await self.tools_manager.list_tools() self.logger.info(f"Returning {len(tools)} tools") return tools except Exception as e: self.logger.error(f"Failed to handle tool list request: {e}") return [] @self.server.call_tool() async def handle_call_tool( name: str, arguments: dict[str, Any] ) -> list[TextContent]: """Handle tool call request""" try: self.logger.info(f"Handling tool call request: {name}") result = await self.tools_manager.call_tool(name, arguments) return [TextContent(type="text", text=result)] except Exception as e: self.logger.error(f"Failed to handle tool call request: {e}") error_result = json.dumps( { "error": f"Tool call failed: {str(e)}", "tool_name": name, "arguments": arguments, }, ensure_ascii=False, indent=2, ) return [TextContent(type="text", text=error_result)] @self.server.list_prompts() async def handle_list_prompts() -> list[Prompt]: """Handle prompt list request""" try: self.logger.info("Handling prompt list request") prompts = await self.prompts_manager.list_prompts() self.logger.info(f"Returning {len(prompts)} prompts") return prompts except Exception as e: self.logger.error(f"Failed to handle prompt list request: {e}") return [] @self.server.get_prompt() async def handle_get_prompt(name: str, arguments: dict[str, Any]) -> str: """Handle prompt get request""" try: self.logger.info(f"Handling prompt get request: {name}") result = await self.prompts_manager.get_prompt(name, arguments) return result except Exception as e: self.logger.error(f"Failed to handle prompt get request: {e}") error_result = json.dumps( { "error": f"Failed to get prompt: {str(e)}", "prompt_name": name, "arguments": arguments, }, ensure_ascii=False, indent=2, ) return error_result async def start_stdio(self): """Start stdio transport mode""" self.logger.info("Starting Doris MCP Server (stdio mode)") try: # Ensure connection manager is initialized await self.connection_manager.initialize() self.logger.info("Connection manager initialization completed") # Start stdio server - using simpler approach from mcp.server.stdio import stdio_server self.logger.info("Creating stdio_server transport...") # Try different startup approaches try: async with stdio_server() as streams: read_stream, write_stream = streams self.logger.info("stdio_server streams created successfully") # Create initialization options # MCP 1.8.0 requires parameters for get_capabilities from mcp.server.lowlevel.server import NotificationOptions capabilities = self.server.get_capabilities( notification_options=NotificationOptions( prompts_changed=True, resources_changed=True, tools_changed=True ), experimental_capabilities={} ) init_options = InitializationOptions( server_name="doris-mcp-server", server_version=os.getenv("SERVER_VERSION", _default_config.server_version), capabilities=capabilities, ) self.logger.info("Initialization options created successfully") # Run server self.logger.info("Starting to run MCP server...") await self.server.run(read_stream, write_stream, init_options) except Exception as inner_e: self.logger.error(f"stdio_server internal error: {inner_e}") self.logger.error(f"Error type: {type(inner_e)}") # Try to get more error information import traceback self.logger.error("Complete error stack:") self.logger.error(traceback.format_exc()) # If it's ExceptionGroup, try to parse if hasattr(inner_e, 'exceptions'): self.logger.error(f"ExceptionGroup contains {len(inner_e.exceptions)} exceptions:") for i, exc in enumerate(inner_e.exceptions): self.logger.error(f" Exception {i+1}: {type(exc).__name__}: {exc}") raise inner_e except Exception as e: self.logger.error(f"stdio server startup failed: {e}") self.logger.error(f"Error type: {type(e)}") raise async def start_http(self, host: str = os.getenv("SERVER_HOST", _default_config.database.host), port: int = os.getenv("SERVER_PORT", _default_config.server_port)): """Start Streamable HTTP transport mode""" self.logger.info(f"Starting Doris MCP Server (Streamable HTTP mode) - {host}:{port}") try: # Ensure connection manager is initialized await self.connection_manager.initialize() # Use Starlette and StreamableHTTPSessionManager according to official example import uvicorn import contextlib from collections.abc import AsyncIterator from mcp.server.streamable_http_manager import StreamableHTTPSessionManager from starlette.applications import Starlette from starlette.routing import Route from starlette.responses import JSONResponse, Response from starlette.types import Scope # Create session manager session_manager = StreamableHTTPSessionManager( app=self.server, json_response=True, # Enable JSON response stateless=False # Maintain session state ) self.logger.info(f"StreamableHTTP session manager created, will start at http://{host}:{port}") # Health check endpoint async def health_check(request): return JSONResponse({"status": "healthy", "service": "doris-mcp-server"}) # Lifecycle manager - simplified since we manage session_manager externally @contextlib.asynccontextmanager async def lifespan(app: Starlette) -> AsyncIterator[None]: """Context manager for managing application lifecycle""" self.logger.info("Application started!") try: yield finally: self.logger.info("Application is shutting down...") # Create ASGI application - use direct session manager as ASGI app starlette_app = Starlette( debug=True, routes=[ Route("/health", health_check, methods=["GET"]), ], lifespan=lifespan, ) # Custom ASGI app that handles both /mcp and /mcp/ without redirects async def mcp_app(scope, receive, send): # Handle lifespan events if scope["type"] == "lifespan": await starlette_app(scope, receive, send) return # Handle HTTP requests if scope["type"] == "http": path = scope.get("path", "") self.logger.info(f"Received request for path: {path}") try: # Handle health check if path.startswith("/health"): await starlette_app(scope, receive, send) return # Handle MCP requests - both /mcp and /mcp/ go to session manager if path == "/mcp" or path.startswith("/mcp/"): self.logger.info(f"Handling MCP request for path: {path}") # Log request details for debugging method = scope.get("method", "UNKNOWN") headers = dict(scope.get("headers", [])) self.logger.info(f"MCP Request - Method: {method}") self.logger.info(f"MCP Request - Headers: {headers}") # Handle Dify compatibility for GET requests if method == "GET": accept_header = headers.get(b'accept', b'').decode('utf-8') user_agent = headers.get(b'user-agent', b'').decode('utf-8') # For other GET requests, try to add application/json to Accept header if 'text/event-stream' in accept_header and 'application/json' not in accept_header: self.logger.info("Adding application/json to Accept header for GET request") # Modify headers to include both content types new_headers = [] for name, value in scope.get("headers", []): if name == b'accept': # Add application/json to the accept header new_value = value.decode('utf-8') + ', application/json' new_headers.append((name, new_value.encode('utf-8'))) else: new_headers.append((name, value)) # Update scope with modified headers scope = dict(scope) scope["headers"] = new_headers self.logger.info(f"Modified Accept header to: {new_value}") await session_manager.handle_request(scope, receive, send) return # 404 for other paths self.logger.info(f"Path not found: {path}") response = Response("Not Found", status_code=404) await response(scope, receive, send) except Exception as e: self.logger.error(f"Error handling request for {path}: {e}") import traceback self.logger.error(traceback.format_exc()) response = Response("Internal Server Error", status_code=500) await response(scope, receive, send) else: # For other scope types, just return self.logger.warning(f"Unsupported scope type: {scope['type']}") return # Start uvicorn server with session manager lifecycle config = uvicorn.Config( app=mcp_app, host=host, port=port, log_level="info" ) server = uvicorn.Server(config) # Run session manager and server together async with session_manager.run(): self.logger.info("Session manager started, now starting HTTP server") await server.serve() except Exception as e: self.logger.error(f"Streamable HTTP server startup failed: {e}") import traceback self.logger.error("Complete error stack:") self.logger.error(traceback.format_exc()) # If it's ExceptionGroup, try to parse if hasattr(e, 'exceptions'): self.logger.error(f"ExceptionGroup contains {len(e.exceptions)} exceptions:") for i, exc in enumerate(e.exceptions): self.logger.error(f" Exception {i+1}: {type(exc).__name__}: {exc}") raise async def shutdown(self): """Shutdown server""" self.logger.info("Shutting down Doris MCP Server") try: await self.connection_manager.close() self.logger.info("Doris MCP Server has been shut down") except Exception as e: self.logger.error(f"Error occurred while shutting down server: {e}") def create_arg_parser(): """Create command line argument parser""" parser = argparse.ArgumentParser( description="Apache Doris MCP Server - Enterprise Database Service", formatter_class=argparse.RawDescriptionHelpFormatter, epilog=""" Transport Modes: stdio - Standard input/output (for local process communication) http - Streamable HTTP mode (MCP 2025-03-26 protocol) Examples: python -m doris_mcp_server --transport stdio python -m doris_mcp_server --transport http --host 0.0.0.0 --port 3000 """ ) parser.add_argument( "--transport", type=str, choices=["stdio", "http"], default=os.getenv("TRANSPORT", _default_config.transport), help=f"Transport protocol type: stdio (local), http (Streamable HTTP) (default: {_default_config.transport})", ) parser.add_argument( "--host", type=str, default=os.getenv("SERVER_HOST", _default_config.database.host), help=f"Host address for HTTP mode (default: {_default_config.database.host})", ) parser.add_argument( "--port", type=int, default=os.getenv("SERVER_PORT", _default_config.server_port), help=f"Port number for HTTP mode (default: {_default_config.server_port})" ) parser.add_argument( "--db-host", type=str, default=os.getenv("DB_HOST", _default_config.database.host), help=f"Doris database host address (default: {_default_config.database.host})", ) parser.add_argument( "--db-port", type=int, default=os.getenv("DB_PORT", _default_config.database.port), help=f"Doris database port number (default: {_default_config.database.port})" ) parser.add_argument( "--db-user", type=str, default=os.getenv("DB_USER", _default_config.database.user), help=f"Doris database username (default: {_default_config.database.user})" ) parser.add_argument("--db-password", type=str, default="", help="Doris database password") parser.add_argument( "--db-database", type=str, default=os.getenv("DB_DATABASE", _default_config.database.database), help=f"Doris database name (default: {_default_config.database.database})", ) parser.add_argument( "--log-level", type=str, choices=["DEBUG", "INFO", "WARNING", "ERROR"], default=os.getenv("LOG_LEVEL", _default_config.logging.level), help=f"Log level (default: {_default_config.logging.level})", ) return parser async def main(): """Main function""" parser = create_arg_parser() args = parser.parse_args() # Set log level logging.getLogger().setLevel(getattr(logging, args.log_level)) # Create configuration - priority: command line arguments > .env file > default values config = DorisConfig.from_env() # First load from .env file and environment variables # Command line arguments override configuration (if provided) if args.db_host != _default_config.database.host: # If not default value, use command line argument config.database.host = args.db_host if args.db_port != _default_config.database.port: config.database.port = args.db_port if args.db_user != _default_config.database.user: config.database.user = args.db_user if args.db_password: # Use password if provided config.database.password = args.db_password if args.db_database != _default_config.database.database: config.database.database = args.db_database if args.log_level != _default_config.logging.level: config.logging.level = args.log_level # Create server instance server = DorisServer(config) try: if args.transport == "stdio": await server.start_stdio() elif args.transport == "http": await server.start_http(args.host, args.port) else: logger.error(f"Unsupported transport protocol: {args.transport}") await server.shutdown() return 1 except KeyboardInterrupt: logger.info("Received interrupt signal, shutting down server...") except Exception as e: logger.error(f"Server runtime error: {e}") # Clean up resources even in case of exception try: await server.shutdown() except Exception as shutdown_error: logger.error(f"Error occurred while shutting down server: {shutdown_error}") return 1 finally: # Cleanup in case of normal shutdown try: await server.shutdown() except Exception as shutdown_error: logger.error(f"Error occurred while shutting down server: {shutdown_error}") return 0 def main_sync(): """Synchronous main function for entry point""" exit_code = asyncio.run(main()) exit(exit_code) if __name__ == "__main__": main_sync()