Voice Generation MCP Server

MIT License

Overview InspectNew Endpoints Schema Related Servers Reviews Score

voice-gen-mcp

server.py•7.07 kB

#!/usr/bin/env python3
"""
MCP Server for Voice Generation using Minimax AI API.
Provides tools to generate speech from text and upload to S3.
"""

import os
import sys
import logging
import uuid
from datetime import datetime, timedelta

from fastmcp import FastMCP, Context
from fastmcp.server.auth.providers.jwt import StaticTokenVerifier
from dotenv import load_dotenv
import boto3
from botocore.exceptions import ClientError, NoCredentialsError

# Import voice generation components
from config import load_config
from voice_generator import VoiceGenerator, VoiceGeneratorError

# Configure logging to stderr (required for MCP servers)
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
    handlers=[logging.StreamHandler(sys.stderr)]
)
logger = logging.getLogger(__name__)

# Load environment variables
load_dotenv()

# Module-level service handles; populated by initialize_services().
voice_generator = None
s3_client = None
config = None


def initialize_services():
    """Initialize the voice generator and S3 client with configuration.

    Populates the module-level ``config``, ``voice_generator`` and
    ``s3_client`` globals.

    Raises:
        Exception: Any error from loading the configuration or building the
            clients is logged and re-raised unchanged.
    """
    global voice_generator, s3_client, config

    try:
        config = load_config()
        voice_generator = VoiceGenerator(config)

        # Initialize S3 client
        s3_config = config.get('s3', {})
        s3_client = boto3.client(
            's3',
            region_name=s3_config['region'],
            aws_access_key_id=s3_config['access_key_id'],
            aws_secret_access_key=s3_config['secret_access_key'],
            endpoint_url=s3_config.get('endpoint_url', 'https://s3.amazonaws.com')
        )

        logger.info("Voice generator and S3 client initialized successfully")
    except Exception as e:
        logger.error(f"Failed to initialize services: {e}")
        raise


# Initialize FastMCP server
mcp = FastMCP("voice-gen")

# Bearer-token auth is enabled only when the token variable is present.
auth_token = os.getenv("VOICE_GEN_MCP_AUTH_TOKEN")
if auth_token is not None:
    mcp.auth = StaticTokenVerifier(
        tokens={
            auth_token: {
                "client_id": "default",
                "scopes": ["read:data", "write:data", "admin:users"]
            }
        },
        required_scopes=["read:data", "write:data"],
    )


def upload_to_s3(audio_data: bytes, filename: str) -> str:
    """Upload audio data to S3 and return the public URL.

    The object key has the form
    ``{prefix}{Year}/{Month}/{Day}_{unique_id}_{filename}``.

    Args:
        audio_data: Raw audio bytes to store (uploaded as ``audio/mpeg``).
        filename: Base file name appended to the generated key.

    Returns:
        The URL built from the configured ``public_url_base`` and the key.

    Raises:
        Exception: If S3 rejects the request or credentials are missing. The
            underlying botocore error is attached as ``__cause__``.
    """
    try:
        s3_config = config.get('s3', {})
        bucket_name = s3_config['bucket_name']
        prefix = s3_config.get('prefix', 'voice-gen/')
        public_url_base = s3_config.get(
            'public_url_base',
            f'https://{bucket_name}.s3.{s3_config["region"]}.amazonaws.com'
        )

        # Generate directory structure: Year/Month/Day_{unique_id}_{filename}
        now = datetime.now()
        year = now.strftime("%Y")
        month = now.strftime("%m")
        day = now.strftime("%d")
        unique_id = str(uuid.uuid4())[:8]

        # Create S3 key with new format: prefix/Year/Month/Day_{unique_id}_{filename}
        s3_key = f"{prefix}{year}/{month}/{day}_{unique_id}_{filename}"

        # Calculate expiration date (30 days from now)
        expiration_date = now + timedelta(days=30)

        # NOTE: `Expires` only sets the HTTP Expires (cache) header and the
        # metadata entries are informational; neither deletes the object.
        # Actual removal after 30 days requires a bucket lifecycle rule.
        s3_client.put_object(
            Bucket=bucket_name,
            Key=s3_key,
            Body=audio_data,
            ContentType='audio/mpeg',
            Metadata={
                'expiration-date': expiration_date.isoformat(),
                'created-date': now.isoformat(),
                'unique-id': unique_id
            },
            Expires=expiration_date
        )

        # Generate public URL; tolerate a configured base that ends with "/"
        # so the result never contains a double slash before the key.
        public_url = f"{public_url_base.rstrip('/')}/{s3_key}"

        logger.info(f"Audio uploaded to S3: {s3_key} (expires: {expiration_date.strftime('%Y-%m-%d %H:%M:%S')})")
        return public_url

    except ClientError as e:
        error_msg = f"S3 upload error: {e}"
        logger.error(error_msg)
        # Chain the cause so the original botocore traceback is preserved.
        raise Exception(error_msg) from e
    except NoCredentialsError as e:
        error_msg = "S3 credentials not found"
        logger.error(error_msg)
        raise Exception(error_msg) from e


async def _notify_client_error(ctx, message: str) -> None:
    """Best-effort forwarding of an error message to the MCP client.

    A failure to deliver the notification is logged and swallowed so it can
    never replace the error message the tool is about to return.
    """
    if not ctx:
        return
    try:
        await ctx.error(message)
    except Exception:
        logger.debug("Could not forward error to MCP client", exc_info=True)


@mcp.tool
async def generate_voice(
    text: str,
    model: str = "speech-2.5-hd-preview",
    voice_id: str = "mylxsw_voice_1",
    speed: float = 1.0,
    ctx: Context = None
) -> str:
    """Generate speech audio from text using Minimax AI API and upload to S3.

    Args:
        text: The text to convert to speech
        model: Model to use for generation (default: speech-2.5-hd-preview)
        voice_id: Voice ID to use (default: mylxsw_voice_1)
        speed: Speech speed (default: 1.0, typically 0.5-2.0)
        ctx: FastMCP context for logging and other operations

    Returns:
        str: Success message with S3 URL or error message
    """
    try:
        if ctx:
            await ctx.info(f"Starting voice generation for text: {text[:50]}...")

        if not text.strip():
            error_msg = "Error: Text cannot be empty"
            await _notify_client_error(ctx, error_msg)
            return error_msg

        logger.info(f"Generating voice for text: {text[:50]}...")

        # Generate audio data
        # NOTE(review): this call and upload_to_s3() below are synchronous and
        # block the event loop while they run; consider offloading them to a
        # worker thread once VoiceGenerator's thread-safety is confirmed.
        audio_data = voice_generator.generate_voice(
            text=text,
            model=model,
            voice_id=voice_id,
            speed=speed
        )

        if ctx:
            await ctx.info("Voice generated successfully, uploading to S3...")

        # Generate filename (timestamp info is already in S3 path)
        filename = "voice.mp3"

        # Upload to S3
        public_url = upload_to_s3(audio_data, filename)

        file_size = len(audio_data)
        logger.info(f"Voice generated and uploaded successfully ({file_size} bytes)")

        if ctx:
            await ctx.info(f"File uploaded successfully: {public_url}")

        return f"Successfully generated voice audio and uploaded to S3.\nURL: {public_url}\nSize: {file_size} bytes"

    except VoiceGeneratorError as e:
        error_msg = f"Voice generation error: {e}"
        logger.error(error_msg)
        await _notify_client_error(ctx, error_msg)
        return error_msg
    except Exception as e:
        error_msg = f"Unexpected error: {e}"
        # logger.exception records the traceback, which is needed to diagnose
        # failures that were not anticipated.
        logger.exception(error_msg)
        await _notify_client_error(ctx, error_msg)
        return error_msg


if __name__ == "__main__":
    # Initialize services before starting the server
    try:
        initialize_services()
    except Exception as e:
        logger.error(f"Failed to initialize services: {e}")
        sys.exit(1)

    # Get server configuration
    transport_type = os.getenv('MCP_TRANSPORT', 'stdio')
    server_host = os.getenv('MCP_SERVER_HOST', '0.0.0.0')
    raw_port = os.getenv('MCP_SERVER_PORT', '8000')
    try:
        server_port = int(raw_port)
    except ValueError:
        # Fail with a clear message instead of an uncaught traceback.
        logger.error(f"Invalid MCP_SERVER_PORT value: {raw_port!r} (must be an integer)")
        sys.exit(1)

    # Start the MCP server
    if transport_type == 'http':
        logger.info(f"Starting MCP server in HTTP mode on {server_host}:{server_port}")
        mcp.run(transport='http', host=server_host, port=server_port, path='/mcp')
    elif transport_type == 'sse':
        logger.info(f"Starting MCP server in SSE mode on {server_host}:{server_port}")
        mcp.run(transport='sse', host=server_host, port=server_port)
    else:
        logger.info("Starting MCP server in STDIO mode")
        mcp.run(transport='stdio')

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/mylxsw/voice-gen-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.