generate_speech

Convert text to speech with customizable options like emotion, pitch, speed, and voice selection using the Minimax MCP Tools API. Save audio files in multiple formats for diverse use cases.

Input Schema

| Name | Required | Description |
| --- | --- | --- |
| bitrate | No | Bitrate of the generated audio (MP3 only) |
| channel | No | Number of audio channels (1 = mono, 2 = stereo) |
| emotion | No | Emotion of the speech |
| format | No | Audio format |
| languageBoost | No | Enhance recognition of specific languages |
| latexRead | No | Whether to read LaTeX formulas aloud |
| model | No | Model version to use for speech generation. speech-02-hd is the newest high-definition model with better quality and naturalness; speech-02-turbo offers excellent performance with low latency. |
| outputFile | Yes | Absolute path to save the generated audio file |
| pitch | No | Speech pitch (-12 to 12) |
| pronunciationDict | No | List of pronunciation replacements |
| sampleRate | No | Sample rate of the generated audio |
| speed | No | Speech speed (0.5-2.0) |
| stream | No | Whether to use streaming mode |
| subtitleEnable | No | Whether to enable subtitle generation |
| text | Yes | Text to convert to speech |
| timberWeights | No | Voice timbre weights for voice mixing |
| voiceId | No | Voice ID to use (see the list of available voices below) |
| volume | No | Speech volume (0.1-10.0) |

Available voice IDs:

- Male voices: male-qn-qingse (innocent youth), male-qn-jingying (elite youth), male-qn-badao (domineering youth), male-qn-daxuesheng (young college student)
- Female voices: female-shaonv (young girl), female-yujie (mature "yujie"), female-chengshu (mature woman), female-tianmei (sweet woman)
- Presenters: presenter_male (male host), presenter_female (female host)
- Audiobooks: audiobook_male_1 (male audiobook 1), audiobook_male_2 (male audiobook 2), audiobook_female_1 (female audiobook 1), audiobook_female_2 (female audiobook 2)
- Beta voices: male-qn-qingse-jingpin (innocent youth, beta), male-qn-jingying-jingpin (elite youth, beta), male-qn-badao-jingpin (domineering youth, beta), male-qn-daxuesheng-jingpin (young college student, beta), female-shaonv-jingpin (young girl, beta), female-yujie-jingpin (yujie, beta), female-chengshu-jingpin (mature woman, beta), female-tianmei-jingpin (sweet woman, beta)
- Character voices: clever_boy (clever boy), cute_boy (cute boy), lovely_girl (adorable girl), cartoon_pig (cartoon pig Xiaoqi), bingjiao_didi (yandere little brother), junlang_nanyou (handsome boyfriend), chunzhen_xuedi (innocent male junior), lengdan_xiongzhang (aloof senior), badao_shaoye (domineering young master), tianxin_xiaoling (sweetheart Xiaoling), qiaopi_mengmei (playful cute girl), wumei_yujie (seductive yujie), diadia_xuemei (coquettish female junior), danya_xuejie (elegant female senior)
- Western characters: Santa_Claus, Grinch, Rudolph, Arnold, Charming_Santa, Charming_Lady, Sweet_Girl, Cute_Elf, Attractive_Girl, Serene_Woman
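For orientation, a hypothetical invocation might supply only the required fields plus a few overrides. All values here are illustrative, not server defaults:

```typescript
// Hypothetical example parameters for generate_speech (field names from the schema above).
const params = {
  text: "Hello, world! <#0.50#> Welcome to the demo.", // pause marker: 0.5 s between phrases
  outputFile: "/tmp/hello.mp3",                        // must be an absolute path
  voiceId: "female-shaonv",                            // one of the voice IDs listed above
  speed: 1.2,                                          // allowed range 0.5-2.0
  pitch: -2,                                           // allowed range -12 to 12 semitones
  emotion: "happy",
  format: "mp3",
};
```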

Implementation Reference

  • Core handler function implementing text-to-speech generation: constructs the API payload, sends a POST request to the Minimax TTS endpoint, and processes the response, saving the audio file to disk.

    ```typescript
    async generateSpeech(params: TextToSpeechParams): Promise<TTSResult> {
      try {
        // Build API payload (MCP handles validation)
        const payload = this.buildPayload(params);

        // Make API request
        const response = await this.post(API_CONFIG.ENDPOINTS.TEXT_TO_SPEECH, payload) as TTSResponse;

        // Process response
        return await this.processTTSResponse(response, params);
      } catch (error: any) {
        const processedError = ErrorHandler.handleAPIError(error);
        ErrorHandler.logError(processedError, { service: 'tts', params });
        // Throw the error so the task manager can properly mark it as failed
        throw processedError;
      }
    }
    ```
  • Input schema (Zod) defining parameters for the generateSpeech tool, including text, voice settings, audio format, and optional voice modifications.

    ```typescript
    export const textToSpeechSchema = z.object({
      text: z.string()
        .min(1, 'Text is required')
        .max(CONSTRAINTS.TTS.TEXT_MAX_LENGTH, `Text to convert to speech. Max ${CONSTRAINTS.TTS.TEXT_MAX_LENGTH} characters. Use newlines for paragraph breaks. For custom pauses, insert <#x#> where x is seconds (0.01-99.99, max 2 decimals). Pause markers must be between pronounceable text and cannot be consecutive`),
      outputFile: filePathSchema.describe('Absolute path for audio file'),
      highQuality: z.boolean()
        .default(false)
        .describe('Use high-quality model (speech-02-hd) for audiobooks/premium content. Default: false (uses faster speech-02-turbo)'),
      voiceId: z.enum(Object.keys(VOICES) as [VoiceId, ...VoiceId[]])
        .default('female-shaonv' as VoiceId)
        .describe(`Voice ID for speech generation. Available voices: ${Object.keys(VOICES).map(id => `${id} (${VOICES[id as VoiceId]?.name || id})`).join(', ')}`),
      speed: z.number()
        .min(CONSTRAINTS.TTS.SPEED_MIN)
        .max(CONSTRAINTS.TTS.SPEED_MAX)
        .default(1.0)
        .describe(`Speech speed multiplier (${CONSTRAINTS.TTS.SPEED_MIN}-${CONSTRAINTS.TTS.SPEED_MAX}). Higher values = faster speech`),
      volume: z.number()
        .min(CONSTRAINTS.TTS.VOLUME_MIN)
        .max(CONSTRAINTS.TTS.VOLUME_MAX)
        .default(1.0)
        .describe(`Audio volume level (${CONSTRAINTS.TTS.VOLUME_MIN}-${CONSTRAINTS.TTS.VOLUME_MAX}). Higher values = louder audio`),
      pitch: z.number()
        .min(CONSTRAINTS.TTS.PITCH_MIN)
        .max(CONSTRAINTS.TTS.PITCH_MAX)
        .default(0)
        .describe(`Pitch adjustment in semitones (${CONSTRAINTS.TTS.PITCH_MIN} to ${CONSTRAINTS.TTS.PITCH_MAX}). Negative = lower pitch, Positive = higher pitch`),
      emotion: z.enum(CONSTRAINTS.TTS.EMOTIONS as readonly [Emotion, ...Emotion[]])
        .default('neutral' as Emotion)
        .describe(`Emotional tone of the speech. Options: ${CONSTRAINTS.TTS.EMOTIONS.join(', ')}`),
      format: z.enum(CONSTRAINTS.TTS.FORMATS as readonly [AudioFormat, ...AudioFormat[]])
        .default('mp3' as AudioFormat)
        .describe(`Output audio format. Options: ${CONSTRAINTS.TTS.FORMATS.join(', ')}`),
      sampleRate: z.enum(CONSTRAINTS.TTS.SAMPLE_RATES as readonly [SampleRate, ...SampleRate[]])
        .default("32000" as SampleRate)
        .describe(`Audio sample rate in Hz. Options: ${CONSTRAINTS.TTS.SAMPLE_RATES.join(', ')}`),
      bitrate: z.enum(CONSTRAINTS.TTS.BITRATES as readonly [Bitrate, ...Bitrate[]])
        .default("128000" as Bitrate)
        .describe(`Audio bitrate in bps. Options: ${CONSTRAINTS.TTS.BITRATES.join(', ')}`),
      languageBoost: z.string()
        .default('auto')
        .describe('Enhance recognition for specific languages/dialects. Options: Chinese, Chinese,Yue, English, Arabic, Russian, Spanish, French, Portuguese, German, Turkish, Dutch, Ukrainian, Vietnamese, Indonesian, Japanese, Italian, Korean, Thai, Polish, Romanian, Greek, Czech, Finnish, Hindi, Bulgarian, Danish, Hebrew, Malay, Persian, Slovak, Swedish, Croatian, Filipino, Hungarian, Norwegian, Slovenian, Catalan, Nynorsk, Tamil, Afrikaans, auto. Use "auto" for automatic detection'),
      intensity: z.number()
        .int()
        .min(CONSTRAINTS.TTS.VOICE_MODIFY_INTENSITY_MIN)
        .max(CONSTRAINTS.TTS.VOICE_MODIFY_INTENSITY_MAX)
        .optional()
        .describe('Voice intensity adjustment (-100 to 100). Values closer to -100 make the voice more robust, closer to 100 make it softer'),
      timbre: z.number()
        .int()
        .min(CONSTRAINTS.TTS.VOICE_MODIFY_TIMBRE_MIN)
        .max(CONSTRAINTS.TTS.VOICE_MODIFY_TIMBRE_MAX)
        .optional()
        .describe('Voice timbre adjustment (-100 to 100). Values closer to -100 make the voice more mellow, closer to 100 make it more crisp'),
      sound_effects: z.enum(CONSTRAINTS.TTS.SOUND_EFFECTS as readonly [SoundEffect, ...SoundEffect[]])
        .optional()
        .describe(getSoundEffectsDescription())
    });
    ```
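The schema delegates its numeric bounds to CONSTRAINTS.TTS. A minimal hand-rolled sketch of the same range checks (constants assumed to match the input schema table above; Zod itself not required here):

```typescript
// Sketch of the numeric range checks the Zod schema enforces.
// The bounds are assumptions taken from the parameter table, not from CONSTRAINTS.TTS directly.
interface RangeCheck { min: number; max: number; }

const RANGES: Record<string, RangeCheck> = {
  speed:  { min: 0.5, max: 2.0 },
  volume: { min: 0.1, max: 10.0 },
  pitch:  { min: -12, max: 12 },
};

// Returns null when the value is in range, otherwise an error message.
function checkRange(name: string, value: number): string | null {
  const r = RANGES[name];
  if (!r) return `unknown parameter: ${name}`;
  return value >= r.min && value <= r.max
    ? null
    : `${name} must be between ${r.min} and ${r.max}`;
}
```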
  • Helper method to build the API payload for the Minimax TTS endpoint from input parameters, applying defaults and cleaning undefined values.

    ```typescript
    private buildPayload(params: TextToSpeechParams): TTSPayload {
      const ttsDefaults = DEFAULTS.TTS as any;

      // Map highQuality parameter to the appropriate Speech 2.6 model
      const model = (params as any).highQuality ? 'speech-2.6-hd' : 'speech-2.6-turbo';

      const payload: TTSPayload = {
        model: model,
        text: params.text,
        voice_setting: {
          voice_id: params.voiceId || ttsDefaults.voiceId,
          speed: params.speed || ttsDefaults.speed,
          vol: params.volume || ttsDefaults.volume,
          pitch: params.pitch || ttsDefaults.pitch,
          emotion: params.emotion || ttsDefaults.emotion
        },
        audio_setting: {
          sample_rate: parseInt(params.sampleRate || ttsDefaults.sampleRate),
          bitrate: parseInt(params.bitrate || ttsDefaults.bitrate),
          format: params.format || ttsDefaults.format,
          channel: ttsDefaults.channel
        }
      };

      // Add optional parameters
      if (params.languageBoost) {
        payload.language_boost = params.languageBoost;
      }

      // Add voice modify parameters if present
      if (params.intensity !== undefined || params.timbre !== undefined || params.sound_effects !== undefined) {
        payload.voice_modify = {};
        if (params.intensity !== undefined) {
          payload.voice_modify.intensity = params.intensity;
        }
        if (params.timbre !== undefined) {
          payload.voice_modify.timbre = params.timbre;
        }
        if (params.sound_effects !== undefined) {
          payload.voice_modify.sound_effects = params.sound_effects;
        }
      }

      // Voice mixing feature removed for simplicity

      // Filter out undefined values
      return this.cleanPayload(payload) as TTSPayload;
    }
    ```
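buildPayload ends by calling this.cleanPayload, which is not shown in this reference. A plausible sketch, assuming it simply drops undefined keys recursively:

```typescript
// Hypothetical stand-in for the cleanPayload helper referenced above:
// recursively remove keys whose value is undefined, so they are omitted
// from the JSON body sent to the API.
function cleanPayload<T extends Record<string, unknown>>(payload: T): Partial<T> {
  const out: Record<string, unknown> = {};
  for (const [key, value] of Object.entries(payload)) {
    if (value === undefined) continue; // drop unset parameters
    out[key] =
      value !== null && typeof value === "object" && !Array.isArray(value)
        ? cleanPayload(value as Record<string, unknown>) // clean nested settings objects
        : value;
  }
  return out as Partial<T>;
}
```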
  • Helper method to process the TTS API response: decodes hex audio data, saves it to file, and constructs the result object with metadata.

    ```typescript
    private async processTTSResponse(response: TTSResponse, params: TextToSpeechParams): Promise<TTSResult> {
      const audioHex = response.data?.audio;
      if (!audioHex) {
        throw new Error('No audio data received from API');
      }

      // Convert hex to bytes and save
      const audioBytes = Buffer.from(audioHex, 'hex');
      await FileHandler.writeFile(params.outputFile, audioBytes);

      const ttsDefaults = DEFAULTS.TTS as any;
      const result: TTSResult = {
        audioFile: params.outputFile,
        voiceUsed: params.voiceId || ttsDefaults.voiceId,
        model: (params as any).highQuality ? 'speech-2.6-hd' : 'speech-2.6-turbo',
        duration: response.data?.duration || null,
        format: params.format || ttsDefaults.format,
        sampleRate: parseInt(params.sampleRate || ttsDefaults.sampleRate),
        bitrate: parseInt(params.bitrate || ttsDefaults.bitrate)
      };

      // Subtitles feature removed for simplicity
      return result;
    }
    ```
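The decode step in processTTSResponse relies on Node's built-in hex decoding. A standalone illustration (the hex string here is a made-up four-byte sample, not real API output):

```typescript
// The API returns audio as a hex-encoded string; Buffer.from(..., "hex")
// converts it to raw bytes ready to write to disk.
const audioHex = "49443303"; // "ID3" + a version byte, as a hex string
const audioBytes = Buffer.from(audioHex, "hex");
// audioBytes now holds binary data suitable for fs.writeFile / FileHandler.writeFile
```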
  • src/index.ts:90-119 (registration)

    MCP tool registration for speech generation (named 'submit_speech_generation'), which queues the generateSpeech call via the task manager for rate limiting.

    ```typescript
    server.registerTool(
      "submit_speech_generation",
      {
        title: "Submit Speech Generation Task",
        description: "Convert text to speech asynchronously. RECOMMENDED: Submit multiple tasks in batch to saturate rate limits, then call task_barrier once to wait for all completions. Returns task ID only - actual files available after task_barrier.",
        inputSchema: textToSpeechSchema.shape
      },
      async (params: unknown): Promise<ToolResponse> => {
        try {
          const validatedParams = validateTTSParams(params);
          const { taskId } = await taskManager.submitTTSTask(async () => {
            return await ttsService.generateSpeech(validatedParams);
          });
          return { content: [{ type: "text", text: `Task ${taskId} submitted` }] };
        } catch (error: any) {
          ErrorHandler.logError(error, { tool: 'submit_speech_generation', params });
          return { content: [{ type: "text", text: `❌ Failed to submit TTS task: ${ErrorHandler.formatErrorForUser(error)}` }] };
        }
      }
    );
    ```
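The tool description recommends batching submissions and waiting once on task_barrier. That queueing pattern can be sketched with a simplified in-memory task manager (a hypothetical stand-in for the real taskManager, not its actual implementation):

```typescript
// Simplified sketch of the submit-then-barrier pattern: each submit starts
// work immediately and records the promise; barrier awaits everything at once.
class TaskManagerSketch {
  private pending: Promise<unknown>[] = [];

  submit<T>(work: () => Promise<T>): { taskId: number } {
    this.pending.push(work());          // kick off the task
    return { taskId: this.pending.length }; // sequential task IDs, for illustration
  }

  async barrier(): Promise<void> {
    await Promise.all(this.pending);    // wait for all submitted tasks
    this.pending = [];
  }
}

const tm = new TaskManagerSketch();
const { taskId } = tm.submit(async () => "speech task 1");
tm.submit(async () => "speech task 2");
```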

MCP directory API

We provide all the information about MCP servers via our MCP API.

```shell
curl -X GET 'https://glama.ai/api/mcp/v1/servers/PsychArch/minimax-mcp-tools'
```

If you have feedback or need assistance with the MCP directory API, please join our Discord server