MiniMax Speech 2.8 Turbo 同期音声合成

curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "text": "<string>",
  "stream": true,
  "voice_modify": {
    "pitch": 123,
    "timbre": 123,
    "intensity": 123,
    "sound_effects": "<string>"
  },
  "audio_setting": {
    "format": "<string>",
    "bitrate": 123,
    "channel": 123,
    "force_cbr": true,
    "sample_rate": 123
  },
  "output_format": "<string>",
  "voice_setting": {
    "vol": 123,
    "pitch": 123,
    "speed": 123,
    "emotion": "<string>",
    "voice_id": "<string>",
    "latex_read": true,
    "text_normalization": true
  },
  "aigc_watermark": true,
  "language_boost": "<string>",
  "stream_options": {
    "exclude_aggregated_audio": true
  },
  "timber_weights": [
    {
      "weight": 123,
      "voice_id": "<string>"
    }
  ],
  "subtitle_enable": true,
  "continuous_sound": true,
  "pronunciation_dict": {
    "tone": [
      "<string>"
    ]
  }
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo"

payload = {
    "text": "<string>",
    "stream": True,
    "voice_modify": {
        "pitch": 123,
        "timbre": 123,
        "intensity": 123,
        "sound_effects": "<string>"
    },
    "audio_setting": {
        "format": "<string>",
        "bitrate": 123,
        "channel": 123,
        "force_cbr": True,
        "sample_rate": 123
    },
    "output_format": "<string>",
    "voice_setting": {
        "vol": 123,
        "pitch": 123,
        "speed": 123,
        "emotion": "<string>",
        "voice_id": "<string>",
        "latex_read": True,
        "text_normalization": True
    },
    "aigc_watermark": True,
    "language_boost": "<string>",
    "stream_options": { "exclude_aggregated_audio": True },
    "timber_weights": [
        {
            "weight": 123,
            "voice_id": "<string>"
        }
    ],
    "subtitle_enable": True,
    "continuous_sound": True,
    "pronunciation_dict": { "tone": ["<string>"] }
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    text: '<string>',
    stream: true,
    voice_modify: {pitch: 123, timbre: 123, intensity: 123, sound_effects: '<string>'},
    audio_setting: {
      format: '<string>',
      bitrate: 123,
      channel: 123,
      force_cbr: true,
      sample_rate: 123
    },
    output_format: '<string>',
    voice_setting: {
      vol: 123,
      pitch: 123,
      speed: 123,
      emotion: '<string>',
      voice_id: '<string>',
      latex_read: true,
      text_normalization: true
    },
    aigc_watermark: true,
    language_boost: '<string>',
    stream_options: {exclude_aggregated_audio: true},
    timber_weights: [{weight: 123, voice_id: '<string>'}],
    subtitle_enable: true,
    continuous_sound: true,
    pronunciation_dict: {tone: ['<string>']}
  })
};

fetch('https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'text' => '<string>',
    'stream' => true,
    'voice_modify' => [
        'pitch' => 123,
        'timbre' => 123,
        'intensity' => 123,
        'sound_effects' => '<string>'
    ],
    'audio_setting' => [
        'format' => '<string>',
        'bitrate' => 123,
        'channel' => 123,
        'force_cbr' => true,
        'sample_rate' => 123
    ],
    'output_format' => '<string>',
    'voice_setting' => [
        'vol' => 123,
        'pitch' => 123,
        'speed' => 123,
        'emotion' => '<string>',
        'voice_id' => '<string>',
        'latex_read' => true,
        'text_normalization' => true
    ],
    'aigc_watermark' => true,
    'language_boost' => '<string>',
    'stream_options' => [
        'exclude_aggregated_audio' => true
    ],
    'timber_weights' => [
        [
                'weight' => 123,
                'voice_id' => '<string>'
        ]
    ],
    'subtitle_enable' => true,
    'continuous_sound' => true,
    'pronunciation_dict' => [
        'tone' => [
                '<string>'
        ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

func main() {

	url := "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo"

	payload := strings.NewReader("{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")

	req, _ := http.NewRequest("POST", url, payload)

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, _ := http.DefaultClient.Do(req)

	defer res.Body.Close()
	body, _ := io.ReadAll(res.Body)

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}"

response = http.request(request)
puts response.read_body

{
  "data": {},
  "trace_id": "<string>",
  "base_resp": {},
  "extra_info": {}
}

POST

minimax-speech-2.8-turbo

MiniMax Speech 2.8 Turbo 同期音声合成

curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "text": "<string>",
  "stream": true,
  "voice_modify": {
    "pitch": 123,
    "timbre": 123,
    "intensity": 123,
    "sound_effects": "<string>"
  },
  "audio_setting": {
    "format": "<string>",
    "bitrate": 123,
    "channel": 123,
    "force_cbr": true,
    "sample_rate": 123
  },
  "output_format": "<string>",
  "voice_setting": {
    "vol": 123,
    "pitch": 123,
    "speed": 123,
    "emotion": "<string>",
    "voice_id": "<string>",
    "latex_read": true,
    "text_normalization": true
  },
  "aigc_watermark": true,
  "language_boost": "<string>",
  "stream_options": {
    "exclude_aggregated_audio": true
  },
  "timber_weights": [
    {
      "weight": 123,
      "voice_id": "<string>"
    }
  ],
  "subtitle_enable": true,
  "continuous_sound": true,
  "pronunciation_dict": {
    "tone": [
      "<string>"
    ]
  }
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo"

payload = {
    "text": "<string>",
    "stream": True,
    "voice_modify": {
        "pitch": 123,
        "timbre": 123,
        "intensity": 123,
        "sound_effects": "<string>"
    },
    "audio_setting": {
        "format": "<string>",
        "bitrate": 123,
        "channel": 123,
        "force_cbr": True,
        "sample_rate": 123
    },
    "output_format": "<string>",
    "voice_setting": {
        "vol": 123,
        "pitch": 123,
        "speed": 123,
        "emotion": "<string>",
        "voice_id": "<string>",
        "latex_read": True,
        "text_normalization": True
    },
    "aigc_watermark": True,
    "language_boost": "<string>",
    "stream_options": { "exclude_aggregated_audio": True },
    "timber_weights": [
        {
            "weight": 123,
            "voice_id": "<string>"
        }
    ],
    "subtitle_enable": True,
    "continuous_sound": True,
    "pronunciation_dict": { "tone": ["<string>"] }
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    text: '<string>',
    stream: true,
    voice_modify: {pitch: 123, timbre: 123, intensity: 123, sound_effects: '<string>'},
    audio_setting: {
      format: '<string>',
      bitrate: 123,
      channel: 123,
      force_cbr: true,
      sample_rate: 123
    },
    output_format: '<string>',
    voice_setting: {
      vol: 123,
      pitch: 123,
      speed: 123,
      emotion: '<string>',
      voice_id: '<string>',
      latex_read: true,
      text_normalization: true
    },
    aigc_watermark: true,
    language_boost: '<string>',
    stream_options: {exclude_aggregated_audio: true},
    timber_weights: [{weight: 123, voice_id: '<string>'}],
    subtitle_enable: true,
    continuous_sound: true,
    pronunciation_dict: {tone: ['<string>']}
  })
};

fetch('https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'text' => '<string>',
    'stream' => true,
    'voice_modify' => [
        'pitch' => 123,
        'timbre' => 123,
        'intensity' => 123,
        'sound_effects' => '<string>'
    ],
    'audio_setting' => [
        'format' => '<string>',
        'bitrate' => 123,
        'channel' => 123,
        'force_cbr' => true,
        'sample_rate' => 123
    ],
    'output_format' => '<string>',
    'voice_setting' => [
        'vol' => 123,
        'pitch' => 123,
        'speed' => 123,
        'emotion' => '<string>',
        'voice_id' => '<string>',
        'latex_read' => true,
        'text_normalization' => true
    ],
    'aigc_watermark' => true,
    'language_boost' => '<string>',
    'stream_options' => [
        'exclude_aggregated_audio' => true
    ],
    'timber_weights' => [
        [
                'weight' => 123,
                'voice_id' => '<string>'
        ]
    ],
    'subtitle_enable' => true,
    'continuous_sound' => true,
    'pronunciation_dict' => [
        'tone' => [
                '<string>'
        ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

func main() {

	url := "https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo"

	payload := strings.NewReader("{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")

	req, _ := http.NewRequest("POST", url, payload)

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, _ := http.DefaultClient.Do(req)

	defer res.Body.Close()
	body, _ := io.ReadAll(res.Body)

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/minimax-speech-2.8-turbo")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"text\": \"<string>\",\n  \"stream\": true,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"force_cbr\": true,\n    \"sample_rate\": 123\n  },\n  \"output_format\": \"<string>\",\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"latex_read\": true,\n    \"text_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"stream_options\": {\n    \"exclude_aggregated_audio\": true\n  },\n  \"timber_weights\": [\n    {\n      \"weight\": 123,\n      \"voice_id\": \"<string>\"\n    }\n  ],\n  \"subtitle_enable\": true,\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}"

response = http.request(request)
puts response.read_body

{
  "data": {},
  "trace_id": "<string>",
  "base_resp": {},
  "extra_info": {}
}

テキストを音声に変換します。複数の音色、感情制御、話速調整などの機能に対応しています。テキスト長は 10000 文字未満に制限されます。テキスト長が 3000 文字を超える場合は、ストリーミング出力の使用を推奨します。

リクエストヘッダー

string

必須

列挙値: application/json

string

必須

Bearer 認証形式: Bearer {{API Key}}。

リクエストボディ

string

必須

音声合成するテキスト。長さは 10000 文字未満に制限されます。テキスト長が 3000 文字を超える場合は、ストリーミング出力の使用を推奨します。段落切り替え（改行）、ポーズ制御（<#x#> マーク）、フィラータグ（(laughs)、(coughs) など。speech-2.8-hd/turbo のみ対応）をサポートします

boolean

デフォルト:false

ストリーミング出力するかどうかを制御します。デフォルトは false、つまりストリーミングは有効化されません

object

非表示プロパティ

integer

ピッチ調整（低め/明るめ）。範囲は [-100, 100] です。値が -100 に近いほど声はより低くなり、100 に近いほどより明るくなります値の範囲：[-100, 100]

integer

音色調整（深み/クリア）。範囲は [-100, 100] です。値が -100 に近いほど声はより厚みを増し、100 に近いほどよりクリアになります値の範囲：[-100, 100]

integer

強度調整（力強さ/柔らかさ）。範囲は [-100, 100] です。値が -100 に近いほど声はより力強くなり、100 に近いほどより柔らかくなります値の範囲：[-100, 100]

string

音響効果の設定。一度に 1 種類のみ選択できます。選択可能な値：spacious_echo（広い空間のエコー）、auditorium_echo（講堂放送）、lofi_telephone（電話風の歪み）、robotic（電子音）選択可能な値：spacious_echo, auditorium_echo, lofi_telephone, robotic

object

非表示プロパティ

string

デフォルト:"mp3"

生成される音声の形式。wav は非ストリーミング出力でのみサポートされます選択可能な値：mp3, pcm, flac, wav

integer

デフォルト:128000

生成される音声のビットレート。選択可能な範囲は [32000, 64000, 128000, 256000]、デフォルト値は 128000 です。このパラメータは mp3 形式の音声にのみ有効です選択可能な値：32000, 64000, 128000, 256000

integer

デフォルト:1

生成される音声のチャンネル数。選択可能な範囲：[1, 2]。1 はモノラル、2 はステレオです。デフォルト値は 1 です選択可能な値：1, 2

boolean

デフォルト:false

音声の固定ビットレート（cbr）制御に使用します。false、true を選択できます。このパラメータを true に設定すると、固定ビットレート方式で音声をエンコードします。注意：このパラメータは、音声がストリーミング出力に設定され、かつ音声形式が mp3 の場合にのみ有効です

integer

デフォルト:32000

生成される音声のサンプリングレート。選択可能な範囲は [8000, 16000, 22050, 24000, 32000, 44100]、デフォルトは 32000 です選択可能な値：8000, 16000, 22050, 24000, 32000, 44100

string

デフォルト:"hex"

出力結果形式を制御するパラメータです。選択可能な値の範囲は url、hex で、デフォルト値は hex です。このパラメータは非ストリーミングシナリオでのみ有効です。ストリーミングシナリオでは hex 形式の返却のみサポートされます。返却される url の有効期限は 24 時間です選択可能な値：url, hex

object

非表示プロパティ

number

デフォルト:1

合成音声の音量。値が大きいほど音量が高くなります。値の範囲は (0, 10]、デフォルト値は 1.0 です値の範囲：[0, 10]

integer

デフォルト:0

合成音声のピッチ。値の範囲は [-12, 12]、デフォルト値は 0 です。0 は元の音色で出力することを示します値の範囲：[-12, 12]

number

デフォルト:1

合成音声の話速。値が大きいほど話速が速くなります。値の範囲は [0.5, 2]、デフォルト値は 1.0 です値の範囲：[0.5, 2]

string

合成音声の感情を制御します。パラメータ範囲はそれぞれ 8 種類の感情に対応します：喜び(happy)、悲しみ(sad)、怒り(angry)、恐れ(fearful)、嫌悪(disgusted)、驚き(surprised)、中立(calm)、生き生き(fluent)、ささやき(whisper)。モデルは入力テキストに基づいて適切な感情を自動的に一致させるため、通常は手動指定は不要です選択可能な値：happy, sad, angry, fearful, disgusted, surprised, calm, fluent, whisper

string

必須

合成音声の音色 ID。混合音色を設定する必要がある場合は、timber_weights パラメータを設定し、このパラメータは空値にしてください。システム音色、クローン音色、テキスト生成音色の 3 種類をサポートします

boolean

デフォルト:false

latex 数式を読み上げるかどうかを制御します。デフォルトは false です。中国語のみ対応しています。このパラメータを有効にすると、language_boost パラメータは Chinese に設定されます

boolean

デフォルト:false

中国語・英語テキストの正規化を有効にするかどうか。オンにすると数字読み上げシナリオの性能を向上できますが、遅延がわずかに増加します。デフォルト値は false です

boolean

デフォルト:false

合成音声の末尾に音声リズム識別子を追加するかどうかを制御します。デフォルト値は false です。このパラメータは非ストリーミング合成にのみ有効です

string

指定した少数言語および方言の認識能力を強化するかどうか。デフォルト値は null です。auto に設定すると、モデルに自律的に判断させることができます選択可能な値：Chinese, Chinese,Yue, English, Arabic, Russian, Spanish, French, Portuguese, German, Turkish, Dutch, Ukrainian, Vietnamese, Indonesian, Japanese, Italian, Korean, Thai, Polish, Romanian, Greek, Czech, Finnish, Hindi, Bulgarian, Danish, Hebrew, Malay, Persian, Slovak, Swedish, Croatian, Filipino, Hungarian, Norwegian, Slovenian, Catalan, Nynorsk, Tamil, Afrikaans, auto

object

非表示プロパティ

boolean

デフォルト:false

最後の chunk に結合後の音声 hex データを含めるかどうかを設定します。デフォルト値は false、つまり最後の chunk には結合後の完全な音声 hex データが含まれます

object[]

混合音色設定。最大 4 種類の音色混合をサポートします

非表示プロパティ

integer

必須

合成音声における各音色の重み。voice_id と同期して入力する必要があります。選択可能な値の範囲は [1, 100] で、最大 4 種類の音色混合をサポートします。単一音色の値の比率が高いほど、合成音色はその音色により近くなります値の範囲：[1, 100]

string

必須

合成音声の音色 ID。weight パラメータと同期して入力する必要があります。システム音色、クローン音色、テキスト生成音色の 3 種類をサポートします

boolean

デフォルト:false

字幕サービスを有効にするかどうかを制御します。デフォルト値は false です。このパラメータは非ストリーミング出力シナリオでのみ有効であり、speech-2.6-hd, speech-2.6-turbo, speech-01-turbo, speech-01-hd モデルに対してのみ有効です

boolean

デフォルト:false

このパラメータを有効にすると、句と句のつなぎ目がより自然になります。speech-2.8-hd および speech-2.8-turbo モデルのみ対応しています

object

非表示プロパティ

string[]

特別な注記が必要な文字または記号に対応する注音または発音の置換ルールを定義します。中国語テキストでは、声調を数字で表します：一声は 1、二声は 2、三声は 3、四声は 4、軽声は 5 です。例：[“燕少飞/(yan4)(shao3)(fei1)”, “omg/oh my god”]

レスポンス情報

object

返却される合成データオブジェクト。null の可能性があるため、非 null 判定が必要です

string

今回のセッションの id。問い合わせ/フィードバック時に問題の特定に役立ちます

object

今回のリクエストのステータスコードと詳細

object

音声の追加情報

MiniMax Speech 2.8 Turbo 非同期音声合成

MiniMax Speech 2.8 HD 非同期音声合成

API の基本

大規模言語モデル

画像

動画

音声

MiniMax Speech 2.8 Turbo 同期音声合成

リクエストヘッダー

リクエストボディ

レスポンス情報

​リクエストヘッダー

​リクエストボディ

​レスポンス情報

リクエストヘッダー

リクエストボディ

レスポンス情報