MiniMax Speech 2.8 HD 非同期音声合成

curl --request POST \
  --url https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "text": "<string>",
  "text_file_id": 123,
  "voice_modify": {
    "pitch": 123,
    "timbre": 123,
    "intensity": 123,
    "sound_effects": "<string>"
  },
  "audio_setting": {
    "format": "<string>",
    "bitrate": 123,
    "channel": 123,
    "audio_sample_rate": 123
  },
  "voice_setting": {
    "vol": 123,
    "pitch": 123,
    "speed": 123,
    "emotion": "<string>",
    "voice_id": "<string>",
    "english_normalization": true
  },
  "aigc_watermark": true,
  "language_boost": "<string>",
  "continuous_sound": true,
  "pronunciation_dict": {
    "tone": [
      "<string>"
    ]
  }
}
'

import requests

url = "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd"

payload = {
    "text": "<string>",
    "text_file_id": 123,
    "voice_modify": {
        "pitch": 123,
        "timbre": 123,
        "intensity": 123,
        "sound_effects": "<string>"
    },
    "audio_setting": {
        "format": "<string>",
        "bitrate": 123,
        "channel": 123,
        "audio_sample_rate": 123
    },
    "voice_setting": {
        "vol": 123,
        "pitch": 123,
        "speed": 123,
        "emotion": "<string>",
        "voice_id": "<string>",
        "english_normalization": True
    },
    "aigc_watermark": True,
    "language_boost": "<string>",
    "continuous_sound": True,
    "pronunciation_dict": { "tone": ["<string>"] }
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    text: '<string>',
    text_file_id: 123,
    voice_modify: {pitch: 123, timbre: 123, intensity: 123, sound_effects: '<string>'},
    audio_setting: {format: '<string>', bitrate: 123, channel: 123, audio_sample_rate: 123},
    voice_setting: {
      vol: 123,
      pitch: 123,
      speed: 123,
      emotion: '<string>',
      voice_id: '<string>',
      english_normalization: true
    },
    aigc_watermark: true,
    language_boost: '<string>',
    continuous_sound: true,
    pronunciation_dict: {tone: ['<string>']}
  })
};

fetch('https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'text' => '<string>',
    'text_file_id' => 123,
    'voice_modify' => [
        'pitch' => 123,
        'timbre' => 123,
        'intensity' => 123,
        'sound_effects' => '<string>'
    ],
    'audio_setting' => [
        'format' => '<string>',
        'bitrate' => 123,
        'channel' => 123,
        'audio_sample_rate' => 123
    ],
    'voice_setting' => [
        'vol' => 123,
        'pitch' => 123,
        'speed' => 123,
        'emotion' => '<string>',
        'voice_id' => '<string>',
        'english_normalization' => true
    ],
    'aigc_watermark' => true,
    'language_boost' => '<string>',
    'continuous_sound' => true,
    'pronunciation_dict' => [
        'tone' => [
                '<string>'
        ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

func main() {

	url := "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd"

	payload := strings.NewReader("{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")

	req, _ := http.NewRequest("POST", url, payload)

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, _ := http.DefaultClient.Do(req)

	defer res.Body.Close()
	body, _ := io.ReadAll(res.Body)

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}"

response = http.request(request)
puts response.read_body

{
  "file_id": 123,
  "task_id": "<string>",
  "base_resp": {
    "status_msg": "<string>",
    "status_code": 123
  },
  "task_token": "<string>",
  "usage_characters": 123
}

POST

async

minimax-speech-2.8-hd

MiniMax Speech 2.8 HD 非同期音声合成

curl --request POST \
  --url https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "text": "<string>",
  "text_file_id": 123,
  "voice_modify": {
    "pitch": 123,
    "timbre": 123,
    "intensity": 123,
    "sound_effects": "<string>"
  },
  "audio_setting": {
    "format": "<string>",
    "bitrate": 123,
    "channel": 123,
    "audio_sample_rate": 123
  },
  "voice_setting": {
    "vol": 123,
    "pitch": 123,
    "speed": 123,
    "emotion": "<string>",
    "voice_id": "<string>",
    "english_normalization": true
  },
  "aigc_watermark": true,
  "language_boost": "<string>",
  "continuous_sound": true,
  "pronunciation_dict": {
    "tone": [
      "<string>"
    ]
  }
}
'

import requests

url = "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd"

payload = {
    "text": "<string>",
    "text_file_id": 123,
    "voice_modify": {
        "pitch": 123,
        "timbre": 123,
        "intensity": 123,
        "sound_effects": "<string>"
    },
    "audio_setting": {
        "format": "<string>",
        "bitrate": 123,
        "channel": 123,
        "audio_sample_rate": 123
    },
    "voice_setting": {
        "vol": 123,
        "pitch": 123,
        "speed": 123,
        "emotion": "<string>",
        "voice_id": "<string>",
        "english_normalization": True
    },
    "aigc_watermark": True,
    "language_boost": "<string>",
    "continuous_sound": True,
    "pronunciation_dict": { "tone": ["<string>"] }
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    text: '<string>',
    text_file_id: 123,
    voice_modify: {pitch: 123, timbre: 123, intensity: 123, sound_effects: '<string>'},
    audio_setting: {format: '<string>', bitrate: 123, channel: 123, audio_sample_rate: 123},
    voice_setting: {
      vol: 123,
      pitch: 123,
      speed: 123,
      emotion: '<string>',
      voice_id: '<string>',
      english_normalization: true
    },
    aigc_watermark: true,
    language_boost: '<string>',
    continuous_sound: true,
    pronunciation_dict: {tone: ['<string>']}
  })
};

fetch('https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'text' => '<string>',
    'text_file_id' => 123,
    'voice_modify' => [
        'pitch' => 123,
        'timbre' => 123,
        'intensity' => 123,
        'sound_effects' => '<string>'
    ],
    'audio_setting' => [
        'format' => '<string>',
        'bitrate' => 123,
        'channel' => 123,
        'audio_sample_rate' => 123
    ],
    'voice_setting' => [
        'vol' => 123,
        'pitch' => 123,
        'speed' => 123,
        'emotion' => '<string>',
        'voice_id' => '<string>',
        'english_normalization' => true
    ],
    'aigc_watermark' => true,
    'language_boost' => '<string>',
    'continuous_sound' => true,
    'pronunciation_dict' => [
        'tone' => [
                '<string>'
        ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

func main() {

	url := "https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd"

	payload := strings.NewReader("{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")

	req, _ := http.NewRequest("POST", url, payload)

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, _ := http.DefaultClient.Do(req)

	defer res.Body.Close()
	body, _ := io.ReadAll(res.Body)

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/async/minimax-speech-2.8-hd")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"text\": \"<string>\",\n  \"text_file_id\": 123,\n  \"voice_modify\": {\n    \"pitch\": 123,\n    \"timbre\": 123,\n    \"intensity\": 123,\n    \"sound_effects\": \"<string>\"\n  },\n  \"audio_setting\": {\n    \"format\": \"<string>\",\n    \"bitrate\": 123,\n    \"channel\": 123,\n    \"audio_sample_rate\": 123\n  },\n  \"voice_setting\": {\n    \"vol\": 123,\n    \"pitch\": 123,\n    \"speed\": 123,\n    \"emotion\": \"<string>\",\n    \"voice_id\": \"<string>\",\n    \"english_normalization\": true\n  },\n  \"aigc_watermark\": true,\n  \"language_boost\": \"<string>\",\n  \"continuous_sound\": true,\n  \"pronunciation_dict\": {\n    \"tone\": [\n      \"<string>\"\n    ]\n  }\n}"

response = http.request(request)
puts response.read_body

{
  "file_id": 123,
  "task_id": "<string>",
  "base_resp": {
    "status_msg": "<string>",
    "status_code": 123
  },
  "task_token": "<string>",
  "usage_characters": 123
}

このインターフェースを使用して、非同期音声合成タスクを作成します。テキストまたはファイル入力に対応し、テキストの長さは最大 5 万文字、ファイルは最大 10 万文字までに制限されます。

これは非同期API であり、非同期タスクの task_id のみを返します。この task_id を使用してタスク結果照会 API にリクエストし、生成結果を取得してください。

リクエストヘッダー

string

必須

列挙値: application/json

string

必須

Bearer 認証形式: Bearer {{API Key}}。

リクエストボディ

string

合成する音声のテキスト。最大 5 万文字までに制限されます。text_file_id とのいずれか一方が必須です

• フィラータグ：モデルで speech-2.8-hd または speech-2.8-turbo を選択した場合のみ、テキスト内にフィラータグを挿入できます。対応するフィラー：(laughs)（笑い声）、(chuckle)（軽い笑い）、(coughs)（咳）、(clear-throat)（咳払い）、(groans)（うめき声）、(breath)（通常の呼吸）、(pant)（息切れ）、(inhale)（吸気）、(exhale)（呼気）、(gasps)（息をのむ）、(sniffs)（鼻をすする）、(sighs)（ため息）、(snorts)（鼻息）、(burps)（げっぷ）、(lip-smacking)（舌鼓）、(humming)（鼻歌）、(hissing)（シューという音）、(emm)（ええと）、(whistles)（口笛）、(sneezes)（くしゃみ）、(crying)（すすり泣き）、(applause)（拍手）

integer

合成する音声のテキストファイル id。単一ファイルの長さは 10 万文字未満に制限され、対応ファイル形式は txt、zip です。text とのいずれか一方が必須で、指定後に形式が自動検証されます。
• txt ファイル：長さ制限 <100000 文字。<#x#> マークによるカスタムポーズに対応しています。x はポーズの長さ（単位：秒）で、範囲は [0.01, 99.99]、小数点以下は最大 2 桁まで保持できます。ポーズは音声として発音可能な 2 つのテキストの間に設定する必要があり、複数のポーズマークを連続して使用することはできません
• zip ファイル：
• 圧縮ファイル内には、同一形式の txt または json ファイルを含める必要があります。
• json ファイル形式：[title, content, extra] の 3 つのフィールドに対応しており、それぞれタイトル、本文、追加情報を表します。3 つのフィールドがすべて存在する場合、3 セットの結果、合計 9 ファイルが生成され、1 つのフォルダにまとめて保存されます。いずれかのフィールドが存在しない、または内容が空の場合、そのフィールドに対応する結果は生成されません

object

非表示プロパティ

integer

ピッチ調整（低い/明るい）。範囲は [-100, 100] で、値が -100 に近いほど声はより低くなり、100 に近いほど声はより明るくなります値の範囲：[-100, 100]

integer

音色調整（渋い/クリア）。範囲は [-100, 100] で、値が -100 に近いほど声はより厚みが増し、100 に近いほど声はよりクリアになります値の範囲：[-100, 100]

integer

強度調整（力強さ/柔らかさ）。範囲は [-100, 100] で、値が -100 に近いほど声はより力強くなり、100 に近いほど声はより柔らかくなります値の範囲：[-100, 100]

string

音響効果の設定。1 回につき 1 種類のみ選択可能です。選択可能な値：

spacious_echo（広い空間のエコー）
auditorium_echo（講堂放送）
lofi_telephone（電話の歪み）
robotic（電子音声）

選択可能な値：spacious_echo, auditorium_echo, lofi_telephone, robotic

object

非表示プロパティ

string

デフォルト:"mp3"

生成される音声の形式。選択可能な範囲は [mp3, pcm, flac]、デフォルト値は mp3 です選択可能な値：mp3, pcm, flac

integer

デフォルト:128000

生成される音声のビットレート。選択可能な範囲は [32000, 64000, 128000, 256000]、デフォルト値は 128000 です。このパラメータは mp3 形式の音声にのみ有効です

integer

デフォルト:2

生成される音声のチャンネル数。選択可能な範囲：[1, 2]。1 はモノラル、2 はステレオを表し、デフォルト値は 1 です

integer

デフォルト:32000

生成される音声のサンプリングレート。選択可能な範囲は [8000, 16000, 22050, 24000, 32000, 44100]、デフォルトは 32000 です

object

必須

非表示プロパティ

number

デフォルト:1

合成音声の音量。値が大きいほど音量が大きくなります。値の範囲は (0, 10]、デフォルト値は 1.0 です値の範囲：[0, 10]

integer

デフォルト:0

合成音声のイントネーション。値の範囲は [-12, 12]、デフォルト値は 0 です。0 は元の音色での出力を表します値の範囲：[-12, 12]

number

デフォルト:1

合成音声の話速。値が大きいほど話速が速くなります。値の範囲は [0.5, 2]、デフォルト値は 1.0 です値の範囲：[0.5, 2]

string

合成音声の感情を制御します。パラメータ範囲は [“happy”, “sad”, “angry”, “fearful”, “disgusted”, “surprised”, “calm”, “fluent”, “whisper”] で、それぞれ 8 種類の感情に対応します：喜び、悲しみ、怒り、恐れ、嫌悪、驚き、中立、生き生き、ささやき
• モデルは入力テキストに基づいて適切な感情を自動的にマッチングするため、通常は手動指定は不要です
• このパラメータは speech-2.6-hd, speech-2.6-turbo, speech-01-hd, speech-01-turbo モデルにのみ有効です
• オプション fluent, whisper は speech-2.6-turbo, speech-2.6-hd モデルにのみ有効です選択可能な値：happy, sad, angry, fearful, disgusted, surprised, calm, fluent, whisper

string

必須

合成音声の音色番号。混合音色を設定する必要がある場合は、timber_weights パラメータを設定し、このパラメータは空値にしてください。システム音色、クローン音色、テキスト生成音色の 3 種類に対応しています。以下は最新のシステム音色（ID）の一部です。公式に対応しているすべての音色を確認できます
• 中国語:
• moss_audio_ce44fc67-7ce3-11f0-8de5-96e35d26fb85
• moss_audio_aaa1346a-7ce7-11f0-8e61-2e6e3c7ee85d
• Chinese (Mandarin)_Lyrical_Voice
• Chinese (Mandarin)_HK_Flight_Attendant
• 英語:
• English_Graceful_Lady
• English_Insightful_Speaker
• English_radiant_girl
• English_Persuasive_Man
• moss_audio_6dc281eb-713c-11f0-a447-9613c873494c
• moss_audio_570551b1-735c-11f0-b236-0adeeecad052
• moss_audio_ad5baf92-735f-11f0-8263-fe5a2fe98ec8
• English_Lucky_Robot
• 日本語:
• Japanese_Whisper_Belle
• moss_audio_24875c4a-7be4-11f0-9359-4e72c55db738
• moss_audio_7f4ee608-78ea-11f0-bb73-1e2a4cfcd245
• moss_audio_c1a6a3ac-7be6-11f0-8e8e-36b92fbb4f95

boolean

デフォルト:false

英語テキストの正規化に対応します。有効にすると数字読み上げシーンでの性能を向上できますが、レイテンシがわずかに増加します。デフォルトは false です

boolean

デフォルト:false

合成音声の末尾に音声リズム識別子を追加するかどうかを制御します。デフォルト値は False です。このパラメータは非ストリーミング合成にのみ有効です

string

指定した少数言語および方言の認識能力を強化するかどうか。デフォルト値は null で、auto に設定するとモデルが自律的に判断します。選択可能な値：Chinese, Chinese,Yue, English, Arabic, Russian, Spanish, French, Portuguese, German, Turkish, Dutch, Ukrainian, Vietnamese, Indonesian, Japanese, Italian, Korean, Thai, Polish, Romanian, Greek, Czech, Finnish, Hindi, Bulgarian, Danish, Hebrew, Malay, Persian, Slovak, Swedish, Croatian, Filipino, Hungarian, Norwegian, Slovenian, Catalan, Nynorsk, Tamil, Afrikaans, auto

boolean

デフォルト:false

このパラメータを有効にすると、句の接続部分がより自然になります。speech-2.8-hd および speech-2.8-turbo モデルのみ対応しています

object

非表示プロパティ

string[]

特別な注記が必要な文字または記号に対応するルビや発音置換ルールを定義します。中国語テキストでは、声調を数字で表します：一声は 1、二声は 2、三声は 3、四声は 4、軽声は 5 例： [“燕少飞/(yan4)(shao3)(fei1)”, “omg/oh my god”]

レスポンス情報

integer

タスク作成成功後に返される、対応する音声ファイルの ID。

• タスク完了後、file_id で照会できます。リクエストでエラーが発生した場合、このフィールドは返されません注意：返されるダウンロード URL は生成時から 9 時間（32400 秒）有効です。有効期限を過ぎるとファイルは無効になり、生成された情報は失われます。ダウンロード情報の時間にご注意ください

string

task_id を使用してタスク結果照会 API にリクエストし、生成された出力を取得します。

object

非表示プロパティ

string

必須

ステータスの詳細

integer

必須

ステータスコード

• 0: 正常
• 1002: レート制限
• 1004: 認証失敗
• 1039: TPM レート制限に達しました
• 1042: 不正な文字が 10% 超
• 2013: パラメータエラー

string

現在のタスクの完了に使用されたキー情報

integer

課金対象文字数

MiniMax Speech 2.8 Turbo 同期音声合成

MiniMax Speech 2.8 HD 同期音声合成

API の基本

大規模言語モデル

画像

動画

音声

MiniMax Speech 2.8 HD 非同期音声合成

リクエストヘッダー

リクエストボディ

レスポンス情報

​リクエストヘッダー

​リクエストボディ

​レスポンス情報

リクエストヘッダー

リクエストボディ

レスポンス情報