Voice Cloning API | MiniMax Audio Quick Cloning

MiniMax Audio Quick Cloning

# POST a voice-cloning request with a JSON body.
# Every <...> value below is a placeholder and must be replaced before running.
curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

# Endpoint for MiniMax Audio Quick Cloning.
url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

# Template request body: every value is a placeholder to replace before sending.
payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,  # placeholder; the parameter reference gives the range as [0, 1]
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# requests applies no timeout by default, so bound the wait explicitly;
# 30 seconds matches the limit used by the PHP sample.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body.
print(response.text)

// Template request body: every value is a placeholder to replace before sending.
const payload = JSON.stringify({
  audio_url: '<string>',
  text: '<string>',
  model: '<string>',
  accuracy: 123,
  need_noise_reduction: true,
  need_volume_normalization: true
});

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: payload
};

// Send the request, log the parsed JSON response, and log any failure.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Template request body: every value is a placeholder to replace before sending.
$payload = json_encode([
  'audio_url' => '<string>',
  'text' => '<string>',
  'model' => '<string>',
  'accuracy' => 123,
  'need_noise_reduction' => true,
  'need_volume_normalization' => true
]);

// Placeholder request headers.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => $headers,
]);

// Capture both the body and any transport error before releasing the handle.
$response = curl_exec($curl);
$err = curl_error($curl);
curl_close($curl);

// Print the response body, or the cURL error when the transfer failed.
if (!$err) {
  echo $response;
} else {
  echo "cURL Error #:" . $err;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the voice-cloning request and prints the raw response body.
//
// The payload, Content-Type and Authorization values are template
// placeholders that must be replaced before running. Any failure is
// reported on standard output and the program returns without panicking.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so it must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	fmt.Println(string(body))

}

// POST the JSON request body with Unirest and read the response as a string.
// The header values and the body fields are placeholders to replace before use.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint for MiniMax Audio Quick Cloning.
endpoint = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

# Build the POST request; header values and body fields are placeholders.
request = Net::HTTP::Post.new(endpoint)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

# Open a TLS connection to the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Send the request and print the response body.
puts client.request(request).read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

POST

minimax-voice-cloning

MiniMax Audio Quick Cloning

# POST a voice-cloning request with a JSON body.
# Every <...> value below is a placeholder and must be replaced before running.
curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

# Endpoint for MiniMax Audio Quick Cloning.
url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

# Template request body: every value is a placeholder to replace before sending.
payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,  # placeholder; the parameter reference gives the range as [0, 1]
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# requests applies no timeout by default, so bound the wait explicitly;
# 30 seconds matches the limit used by the PHP sample.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body.
print(response.text)

// Template request body: every value is a placeholder to replace before sending.
const payload = JSON.stringify({
  audio_url: '<string>',
  text: '<string>',
  model: '<string>',
  accuracy: 123,
  need_noise_reduction: true,
  need_volume_normalization: true
});

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: payload
};

// Send the request, log the parsed JSON response, and log any failure.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Template request body: every value is a placeholder to replace before sending.
$payload = json_encode([
  'audio_url' => '<string>',
  'text' => '<string>',
  'model' => '<string>',
  'accuracy' => 123,
  'need_noise_reduction' => true,
  'need_volume_normalization' => true
]);

// Placeholder request headers.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => $headers,
]);

// Capture both the body and any transport error before releasing the handle.
$response = curl_exec($curl);
$err = curl_error($curl);
curl_close($curl);

// Print the response body, or the cURL error when the transfer failed.
if (!$err) {
  echo $response;
} else {
  echo "cURL Error #:" . $err;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the voice-cloning request and prints the raw response body.
//
// The payload, Content-Type and Authorization values are template
// placeholders that must be replaced before running. Any failure is
// reported on standard output and the program returns without panicking.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so it must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	fmt.Println(string(body))

}

// POST the JSON request body with Unirest and read the response as a string.
// The header values and the body fields are placeholders to replace before use.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint for MiniMax Audio Quick Cloning.
endpoint = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

# Build the POST request; header values and body fields are placeholders.
request = Net::HTTP::Post.new(endpoint)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

# Open a TLS connection to the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Send the request and print the response body.
puts client.request(request).read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

This API supports cloning voices from mono or stereo audio, enabling quick replication of speech with the same timbre based on a specified audio file. The quickly cloned voice produced by this API is a temporary voice. If you wish to permanently retain a cloned voice, please use this voice in any T2A speech synthesis API within 168 hours (7 days) (excluding the trial-listening behavior within this API); otherwise, the voice will be deleted. Applicable scenarios for this API: IP replication, voice cloning, and other scenarios that require quickly replicating a specific voice. Notes:

The uploaded audio file format must be: mp3, m4a, or wav;
The uploaded audio file must be at least 10 seconds long and no longer than 5 minutes;
The uploaded audio file size must not exceed 20 MB.

Request Headers

string

required

Enum value: application/json

string

required

Bearer authentication format: Bearer {{API Key}}.

Request Body

string

required

The audio file url for the voice to be cloned. Supports mp3, m4a, and wav formats.

Voice cloning parameters. Providing this parameter helps improve the timbre similarity and stability of speech synthesis. If this parameter is used, you must also upload a short sample audio clip (less than 8s) and the corresponding text for the audio. The audio supports mp3, m4a, and wav formats.

Show properties

number

required

Audio prompt parameter: the sample audio url. The duration must be less than 8s.

string

required

Audio prompt parameter: enter the corresponding text for the sample audio. Make sure it matches the audio content, and the sentence must end with punctuation.

string

Cloning trial-listening parameter. The model will read this text using the cloned voice and return the synthesized audio result as a link for previewing the cloning effect. Limited to 2000 characters. Note: trial listening will be charged for speech synthesis based on the number of characters, with pricing consistent with the T2A APIs.

string

Cloning trial-listening parameter. Specifies the speech model used for trial listening. This field is required when the “text” field is provided.
Options: speech-2.8-hd, speech-2.8-turbo

float

Audio cloning parameter. Value range: [0,1]. Providing this field sets the text verification accuracy threshold. If not provided, the default value is 0.7.

bool

Audio cloning parameter. Whether to enable noise reduction. Defaults to false if not provided.

bool

Audio cloning parameter. Whether to enable volume normalization. Defaults to false if not provided.

Response Information

string

If the request body includes both the trial-listening text (`text`) and the trial-listening model (`model`), this parameter returns the trial-listening audio as a link.

string

The generated voice_id

MiniMax Speech 2.8 HD Synchronous Speech Synthesis

ElevenLabs Speech to Text V1

API Basics

Large Language Models

Images

Video

Audio

MiniMax Audio Quick Cloning

Request Headers

Request Body

Response Information

​Request Headers

​Request Body

​Response Information

Request Headers

Request Body

Response Information