Voice Cloning API | MiniMax Audio-Schnellklonen

MiniMax Audio-Schnellklonen

curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    audio_url: '<string>',
    text: '<string>',
    model: '<string>',
    accuracy: 123,
    need_noise_reduction: true,
    need_volume_normalization: true
  })
};

fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'audio_url' => '<string>',
    'text' => '<string>',
    'model' => '<string>',
    'accuracy' => 123,
    'need_noise_reduction' => true,
    'need_volume_normalization' => true
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the sample voice-cloning request to the API endpoint and prints
// the raw response body to standard output.
//
// The "<content-type>" and "<authorization>" header values and the "<string>"
// payload fields are placeholders that must be replaced before running.
// Any error while building the request, sending it, or reading the response
// is printed and the program returns without touching a nil response.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// On error the response is nil, so res.Body must not be dereferenced.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

response = http.request(request)
puts response.read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

POST

minimax-voice-cloning

MiniMax Audio-Schnellklonen

curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

response = requests.post(url, json=payload, headers=headers)

print(response.text)

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: JSON.stringify({
    audio_url: '<string>',
    text: '<string>',
    model: '<string>',
    accuracy: 123,
    need_noise_reduction: true,
    need_volume_normalization: true
  })
};

fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'audio_url' => '<string>',
    'text' => '<string>',
    'model' => '<string>',
    'accuracy' => 123,
    'need_noise_reduction' => true,
    'need_volume_normalization' => true
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: <authorization>",
    "Content-Type: <content-type>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the sample voice-cloning request to the API endpoint and prints
// the raw response body to standard output.
//
// The "<content-type>" and "<authorization>" header values and the "<string>"
// payload fields are placeholders that must be replaced before running.
// Any error while building the request, sending it, or reading the response
// is printed and the program returns without touching a nil response.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// On error the response is nil, so res.Body must not be dereferenced.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Content-Type"] = '<content-type>'
request["Authorization"] = '<authorization>'
request.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

response = http.request(request)
puts response.read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

Diese Schnittstelle unterstützt das Klonen von Stimmen aus Mono- und Stereo-Audio und ermöglicht das schnelle Klonen einer Stimme mit derselben Klangfarbe anhand einer angegebenen Audiodatei. Die von dieser Schnittstelle erzeugte schnell geklonte Stimme ist eine temporäre Stimme. Wenn Sie eine geklonte Stimme dauerhaft behalten möchten, rufen Sie diese Stimme bitte innerhalb von 168 Stunden (7 Tagen) in einer beliebigen T2A-Sprachsynthese-Schnittstelle auf (das Probehören innerhalb dieser Schnittstelle zählt nicht dazu); andernfalls wird diese Stimme gelöscht. Geeignete Anwendungsfälle für diese Schnittstelle: IP-Klonen, Stimmenklonen und andere Szenarien, in denen eine bestimmte Stimme schnell geklont werden muss. Hinweise:

Das Format der hochgeladenen Audiodatei muss eines der folgenden sein: mp3, m4a, wav;
Die Dauer der hochgeladenen Audiodatei muss mindestens 10 Sekunden und darf höchstens 5 Minuten betragen;
Die Größe der hochgeladenen Audiodatei darf 20 MB nicht überschreiten.

Anfrageheader

string

erforderlich

Enumerationswert: application/json

string

erforderlich

Bearer-Authentifizierungsformat: Bearer {{API Key}}.

Anfragetext

string

erforderlich

Die URL der Audiodatei, deren Stimme geklont werden soll. Unterstützt die Formate mp3, m4a, wav.

Parameter für das Stimmenklonen. Die Bereitstellung dieses Parameters hilft, die Ähnlichkeit und Stabilität der Stimme bei der Sprachsynthese zu verbessern. Wenn dieser Parameter verwendet wird, müssen gleichzeitig ein kurzes Beispielaudio (Dauer unter 8s) und der zugehörige Text des Audios hochgeladen werden. Unterstützte Audioformate sind mp3, m4a, wav.

Eigenschaften anzeigen

number

erforderlich

Audio-prompt-Parameter, URL des Beispielaudios; die Dauer muss unter 8s liegen.

string

erforderlich

Audio-prompt-Parameter. Geben Sie den zum Beispielaudio gehörenden Text ein; stellen Sie sicher, dass er mit dem Audioinhalt übereinstimmt und dass der Satz am Ende mit einem Satzzeichen abschließt.

string

Parameter für das Probehören der geklonten Stimme. Das Modell liest diesen Text mit der geklonten Stimme vor und gibt das Ergebnis der Audiosynthese als Link zurück, damit der Kloneffekt angehört werden kann. Begrenzt auf maximal 2000 Zeichen. Hinweis: Für das Probehören werden entsprechend der Zeichenanzahl regulär Gebühren für die Sprachsynthese berechnet; die Preisgestaltung entspricht den jeweiligen T2A-Schnittstellen.

string

Parameter für das Probehören der geklonten Stimme. Gibt das für das Probehören verwendete Sprachmodell an; wenn das Feld “text” übergeben wird, ist dieses Feld erforderlich.
Optionen: speech-2.8-hd, speech-2.8-turbo

float

Parameter für das Audioklonen. Wertebereich [0,1]. Wenn dieses Feld übergeben wird, legt es den Genauigkeitsschwellenwert für die Textprüfung fest. Wird es nicht übergeben, beträgt der Standardwert dieses Feldes 0.7.

bool

Parameter für das Audioklonen. Gibt an, ob Rauschunterdrückung aktiviert werden soll. Wird der Parameter nicht übergeben, ist der Standardwert false.

bool

Parameter für das Audioklonen. Gibt an, ob Lautstärkenormalisierung aktiviert werden soll. Wird der Parameter nicht übergeben, ist der Standardwert false.

Antwortinformationen

string

Wenn im Anfragetext der Probehörtext text und das Probehörmodell model übergeben wurden, gibt dieser Parameter das Probehör-Audio als Link zurück.

string

Die generierte voice_id

MiniMax Speech 2.8 HD synchrone Sprachsynthese

Zurück

ElevenLabs Speech-to-Text V1

Weiter

API-Grundlagen

Große Sprachmodelle

Bilder

Video

Audio

MiniMax Audio-Schnellklonen

Anfrageheader

Anfragetext

Antwortinformationen

​Anfrageheader

​Anfragetext

​Antwortinformationen

Anfrageheader

Anfragetext

Antwortinformationen