API de Clonagem de Voz | Clonagem rápida de áudio MiniMax

Clonagem rápida de áudio MiniMax

# Send the voice-cloning request as an HTTP POST with a JSON body.
# Every <...> value is a placeholder that must be replaced before running.
curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

# JSON request body; every value below is a placeholder to replace.
payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# requests applies no timeout by default, so an unresponsive server would
# block this call forever. Cap the wait at 30 seconds.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body as text.
print(response.text)

// Request body, serialized once up front; every value is a placeholder.
const payload = JSON.stringify({
  audio_url: '<string>',
  text: '<string>',
  model: '<string>',
  accuracy: 123,
  need_noise_reduction: true,
  need_volume_normalization: true
});

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: payload
};

// Send the request, parse the reply as JSON and log it.
// Any failure along the way is logged with console.error.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// JSON request body; every value is a placeholder to replace.
$payload = json_encode([
  'audio_url' => '<string>',
  'text' => '<string>',
  'model' => '<string>',
  'accuracy' => 123,
  'need_noise_reduction' => true,
  'need_volume_normalization' => true
]);

// Request headers, also placeholders.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => $headers,
]);

// Run the transfer and capture both the response and any cURL error text.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error if there was one; otherwise print the raw response.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main posts the sample voice-cloning request and prints the raw response
// body to standard output.
//
// Every step that can fail is checked. On failure the error is printed and
// main returns without touching the response.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	// JSON request body; every value is a placeholder to replace.
	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so res.Body must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	fmt.Println(string(body))

}

// Build the POST with Unirest's fluent API: set the two request headers,
// attach the JSON body (all values are placeholders), and read the response
// body as a String.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

endpoint = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

# Build the POST with both headers and the JSON body (placeholder values).
post = Net::HTTP::Post.new(endpoint)
post["Content-Type"] = '<content-type>'
post["Authorization"] = '<authorization>'
post.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

# Connect over TLS, send the request, and print the response body.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true
puts client.request(post).read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

POST

minimax-voice-cloning

Clonagem rápida de áudio MiniMax

# Send the voice-cloning request as an HTTP POST with a JSON body.
# Every <...> value is a placeholder that must be replaced before running.
curl --request POST \
  --url https://api.highwayapi.ai/v3/minimax-voice-cloning \
  --header 'Authorization: <authorization>' \
  --header 'Content-Type: <content-type>' \
  --data '
{
  "audio_url": "<string>",
  "text": "<string>",
  "model": "<string>",
  "accuracy": 123,
  "need_noise_reduction": true,
  "need_volume_normalization": true
}
'

import requests

url = "https://api.highwayapi.ai/v3/minimax-voice-cloning"

# JSON request body; every value below is a placeholder to replace.
payload = {
    "audio_url": "<string>",
    "text": "<string>",
    "model": "<string>",
    "accuracy": 123,
    "need_noise_reduction": True,
    "need_volume_normalization": True
}
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# requests applies no timeout by default, so an unresponsive server would
# block this call forever. Cap the wait at 30 seconds.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body as text.
print(response.text)

// Request body, serialized once up front; every value is a placeholder.
const payload = JSON.stringify({
  audio_url: '<string>',
  text: '<string>',
  model: '<string>',
  accuracy: 123,
  need_noise_reduction: true,
  need_volume_normalization: true
});

const options = {
  method: 'POST',
  headers: {'Content-Type': '<content-type>', Authorization: '<authorization>'},
  body: payload
};

// Send the request, parse the reply as JSON and log it.
// Any failure along the way is logged with console.error.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v3/minimax-voice-cloning', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// JSON request body; every value is a placeholder to replace.
$payload = json_encode([
  'audio_url' => '<string>',
  'text' => '<string>',
  'model' => '<string>',
  'accuracy' => 123,
  'need_noise_reduction' => true,
  'need_volume_normalization' => true
]);

// Request headers, also placeholders.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v3/minimax-voice-cloning",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => $headers,
]);

// Run the transfer and capture both the response and any cURL error text.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error if there was one; otherwise print the raw response.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main posts the sample voice-cloning request and prints the raw response
// body to standard output.
//
// Every step that can fail is checked. On failure the error is printed and
// main returns without touching the response.
func main() {

	url := "https://api.highwayapi.ai/v3/minimax-voice-cloning"

	// JSON request body; every value is a placeholder to replace.
	payload := strings.NewReader("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so res.Body must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	fmt.Println(string(body))

}

// Build the POST with Unirest's fluent API: set the two request headers,
// attach the JSON body (all values are placeholders), and read the response
// body as a String.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v3/minimax-voice-cloning")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}")
  .asString();

require 'uri'
require 'net/http'

endpoint = URI("https://api.highwayapi.ai/v3/minimax-voice-cloning")

# Build the POST with both headers and the JSON body (placeholder values).
post = Net::HTTP::Post.new(endpoint)
post["Content-Type"] = '<content-type>'
post["Authorization"] = '<authorization>'
post.body = "{\n  \"audio_url\": \"<string>\",\n  \"text\": \"<string>\",\n  \"model\": \"<string>\",\n  \"accuracy\": 123,\n  \"need_noise_reduction\": true,\n  \"need_volume_normalization\": true\n}"

# Connect over TLS, send the request, and print the response body.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true
puts client.request(post).read_body

{
  "demo_audio_url": "<string>",
  "voice_id": "<string>"
}

Esta interface oferece suporte à clonagem de voz em canal único e canal duplo, permitindo clonar rapidamente uma voz com o mesmo timbre a partir de um arquivo de áudio especificado. O timbre gerado pela clonagem rápida nesta interface é temporário. Se você deseja manter permanentemente um determinado timbre clonado, chame esse timbre em qualquer interface de síntese de voz T2A dentro de 168 horas (7 dias) (não inclui a ação de audição de teste nesta interface); caso contrário, esse timbre será excluído. Cenários aplicáveis desta interface: clonagem de IP, clonagem de timbre e outros cenários relacionados que exigem a clonagem rápida de um determinado timbre. Observações:

O formato do arquivo de áudio enviado deve ser: mp3, m4a ou wav;
A duração do arquivo de áudio enviado deve ser de no mínimo 10 segundos e no máximo 5 minutos;
O tamanho do arquivo de áudio enviado não deve exceder 20 MB.

Cabeçalhos da solicitação

string

obrigatório

Valor enumerado: application/json

string

obrigatório

Formato de autenticação Bearer: Bearer {{API Key}}.

Corpo da solicitação

string

obrigatório

URL do arquivo de áudio cujo timbre precisa ser clonado. Suporta os formatos mp3, m4a e wav.

Parâmetro de clonagem de timbre. Fornecer este parâmetro ajudará a aumentar a similaridade e a estabilidade do timbre na síntese de voz. Se usar este parâmetro, é necessário enviar simultaneamente um pequeno trecho de áudio de exemplo (duração inferior a 8s) e o texto correspondente ao áudio. O áudio suporta os formatos mp3, m4a e wav.

Mostrar propriedades

number

obrigatório

Parâmetro de prompt de áudio: URL do áudio de exemplo, cuja duração deve ser inferior a 8s.

string

obrigatório

Parâmetro de prompt de áudio: preencha com o texto correspondente ao áudio de exemplo. Certifique-se de que ele seja consistente com o conteúdo do áudio e que a frase termine com pontuação.

string

Parâmetro de audição de teste da clonagem. O modelo usará o timbre clonado para ler o conteúdo deste texto e retornará o resultado da síntese de áudio em forma de link, para audição do efeito da clonagem. Limite de até 2000 caracteres. Observação: a audição de teste será cobrada normalmente pela síntese de voz de acordo com o número de caracteres, com a mesma precificação das interfaces T2A.

string

Parâmetro de audição de teste da clonagem. Especifica o modelo de voz usado na audição de teste; este campo é obrigatório ao enviar o campo “text”.
Opções: speech-2.8-hd, speech-2.8-turbo

float

Parâmetro de clonagem de áudio. Intervalo de valores: [0,1]. Enviar este campo definirá o limite de precisão da verificação de texto; se não for enviado, o valor padrão deste campo será 0.7.

bool

Parâmetro de clonagem de áudio. Indica se a redução de ruído deve ser ativada. Se não for enviado, o valor padrão será false.

bool

Parâmetro de clonagem de áudio. Indica se a normalização de volume deve ser ativada. Se não for enviado, o valor padrão será false.

Informações de resposta

string

Se o texto de audição de teste text e o modelo de audição de teste model forem enviados no corpo da solicitação, este parâmetro retornará o áudio de audição de teste em forma de link.

string

O voice_id gerado

Síntese de voz síncrona MiniMax Speech 2.8 HD

ElevenLabs Speech-to-Text V1

Noções básicas da API

Modelos de linguagem

Imagens

Vídeo

Áudio

Clonagem rápida de áudio MiniMax

Cabeçalhos da solicitação

Corpo da solicitação

Informações de resposta

​Cabeçalhos da solicitação

​Corpo da solicitação

​Informações de resposta

Cabeçalhos da solicitação

Corpo da solicitação

Informações de resposta