Audio Cloning API | Fish Audio

Fish Audio Audio Cloning

# Create a voice model: POST the placeholder JSON body to the v4beta model endpoint.
curl -X POST \
  -H 'Authorization: <authorization>' \
  -H 'Content-Type: <content-type>' \
  -d '
{
  "type": {},
  "title": "<string>",
  "train_mode": {},
  "voices": [
    null
  ],
  "visibility": {},
  "description": {},
  "cover_image": {},
  "texts": [
    "<string>"
  ],
  "tags": [
    "<string>"
  ],
  "enhance_audio_quality": true
}
' \
  https://api.highwayapi.ai/v4beta/model

import requests

# Endpoint that creates a voice model (voice cloning).
url = "https://api.highwayapi.ai/v4beta/model"

# Placeholder request body; replace every value with real data before sending.
payload = {
    "type": {},
    "title": "<string>",
    "train_mode": {},
    "voices": [None],
    "visibility": {},
    "description": {},
    "cover_image": {},
    "texts": ["<string>"],
    "tags": ["<string>"],
    "enhance_audio_quality": True
}
# Placeholder headers; both are marked as required by the API reference.
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# Without a timeout, requests waits indefinitely on a stalled connection.
# 30 seconds matches the CURLOPT_TIMEOUT used by the PHP sample.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body as text.
print(response.text)

// Placeholder headers; replace both values before sending.
const headers = {'Content-Type': '<content-type>', Authorization: '<authorization>'};

// Placeholder request body; replace every value with real data.
const payload = {
  type: {},
  title: '<string>',
  train_mode: {},
  voices: [null],
  visibility: {},
  description: {},
  cover_image: {},
  texts: ['<string>'],
  tags: ['<string>'],
  enhance_audio_quality: true
};

const options = {method: 'POST', headers, body: JSON.stringify(payload)};

// Send the request, parse the reply as JSON and log it; any failure
// (network error or invalid JSON) is reported through console.error.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v4beta/model', options);
    console.log(await res.json());
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Placeholder request body; json_encode() serializes it for the POST below.
$payload = [
  'type' => [],
  'title' => '<string>',
  'train_mode' => [],
  'voices' => [null],
  'visibility' => [],
  'description' => [],
  'cover_image' => [],
  'texts' => ['<string>'],
  'tags' => ['<string>'],
  'enhance_audio_quality' => true
];

// Placeholder request headers; replace both values before sending.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v4beta/model",
  // Return the response as a string instead of printing it directly.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => $headers,
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the transport error when there is one, otherwise the response body.
echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the example model-creation request and prints the raw response
// body to standard output.
//
// Each step that can fail is checked. In particular, when Do returns an error
// the response is nil, so the body must not be closed or read; the error is
// printed and main returns instead of panicking on a nil pointer.
func main() {
	url := "https://api.highwayapi.ai/v4beta/model"

	// Placeholder JSON body; replace every value with real data before sending.
	payload := strings.NewReader("{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		fmt.Println("sending request:", err)
		return
	}
	// Register the close only after the error check, once res is known to be non-nil.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// POST the placeholder JSON body to the model-creation endpoint with Unirest.
// Both headers carry placeholder values that must be replaced before sending.
// asString() yields the response with its body typed as a String.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v4beta/model")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint that creates a voice model.
endpoint = URI("https://api.highwayapi.ai/v4beta/model")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port).tap { |c| c.use_ssl = true }

# POST request carrying the placeholder headers and JSON body.
post = Net::HTTP::Post.new(endpoint)
post["Content-Type"] = '<content-type>'
post["Authorization"] = '<authorization>'
post.body = "{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}"

# Send the request and print the response body.
puts client.request(post).read_body

{
  "_id": "<string>",
  "type": {},
  "title": "<string>",
  "description": "<string>",
  "cover_image": "<string>",
  "state": {},
  "tags": [
    "<string>"
  ],
  "created_at": {},
  "updated_at": {},
  "visibility": {},
  "like_count": 123,
  "mark_count": 123,
  "shared_count": 123,
  "task_count": 123,
  "author": {
    "_id": "<string>",
    "nickname": "<string>",
    "avatar": "<string>"
  },
  "train_mode": {},
  "samples": [
    {
      "title": "<string>",
      "text": "<string>",
      "task_id": "<string>",
      "audio": "<string>"
    }
  ],
  "languages": [
    "<string>"
  ],
  "lock_visibility": true,
  "unliked": true,
  "liked": true,
  "marked": true
}

POST

v4beta

model

Fish Audio Audio Cloning

# Create a voice model: POST the placeholder JSON body to the v4beta model endpoint.
curl -X POST \
  -H 'Authorization: <authorization>' \
  -H 'Content-Type: <content-type>' \
  -d '
{
  "type": {},
  "title": "<string>",
  "train_mode": {},
  "voices": [
    null
  ],
  "visibility": {},
  "description": {},
  "cover_image": {},
  "texts": [
    "<string>"
  ],
  "tags": [
    "<string>"
  ],
  "enhance_audio_quality": true
}
' \
  https://api.highwayapi.ai/v4beta/model

import requests

# Endpoint that creates a voice model (voice cloning).
url = "https://api.highwayapi.ai/v4beta/model"

# Placeholder request body; replace every value with real data before sending.
payload = {
    "type": {},
    "title": "<string>",
    "train_mode": {},
    "voices": [None],
    "visibility": {},
    "description": {},
    "cover_image": {},
    "texts": ["<string>"],
    "tags": ["<string>"],
    "enhance_audio_quality": True
}
# Placeholder headers; both are marked as required by the API reference.
headers = {
    "Content-Type": "<content-type>",
    "Authorization": "<authorization>"
}

# Without a timeout, requests waits indefinitely on a stalled connection.
# 30 seconds matches the CURLOPT_TIMEOUT used by the PHP sample.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body as text.
print(response.text)

// Placeholder headers; replace both values before sending.
const headers = {'Content-Type': '<content-type>', Authorization: '<authorization>'};

// Placeholder request body; replace every value with real data.
const payload = {
  type: {},
  title: '<string>',
  train_mode: {},
  voices: [null],
  visibility: {},
  description: {},
  cover_image: {},
  texts: ['<string>'],
  tags: ['<string>'],
  enhance_audio_quality: true
};

const options = {method: 'POST', headers, body: JSON.stringify(payload)};

// Send the request, parse the reply as JSON and log it; any failure
// (network error or invalid JSON) is reported through console.error.
(async () => {
  try {
    const res = await fetch('https://api.highwayapi.ai/v4beta/model', options);
    console.log(await res.json());
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Placeholder request body; json_encode() serializes it for the POST below.
$payload = [
  'type' => [],
  'title' => '<string>',
  'train_mode' => [],
  'voices' => [null],
  'visibility' => [],
  'description' => [],
  'cover_image' => [],
  'texts' => ['<string>'],
  'tags' => ['<string>'],
  'enhance_audio_quality' => true
];

// Placeholder request headers; replace both values before sending.
$headers = [
  "Authorization: <authorization>",
  "Content-Type: <content-type>"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.highwayapi.ai/v4beta/model",
  // Return the response as a string instead of printing it directly.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => $headers,
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the transport error when there is one, otherwise the response body.
echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the example model-creation request and prints the raw response
// body to standard output.
//
// Each step that can fail is checked. In particular, when Do returns an error
// the response is nil, so the body must not be closed or read; the error is
// printed and main returns instead of panicking on a nil pointer.
func main() {
	url := "https://api.highwayapi.ai/v4beta/model"

	// Placeholder JSON body; replace every value with real data before sending.
	payload := strings.NewReader("{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Content-Type", "<content-type>")
	req.Header.Add("Authorization", "<authorization>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		fmt.Println("sending request:", err)
		return
	}
	// Register the close only after the error check, once res is known to be non-nil.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// POST the placeholder JSON body to the model-creation endpoint with Unirest.
// Both headers carry placeholder values that must be replaced before sending.
// asString() yields the response with its body typed as a String.
HttpResponse<String> response = Unirest.post("https://api.highwayapi.ai/v4beta/model")
  .header("Content-Type", "<content-type>")
  .header("Authorization", "<authorization>")
  .body("{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint that creates a voice model.
endpoint = URI("https://api.highwayapi.ai/v4beta/model")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port).tap { |c| c.use_ssl = true }

# POST request carrying the placeholder headers and JSON body.
post = Net::HTTP::Post.new(endpoint)
post["Content-Type"] = '<content-type>'
post["Authorization"] = '<authorization>'
post.body = "{\n  \"type\": {},\n  \"title\": \"<string>\",\n  \"train_mode\": {},\n  \"voices\": [\n    null\n  ],\n  \"visibility\": {},\n  \"description\": {},\n  \"cover_image\": {},\n  \"texts\": [\n    \"<string>\"\n  ],\n  \"tags\": [\n    \"<string>\"\n  ],\n  \"enhance_audio_quality\": true\n}"

# Send the request and print the response body.
puts client.request(post).read_body

{
  "_id": "<string>",
  "type": {},
  "title": "<string>",
  "description": "<string>",
  "cover_image": "<string>",
  "state": {},
  "tags": [
    "<string>"
  ],
  "created_at": {},
  "updated_at": {},
  "visibility": {},
  "like_count": 123,
  "mark_count": 123,
  "shared_count": 123,
  "task_count": 123,
  "author": {
    "_id": "<string>",
    "nickname": "<string>",
    "avatar": "<string>"
  },
  "train_mode": {},
  "samples": [
    {
      "title": "<string>",
      "text": "<string>",
      "task_id": "<string>",
      "audio": "<string>"
    }
  ],
  "languages": [
    "<string>"
  ],
  "lock_visibility": true,
  "unliked": true,
  "liked": true,
  "marked": true
}

The Fish Audio API is used to create voice models (voice cloning).

Request Headers

string

required

Enum value: application/json

string

required

Bearer authentication format: Bearer {{API Key}}.

Request Body

enum<string>

required

Model type. tts represents text-to-speech. Available value: tts. Allowed value: "tts".

string

required

The model title or name.

enum<string>

required

The model training mode. For TTS models, fast means the model is available immediately after creation. Available value: fast. Allowed value: "fast".

file[]

required

Upload voice files used to fine-tune the model.

enum<string>

default:"public"

Model visibility. public means the model is displayed on the discovery page, unlist allows anyone with the link to access it, and private makes it visible only to the creator. Available values: public, unlist, private.

string | null

Model description.

file | null

Model cover image. This is required if the model is public.

string[]

Text corresponding to the voices. If not specified, ASR (automatic speech recognition) will be performed on the voices.

string[]

Model tags.

boolean

default:false

Enhance audio quality.

Response Information

string

required

The unique identifier of the created model.

enum<string>

required

Model type. Available values: svc, tts.

string

required

The model title or name.

string

required

Model description.

string

required

The URL of the model cover image.

enum<string>

required

The current state of the model. Available values: created, training, trained, failed.

string[]

required

Model tags.

string<date-time>

required

The timestamp when the model was created.

string<date-time>

required

The timestamp when the model was last updated.

enum<string>

required

The model visibility setting. Available values: public, unlist, private.

integer

required

The number of likes the model has received.

integer

required

The number of favorites/bookmarks the model has received.

integer

required

The number of times the model has been shared.

integer

required

The number of tasks associated with the model.

AuthorEntity · object

required

Information about the model author.

Show properties

string

required

The unique identifier of the author.

string

required

The author’s nickname.

string

required

The URL of the author’s avatar image.

enum<string>

default:"full"

The training mode used by the model. Available values: fast, full.

SampleEntity · object[]

Sample data associated with the model.

Show properties

string

required

Sample title.

string

required

The text content of the sample.

string

required

The task identifier of the sample.

string

required

The URL of the sample audio file.

string[]

Languages supported by the model.

boolean

default:false

Whether the visibility setting is locked.

boolean

default:false

Whether the current user has unliked this model.

boolean

default:false

Whether the current user has liked this model.

boolean

default:false

Whether the current user has favorited/bookmarked this model.

Fish Audio Text-to-Speech

Gemini 2.5 Flash TTS Text-to-Speech

API Basics

Large Language Models

Images

Video

Audio

Fish Audio Audio Cloning

Request Headers

Request Body

Response Information

​Request Headers

​Request Body

​Response Information

Request Headers

Request Body

Response Information