오디오

음성 API (Beta)

Converts text to speech using various voice models and formats.

Voice cloning: Some TTS models (e.g. tts-chatterbox-hd) accept a cloned-voice handle in the voice field. Mint a handle by uploading a reference audio sample to POST /v1/audio/voices, then pass the returned vv_<id> value as voice here paired with the same model. Supported voice-cloning models advertise the voice_cloning capability on GET /models?type=tts.

Authentication: This endpoint accepts either a Bearer API key or a SIGN-IN-WITH-X header for x402 wallet-based authentication. The legacy X-Sign-In-With-X header is also accepted during migration. When using x402, a 402 Payment Required response indicates insufficient balance and includes top-up instructions.

POST

audio

speech

/api/v1/audio/speech

# Request speech from the xAI TTS model and save the returned audio file.
# Voices are model-specific, so the voice must be one of the xAI voices
# (eve, ara, rex, sal, leo); an incompatible voice is rejected with a 400.
# --output is required because the successful response is binary audio.
curl --request POST \
  --url https://api.venice.ai/api/v1/audio/speech \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --output speech.mp3 \
  --data '
{
  "input": "Hello, welcome to Venice Voice.",
  "model": "tts-xai-v1",
  "response_format": "mp3",
  "speed": 1,
  "streaming": false,
  "voice": "eve"
}
'

import requests

# Text-to-speech endpoint.
url = "https://api.venice.ai/api/v1/audio/speech"

# Voices are model-specific: "eve" is one of the xAI voices that
# "tts-xai-v1" accepts. An incompatible voice is rejected with a 400.
payload = {
    "input": "Hello, welcome to Venice Voice.",
    "model": "tts-xai-v1",
    "response_format": "mp3",
    "speed": 1,
    "streaming": False,
    "voice": "eve"
}
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

response = requests.post(url, json=payload, headers=headers)

if response.ok:
    # A successful response is the audio file itself, so keep the raw bytes
    # instead of decoding them as text.
    with open("speech.mp3", "wb") as audio_file:
        audio_file.write(response.content)
else:
    # Error responses carry a JSON body describing the problem.
    print(response.status_code, response.text)

// Request options for the text-to-speech call. Voices are model-specific:
// 'eve' is one of the xAI voices accepted by 'tts-xai-v1'.
const options = {
  method: 'POST',
  headers: {Authorization: 'Bearer <token>', 'Content-Type': 'application/json'},
  body: JSON.stringify({
    input: 'Hello, welcome to Venice Voice.',
    model: 'tts-xai-v1',
    response_format: 'mp3',
    speed: 1,
    streaming: false,
    voice: 'eve'
  })
};

fetch('https://api.venice.ai/api/v1/audio/speech', options)
  .then(async res => {
    // Error responses carry a JSON body; surface it instead of treating it as audio.
    if (!res.ok) {
      throw new Error(`Request failed with status ${res.status}: ${await res.text()}`);
    }
    // A successful response is a binary audio file, not JSON.
    return res.arrayBuffer();
  })
  .then(audio => console.log(`Received ${audio.byteLength} bytes of audio`))
  .catch(err => console.error(err));

<?php

// Sends a text-to-speech request and echoes the response body
// (the audio file on success, a JSON error document otherwise).

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.venice.ai/api/v1/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  // Voices are model-specific: 'eve' is one of the xAI voices accepted by
  // 'tts-xai-v1'. An incompatible voice is rejected with a 400.
  CURLOPT_POSTFIELDS => json_encode([
    'input' => 'Hello, welcome to Venice Voice.',
    'model' => 'tts-xai-v1',
    'response_format' => 'mp3',
    'speed' => 1,
    'streaming' => false,
    'voice' => 'eve'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// curl_error() returns an empty string when the transfer itself succeeded.
if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a text-to-speech request to the Venice audio API and prints the
// response body. Request-construction, transport, read, and HTTP-status
// failures are reported instead of being ignored.
func main() {

	url := "https://api.venice.ai/api/v1/audio/speech"

	// Voices are model-specific: "eve" is one of the xAI voices accepted by
	// "tts-xai-v1". An incompatible voice is rejected with a 400.
	payload := strings.NewReader("{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so touching res.Body here would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	if res.StatusCode != http.StatusOK {
		// Error responses carry a JSON body describing the problem.
		fmt.Printf("request failed with status %s: %s\n", res.Status, body)
		return
	}

	// On success the body is the raw audio in the requested format.
	fmt.Println(string(body))

}

// Sends a text-to-speech request. Voices are model-specific: "eve" is one of
// the xAI voices accepted by "tts-xai-v1"; an incompatible voice is rejected
// with a 400.
HttpResponse<String> response = Unirest.post("https://api.venice.ai/api/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Sends a text-to-speech request and prints the response body.
url = URI("https://api.venice.ai/api/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Authorization"] = 'Bearer <token>'
request["Content-Type"] = 'application/json'
# Voices are model-specific: "eve" is one of the xAI voices accepted by
# "tts-xai-v1". An incompatible voice is rejected with a 400.
request.body = "{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}"

response = http.request(request)
puts response.read_body

"<string>"

{
  "error": "<string>",
  "details": {
    "_errors": [],
    "field": {
      "_errors": [
        "Field is required"
      ]
    }
  }
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

인증

Authorization

string

header

필수

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

본문

application/json

Request to generate audio from text.

input

string

필수

The text to generate audio for. The maximum length is 4096 characters.

Required string length: 1 - 4096

예시:

"Hello, this is a test of the text to speech system."

language

string

Optional language hint. Accepted values are model-specific: Qwen 3 accepts full names (English, Chinese, ...); xAI/ElevenLabs accept ISO 639-1 codes (en, ja, ...); MiniMax accepts full names. Unsupported values are silently ignored. Omit to let the model auto-detect.

Required string length: 2 - 32

예시:

"English"

model

enum<string>

기본값:tts-kokoro

The model ID of a Venice TTS model.

사용 가능한 옵션:

tts-kokoro,

tts-qwen3-0-6b,

tts-qwen3-1-7b,

tts-xai-v1,

tts-inworld-1-5-max,

tts-chatterbox-hd,

tts-orpheus,

tts-elevenlabs-turbo-v2-5,

tts-minimax-speech-02-hd,

tts-gemini-3-1-flash,

tts-gradium-v1

예시:

"tts-xai-v1"

prompt

string

A style prompt to control the emotion and delivery of the speech. Supported by models advertising supportsPromptParam (currently Qwen 3 TTS). Ignored by other models. Examples: "Very happy.", "Sad and slow.", "Excited and energetic."

Maximum string length: 500

예시:

"Very happy."

response_format

enum<string>

기본값:mp3

The format of the generated audio.

사용 가능한 옵션:

mp3,

opus,

aac,

flac,

wav,

pcm

예시:

"mp3"

speed

number

기본값:1

The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.

필수 범위: 0.25 <= x <= 4

예시:

1

streaming

boolean

기본값:false

Whether to stream the audio back sentence by sentence (true) or to process the whole input and return it as a complete audio file (false).

예시:

true

temperature

number

Sampling temperature for speech generation. Higher values produce more varied output. Supported by models advertising supportsTemperatureParam (Qwen 3, Orpheus, Chatterbox HD). Ignored by other models.

필수 범위: 0 <= x <= 2

예시:

0.9

top_p

number

Nucleus sampling parameter. Supported by models advertising supportsTopPParam (currently Qwen 3 TTS). Ignored by other models.

필수 범위: 0 <= x <= 1

예시:

1

voice

기본값:af_sky

The voice to use when generating the audio. Voices are model-specific: Kokoro (e.g. af_sky, af_bella, am_adam), Qwen 3 (e.g. Vivian, Serena, Dylan), xAI (eve, ara, rex, sal, leo), Orpheus (tara, leah, jess, leo, dan, mia, zac, zoe), Inworld (Craig, Ashley, ...), Chatterbox (Aurora, Blade, ...), ElevenLabs Turbo (Rachel, Aria, ...), MiniMax (WiseWoman, DeepVoiceMan, ...), Gradium (Emma, Kent, Mia, Maximilian, Valentina, Sergio, Elise, Leo, Alice, Davi — spanning en/de/es/fr/pt). You can also pass a cloned-voice handle (vv_<id>) returned by POST /v1/audio/voices to synthesize in a previously cloned voice; the handle must be paired with the same model used to create it. Using an incompatible voice returns a 400 error. Call GET /models/{id} to list voices for a specific model.

사용 가능한 옵션:

af_alloy,

af_aoede,

af_bella,

af_heart,

af_jadzia,

af_jessica,

af_kore,

af_nicole,

af_nova,

af_river,

af_sarah,

af_sky,

am_adam,

am_echo,

am_eric,

am_fenrir,

am_liam,

am_michael,

am_onyx,

am_puck,

am_santa,

bf_alice,

bf_emma,

bf_lily,

bm_daniel,

bm_fable,

bm_george,

bm_lewis,

zf_xiaobei,

zf_xiaoni,

zf_xiaoxiao,

zf_xiaoyi,

zm_yunjian,

zm_yunxi,

zm_yunxia,

zm_yunyang,

ff_siwis,

hf_alpha,

hf_beta,

hm_omega,

hm_psi,

if_sara,

im_nicola,

jf_alpha,

jf_gongitsune,

jf_nezumi,

jf_tebukuro,

jm_kumo,

pf_dora,

pm_alex,

pm_santa,

ef_dora,

em_alex,

em_santa,

Vivian,

Serena,

Ono_Anna,

Sohee,

Uncle_Fu,

Dylan,

Eric,

Ryan,

Aiden,

eve,

ara,

rex,

sal,

leo,

Craig,

Ashley,

Olivia,

Sarah,

Elizabeth,

Priya,

Alex,

Edward,

Theodore,

Ronald,

Mark,

Hades,

Luna,

Pixie,

Aurora,

Britney,

Siobhan,

Vicky,

Blade,

Carl,

Cliff,

Richard,

Rico,

tara,

leah,

jess,

mia,

zoe,

dan,

zac,

Rachel,

Aria,

Laura,

Charlotte,

Alice,

Matilda,

Jessica,

Lily,

Roger,

Charlie,

George,

Callum,

River,

Liam,

Will,

Chris,

Brian,

Daniel,

Bill,

WiseWoman,

FriendlyPerson,

InspirationalGirl,

CalmWoman,

LivelyGirl,

LovelyGirl,

SweetGirl,

ExuberantGirl,

DeepVoiceMan,

CasualGuy,

PatientMan,

YoungKnight,

DeterminedMan,

ImposingManner,

ElegantMan,

Achernar,

Achird,

Algenib,

Algieba,

Alnilam,

Aoede,

Autonoe,

Callirrhoe,

Charon,

Despina,

Enceladus,

Erinome,

Fenrir,

Gacrux,

Iapetus,

Kore,

Laomedeia,

Leda,

Orus,

Pulcherrima,

Puck,

Rasalgethi,

Sadachbia,

Sadaltager,

Schedar,

Sulafat,

Umbriel,

Vindemiatrix,

Zephyr,

Zubenelgenubi,

Emma,

Kent,

Eva,

Jack,

Mia,

Maximilian,

Valentina,

Sergio,

Elise,

Leo,

Davi

예시:

"af_sky"

응답

Audio content generated successfully

The response is of type file.

이미지 생성 (OpenAI 호환 API)

전사 API (Beta)

⌘I

/api/v1/audio/speech

# Request speech from the xAI TTS model and save the returned audio file.
# Voices are model-specific, so the voice must be one of the xAI voices
# (eve, ara, rex, sal, leo); an incompatible voice is rejected with a 400.
# --output is required because the successful response is binary audio.
curl --request POST \
  --url https://api.venice.ai/api/v1/audio/speech \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --output speech.mp3 \
  --data '
{
  "input": "Hello, welcome to Venice Voice.",
  "model": "tts-xai-v1",
  "response_format": "mp3",
  "speed": 1,
  "streaming": false,
  "voice": "eve"
}
'

import requests

# Text-to-speech endpoint.
url = "https://api.venice.ai/api/v1/audio/speech"

# Voices are model-specific: "eve" is one of the xAI voices that
# "tts-xai-v1" accepts. An incompatible voice is rejected with a 400.
payload = {
    "input": "Hello, welcome to Venice Voice.",
    "model": "tts-xai-v1",
    "response_format": "mp3",
    "speed": 1,
    "streaming": False,
    "voice": "eve"
}
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

response = requests.post(url, json=payload, headers=headers)

if response.ok:
    # A successful response is the audio file itself, so keep the raw bytes
    # instead of decoding them as text.
    with open("speech.mp3", "wb") as audio_file:
        audio_file.write(response.content)
else:
    # Error responses carry a JSON body describing the problem.
    print(response.status_code, response.text)

// Request options for the text-to-speech call. Voices are model-specific:
// 'eve' is one of the xAI voices accepted by 'tts-xai-v1'.
const options = {
  method: 'POST',
  headers: {Authorization: 'Bearer <token>', 'Content-Type': 'application/json'},
  body: JSON.stringify({
    input: 'Hello, welcome to Venice Voice.',
    model: 'tts-xai-v1',
    response_format: 'mp3',
    speed: 1,
    streaming: false,
    voice: 'eve'
  })
};

fetch('https://api.venice.ai/api/v1/audio/speech', options)
  .then(async res => {
    // Error responses carry a JSON body; surface it instead of treating it as audio.
    if (!res.ok) {
      throw new Error(`Request failed with status ${res.status}: ${await res.text()}`);
    }
    // A successful response is a binary audio file, not JSON.
    return res.arrayBuffer();
  })
  .then(audio => console.log(`Received ${audio.byteLength} bytes of audio`))
  .catch(err => console.error(err));

<?php

// Sends a text-to-speech request and echoes the response body
// (the audio file on success, a JSON error document otherwise).

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.venice.ai/api/v1/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  // Voices are model-specific: 'eve' is one of the xAI voices accepted by
  // 'tts-xai-v1'. An incompatible voice is rejected with a 400.
  CURLOPT_POSTFIELDS => json_encode([
    'input' => 'Hello, welcome to Venice Voice.',
    'model' => 'tts-xai-v1',
    'response_format' => 'mp3',
    'speed' => 1,
    'streaming' => false,
    'voice' => 'eve'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// curl_error() returns an empty string when the transfer itself succeeded.
if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a text-to-speech request to the Venice audio API and prints the
// response body. Request-construction, transport, read, and HTTP-status
// failures are reported instead of being ignored.
func main() {

	url := "https://api.venice.ai/api/v1/audio/speech"

	// Voices are model-specific: "eve" is one of the xAI voices accepted by
	// "tts-xai-v1". An incompatible voice is rejected with a 400.
	payload := strings.NewReader("{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so touching res.Body here would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	if res.StatusCode != http.StatusOK {
		// Error responses carry a JSON body describing the problem.
		fmt.Printf("request failed with status %s: %s\n", res.Status, body)
		return
	}

	// On success the body is the raw audio in the requested format.
	fmt.Println(string(body))

}

// Sends a text-to-speech request. Voices are model-specific: "eve" is one of
// the xAI voices accepted by "tts-xai-v1"; an incompatible voice is rejected
// with a 400.
HttpResponse<String> response = Unirest.post("https://api.venice.ai/api/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Sends a text-to-speech request and prints the response body.
url = URI("https://api.venice.ai/api/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
request["Authorization"] = 'Bearer <token>'
request["Content-Type"] = 'application/json'
# Voices are model-specific: "eve" is one of the xAI voices accepted by
# "tts-xai-v1". An incompatible voice is rejected with a 400.
request.body = "{\n  \"input\": \"Hello, welcome to Venice Voice.\",\n  \"model\": \"tts-xai-v1\",\n  \"response_format\": \"mp3\",\n  \"speed\": 1,\n  \"streaming\": false,\n  \"voice\": \"eve\"\n}"

response = http.request(request)
puts response.read_body

"<string>"

{
  "error": "<string>",
  "details": {
    "_errors": [],
    "field": {
      "_errors": [
        "Field is required"
      ]
    }
  }
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}

{
  "error": "<string>"
}