Generate Speech

# Generate speech from text. A successful response body is the audio file
# itself, so it is written to a file with --output; curl will not print binary
# data to a terminal. Pick the file extension that matches response_format.
curl --request POST \
  --url https://{gatewayBaseURL}/audio/speech \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --output speech.mp3 \
  --data '
{
  "input": "<string>",
  "model": "<string>",
  "voice": "<string>",
  "instructions": "<string>",
  "response_format": "<string>",
  "speed": 123,
  "stream_format": "<string>"
}
'

import requests

# Generate speech from text via the gateway's /audio/speech endpoint.
# Replace {gatewayBaseURL} and <token> with real values before running.
url = "https://{gatewayBaseURL}/audio/speech"

payload = {
    "input": "<string>",
    "model": "<string>",
    "voice": "<string>",
    "instructions": "<string>",
    "response_format": "<string>",
    "speed": 123,
    "stream_format": "<string>"
}
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default; without one a stalled connection
# would block forever.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Fail loudly on 4xx/5xx instead of saving an error body as if it were audio.
response.raise_for_status()

# The successful response body is the audio file itself, so keep the raw bytes
# (response.content) rather than decoding them as text (response.text).
# Use the file extension that matches response_format.
with open("speech.mp3", "wb") as audio_file:
    audio_file.write(response.content)

// Request options for the text-to-speech call: a JSON body sent with a bearer token.
const options = {
  method: 'POST',
  headers: {Authorization: 'Bearer <token>', 'Content-Type': 'application/json'},
  body: JSON.stringify({
    input: '<string>',
    model: '<string>',
    voice: '<string>',
    instructions: '<string>',
    response_format: '<string>',
    speed: 123,
    stream_format: '<string>'
  })
};

fetch('https://{gatewayBaseURL}/audio/speech', options)
  .then(res => {
    // fetch only rejects on network failure, so HTTP errors must be checked explicitly.
    if (!res.ok) {
      throw new Error(`Request failed: ${res.status} ${res.statusText}`);
    }
    // The successful body is the audio file, not JSON; read it as raw bytes.
    return res.arrayBuffer();
  })
  .then(audio => console.log(`Received ${audio.byteLength} bytes of audio`))
  .catch(err => console.error(err));

<?php

// Sends a text-to-speech request to the /audio/speech endpoint and echoes
// either the raw response body or the cURL error message.

// JSON request body.
$requestBody = json_encode([
  'input' => '<string>',
  'model' => '<string>',
  'voice' => '<string>',
  'instructions' => '<string>',
  'response_format' => '<string>',
  'speed' => 123,
  'stream_format' => '<string>'
]);

// Bearer authentication plus the JSON content type.
$requestHeaders = [
  "Authorization: Bearer <token>",
  "Content-Type: application/json"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://{gatewayBaseURL}/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $requestBody,
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

// Capture both the body and any transfer error before releasing the handle.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a text-to-speech request to the gateway's /audio/speech endpoint
// and prints the response body to standard output.
//
// Replace {gatewayBaseURL} and <token> with real values before running.
func main() {
	url := "https://{gatewayBaseURL}/audio/speech"

	payload := strings.NewReader("{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		// req is nil when NewRequest fails (for example on an unparsable
		// URL), so it must not be dereferenced below.
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil on a transport error; deferring res.Body.Close()
		// before this check would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	// Surface HTTP-level failures; the body printed below then carries the
	// server's error details rather than audio.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))
}

// POSTs the JSON text-to-speech request to /audio/speech with bearer
// authentication and reads the response body as a String.
// NOTE(review): the endpoint is documented as returning audio file content;
// confirm that a String body is the right representation for your use.
HttpResponse<String> response = Unirest.post("https://{gatewayBaseURL}/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Text-to-speech request against the gateway's /audio/speech endpoint.
endpoint = URI("https://{gatewayBaseURL}/audio/speech")

# JSON request body, sent verbatim.
json_body = "{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}"

# Build the POST with its headers supplied up front.
post = Net::HTTP::Post.new(
  endpoint,
  "Authorization" => 'Bearer <token>',
  "Content-Type" => 'application/json'
)
post.body = json_body

# The endpoint is https, so TLS must be switched on explicitly.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

reply = client.request(post)
$stdout.puts reply.read_body

"<string>"

POST

audio

speech

Generate Speech

# Generate speech from text. A successful response body is the audio file
# itself, so it is written to a file with --output; curl will not print binary
# data to a terminal. Pick the file extension that matches response_format.
curl --request POST \
  --url https://{gatewayBaseURL}/audio/speech \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --output speech.mp3 \
  --data '
{
  "input": "<string>",
  "model": "<string>",
  "voice": "<string>",
  "instructions": "<string>",
  "response_format": "<string>",
  "speed": 123,
  "stream_format": "<string>"
}
'

import requests

# Generate speech from text via the gateway's /audio/speech endpoint.
# Replace {gatewayBaseURL} and <token> with real values before running.
url = "https://{gatewayBaseURL}/audio/speech"

payload = {
    "input": "<string>",
    "model": "<string>",
    "voice": "<string>",
    "instructions": "<string>",
    "response_format": "<string>",
    "speed": 123,
    "stream_format": "<string>"
}
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default; without one a stalled connection
# would block forever.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Fail loudly on 4xx/5xx instead of saving an error body as if it were audio.
response.raise_for_status()

# The successful response body is the audio file itself, so keep the raw bytes
# (response.content) rather than decoding them as text (response.text).
# Use the file extension that matches response_format.
with open("speech.mp3", "wb") as audio_file:
    audio_file.write(response.content)

// Request options for the text-to-speech call: a JSON body sent with a bearer token.
const options = {
  method: 'POST',
  headers: {Authorization: 'Bearer <token>', 'Content-Type': 'application/json'},
  body: JSON.stringify({
    input: '<string>',
    model: '<string>',
    voice: '<string>',
    instructions: '<string>',
    response_format: '<string>',
    speed: 123,
    stream_format: '<string>'
  })
};

fetch('https://{gatewayBaseURL}/audio/speech', options)
  .then(res => {
    // fetch only rejects on network failure, so HTTP errors must be checked explicitly.
    if (!res.ok) {
      throw new Error(`Request failed: ${res.status} ${res.statusText}`);
    }
    // The successful body is the audio file, not JSON; read it as raw bytes.
    return res.arrayBuffer();
  })
  .then(audio => console.log(`Received ${audio.byteLength} bytes of audio`))
  .catch(err => console.error(err));

<?php

// Sends a text-to-speech request to the /audio/speech endpoint and echoes
// either the raw response body or the cURL error message.

// JSON request body.
$requestBody = json_encode([
  'input' => '<string>',
  'model' => '<string>',
  'voice' => '<string>',
  'instructions' => '<string>',
  'response_format' => '<string>',
  'speed' => 123,
  'stream_format' => '<string>'
]);

// Bearer authentication plus the JSON content type.
$requestHeaders = [
  "Authorization: Bearer <token>",
  "Content-Type: application/json"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://{gatewayBaseURL}/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $requestBody,
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

// Capture both the body and any transfer error before releasing the handle.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a text-to-speech request to the gateway's /audio/speech endpoint
// and prints the response body to standard output.
//
// Replace {gatewayBaseURL} and <token> with real values before running.
func main() {
	url := "https://{gatewayBaseURL}/audio/speech"

	payload := strings.NewReader("{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		// req is nil when NewRequest fails (for example on an unparsable
		// URL), so it must not be dereferenced below.
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil on a transport error; deferring res.Body.Close()
		// before this check would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	// Surface HTTP-level failures; the body printed below then carries the
	// server's error details rather than audio.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))
}

// POSTs the JSON text-to-speech request to /audio/speech with bearer
// authentication and reads the response body as a String.
// NOTE(review): the endpoint is documented as returning audio file content;
// confirm that a String body is the right representation for your use.
HttpResponse<String> response = Unirest.post("https://{gatewayBaseURL}/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Text-to-speech request against the gateway's /audio/speech endpoint.
endpoint = URI("https://{gatewayBaseURL}/audio/speech")

# JSON request body, sent verbatim.
json_body = "{\n  \"input\": \"<string>\",\n  \"model\": \"<string>\",\n  \"voice\": \"<string>\",\n  \"instructions\": \"<string>\",\n  \"response_format\": \"<string>\",\n  \"speed\": 123,\n  \"stream_format\": \"<string>\"\n}"

# Build the POST with its headers supplied up front.
post = Net::HTTP::Post.new(
  endpoint,
  "Authorization" => 'Bearer <token>',
  "Content-Type" => 'application/json'
)
post.body = json_body

# The endpoint is https, so TLS must be switched on explicitly.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

reply = client.request(post)
$stdout.puts reply.read_body

"<string>"

Authorizations

Authorization

string

header

required

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

Headers

x-tfy-metadata

string

Optional metadata for the request

Body

application/json

Text to convert to speech and speech generation options

input

string

required

The text to generate audio for. The maximum length is 4096 characters.

model

string

required

The TTS model to use (e.g. tts-1, tts-1-hd, gpt-4o-mini-tts).

voice

The voice to use for single-speaker TTS. Can be a string (OpenAI format: alloy, ash, ballad, coral, echo, fable, onyx, nova, sage, shimmer, verse) or an object with name and languageCode (Vertex AI format).

instructions

string | null

Control the voice of your generated audio with additional instructions. Does not work with tts-1 or tts-1-hd.

response_format

string | null

The format of the generated audio. Supported formats are mp3, opus, aac, flac, wav, and pcm. Default: mp3.

speed

number | null

The speed of the generated audio. Select a value from 0.25 to 4.0. Default: 1.0.

stream_format

string | null

The format to stream the audio in. Supported formats are sse and audio. sse is not supported for tts-1 or tts-1-hd. Default: audio.

Response

Audio generated successfully

The audio file content

Translate Audio List Batches

⌘I

Get Started

LLM Gateway

MCP Registry and Gateway

Skills Registry

Prompt Registry

Guardrails and Security

Observability

Deployment

Admin Guide

Chat

Messages

Embeddings

Rerank

Responses

Image

Audio

Batch

Files

Fine-tuning

Moderations

Models

Generate Speech

Authorizations

Headers

Body

Response