/**
 * Parameters for generating audio from input text.
 */
interface SpeechCreateParams {
    /** The text to generate audio for. The maximum length is 4096 characters. */
    input: string;

    /**
     * Additional instructions that control the voice of the generated audio.
     * Does not work with `tts-1` or `tts-1-hd`.
     */
    instructions?: string;

    /**
     * One of the available TTS models: `tts-1`, `tts-1-hd` or `gpt-4o-mini-tts`.
     * The `string & {}` arm means any other string is also accepted by the type.
     */
    model: (string & {}) | OpenAIClient.Audio.Speech.SpeechModel;

    /**
     * The format of the generated audio.
     * Supported formats are mp3, opus, aac, flac, wav, and pcm.
     */
    response_format?: "wav" | "mp3" | "flac" | "opus" | "aac" | "pcm";

    /**
     * The speed of the generated audio. Select a value from 0.25 to 4.0.
     * 1.0 is the default.
     */
    speed?: number;

    /**
     * The voice to use when generating the audio. The listed literals are the
     * supported voices; the `string & {}` arm means any other string is also
     * accepted by the type.
     */
    voice:
        | (string & {})
        | "alloy" | "ash" | "ballad" | "coral"
        | "echo" | "fable" | "onyx" | "nova"
        | "sage" | "shimmer" | "verse";
}

Properties

input: string

The text to generate audio for. The maximum length is 4096 characters.

instructions?: string

Control the voice of your generated audio with additional instructions. Does not work with tts-1 or tts-1-hd.

model: string & {} | OpenAIClient.Audio.Speech.SpeechModel

One of the available TTS models: tts-1, tts-1-hd or gpt-4o-mini-tts.

response_format?:
    | "wav"
    | "mp3"
    | "flac"
    | "opus"
    | "aac"
    | "pcm"

The format of the generated audio. Supported formats are mp3, opus, aac, flac, wav, and pcm.

speed?: number

The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.

voice:
    | string & {}
    | "alloy"
    | "ash"
    | "ballad"
    | "coral"
    | "echo"
    | "fable"
    | "onyx"
    | "nova"
    | "sage"
    | "shimmer"
    | "verse"

The voice to use when generating the audio. Supported voices are alloy, ash, ballad, coral, echo, fable, onyx, nova, sage, shimmer, and verse. Previews of the voices are available in the Text to speech guide.