@@ -41,7 +41,7 @@ def create(
41
41
input : str ,
42
42
model : Union [str , Literal ["tts-1" , "tts-1-hd" ]],
43
43
voice : Literal ["alloy" , "echo" , "fable" , "onyx" , "nova" , "shimmer" ],
44
- response_format : Literal ["mp3" , "opus" , "aac" , "flac" ] | NotGiven = NOT_GIVEN ,
44
+ response_format : Literal ["mp3" , "opus" , "aac" , "flac" , "pcm" , "wav" ] | NotGiven = NOT_GIVEN ,
45
45
speed : float | NotGiven = NOT_GIVEN ,
46
46
# Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
47
47
# The extra values given here take precedence over values defined on the client or passed to this method.
@@ -65,7 +65,11 @@ def create(
65
65
available in the
66
66
[Text to speech guide](https://platform.openai.com/docs/guides/text-to-speech/voice-options).
67
67
68
- response_format: The format to audio in. Supported formats are `mp3`, `opus`, `aac`, and `flac`.
68
+ response_format: The format to return audio in. Supported formats are `mp3`, `opus`, `aac`,
69
+ `flac`, `pcm`, and `wav`.
70
+
71
+ The `pcm` audio format, similar to `wav` but without a header, utilizes a 24kHz
72
+ sample rate, mono channel, and 16-bit depth in signed little-endian format.
69
73
70
74
speed: The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
71
75
the default.
@@ -113,7 +117,7 @@ async def create(
113
117
input : str ,
114
118
model : Union [str , Literal ["tts-1" , "tts-1-hd" ]],
115
119
voice : Literal ["alloy" , "echo" , "fable" , "onyx" , "nova" , "shimmer" ],
116
- response_format : Literal ["mp3" , "opus" , "aac" , "flac" ] | NotGiven = NOT_GIVEN ,
120
+ response_format : Literal ["mp3" , "opus" , "aac" , "flac" , "pcm" , "wav" ] | NotGiven = NOT_GIVEN ,
117
121
speed : float | NotGiven = NOT_GIVEN ,
118
122
# Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
119
123
# The extra values given here take precedence over values defined on the client or passed to this method.
@@ -137,7 +141,11 @@ async def create(
137
141
available in the
138
142
[Text to speech guide](https://platform.openai.com/docs/guides/text-to-speech/voice-options).
139
143
140
- response_format: The format to audio in. Supported formats are `mp3`, `opus`, `aac`, and `flac`.
144
+ response_format: The format to return audio in. Supported formats are `mp3`, `opus`, `aac`,
145
+ `flac`, `pcm`, and `wav`.
146
+
147
+ The `pcm` audio format, similar to `wav` but without a header, utilizes a 24kHz
148
+ sample rate, mono channel, and 16-bit depth in signed little-endian format.
141
149
142
150
speed: The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
143
151
the default.
0 commit comments