@@ -54,14 +54,17 @@ def create(
54
54
"gpt-4o-realtime-preview" ,
55
55
"gpt-4o-realtime-preview-2024-10-01" ,
56
56
"gpt-4o-realtime-preview-2024-12-17" ,
57
+ "gpt-4o-realtime-preview-2025-06-03" ,
57
58
"gpt-4o-mini-realtime-preview" ,
58
59
"gpt-4o-mini-realtime-preview-2024-12-17" ,
59
60
]
60
61
| NotGiven = NOT_GIVEN ,
61
62
output_audio_format : Literal ["pcm16" , "g711_ulaw" , "g711_alaw" ] | NotGiven = NOT_GIVEN ,
63
+ speed : float | NotGiven = NOT_GIVEN ,
62
64
temperature : float | NotGiven = NOT_GIVEN ,
63
65
tool_choice : str | NotGiven = NOT_GIVEN ,
64
66
tools : Iterable [session_create_params .Tool ] | NotGiven = NOT_GIVEN ,
67
+ tracing : session_create_params .Tracing | NotGiven = NOT_GIVEN ,
65
68
turn_detection : session_create_params .TurnDetection | NotGiven = NOT_GIVEN ,
66
69
voice : Union [
67
70
str , Literal ["alloy" , "ash" , "ballad" , "coral" , "echo" , "fable" , "onyx" , "nova" , "sage" , "shimmer" , "verse" ]
@@ -129,6 +132,10 @@ def create(
129
132
output_audio_format: The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
130
133
For `pcm16`, output audio is sampled at a rate of 24kHz.
131
134
135
+ speed: The speed of the model's spoken response. 1.0 is the default speed. 0.25 is the
136
+ minimum speed. 1.5 is the maximum speed. This value can only be changed in
137
+ between model turns, not while a response is in progress.
138
+
132
139
temperature: Sampling temperature for the model, limited to [0.6, 1.2]. For audio models a
133
140
temperature of 0.8 is highly recommended for best performance.
134
141
@@ -137,6 +144,12 @@ def create(
137
144
138
145
tools: Tools (functions) available to the model.
139
146
147
+ tracing: Configuration options for tracing. Set to null to disable tracing. Once tracing
148
+ is enabled for a session, the configuration cannot be modified.
149
+
150
+ `auto` will create a trace for the session with default values for the workflow
151
+ name, group id, and metadata.
152
+
140
153
turn_detection: Configuration for turn detection, either Server VAD or Semantic VAD. This can be
141
154
set to `null` to turn off, in which case the client must manually trigger model
142
155
response. Server VAD means that the model will detect the start and end of
@@ -175,9 +188,11 @@ def create(
175
188
"modalities" : modalities ,
176
189
"model" : model ,
177
190
"output_audio_format" : output_audio_format ,
191
+ "speed" : speed ,
178
192
"temperature" : temperature ,
179
193
"tool_choice" : tool_choice ,
180
194
"tools" : tools ,
195
+ "tracing" : tracing ,
181
196
"turn_detection" : turn_detection ,
182
197
"voice" : voice ,
183
198
},
@@ -224,14 +239,17 @@ async def create(
224
239
"gpt-4o-realtime-preview" ,
225
240
"gpt-4o-realtime-preview-2024-10-01" ,
226
241
"gpt-4o-realtime-preview-2024-12-17" ,
242
+ "gpt-4o-realtime-preview-2025-06-03" ,
227
243
"gpt-4o-mini-realtime-preview" ,
228
244
"gpt-4o-mini-realtime-preview-2024-12-17" ,
229
245
]
230
246
| NotGiven = NOT_GIVEN ,
231
247
output_audio_format : Literal ["pcm16" , "g711_ulaw" , "g711_alaw" ] | NotGiven = NOT_GIVEN ,
248
+ speed : float | NotGiven = NOT_GIVEN ,
232
249
temperature : float | NotGiven = NOT_GIVEN ,
233
250
tool_choice : str | NotGiven = NOT_GIVEN ,
234
251
tools : Iterable [session_create_params .Tool ] | NotGiven = NOT_GIVEN ,
252
+ tracing : session_create_params .Tracing | NotGiven = NOT_GIVEN ,
235
253
turn_detection : session_create_params .TurnDetection | NotGiven = NOT_GIVEN ,
236
254
voice : Union [
237
255
str , Literal ["alloy" , "ash" , "ballad" , "coral" , "echo" , "fable" , "onyx" , "nova" , "sage" , "shimmer" , "verse" ]
@@ -299,6 +317,10 @@ async def create(
299
317
output_audio_format: The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
300
318
For `pcm16`, output audio is sampled at a rate of 24kHz.
301
319
320
+ speed: The speed of the model's spoken response. 1.0 is the default speed. 0.25 is the
321
+ minimum speed. 1.5 is the maximum speed. This value can only be changed in
322
+ between model turns, not while a response is in progress.
323
+
302
324
temperature: Sampling temperature for the model, limited to [0.6, 1.2]. For audio models a
303
325
temperature of 0.8 is highly recommended for best performance.
304
326
@@ -307,6 +329,12 @@ async def create(
307
329
308
330
tools: Tools (functions) available to the model.
309
331
332
+ tracing: Configuration options for tracing. Set to null to disable tracing. Once tracing
333
+ is enabled for a session, the configuration cannot be modified.
334
+
335
+ `auto` will create a trace for the session with default values for the workflow
336
+ name, group id, and metadata.
337
+
310
338
turn_detection: Configuration for turn detection, either Server VAD or Semantic VAD. This can be
311
339
set to `null` to turn off, in which case the client must manually trigger model
312
340
response. Server VAD means that the model will detect the start and end of
@@ -345,9 +373,11 @@ async def create(
345
373
"modalities" : modalities ,
346
374
"model" : model ,
347
375
"output_audio_format" : output_audio_format ,
376
+ "speed" : speed ,
348
377
"temperature" : temperature ,
349
378
"tool_choice" : tool_choice ,
350
379
"tools" : tools ,
380
+ "tracing" : tracing ,
351
381
"turn_detection" : turn_detection ,
352
382
"voice" : voice ,
353
383
},
0 commit comments