@@ -54,14 +54,17 @@ def create(
5454 "gpt-4o-realtime-preview" ,
5555 "gpt-4o-realtime-preview-2024-10-01" ,
5656 "gpt-4o-realtime-preview-2024-12-17" ,
57+ "gpt-4o-realtime-preview-2025-06-03" ,
5758 "gpt-4o-mini-realtime-preview" ,
5859 "gpt-4o-mini-realtime-preview-2024-12-17" ,
5960 ]
6061 | NotGiven = NOT_GIVEN ,
6162 output_audio_format : Literal ["pcm16" , "g711_ulaw" , "g711_alaw" ] | NotGiven = NOT_GIVEN ,
63+ speed : float | NotGiven = NOT_GIVEN ,
6264 temperature : float | NotGiven = NOT_GIVEN ,
6365 tool_choice : str | NotGiven = NOT_GIVEN ,
6466 tools : Iterable [session_create_params .Tool ] | NotGiven = NOT_GIVEN ,
67+ tracing : session_create_params .Tracing | NotGiven = NOT_GIVEN ,
6568 turn_detection : session_create_params .TurnDetection | NotGiven = NOT_GIVEN ,
6669 voice : Union [
6770 str , Literal ["alloy" , "ash" , "ballad" , "coral" , "echo" , "fable" , "onyx" , "nova" , "sage" , "shimmer" , "verse" ]
@@ -129,6 +132,10 @@ def create(
129132 output_audio_format: The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
130133 For `pcm16`, output audio is sampled at a rate of 24kHz.
131134
135+ speed: The speed of the model's spoken response. 1.0 is the default speed. 0.25 is the
136+ minimum speed. 1.5 is the maximum speed. This value can only be changed in
137+ between model turns, not while a response is in progress.
138+
132139 temperature: Sampling temperature for the model, limited to [0.6, 1.2]. For audio models a
133140 temperature of 0.8 is highly recommended for best performance.
134141
@@ -137,6 +144,12 @@ def create(
137144
138145 tools: Tools (functions) available to the model.
139146
147+ tracing: Configuration options for tracing. Set to null to disable tracing. Once tracing
148+ is enabled for a session, the configuration cannot be modified.
149+
150+ `auto` will create a trace for the session with default values for the workflow
151+ name, group id, and metadata.
152+
140153 turn_detection: Configuration for turn detection, either Server VAD or Semantic VAD. This can be
141154 set to `null` to turn off, in which case the client must manually trigger model
142155 response. Server VAD means that the model will detect the start and end of
@@ -175,9 +188,11 @@ def create(
175188 "modalities" : modalities ,
176189 "model" : model ,
177190 "output_audio_format" : output_audio_format ,
191+ "speed" : speed ,
178192 "temperature" : temperature ,
179193 "tool_choice" : tool_choice ,
180194 "tools" : tools ,
195+ "tracing" : tracing ,
181196 "turn_detection" : turn_detection ,
182197 "voice" : voice ,
183198 },
@@ -224,14 +239,17 @@ async def create(
224239 "gpt-4o-realtime-preview" ,
225240 "gpt-4o-realtime-preview-2024-10-01" ,
226241 "gpt-4o-realtime-preview-2024-12-17" ,
242+ "gpt-4o-realtime-preview-2025-06-03" ,
227243 "gpt-4o-mini-realtime-preview" ,
228244 "gpt-4o-mini-realtime-preview-2024-12-17" ,
229245 ]
230246 | NotGiven = NOT_GIVEN ,
231247 output_audio_format : Literal ["pcm16" , "g711_ulaw" , "g711_alaw" ] | NotGiven = NOT_GIVEN ,
248+ speed : float | NotGiven = NOT_GIVEN ,
232249 temperature : float | NotGiven = NOT_GIVEN ,
233250 tool_choice : str | NotGiven = NOT_GIVEN ,
234251 tools : Iterable [session_create_params .Tool ] | NotGiven = NOT_GIVEN ,
252+ tracing : session_create_params .Tracing | NotGiven = NOT_GIVEN ,
235253 turn_detection : session_create_params .TurnDetection | NotGiven = NOT_GIVEN ,
236254 voice : Union [
237255 str , Literal ["alloy" , "ash" , "ballad" , "coral" , "echo" , "fable" , "onyx" , "nova" , "sage" , "shimmer" , "verse" ]
@@ -299,6 +317,10 @@ async def create(
299317 output_audio_format: The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
300318 For `pcm16`, output audio is sampled at a rate of 24kHz.
301319
320+ speed: The speed of the model's spoken response. 1.0 is the default speed. 0.25 is the
321+ minimum speed. 1.5 is the maximum speed. This value can only be changed in
322+ between model turns, not while a response is in progress.
323+
302324 temperature: Sampling temperature for the model, limited to [0.6, 1.2]. For audio models a
303325 temperature of 0.8 is highly recommended for best performance.
304326
@@ -307,6 +329,12 @@ async def create(
307329
308330 tools: Tools (functions) available to the model.
309331
332+ tracing: Configuration options for tracing. Set to null to disable tracing. Once tracing
333+ is enabled for a session, the configuration cannot be modified.
334+
335+ `auto` will create a trace for the session with default values for the workflow
336+ name, group id, and metadata.
337+
310338 turn_detection: Configuration for turn detection, either Server VAD or Semantic VAD. This can be
311339 set to `null` to turn off, in which case the client must manually trigger model
312340 response. Server VAD means that the model will detect the start and end of
@@ -345,9 +373,11 @@ async def create(
345373 "modalities" : modalities ,
346374 "model" : model ,
347375 "output_audio_format" : output_audio_format ,
376+ "speed" : speed ,
348377 "temperature" : temperature ,
349378 "tool_choice" : tool_choice ,
350379 "tools" : tools ,
380+ "tracing" : tracing ,
351381 "turn_detection" : turn_detection ,
352382 "voice" : voice ,
353383 },
0 commit comments