@@ -32,7 +32,9 @@ export interface Session {
3232 id ?: string ;
3333
3434 /**
35- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
35+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
36+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
37+ * (mono), and little-endian byte order.
3638 */
3739 input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
3840
@@ -86,6 +88,7 @@ export interface Session {
8688
8789 /**
8890 * The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
91+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
8992 */
9093 output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
9194
@@ -372,17 +375,9 @@ export namespace SessionCreateResponse {
372375
373376export interface SessionCreateParams {
374377 /**
375- * The Realtime model used for this session.
376- */
377- model :
378- | 'gpt-4o-realtime-preview'
379- | 'gpt-4o-realtime-preview-2024-10-01'
380- | 'gpt-4o-realtime-preview-2024-12-17'
381- | 'gpt-4o-mini-realtime-preview'
382- | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
383-
384- /**
385- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
378+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
379+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
380+ * (mono), and little-endian byte order.
386381 */
387382 input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
388383
@@ -423,8 +418,19 @@ export interface SessionCreateParams {
423418 */
424419 modalities ?: Array < 'text' | 'audio' > ;
425420
421+ /**
422+ * The Realtime model used for this session.
423+ */
424+ model ?:
425+ | 'gpt-4o-realtime-preview'
426+ | 'gpt-4o-realtime-preview-2024-10-01'
427+ | 'gpt-4o-realtime-preview-2024-12-17'
428+ | 'gpt-4o-mini-realtime-preview'
429+ | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
430+
426431 /**
427432 * The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
433+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
428434 */
429435 output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
430436
0 commit comments