@@ -34,7 +34,9 @@ export interface Session {
3434 id ?: string ;
3535
3636 /**
37- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
37+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
38+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
39+ * (mono), and little-endian byte order.
3840 */
3941 input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
4042
@@ -88,6 +90,7 @@ export interface Session {
8890
8991 /**
9092 * The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
93+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
9194 */
9295 output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
9396
@@ -374,17 +377,9 @@ export namespace SessionCreateResponse {
374377
375378export interface SessionCreateParams {
376379 /**
377- * The Realtime model used for this session.
378- */
379- model :
380- | 'gpt-4o-realtime-preview'
381- | 'gpt-4o-realtime-preview-2024-10-01'
382- | 'gpt-4o-realtime-preview-2024-12-17'
383- | 'gpt-4o-mini-realtime-preview'
384- | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
385-
386- /**
387- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
380+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
381+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
382+ * (mono), and little-endian byte order.
388383 */
389384 input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
390385
@@ -425,8 +420,19 @@ export interface SessionCreateParams {
425420 */
426421 modalities ?: Array < 'text' | 'audio' > ;
427422
423+ /**
424+ * The Realtime model used for this session.
425+ */
426+ model ?:
427+ | 'gpt-4o-realtime-preview'
428+ | 'gpt-4o-realtime-preview-2024-10-01'
429+ | 'gpt-4o-realtime-preview-2024-12-17'
430+ | 'gpt-4o-mini-realtime-preview'
431+ | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
432+
428433 /**
429434 * The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
435+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
430436 */
431437 output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
432438
0 commit comments