Skip to content

Commit a5f005b

Browse files
committed
Use the correct object key: `output_modalities` instead of `modalities`.
See https://platform.openai.com/docs/api-reference/realtime-beta-sessions/session_object
1 parent 4361aa6 commit a5f005b

File tree

2 files changed

+7
-4
lines changed

2 files changed

+7
-4
lines changed

plugins/openai/src/realtime/api_proto.ts

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -190,7 +190,7 @@ export interface SessionResource {
190 190   id: string;
191 191   object: 'realtime.session';
192 192   model: string;
193     - modalities: ['text', 'audio'] | ['text']; // default: ["text", "audio"]
    193 + output_modalities: ['text', 'audio'] | ['text'] | ['audio']; // default: ["text", "audio"]
194 194   instructions: string;
195 195   voice: Voice; // default: "alloy"
196 196   input_audio_format: AudioFormat; // default: "pcm16"
@@ -267,7 +267,7 @@ export interface SessionUpdateEvent extends BaseClientEvent {
267 267   type: 'session.update';
268 268   session: Partial<{
269 269   model: Model;
270     - modalities: ['text', 'audio'] | ['text'];
    270 + output_modalities: ['text', 'audio'] | ['text'] | ['audio'];
271 271   instructions: string;
272 272   voice: Voice;
273 273   input_audio_format: AudioFormat;
@@ -350,7 +350,7 @@ export interface ConversationItemDeleteEvent extends BaseClientEvent {
350 350   export interface ResponseCreateEvent extends BaseClientEvent {
351 351   type: 'response.create';
352 352   response?: Partial<{
353     - modalities: ['text', 'audio'] | ['text'];
    353 + output_modalities: ['text', 'audio'] | ['text'] | ['audio'];
354 354   instructions: string;
355 355   voice: Voice;
356 356   output_audio_format: AudioFormat;

plugins/openai/src/realtime/realtime_model.ts

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -406,7 +406,10 @@ export class RealtimeSession extends llm.RealtimeSession {
406 406   voice: this.oaiRealtimeModel._options.voice,
407 407   input_audio_format: 'pcm16',
408 408   output_audio_format: 'pcm16',
409     - modalities: this.oaiRealtimeModel._options.modalities as ['text', 'audio'] | ['text'],
    409 + output_modalities: this.oaiRealtimeModel._options.modalities as
    410 + | ['text', 'audio']
    411 + | ['text']
    412 + | ['audio'],
410 413   turn_detection: this.oaiRealtimeModel._options.turnDetection,
411 414   input_audio_transcription: this.oaiRealtimeModel._options.inputAudioTranscription,
412 415   // TODO(shubhra): add inputAudioNoiseReduction

0 commit comments

Comments
 (0)