@@ -34,20 +34,24 @@ func NewAudioService(opts ...option.RequestOption) (r AudioService) {
3434type AudioModel = string
3535
3636const (
37- AudioModelWhisper1 AudioModel = "whisper-1"
38- AudioModelGPT4oTranscribe AudioModel = "gpt-4o-transcribe"
39- AudioModelGPT4oMiniTranscribe AudioModel = "gpt-4o-mini-transcribe"
37+ AudioModelWhisper1 AudioModel = "whisper-1"
38+ AudioModelGPT4oTranscribe AudioModel = "gpt-4o-transcribe"
39+ AudioModelGPT4oMiniTranscribe AudioModel = "gpt-4o-mini-transcribe"
40+ AudioModelGPT4oTranscribeDiarize AudioModel = "gpt-4o-transcribe-diarize"
4041)
4142
4243// The format of the output, in one of these options: `json`, `text`, `srt`,
43- // `verbose_json`, or `vtt`. For `gpt-4o-transcribe` and `gpt-4o-mini-transcribe`,
44- // the only supported format is `json`.
44+ // `verbose_json`, `vtt`, or `diarized_json`. For `gpt-4o-transcribe` and
45+ // `gpt-4o-mini-transcribe`, the only supported format is `json`. For
46+ // `gpt-4o-transcribe-diarize`, the supported formats are `json`, `text`, and
47+ // `diarized_json`, with `diarized_json` required to receive speaker annotations.
4548type AudioResponseFormat string
4649
4750const (
48- AudioResponseFormatJSON AudioResponseFormat = "json"
49- AudioResponseFormatText AudioResponseFormat = "text"
50- AudioResponseFormatSRT AudioResponseFormat = "srt"
51- AudioResponseFormatVerboseJSON AudioResponseFormat = "verbose_json"
52- AudioResponseFormatVTT AudioResponseFormat = "vtt"
51+ AudioResponseFormatJSON AudioResponseFormat = "json"
52+ AudioResponseFormatText AudioResponseFormat = "text"
53+ AudioResponseFormatSRT AudioResponseFormat = "srt"
54+ AudioResponseFormatVerboseJSON AudioResponseFormat = "verbose_json"
55+ AudioResponseFormatVTT AudioResponseFormat = "vtt"
56+ AudioResponseFormatDiarizedJSON AudioResponseFormat = "diarized_json"
5357)
0 commit comments