@@ -10,11 +10,14 @@ import {
1010 TranscriptionCreateParamsNonStreaming ,
1111 TranscriptionCreateParamsStreaming ,
1212 TranscriptionCreateResponse ,
13+ TranscriptionDiarized ,
14+ TranscriptionDiarizedSegment ,
1315 TranscriptionInclude ,
1416 TranscriptionSegment ,
1517 TranscriptionStreamEvent ,
1618 TranscriptionTextDeltaEvent ,
1719 TranscriptionTextDoneEvent ,
20+ TranscriptionTextSegmentEvent ,
1821 TranscriptionVerbose ,
1922 TranscriptionWord ,
2023 Transcriptions ,
@@ -34,14 +37,20 @@ export class Audio extends APIResource {
3437 speech : SpeechAPI . Speech = new SpeechAPI . Speech ( this . _client ) ;
3538}
3639
// AudioModel: string-literal union of audio model identifiers.
// The removed line (37-) is the previous three-member union; the added lines
// (40+ through 44+) list the same members one per line and append
// 'gpt-4o-transcribe-diarize'.
37- export type AudioModel = 'whisper-1' | 'gpt-4o-transcribe' | 'gpt-4o-mini-transcribe' ;
40+ export type AudioModel =
41+ | 'whisper-1'
42+ | 'gpt-4o-transcribe'
43+ | 'gpt-4o-mini-transcribe'
44+ | 'gpt-4o-transcribe-diarize' ;
3845
// AudioResponseFormat: string-literal union of output format names.
// The removed (44-) and added (53+) declarations differ only in the new
// 'diarized_json' member; the doc comment is updated in the same change to
// describe the formats available for 'gpt-4o-transcribe-diarize'.
3946/**
4047 * The format of the output, in one of these options: `json`, `text`, `srt`,
41- * `verbose_json`, or `vtt`. For `gpt-4o-transcribe` and `gpt-4o-mini-transcribe`,
42- * the only supported format is `json`.
48+ * `verbose_json`, `vtt`, or `diarized_json`. For `gpt-4o-transcribe` and
49+ * `gpt-4o-mini-transcribe`, the only supported format is `json`. For
50+ * `gpt-4o-transcribe-diarize`, the supported formats are `json`, `text`, and
51+ * `diarized_json`, with `diarized_json` required to receive speaker annotations.
4352 */
44- export type AudioResponseFormat = 'json' | 'text' | 'srt' | 'verbose_json' | 'vtt' ;
53+ export type AudioResponseFormat = 'json' | 'text' | 'srt' | 'verbose_json' | 'vtt' | 'diarized_json' ;
4554
// Assign the Transcriptions and Translations bindings to same-named
// properties on Audio. These two lines are unchanged context in this diff.
4655Audio . Transcriptions = Transcriptions ;
4756Audio . Translations = Translations ;
@@ -53,11 +62,14 @@ export declare namespace Audio {
5362 export {
5463 Transcriptions as Transcriptions ,
5564 type Transcription as Transcription ,
65+ type TranscriptionDiarized as TranscriptionDiarized ,
66+ type TranscriptionDiarizedSegment as TranscriptionDiarizedSegment ,
5667 type TranscriptionInclude as TranscriptionInclude ,
5768 type TranscriptionSegment as TranscriptionSegment ,
5869 type TranscriptionStreamEvent as TranscriptionStreamEvent ,
5970 type TranscriptionTextDeltaEvent as TranscriptionTextDeltaEvent ,
6071 type TranscriptionTextDoneEvent as TranscriptionTextDoneEvent ,
72+ type TranscriptionTextSegmentEvent as TranscriptionTextSegmentEvent ,
6173 type TranscriptionVerbose as TranscriptionVerbose ,
6274 type TranscriptionWord as TranscriptionWord ,
6375 type TranscriptionCreateResponse as TranscriptionCreateResponse ,
0 commit comments