openai 6.36.0 → 6.37.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +23 -0
- package/internal/utils/log.d.mts.map +1 -1
- package/internal/utils/log.d.ts.map +1 -1
- package/internal/utils/log.js +2 -0
- package/internal/utils/log.js.map +1 -1
- package/internal/utils/log.mjs +2 -0
- package/internal/utils/log.mjs.map +1 -1
- package/package.json +1 -1
- package/resources/admin/organization/usage.d.mts +45 -0
- package/resources/admin/organization/usage.d.mts.map +1 -1
- package/resources/admin/organization/usage.d.ts +45 -0
- package/resources/admin/organization/usage.d.ts.map +1 -1
- package/resources/chat/completions/completions.d.mts +4 -4
- package/resources/chat/completions/completions.d.mts.map +1 -1
- package/resources/chat/completions/completions.d.ts +4 -4
- package/resources/chat/completions/completions.d.ts.map +1 -1
- package/resources/images.d.mts +53 -24
- package/resources/images.d.mts.map +1 -1
- package/resources/images.d.ts +53 -24
- package/resources/images.d.ts.map +1 -1
- package/resources/realtime/calls.d.mts +10 -1
- package/resources/realtime/calls.d.mts.map +1 -1
- package/resources/realtime/calls.d.ts +10 -1
- package/resources/realtime/calls.d.ts.map +1 -1
- package/resources/realtime/client-secrets.d.mts +24 -37
- package/resources/realtime/client-secrets.d.mts.map +1 -1
- package/resources/realtime/client-secrets.d.ts +24 -37
- package/resources/realtime/client-secrets.d.ts.map +1 -1
- package/resources/realtime/index.d.mts +1 -1
- package/resources/realtime/index.d.mts.map +1 -1
- package/resources/realtime/index.d.ts +1 -1
- package/resources/realtime/index.d.ts.map +1 -1
- package/resources/realtime/index.js.map +1 -1
- package/resources/realtime/index.mjs.map +1 -1
- package/resources/realtime/realtime.d.mts +545 -10
- package/resources/realtime/realtime.d.mts.map +1 -1
- package/resources/realtime/realtime.d.ts +545 -10
- package/resources/realtime/realtime.d.ts.map +1 -1
- package/resources/realtime/realtime.js.map +1 -1
- package/resources/realtime/realtime.mjs.map +1 -1
- package/resources/responses/responses.d.mts +45 -11
- package/resources/responses/responses.d.mts.map +1 -1
- package/resources/responses/responses.d.ts +45 -11
- package/resources/responses/responses.d.ts.map +1 -1
- package/resources/responses/responses.js.map +1 -1
- package/resources/responses/responses.mjs.map +1 -1
- package/src/internal/utils/log.ts +2 -0
- package/src/resources/admin/organization/usage.ts +54 -0
- package/src/resources/chat/completions/completions.ts +4 -4
- package/src/resources/images.ts +60 -22
- package/src/resources/realtime/api.md +18 -1
- package/src/resources/realtime/calls.ts +12 -0
- package/src/resources/realtime/client-secrets.ts +25 -37
- package/src/resources/realtime/index.ts +0 -1
- package/src/resources/realtime/realtime.ts +647 -8
- package/src/resources/responses/responses.ts +53 -10
- package/src/version.ts +1 -1
- package/version.d.mts +1 -1
- package/version.d.ts +1 -1
- package/version.js +1 -1
- package/version.mjs +1 -1
package/src/resources/images.ts
CHANGED
|
@@ -400,7 +400,15 @@ export interface ImageGenPartialImageEvent {
|
|
|
400
400
|
*/
|
|
401
401
|
export type ImageGenStreamEvent = ImageGenPartialImageEvent | ImageGenCompletedEvent;
|
|
402
402
|
|
|
403
|
-
export type ImageModel =
|
|
403
|
+
export type ImageModel =
|
|
404
|
+
| 'gpt-image-1'
|
|
405
|
+
| 'gpt-image-1-mini'
|
|
406
|
+
| 'gpt-image-2'
|
|
407
|
+
| 'gpt-image-2-2026-04-21'
|
|
408
|
+
| 'gpt-image-1.5'
|
|
409
|
+
| 'chatgpt-image-latest'
|
|
410
|
+
| 'dall-e-2'
|
|
411
|
+
| 'dall-e-3';
|
|
404
412
|
|
|
405
413
|
/**
|
|
406
414
|
* The response from the image generation endpoint.
|
|
@@ -553,10 +561,10 @@ export interface ImageEditParamsBase {
|
|
|
553
561
|
/**
|
|
554
562
|
* The image(s) to edit. Must be a supported image file or an array of images.
|
|
555
563
|
*
|
|
556
|
-
* For the GPT image models (`gpt-image-1`, `gpt-image-1-mini`,
|
|
557
|
-
* `gpt-image-
|
|
558
|
-
* 50MB. You can provide up to
|
|
559
|
-
*
|
|
564
|
+
* For the GPT image models (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`,
|
|
565
|
+
* `gpt-image-2`, `gpt-image-2-2026-04-21`, and `chatgpt-image-latest`), each image
|
|
566
|
+
* should be a `png`, `webp`, or `jpg` file less than 50MB. You can provide up to
|
|
567
|
+
* 16 images.
|
|
560
568
|
*
|
|
561
569
|
* For `dall-e-2`, you can only provide one image, and it should be a square `png`
|
|
562
570
|
* file less than 4MB.
|
|
@@ -571,9 +579,14 @@ export interface ImageEditParamsBase {
|
|
|
571
579
|
|
|
572
580
|
/**
|
|
573
581
|
* Allows to set transparency for the background of the generated image(s). This
|
|
574
|
-
* parameter is only supported for
|
|
575
|
-
* `transparent`, `opaque
|
|
576
|
-
* model will automatically determine the best background
|
|
582
|
+
* parameter is only supported for GPT image models that support transparent
|
|
583
|
+
* backgrounds. Must be one of `transparent`, `opaque`, or `auto` (default value).
|
|
584
|
+
* When `auto` is used, the model will automatically determine the best background
|
|
585
|
+
* for the image.
|
|
586
|
+
*
|
|
587
|
+
* `gpt-image-2` and `gpt-image-2-2026-04-21` do not support transparent
|
|
588
|
+
* backgrounds. Requests with `background` set to `transparent` will return an
|
|
589
|
+
* error for these models; use `opaque` or `auto` instead.
|
|
577
590
|
*
|
|
578
591
|
* If `transparent`, the output format needs to support transparency, so it should
|
|
579
592
|
* be set to either `png` (default value) or `webp`.
|
|
@@ -597,7 +610,10 @@ export interface ImageEditParamsBase {
|
|
|
597
610
|
mask?: Uploadable;
|
|
598
611
|
|
|
599
612
|
/**
|
|
600
|
-
* The model to use for image generation.
|
|
613
|
+
* The model to use for image generation. One of `dall-e-2` or a GPT image model
|
|
614
|
+
* (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`, `gpt-image-2`,
|
|
615
|
+
* `gpt-image-2-2026-04-21`, or `chatgpt-image-latest`). Defaults to
|
|
616
|
+
* `gpt-image-1.5`.
|
|
601
617
|
*/
|
|
602
618
|
model?: (string & {}) | ImageModel | null;
|
|
603
619
|
|
|
@@ -645,11 +661,19 @@ export interface ImageEditParamsBase {
|
|
|
645
661
|
response_format?: 'url' | 'b64_json' | null;
|
|
646
662
|
|
|
647
663
|
/**
|
|
648
|
-
* The size of the generated images.
|
|
649
|
-
*
|
|
650
|
-
*
|
|
664
|
+
* The size of the generated images. For `gpt-image-2` and
|
|
665
|
+
* `gpt-image-2-2026-04-21`, arbitrary resolutions are supported as `WIDTHxHEIGHT`
|
|
666
|
+
* strings, for example `1536x864`. Width and height must both be divisible by 16
|
|
667
|
+
* and the requested aspect ratio must be between 1:3 and 3:1. Resolutions above
|
|
668
|
+
* `2560x1440` are experimental, and the maximum supported resolution is
|
|
669
|
+
* `3840x2160`. The requested size must also satisfy the model's current pixel and
|
|
670
|
+
* edge limits. The standard sizes `1024x1024`, `1536x1024`, and `1024x1536` are
|
|
671
|
+
* supported by the GPT image models; `auto` is supported for models that allow
|
|
672
|
+
* automatic sizing. For `dall-e-2`, use one of `256x256`, `512x512`, or
|
|
673
|
+
* `1024x1024`. For `dall-e-3`, use one of `1024x1024`, `1792x1024`, or
|
|
674
|
+
* `1024x1792`.
|
|
651
675
|
*/
|
|
652
|
-
size?: '256x256' | '512x512' | '1024x1024' | '1536x1024' | '1024x1536' | 'auto' | null;
|
|
676
|
+
size?: (string & {}) | '256x256' | '512x512' | '1024x1024' | '1536x1024' | '1024x1536' | 'auto' | null;
|
|
653
677
|
|
|
654
678
|
/**
|
|
655
679
|
* Edit the image in streaming mode. Defaults to `false`. See the
|
|
@@ -701,9 +725,14 @@ export interface ImageGenerateParamsBase {
|
|
|
701
725
|
|
|
702
726
|
/**
|
|
703
727
|
* Allows to set transparency for the background of the generated image(s). This
|
|
704
|
-
* parameter is only supported for
|
|
705
|
-
* `transparent`, `opaque
|
|
706
|
-
* model will automatically determine the best background
|
|
728
|
+
* parameter is only supported for GPT image models that support transparent
|
|
729
|
+
* backgrounds. Must be one of `transparent`, `opaque`, or `auto` (default value).
|
|
730
|
+
* When `auto` is used, the model will automatically determine the best background
|
|
731
|
+
* for the image.
|
|
732
|
+
*
|
|
733
|
+
* `gpt-image-2` and `gpt-image-2-2026-04-21` do not support transparent
|
|
734
|
+
* backgrounds. Requests with `background` set to `transparent` will return an
|
|
735
|
+
* error for these models; use `opaque` or `auto` instead.
|
|
707
736
|
*
|
|
708
737
|
* If `transparent`, the output format needs to support transparency, so it should
|
|
709
738
|
* be set to either `png` (default value) or `webp`.
|
|
@@ -712,8 +741,9 @@ export interface ImageGenerateParamsBase {
|
|
|
712
741
|
|
|
713
742
|
/**
|
|
714
743
|
* The model to use for image generation. One of `dall-e-2`, `dall-e-3`, or a GPT
|
|
715
|
-
* image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`
|
|
716
|
-
* `dall-e-2` unless a parameter specific
|
|
744
|
+
* image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`, `gpt-image-2`,
|
|
745
|
+
* or `gpt-image-2-2026-04-21`). Defaults to `dall-e-2` unless a parameter specific
|
|
746
|
+
* to the GPT image models is used.
|
|
717
747
|
*/
|
|
718
748
|
model?: (string & {}) | ImageModel | null;
|
|
719
749
|
|
|
@@ -773,12 +803,20 @@ export interface ImageGenerateParamsBase {
|
|
|
773
803
|
response_format?: 'url' | 'b64_json' | null;
|
|
774
804
|
|
|
775
805
|
/**
|
|
776
|
-
* The size of the generated images.
|
|
777
|
-
*
|
|
778
|
-
*
|
|
779
|
-
*
|
|
806
|
+
* The size of the generated images. For `gpt-image-2` and
|
|
807
|
+
* `gpt-image-2-2026-04-21`, arbitrary resolutions are supported as `WIDTHxHEIGHT`
|
|
808
|
+
* strings, for example `1536x864`. Width and height must both be divisible by 16
|
|
809
|
+
* and the requested aspect ratio must be between 1:3 and 3:1. Resolutions above
|
|
810
|
+
* `2560x1440` are experimental, and the maximum supported resolution is
|
|
811
|
+
* `3840x2160`. The requested size must also satisfy the model's current pixel and
|
|
812
|
+
* edge limits. The standard sizes `1024x1024`, `1536x1024`, and `1024x1536` are
|
|
813
|
+
* supported by the GPT image models; `auto` is supported for models that allow
|
|
814
|
+
* automatic sizing. For `dall-e-2`, use one of `256x256`, `512x512`, or
|
|
815
|
+
* `1024x1024`. For `dall-e-3`, use one of `1024x1024`, `1792x1024`, or
|
|
816
|
+
* `1024x1792`.
|
|
780
817
|
*/
|
|
781
818
|
size?:
|
|
819
|
+
| (string & {})
|
|
782
820
|
| 'auto'
|
|
783
821
|
| '1024x1024'
|
|
784
822
|
| '1536x1024'
|
package/src/resources/realtime/api.md
CHANGED
|
@@ -56,6 +56,8 @@ Types:
|
|
|
56
56
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeMcpToolCall</a></code>
|
|
57
57
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeMcpToolExecutionError</a></code>
|
|
58
58
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeMcphttpError</a></code>
|
|
59
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeReasoning</a></code>
|
|
60
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeReasoningEffort</a></code>
|
|
59
61
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeResponse</a></code>
|
|
60
62
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeResponseCreateAudioOutput</a></code>
|
|
61
63
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeResponseCreateMcpTool</a></code>
|
|
@@ -75,6 +77,22 @@ Types:
|
|
|
75
77
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranscriptionSessionAudioInput</a></code>
|
|
76
78
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranscriptionSessionAudioInputTurnDetection</a></code>
|
|
77
79
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranscriptionSessionCreateRequest</a></code>
|
|
80
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationClientEvent</a></code>
|
|
81
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationClientSecretCreateRequest</a></code>
|
|
82
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationClientSecretCreateResponse</a></code>
|
|
83
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationInputAudioBufferAppendEvent</a></code>
|
|
84
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationInputTranscriptDeltaEvent</a></code>
|
|
85
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationOutputAudioDeltaEvent</a></code>
|
|
86
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationOutputTranscriptDeltaEvent</a></code>
|
|
87
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationServerEvent</a></code>
|
|
88
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSession</a></code>
|
|
89
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionCloseEvent</a></code>
|
|
90
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionClosedEvent</a></code>
|
|
91
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionCreateRequest</a></code>
|
|
92
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionCreatedEvent</a></code>
|
|
93
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionUpdateEvent</a></code>
|
|
94
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionUpdateRequest</a></code>
|
|
95
|
+
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTranslationSessionUpdatedEvent</a></code>
|
|
78
96
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTruncation</a></code>
|
|
79
97
|
- <code><a href="./src/resources/realtime/realtime.ts">RealtimeTruncationRetentionRatio</a></code>
|
|
80
98
|
- <code><a href="./src/resources/realtime/realtime.ts">ResponseAudioDeltaEvent</a></code>
|
|
@@ -108,7 +126,6 @@ Types:
|
|
|
108
126
|
|
|
109
127
|
Types:
|
|
110
128
|
|
|
111
|
-
- <code><a href="./src/resources/realtime/client-secrets.ts">RealtimeSessionClientSecret</a></code>
|
|
112
129
|
- <code><a href="./src/resources/realtime/client-secrets.ts">RealtimeSessionCreateResponse</a></code>
|
|
113
130
|
- <code><a href="./src/resources/realtime/client-secrets.ts">RealtimeTranscriptionSessionCreateResponse</a></code>
|
|
114
131
|
- <code><a href="./src/resources/realtime/client-secrets.ts">RealtimeTranscriptionSessionTurnDetection</a></code>
|
package/src/resources/realtime/calls.ts
CHANGED
|
@@ -134,6 +134,7 @@ export interface CallAcceptParams {
|
|
|
134
134
|
| (string & {})
|
|
135
135
|
| 'gpt-realtime'
|
|
136
136
|
| 'gpt-realtime-1.5'
|
|
137
|
+
| 'gpt-realtime-2'
|
|
137
138
|
| 'gpt-realtime-2025-08-28'
|
|
138
139
|
| 'gpt-4o-realtime-preview'
|
|
139
140
|
| 'gpt-4o-realtime-preview-2024-10-01'
|
|
@@ -157,12 +158,23 @@ export interface CallAcceptParams {
|
|
|
157
158
|
*/
|
|
158
159
|
output_modalities?: Array<'text' | 'audio'>;
|
|
159
160
|
|
|
161
|
+
/**
|
|
162
|
+
* Whether the model may call multiple tools in parallel. Only supported by
|
|
163
|
+
* reasoning Realtime models such as `gpt-realtime-2`.
|
|
164
|
+
*/
|
|
165
|
+
parallel_tool_calls?: boolean;
|
|
166
|
+
|
|
160
167
|
/**
|
|
161
168
|
* Reference to a prompt template and its variables.
|
|
162
169
|
* [Learn more](https://platform.openai.com/docs/guides/text?api-mode=responses#reusable-prompts).
|
|
163
170
|
*/
|
|
164
171
|
prompt?: ResponsesAPI.ResponsePrompt | null;
|
|
165
172
|
|
|
173
|
+
/**
|
|
174
|
+
* Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
|
|
175
|
+
*/
|
|
176
|
+
reasoning?: RealtimeAPI.RealtimeReasoning;
|
|
177
|
+
|
|
166
178
|
/**
|
|
167
179
|
* How the model chooses tools. Provide one of the string modes or force a specific
|
|
168
180
|
* function/MCP tool.
|
package/src/resources/realtime/client-secrets.ts
CHANGED
|
@@ -41,32 +41,18 @@ export class ClientSecrets extends APIResource {
|
|
|
41
41
|
}
|
|
42
42
|
|
|
43
43
|
/**
|
|
44
|
-
*
|
|
44
|
+
* A Realtime session configuration object.
|
|
45
45
|
*/
|
|
46
|
-
export interface
|
|
47
|
-
/**
|
|
48
|
-
* Timestamp for when the token expires. Currently, all tokens expire after one
|
|
49
|
-
* minute.
|
|
50
|
-
*/
|
|
51
|
-
expires_at: number;
|
|
52
|
-
|
|
46
|
+
export interface RealtimeSessionCreateResponse {
|
|
53
47
|
/**
|
|
54
|
-
*
|
|
55
|
-
* Realtime API. Use this in client-side environments rather than a standard API
|
|
56
|
-
* token, which should only be used server-side.
|
|
48
|
+
* Unique identifier for the session that looks like `sess_1234567890abcdef`.
|
|
57
49
|
*/
|
|
58
|
-
|
|
59
|
-
}
|
|
50
|
+
id: string;
|
|
60
51
|
|
|
61
|
-
/**
|
|
62
|
-
* A new Realtime session configuration, with an ephemeral key. Default TTL for
|
|
63
|
-
* keys is one minute.
|
|
64
|
-
*/
|
|
65
|
-
export interface RealtimeSessionCreateResponse {
|
|
66
52
|
/**
|
|
67
|
-
*
|
|
53
|
+
* The object type. Always `realtime.session`.
|
|
68
54
|
*/
|
|
69
|
-
|
|
55
|
+
object: 'realtime.session';
|
|
70
56
|
|
|
71
57
|
/**
|
|
72
58
|
* The type of session to create. Always `realtime` for the Realtime API.
|
|
@@ -78,6 +64,11 @@ export interface RealtimeSessionCreateResponse {
|
|
|
78
64
|
*/
|
|
79
65
|
audio?: RealtimeSessionCreateResponse.Audio;
|
|
80
66
|
|
|
67
|
+
/**
|
|
68
|
+
* Expiration timestamp for the session, in seconds since epoch.
|
|
69
|
+
*/
|
|
70
|
+
expires_at?: number;
|
|
71
|
+
|
|
81
72
|
/**
|
|
82
73
|
* Additional fields to include in server outputs.
|
|
83
74
|
*
|
|
@@ -115,6 +106,7 @@ export interface RealtimeSessionCreateResponse {
|
|
|
115
106
|
| (string & {})
|
|
116
107
|
| 'gpt-realtime'
|
|
117
108
|
| 'gpt-realtime-1.5'
|
|
109
|
+
| 'gpt-realtime-2'
|
|
118
110
|
| 'gpt-realtime-2025-08-28'
|
|
119
111
|
| 'gpt-4o-realtime-preview'
|
|
120
112
|
| 'gpt-4o-realtime-preview-2024-10-01'
|
|
@@ -144,6 +136,11 @@ export interface RealtimeSessionCreateResponse {
|
|
|
144
136
|
*/
|
|
145
137
|
prompt?: ResponsesAPI.ResponsePrompt | null;
|
|
146
138
|
|
|
139
|
+
/**
|
|
140
|
+
* Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
|
|
141
|
+
*/
|
|
142
|
+
reasoning?: RealtimeAPI.RealtimeReasoning;
|
|
143
|
+
|
|
147
144
|
/**
|
|
148
145
|
* How the model chooses tools. Provide one of the string modes or force a specific
|
|
149
146
|
* function/MCP tool.
|
|
@@ -215,16 +212,6 @@ export namespace RealtimeSessionCreateResponse {
|
|
|
215
212
|
*/
|
|
216
213
|
noise_reduction?: Input.NoiseReduction;
|
|
217
214
|
|
|
218
|
-
/**
|
|
219
|
-
* Configuration for input audio transcription, defaults to off and can be set to
|
|
220
|
-
* `null` to turn off once on. Input audio transcription is not native to the
|
|
221
|
-
* model, since the model consumes audio directly. Transcription runs
|
|
222
|
-
* asynchronously through
|
|
223
|
-
* [the /audio/transcriptions endpoint](https://platform.openai.com/docs/api-reference/audio/createTranscription)
|
|
224
|
-
* and should be treated as guidance of input audio content rather than precisely
|
|
225
|
-
* what the model heard. The client can optionally set the language and prompt for
|
|
226
|
-
* transcription, these offer additional guidance to the transcription service.
|
|
227
|
-
*/
|
|
228
215
|
transcription?: RealtimeAPI.AudioTranscription;
|
|
229
216
|
|
|
230
217
|
/**
|
|
@@ -241,6 +228,9 @@ export namespace RealtimeSessionCreateResponse {
|
|
|
241
228
|
* trails off with "uhhm", the model will score a low probability of turn end and
|
|
242
229
|
* wait longer for the user to continue speaking. This can be useful for more
|
|
243
230
|
* natural conversations, but may have a higher latency.
|
|
231
|
+
*
|
|
232
|
+
* For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
|
|
233
|
+
* `null`; VAD is not supported.
|
|
244
234
|
*/
|
|
245
235
|
turn_detection?: Input.ServerVad | Input.SemanticVad | null;
|
|
246
236
|
}
|
|
@@ -640,17 +630,15 @@ export namespace RealtimeTranscriptionSessionCreateResponse {
|
|
|
640
630
|
*/
|
|
641
631
|
noise_reduction?: Input.NoiseReduction;
|
|
642
632
|
|
|
643
|
-
/**
|
|
644
|
-
* Configuration of the transcription model.
|
|
645
|
-
*/
|
|
646
633
|
transcription?: RealtimeAPI.AudioTranscription;
|
|
647
634
|
|
|
648
635
|
/**
|
|
649
636
|
* Configuration for turn detection. Can be set to `null` to turn off. Server VAD
|
|
650
637
|
* means that the model will detect the start and end of speech based on audio
|
|
651
|
-
* volume and respond at the end of user speech.
|
|
638
|
+
* volume and respond at the end of user speech. For `gpt-realtime-whisper`, this
|
|
639
|
+
* must be `null`; VAD is not supported.
|
|
652
640
|
*/
|
|
653
|
-
turn_detection?: ClientSecretsAPI.RealtimeTranscriptionSessionTurnDetection;
|
|
641
|
+
turn_detection?: ClientSecretsAPI.RealtimeTranscriptionSessionTurnDetection | null;
|
|
654
642
|
}
|
|
655
643
|
|
|
656
644
|
export namespace Input {
|
|
@@ -672,7 +660,8 @@ export namespace RealtimeTranscriptionSessionCreateResponse {
|
|
|
672
660
|
/**
|
|
673
661
|
* Configuration for turn detection. Can be set to `null` to turn off. Server VAD
|
|
674
662
|
* means that the model will detect the start and end of speech based on audio
|
|
675
|
-
* volume and respond at the end of user speech.
|
|
663
|
+
* volume and respond at the end of user speech. For `gpt-realtime-whisper`, this
|
|
664
|
+
* must be `null`; VAD is not supported.
|
|
676
665
|
*/
|
|
677
666
|
export interface RealtimeTranscriptionSessionTurnDetection {
|
|
678
667
|
/**
|
|
@@ -763,7 +752,6 @@ export namespace ClientSecretCreateParams {
|
|
|
763
752
|
|
|
764
753
|
export declare namespace ClientSecrets {
|
|
765
754
|
export {
|
|
766
|
-
type RealtimeSessionClientSecret as RealtimeSessionClientSecret,
|
|
767
755
|
type RealtimeSessionCreateResponse as RealtimeSessionCreateResponse,
|
|
768
756
|
type RealtimeTranscriptionSessionCreateResponse as RealtimeTranscriptionSessionCreateResponse,
|
|
769
757
|
type RealtimeTranscriptionSessionTurnDetection as RealtimeTranscriptionSessionTurnDetection,
|
package/src/resources/realtime/index.ts
CHANGED
|
@@ -3,7 +3,6 @@
|
|
|
3
3
|
export { Calls, type CallAcceptParams, type CallReferParams, type CallRejectParams } from './calls';
|
|
4
4
|
export {
|
|
5
5
|
ClientSecrets,
|
|
6
|
-
type RealtimeSessionClientSecret,
|
|
7
6
|
type RealtimeSessionCreateResponse,
|
|
8
7
|
type RealtimeTranscriptionSessionCreateResponse,
|
|
9
8
|
type RealtimeTranscriptionSessionTurnDetection,
|