@ai-sdk/openai 3.0.14 → 3.0.15
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +6 -0
- package/dist/index.js +1 -1
- package/dist/index.mjs +1 -1
- package/package.json +6 -5
- package/src/chat/__fixtures__/azure-model-router.1.chunks.txt +8 -0
- package/src/chat/__snapshots__/openai-chat-language-model.test.ts.snap +88 -0
- package/src/chat/convert-openai-chat-usage.ts +57 -0
- package/src/chat/convert-to-openai-chat-messages.test.ts +516 -0
- package/src/chat/convert-to-openai-chat-messages.ts +225 -0
- package/src/chat/get-response-metadata.ts +15 -0
- package/src/chat/map-openai-finish-reason.ts +19 -0
- package/src/chat/openai-chat-api.ts +198 -0
- package/src/chat/openai-chat-language-model.test.ts +3496 -0
- package/src/chat/openai-chat-language-model.ts +700 -0
- package/src/chat/openai-chat-options.ts +186 -0
- package/src/chat/openai-chat-prepare-tools.test.ts +322 -0
- package/src/chat/openai-chat-prepare-tools.ts +84 -0
- package/src/chat/openai-chat-prompt.ts +70 -0
- package/src/completion/convert-openai-completion-usage.ts +46 -0
- package/src/completion/convert-to-openai-completion-prompt.ts +93 -0
- package/src/completion/get-response-metadata.ts +15 -0
- package/src/completion/map-openai-finish-reason.ts +19 -0
- package/src/completion/openai-completion-api.ts +81 -0
- package/src/completion/openai-completion-language-model.test.ts +752 -0
- package/src/completion/openai-completion-language-model.ts +336 -0
- package/src/completion/openai-completion-options.ts +58 -0
- package/src/embedding/__snapshots__/openai-embedding-model.test.ts.snap +43 -0
- package/src/embedding/openai-embedding-api.ts +13 -0
- package/src/embedding/openai-embedding-model.test.ts +146 -0
- package/src/embedding/openai-embedding-model.ts +95 -0
- package/src/embedding/openai-embedding-options.ts +30 -0
- package/src/image/openai-image-api.ts +35 -0
- package/src/image/openai-image-model.test.ts +722 -0
- package/src/image/openai-image-model.ts +305 -0
- package/src/image/openai-image-options.ts +28 -0
- package/src/index.ts +9 -0
- package/src/internal/index.ts +19 -0
- package/src/openai-config.ts +18 -0
- package/src/openai-error.test.ts +34 -0
- package/src/openai-error.ts +22 -0
- package/src/openai-language-model-capabilities.test.ts +93 -0
- package/src/openai-language-model-capabilities.ts +54 -0
- package/src/openai-provider.test.ts +98 -0
- package/src/openai-provider.ts +270 -0
- package/src/openai-tools.ts +114 -0
- package/src/responses/__fixtures__/openai-apply-patch-tool-delete.1.chunks.txt +5 -0
- package/src/responses/__fixtures__/openai-apply-patch-tool.1.chunks.txt +38 -0
- package/src/responses/__fixtures__/openai-apply-patch-tool.1.json +69 -0
- package/src/responses/__fixtures__/openai-code-interpreter-tool.1.chunks.txt +393 -0
- package/src/responses/__fixtures__/openai-code-interpreter-tool.1.json +137 -0
- package/src/responses/__fixtures__/openai-error.1.chunks.txt +4 -0
- package/src/responses/__fixtures__/openai-error.1.json +8 -0
- package/src/responses/__fixtures__/openai-file-search-tool.1.chunks.txt +94 -0
- package/src/responses/__fixtures__/openai-file-search-tool.1.json +89 -0
- package/src/responses/__fixtures__/openai-file-search-tool.2.chunks.txt +93 -0
- package/src/responses/__fixtures__/openai-file-search-tool.2.json +112 -0
- package/src/responses/__fixtures__/openai-image-generation-tool.1.chunks.txt +16 -0
- package/src/responses/__fixtures__/openai-image-generation-tool.1.json +96 -0
- package/src/responses/__fixtures__/openai-local-shell-tool.1.chunks.txt +7 -0
- package/src/responses/__fixtures__/openai-local-shell-tool.1.json +70 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.1.chunks.txt +11 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.1.json +169 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.2.chunks.txt +123 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.2.json +176 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.3.chunks.txt +11 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.3.json +169 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.4.chunks.txt +84 -0
- package/src/responses/__fixtures__/openai-mcp-tool-approval.4.json +182 -0
- package/src/responses/__fixtures__/openai-mcp-tool.1.chunks.txt +373 -0
- package/src/responses/__fixtures__/openai-mcp-tool.1.json +159 -0
- package/src/responses/__fixtures__/openai-reasoning-encrypted-content.1.chunks.txt +110 -0
- package/src/responses/__fixtures__/openai-reasoning-encrypted-content.1.json +117 -0
- package/src/responses/__fixtures__/openai-shell-tool.1.chunks.txt +182 -0
- package/src/responses/__fixtures__/openai-shell-tool.1.json +73 -0
- package/src/responses/__fixtures__/openai-web-search-tool.1.chunks.txt +185 -0
- package/src/responses/__fixtures__/openai-web-search-tool.1.json +266 -0
- package/src/responses/__snapshots__/openai-responses-language-model.test.ts.snap +10955 -0
- package/src/responses/convert-openai-responses-usage.ts +53 -0
- package/src/responses/convert-to-openai-responses-input.test.ts +2976 -0
- package/src/responses/convert-to-openai-responses-input.ts +578 -0
- package/src/responses/map-openai-responses-finish-reason.ts +22 -0
- package/src/responses/openai-responses-api.test.ts +89 -0
- package/src/responses/openai-responses-api.ts +1086 -0
- package/src/responses/openai-responses-language-model.test.ts +6927 -0
- package/src/responses/openai-responses-language-model.ts +1932 -0
- package/src/responses/openai-responses-options.ts +312 -0
- package/src/responses/openai-responses-prepare-tools.test.ts +924 -0
- package/src/responses/openai-responses-prepare-tools.ts +264 -0
- package/src/responses/openai-responses-provider-metadata.ts +39 -0
- package/src/speech/openai-speech-api.ts +38 -0
- package/src/speech/openai-speech-model.test.ts +202 -0
- package/src/speech/openai-speech-model.ts +137 -0
- package/src/speech/openai-speech-options.ts +22 -0
- package/src/tool/apply-patch.ts +141 -0
- package/src/tool/code-interpreter.ts +104 -0
- package/src/tool/file-search.ts +145 -0
- package/src/tool/image-generation.ts +126 -0
- package/src/tool/local-shell.test-d.ts +20 -0
- package/src/tool/local-shell.ts +72 -0
- package/src/tool/mcp.ts +125 -0
- package/src/tool/shell.ts +85 -0
- package/src/tool/web-search-preview.ts +139 -0
- package/src/tool/web-search.test-d.ts +13 -0
- package/src/tool/web-search.ts +179 -0
- package/src/transcription/openai-transcription-api.ts +37 -0
- package/src/transcription/openai-transcription-model.test.ts +507 -0
- package/src/transcription/openai-transcription-model.ts +232 -0
- package/src/transcription/openai-transcription-options.ts +50 -0
- package/src/transcription/transcription-test.mp3 +0 -0
- package/src/version.ts +6 -0

package/src/completion/openai-completion-language-model.ts
@@ -0,0 +1,336 @@
import {
  LanguageModelV3,
  LanguageModelV3CallOptions,
  LanguageModelV3FinishReason,
  LanguageModelV3GenerateResult,
  LanguageModelV3StreamPart,
  LanguageModelV3StreamResult,
  SharedV3ProviderMetadata,
  SharedV3Warning,
} from '@ai-sdk/provider';
import {
  combineHeaders,
  createEventSourceResponseHandler,
  createJsonResponseHandler,
  FetchFunction,
  parseProviderOptions,
  ParseResult,
  postJsonToApi,
} from '@ai-sdk/provider-utils';
import { openaiFailedResponseHandler } from '../openai-error';
import {
  convertOpenAICompletionUsage,
  OpenAICompletionUsage,
} from './convert-openai-completion-usage';
import { convertToOpenAICompletionPrompt } from './convert-to-openai-completion-prompt';
import { getResponseMetadata } from './get-response-metadata';
import { mapOpenAIFinishReason } from './map-openai-finish-reason';
import {
  OpenAICompletionChunk,
  openaiCompletionChunkSchema,
  openaiCompletionResponseSchema,
} from './openai-completion-api';
import {
  OpenAICompletionModelId,
  openaiCompletionProviderOptions,
} from './openai-completion-options';

type OpenAICompletionConfig = {
  provider: string;
  headers: () => Record<string, string | undefined>;
  url: (options: { modelId: string; path: string }) => string;
  fetch?: FetchFunction;
};

export class OpenAICompletionLanguageModel implements LanguageModelV3 {
  readonly specificationVersion = 'v3';

  readonly modelId: OpenAICompletionModelId;

  private readonly config: OpenAICompletionConfig;

  private get providerOptionsName(): string {
    return this.config.provider.split('.')[0].trim();
  }

  constructor(
    modelId: OpenAICompletionModelId,
    config: OpenAICompletionConfig,
  ) {
    this.modelId = modelId;
    this.config = config;
  }

  get provider(): string {
    return this.config.provider;
  }

  readonly supportedUrls: Record<string, RegExp[]> = {
    // No URLs are supported for completion models.
  };

  private async getArgs({
    prompt,
    maxOutputTokens,
    temperature,
    topP,
    topK,
    frequencyPenalty,
    presencePenalty,
    stopSequences: userStopSequences,
    responseFormat,
    tools,
    toolChoice,
    seed,
    providerOptions,
  }: LanguageModelV3CallOptions) {
    const warnings: SharedV3Warning[] = [];

    // Parse provider options
    const openaiOptions = {
      ...(await parseProviderOptions({
        provider: 'openai',
        providerOptions,
        schema: openaiCompletionProviderOptions,
      })),
      ...(await parseProviderOptions({
        provider: this.providerOptionsName,
        providerOptions,
        schema: openaiCompletionProviderOptions,
      })),
    };

    if (topK != null) {
      warnings.push({ type: 'unsupported', feature: 'topK' });
    }

    if (tools?.length) {
      warnings.push({ type: 'unsupported', feature: 'tools' });
    }

    if (toolChoice != null) {
      warnings.push({ type: 'unsupported', feature: 'toolChoice' });
    }

    if (responseFormat != null && responseFormat.type !== 'text') {
      warnings.push({
        type: 'unsupported',
        feature: 'responseFormat',
        details: 'JSON response format is not supported.',
      });
    }

    const { prompt: completionPrompt, stopSequences } =
      convertToOpenAICompletionPrompt({ prompt });

    const stop = [...(stopSequences ?? []), ...(userStopSequences ?? [])];

    return {
      args: {
        // model id:
        model: this.modelId,

        // model specific settings:
        echo: openaiOptions.echo,
        logit_bias: openaiOptions.logitBias,
        logprobs:
          openaiOptions?.logprobs === true
            ? 0
            : openaiOptions?.logprobs === false
              ? undefined
              : openaiOptions?.logprobs,
        suffix: openaiOptions.suffix,
        user: openaiOptions.user,

        // standardized settings:
        max_tokens: maxOutputTokens,
        temperature,
        top_p: topP,
        frequency_penalty: frequencyPenalty,
        presence_penalty: presencePenalty,
        seed,

        // prompt:
        prompt: completionPrompt,

        // stop sequences:
        stop: stop.length > 0 ? stop : undefined,
      },
      warnings,
    };
  }

  async doGenerate(
    options: LanguageModelV3CallOptions,
  ): Promise<LanguageModelV3GenerateResult> {
    const { args, warnings } = await this.getArgs(options);

    const {
      responseHeaders,
      value: response,
      rawValue: rawResponse,
    } = await postJsonToApi({
      url: this.config.url({
        path: '/completions',
        modelId: this.modelId,
      }),
      headers: combineHeaders(this.config.headers(), options.headers),
      body: args,
      failedResponseHandler: openaiFailedResponseHandler,
      successfulResponseHandler: createJsonResponseHandler(
        openaiCompletionResponseSchema,
      ),
      abortSignal: options.abortSignal,
      fetch: this.config.fetch,
    });

    const choice = response.choices[0];

    const providerMetadata: SharedV3ProviderMetadata = { openai: {} };

    if (choice.logprobs != null) {
      providerMetadata.openai.logprobs = choice.logprobs;
    }

    return {
      content: [{ type: 'text', text: choice.text }],
      usage: convertOpenAICompletionUsage(response.usage),
      finishReason: {
        unified: mapOpenAIFinishReason(choice.finish_reason),
        raw: choice.finish_reason ?? undefined,
      },
      request: { body: args },
      response: {
        ...getResponseMetadata(response),
        headers: responseHeaders,
        body: rawResponse,
      },
      providerMetadata,
      warnings,
    };
  }

  async doStream(
    options: LanguageModelV3CallOptions,
  ): Promise<LanguageModelV3StreamResult> {
    const { args, warnings } = await this.getArgs(options);

    const body = {
      ...args,
      stream: true,

      stream_options: {
        include_usage: true,
      },
    };

    const { responseHeaders, value: response } = await postJsonToApi({
      url: this.config.url({
        path: '/completions',
        modelId: this.modelId,
      }),
      headers: combineHeaders(this.config.headers(), options.headers),
      body,
      failedResponseHandler: openaiFailedResponseHandler,
      successfulResponseHandler: createEventSourceResponseHandler(
        openaiCompletionChunkSchema,
      ),
      abortSignal: options.abortSignal,
      fetch: this.config.fetch,
    });

    let finishReason: LanguageModelV3FinishReason = {
      unified: 'other',
      raw: undefined,
    };
    const providerMetadata: SharedV3ProviderMetadata = { openai: {} };
    let usage: OpenAICompletionUsage | undefined = undefined;
    let isFirstChunk = true;

    return {
      stream: response.pipeThrough(
        new TransformStream<
          ParseResult<OpenAICompletionChunk>,
          LanguageModelV3StreamPart
        >({
          start(controller) {
            controller.enqueue({ type: 'stream-start', warnings });
          },

          transform(chunk, controller) {
            if (options.includeRawChunks) {
              controller.enqueue({ type: 'raw', rawValue: chunk.rawValue });
            }

            // handle failed chunk parsing / validation:
            if (!chunk.success) {
              finishReason = { unified: 'error', raw: undefined };
              controller.enqueue({ type: 'error', error: chunk.error });
              return;
            }

            const value = chunk.value;

            // handle error chunks:
            if ('error' in value) {
              finishReason = { unified: 'error', raw: undefined };
              controller.enqueue({ type: 'error', error: value.error });
              return;
            }

            if (isFirstChunk) {
              isFirstChunk = false;

              controller.enqueue({
                type: 'response-metadata',
                ...getResponseMetadata(value),
              });

              controller.enqueue({ type: 'text-start', id: '0' });
            }

            if (value.usage != null) {
              usage = value.usage;
            }

            const choice = value.choices[0];

            if (choice?.finish_reason != null) {
              finishReason = {
                unified: mapOpenAIFinishReason(choice.finish_reason),
                raw: choice.finish_reason,
              };
            }

            if (choice?.logprobs != null) {
              providerMetadata.openai.logprobs = choice.logprobs;
            }

            if (choice?.text != null && choice.text.length > 0) {
              controller.enqueue({
                type: 'text-delta',
                id: '0',
                delta: choice.text,
              });
            }
          },

          flush(controller) {
            if (!isFirstChunk) {
              controller.enqueue({ type: 'text-end', id: '0' });
            }

            controller.enqueue({
              type: 'finish',
              finishReason,
              providerMetadata,
              usage: convertOpenAICompletionUsage(usage),
            });
          },
        }),
      ),
      request: { body },
      response: { headers: responseHeaders },
    };
  }
}
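For orientation, here is a minimal usage sketch (not part of the published diff). It assumes OpenAICompletionLanguageModel is re-exported through the package's internal entry point (see package/src/internal/index.ts in the file list above); the entry-point path, base URL, and config values are illustrative assumptions.

// Hypothetical sketch, not part of this diff: constructing the model directly.
// Assumes the class is re-exported via the internal entry point.
import { OpenAICompletionLanguageModel } from '@ai-sdk/openai/internal';

const model = new OpenAICompletionLanguageModel('gpt-3.5-turbo-instruct', {
  provider: 'openai.completion', // providerOptionsName resolves to 'openai'
  headers: () => ({ Authorization: `Bearer ${process.env.OPENAI_API_KEY}` }),
  // the model passes path '/completions' when building the request URL:
  url: ({ path }) => `https://api.openai.com/v1${path}`,
});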

package/src/completion/openai-completion-options.ts
@@ -0,0 +1,58 @@
import { InferSchema, lazySchema, zodSchema } from '@ai-sdk/provider-utils';
import { z } from 'zod/v4';

// https://platform.openai.com/docs/models
export type OpenAICompletionModelId = 'gpt-3.5-turbo-instruct' | (string & {});

export const openaiCompletionProviderOptions = lazySchema(() =>
  zodSchema(
    z.object({
      /**
      Echo back the prompt in addition to the completion.
      */
      echo: z.boolean().optional(),

      /**
      Modify the likelihood of specified tokens appearing in the completion.

      Accepts a JSON object that maps tokens (specified by their token ID in
      the GPT tokenizer) to an associated bias value from -100 to 100. You
      can use this tokenizer tool to convert text to token IDs. Mathematically,
      the bias is added to the logits generated by the model prior to sampling.
      The exact effect will vary per model, but values between -1 and 1 should
      decrease or increase likelihood of selection; values like -100 or 100
      should result in a ban or exclusive selection of the relevant token.

      As an example, you can pass {"50256": -100} to prevent the <|endoftext|>
      token from being generated.
      */
      logitBias: z.record(z.string(), z.number()).optional(),

      /**
      The suffix that comes after a completion of inserted text.
      */
      suffix: z.string().optional(),

      /**
      A unique identifier representing your end-user, which can help OpenAI to
      monitor and detect abuse. Learn more.
      */
      user: z.string().optional(),

      /**
      Return the log probabilities of the tokens. Including logprobs will increase
      the response size and can slow down response times. However, it can
      be useful to better understand how the model is behaving.
      Setting to true will return the log probabilities of the tokens that
      were generated.
      Setting to a number will return the log probabilities of the top n
      tokens that were generated.
      */
      logprobs: z.union([z.boolean(), z.number()]).optional(),
    }),
  ),
);

export type OpenAICompletionProviderOptions = InferSchema<
  typeof openaiCompletionProviderOptions
>;
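As a sketch of how these options reach getArgs in the model above, a call through the AI SDK would nest them under the provider's options key. The generateText function and the openai.completion factory are assumed from the AI SDK's public API and are not shown in this diff.

// Hedged sketch: passing completion provider options through the AI SDK (assumed API).
import { generateText } from 'ai';
import { openai } from '@ai-sdk/openai';

const { text } = await generateText({
  model: openai.completion('gpt-3.5-turbo-instruct'),
  prompt: 'Write a haiku about the sea.',
  providerOptions: {
    openai: {
      logprobs: 3, // top-3 log probabilities per token
      user: 'user-1234',
      logitBias: { '50256': -100 }, // suppress <|endoftext|>
    },
  },
});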

package/src/embedding/__snapshots__/openai-embedding-model.test.ts.snap
@@ -0,0 +1,43 @@
// Vitest Snapshot v1, https://vitest.dev/guide/snapshot.html

exports[`doEmbed > should expose the raw response 1`] = `
{
  "body": {
    "data": [
      {
        "embedding": [
          0.1,
          0.2,
          0.3,
          0.4,
          0.5,
        ],
        "index": 0,
        "object": "embedding",
      },
      {
        "embedding": [
          0.6,
          0.7,
          0.8,
          0.9,
          1,
        ],
        "index": 1,
        "object": "embedding",
      },
    ],
    "model": "text-embedding-3-large",
    "object": "list",
    "usage": {
      "prompt_tokens": 8,
      "total_tokens": 8,
    },
  },
  "headers": {
    "content-length": "236",
    "content-type": "application/json",
    "test-header": "test-value",
  },
}
`;

package/src/embedding/openai-embedding-api.ts
@@ -0,0 +1,13 @@
import { lazySchema, zodSchema } from '@ai-sdk/provider-utils';
import { z } from 'zod/v4';

// minimal version of the schema, focussed on what is needed for the implementation
// this approach limits breakages when the API changes and increases efficiency
export const openaiTextEmbeddingResponseSchema = lazySchema(() =>
  zodSchema(
    z.object({
      data: z.array(z.object({ embedding: z.array(z.number()) })),
      usage: z.object({ prompt_tokens: z.number() }).nullish(),
    }),
  ),
);

package/src/embedding/openai-embedding-model.test.ts
@@ -0,0 +1,146 @@
import { EmbeddingModelV3Embedding } from '@ai-sdk/provider';
import { createTestServer } from '@ai-sdk/test-server/with-vitest';
import { createOpenAI } from '../openai-provider';
import { describe, it, expect, vi } from 'vitest';

vi.mock('../version', () => ({
  VERSION: '0.0.0-test',
}));

const dummyEmbeddings = [
  [0.1, 0.2, 0.3, 0.4, 0.5],
  [0.6, 0.7, 0.8, 0.9, 1.0],
];
const testValues = ['sunny day at the beach', 'rainy day in the city'];

const provider = createOpenAI({ apiKey: 'test-api-key' });
const model = provider.embedding('text-embedding-3-large');

const server = createTestServer({
  'https://api.openai.com/v1/embeddings': {},
});

describe('doEmbed', () => {
  function prepareJsonResponse({
    embeddings = dummyEmbeddings,
    usage = { prompt_tokens: 8, total_tokens: 8 },
    headers,
  }: {
    embeddings?: EmbeddingModelV3Embedding[];
    usage?: { prompt_tokens: number; total_tokens: number };
    headers?: Record<string, string>;
  } = {}) {
    server.urls['https://api.openai.com/v1/embeddings'].response = {
      type: 'json-value',
      headers,
      body: {
        object: 'list',
        data: embeddings.map((embedding, i) => ({
          object: 'embedding',
          index: i,
          embedding,
        })),
        model: 'text-embedding-3-large',
        usage,
      },
    };
  }

  it('should extract embedding', async () => {
    prepareJsonResponse();

    const { embeddings } = await model.doEmbed({ values: testValues });

    expect(embeddings).toStrictEqual(dummyEmbeddings);
  });

  it('should expose the raw response', async () => {
    prepareJsonResponse({
      headers: {
        'test-header': 'test-value',
      },
    });

    const { response } = await model.doEmbed({ values: testValues });

    expect(response?.headers).toStrictEqual({
      // default headers:
      'content-length': '236',
      'content-type': 'application/json',

      // custom header
      'test-header': 'test-value',
    });
    expect(response).toMatchSnapshot();
  });

  it('should extract usage', async () => {
    prepareJsonResponse({
      usage: { prompt_tokens: 20, total_tokens: 20 },
    });

    const { usage } = await model.doEmbed({ values: testValues });

    expect(usage).toStrictEqual({ tokens: 20 });
  });

  it('should pass the model and the values', async () => {
    prepareJsonResponse();

    await model.doEmbed({ values: testValues });

    expect(await server.calls[0].requestBodyJson).toStrictEqual({
      model: 'text-embedding-3-large',
      input: testValues,
      encoding_format: 'float',
    });
  });

  it('should pass the dimensions setting', async () => {
    prepareJsonResponse();

    await provider.embedding('text-embedding-3-large').doEmbed({
      values: testValues,
      providerOptions: { openai: { dimensions: 64 } },
    });

    expect(await server.calls[0].requestBodyJson).toStrictEqual({
      model: 'text-embedding-3-large',
      input: testValues,
      encoding_format: 'float',
      dimensions: 64,
    });
  });

  it('should pass headers', async () => {
    prepareJsonResponse();

    const provider = createOpenAI({
      apiKey: 'test-api-key',
      organization: 'test-organization',
      project: 'test-project',
      headers: {
        'Custom-Provider-Header': 'provider-header-value',
      },
    });

    await provider.embedding('text-embedding-3-large').doEmbed({
      values: testValues,
      headers: {
        'Custom-Request-Header': 'request-header-value',
      },
    });

    expect(server.calls[0].requestHeaders).toStrictEqual({
      authorization: 'Bearer test-api-key',
      'content-type': 'application/json',
      'custom-provider-header': 'provider-header-value',
      'custom-request-header': 'request-header-value',
      'openai-organization': 'test-organization',
      'openai-project': 'test-project',
    });
    expect(server.calls[0].requestUserAgent).toContain(
      `ai-sdk/openai/0.0.0-test`,
    );
  });
});

package/src/embedding/openai-embedding-model.ts
@@ -0,0 +1,95 @@
import {
  EmbeddingModelV3,
  TooManyEmbeddingValuesForCallError,
} from '@ai-sdk/provider';
import {
  combineHeaders,
  createJsonResponseHandler,
  parseProviderOptions,
  postJsonToApi,
} from '@ai-sdk/provider-utils';
import { OpenAIConfig } from '../openai-config';
import { openaiFailedResponseHandler } from '../openai-error';
import {
  OpenAIEmbeddingModelId,
  openaiEmbeddingProviderOptions,
} from './openai-embedding-options';
import { openaiTextEmbeddingResponseSchema } from './openai-embedding-api';

export class OpenAIEmbeddingModel implements EmbeddingModelV3 {
  readonly specificationVersion = 'v3';
  readonly modelId: OpenAIEmbeddingModelId;
  readonly maxEmbeddingsPerCall = 2048;
  readonly supportsParallelCalls = true;

  private readonly config: OpenAIConfig;

  get provider(): string {
    return this.config.provider;
  }

  constructor(modelId: OpenAIEmbeddingModelId, config: OpenAIConfig) {
    this.modelId = modelId;
    this.config = config;
  }

  async doEmbed({
    values,
    headers,
    abortSignal,
    providerOptions,
  }: Parameters<EmbeddingModelV3['doEmbed']>[0]): Promise<
    Awaited<ReturnType<EmbeddingModelV3['doEmbed']>>
  > {
    if (values.length > this.maxEmbeddingsPerCall) {
      throw new TooManyEmbeddingValuesForCallError({
        provider: this.provider,
        modelId: this.modelId,
        maxEmbeddingsPerCall: this.maxEmbeddingsPerCall,
        values,
      });
    }

    // Parse provider options
    const openaiOptions =
      (await parseProviderOptions({
        provider: 'openai',
        providerOptions,
        schema: openaiEmbeddingProviderOptions,
      })) ?? {};

    const {
      responseHeaders,
      value: response,
      rawValue,
    } = await postJsonToApi({
      url: this.config.url({
        path: '/embeddings',
        modelId: this.modelId,
      }),
      headers: combineHeaders(this.config.headers(), headers),
      body: {
        model: this.modelId,
        input: values,
        encoding_format: 'float',
        dimensions: openaiOptions.dimensions,
        user: openaiOptions.user,
      },
      failedResponseHandler: openaiFailedResponseHandler,
      successfulResponseHandler: createJsonResponseHandler(
        openaiTextEmbeddingResponseSchema,
      ),
      abortSignal,
      fetch: this.config.fetch,
    });

    return {
      warnings: [],
      embeddings: response.data.map(item => item.embedding),
      usage: response.usage
        ? { tokens: response.usage.prompt_tokens }
        : undefined,
      response: { headers: responseHeaders, body: rawValue },
    };
  }
}
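Drawing on the test file above, a minimal sketch of calling the embedding model directly; top-level await, the public import path, and the API key handling are assumptions, while the method names and option shapes come from the diff itself.

// Sketch mirroring the tests above: embed two values with reduced dimensions.
import { createOpenAI } from '@ai-sdk/openai';

const openai = createOpenAI({ apiKey: process.env.OPENAI_API_KEY! });

const { embeddings, usage } = await openai
  .embedding('text-embedding-3-large')
  .doEmbed({
    values: ['sunny day at the beach', 'rainy day in the city'],
    providerOptions: { openai: { dimensions: 64 } }, // forwarded as the dimensions body field
  });

console.log(embeddings.length, usage?.tokens);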