@ai-sdk/gateway 0.0.0-70e0935a-20260114150030 → 0.0.0-98261322-20260122142521
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +49 -4
- package/dist/index.d.mts +20 -10
- package/dist/index.d.ts +20 -10
- package/dist/index.js +62 -25
- package/dist/index.js.map +1 -1
- package/dist/index.mjs +62 -25
- package/dist/index.mjs.map +1 -1
- package/docs/00-ai-gateway.mdx +625 -0
- package/package.json +12 -5
- package/src/errors/as-gateway-error.ts +33 -0
- package/src/errors/create-gateway-error.test.ts +590 -0
- package/src/errors/create-gateway-error.ts +132 -0
- package/src/errors/extract-api-call-response.test.ts +270 -0
- package/src/errors/extract-api-call-response.ts +15 -0
- package/src/errors/gateway-authentication-error.ts +84 -0
- package/src/errors/gateway-error-types.test.ts +278 -0
- package/src/errors/gateway-error.ts +47 -0
- package/src/errors/gateway-internal-server-error.ts +33 -0
- package/src/errors/gateway-invalid-request-error.ts +33 -0
- package/src/errors/gateway-model-not-found-error.ts +47 -0
- package/src/errors/gateway-rate-limit-error.ts +33 -0
- package/src/errors/gateway-response-error.ts +42 -0
- package/src/errors/index.ts +16 -0
- package/src/errors/parse-auth-method.test.ts +136 -0
- package/src/errors/parse-auth-method.ts +23 -0
- package/src/gateway-config.ts +7 -0
- package/src/gateway-embedding-model-settings.ts +22 -0
- package/src/gateway-embedding-model.test.ts +213 -0
- package/src/gateway-embedding-model.ts +109 -0
- package/src/gateway-fetch-metadata.test.ts +774 -0
- package/src/gateway-fetch-metadata.ts +127 -0
- package/src/gateway-image-model-settings.ts +12 -0
- package/src/gateway-image-model.test.ts +823 -0
- package/src/gateway-image-model.ts +145 -0
- package/src/gateway-language-model-settings.ts +159 -0
- package/src/gateway-language-model.test.ts +1485 -0
- package/src/gateway-language-model.ts +212 -0
- package/src/gateway-model-entry.ts +58 -0
- package/src/gateway-provider-options.ts +66 -0
- package/src/gateway-provider.test.ts +1210 -0
- package/src/gateway-provider.ts +284 -0
- package/src/gateway-tools.ts +15 -0
- package/src/index.ts +27 -0
- package/src/tool/perplexity-search.ts +294 -0
- package/src/vercel-environment.test.ts +65 -0
- package/src/vercel-environment.ts +6 -0
- package/src/version.ts +6 -0
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
export type GatewayEmbeddingModelId =
|
|
2
|
+
| 'alibaba/qwen3-embedding-0.6b'
|
|
3
|
+
| 'alibaba/qwen3-embedding-4b'
|
|
4
|
+
| 'alibaba/qwen3-embedding-8b'
|
|
5
|
+
| 'amazon/titan-embed-text-v2'
|
|
6
|
+
| 'cohere/embed-v4.0'
|
|
7
|
+
| 'google/gemini-embedding-001'
|
|
8
|
+
| 'google/text-embedding-005'
|
|
9
|
+
| 'google/text-multilingual-embedding-002'
|
|
10
|
+
| 'mistral/codestral-embed'
|
|
11
|
+
| 'mistral/mistral-embed'
|
|
12
|
+
| 'openai/text-embedding-3-large'
|
|
13
|
+
| 'openai/text-embedding-3-small'
|
|
14
|
+
| 'openai/text-embedding-ada-002'
|
|
15
|
+
| 'voyage/voyage-3-large'
|
|
16
|
+
| 'voyage/voyage-3.5'
|
|
17
|
+
| 'voyage/voyage-3.5-lite'
|
|
18
|
+
| 'voyage/voyage-code-2'
|
|
19
|
+
| 'voyage/voyage-code-3'
|
|
20
|
+
| 'voyage/voyage-finance-2'
|
|
21
|
+
| 'voyage/voyage-law-2'
|
|
22
|
+
| (string & {});
|
|
@@ -0,0 +1,213 @@
|
|
|
1
|
+
import { describe, it, expect } from 'vitest';
|
|
2
|
+
import { createTestServer } from '@ai-sdk/test-server/with-vitest';
|
|
3
|
+
import { GatewayEmbeddingModel } from './gateway-embedding-model';
|
|
4
|
+
import type { GatewayConfig } from './gateway-config';
|
|
5
|
+
import {
|
|
6
|
+
GatewayInvalidRequestError,
|
|
7
|
+
GatewayInternalServerError,
|
|
8
|
+
} from './errors';
|
|
9
|
+
|
|
10
|
+
const dummyEmbeddings = [
|
|
11
|
+
[0.1, 0.2, 0.3],
|
|
12
|
+
[0.4, 0.5, 0.6],
|
|
13
|
+
];
|
|
14
|
+
const testValues = ['sunny day at the beach', 'rainy afternoon in the city'];
|
|
15
|
+
|
|
16
|
+
const server = createTestServer({
|
|
17
|
+
'https://api.test.com/embedding-model': {},
|
|
18
|
+
});
|
|
19
|
+
|
|
20
|
+
const createTestModel = (
|
|
21
|
+
config: Partial<
|
|
22
|
+
GatewayConfig & { o11yHeaders?: Record<string, string> }
|
|
23
|
+
> = {},
|
|
24
|
+
) =>
|
|
25
|
+
new GatewayEmbeddingModel('openai/text-embedding-3-small', {
|
|
26
|
+
provider: 'gateway',
|
|
27
|
+
baseURL: 'https://api.test.com',
|
|
28
|
+
headers: () => ({
|
|
29
|
+
Authorization: 'Bearer test-token',
|
|
30
|
+
'ai-gateway-auth-method': 'api-key',
|
|
31
|
+
}),
|
|
32
|
+
fetch: globalThis.fetch,
|
|
33
|
+
o11yHeaders: config.o11yHeaders || {},
|
|
34
|
+
...config,
|
|
35
|
+
});
|
|
36
|
+
|
|
37
|
+
describe('GatewayEmbeddingModel', () => {
|
|
38
|
+
function prepareJsonResponse({
|
|
39
|
+
embeddings = dummyEmbeddings,
|
|
40
|
+
usage = { tokens: 8 },
|
|
41
|
+
headers,
|
|
42
|
+
}: {
|
|
43
|
+
embeddings?: number[][];
|
|
44
|
+
usage?: { tokens: number };
|
|
45
|
+
headers?: Record<string, string>;
|
|
46
|
+
} = {}) {
|
|
47
|
+
server.urls['https://api.test.com/embedding-model'].response = {
|
|
48
|
+
type: 'json-value',
|
|
49
|
+
headers,
|
|
50
|
+
body: {
|
|
51
|
+
embeddings,
|
|
52
|
+
usage,
|
|
53
|
+
},
|
|
54
|
+
};
|
|
55
|
+
}
|
|
56
|
+
|
|
57
|
+
describe('doEmbed', () => {
|
|
58
|
+
it('should pass headers correctly', async () => {
|
|
59
|
+
prepareJsonResponse();
|
|
60
|
+
|
|
61
|
+
await createTestModel().doEmbed({
|
|
62
|
+
values: testValues,
|
|
63
|
+
headers: { 'Custom-Header': 'test-value' },
|
|
64
|
+
});
|
|
65
|
+
|
|
66
|
+
const headers = server.calls[0].requestHeaders;
|
|
67
|
+
expect(headers).toMatchObject({
|
|
68
|
+
authorization: 'Bearer test-token',
|
|
69
|
+
'custom-header': 'test-value',
|
|
70
|
+
'ai-embedding-model-specification-version': '3',
|
|
71
|
+
'ai-model-id': 'openai/text-embedding-3-small',
|
|
72
|
+
});
|
|
73
|
+
});
|
|
74
|
+
|
|
75
|
+
it('should include o11y headers', async () => {
|
|
76
|
+
prepareJsonResponse();
|
|
77
|
+
|
|
78
|
+
const o11yHeaders = {
|
|
79
|
+
'ai-o11y-deployment-id': 'deployment-1',
|
|
80
|
+
'ai-o11y-environment': 'production',
|
|
81
|
+
'ai-o11y-region': 'iad1',
|
|
82
|
+
} as const;
|
|
83
|
+
|
|
84
|
+
await createTestModel({ o11yHeaders }).doEmbed({ values: testValues });
|
|
85
|
+
|
|
86
|
+
const headers = server.calls[0].requestHeaders;
|
|
87
|
+
expect(headers).toMatchObject(o11yHeaders);
|
|
88
|
+
});
|
|
89
|
+
|
|
90
|
+
it('should extract embeddings and usage', async () => {
|
|
91
|
+
prepareJsonResponse({
|
|
92
|
+
embeddings: dummyEmbeddings,
|
|
93
|
+
usage: { tokens: 42 },
|
|
94
|
+
});
|
|
95
|
+
|
|
96
|
+
const { embeddings, usage } = await createTestModel().doEmbed({
|
|
97
|
+
values: testValues,
|
|
98
|
+
});
|
|
99
|
+
|
|
100
|
+
expect(embeddings).toStrictEqual(dummyEmbeddings);
|
|
101
|
+
expect(usage).toStrictEqual({ tokens: 42 });
|
|
102
|
+
});
|
|
103
|
+
|
|
104
|
+
it('should send value as array', async () => {
|
|
105
|
+
prepareJsonResponse();
|
|
106
|
+
|
|
107
|
+
await createTestModel().doEmbed({ values: testValues });
|
|
108
|
+
expect(await server.calls[0].requestBodyJson).toStrictEqual({
|
|
109
|
+
values: testValues,
|
|
110
|
+
});
|
|
111
|
+
});
|
|
112
|
+
|
|
113
|
+
it('should pass providerOptions into request body', async () => {
|
|
114
|
+
prepareJsonResponse();
|
|
115
|
+
|
|
116
|
+
await createTestModel().doEmbed({
|
|
117
|
+
values: testValues,
|
|
118
|
+
providerOptions: { openai: { dimensions: 64 } },
|
|
119
|
+
});
|
|
120
|
+
|
|
121
|
+
expect(await server.calls[0].requestBodyJson).toStrictEqual({
|
|
122
|
+
values: testValues,
|
|
123
|
+
providerOptions: { openai: { dimensions: 64 } },
|
|
124
|
+
});
|
|
125
|
+
});
|
|
126
|
+
|
|
127
|
+
it('should not include providerOptions when not provided', async () => {
|
|
128
|
+
prepareJsonResponse();
|
|
129
|
+
|
|
130
|
+
await createTestModel().doEmbed({ values: testValues });
|
|
131
|
+
|
|
132
|
+
const body = await server.calls[0].requestBodyJson;
|
|
133
|
+
expect(body).toStrictEqual({ values: testValues });
|
|
134
|
+
expect('providerOptions' in body).toBe(false);
|
|
135
|
+
});
|
|
136
|
+
|
|
137
|
+
it('should convert gateway error responses', async () => {
|
|
138
|
+
server.urls['https://api.test.com/embedding-model'].response = {
|
|
139
|
+
type: 'error',
|
|
140
|
+
status: 400,
|
|
141
|
+
body: JSON.stringify({
|
|
142
|
+
error: {
|
|
143
|
+
message: 'Invalid input',
|
|
144
|
+
type: 'invalid_request_error',
|
|
145
|
+
},
|
|
146
|
+
}),
|
|
147
|
+
};
|
|
148
|
+
|
|
149
|
+
await expect(
|
|
150
|
+
createTestModel().doEmbed({ values: testValues }),
|
|
151
|
+
).rejects.toSatisfy(
|
|
152
|
+
err =>
|
|
153
|
+
GatewayInvalidRequestError.isInstance(err) && err.statusCode === 400,
|
|
154
|
+
);
|
|
155
|
+
|
|
156
|
+
server.urls['https://api.test.com/embedding-model'].response = {
|
|
157
|
+
type: 'error',
|
|
158
|
+
status: 500,
|
|
159
|
+
body: JSON.stringify({
|
|
160
|
+
error: {
|
|
161
|
+
message: 'Server blew up',
|
|
162
|
+
type: 'internal_server_error',
|
|
163
|
+
},
|
|
164
|
+
}),
|
|
165
|
+
};
|
|
166
|
+
|
|
167
|
+
await expect(
|
|
168
|
+
createTestModel().doEmbed({ values: testValues }),
|
|
169
|
+
).rejects.toSatisfy(
|
|
170
|
+
err =>
|
|
171
|
+
GatewayInternalServerError.isInstance(err) && err.statusCode === 500,
|
|
172
|
+
);
|
|
173
|
+
});
|
|
174
|
+
|
|
175
|
+
it('should include providerMetadata in response body', async () => {
|
|
176
|
+
server.urls['https://api.test.com/embedding-model'].response = {
|
|
177
|
+
type: 'json-value',
|
|
178
|
+
body: {
|
|
179
|
+
embeddings: dummyEmbeddings,
|
|
180
|
+
usage: { tokens: 5 },
|
|
181
|
+
providerMetadata: { gateway: { routing: { test: true } } },
|
|
182
|
+
},
|
|
183
|
+
};
|
|
184
|
+
|
|
185
|
+
const { response } = await createTestModel().doEmbed({
|
|
186
|
+
values: testValues,
|
|
187
|
+
});
|
|
188
|
+
|
|
189
|
+
expect(response?.body).toMatchObject({
|
|
190
|
+
providerMetadata: { gateway: { routing: { test: true } } },
|
|
191
|
+
});
|
|
192
|
+
});
|
|
193
|
+
|
|
194
|
+
it('should extract providerMetadata to top level', async () => {
|
|
195
|
+
server.urls['https://api.test.com/embedding-model'].response = {
|
|
196
|
+
type: 'json-value',
|
|
197
|
+
body: {
|
|
198
|
+
embeddings: dummyEmbeddings,
|
|
199
|
+
usage: { tokens: 5 },
|
|
200
|
+
providerMetadata: { gateway: { routing: { test: true } } },
|
|
201
|
+
},
|
|
202
|
+
};
|
|
203
|
+
|
|
204
|
+
const result = await createTestModel().doEmbed({
|
|
205
|
+
values: testValues,
|
|
206
|
+
});
|
|
207
|
+
|
|
208
|
+
expect(result.providerMetadata).toStrictEqual({
|
|
209
|
+
gateway: { routing: { test: true } },
|
|
210
|
+
});
|
|
211
|
+
});
|
|
212
|
+
});
|
|
213
|
+
});
|
|
@@ -0,0 +1,109 @@
|
|
|
1
|
+
import type {
|
|
2
|
+
EmbeddingModelV3,
|
|
3
|
+
SharedV3ProviderMetadata,
|
|
4
|
+
} from '@ai-sdk/provider';
|
|
5
|
+
import {
|
|
6
|
+
combineHeaders,
|
|
7
|
+
createJsonErrorResponseHandler,
|
|
8
|
+
createJsonResponseHandler,
|
|
9
|
+
lazySchema,
|
|
10
|
+
postJsonToApi,
|
|
11
|
+
resolve,
|
|
12
|
+
zodSchema,
|
|
13
|
+
type Resolvable,
|
|
14
|
+
} from '@ai-sdk/provider-utils';
|
|
15
|
+
import { z } from 'zod/v4';
|
|
16
|
+
import { asGatewayError } from './errors';
|
|
17
|
+
import { parseAuthMethod } from './errors/parse-auth-method';
|
|
18
|
+
import type { GatewayConfig } from './gateway-config';
|
|
19
|
+
|
|
20
|
+
export class GatewayEmbeddingModel implements EmbeddingModelV3 {
|
|
21
|
+
readonly specificationVersion = 'v3';
|
|
22
|
+
readonly maxEmbeddingsPerCall = 2048;
|
|
23
|
+
readonly supportsParallelCalls = true;
|
|
24
|
+
|
|
25
|
+
constructor(
|
|
26
|
+
readonly modelId: string,
|
|
27
|
+
private readonly config: GatewayConfig & {
|
|
28
|
+
provider: string;
|
|
29
|
+
o11yHeaders: Resolvable<Record<string, string>>;
|
|
30
|
+
},
|
|
31
|
+
) {}
|
|
32
|
+
|
|
33
|
+
get provider(): string {
|
|
34
|
+
return this.config.provider;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
async doEmbed({
|
|
38
|
+
values,
|
|
39
|
+
headers,
|
|
40
|
+
abortSignal,
|
|
41
|
+
providerOptions,
|
|
42
|
+
}: Parameters<EmbeddingModelV3['doEmbed']>[0]): Promise<
|
|
43
|
+
Awaited<ReturnType<EmbeddingModelV3['doEmbed']>>
|
|
44
|
+
> {
|
|
45
|
+
const resolvedHeaders = await resolve(this.config.headers());
|
|
46
|
+
try {
|
|
47
|
+
const {
|
|
48
|
+
responseHeaders,
|
|
49
|
+
value: responseBody,
|
|
50
|
+
rawValue,
|
|
51
|
+
} = await postJsonToApi({
|
|
52
|
+
url: this.getUrl(),
|
|
53
|
+
headers: combineHeaders(
|
|
54
|
+
resolvedHeaders,
|
|
55
|
+
headers ?? {},
|
|
56
|
+
this.getModelConfigHeaders(),
|
|
57
|
+
await resolve(this.config.o11yHeaders),
|
|
58
|
+
),
|
|
59
|
+
body: {
|
|
60
|
+
values,
|
|
61
|
+
...(providerOptions ? { providerOptions } : {}),
|
|
62
|
+
},
|
|
63
|
+
successfulResponseHandler: createJsonResponseHandler(
|
|
64
|
+
gatewayEmbeddingResponseSchema,
|
|
65
|
+
),
|
|
66
|
+
failedResponseHandler: createJsonErrorResponseHandler({
|
|
67
|
+
errorSchema: z.any(),
|
|
68
|
+
errorToMessage: data => data,
|
|
69
|
+
}),
|
|
70
|
+
...(abortSignal && { abortSignal }),
|
|
71
|
+
fetch: this.config.fetch,
|
|
72
|
+
});
|
|
73
|
+
|
|
74
|
+
return {
|
|
75
|
+
embeddings: responseBody.embeddings,
|
|
76
|
+
usage: responseBody.usage ?? undefined,
|
|
77
|
+
providerMetadata:
|
|
78
|
+
responseBody.providerMetadata as unknown as SharedV3ProviderMetadata,
|
|
79
|
+
response: { headers: responseHeaders, body: rawValue },
|
|
80
|
+
warnings: [],
|
|
81
|
+
};
|
|
82
|
+
} catch (error) {
|
|
83
|
+
throw await asGatewayError(error, await parseAuthMethod(resolvedHeaders));
|
|
84
|
+
}
|
|
85
|
+
}
|
|
86
|
+
|
|
87
|
+
private getUrl() {
|
|
88
|
+
return `${this.config.baseURL}/embedding-model`;
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
private getModelConfigHeaders() {
|
|
92
|
+
return {
|
|
93
|
+
'ai-embedding-model-specification-version': '3',
|
|
94
|
+
'ai-model-id': this.modelId,
|
|
95
|
+
};
|
|
96
|
+
}
|
|
97
|
+
}
|
|
98
|
+
|
|
99
|
+
const gatewayEmbeddingResponseSchema = lazySchema(() =>
|
|
100
|
+
zodSchema(
|
|
101
|
+
z.object({
|
|
102
|
+
embeddings: z.array(z.array(z.number())),
|
|
103
|
+
usage: z.object({ tokens: z.number() }).nullish(),
|
|
104
|
+
providerMetadata: z
|
|
105
|
+
.record(z.string(), z.record(z.string(), z.unknown()))
|
|
106
|
+
.optional(),
|
|
107
|
+
}),
|
|
108
|
+
),
|
|
109
|
+
);
|