@adaline/gateway 0.6.0 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.d.mts CHANGED
@@ -1,5 +1,6 @@
1
1
  import { z } from 'zod';
2
2
  import { ChatModelV1, EmbeddingModelV1 } from '@adaline/provider';
3
+ import { GatewayBaseError } from '@adaline/types';
3
4
  import { AxiosInstance } from 'axios';
4
5
 
5
6
  declare class GatewayError extends Error {
@@ -27,18 +28,36 @@ interface HttpClientResponse<T> {
27
28
  };
28
29
  }
29
30
 
31
+ declare class HttpClientError extends GatewayBaseError {
32
+ readonly info: string;
33
+ readonly cause: unknown;
34
+ constructor({ info, cause }: {
35
+ info: string;
36
+ cause: unknown;
37
+ });
38
+ static isHttpClientError(error: unknown): error is HttpClientError;
39
+ }
40
+ declare class HttpRequestError extends GatewayBaseError {
41
+ readonly info: string;
42
+ readonly cause: {
43
+ status: number;
44
+ headers: Record<string, string>;
45
+ data: unknown;
46
+ };
47
+ constructor(message: string, status: number | undefined, headers: Record<string, string>, data: unknown);
48
+ static isHttpRequestError(error: unknown): error is HttpRequestError;
49
+ }
50
+
30
51
  interface HttpClientConfig {
31
52
  timeoutInMilliseconds?: number;
32
53
  axiosInstance?: AxiosInstance;
33
- }
34
- declare class IsomorphicHttpClientError extends Error {
35
- status: number;
36
- data: unknown;
37
- constructor(message: string, status?: number, data?: unknown);
54
+ proxyUrl?: string;
38
55
  }
39
56
  declare class IsomorphicHttpClient implements HttpClient {
40
57
  private defaultTimeout?;
41
58
  private client;
59
+ private httpProxyAgent?;
60
+ private httpsProxyAgent?;
42
61
  constructor(config: HttpClientConfig);
43
62
  isNodeEnvironment: () => boolean;
44
63
  private makeRequest;
@@ -51,586 +70,427 @@ declare class IsomorphicHttpClient implements HttpClient {
51
70
  put<T>(url: string, data?: Record<string, unknown>, headers?: Record<string, string | undefined>): Promise<HttpClientResponse<T>>;
52
71
  delete<T>(url: string, params?: Record<string, unknown>, headers?: Record<string, string | undefined>): Promise<HttpClientResponse<T>>;
53
72
  patch<T>(url: string, data?: Record<string, unknown>, headers?: Record<string, string | undefined>): Promise<HttpClientResponse<T>>;
54
- static IsomorphicHttpClientError: typeof IsomorphicHttpClientError;
55
73
  }
56
74
 
57
- type Task<Request, Response> = {
58
- tryCount: number;
59
- modelIndex: number;
60
- inputTokens: number;
61
- queueTime: number;
62
- attemptTime: number;
75
+ declare class QueueTaskTimeoutError extends GatewayBaseError {
76
+ readonly info: string;
77
+ readonly cause: unknown;
78
+ constructor({ info, cause }: {
79
+ info: string;
80
+ cause: unknown;
81
+ });
82
+ static isQueueTaskTimeoutError(error: unknown): error is QueueTaskTimeoutError;
83
+ }
84
+
85
+ interface Cache<T> {
86
+ get(key: string): T | undefined;
87
+ set(key: string, value: T): void;
88
+ delete(key: string): void;
89
+ clear(): void;
90
+ }
91
+
92
+ declare class LRUCache<T extends object> implements Cache<T> {
93
+ private cache;
94
+ constructor(maxEntries?: number);
95
+ get(key: string): T | undefined;
96
+ set(key: string, value: T): void;
97
+ delete(key: string): void;
98
+ clear(): void;
99
+ }
100
+
101
+ type QueueTask<Request, Response> = {
63
102
  request: Request;
64
- queuePriority: number | undefined;
103
+ cache: Cache<Response>;
65
104
  resolve: (value: Response) => void;
66
- execute: (request: {
67
- modelIndex: number;
68
- data: Request;
69
- resolve: (value: Response) => void;
70
- reject: (error: any) => void;
71
- }) => Promise<void>;
72
105
  reject: (error: any) => void;
106
+ execute: (request: Request) => Promise<Response>;
73
107
  };
74
108
  interface Queue<Request, Response> {
75
- enqueue(task: Task<Request, Response>): void;
109
+ enqueue(task: QueueTask<Request, Response>): void;
76
110
  }
111
+ declare const QueueOptions: z.ZodObject<{
112
+ maxConcurrentTasks: z.ZodNumber;
113
+ retryCount: z.ZodNumber;
114
+ timeout: z.ZodNumber;
115
+ retry: z.ZodObject<{
116
+ initialDelay: z.ZodNumber;
117
+ exponentialFactor: z.ZodNumber;
118
+ }, "strip", z.ZodTypeAny, {
119
+ initialDelay: number;
120
+ exponentialFactor: number;
121
+ }, {
122
+ initialDelay: number;
123
+ exponentialFactor: number;
124
+ }>;
125
+ }, "strip", z.ZodTypeAny, {
126
+ timeout: number;
127
+ maxConcurrentTasks: number;
128
+ retryCount: number;
129
+ retry: {
130
+ initialDelay: number;
131
+ exponentialFactor: number;
132
+ };
133
+ }, {
134
+ timeout: number;
135
+ maxConcurrentTasks: number;
136
+ retryCount: number;
137
+ retry: {
138
+ initialDelay: number;
139
+ exponentialFactor: number;
140
+ };
141
+ }>;
142
+ type QueueOptionsType = z.infer<typeof QueueOptions>;
77
143
 
78
- type QueueOptions = {
79
- maxRetries?: number;
80
- tokensPerMinute?: number;
81
- timeout?: number;
82
- backOffInitialDelay?: number;
83
- backOffMultiplier?: number;
84
- rateLimitRetryTimeout?: number;
85
- shouldRetry?: (status: number) => boolean;
86
- };
87
- declare class SimpleQueue<Req, Res> implements Queue<Req, Res> {
144
+ declare class SimpleQueue<Request, Response> implements Queue<Request, Response> {
145
+ private options;
146
+ private activeTasks;
88
147
  private queue;
89
- private isProcessing;
90
- private maxRetries;
91
- private tokensPerMinute;
92
- private timeout;
93
- private backOffInitialDelay;
94
- private backOffMultiplier;
95
- private rateLimitRetryTimeout;
96
- private shouldRetry;
97
- constructor(options: QueueOptions);
98
- enqueue(task: Task<Req, Res>): void;
99
- private calculateBackoff;
148
+ constructor(options: QueueOptionsType);
149
+ enqueue(task: QueueTask<Request, Response>): void;
150
+ private withTimeout;
151
+ private executeWithRetry;
100
152
  private processQueue;
101
- private execute;
102
153
  }
103
154
 
104
- declare const CompleteChatHandlerRequest: z.ZodObject<{
105
- model: z.ZodType<ChatModelV1<{
106
- name: string;
107
- description: string;
108
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
109
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
110
- maxInputTokens: number;
111
- maxOutputTokens: number;
112
- config: {
113
- def: Record<string, {
114
- type: "multi-string";
115
- param: string;
116
- title: string;
117
- description: string;
118
- max: number;
119
- } | {
120
- type: "range";
121
- param: string;
122
- title: string;
123
- description: string;
124
- max: number;
125
- min: number;
126
- step: number;
127
- default: number;
128
- } | {
129
- type: "select-string";
130
- param: string;
131
- title: string;
132
- description: string;
133
- default: string;
134
- choices: string[];
135
- } | {
136
- type: "object-schema";
137
- param: string;
138
- title: string;
139
- description: string;
140
- objectSchema?: any;
141
- } | {
142
- type: "select-boolean";
143
- param: string;
144
- title: string;
145
- description: string;
146
- default: boolean | null;
147
- }>;
148
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
149
- };
150
- }>, z.ZodTypeDef, ChatModelV1<{
151
- name: string;
152
- description: string;
153
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
154
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
155
- maxInputTokens: number;
156
- maxOutputTokens: number;
157
- config: {
158
- def: Record<string, {
159
- type: "multi-string";
160
- param: string;
161
- title: string;
162
- description: string;
163
- max: number;
164
- } | {
165
- type: "range";
166
- param: string;
167
- title: string;
168
- description: string;
169
- max: number;
170
- min: number;
171
- step: number;
172
- default: number;
173
- } | {
174
- type: "select-string";
175
- param: string;
176
- title: string;
177
- description: string;
178
- default: string;
179
- choices: string[];
180
- } | {
181
- type: "object-schema";
182
- param: string;
183
- title: string;
184
- description: string;
185
- objectSchema?: any;
186
- } | {
187
- type: "select-boolean";
188
- param: string;
189
- title: string;
190
- description: string;
191
- default: boolean | null;
192
- }>;
193
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
194
- };
195
- }>>;
196
- config: z.ZodRecord<z.ZodString, z.ZodAny>;
197
- messages: z.ZodArray<z.ZodObject<{
198
- role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
199
- content: z.ZodArray<z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
200
- modality: z.ZodLiteral<"text">;
201
- value: z.ZodString;
202
- metadata: z.ZodUndefined;
203
- }, "strip", z.ZodTypeAny, {
204
- value: string;
205
- modality: "text";
206
- metadata?: undefined;
207
- }, {
208
- value: string;
209
- modality: "text";
210
- metadata?: undefined;
211
- }>, z.ZodObject<{
212
- modality: z.ZodLiteral<"image">;
213
- detail: z.ZodEnum<["low", "medium", "high", "auto"]>;
214
- value: z.ZodDiscriminatedUnion<"type", [z.ZodObject<{
215
- type: z.ZodLiteral<"base64">;
216
- base64: z.ZodString;
217
- media_type: z.ZodEnum<["png", "jpeg", "webp", "gif"]>;
155
+ declare const CompleteChatHandlerResponse: z.ZodObject<{
156
+ request: z.ZodObject<{
157
+ config: z.ZodRecord<z.ZodString, z.ZodAny>;
158
+ messages: z.ZodArray<z.ZodObject<{
159
+ role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
160
+ content: z.ZodArray<z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
161
+ modality: z.ZodLiteral<"text">;
162
+ value: z.ZodString;
163
+ metadata: z.ZodUndefined;
218
164
  }, "strip", z.ZodTypeAny, {
219
- type: "base64";
220
- base64: string;
221
- media_type: "png" | "jpeg" | "webp" | "gif";
165
+ value: string;
166
+ modality: "text";
167
+ metadata?: undefined;
222
168
  }, {
223
- type: "base64";
224
- base64: string;
225
- media_type: "png" | "jpeg" | "webp" | "gif";
169
+ value: string;
170
+ modality: "text";
171
+ metadata?: undefined;
226
172
  }>, z.ZodObject<{
227
- type: z.ZodLiteral<"url">;
228
- url: z.ZodString;
173
+ modality: z.ZodLiteral<"image">;
174
+ detail: z.ZodEnum<["low", "medium", "high", "auto"]>;
175
+ value: z.ZodDiscriminatedUnion<"type", [z.ZodObject<{
176
+ type: z.ZodLiteral<"base64">;
177
+ base64: z.ZodString;
178
+ media_type: z.ZodEnum<["png", "jpeg", "webp", "gif"]>;
179
+ }, "strip", z.ZodTypeAny, {
180
+ type: "base64";
181
+ base64: string;
182
+ media_type: "png" | "jpeg" | "webp" | "gif";
183
+ }, {
184
+ type: "base64";
185
+ base64: string;
186
+ media_type: "png" | "jpeg" | "webp" | "gif";
187
+ }>, z.ZodObject<{
188
+ type: z.ZodLiteral<"url">;
189
+ url: z.ZodString;
190
+ }, "strip", z.ZodTypeAny, {
191
+ type: "url";
192
+ url: string;
193
+ }, {
194
+ type: "url";
195
+ url: string;
196
+ }>]>;
197
+ metadata: z.ZodUndefined;
229
198
  }, "strip", z.ZodTypeAny, {
230
- type: "url";
231
- url: string;
199
+ value: {
200
+ type: "base64";
201
+ base64: string;
202
+ media_type: "png" | "jpeg" | "webp" | "gif";
203
+ } | {
204
+ type: "url";
205
+ url: string;
206
+ };
207
+ modality: "image";
208
+ detail: "low" | "medium" | "high" | "auto";
209
+ metadata?: undefined;
232
210
  }, {
233
- type: "url";
234
- url: string;
235
- }>]>;
211
+ value: {
212
+ type: "base64";
213
+ base64: string;
214
+ media_type: "png" | "jpeg" | "webp" | "gif";
215
+ } | {
216
+ type: "url";
217
+ url: string;
218
+ };
219
+ modality: "image";
220
+ detail: "low" | "medium" | "high" | "auto";
221
+ metadata?: undefined;
222
+ }>, z.ZodObject<{
223
+ modality: z.ZodLiteral<"tool-call">;
224
+ index: z.ZodNumber;
225
+ id: z.ZodString;
226
+ name: z.ZodString;
227
+ arguments: z.ZodString;
228
+ metadata: z.ZodUndefined;
229
+ }, "strip", z.ZodTypeAny, {
230
+ name: string;
231
+ modality: "tool-call";
232
+ index: number;
233
+ id: string;
234
+ arguments: string;
235
+ metadata?: undefined;
236
+ }, {
237
+ name: string;
238
+ modality: "tool-call";
239
+ index: number;
240
+ id: string;
241
+ arguments: string;
242
+ metadata?: undefined;
243
+ }>, z.ZodObject<{
244
+ modality: z.ZodLiteral<"tool-response">;
245
+ index: z.ZodNumber;
246
+ id: z.ZodString;
247
+ name: z.ZodString;
248
+ data: z.ZodString;
249
+ metadata: z.ZodUndefined;
250
+ }, "strip", z.ZodTypeAny, {
251
+ data: string;
252
+ name: string;
253
+ modality: "tool-response";
254
+ index: number;
255
+ id: string;
256
+ metadata?: undefined;
257
+ }, {
258
+ data: string;
259
+ name: string;
260
+ modality: "tool-response";
261
+ index: number;
262
+ id: string;
263
+ metadata?: undefined;
264
+ }>]>, "many">;
236
265
  metadata: z.ZodUndefined;
237
266
  }, "strip", z.ZodTypeAny, {
238
- value: {
239
- type: "base64";
240
- base64: string;
241
- media_type: "png" | "jpeg" | "webp" | "gif";
267
+ role: "system" | "user" | "assistant" | "tool";
268
+ content: ({
269
+ value: string;
270
+ modality: "text";
271
+ metadata?: undefined;
242
272
  } | {
243
- type: "url";
244
- url: string;
245
- };
246
- modality: "image";
247
- detail: "low" | "medium" | "high" | "auto";
248
- metadata?: undefined;
249
- }, {
250
- value: {
251
- type: "base64";
252
- base64: string;
253
- media_type: "png" | "jpeg" | "webp" | "gif";
273
+ value: {
274
+ type: "base64";
275
+ base64: string;
276
+ media_type: "png" | "jpeg" | "webp" | "gif";
277
+ } | {
278
+ type: "url";
279
+ url: string;
280
+ };
281
+ modality: "image";
282
+ detail: "low" | "medium" | "high" | "auto";
283
+ metadata?: undefined;
254
284
  } | {
255
- type: "url";
256
- url: string;
257
- };
258
- modality: "image";
259
- detail: "low" | "medium" | "high" | "auto";
260
- metadata?: undefined;
261
- }>, z.ZodObject<{
262
- modality: z.ZodLiteral<"tool-call">;
263
- index: z.ZodNumber;
264
- id: z.ZodString;
265
- name: z.ZodString;
266
- arguments: z.ZodString;
267
- metadata: z.ZodUndefined;
268
- }, "strip", z.ZodTypeAny, {
269
- name: string;
270
- modality: "tool-call";
271
- index: number;
272
- id: string;
273
- arguments: string;
274
- metadata?: undefined;
275
- }, {
276
- name: string;
277
- modality: "tool-call";
278
- index: number;
279
- id: string;
280
- arguments: string;
281
- metadata?: undefined;
282
- }>, z.ZodObject<{
283
- modality: z.ZodLiteral<"tool-response">;
284
- index: z.ZodNumber;
285
- id: z.ZodString;
286
- name: z.ZodString;
287
- data: z.ZodString;
288
- metadata: z.ZodUndefined;
289
- }, "strip", z.ZodTypeAny, {
290
- data: string;
291
- name: string;
292
- modality: "tool-response";
293
- index: number;
294
- id: string;
285
+ name: string;
286
+ modality: "tool-call";
287
+ index: number;
288
+ id: string;
289
+ arguments: string;
290
+ metadata?: undefined;
291
+ } | {
292
+ data: string;
293
+ name: string;
294
+ modality: "tool-response";
295
+ index: number;
296
+ id: string;
297
+ metadata?: undefined;
298
+ })[];
295
299
  metadata?: undefined;
296
300
  }, {
297
- data: string;
298
- name: string;
299
- modality: "tool-response";
300
- index: number;
301
- id: string;
302
- metadata?: undefined;
303
- }>]>, "many">;
304
- metadata: z.ZodUndefined;
305
- }, "strip", z.ZodTypeAny, {
306
- role: "system" | "user" | "assistant" | "tool";
307
- content: ({
308
- value: string;
309
- modality: "text";
310
- metadata?: undefined;
311
- } | {
312
- value: {
313
- type: "base64";
314
- base64: string;
315
- media_type: "png" | "jpeg" | "webp" | "gif";
301
+ role: "system" | "user" | "assistant" | "tool";
302
+ content: ({
303
+ value: string;
304
+ modality: "text";
305
+ metadata?: undefined;
316
306
  } | {
317
- type: "url";
318
- url: string;
319
- };
320
- modality: "image";
321
- detail: "low" | "medium" | "high" | "auto";
322
- metadata?: undefined;
323
- } | {
324
- name: string;
325
- modality: "tool-call";
326
- index: number;
327
- id: string;
328
- arguments: string;
329
- metadata?: undefined;
330
- } | {
331
- data: string;
332
- name: string;
333
- modality: "tool-response";
334
- index: number;
335
- id: string;
336
- metadata?: undefined;
337
- })[];
338
- metadata?: undefined;
339
- }, {
340
- role: "system" | "user" | "assistant" | "tool";
341
- content: ({
342
- value: string;
343
- modality: "text";
344
- metadata?: undefined;
345
- } | {
346
- value: {
347
- type: "base64";
348
- base64: string;
349
- media_type: "png" | "jpeg" | "webp" | "gif";
307
+ value: {
308
+ type: "base64";
309
+ base64: string;
310
+ media_type: "png" | "jpeg" | "webp" | "gif";
311
+ } | {
312
+ type: "url";
313
+ url: string;
314
+ };
315
+ modality: "image";
316
+ detail: "low" | "medium" | "high" | "auto";
317
+ metadata?: undefined;
350
318
  } | {
351
- type: "url";
352
- url: string;
353
- };
354
- modality: "image";
355
- detail: "low" | "medium" | "high" | "auto";
356
- metadata?: undefined;
357
- } | {
358
- name: string;
359
- modality: "tool-call";
360
- index: number;
361
- id: string;
362
- arguments: string;
363
- metadata?: undefined;
364
- } | {
365
- data: string;
366
- name: string;
367
- modality: "tool-response";
368
- index: number;
369
- id: string;
319
+ name: string;
320
+ modality: "tool-call";
321
+ index: number;
322
+ id: string;
323
+ arguments: string;
324
+ metadata?: undefined;
325
+ } | {
326
+ data: string;
327
+ name: string;
328
+ modality: "tool-response";
329
+ index: number;
330
+ id: string;
331
+ metadata?: undefined;
332
+ })[];
370
333
  metadata?: undefined;
371
- })[];
372
- metadata?: undefined;
373
- }>, "many">;
374
- tools: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<"type", [z.ZodObject<z.objectUtil.extendShape<{
375
- type: z.ZodEnum<["function"]>;
376
- definition: z.ZodObject<{
377
- schema: z.ZodObject<{
378
- name: z.ZodString;
379
- description: z.ZodString;
380
- parameters: z.ZodAny;
381
- strict: z.ZodOptional<z.ZodBoolean>;
334
+ }>, "many">;
335
+ tools: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<"type", [z.ZodObject<z.objectUtil.extendShape<{
336
+ type: z.ZodEnum<["function"]>;
337
+ definition: z.ZodObject<{
338
+ schema: z.ZodObject<{
339
+ name: z.ZodString;
340
+ description: z.ZodString;
341
+ parameters: z.ZodAny;
342
+ strict: z.ZodOptional<z.ZodBoolean>;
343
+ }, "strip", z.ZodTypeAny, {
344
+ name: string;
345
+ description: string;
346
+ strict?: boolean | undefined;
347
+ parameters?: any;
348
+ }, {
349
+ name: string;
350
+ description: string;
351
+ strict?: boolean | undefined;
352
+ parameters?: any;
353
+ }>;
382
354
  }, "strip", z.ZodTypeAny, {
383
- name: string;
384
- description: string;
385
- strict?: boolean | undefined;
386
- parameters?: any;
355
+ schema: {
356
+ name: string;
357
+ description: string;
358
+ strict?: boolean | undefined;
359
+ parameters?: any;
360
+ };
387
361
  }, {
388
- name: string;
389
- description: string;
390
- strict?: boolean | undefined;
391
- parameters?: any;
362
+ schema: {
363
+ name: string;
364
+ description: string;
365
+ strict?: boolean | undefined;
366
+ parameters?: any;
367
+ };
392
368
  }>;
393
- }, "strip", z.ZodTypeAny, {
394
- schema: {
395
- name: string;
396
- description: string;
397
- strict?: boolean | undefined;
398
- parameters?: any;
369
+ }, {
370
+ metadata: z.ZodTypeAny;
371
+ }>, "strip", z.ZodTypeAny, {
372
+ type: "function";
373
+ definition: {
374
+ schema: {
375
+ name: string;
376
+ description: string;
377
+ strict?: boolean | undefined;
378
+ parameters?: any;
379
+ };
399
380
  };
381
+ metadata?: any;
400
382
  }, {
401
- schema: {
402
- name: string;
403
- description: string;
404
- strict?: boolean | undefined;
405
- parameters?: any;
406
- };
407
- }>;
408
- }, {
409
- metadata: z.ZodTypeAny;
410
- }>, "strip", z.ZodTypeAny, {
411
- type: "function";
412
- definition: {
413
- schema: {
414
- name: string;
415
- description: string;
416
- strict?: boolean | undefined;
417
- parameters?: any;
418
- };
419
- };
420
- metadata?: any;
421
- }, {
422
- type: "function";
423
- definition: {
424
- schema: {
425
- name: string;
426
- description: string;
427
- strict?: boolean | undefined;
428
- parameters?: any;
383
+ type: "function";
384
+ definition: {
385
+ schema: {
386
+ name: string;
387
+ description: string;
388
+ strict?: boolean | undefined;
389
+ parameters?: any;
390
+ };
429
391
  };
430
- };
431
- metadata?: any;
432
- }>]>, "many">>;
433
- callbacks: z.ZodOptional<z.ZodArray<z.ZodType<CompleteChatCallbackType<any>, z.ZodTypeDef, CompleteChatCallbackType<any>>, "atleastone">>;
434
- metadataForCallbacks: z.ZodOptional<z.ZodAny>;
435
- }, "strip", z.ZodTypeAny, {
436
- config: Record<string, any>;
437
- model: ChatModelV1<{
438
- name: string;
439
- description: string;
440
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
441
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
442
- maxInputTokens: number;
443
- maxOutputTokens: number;
444
- config: {
445
- def: Record<string, {
446
- type: "multi-string";
447
- param: string;
448
- title: string;
449
- description: string;
450
- max: number;
451
- } | {
452
- type: "range";
453
- param: string;
454
- title: string;
455
- description: string;
456
- max: number;
457
- min: number;
458
- step: number;
459
- default: number;
460
- } | {
461
- type: "select-string";
462
- param: string;
463
- title: string;
464
- description: string;
465
- default: string;
466
- choices: string[];
392
+ metadata?: any;
393
+ }>]>, "many">>;
394
+ }, "strip", z.ZodTypeAny, {
395
+ config: Record<string, any>;
396
+ messages: {
397
+ role: "system" | "user" | "assistant" | "tool";
398
+ content: ({
399
+ value: string;
400
+ modality: "text";
401
+ metadata?: undefined;
467
402
  } | {
468
- type: "object-schema";
469
- param: string;
470
- title: string;
471
- description: string;
472
- objectSchema?: any;
403
+ value: {
404
+ type: "base64";
405
+ base64: string;
406
+ media_type: "png" | "jpeg" | "webp" | "gif";
407
+ } | {
408
+ type: "url";
409
+ url: string;
410
+ };
411
+ modality: "image";
412
+ detail: "low" | "medium" | "high" | "auto";
413
+ metadata?: undefined;
473
414
  } | {
474
- type: "select-boolean";
475
- param: string;
476
- title: string;
477
- description: string;
478
- default: boolean | null;
479
- }>;
480
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
481
- };
482
- }>;
483
- messages: {
484
- role: "system" | "user" | "assistant" | "tool";
485
- content: ({
486
- value: string;
487
- modality: "text";
488
- metadata?: undefined;
489
- } | {
490
- value: {
491
- type: "base64";
492
- base64: string;
493
- media_type: "png" | "jpeg" | "webp" | "gif";
415
+ name: string;
416
+ modality: "tool-call";
417
+ index: number;
418
+ id: string;
419
+ arguments: string;
420
+ metadata?: undefined;
494
421
  } | {
495
- type: "url";
496
- url: string;
497
- };
498
- modality: "image";
499
- detail: "low" | "medium" | "high" | "auto";
500
- metadata?: undefined;
501
- } | {
502
- name: string;
503
- modality: "tool-call";
504
- index: number;
505
- id: string;
506
- arguments: string;
507
- metadata?: undefined;
508
- } | {
509
- data: string;
510
- name: string;
511
- modality: "tool-response";
512
- index: number;
513
- id: string;
514
- metadata?: undefined;
515
- })[];
516
- metadata?: undefined;
517
- }[];
518
- tools?: {
519
- type: "function";
520
- definition: {
521
- schema: {
422
+ data: string;
522
423
  name: string;
523
- description: string;
524
- strict?: boolean | undefined;
525
- parameters?: any;
424
+ modality: "tool-response";
425
+ index: number;
426
+ id: string;
427
+ metadata?: undefined;
428
+ })[];
429
+ metadata?: undefined;
430
+ }[];
431
+ tools?: {
432
+ type: "function";
433
+ definition: {
434
+ schema: {
435
+ name: string;
436
+ description: string;
437
+ strict?: boolean | undefined;
438
+ parameters?: any;
439
+ };
526
440
  };
527
- };
528
- metadata?: any;
529
- }[] | undefined;
530
- callbacks?: [CompleteChatCallbackType<any>, ...CompleteChatCallbackType<any>[]] | undefined;
531
- metadataForCallbacks?: any;
532
- }, {
533
- config: Record<string, any>;
534
- model: ChatModelV1<{
535
- name: string;
536
- description: string;
537
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
538
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
539
- maxInputTokens: number;
540
- maxOutputTokens: number;
541
- config: {
542
- def: Record<string, {
543
- type: "multi-string";
544
- param: string;
545
- title: string;
546
- description: string;
547
- max: number;
548
- } | {
549
- type: "range";
550
- param: string;
551
- title: string;
552
- description: string;
553
- max: number;
554
- min: number;
555
- step: number;
556
- default: number;
441
+ metadata?: any;
442
+ }[] | undefined;
443
+ }, {
444
+ config: Record<string, any>;
445
+ messages: {
446
+ role: "system" | "user" | "assistant" | "tool";
447
+ content: ({
448
+ value: string;
449
+ modality: "text";
450
+ metadata?: undefined;
557
451
  } | {
558
- type: "select-string";
559
- param: string;
560
- title: string;
561
- description: string;
562
- default: string;
563
- choices: string[];
452
+ value: {
453
+ type: "base64";
454
+ base64: string;
455
+ media_type: "png" | "jpeg" | "webp" | "gif";
456
+ } | {
457
+ type: "url";
458
+ url: string;
459
+ };
460
+ modality: "image";
461
+ detail: "low" | "medium" | "high" | "auto";
462
+ metadata?: undefined;
564
463
  } | {
565
- type: "object-schema";
566
- param: string;
567
- title: string;
568
- description: string;
569
- objectSchema?: any;
464
+ name: string;
465
+ modality: "tool-call";
466
+ index: number;
467
+ id: string;
468
+ arguments: string;
469
+ metadata?: undefined;
570
470
  } | {
571
- type: "select-boolean";
572
- param: string;
573
- title: string;
574
- description: string;
575
- default: boolean | null;
576
- }>;
577
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
578
- };
579
- }>;
580
- messages: {
581
- role: "system" | "user" | "assistant" | "tool";
582
- content: ({
583
- value: string;
584
- modality: "text";
585
- metadata?: undefined;
586
- } | {
587
- value: {
588
- type: "base64";
589
- base64: string;
590
- media_type: "png" | "jpeg" | "webp" | "gif";
591
- } | {
592
- type: "url";
593
- url: string;
594
- };
595
- modality: "image";
596
- detail: "low" | "medium" | "high" | "auto";
597
- metadata?: undefined;
598
- } | {
599
- name: string;
600
- modality: "tool-call";
601
- index: number;
602
- id: string;
603
- arguments: string;
604
- metadata?: undefined;
605
- } | {
606
- data: string;
607
- name: string;
608
- modality: "tool-response";
609
- index: number;
610
- id: string;
611
- metadata?: undefined;
612
- })[];
613
- metadata?: undefined;
614
- }[];
615
- tools?: {
616
- type: "function";
617
- definition: {
618
- schema: {
471
+ data: string;
619
472
  name: string;
620
- description: string;
621
- strict?: boolean | undefined;
622
- parameters?: any;
473
+ modality: "tool-response";
474
+ index: number;
475
+ id: string;
476
+ metadata?: undefined;
477
+ })[];
478
+ metadata?: undefined;
479
+ }[];
480
+ tools?: {
481
+ type: "function";
482
+ definition: {
483
+ schema: {
484
+ name: string;
485
+ description: string;
486
+ strict?: boolean | undefined;
487
+ parameters?: any;
488
+ };
623
489
  };
624
- };
625
- metadata?: any;
626
- }[] | undefined;
627
- callbacks?: [CompleteChatCallbackType<any>, ...CompleteChatCallbackType<any>[]] | undefined;
628
- metadataForCallbacks?: any;
629
- }>;
630
- type CompleteChatHandlerRequestType = z.infer<typeof CompleteChatHandlerRequest>;
631
- declare const CompleteChatHandlerResponse: z.ZodObject<{
632
- request: z.ZodObject<{
633
- config: z.ZodRecord<z.ZodString, z.ZodAny>;
490
+ metadata?: any;
491
+ }[] | undefined;
492
+ }>;
493
+ response: z.ZodObject<{
634
494
  messages: z.ZodArray<z.ZodObject<{
635
495
  role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
636
496
  content: z.ZodArray<z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
@@ -724,18 +584,18 @@ declare const CompleteChatHandlerResponse: z.ZodObject<{
724
584
  data: z.ZodString;
725
585
  metadata: z.ZodUndefined;
726
586
  }, "strip", z.ZodTypeAny, {
727
- data: string;
728
587
  name: string;
729
588
  modality: "tool-response";
730
589
  index: number;
731
590
  id: string;
591
+ data: string;
732
592
  metadata?: undefined;
733
593
  }, {
734
- data: string;
735
594
  name: string;
736
595
  modality: "tool-response";
737
596
  index: number;
738
597
  id: string;
598
+ data: string;
739
599
  metadata?: undefined;
740
600
  }>]>, "many">;
741
601
  metadata: z.ZodUndefined;
@@ -765,160 +625,15 @@ declare const CompleteChatHandlerResponse: z.ZodObject<{
765
625
  arguments: string;
766
626
  metadata?: undefined;
767
627
  } | {
768
- data: string;
769
628
  name: string;
770
629
  modality: "tool-response";
771
630
  index: number;
772
631
  id: string;
773
- metadata?: undefined;
774
- })[];
775
- metadata?: undefined;
776
- }, {
777
- role: "system" | "user" | "assistant" | "tool";
778
- content: ({
779
- value: string;
780
- modality: "text";
781
- metadata?: undefined;
782
- } | {
783
- value: {
784
- type: "base64";
785
- base64: string;
786
- media_type: "png" | "jpeg" | "webp" | "gif";
787
- } | {
788
- type: "url";
789
- url: string;
790
- };
791
- modality: "image";
792
- detail: "low" | "medium" | "high" | "auto";
793
- metadata?: undefined;
794
- } | {
795
- name: string;
796
- modality: "tool-call";
797
- index: number;
798
- id: string;
799
- arguments: string;
800
- metadata?: undefined;
801
- } | {
802
632
  data: string;
803
- name: string;
804
- modality: "tool-response";
805
- index: number;
806
- id: string;
807
633
  metadata?: undefined;
808
634
  })[];
809
635
  metadata?: undefined;
810
- }>, "many">;
811
- tools: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<"type", [z.ZodObject<z.objectUtil.extendShape<{
812
- type: z.ZodEnum<["function"]>;
813
- definition: z.ZodObject<{
814
- schema: z.ZodObject<{
815
- name: z.ZodString;
816
- description: z.ZodString;
817
- parameters: z.ZodAny;
818
- strict: z.ZodOptional<z.ZodBoolean>;
819
- }, "strip", z.ZodTypeAny, {
820
- name: string;
821
- description: string;
822
- strict?: boolean | undefined;
823
- parameters?: any;
824
- }, {
825
- name: string;
826
- description: string;
827
- strict?: boolean | undefined;
828
- parameters?: any;
829
- }>;
830
- }, "strip", z.ZodTypeAny, {
831
- schema: {
832
- name: string;
833
- description: string;
834
- strict?: boolean | undefined;
835
- parameters?: any;
836
- };
837
- }, {
838
- schema: {
839
- name: string;
840
- description: string;
841
- strict?: boolean | undefined;
842
- parameters?: any;
843
- };
844
- }>;
845
- }, {
846
- metadata: z.ZodTypeAny;
847
- }>, "strip", z.ZodTypeAny, {
848
- type: "function";
849
- definition: {
850
- schema: {
851
- name: string;
852
- description: string;
853
- strict?: boolean | undefined;
854
- parameters?: any;
855
- };
856
- };
857
- metadata?: any;
858
636
  }, {
859
- type: "function";
860
- definition: {
861
- schema: {
862
- name: string;
863
- description: string;
864
- strict?: boolean | undefined;
865
- parameters?: any;
866
- };
867
- };
868
- metadata?: any;
869
- }>]>, "many">>;
870
- }, "strip", z.ZodTypeAny, {
871
- config: Record<string, any>;
872
- messages: {
873
- role: "system" | "user" | "assistant" | "tool";
874
- content: ({
875
- value: string;
876
- modality: "text";
877
- metadata?: undefined;
878
- } | {
879
- value: {
880
- type: "base64";
881
- base64: string;
882
- media_type: "png" | "jpeg" | "webp" | "gif";
883
- } | {
884
- type: "url";
885
- url: string;
886
- };
887
- modality: "image";
888
- detail: "low" | "medium" | "high" | "auto";
889
- metadata?: undefined;
890
- } | {
891
- name: string;
892
- modality: "tool-call";
893
- index: number;
894
- id: string;
895
- arguments: string;
896
- metadata?: undefined;
897
- } | {
898
- data: string;
899
- name: string;
900
- modality: "tool-response";
901
- index: number;
902
- id: string;
903
- metadata?: undefined;
904
- })[];
905
- metadata?: undefined;
906
- }[];
907
- tools?: {
908
- type: "function";
909
- definition: {
910
- schema: {
911
- name: string;
912
- description: string;
913
- strict?: boolean | undefined;
914
- parameters?: any;
915
- };
916
- };
917
- metadata?: any;
918
- }[] | undefined;
919
- }, {
920
- config: Record<string, any>;
921
- messages: {
922
637
  role: "system" | "user" | "assistant" | "tool";
923
638
  content: ({
924
639
  value: string;
@@ -944,962 +659,168 @@ declare const CompleteChatHandlerResponse: z.ZodObject<{
944
659
  arguments: string;
945
660
  metadata?: undefined;
946
661
  } | {
947
- data: string;
948
662
  name: string;
949
663
  modality: "tool-response";
950
664
  index: number;
951
665
  id: string;
952
- metadata?: undefined;
953
- })[];
954
- metadata?: undefined;
955
- }[];
956
- tools?: {
957
- type: "function";
958
- definition: {
959
- schema: {
960
- name: string;
961
- description: string;
962
- strict?: boolean | undefined;
963
- parameters?: any;
964
- };
965
- };
966
- metadata?: any;
967
- }[] | undefined;
968
- }>;
969
- response: z.ZodObject<{
970
- messages: z.ZodArray<z.ZodObject<{
971
- role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
972
- content: z.ZodArray<z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
973
- modality: z.ZodLiteral<"text">;
974
- value: z.ZodString;
975
- metadata: z.ZodUndefined;
976
- }, "strip", z.ZodTypeAny, {
977
- value: string;
978
- modality: "text";
979
- metadata?: undefined;
980
- }, {
981
- value: string;
982
- modality: "text";
983
- metadata?: undefined;
984
- }>, z.ZodObject<{
985
- modality: z.ZodLiteral<"image">;
986
- detail: z.ZodEnum<["low", "medium", "high", "auto"]>;
987
- value: z.ZodDiscriminatedUnion<"type", [z.ZodObject<{
988
- type: z.ZodLiteral<"base64">;
989
- base64: z.ZodString;
990
- media_type: z.ZodEnum<["png", "jpeg", "webp", "gif"]>;
991
- }, "strip", z.ZodTypeAny, {
992
- type: "base64";
993
- base64: string;
994
- media_type: "png" | "jpeg" | "webp" | "gif";
995
- }, {
996
- type: "base64";
997
- base64: string;
998
- media_type: "png" | "jpeg" | "webp" | "gif";
999
- }>, z.ZodObject<{
1000
- type: z.ZodLiteral<"url">;
1001
- url: z.ZodString;
1002
- }, "strip", z.ZodTypeAny, {
1003
- type: "url";
1004
- url: string;
1005
- }, {
1006
- type: "url";
1007
- url: string;
1008
- }>]>;
1009
- metadata: z.ZodUndefined;
1010
- }, "strip", z.ZodTypeAny, {
1011
- value: {
1012
- type: "base64";
1013
- base64: string;
1014
- media_type: "png" | "jpeg" | "webp" | "gif";
1015
- } | {
1016
- type: "url";
1017
- url: string;
1018
- };
1019
- modality: "image";
1020
- detail: "low" | "medium" | "high" | "auto";
1021
- metadata?: undefined;
1022
- }, {
1023
- value: {
1024
- type: "base64";
1025
- base64: string;
1026
- media_type: "png" | "jpeg" | "webp" | "gif";
1027
- } | {
1028
- type: "url";
1029
- url: string;
1030
- };
1031
- modality: "image";
1032
- detail: "low" | "medium" | "high" | "auto";
1033
- metadata?: undefined;
1034
- }>, z.ZodObject<{
1035
- modality: z.ZodLiteral<"tool-call">;
1036
- index: z.ZodNumber;
1037
- id: z.ZodString;
1038
- name: z.ZodString;
1039
- arguments: z.ZodString;
1040
- metadata: z.ZodUndefined;
1041
- }, "strip", z.ZodTypeAny, {
1042
- modality: "tool-call";
1043
- index: number;
1044
- id: string;
1045
- name: string;
1046
- arguments: string;
1047
- metadata?: undefined;
1048
- }, {
1049
- modality: "tool-call";
1050
- index: number;
1051
- id: string;
1052
- name: string;
1053
- arguments: string;
1054
- metadata?: undefined;
1055
- }>, z.ZodObject<{
1056
- modality: z.ZodLiteral<"tool-response">;
1057
- index: z.ZodNumber;
1058
- id: z.ZodString;
1059
- name: z.ZodString;
1060
- data: z.ZodString;
1061
- metadata: z.ZodUndefined;
1062
- }, "strip", z.ZodTypeAny, {
1063
- modality: "tool-response";
1064
- index: number;
1065
- id: string;
1066
- name: string;
1067
- data: string;
1068
- metadata?: undefined;
1069
- }, {
1070
- modality: "tool-response";
1071
- index: number;
1072
- id: string;
1073
- name: string;
1074
- data: string;
1075
- metadata?: undefined;
1076
- }>]>, "many">;
1077
- metadata: z.ZodUndefined;
1078
- }, "strip", z.ZodTypeAny, {
1079
- role: "system" | "user" | "assistant" | "tool";
1080
- content: ({
1081
- value: string;
1082
- modality: "text";
1083
- metadata?: undefined;
1084
- } | {
1085
- value: {
1086
- type: "base64";
1087
- base64: string;
1088
- media_type: "png" | "jpeg" | "webp" | "gif";
1089
- } | {
1090
- type: "url";
1091
- url: string;
1092
- };
1093
- modality: "image";
1094
- detail: "low" | "medium" | "high" | "auto";
1095
- metadata?: undefined;
1096
- } | {
1097
- modality: "tool-call";
1098
- index: number;
1099
- id: string;
1100
- name: string;
1101
- arguments: string;
1102
- metadata?: undefined;
1103
- } | {
1104
- modality: "tool-response";
1105
- index: number;
1106
- id: string;
1107
- name: string;
1108
- data: string;
1109
- metadata?: undefined;
1110
- })[];
1111
- metadata?: undefined;
1112
- }, {
1113
- role: "system" | "user" | "assistant" | "tool";
1114
- content: ({
1115
- value: string;
1116
- modality: "text";
1117
- metadata?: undefined;
1118
- } | {
1119
- value: {
1120
- type: "base64";
1121
- base64: string;
1122
- media_type: "png" | "jpeg" | "webp" | "gif";
1123
- } | {
1124
- type: "url";
1125
- url: string;
1126
- };
1127
- modality: "image";
1128
- detail: "low" | "medium" | "high" | "auto";
1129
- metadata?: undefined;
1130
- } | {
1131
- modality: "tool-call";
1132
- index: number;
1133
- id: string;
1134
- name: string;
1135
- arguments: string;
1136
- metadata?: undefined;
1137
- } | {
1138
- modality: "tool-response";
1139
- index: number;
1140
- id: string;
1141
- name: string;
1142
- data: string;
1143
- metadata?: undefined;
1144
- })[];
1145
- metadata?: undefined;
1146
- }>, "many">;
1147
- usage: z.ZodOptional<z.ZodObject<{
1148
- promptTokens: z.ZodNumber;
1149
- completionTokens: z.ZodNumber;
1150
- totalTokens: z.ZodNumber;
1151
- }, "strip", z.ZodTypeAny, {
1152
- totalTokens: number;
1153
- promptTokens: number;
1154
- completionTokens: number;
1155
- }, {
1156
- totalTokens: number;
1157
- promptTokens: number;
1158
- completionTokens: number;
1159
- }>>;
1160
- logProbs: z.ZodOptional<z.ZodArray<z.ZodObject<z.objectUtil.extendShape<{
1161
- token: z.ZodString;
1162
- logProb: z.ZodNumber;
1163
- bytes: z.ZodNullable<z.ZodArray<z.ZodNumber, "many">>;
1164
- }, {
1165
- topLogProbs: z.ZodArray<z.ZodObject<{
1166
- token: z.ZodString;
1167
- logProb: z.ZodNumber;
1168
- bytes: z.ZodNullable<z.ZodArray<z.ZodNumber, "many">>;
1169
- }, "strip", z.ZodTypeAny, {
1170
- token: string;
1171
- logProb: number;
1172
- bytes: number[] | null;
1173
- }, {
1174
- token: string;
1175
- logProb: number;
1176
- bytes: number[] | null;
1177
- }>, "many">;
1178
- }>, "strip", z.ZodTypeAny, {
1179
- token: string;
1180
- logProb: number;
1181
- bytes: number[] | null;
1182
- topLogProbs: {
1183
- token: string;
1184
- logProb: number;
1185
- bytes: number[] | null;
1186
- }[];
1187
- }, {
1188
- token: string;
1189
- logProb: number;
1190
- bytes: number[] | null;
1191
- topLogProbs: {
1192
- token: string;
1193
- logProb: number;
1194
- bytes: number[] | null;
1195
- }[];
1196
- }>, "many">>;
1197
- }, "strip", z.ZodTypeAny, {
1198
- messages: {
1199
- role: "system" | "user" | "assistant" | "tool";
1200
- content: ({
1201
- value: string;
1202
- modality: "text";
1203
- metadata?: undefined;
1204
- } | {
1205
- value: {
1206
- type: "base64";
1207
- base64: string;
1208
- media_type: "png" | "jpeg" | "webp" | "gif";
1209
- } | {
1210
- type: "url";
1211
- url: string;
1212
- };
1213
- modality: "image";
1214
- detail: "low" | "medium" | "high" | "auto";
1215
- metadata?: undefined;
1216
- } | {
1217
- modality: "tool-call";
1218
- index: number;
1219
- id: string;
1220
- name: string;
1221
- arguments: string;
1222
- metadata?: undefined;
1223
- } | {
1224
- modality: "tool-response";
1225
- index: number;
1226
- id: string;
1227
- name: string;
1228
- data: string;
1229
- metadata?: undefined;
1230
- })[];
1231
- metadata?: undefined;
1232
- }[];
1233
- usage?: {
1234
- totalTokens: number;
1235
- promptTokens: number;
1236
- completionTokens: number;
1237
- } | undefined;
1238
- logProbs?: {
1239
- token: string;
1240
- logProb: number;
1241
- bytes: number[] | null;
1242
- topLogProbs: {
1243
- token: string;
1244
- logProb: number;
1245
- bytes: number[] | null;
1246
- }[];
1247
- }[] | undefined;
1248
- }, {
1249
- messages: {
1250
- role: "system" | "user" | "assistant" | "tool";
1251
- content: ({
1252
- value: string;
1253
- modality: "text";
1254
- metadata?: undefined;
1255
- } | {
1256
- value: {
1257
- type: "base64";
1258
- base64: string;
1259
- media_type: "png" | "jpeg" | "webp" | "gif";
1260
- } | {
1261
- type: "url";
1262
- url: string;
1263
- };
1264
- modality: "image";
1265
- detail: "low" | "medium" | "high" | "auto";
1266
- metadata?: undefined;
1267
- } | {
1268
- modality: "tool-call";
1269
- index: number;
1270
- id: string;
1271
- name: string;
1272
- arguments: string;
1273
- metadata?: undefined;
1274
- } | {
1275
- modality: "tool-response";
1276
- index: number;
1277
- id: string;
1278
- name: string;
1279
- data: string;
1280
- metadata?: undefined;
1281
- })[];
1282
- metadata?: undefined;
1283
- }[];
1284
- usage?: {
1285
- totalTokens: number;
1286
- promptTokens: number;
1287
- completionTokens: number;
1288
- } | undefined;
1289
- logProbs?: {
1290
- token: string;
1291
- logProb: number;
1292
- bytes: number[] | null;
1293
- topLogProbs: {
1294
- token: string;
1295
- logProb: number;
1296
- bytes: number[] | null;
1297
- }[];
1298
- }[] | undefined;
1299
- }>;
1300
- latencyInMs: z.ZodNumber;
1301
- metadataForCallbacks: z.ZodOptional<z.ZodAny>;
1302
- provider: z.ZodObject<{
1303
- request: z.ZodAny;
1304
- response: z.ZodAny;
1305
- }, "strip", z.ZodTypeAny, {
1306
- request?: any;
1307
- response?: any;
1308
- }, {
1309
- request?: any;
1310
- response?: any;
1311
- }>;
1312
- }, "strip", z.ZodTypeAny, {
1313
- request: {
1314
- config: Record<string, any>;
1315
- messages: {
1316
- role: "system" | "user" | "assistant" | "tool";
1317
- content: ({
1318
- value: string;
1319
- modality: "text";
1320
- metadata?: undefined;
1321
- } | {
1322
- value: {
1323
- type: "base64";
1324
- base64: string;
1325
- media_type: "png" | "jpeg" | "webp" | "gif";
1326
- } | {
1327
- type: "url";
1328
- url: string;
1329
- };
1330
- modality: "image";
1331
- detail: "low" | "medium" | "high" | "auto";
1332
- metadata?: undefined;
1333
- } | {
1334
- name: string;
1335
- modality: "tool-call";
1336
- index: number;
1337
- id: string;
1338
- arguments: string;
1339
- metadata?: undefined;
1340
- } | {
1341
- data: string;
1342
- name: string;
1343
- modality: "tool-response";
1344
- index: number;
1345
- id: string;
1346
- metadata?: undefined;
1347
- })[];
1348
- metadata?: undefined;
1349
- }[];
1350
- tools?: {
1351
- type: "function";
1352
- definition: {
1353
- schema: {
1354
- name: string;
1355
- description: string;
1356
- strict?: boolean | undefined;
1357
- parameters?: any;
1358
- };
1359
- };
1360
- metadata?: any;
1361
- }[] | undefined;
1362
- };
1363
- response: {
1364
- messages: {
1365
- role: "system" | "user" | "assistant" | "tool";
1366
- content: ({
1367
- value: string;
1368
- modality: "text";
1369
- metadata?: undefined;
1370
- } | {
1371
- value: {
1372
- type: "base64";
1373
- base64: string;
1374
- media_type: "png" | "jpeg" | "webp" | "gif";
1375
- } | {
1376
- type: "url";
1377
- url: string;
1378
- };
1379
- modality: "image";
1380
- detail: "low" | "medium" | "high" | "auto";
1381
- metadata?: undefined;
1382
- } | {
1383
- modality: "tool-call";
1384
- index: number;
1385
- id: string;
1386
- name: string;
1387
- arguments: string;
1388
- metadata?: undefined;
1389
- } | {
1390
- modality: "tool-response";
1391
- index: number;
1392
- id: string;
1393
- name: string;
1394
- data: string;
1395
- metadata?: undefined;
1396
- })[];
1397
- metadata?: undefined;
1398
- }[];
1399
- usage?: {
1400
- totalTokens: number;
1401
- promptTokens: number;
1402
- completionTokens: number;
1403
- } | undefined;
1404
- logProbs?: {
1405
- token: string;
1406
- logProb: number;
1407
- bytes: number[] | null;
1408
- topLogProbs: {
1409
- token: string;
1410
- logProb: number;
1411
- bytes: number[] | null;
1412
- }[];
1413
- }[] | undefined;
1414
- };
1415
- latencyInMs: number;
1416
- provider: {
1417
- request?: any;
1418
- response?: any;
1419
- };
1420
- metadataForCallbacks?: any;
1421
- }, {
1422
- request: {
1423
- config: Record<string, any>;
1424
- messages: {
1425
- role: "system" | "user" | "assistant" | "tool";
1426
- content: ({
1427
- value: string;
1428
- modality: "text";
1429
- metadata?: undefined;
1430
- } | {
1431
- value: {
1432
- type: "base64";
1433
- base64: string;
1434
- media_type: "png" | "jpeg" | "webp" | "gif";
1435
- } | {
1436
- type: "url";
1437
- url: string;
1438
- };
1439
- modality: "image";
1440
- detail: "low" | "medium" | "high" | "auto";
1441
- metadata?: undefined;
1442
- } | {
1443
- name: string;
1444
- modality: "tool-call";
1445
- index: number;
1446
- id: string;
1447
- arguments: string;
1448
- metadata?: undefined;
1449
- } | {
1450
- data: string;
1451
- name: string;
1452
- modality: "tool-response";
1453
- index: number;
1454
- id: string;
1455
- metadata?: undefined;
1456
- })[];
1457
- metadata?: undefined;
1458
- }[];
1459
- tools?: {
1460
- type: "function";
1461
- definition: {
1462
- schema: {
1463
- name: string;
1464
- description: string;
1465
- strict?: boolean | undefined;
1466
- parameters?: any;
1467
- };
1468
- };
1469
- metadata?: any;
1470
- }[] | undefined;
1471
- };
1472
- response: {
1473
- messages: {
1474
- role: "system" | "user" | "assistant" | "tool";
1475
- content: ({
1476
- value: string;
1477
- modality: "text";
1478
- metadata?: undefined;
1479
- } | {
1480
- value: {
1481
- type: "base64";
1482
- base64: string;
1483
- media_type: "png" | "jpeg" | "webp" | "gif";
1484
- } | {
1485
- type: "url";
1486
- url: string;
1487
- };
1488
- modality: "image";
1489
- detail: "low" | "medium" | "high" | "auto";
1490
- metadata?: undefined;
1491
- } | {
1492
- modality: "tool-call";
1493
- index: number;
1494
- id: string;
1495
- name: string;
1496
- arguments: string;
1497
- metadata?: undefined;
1498
- } | {
1499
- modality: "tool-response";
1500
- index: number;
1501
- id: string;
1502
- name: string;
1503
- data: string;
1504
- metadata?: undefined;
1505
- })[];
1506
- metadata?: undefined;
1507
- }[];
1508
- usage?: {
1509
- totalTokens: number;
1510
- promptTokens: number;
1511
- completionTokens: number;
1512
- } | undefined;
1513
- logProbs?: {
1514
- token: string;
1515
- logProb: number;
1516
- bytes: number[] | null;
1517
- topLogProbs: {
1518
- token: string;
1519
- logProb: number;
1520
- bytes: number[] | null;
1521
- }[];
1522
- }[] | undefined;
1523
- };
1524
- latencyInMs: number;
1525
- provider: {
1526
- request?: any;
1527
- response?: any;
1528
- };
1529
- metadataForCallbacks?: any;
1530
- }>;
1531
- type CompleteChatHandlerResponseType = z.infer<typeof CompleteChatHandlerResponse>;
1532
- type CompleteChatCallbackType<M = any> = {
1533
- onChatStart?: (metadata?: M) => Promise<void> | void;
1534
- onChatCached?: (metadata?: M, response?: CompleteChatHandlerResponseType) => Promise<void> | void;
1535
- onChatComplete?: (metadata?: M, response?: CompleteChatHandlerResponseType) => Promise<void> | void;
1536
- onChatError?: (metadata?: M, error?: GatewayError) => Promise<void> | void;
1537
- };
1538
-
1539
- declare function handleCompleteChat(request: CompleteChatHandlerRequestType, client: HttpClient): Promise<CompleteChatHandlerResponseType>;
1540
-
1541
- declare const GetEmbeddingsHandlerRequest: z.ZodObject<{
1542
- model: z.ZodType<EmbeddingModelV1<{
1543
- description: string;
1544
- name: string;
1545
- modalities: ["text" | "token", ...("text" | "token")[]];
1546
- maxInputTokens: number;
1547
- maxOutputTokens: number;
1548
- config: {
1549
- def: Record<string, {
1550
- type: "multi-string";
1551
- param: string;
1552
- title: string;
1553
- description: string;
1554
- max: number;
1555
- } | {
1556
- type: "range";
1557
- param: string;
1558
- title: string;
1559
- description: string;
1560
- max: number;
1561
- min: number;
1562
- step: number;
1563
- default: number;
1564
- } | {
1565
- type: "select-string";
1566
- param: string;
1567
- title: string;
1568
- description: string;
1569
- default: string;
1570
- choices: string[];
1571
- } | {
1572
- type: "object-schema";
1573
- param: string;
1574
- title: string;
1575
- description: string;
1576
- objectSchema?: any;
1577
- } | {
1578
- type: "select-boolean";
1579
- param: string;
1580
- title: string;
1581
- description: string;
1582
- default: boolean | null;
1583
- }>;
1584
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
1585
- };
1586
- }>, z.ZodTypeDef, EmbeddingModelV1<{
1587
- description: string;
1588
- name: string;
1589
- modalities: ["text" | "token", ...("text" | "token")[]];
1590
- maxInputTokens: number;
1591
- maxOutputTokens: number;
1592
- config: {
1593
- def: Record<string, {
1594
- type: "multi-string";
1595
- param: string;
1596
- title: string;
1597
- description: string;
1598
- max: number;
1599
- } | {
1600
- type: "range";
1601
- param: string;
1602
- title: string;
1603
- description: string;
1604
- max: number;
1605
- min: number;
1606
- step: number;
1607
- default: number;
1608
- } | {
1609
- type: "select-string";
1610
- param: string;
1611
- title: string;
1612
- description: string;
1613
- default: string;
1614
- choices: string[];
1615
- } | {
1616
- type: "object-schema";
1617
- param: string;
1618
- title: string;
1619
- description: string;
1620
- objectSchema?: any;
1621
- } | {
1622
- type: "select-boolean";
1623
- param: string;
1624
- title: string;
1625
- description: string;
1626
- default: boolean | null;
1627
- }>;
1628
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
1629
- };
1630
- }>>;
1631
- config: z.ZodRecord<z.ZodString, z.ZodAny>;
1632
- embeddingRequests: z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
1633
- modality: z.ZodLiteral<"text">;
1634
- metadata: z.ZodUndefined;
1635
- requests: z.ZodArray<z.ZodString, "many">;
1636
- }, "strip", z.ZodTypeAny, {
1637
- modality: "text";
1638
- requests: string[];
1639
- metadata?: undefined;
1640
- }, {
1641
- modality: "text";
1642
- requests: string[];
1643
- metadata?: undefined;
1644
- }>, z.ZodObject<{
1645
- modality: z.ZodLiteral<"token">;
1646
- metadata: z.ZodUndefined;
1647
- requests: z.ZodArray<z.ZodArray<z.ZodNumber, "many">, "many">;
1648
- }, "strip", z.ZodTypeAny, {
1649
- modality: "token";
1650
- requests: number[][];
1651
- metadata?: undefined;
1652
- }, {
1653
- modality: "token";
1654
- requests: number[][];
1655
- metadata?: undefined;
1656
- }>]>;
1657
- callbacks: z.ZodOptional<z.ZodArray<z.ZodType<GetEmbeddingsCallbackType<any>, z.ZodTypeDef, GetEmbeddingsCallbackType<any>>, "atleastone">>;
1658
- metadataForCallbacks: z.ZodOptional<z.ZodAny>;
1659
- }, "strip", z.ZodTypeAny, {
1660
- config: Record<string, any>;
1661
- model: EmbeddingModelV1<{
1662
- description: string;
1663
- name: string;
1664
- modalities: ["text" | "token", ...("text" | "token")[]];
1665
- maxInputTokens: number;
1666
- maxOutputTokens: number;
1667
- config: {
1668
- def: Record<string, {
1669
- type: "multi-string";
1670
- param: string;
1671
- title: string;
1672
- description: string;
1673
- max: number;
1674
- } | {
1675
- type: "range";
1676
- param: string;
1677
- title: string;
1678
- description: string;
1679
- max: number;
1680
- min: number;
1681
- step: number;
1682
- default: number;
1683
- } | {
1684
- type: "select-string";
1685
- param: string;
1686
- title: string;
1687
- description: string;
1688
- default: string;
1689
- choices: string[];
1690
- } | {
1691
- type: "object-schema";
1692
- param: string;
1693
- title: string;
1694
- description: string;
1695
- objectSchema?: any;
1696
- } | {
1697
- type: "select-boolean";
1698
- param: string;
1699
- title: string;
1700
- description: string;
1701
- default: boolean | null;
1702
- }>;
1703
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
1704
- };
1705
- }>;
1706
- embeddingRequests: {
1707
- modality: "text";
1708
- requests: string[];
1709
- metadata?: undefined;
1710
- } | {
1711
- modality: "token";
1712
- requests: number[][];
1713
- metadata?: undefined;
1714
- };
1715
- callbacks?: [GetEmbeddingsCallbackType<any>, ...GetEmbeddingsCallbackType<any>[]] | undefined;
1716
- metadataForCallbacks?: any;
1717
- }, {
1718
- config: Record<string, any>;
1719
- model: EmbeddingModelV1<{
1720
- description: string;
1721
- name: string;
1722
- modalities: ["text" | "token", ...("text" | "token")[]];
1723
- maxInputTokens: number;
1724
- maxOutputTokens: number;
1725
- config: {
1726
- def: Record<string, {
1727
- type: "multi-string";
1728
- param: string;
1729
- title: string;
1730
- description: string;
1731
- max: number;
1732
- } | {
1733
- type: "range";
1734
- param: string;
1735
- title: string;
1736
- description: string;
1737
- max: number;
1738
- min: number;
1739
- step: number;
1740
- default: number;
1741
- } | {
1742
- type: "select-string";
1743
- param: string;
1744
- title: string;
1745
- description: string;
1746
- default: string;
1747
- choices: string[];
1748
- } | {
1749
- type: "object-schema";
1750
- param: string;
1751
- title: string;
1752
- description: string;
1753
- objectSchema?: any;
1754
- } | {
1755
- type: "select-boolean";
1756
- param: string;
1757
- title: string;
1758
- description: string;
1759
- default: boolean | null;
1760
- }>;
1761
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
1762
- };
1763
- }>;
1764
- embeddingRequests: {
1765
- modality: "text";
1766
- requests: string[];
1767
- metadata?: undefined;
1768
- } | {
1769
- modality: "token";
1770
- requests: number[][];
1771
- metadata?: undefined;
1772
- };
1773
- callbacks?: [GetEmbeddingsCallbackType<any>, ...GetEmbeddingsCallbackType<any>[]] | undefined;
1774
- metadataForCallbacks?: any;
1775
- }>;
1776
- type GetEmbeddingsHandlerRequestType = z.infer<typeof GetEmbeddingsHandlerRequest>;
1777
- declare const GetEmbeddingsHandlerResponse: z.ZodObject<{
1778
- request: z.ZodObject<{
1779
- config: z.ZodRecord<z.ZodString, z.ZodAny>;
1780
- embeddingRequests: z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
1781
- modality: z.ZodLiteral<"text">;
1782
- metadata: z.ZodUndefined;
1783
- requests: z.ZodArray<z.ZodString, "many">;
1784
- }, "strip", z.ZodTypeAny, {
1785
- modality: "text";
1786
- requests: string[];
1787
- metadata?: undefined;
1788
- }, {
1789
- modality: "text";
1790
- requests: string[];
1791
- metadata?: undefined;
1792
- }>, z.ZodObject<{
1793
- modality: z.ZodLiteral<"token">;
1794
- metadata: z.ZodUndefined;
1795
- requests: z.ZodArray<z.ZodArray<z.ZodNumber, "many">, "many">;
1796
- }, "strip", z.ZodTypeAny, {
1797
- modality: "token";
1798
- requests: number[][];
1799
- metadata?: undefined;
1800
- }, {
1801
- modality: "token";
1802
- requests: number[][];
1803
- metadata?: undefined;
1804
- }>]>;
1805
- }, "strip", z.ZodTypeAny, {
1806
- config: Record<string, any>;
1807
- embeddingRequests: {
1808
- modality: "text";
1809
- requests: string[];
1810
- metadata?: undefined;
1811
- } | {
1812
- modality: "token";
1813
- requests: number[][];
1814
- metadata?: undefined;
1815
- };
1816
- }, {
1817
- config: Record<string, any>;
1818
- embeddingRequests: {
1819
- modality: "text";
1820
- requests: string[];
1821
- metadata?: undefined;
1822
- } | {
1823
- modality: "token";
1824
- requests: number[][];
1825
- metadata?: undefined;
1826
- };
1827
- }>;
1828
- response: z.ZodDiscriminatedUnion<"encodingFormat", [z.ZodObject<{
1829
- encodingFormat: z.ZodLiteral<"float">;
1830
- embeddings: z.ZodArray<z.ZodObject<{
1831
- index: z.ZodNumber;
1832
- embedding: z.ZodArray<z.ZodNumber, "many">;
1833
- }, "strip", z.ZodTypeAny, {
1834
- index: number;
1835
- embedding: number[];
1836
- }, {
1837
- index: number;
1838
- embedding: number[];
666
+ data: string;
667
+ metadata?: undefined;
668
+ })[];
669
+ metadata?: undefined;
1839
670
  }>, "many">;
1840
671
  usage: z.ZodOptional<z.ZodObject<{
672
+ promptTokens: z.ZodNumber;
673
+ completionTokens: z.ZodNumber;
1841
674
  totalTokens: z.ZodNumber;
1842
675
  }, "strip", z.ZodTypeAny, {
1843
676
  totalTokens: number;
677
+ promptTokens: number;
678
+ completionTokens: number;
1844
679
  }, {
1845
680
  totalTokens: number;
681
+ promptTokens: number;
682
+ completionTokens: number;
1846
683
  }>>;
1847
- }, "strip", z.ZodTypeAny, {
1848
- encodingFormat: "float";
1849
- embeddings: {
1850
- index: number;
1851
- embedding: number[];
1852
- }[];
1853
- usage?: {
1854
- totalTokens: number;
1855
- } | undefined;
1856
- }, {
1857
- encodingFormat: "float";
1858
- embeddings: {
1859
- index: number;
1860
- embedding: number[];
1861
- }[];
1862
- usage?: {
1863
- totalTokens: number;
1864
- } | undefined;
1865
- }>, z.ZodObject<{
1866
- encodingFormat: z.ZodLiteral<"base64">;
1867
- embeddings: z.ZodArray<z.ZodObject<{
1868
- index: z.ZodNumber;
1869
- embedding: z.ZodString;
1870
- }, "strip", z.ZodTypeAny, {
1871
- index: number;
1872
- embedding: string;
684
+ logProbs: z.ZodOptional<z.ZodArray<z.ZodObject<z.objectUtil.extendShape<{
685
+ token: z.ZodString;
686
+ logProb: z.ZodNumber;
687
+ bytes: z.ZodNullable<z.ZodArray<z.ZodNumber, "many">>;
1873
688
  }, {
1874
- index: number;
1875
- embedding: string;
1876
- }>, "many">;
1877
- usage: z.ZodOptional<z.ZodObject<{
1878
- totalTokens: z.ZodNumber;
1879
- }, "strip", z.ZodTypeAny, {
1880
- totalTokens: number;
689
+ topLogProbs: z.ZodArray<z.ZodObject<{
690
+ token: z.ZodString;
691
+ logProb: z.ZodNumber;
692
+ bytes: z.ZodNullable<z.ZodArray<z.ZodNumber, "many">>;
693
+ }, "strip", z.ZodTypeAny, {
694
+ token: string;
695
+ logProb: number;
696
+ bytes: number[] | null;
697
+ }, {
698
+ token: string;
699
+ logProb: number;
700
+ bytes: number[] | null;
701
+ }>, "many">;
702
+ }>, "strip", z.ZodTypeAny, {
703
+ token: string;
704
+ logProb: number;
705
+ bytes: number[] | null;
706
+ topLogProbs: {
707
+ token: string;
708
+ logProb: number;
709
+ bytes: number[] | null;
710
+ }[];
1881
711
  }, {
1882
- totalTokens: number;
1883
- }>>;
712
+ token: string;
713
+ logProb: number;
714
+ bytes: number[] | null;
715
+ topLogProbs: {
716
+ token: string;
717
+ logProb: number;
718
+ bytes: number[] | null;
719
+ }[];
720
+ }>, "many">>;
1884
721
  }, "strip", z.ZodTypeAny, {
1885
- encodingFormat: "base64";
1886
- embeddings: {
1887
- index: number;
1888
- embedding: string;
722
+ messages: {
723
+ role: "system" | "user" | "assistant" | "tool";
724
+ content: ({
725
+ value: string;
726
+ modality: "text";
727
+ metadata?: undefined;
728
+ } | {
729
+ value: {
730
+ type: "base64";
731
+ base64: string;
732
+ media_type: "png" | "jpeg" | "webp" | "gif";
733
+ } | {
734
+ type: "url";
735
+ url: string;
736
+ };
737
+ modality: "image";
738
+ detail: "low" | "medium" | "high" | "auto";
739
+ metadata?: undefined;
740
+ } | {
741
+ name: string;
742
+ modality: "tool-call";
743
+ index: number;
744
+ id: string;
745
+ arguments: string;
746
+ metadata?: undefined;
747
+ } | {
748
+ name: string;
749
+ modality: "tool-response";
750
+ index: number;
751
+ id: string;
752
+ data: string;
753
+ metadata?: undefined;
754
+ })[];
755
+ metadata?: undefined;
1889
756
  }[];
1890
757
  usage?: {
1891
758
  totalTokens: number;
759
+ promptTokens: number;
760
+ completionTokens: number;
1892
761
  } | undefined;
762
+ logProbs?: {
763
+ token: string;
764
+ logProb: number;
765
+ bytes: number[] | null;
766
+ topLogProbs: {
767
+ token: string;
768
+ logProb: number;
769
+ bytes: number[] | null;
770
+ }[];
771
+ }[] | undefined;
1893
772
  }, {
1894
- encodingFormat: "base64";
1895
- embeddings: {
1896
- index: number;
1897
- embedding: string;
773
+ messages: {
774
+ role: "system" | "user" | "assistant" | "tool";
775
+ content: ({
776
+ value: string;
777
+ modality: "text";
778
+ metadata?: undefined;
779
+ } | {
780
+ value: {
781
+ type: "base64";
782
+ base64: string;
783
+ media_type: "png" | "jpeg" | "webp" | "gif";
784
+ } | {
785
+ type: "url";
786
+ url: string;
787
+ };
788
+ modality: "image";
789
+ detail: "low" | "medium" | "high" | "auto";
790
+ metadata?: undefined;
791
+ } | {
792
+ name: string;
793
+ modality: "tool-call";
794
+ index: number;
795
+ id: string;
796
+ arguments: string;
797
+ metadata?: undefined;
798
+ } | {
799
+ name: string;
800
+ modality: "tool-response";
801
+ index: number;
802
+ id: string;
803
+ data: string;
804
+ metadata?: undefined;
805
+ })[];
806
+ metadata?: undefined;
1898
807
  }[];
1899
808
  usage?: {
1900
809
  totalTokens: number;
810
+ promptTokens: number;
811
+ completionTokens: number;
1901
812
  } | undefined;
1902
- }>]>;
813
+ logProbs?: {
814
+ token: string;
815
+ logProb: number;
816
+ bytes: number[] | null;
817
+ topLogProbs: {
818
+ token: string;
819
+ logProb: number;
820
+ bytes: number[] | null;
821
+ }[];
822
+ }[] | undefined;
823
+ }>;
1903
824
  latencyInMs: z.ZodNumber;
1904
825
  metadataForCallbacks: z.ZodOptional<z.ZodAny>;
1905
826
  provider: z.ZodObject<{
@@ -1915,34 +836,105 @@ declare const GetEmbeddingsHandlerResponse: z.ZodObject<{
1915
836
  }, "strip", z.ZodTypeAny, {
1916
837
  request: {
1917
838
  config: Record<string, any>;
1918
- embeddingRequests: {
1919
- modality: "text";
1920
- requests: string[];
839
+ messages: {
840
+ role: "system" | "user" | "assistant" | "tool";
841
+ content: ({
842
+ value: string;
843
+ modality: "text";
844
+ metadata?: undefined;
845
+ } | {
846
+ value: {
847
+ type: "base64";
848
+ base64: string;
849
+ media_type: "png" | "jpeg" | "webp" | "gif";
850
+ } | {
851
+ type: "url";
852
+ url: string;
853
+ };
854
+ modality: "image";
855
+ detail: "low" | "medium" | "high" | "auto";
856
+ metadata?: undefined;
857
+ } | {
858
+ name: string;
859
+ modality: "tool-call";
860
+ index: number;
861
+ id: string;
862
+ arguments: string;
863
+ metadata?: undefined;
864
+ } | {
865
+ data: string;
866
+ name: string;
867
+ modality: "tool-response";
868
+ index: number;
869
+ id: string;
870
+ metadata?: undefined;
871
+ })[];
1921
872
  metadata?: undefined;
1922
- } | {
1923
- modality: "token";
1924
- requests: number[][];
873
+ }[];
874
+ tools?: {
875
+ type: "function";
876
+ definition: {
877
+ schema: {
878
+ name: string;
879
+ description: string;
880
+ strict?: boolean | undefined;
881
+ parameters?: any;
882
+ };
883
+ };
884
+ metadata?: any;
885
+ }[] | undefined;
886
+ };
887
+ response: {
888
+ messages: {
889
+ role: "system" | "user" | "assistant" | "tool";
890
+ content: ({
891
+ value: string;
892
+ modality: "text";
893
+ metadata?: undefined;
894
+ } | {
895
+ value: {
896
+ type: "base64";
897
+ base64: string;
898
+ media_type: "png" | "jpeg" | "webp" | "gif";
899
+ } | {
900
+ type: "url";
901
+ url: string;
902
+ };
903
+ modality: "image";
904
+ detail: "low" | "medium" | "high" | "auto";
905
+ metadata?: undefined;
906
+ } | {
907
+ name: string;
908
+ modality: "tool-call";
909
+ index: number;
910
+ id: string;
911
+ arguments: string;
912
+ metadata?: undefined;
913
+ } | {
914
+ name: string;
915
+ modality: "tool-response";
916
+ index: number;
917
+ id: string;
918
+ data: string;
919
+ metadata?: undefined;
920
+ })[];
1925
921
  metadata?: undefined;
1926
- };
1927
- };
1928
- response: {
1929
- encodingFormat: "float";
1930
- embeddings: {
1931
- index: number;
1932
- embedding: number[];
1933
- }[];
1934
- usage?: {
1935
- totalTokens: number;
1936
- } | undefined;
1937
- } | {
1938
- encodingFormat: "base64";
1939
- embeddings: {
1940
- index: number;
1941
- embedding: string;
1942
922
  }[];
1943
923
  usage?: {
1944
924
  totalTokens: number;
925
+ promptTokens: number;
926
+ completionTokens: number;
1945
927
  } | undefined;
928
+ logProbs?: {
929
+ token: string;
930
+ logProb: number;
931
+ bytes: number[] | null;
932
+ topLogProbs: {
933
+ token: string;
934
+ logProb: number;
935
+ bytes: number[] | null;
936
+ }[];
937
+ }[] | undefined;
1946
938
  };
1947
939
  latencyInMs: number;
1948
940
  provider: {
@@ -1953,579 +945,344 @@ declare const GetEmbeddingsHandlerResponse: z.ZodObject<{
1953
945
  }, {
1954
946
  request: {
1955
947
  config: Record<string, any>;
1956
- embeddingRequests: {
1957
- modality: "text";
1958
- requests: string[];
1959
- metadata?: undefined;
1960
- } | {
1961
- modality: "token";
1962
- requests: number[][];
1963
- metadata?: undefined;
1964
- };
1965
- };
1966
- response: {
1967
- encodingFormat: "float";
1968
- embeddings: {
1969
- index: number;
1970
- embedding: number[];
1971
- }[];
1972
- usage?: {
1973
- totalTokens: number;
1974
- } | undefined;
1975
- } | {
1976
- encodingFormat: "base64";
1977
- embeddings: {
1978
- index: number;
1979
- embedding: string;
1980
- }[];
1981
- usage?: {
1982
- totalTokens: number;
1983
- } | undefined;
1984
- };
1985
- latencyInMs: number;
1986
- provider: {
1987
- request?: any;
1988
- response?: any;
1989
- };
1990
- metadataForCallbacks?: any;
1991
- }>;
1992
- type GetEmbeddingsHandlerResponseType = z.infer<typeof GetEmbeddingsHandlerResponse>;
1993
- type GetEmbeddingsCallbackType<M = any> = {
1994
- onGetEmbeddingsStart?: (metadata?: M) => Promise<void> | void;
1995
- onGetEmbeddingsCached?: (metadata?: M, response?: GetEmbeddingsHandlerResponseType) => Promise<void> | void;
1996
- onGetEmbeddingsComplete?: (metadata?: M, response?: GetEmbeddingsHandlerResponseType) => Promise<void> | void;
1997
- onGetEmbeddingsError?: (metadata?: M, error?: GatewayError) => Promise<void> | void;
1998
- };
1999
-
2000
- declare function handleGetEmbeddings(request: GetEmbeddingsHandlerRequestType, client: HttpClient): Promise<GetEmbeddingsHandlerResponseType>;
2001
-
2002
- declare const StreamChatHandlerRequest: z.ZodObject<{
2003
- model: z.ZodType<ChatModelV1<{
2004
- name: string;
2005
- description: string;
2006
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
2007
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
2008
- maxInputTokens: number;
2009
- maxOutputTokens: number;
2010
- config: {
2011
- def: Record<string, {
2012
- type: "multi-string";
2013
- param: string;
2014
- title: string;
2015
- description: string;
2016
- max: number;
2017
- } | {
2018
- type: "range";
2019
- param: string;
2020
- title: string;
2021
- description: string;
2022
- max: number;
2023
- min: number;
2024
- step: number;
2025
- default: number;
2026
- } | {
2027
- type: "select-string";
2028
- param: string;
2029
- title: string;
2030
- description: string;
2031
- default: string;
2032
- choices: string[];
2033
- } | {
2034
- type: "object-schema";
2035
- param: string;
2036
- title: string;
2037
- description: string;
2038
- objectSchema?: any;
2039
- } | {
2040
- type: "select-boolean";
2041
- param: string;
2042
- title: string;
2043
- description: string;
2044
- default: boolean | null;
2045
- }>;
2046
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
2047
- };
2048
- }>, z.ZodTypeDef, ChatModelV1<{
2049
- name: string;
2050
- description: string;
2051
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
2052
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
2053
- maxInputTokens: number;
2054
- maxOutputTokens: number;
2055
- config: {
2056
- def: Record<string, {
2057
- type: "multi-string";
2058
- param: string;
2059
- title: string;
2060
- description: string;
2061
- max: number;
2062
- } | {
2063
- type: "range";
2064
- param: string;
2065
- title: string;
2066
- description: string;
2067
- max: number;
2068
- min: number;
2069
- step: number;
2070
- default: number;
948
+ messages: {
949
+ role: "system" | "user" | "assistant" | "tool";
950
+ content: ({
951
+ value: string;
952
+ modality: "text";
953
+ metadata?: undefined;
2071
954
  } | {
2072
- type: "select-string";
2073
- param: string;
2074
- title: string;
2075
- description: string;
2076
- default: string;
2077
- choices: string[];
955
+ value: {
956
+ type: "base64";
957
+ base64: string;
958
+ media_type: "png" | "jpeg" | "webp" | "gif";
959
+ } | {
960
+ type: "url";
961
+ url: string;
962
+ };
963
+ modality: "image";
964
+ detail: "low" | "medium" | "high" | "auto";
965
+ metadata?: undefined;
2078
966
  } | {
2079
- type: "object-schema";
2080
- param: string;
2081
- title: string;
2082
- description: string;
2083
- objectSchema?: any;
967
+ name: string;
968
+ modality: "tool-call";
969
+ index: number;
970
+ id: string;
971
+ arguments: string;
972
+ metadata?: undefined;
2084
973
  } | {
2085
- type: "select-boolean";
2086
- param: string;
2087
- title: string;
2088
- description: string;
2089
- default: boolean | null;
2090
- }>;
2091
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
2092
- };
2093
- }>>;
2094
- config: z.ZodRecord<z.ZodString, z.ZodAny>;
2095
- messages: z.ZodArray<z.ZodObject<{
2096
- role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
2097
- content: z.ZodArray<z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
2098
- modality: z.ZodLiteral<"text">;
2099
- value: z.ZodString;
2100
- metadata: z.ZodUndefined;
2101
- }, "strip", z.ZodTypeAny, {
2102
- value: string;
2103
- modality: "text";
2104
- metadata?: undefined;
2105
- }, {
2106
- value: string;
2107
- modality: "text";
974
+ data: string;
975
+ name: string;
976
+ modality: "tool-response";
977
+ index: number;
978
+ id: string;
979
+ metadata?: undefined;
980
+ })[];
2108
981
  metadata?: undefined;
2109
- }>, z.ZodObject<{
2110
- modality: z.ZodLiteral<"image">;
2111
- detail: z.ZodEnum<["low", "medium", "high", "auto"]>;
2112
- value: z.ZodDiscriminatedUnion<"type", [z.ZodObject<{
2113
- type: z.ZodLiteral<"base64">;
2114
- base64: z.ZodString;
2115
- media_type: z.ZodEnum<["png", "jpeg", "webp", "gif"]>;
2116
- }, "strip", z.ZodTypeAny, {
2117
- type: "base64";
2118
- base64: string;
2119
- media_type: "png" | "jpeg" | "webp" | "gif";
2120
- }, {
2121
- type: "base64";
2122
- base64: string;
2123
- media_type: "png" | "jpeg" | "webp" | "gif";
2124
- }>, z.ZodObject<{
2125
- type: z.ZodLiteral<"url">;
2126
- url: z.ZodString;
2127
- }, "strip", z.ZodTypeAny, {
2128
- type: "url";
2129
- url: string;
2130
- }, {
2131
- type: "url";
2132
- url: string;
2133
- }>]>;
2134
- metadata: z.ZodUndefined;
2135
- }, "strip", z.ZodTypeAny, {
2136
- value: {
2137
- type: "base64";
2138
- base64: string;
2139
- media_type: "png" | "jpeg" | "webp" | "gif";
2140
- } | {
2141
- type: "url";
2142
- url: string;
982
+ }[];
983
+ tools?: {
984
+ type: "function";
985
+ definition: {
986
+ schema: {
987
+ name: string;
988
+ description: string;
989
+ strict?: boolean | undefined;
990
+ parameters?: any;
991
+ };
2143
992
  };
2144
- modality: "image";
2145
- detail: "low" | "medium" | "high" | "auto";
2146
- metadata?: undefined;
2147
- }, {
2148
- value: {
2149
- type: "base64";
2150
- base64: string;
2151
- media_type: "png" | "jpeg" | "webp" | "gif";
993
+ metadata?: any;
994
+ }[] | undefined;
995
+ };
996
+ response: {
997
+ messages: {
998
+ role: "system" | "user" | "assistant" | "tool";
999
+ content: ({
1000
+ value: string;
1001
+ modality: "text";
1002
+ metadata?: undefined;
2152
1003
  } | {
2153
- type: "url";
2154
- url: string;
2155
- };
2156
- modality: "image";
2157
- detail: "low" | "medium" | "high" | "auto";
1004
+ value: {
1005
+ type: "base64";
1006
+ base64: string;
1007
+ media_type: "png" | "jpeg" | "webp" | "gif";
1008
+ } | {
1009
+ type: "url";
1010
+ url: string;
1011
+ };
1012
+ modality: "image";
1013
+ detail: "low" | "medium" | "high" | "auto";
1014
+ metadata?: undefined;
1015
+ } | {
1016
+ name: string;
1017
+ modality: "tool-call";
1018
+ index: number;
1019
+ id: string;
1020
+ arguments: string;
1021
+ metadata?: undefined;
1022
+ } | {
1023
+ name: string;
1024
+ modality: "tool-response";
1025
+ index: number;
1026
+ id: string;
1027
+ data: string;
1028
+ metadata?: undefined;
1029
+ })[];
2158
1030
  metadata?: undefined;
2159
- }>, z.ZodObject<{
2160
- modality: z.ZodLiteral<"tool-call">;
2161
- index: z.ZodNumber;
2162
- id: z.ZodString;
2163
- name: z.ZodString;
2164
- arguments: z.ZodString;
1031
+ }[];
1032
+ usage?: {
1033
+ totalTokens: number;
1034
+ promptTokens: number;
1035
+ completionTokens: number;
1036
+ } | undefined;
1037
+ logProbs?: {
1038
+ token: string;
1039
+ logProb: number;
1040
+ bytes: number[] | null;
1041
+ topLogProbs: {
1042
+ token: string;
1043
+ logProb: number;
1044
+ bytes: number[] | null;
1045
+ }[];
1046
+ }[] | undefined;
1047
+ };
1048
+ latencyInMs: number;
1049
+ provider: {
1050
+ request?: any;
1051
+ response?: any;
1052
+ };
1053
+ metadataForCallbacks?: any;
1054
+ }>;
1055
+ type CompleteChatHandlerResponseType = z.infer<typeof CompleteChatHandlerResponse>;
1056
+ type CompleteChatCallbackType<M = any> = {
1057
+ onChatStart?: (metadata?: M) => Promise<void> | void;
1058
+ onChatCached?: (metadata?: M, response?: CompleteChatHandlerResponseType) => Promise<void> | void;
1059
+ onChatComplete?: (metadata?: M, response?: CompleteChatHandlerResponseType) => Promise<void> | void;
1060
+ onChatError?: (metadata?: M, error?: GatewayError | HttpRequestError) => Promise<void> | void;
1061
+ };
1062
+
1063
+ declare const GetEmbeddingsHandlerResponse: z.ZodObject<{
1064
+ request: z.ZodObject<{
1065
+ config: z.ZodRecord<z.ZodString, z.ZodAny>;
1066
+ embeddingRequests: z.ZodDiscriminatedUnion<"modality", [z.ZodObject<{
1067
+ modality: z.ZodLiteral<"text">;
2165
1068
  metadata: z.ZodUndefined;
1069
+ requests: z.ZodArray<z.ZodString, "many">;
2166
1070
  }, "strip", z.ZodTypeAny, {
2167
- name: string;
2168
- modality: "tool-call";
2169
- index: number;
2170
- id: string;
2171
- arguments: string;
1071
+ modality: "text";
1072
+ requests: string[];
2172
1073
  metadata?: undefined;
2173
1074
  }, {
2174
- name: string;
2175
- modality: "tool-call";
2176
- index: number;
2177
- id: string;
2178
- arguments: string;
1075
+ modality: "text";
1076
+ requests: string[];
2179
1077
  metadata?: undefined;
2180
1078
  }>, z.ZodObject<{
2181
- modality: z.ZodLiteral<"tool-response">;
2182
- index: z.ZodNumber;
2183
- id: z.ZodString;
2184
- name: z.ZodString;
2185
- data: z.ZodString;
1079
+ modality: z.ZodLiteral<"token">;
2186
1080
  metadata: z.ZodUndefined;
1081
+ requests: z.ZodArray<z.ZodArray<z.ZodNumber, "many">, "many">;
2187
1082
  }, "strip", z.ZodTypeAny, {
2188
- data: string;
2189
- name: string;
2190
- modality: "tool-response";
2191
- index: number;
2192
- id: string;
1083
+ modality: "token";
1084
+ requests: number[][];
2193
1085
  metadata?: undefined;
2194
1086
  }, {
2195
- data: string;
2196
- name: string;
2197
- modality: "tool-response";
2198
- index: number;
2199
- id: string;
1087
+ modality: "token";
1088
+ requests: number[][];
2200
1089
  metadata?: undefined;
2201
- }>]>, "many">;
2202
- metadata: z.ZodUndefined;
1090
+ }>]>;
2203
1091
  }, "strip", z.ZodTypeAny, {
2204
- role: "system" | "user" | "assistant" | "tool";
2205
- content: ({
2206
- value: string;
1092
+ config: Record<string, any>;
1093
+ embeddingRequests: {
2207
1094
  modality: "text";
1095
+ requests: string[];
2208
1096
  metadata?: undefined;
2209
1097
  } | {
2210
- value: {
2211
- type: "base64";
2212
- base64: string;
2213
- media_type: "png" | "jpeg" | "webp" | "gif";
2214
- } | {
2215
- type: "url";
2216
- url: string;
2217
- };
2218
- modality: "image";
2219
- detail: "low" | "medium" | "high" | "auto";
2220
- metadata?: undefined;
2221
- } | {
2222
- name: string;
2223
- modality: "tool-call";
2224
- index: number;
2225
- id: string;
2226
- arguments: string;
2227
- metadata?: undefined;
2228
- } | {
2229
- data: string;
2230
- name: string;
2231
- modality: "tool-response";
2232
- index: number;
2233
- id: string;
1098
+ modality: "token";
1099
+ requests: number[][];
2234
1100
  metadata?: undefined;
2235
- })[];
2236
- metadata?: undefined;
1101
+ };
2237
1102
  }, {
2238
- role: "system" | "user" | "assistant" | "tool";
2239
- content: ({
2240
- value: string;
1103
+ config: Record<string, any>;
1104
+ embeddingRequests: {
2241
1105
  modality: "text";
1106
+ requests: string[];
2242
1107
  metadata?: undefined;
2243
1108
  } | {
2244
- value: {
2245
- type: "base64";
2246
- base64: string;
2247
- media_type: "png" | "jpeg" | "webp" | "gif";
2248
- } | {
2249
- type: "url";
2250
- url: string;
2251
- };
2252
- modality: "image";
2253
- detail: "low" | "medium" | "high" | "auto";
1109
+ modality: "token";
1110
+ requests: number[][];
2254
1111
  metadata?: undefined;
2255
- } | {
2256
- name: string;
2257
- modality: "tool-call";
1112
+ };
1113
+ }>;
1114
+ response: z.ZodDiscriminatedUnion<"encodingFormat", [z.ZodObject<{
1115
+ encodingFormat: z.ZodLiteral<"float">;
1116
+ embeddings: z.ZodArray<z.ZodObject<{
1117
+ index: z.ZodNumber;
1118
+ embedding: z.ZodArray<z.ZodNumber, "many">;
1119
+ }, "strip", z.ZodTypeAny, {
2258
1120
  index: number;
2259
- id: string;
2260
- arguments: string;
2261
- metadata?: undefined;
2262
- } | {
2263
- data: string;
2264
- name: string;
2265
- modality: "tool-response";
1121
+ embedding: number[];
1122
+ }, {
2266
1123
  index: number;
2267
- id: string;
2268
- metadata?: undefined;
2269
- })[];
2270
- metadata?: undefined;
2271
- }>, "many">;
2272
- tools: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<"type", [z.ZodObject<z.objectUtil.extendShape<{
2273
- type: z.ZodEnum<["function"]>;
2274
- definition: z.ZodObject<{
2275
- schema: z.ZodObject<{
2276
- name: z.ZodString;
2277
- description: z.ZodString;
2278
- parameters: z.ZodAny;
2279
- strict: z.ZodOptional<z.ZodBoolean>;
2280
- }, "strip", z.ZodTypeAny, {
2281
- name: string;
2282
- description: string;
2283
- strict?: boolean | undefined;
2284
- parameters?: any;
2285
- }, {
2286
- name: string;
2287
- description: string;
2288
- strict?: boolean | undefined;
2289
- parameters?: any;
2290
- }>;
1124
+ embedding: number[];
1125
+ }>, "many">;
1126
+ usage: z.ZodOptional<z.ZodObject<{
1127
+ totalTokens: z.ZodNumber;
1128
+ }, "strip", z.ZodTypeAny, {
1129
+ totalTokens: number;
1130
+ }, {
1131
+ totalTokens: number;
1132
+ }>>;
1133
+ }, "strip", z.ZodTypeAny, {
1134
+ encodingFormat: "float";
1135
+ embeddings: {
1136
+ index: number;
1137
+ embedding: number[];
1138
+ }[];
1139
+ usage?: {
1140
+ totalTokens: number;
1141
+ } | undefined;
1142
+ }, {
1143
+ encodingFormat: "float";
1144
+ embeddings: {
1145
+ index: number;
1146
+ embedding: number[];
1147
+ }[];
1148
+ usage?: {
1149
+ totalTokens: number;
1150
+ } | undefined;
1151
+ }>, z.ZodObject<{
1152
+ encodingFormat: z.ZodLiteral<"base64">;
1153
+ embeddings: z.ZodArray<z.ZodObject<{
1154
+ index: z.ZodNumber;
1155
+ embedding: z.ZodString;
2291
1156
  }, "strip", z.ZodTypeAny, {
2292
- schema: {
2293
- name: string;
2294
- description: string;
2295
- strict?: boolean | undefined;
2296
- parameters?: any;
2297
- };
1157
+ index: number;
1158
+ embedding: string;
2298
1159
  }, {
2299
- schema: {
2300
- name: string;
2301
- description: string;
2302
- strict?: boolean | undefined;
2303
- parameters?: any;
2304
- };
2305
- }>;
2306
- }, {
2307
- metadata: z.ZodTypeAny;
2308
- }>, "strip", z.ZodTypeAny, {
2309
- type: "function";
2310
- definition: {
2311
- schema: {
2312
- name: string;
2313
- description: string;
2314
- strict?: boolean | undefined;
2315
- parameters?: any;
2316
- };
2317
- };
2318
- metadata?: any;
1160
+ index: number;
1161
+ embedding: string;
1162
+ }>, "many">;
1163
+ usage: z.ZodOptional<z.ZodObject<{
1164
+ totalTokens: z.ZodNumber;
1165
+ }, "strip", z.ZodTypeAny, {
1166
+ totalTokens: number;
1167
+ }, {
1168
+ totalTokens: number;
1169
+ }>>;
1170
+ }, "strip", z.ZodTypeAny, {
1171
+ encodingFormat: "base64";
1172
+ embeddings: {
1173
+ index: number;
1174
+ embedding: string;
1175
+ }[];
1176
+ usage?: {
1177
+ totalTokens: number;
1178
+ } | undefined;
2319
1179
  }, {
2320
- type: "function";
2321
- definition: {
2322
- schema: {
2323
- name: string;
2324
- description: string;
2325
- strict?: boolean | undefined;
2326
- parameters?: any;
2327
- };
2328
- };
2329
- metadata?: any;
2330
- }>]>, "many">>;
2331
- callbacks: z.ZodOptional<z.ZodArray<z.ZodType<StreamChatCallbackType<any>, z.ZodTypeDef, StreamChatCallbackType<any>>, "atleastone">>;
1180
+ encodingFormat: "base64";
1181
+ embeddings: {
1182
+ index: number;
1183
+ embedding: string;
1184
+ }[];
1185
+ usage?: {
1186
+ totalTokens: number;
1187
+ } | undefined;
1188
+ }>]>;
1189
+ latencyInMs: z.ZodNumber;
2332
1190
  metadataForCallbacks: z.ZodOptional<z.ZodAny>;
2333
- }, "strip", z.ZodTypeAny, {
2334
- config: Record<string, any>;
2335
- model: ChatModelV1<{
2336
- name: string;
2337
- description: string;
2338
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
2339
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
2340
- maxInputTokens: number;
2341
- maxOutputTokens: number;
2342
- config: {
2343
- def: Record<string, {
2344
- type: "multi-string";
2345
- param: string;
2346
- title: string;
2347
- description: string;
2348
- max: number;
2349
- } | {
2350
- type: "range";
2351
- param: string;
2352
- title: string;
2353
- description: string;
2354
- max: number;
2355
- min: number;
2356
- step: number;
2357
- default: number;
2358
- } | {
2359
- type: "select-string";
2360
- param: string;
2361
- title: string;
2362
- description: string;
2363
- default: string;
2364
- choices: string[];
2365
- } | {
2366
- type: "object-schema";
2367
- param: string;
2368
- title: string;
2369
- description: string;
2370
- objectSchema?: any;
2371
- } | {
2372
- type: "select-boolean";
2373
- param: string;
2374
- title: string;
2375
- description: string;
2376
- default: boolean | null;
2377
- }>;
2378
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
2379
- };
1191
+ provider: z.ZodObject<{
1192
+ request: z.ZodAny;
1193
+ response: z.ZodAny;
1194
+ }, "strip", z.ZodTypeAny, {
1195
+ request?: any;
1196
+ response?: any;
1197
+ }, {
1198
+ request?: any;
1199
+ response?: any;
2380
1200
  }>;
2381
- messages: {
2382
- role: "system" | "user" | "assistant" | "tool";
2383
- content: ({
2384
- value: string;
1201
+ }, "strip", z.ZodTypeAny, {
1202
+ request: {
1203
+ config: Record<string, any>;
1204
+ embeddingRequests: {
2385
1205
  modality: "text";
1206
+ requests: string[];
2386
1207
  metadata?: undefined;
2387
1208
  } | {
2388
- value: {
2389
- type: "base64";
2390
- base64: string;
2391
- media_type: "png" | "jpeg" | "webp" | "gif";
2392
- } | {
2393
- type: "url";
2394
- url: string;
2395
- };
2396
- modality: "image";
2397
- detail: "low" | "medium" | "high" | "auto";
1209
+ modality: "token";
1210
+ requests: number[][];
2398
1211
  metadata?: undefined;
2399
- } | {
2400
- name: string;
2401
- modality: "tool-call";
1212
+ };
1213
+ };
1214
+ response: {
1215
+ encodingFormat: "float";
1216
+ embeddings: {
2402
1217
  index: number;
2403
- id: string;
2404
- arguments: string;
2405
- metadata?: undefined;
2406
- } | {
2407
- data: string;
2408
- name: string;
2409
- modality: "tool-response";
1218
+ embedding: number[];
1219
+ }[];
1220
+ usage?: {
1221
+ totalTokens: number;
1222
+ } | undefined;
1223
+ } | {
1224
+ encodingFormat: "base64";
1225
+ embeddings: {
2410
1226
  index: number;
2411
- id: string;
2412
- metadata?: undefined;
2413
- })[];
2414
- metadata?: undefined;
2415
- }[];
2416
- tools?: {
2417
- type: "function";
2418
- definition: {
2419
- schema: {
2420
- name: string;
2421
- description: string;
2422
- strict?: boolean | undefined;
2423
- parameters?: any;
2424
- };
2425
- };
2426
- metadata?: any;
2427
- }[] | undefined;
2428
- callbacks?: [StreamChatCallbackType<any>, ...StreamChatCallbackType<any>[]] | undefined;
1227
+ embedding: string;
1228
+ }[];
1229
+ usage?: {
1230
+ totalTokens: number;
1231
+ } | undefined;
1232
+ };
1233
+ latencyInMs: number;
1234
+ provider: {
1235
+ request?: any;
1236
+ response?: any;
1237
+ };
2429
1238
  metadataForCallbacks?: any;
2430
1239
  }, {
2431
- config: Record<string, any>;
2432
- model: ChatModelV1<{
2433
- name: string;
2434
- description: string;
2435
- roles: Partial<Record<"system" | "user" | "assistant" | "tool", string | undefined>>;
2436
- modalities: ["text" | "image" | "tool-call" | "tool-response", ...("text" | "image" | "tool-call" | "tool-response")[]];
2437
- maxInputTokens: number;
2438
- maxOutputTokens: number;
2439
- config: {
2440
- def: Record<string, {
2441
- type: "multi-string";
2442
- param: string;
2443
- title: string;
2444
- description: string;
2445
- max: number;
2446
- } | {
2447
- type: "range";
2448
- param: string;
2449
- title: string;
2450
- description: string;
2451
- max: number;
2452
- min: number;
2453
- step: number;
2454
- default: number;
2455
- } | {
2456
- type: "select-string";
2457
- param: string;
2458
- title: string;
2459
- description: string;
2460
- default: string;
2461
- choices: string[];
2462
- } | {
2463
- type: "object-schema";
2464
- param: string;
2465
- title: string;
2466
- description: string;
2467
- objectSchema?: any;
2468
- } | {
2469
- type: "select-boolean";
2470
- param: string;
2471
- title: string;
2472
- description: string;
2473
- default: boolean | null;
2474
- }>;
2475
- schema: z.ZodObject<z.ZodRawShape, z.UnknownKeysParam, z.ZodTypeAny, unknown, unknown>;
2476
- };
2477
- }>;
2478
- messages: {
2479
- role: "system" | "user" | "assistant" | "tool";
2480
- content: ({
2481
- value: string;
1240
+ request: {
1241
+ config: Record<string, any>;
1242
+ embeddingRequests: {
2482
1243
  modality: "text";
1244
+ requests: string[];
2483
1245
  metadata?: undefined;
2484
1246
  } | {
2485
- value: {
2486
- type: "base64";
2487
- base64: string;
2488
- media_type: "png" | "jpeg" | "webp" | "gif";
2489
- } | {
2490
- type: "url";
2491
- url: string;
2492
- };
2493
- modality: "image";
2494
- detail: "low" | "medium" | "high" | "auto";
1247
+ modality: "token";
1248
+ requests: number[][];
2495
1249
  metadata?: undefined;
2496
- } | {
2497
- name: string;
2498
- modality: "tool-call";
1250
+ };
1251
+ };
1252
+ response: {
1253
+ encodingFormat: "float";
1254
+ embeddings: {
2499
1255
  index: number;
2500
- id: string;
2501
- arguments: string;
2502
- metadata?: undefined;
2503
- } | {
2504
- data: string;
2505
- name: string;
2506
- modality: "tool-response";
1256
+ embedding: number[];
1257
+ }[];
1258
+ usage?: {
1259
+ totalTokens: number;
1260
+ } | undefined;
1261
+ } | {
1262
+ encodingFormat: "base64";
1263
+ embeddings: {
2507
1264
  index: number;
2508
- id: string;
2509
- metadata?: undefined;
2510
- })[];
2511
- metadata?: undefined;
2512
- }[];
2513
- tools?: {
2514
- type: "function";
2515
- definition: {
2516
- schema: {
2517
- name: string;
2518
- description: string;
2519
- strict?: boolean | undefined;
2520
- parameters?: any;
2521
- };
2522
- };
2523
- metadata?: any;
2524
- }[] | undefined;
2525
- callbacks?: [StreamChatCallbackType<any>, ...StreamChatCallbackType<any>[]] | undefined;
1265
+ embedding: string;
1266
+ }[];
1267
+ usage?: {
1268
+ totalTokens: number;
1269
+ } | undefined;
1270
+ };
1271
+ latencyInMs: number;
1272
+ provider: {
1273
+ request?: any;
1274
+ response?: any;
1275
+ };
2526
1276
  metadataForCallbacks?: any;
2527
1277
  }>;
2528
- type StreamChatHandlerRequestType = z.infer<typeof StreamChatHandlerRequest>;
1278
+ type GetEmbeddingsHandlerResponseType = z.infer<typeof GetEmbeddingsHandlerResponse>;
1279
+ type GetEmbeddingsCallbackType<M = any> = {
1280
+ onGetEmbeddingsStart?: (metadata?: M) => Promise<void> | void;
1281
+ onGetEmbeddingsCached?: (metadata?: M, response?: GetEmbeddingsHandlerResponseType) => Promise<void> | void;
1282
+ onGetEmbeddingsComplete?: (metadata?: M, response?: GetEmbeddingsHandlerResponseType) => Promise<void> | void;
1283
+ onGetEmbeddingsError?: (metadata?: M, error?: GatewayError | HttpRequestError) => Promise<void> | void;
1284
+ };
1285
+
2529
1286
  declare const StreamChatHandlerResponse: z.ZodObject<{
2530
1287
  request: z.ZodObject<{
2531
1288
  config: z.ZodRecord<z.ZodString, z.ZodAny>;
@@ -2889,16 +1646,16 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
2889
1646
  }, "strip", z.ZodTypeAny, {
2890
1647
  modality: "partial-tool-call";
2891
1648
  index: number;
1649
+ name?: string | undefined;
2892
1650
  metadata?: undefined;
2893
1651
  id?: string | undefined;
2894
- name?: string | undefined;
2895
1652
  arguments?: string | undefined;
2896
1653
  }, {
2897
1654
  modality: "partial-tool-call";
2898
1655
  index: number;
1656
+ name?: string | undefined;
2899
1657
  metadata?: undefined;
2900
1658
  id?: string | undefined;
2901
- name?: string | undefined;
2902
1659
  arguments?: string | undefined;
2903
1660
  }>]>;
2904
1661
  metadata: z.ZodUndefined;
@@ -2911,9 +1668,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
2911
1668
  } | {
2912
1669
  modality: "partial-tool-call";
2913
1670
  index: number;
1671
+ name?: string | undefined;
2914
1672
  metadata?: undefined;
2915
1673
  id?: string | undefined;
2916
- name?: string | undefined;
2917
1674
  arguments?: string | undefined;
2918
1675
  };
2919
1676
  metadata?: undefined;
@@ -2926,9 +1683,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
2926
1683
  } | {
2927
1684
  modality: "partial-tool-call";
2928
1685
  index: number;
1686
+ name?: string | undefined;
2929
1687
  metadata?: undefined;
2930
1688
  id?: string | undefined;
2931
- name?: string | undefined;
2932
1689
  arguments?: string | undefined;
2933
1690
  };
2934
1691
  metadata?: undefined;
@@ -2993,9 +1750,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
2993
1750
  } | {
2994
1751
  modality: "partial-tool-call";
2995
1752
  index: number;
1753
+ name?: string | undefined;
2996
1754
  metadata?: undefined;
2997
1755
  id?: string | undefined;
2998
- name?: string | undefined;
2999
1756
  arguments?: string | undefined;
3000
1757
  };
3001
1758
  metadata?: undefined;
@@ -3025,9 +1782,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
3025
1782
  } | {
3026
1783
  modality: "partial-tool-call";
3027
1784
  index: number;
1785
+ name?: string | undefined;
3028
1786
  metadata?: undefined;
3029
1787
  id?: string | undefined;
3030
- name?: string | undefined;
3031
1788
  arguments?: string | undefined;
3032
1789
  };
3033
1790
  metadata?: undefined;
@@ -3120,9 +1877,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
3120
1877
  } | {
3121
1878
  modality: "partial-tool-call";
3122
1879
  index: number;
1880
+ name?: string | undefined;
3123
1881
  metadata?: undefined;
3124
1882
  id?: string | undefined;
3125
- name?: string | undefined;
3126
1883
  arguments?: string | undefined;
3127
1884
  };
3128
1885
  metadata?: undefined;
@@ -3209,9 +1966,9 @@ declare const StreamChatHandlerResponse: z.ZodObject<{
3209
1966
  } | {
3210
1967
  modality: "partial-tool-call";
3211
1968
  index: number;
1969
+ name?: string | undefined;
3212
1970
  metadata?: undefined;
3213
1971
  id?: string | undefined;
3214
- name?: string | undefined;
3215
1972
  arguments?: string | undefined;
3216
1973
  };
3217
1974
  metadata?: undefined;
@@ -3247,21 +2004,667 @@ type StreamChatCallbackType<M = any> = {
3247
2004
  onStreamError?: (metadata?: M, error?: GatewayError) => Promise<void> | void;
3248
2005
  };
3249
2006
 
3250
- declare function handleStreamChat<M>(request: StreamChatHandlerRequestType, client: HttpClient): AsyncGenerator<StreamChatHandlerResponseType, void, unknown>;
3251
-
3252
- type GatewayCallbackType<M = any> = CompleteChatCallbackType<M> | StreamChatCallbackType<M>;
3253
2007
  declare const GatewayOptions: z.ZodObject<{
2008
+ queueOptions: z.ZodOptional<z.ZodObject<{
2009
+ maxConcurrentTasks: z.ZodOptional<z.ZodNumber>;
2010
+ retryCount: z.ZodOptional<z.ZodNumber>;
2011
+ timeout: z.ZodOptional<z.ZodNumber>;
2012
+ retry: z.ZodOptional<z.ZodObject<{
2013
+ initialDelay: z.ZodNumber;
2014
+ exponentialFactor: z.ZodNumber;
2015
+ }, "strip", z.ZodTypeAny, {
2016
+ initialDelay: number;
2017
+ exponentialFactor: number;
2018
+ }, {
2019
+ initialDelay: number;
2020
+ exponentialFactor: number;
2021
+ }>>;
2022
+ }, "strip", z.ZodTypeAny, {
2023
+ timeout?: number | undefined;
2024
+ maxConcurrentTasks?: number | undefined;
2025
+ retryCount?: number | undefined;
2026
+ retry?: {
2027
+ initialDelay: number;
2028
+ exponentialFactor: number;
2029
+ } | undefined;
2030
+ }, {
2031
+ timeout?: number | undefined;
2032
+ maxConcurrentTasks?: number | undefined;
2033
+ retryCount?: number | undefined;
2034
+ retry?: {
2035
+ initialDelay: number;
2036
+ exponentialFactor: number;
2037
+ } | undefined;
2038
+ }>>;
3254
2039
  dangerouslyAllowBrowser: z.ZodOptional<z.ZodBoolean>;
3255
2040
  httpClient: z.ZodOptional<z.ZodType<HttpClient, z.ZodTypeDef, HttpClient>>;
3256
- callbacks: z.ZodOptional<z.ZodArray<z.ZodType<GatewayCallbackType<any>, z.ZodTypeDef, GatewayCallbackType<any>>, "atleastone">>;
2041
+ completeChatCache: z.ZodOptional<z.ZodType<Cache<{
2042
+ request: {
2043
+ config: Record<string, any>;
2044
+ messages: {
2045
+ role: "system" | "user" | "assistant" | "tool";
2046
+ content: ({
2047
+ value: string;
2048
+ modality: "text";
2049
+ metadata?: undefined;
2050
+ } | {
2051
+ value: {
2052
+ type: "base64";
2053
+ base64: string;
2054
+ media_type: "png" | "jpeg" | "webp" | "gif";
2055
+ } | {
2056
+ type: "url";
2057
+ url: string;
2058
+ };
2059
+ modality: "image";
2060
+ detail: "low" | "medium" | "high" | "auto";
2061
+ metadata?: undefined;
2062
+ } | {
2063
+ name: string;
2064
+ modality: "tool-call";
2065
+ index: number;
2066
+ id: string;
2067
+ arguments: string;
2068
+ metadata?: undefined;
2069
+ } | {
2070
+ data: string;
2071
+ name: string;
2072
+ modality: "tool-response";
2073
+ index: number;
2074
+ id: string;
2075
+ metadata?: undefined;
2076
+ })[];
2077
+ metadata?: undefined;
2078
+ }[];
2079
+ tools?: {
2080
+ type: "function";
2081
+ definition: {
2082
+ schema: {
2083
+ name: string;
2084
+ description: string;
2085
+ strict?: boolean | undefined;
2086
+ parameters?: any;
2087
+ };
2088
+ };
2089
+ metadata?: any;
2090
+ }[] | undefined;
2091
+ };
2092
+ response: {
2093
+ messages: {
2094
+ role: "system" | "user" | "assistant" | "tool";
2095
+ content: ({
2096
+ value: string;
2097
+ modality: "text";
2098
+ metadata?: undefined;
2099
+ } | {
2100
+ value: {
2101
+ type: "base64";
2102
+ base64: string;
2103
+ media_type: "png" | "jpeg" | "webp" | "gif";
2104
+ } | {
2105
+ type: "url";
2106
+ url: string;
2107
+ };
2108
+ modality: "image";
2109
+ detail: "low" | "medium" | "high" | "auto";
2110
+ metadata?: undefined;
2111
+ } | {
2112
+ name: string;
2113
+ modality: "tool-call";
2114
+ index: number;
2115
+ id: string;
2116
+ arguments: string;
2117
+ metadata?: undefined;
2118
+ } | {
2119
+ name: string;
2120
+ modality: "tool-response";
2121
+ index: number;
2122
+ id: string;
2123
+ data: string;
2124
+ metadata?: undefined;
2125
+ })[];
2126
+ metadata?: undefined;
2127
+ }[];
2128
+ usage?: {
2129
+ totalTokens: number;
2130
+ promptTokens: number;
2131
+ completionTokens: number;
2132
+ } | undefined;
2133
+ logProbs?: {
2134
+ token: string;
2135
+ logProb: number;
2136
+ bytes: number[] | null;
2137
+ topLogProbs: {
2138
+ token: string;
2139
+ logProb: number;
2140
+ bytes: number[] | null;
2141
+ }[];
2142
+ }[] | undefined;
2143
+ };
2144
+ latencyInMs: number;
2145
+ provider: {
2146
+ request?: any;
2147
+ response?: any;
2148
+ };
2149
+ metadataForCallbacks?: any;
2150
+ }>, z.ZodTypeDef, Cache<{
2151
+ request: {
2152
+ config: Record<string, any>;
2153
+ messages: {
2154
+ role: "system" | "user" | "assistant" | "tool";
2155
+ content: ({
2156
+ value: string;
2157
+ modality: "text";
2158
+ metadata?: undefined;
2159
+ } | {
2160
+ value: {
2161
+ type: "base64";
2162
+ base64: string;
2163
+ media_type: "png" | "jpeg" | "webp" | "gif";
2164
+ } | {
2165
+ type: "url";
2166
+ url: string;
2167
+ };
2168
+ modality: "image";
2169
+ detail: "low" | "medium" | "high" | "auto";
2170
+ metadata?: undefined;
2171
+ } | {
2172
+ name: string;
2173
+ modality: "tool-call";
2174
+ index: number;
2175
+ id: string;
2176
+ arguments: string;
2177
+ metadata?: undefined;
2178
+ } | {
2179
+ data: string;
2180
+ name: string;
2181
+ modality: "tool-response";
2182
+ index: number;
2183
+ id: string;
2184
+ metadata?: undefined;
2185
+ })[];
2186
+ metadata?: undefined;
2187
+ }[];
2188
+ tools?: {
2189
+ type: "function";
2190
+ definition: {
2191
+ schema: {
2192
+ name: string;
2193
+ description: string;
2194
+ strict?: boolean | undefined;
2195
+ parameters?: any;
2196
+ };
2197
+ };
2198
+ metadata?: any;
2199
+ }[] | undefined;
2200
+ };
2201
+ response: {
2202
+ messages: {
2203
+ role: "system" | "user" | "assistant" | "tool";
2204
+ content: ({
2205
+ value: string;
2206
+ modality: "text";
2207
+ metadata?: undefined;
2208
+ } | {
2209
+ value: {
2210
+ type: "base64";
2211
+ base64: string;
2212
+ media_type: "png" | "jpeg" | "webp" | "gif";
2213
+ } | {
2214
+ type: "url";
2215
+ url: string;
2216
+ };
2217
+ modality: "image";
2218
+ detail: "low" | "medium" | "high" | "auto";
2219
+ metadata?: undefined;
2220
+ } | {
2221
+ name: string;
2222
+ modality: "tool-call";
2223
+ index: number;
2224
+ id: string;
2225
+ arguments: string;
2226
+ metadata?: undefined;
2227
+ } | {
2228
+ name: string;
2229
+ modality: "tool-response";
2230
+ index: number;
2231
+ id: string;
2232
+ data: string;
2233
+ metadata?: undefined;
2234
+ })[];
2235
+ metadata?: undefined;
2236
+ }[];
2237
+ usage?: {
2238
+ totalTokens: number;
2239
+ promptTokens: number;
2240
+ completionTokens: number;
2241
+ } | undefined;
2242
+ logProbs?: {
2243
+ token: string;
2244
+ logProb: number;
2245
+ bytes: number[] | null;
2246
+ topLogProbs: {
2247
+ token: string;
2248
+ logProb: number;
2249
+ bytes: number[] | null;
2250
+ }[];
2251
+ }[] | undefined;
2252
+ };
2253
+ latencyInMs: number;
2254
+ provider: {
2255
+ request?: any;
2256
+ response?: any;
2257
+ };
2258
+ metadataForCallbacks?: any;
2259
+ }>>>;
2260
+ completeChatCallbacks: z.ZodOptional<z.ZodArray<z.ZodType<CompleteChatCallbackType, z.ZodTypeDef, CompleteChatCallbackType>, "atleastone">>;
2261
+ getEmbeddingsCache: z.ZodOptional<z.ZodType<Cache<{
2262
+ request: {
2263
+ config: Record<string, any>;
2264
+ embeddingRequests: {
2265
+ modality: "text";
2266
+ requests: string[];
2267
+ metadata?: undefined;
2268
+ } | {
2269
+ modality: "token";
2270
+ requests: number[][];
2271
+ metadata?: undefined;
2272
+ };
2273
+ };
2274
+ response: {
2275
+ encodingFormat: "float";
2276
+ embeddings: {
2277
+ index: number;
2278
+ embedding: number[];
2279
+ }[];
2280
+ usage?: {
2281
+ totalTokens: number;
2282
+ } | undefined;
2283
+ } | {
2284
+ encodingFormat: "base64";
2285
+ embeddings: {
2286
+ index: number;
2287
+ embedding: string;
2288
+ }[];
2289
+ usage?: {
2290
+ totalTokens: number;
2291
+ } | undefined;
2292
+ };
2293
+ latencyInMs: number;
2294
+ provider: {
2295
+ request?: any;
2296
+ response?: any;
2297
+ };
2298
+ metadataForCallbacks?: any;
2299
+ }>, z.ZodTypeDef, Cache<{
2300
+ request: {
2301
+ config: Record<string, any>;
2302
+ embeddingRequests: {
2303
+ modality: "text";
2304
+ requests: string[];
2305
+ metadata?: undefined;
2306
+ } | {
2307
+ modality: "token";
2308
+ requests: number[][];
2309
+ metadata?: undefined;
2310
+ };
2311
+ };
2312
+ response: {
2313
+ encodingFormat: "float";
2314
+ embeddings: {
2315
+ index: number;
2316
+ embedding: number[];
2317
+ }[];
2318
+ usage?: {
2319
+ totalTokens: number;
2320
+ } | undefined;
2321
+ } | {
2322
+ encodingFormat: "base64";
2323
+ embeddings: {
2324
+ index: number;
2325
+ embedding: string;
2326
+ }[];
2327
+ usage?: {
2328
+ totalTokens: number;
2329
+ } | undefined;
2330
+ };
2331
+ latencyInMs: number;
2332
+ provider: {
2333
+ request?: any;
2334
+ response?: any;
2335
+ };
2336
+ metadataForCallbacks?: any;
2337
+ }>>>;
2338
+ getEmbeddingsCallbacks: z.ZodOptional<z.ZodArray<z.ZodType<GetEmbeddingsCallbackType, z.ZodTypeDef, GetEmbeddingsCallbackType>, "atleastone">>;
2339
+ streamChatCallbacks: z.ZodOptional<z.ZodArray<z.ZodType<StreamChatCallbackType, z.ZodTypeDef, StreamChatCallbackType>, "atleastone">>;
3257
2340
  }, "strip", z.ZodTypeAny, {
3258
- callbacks?: [GatewayCallbackType<any>, ...GatewayCallbackType<any>[]] | undefined;
2341
+ queueOptions?: {
2342
+ timeout?: number | undefined;
2343
+ maxConcurrentTasks?: number | undefined;
2344
+ retryCount?: number | undefined;
2345
+ retry?: {
2346
+ initialDelay: number;
2347
+ exponentialFactor: number;
2348
+ } | undefined;
2349
+ } | undefined;
3259
2350
  dangerouslyAllowBrowser?: boolean | undefined;
3260
2351
  httpClient?: HttpClient | undefined;
2352
+ completeChatCache?: Cache<{
2353
+ request: {
2354
+ config: Record<string, any>;
2355
+ messages: {
2356
+ role: "system" | "user" | "assistant" | "tool";
2357
+ content: ({
2358
+ value: string;
2359
+ modality: "text";
2360
+ metadata?: undefined;
2361
+ } | {
2362
+ value: {
2363
+ type: "base64";
2364
+ base64: string;
2365
+ media_type: "png" | "jpeg" | "webp" | "gif";
2366
+ } | {
2367
+ type: "url";
2368
+ url: string;
2369
+ };
2370
+ modality: "image";
2371
+ detail: "low" | "medium" | "high" | "auto";
2372
+ metadata?: undefined;
2373
+ } | {
2374
+ name: string;
2375
+ modality: "tool-call";
2376
+ index: number;
2377
+ id: string;
2378
+ arguments: string;
2379
+ metadata?: undefined;
2380
+ } | {
2381
+ data: string;
2382
+ name: string;
2383
+ modality: "tool-response";
2384
+ index: number;
2385
+ id: string;
2386
+ metadata?: undefined;
2387
+ })[];
2388
+ metadata?: undefined;
2389
+ }[];
2390
+ tools?: {
2391
+ type: "function";
2392
+ definition: {
2393
+ schema: {
2394
+ name: string;
2395
+ description: string;
2396
+ strict?: boolean | undefined;
2397
+ parameters?: any;
2398
+ };
2399
+ };
2400
+ metadata?: any;
2401
+ }[] | undefined;
2402
+ };
2403
+ response: {
2404
+ messages: {
2405
+ role: "system" | "user" | "assistant" | "tool";
2406
+ content: ({
2407
+ value: string;
2408
+ modality: "text";
2409
+ metadata?: undefined;
2410
+ } | {
2411
+ value: {
2412
+ type: "base64";
2413
+ base64: string;
2414
+ media_type: "png" | "jpeg" | "webp" | "gif";
2415
+ } | {
2416
+ type: "url";
2417
+ url: string;
2418
+ };
2419
+ modality: "image";
2420
+ detail: "low" | "medium" | "high" | "auto";
2421
+ metadata?: undefined;
2422
+ } | {
2423
+ name: string;
2424
+ modality: "tool-call";
2425
+ index: number;
2426
+ id: string;
2427
+ arguments: string;
2428
+ metadata?: undefined;
2429
+ } | {
2430
+ name: string;
2431
+ modality: "tool-response";
2432
+ index: number;
2433
+ id: string;
2434
+ data: string;
2435
+ metadata?: undefined;
2436
+ })[];
2437
+ metadata?: undefined;
2438
+ }[];
2439
+ usage?: {
2440
+ totalTokens: number;
2441
+ promptTokens: number;
2442
+ completionTokens: number;
2443
+ } | undefined;
2444
+ logProbs?: {
2445
+ token: string;
2446
+ logProb: number;
2447
+ bytes: number[] | null;
2448
+ topLogProbs: {
2449
+ token: string;
2450
+ logProb: number;
2451
+ bytes: number[] | null;
2452
+ }[];
2453
+ }[] | undefined;
2454
+ };
2455
+ latencyInMs: number;
2456
+ provider: {
2457
+ request?: any;
2458
+ response?: any;
2459
+ };
2460
+ metadataForCallbacks?: any;
2461
+ }> | undefined;
2462
+ completeChatCallbacks?: [CompleteChatCallbackType, ...CompleteChatCallbackType[]] | undefined;
2463
+ getEmbeddingsCache?: Cache<{
2464
+ request: {
2465
+ config: Record<string, any>;
2466
+ embeddingRequests: {
2467
+ modality: "text";
2468
+ requests: string[];
2469
+ metadata?: undefined;
2470
+ } | {
2471
+ modality: "token";
2472
+ requests: number[][];
2473
+ metadata?: undefined;
2474
+ };
2475
+ };
2476
+ response: {
2477
+ encodingFormat: "float";
2478
+ embeddings: {
2479
+ index: number;
2480
+ embedding: number[];
2481
+ }[];
2482
+ usage?: {
2483
+ totalTokens: number;
2484
+ } | undefined;
2485
+ } | {
2486
+ encodingFormat: "base64";
2487
+ embeddings: {
2488
+ index: number;
2489
+ embedding: string;
2490
+ }[];
2491
+ usage?: {
2492
+ totalTokens: number;
2493
+ } | undefined;
2494
+ };
2495
+ latencyInMs: number;
2496
+ provider: {
2497
+ request?: any;
2498
+ response?: any;
2499
+ };
2500
+ metadataForCallbacks?: any;
2501
+ }> | undefined;
2502
+ getEmbeddingsCallbacks?: [GetEmbeddingsCallbackType, ...GetEmbeddingsCallbackType[]] | undefined;
2503
+ streamChatCallbacks?: [StreamChatCallbackType, ...StreamChatCallbackType[]] | undefined;
3261
2504
  }, {
3262
- callbacks?: [GatewayCallbackType<any>, ...GatewayCallbackType<any>[]] | undefined;
2505
+ queueOptions?: {
2506
+ timeout?: number | undefined;
2507
+ maxConcurrentTasks?: number | undefined;
2508
+ retryCount?: number | undefined;
2509
+ retry?: {
2510
+ initialDelay: number;
2511
+ exponentialFactor: number;
2512
+ } | undefined;
2513
+ } | undefined;
3263
2514
  dangerouslyAllowBrowser?: boolean | undefined;
3264
2515
  httpClient?: HttpClient | undefined;
2516
+ completeChatCache?: Cache<{
2517
+ request: {
2518
+ config: Record<string, any>;
2519
+ messages: {
2520
+ role: "system" | "user" | "assistant" | "tool";
2521
+ content: ({
2522
+ value: string;
2523
+ modality: "text";
2524
+ metadata?: undefined;
2525
+ } | {
2526
+ value: {
2527
+ type: "base64";
2528
+ base64: string;
2529
+ media_type: "png" | "jpeg" | "webp" | "gif";
2530
+ } | {
2531
+ type: "url";
2532
+ url: string;
2533
+ };
2534
+ modality: "image";
2535
+ detail: "low" | "medium" | "high" | "auto";
2536
+ metadata?: undefined;
2537
+ } | {
2538
+ name: string;
2539
+ modality: "tool-call";
2540
+ index: number;
2541
+ id: string;
2542
+ arguments: string;
2543
+ metadata?: undefined;
2544
+ } | {
2545
+ data: string;
2546
+ name: string;
2547
+ modality: "tool-response";
2548
+ index: number;
2549
+ id: string;
2550
+ metadata?: undefined;
2551
+ })[];
2552
+ metadata?: undefined;
2553
+ }[];
2554
+ tools?: {
2555
+ type: "function";
2556
+ definition: {
2557
+ schema: {
2558
+ name: string;
2559
+ description: string;
2560
+ strict?: boolean | undefined;
2561
+ parameters?: any;
2562
+ };
2563
+ };
2564
+ metadata?: any;
2565
+ }[] | undefined;
2566
+ };
2567
+ response: {
2568
+ messages: {
2569
+ role: "system" | "user" | "assistant" | "tool";
2570
+ content: ({
2571
+ value: string;
2572
+ modality: "text";
2573
+ metadata?: undefined;
2574
+ } | {
2575
+ value: {
2576
+ type: "base64";
2577
+ base64: string;
2578
+ media_type: "png" | "jpeg" | "webp" | "gif";
2579
+ } | {
2580
+ type: "url";
2581
+ url: string;
2582
+ };
2583
+ modality: "image";
2584
+ detail: "low" | "medium" | "high" | "auto";
2585
+ metadata?: undefined;
2586
+ } | {
2587
+ name: string;
2588
+ modality: "tool-call";
2589
+ index: number;
2590
+ id: string;
2591
+ arguments: string;
2592
+ metadata?: undefined;
2593
+ } | {
2594
+ name: string;
2595
+ modality: "tool-response";
2596
+ index: number;
2597
+ id: string;
2598
+ data: string;
2599
+ metadata?: undefined;
2600
+ })[];
2601
+ metadata?: undefined;
2602
+ }[];
2603
+ usage?: {
2604
+ totalTokens: number;
2605
+ promptTokens: number;
2606
+ completionTokens: number;
2607
+ } | undefined;
2608
+ logProbs?: {
2609
+ token: string;
2610
+ logProb: number;
2611
+ bytes: number[] | null;
2612
+ topLogProbs: {
2613
+ token: string;
2614
+ logProb: number;
2615
+ bytes: number[] | null;
2616
+ }[];
2617
+ }[] | undefined;
2618
+ };
2619
+ latencyInMs: number;
2620
+ provider: {
2621
+ request?: any;
2622
+ response?: any;
2623
+ };
2624
+ metadataForCallbacks?: any;
2625
+ }> | undefined;
2626
+ completeChatCallbacks?: [CompleteChatCallbackType, ...CompleteChatCallbackType[]] | undefined;
2627
+ getEmbeddingsCache?: Cache<{
2628
+ request: {
2629
+ config: Record<string, any>;
2630
+ embeddingRequests: {
2631
+ modality: "text";
2632
+ requests: string[];
2633
+ metadata?: undefined;
2634
+ } | {
2635
+ modality: "token";
2636
+ requests: number[][];
2637
+ metadata?: undefined;
2638
+ };
2639
+ };
2640
+ response: {
2641
+ encodingFormat: "float";
2642
+ embeddings: {
2643
+ index: number;
2644
+ embedding: number[];
2645
+ }[];
2646
+ usage?: {
2647
+ totalTokens: number;
2648
+ } | undefined;
2649
+ } | {
2650
+ encodingFormat: "base64";
2651
+ embeddings: {
2652
+ index: number;
2653
+ embedding: string;
2654
+ }[];
2655
+ usage?: {
2656
+ totalTokens: number;
2657
+ } | undefined;
2658
+ };
2659
+ latencyInMs: number;
2660
+ provider: {
2661
+ request?: any;
2662
+ response?: any;
2663
+ };
2664
+ metadataForCallbacks?: any;
2665
+ }> | undefined;
2666
+ getEmbeddingsCallbacks?: [GetEmbeddingsCallbackType, ...GetEmbeddingsCallbackType[]] | undefined;
2667
+ streamChatCallbacks?: [StreamChatCallbackType, ...StreamChatCallbackType[]] | undefined;
3265
2668
  }>;
3266
2669
  type GatewayOptionsType = z.infer<typeof GatewayOptions>;
3267
2670
  declare const GatewayCompleteChatRequest: z.ZodObject<{
@@ -3594,14 +2997,11 @@ declare const GatewayCompleteChatRequest: z.ZodObject<{
3594
2997
  metadata?: any;
3595
2998
  }>]>, "many">>;
3596
2999
  options: z.ZodOptional<z.ZodObject<{
3597
- queuePriority: z.ZodOptional<z.ZodNumber>;
3598
3000
  metadataForCallbacks: z.ZodOptional<z.ZodAny>;
3599
3001
  }, "strip", z.ZodTypeAny, {
3600
3002
  metadataForCallbacks?: any;
3601
- queuePriority?: number | undefined;
3602
3003
  }, {
3603
3004
  metadataForCallbacks?: any;
3604
- queuePriority?: number | undefined;
3605
3005
  }>>;
3606
3006
  }, "strip", z.ZodTypeAny, {
3607
3007
  config: Record<string, any>;
@@ -3688,7 +3088,6 @@ declare const GatewayCompleteChatRequest: z.ZodObject<{
3688
3088
  }[];
3689
3089
  options?: {
3690
3090
  metadataForCallbacks?: any;
3691
- queuePriority?: number | undefined;
3692
3091
  } | undefined;
3693
3092
  tools?: {
3694
3093
  type: "function";
@@ -3787,7 +3186,6 @@ declare const GatewayCompleteChatRequest: z.ZodObject<{
3787
3186
  }[];
3788
3187
  options?: {
3789
3188
  metadataForCallbacks?: any;
3790
- queuePriority?: number | undefined;
3791
3189
  } | undefined;
3792
3190
  tools?: {
3793
3191
  type: "function";
@@ -4133,14 +3531,11 @@ declare const GatewayStreamChatRequest: z.ZodObject<{
4133
3531
  metadata?: any;
4134
3532
  }>]>, "many">>;
4135
3533
  options: z.ZodOptional<z.ZodObject<{
4136
- queuePriority: z.ZodOptional<z.ZodNumber>;
4137
3534
  metadataForCallbacks: z.ZodOptional<z.ZodAny>;
4138
3535
  }, "strip", z.ZodTypeAny, {
4139
3536
  metadataForCallbacks?: any;
4140
- queuePriority?: number | undefined;
4141
3537
  }, {
4142
3538
  metadataForCallbacks?: any;
4143
- queuePriority?: number | undefined;
4144
3539
  }>>;
4145
3540
  }, "strip", z.ZodTypeAny, {
4146
3541
  config: Record<string, any>;
@@ -4227,7 +3622,6 @@ declare const GatewayStreamChatRequest: z.ZodObject<{
4227
3622
  }[];
4228
3623
  options?: {
4229
3624
  metadataForCallbacks?: any;
4230
- queuePriority?: number | undefined;
4231
3625
  } | undefined;
4232
3626
  tools?: {
4233
3627
  type: "function";
@@ -4326,7 +3720,6 @@ declare const GatewayStreamChatRequest: z.ZodObject<{
4326
3720
  }[];
4327
3721
  options?: {
4328
3722
  metadataForCallbacks?: any;
4329
- queuePriority?: number | undefined;
4330
3723
  } | undefined;
4331
3724
  tools?: {
4332
3725
  type: "function";
@@ -4594,15 +3987,15 @@ type GatewayGetEmbeddingsRequestType = z.infer<typeof GatewayGetEmbeddingsReques
4594
3987
  declare class Gateway {
4595
3988
  private options;
4596
3989
  private httpClient;
4597
- private completeQueue;
4598
- private embeddingQueue;
3990
+ private queues;
3991
+ private caches;
4599
3992
  constructor(options: GatewayOptionsType);
4600
3993
  completeChat(request: GatewayCompleteChatRequestType): Promise<CompleteChatHandlerResponseType>;
4601
- private executeCompleteChatTask;
3994
+ private executeCompleteChat;
4602
3995
  streamChat(request: GatewayStreamChatRequestType): AsyncGenerator<StreamChatHandlerResponseType, void, unknown>;
4603
3996
  getEmbeddings(request: GatewayGetEmbeddingsRequestType): Promise<GetEmbeddingsHandlerResponseType>;
4604
3997
  private executeGetEmbeddingsTask;
4605
3998
  static GatewayError: typeof GatewayError;
4606
3999
  }
4607
4000
 
4608
- export { type CompleteChatCallbackType, CompleteChatHandlerRequest, type CompleteChatHandlerRequestType, CompleteChatHandlerResponse, type CompleteChatHandlerResponseType, Gateway, type GatewayCallbackType, GatewayError, type GatewayOptionsType, type GetEmbeddingsCallbackType, GetEmbeddingsHandlerRequest, type GetEmbeddingsHandlerRequestType, GetEmbeddingsHandlerResponse, type GetEmbeddingsHandlerResponseType, type HttpClient, type HttpClientResponse, IsomorphicHttpClient, IsomorphicHttpClientError, type Queue, SimpleQueue, type StreamChatCallbackType, StreamChatHandlerRequest, type StreamChatHandlerRequestType, StreamChatHandlerResponse, type StreamChatHandlerResponseType, type Task, handleCompleteChat, handleGetEmbeddings, handleStreamChat };
4001
+ export { type Cache, Gateway, GatewayError, type GatewayOptionsType, type HttpClient, HttpClientError, type HttpClientResponse, HttpRequestError, IsomorphicHttpClient, LRUCache, type Queue, QueueOptions, type QueueOptionsType, type QueueTask, QueueTaskTimeoutError, SimpleQueue };