@layer-ai/sdk 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,1629 +1,2983 @@
1
- // Centralized model registry - single source of truth
2
- // Only includes models from supported providers (openai, anthropic, google)
1
+ // AUTO-GENERATED FILE - DO NOT EDIT MANUALLY
2
+ // Generated at: 2026-01-02T09:52:55.923Z
3
+ // Source: Internal Model Registry API
4
+ // To update: Run `pnpm sync:registry`
3
5
  //
4
- // Data sources:
5
- // - AIMLAPI: model discovery, categorization, context lengths (all model types)
6
- // - Artificial Analysis API: pricing, benchmarks, performance metrics (chat models only)
7
- //
8
- // To update: Run `pnpm run sync:models` (requires AIMLAPI_API_KEY and ARTIFICIAL_ANALYSIS_API_KEY in .env)
9
- // APIs:
10
- // - https://api.aimlapi.com/models
11
- // - https://artificialanalysis.ai/api/v2/data/llms/models
12
- // Data attribution: https://aimlapi.com, https://artificialanalysis.ai/
6
+ // Registry version: 2026-01-02
7
+ // Last sync: 2026-01-02T09:52:55.918Z
8
+ // Total models: 103
13
9
  // Providers we support with adapters
14
10
  export const SUPPORTED_PROVIDERS = ['openai', 'anthropic', 'google', 'mistral'];
15
11
  export const MODEL_REGISTRY = {
16
- // Openai models
17
- 'openai/gpt-4o': {
12
+ 'claude-3-7-sonnet-20250219': {
18
13
  type: 'chat',
19
- provider: 'openai',
20
- displayName: 'GPT 4o',
21
- pricing: { input: 0.0025, output: 0.01 },
22
- benchmarks: {
23
- intelligence: 27,
24
- coding: 24,
25
- math: 6,
26
- mmluPro: 0.748,
27
- gpqa: 0.543,
28
- },
29
- performance: {
30
- outputTokenPerSecond: 235.657,
31
- timeTofirstToken: 0.323,
32
- intelligenceScore: 27,
33
- },
34
- lastUpdated: '2025-12-24',
14
+ provider: 'anthropic',
15
+ displayName: 'Claude Sonnet 3.7',
16
+ description: 'Legacy fast model with extended thinking support',
17
+ pricing: { input: 3, output: 15 },
18
+ benchmarks: {
19
+ intelligence: 49.9,
20
+ coding: 35.8,
21
+ math: 56.3,
22
+ mmluPro: 0.84,
23
+ gpqa: 0.77,
24
+ },
25
+ performance: {
26
+ intelligenceScore: 49.9,
27
+ },
28
+ contextLength: 200000,
29
+ context: {
30
+ input: {
31
+ text: true,
32
+ audio: false,
33
+ image: true,
34
+ video: false
35
+ },
36
+ output: {
37
+ text: true,
38
+ audio: false,
39
+ image: false,
40
+ video: false
41
+ }
42
+ },
43
+ deprecated: false,
44
+ isAvailable: true,
45
+ lastUpdated: '2026-01-02',
35
46
  },
36
- 'gpt-4o-2024-08-06': {
47
+ 'claude-3-haiku-20240307': {
37
48
  type: 'chat',
38
- provider: 'openai',
39
- displayName: 'GPT 4o 2024-08-06',
40
- pricing: { input: 0.0025, output: 0.01 },
49
+ provider: 'anthropic',
50
+ displayName: 'Claude Haiku 3',
51
+ description: 'Legacy fast model with 4K token output',
52
+ pricing: { input: 0.25, output: 1.25 },
41
53
  benchmarks: {
42
- intelligence: 29,
43
- gpqa: 0.521,
54
+ intelligence: 1,
55
+ coding: 7.8,
56
+ mmluPro: 0.43,
57
+ gpqa: 0.33,
44
58
  },
45
59
  performance: {
46
- outputTokenPerSecond: 123.952,
47
- timeTofirstToken: 0.436,
48
- intelligenceScore: 29,
60
+ intelligenceScore: 1,
49
61
  },
50
- lastUpdated: '2025-12-24',
62
+ contextLength: 200000,
63
+ context: {
64
+ input: {
65
+ text: true,
66
+ audio: false,
67
+ image: true,
68
+ video: false
69
+ },
70
+ output: {
71
+ text: true,
72
+ audio: false,
73
+ image: false,
74
+ video: false
75
+ }
76
+ },
77
+ deprecated: false,
78
+ isAvailable: true,
79
+ lastUpdated: '2026-01-02',
51
80
  },
52
- 'gpt-4o-2024-05-13': {
81
+ 'claude-haiku-4-5-20251001': {
53
82
  type: 'chat',
54
- provider: 'openai',
55
- displayName: 'GPT 4o 2024-05-13',
56
- pricing: { input: 0.005, output: 0.015 },
83
+ provider: 'anthropic',
84
+ displayName: 'Claude Haiku 4.5',
85
+ description: 'Our fastest model with near-frontier intelligence',
86
+ pricing: { input: 1, output: 5 },
57
87
  benchmarks: {
58
- intelligence: 26.3,
59
- coding: 24.2,
60
- mmluPro: 0.74,
61
- gpqa: 0.526,
88
+ intelligence: 20.2,
89
+ mmluPro: 0.63,
90
+ gpqa: 0.41,
62
91
  },
63
92
  performance: {
64
- outputTokenPerSecond: 118.509,
65
- timeTofirstToken: 0.483,
66
- intelligenceScore: 26.3,
93
+ intelligenceScore: 20.2,
67
94
  },
68
- lastUpdated: '2025-12-24',
95
+ contextLength: 200000,
96
+ context: {
97
+ input: {
98
+ text: true,
99
+ audio: false,
100
+ image: true,
101
+ video: false
102
+ },
103
+ output: {
104
+ text: true,
105
+ audio: false,
106
+ image: false,
107
+ video: false
108
+ }
109
+ },
110
+ deprecated: false,
111
+ isAvailable: true,
112
+ lastUpdated: '2026-01-02',
69
113
  },
70
- 'gpt-4o-mini': {
114
+ 'claude-opus-4-1-20250805': {
71
115
  type: 'chat',
72
- provider: 'openai',
73
- displayName: 'GPT 4o mini',
74
- pricing: { input: 0.00015, output: 0.0006 },
75
- benchmarks: {
76
- intelligence: 21.2,
77
- math: 14.7,
78
- mmluPro: 0.648,
79
- gpqa: 0.426,
80
- },
81
- performance: {
82
- outputTokenPerSecond: 47.79,
83
- timeTofirstToken: 0.58,
84
- intelligenceScore: 21.2,
85
- },
86
- lastUpdated: '2025-12-24',
116
+ provider: 'anthropic',
117
+ displayName: 'Claude Opus 4.1',
118
+ description: 'Legacy premium model with moderate latency',
119
+ pricing: { input: 15, output: 75 },
120
+ benchmarks: {
121
+ intelligence: 59.3,
122
+ coding: 46.1,
123
+ math: 80.3,
124
+ mmluPro: 0.88,
125
+ gpqa: 0.81,
126
+ },
127
+ performance: {
128
+ intelligenceScore: 59.3,
129
+ },
130
+ contextLength: 200000,
131
+ context: {
132
+ input: {
133
+ text: true,
134
+ audio: false,
135
+ image: true,
136
+ video: false
137
+ },
138
+ output: {
139
+ text: true,
140
+ audio: false,
141
+ image: false,
142
+ video: false
143
+ }
144
+ },
145
+ deprecated: false,
146
+ isAvailable: true,
147
+ lastUpdated: '2026-01-02',
87
148
  },
88
- 'gpt-4o-mini-2024-07-18': {
149
+ 'claude-opus-4-5-20251101': {
89
150
  type: 'chat',
90
- provider: 'openai',
91
- displayName: 'GPT 4o mini 2024-07-18',
92
- pricing: { input: 0.00015, output: 0.0006 },
93
- benchmarks: {
94
- intelligence: 21.2,
95
- math: 14.7,
96
- mmluPro: 0.648,
97
- gpqa: 0.426,
98
- },
99
- performance: {
100
- outputTokenPerSecond: 47.79,
101
- timeTofirstToken: 0.58,
102
- intelligenceScore: 21.2,
103
- },
104
- lastUpdated: '2025-12-24',
151
+ provider: 'anthropic',
152
+ displayName: 'Claude Opus 4.5',
153
+ description: 'Premium model combining maximum intelligence with practical performance',
154
+ pricing: { input: 5, output: 25 },
155
+ benchmarks: {
156
+ intelligence: 9.7,
157
+ coding: 14,
158
+ mmluPro: 0.5,
159
+ gpqa: 0.32,
160
+ },
161
+ performance: {
162
+ intelligenceScore: 9.7,
163
+ },
164
+ contextLength: 200000,
165
+ context: {
166
+ input: {
167
+ text: true,
168
+ audio: false,
169
+ image: true,
170
+ video: false
171
+ },
172
+ output: {
173
+ text: true,
174
+ audio: false,
175
+ image: false,
176
+ video: false
177
+ }
178
+ },
179
+ deprecated: false,
180
+ isAvailable: true,
181
+ lastUpdated: '2026-01-02',
105
182
  },
106
- 'chatgpt-4o-latest': {
183
+ 'claude-sonnet-4-20250514': {
107
184
  type: 'chat',
108
- provider: 'openai',
109
- displayName: 'ChatGPT 4o latest',
110
- pricing: { input: 0.005, output: 0.015 },
185
+ provider: 'anthropic',
186
+ displayName: 'Claude Sonnet 4',
187
+ description: 'Legacy fast model with extended thinking support',
188
+ pricing: { input: 3, output: 15 },
111
189
  benchmarks: {
112
- intelligence: 25.3,
113
- mmluPro: 0.773,
114
- gpqa: 0.511,
190
+ intelligence: 44.4,
191
+ coding: 35.9,
192
+ math: 38,
193
+ mmluPro: 0.84,
194
+ gpqa: 0.68,
115
195
  },
116
196
  performance: {
117
- outputTokenPerSecond: 244.456,
118
- timeTofirstToken: 0.925,
119
- intelligenceScore: 25.3,
197
+ intelligenceScore: 44.4,
120
198
  },
121
- lastUpdated: '2025-12-24',
199
+ contextLength: 200000,
200
+ context: {
201
+ input: {
202
+ text: true,
203
+ audio: false,
204
+ image: true,
205
+ video: false
206
+ },
207
+ output: {
208
+ text: true,
209
+ audio: false,
210
+ image: false,
211
+ video: false
212
+ }
213
+ },
214
+ deprecated: false,
215
+ isAvailable: true,
216
+ lastUpdated: '2026-01-02',
122
217
  },
123
- 'gpt-4-turbo': {
218
+ 'claude-sonnet-4-5-20250929': {
124
219
  type: 'chat',
125
- provider: 'openai',
126
- displayName: 'GPT 4 turbo',
127
- pricing: { input: 0.01, output: 0.03 },
220
+ provider: 'anthropic',
221
+ displayName: 'Claude Sonnet 4.5',
222
+ description: 'Our smart model for complex agents and coding',
223
+ pricing: { input: 3, output: 15 },
128
224
  benchmarks: {
129
- intelligence: 24.2,
130
- coding: 21.5,
131
- mmluPro: 0.694,
225
+ intelligence: 49.6,
226
+ coding: 42.9,
227
+ math: 37,
228
+ mmluPro: 0.86,
229
+ gpqa: 0.73,
132
230
  },
133
231
  performance: {
134
- outputTokenPerSecond: 40.254,
135
- timeTofirstToken: 0.847,
136
- intelligenceScore: 24.2,
232
+ intelligenceScore: 49.6,
137
233
  },
138
- lastUpdated: '2025-12-24',
139
- },
140
- 'gpt-4-turbo-2024-04-09': {
234
+ contextLength: 200000,
235
+ context: {
236
+ input: {
237
+ text: true,
238
+ audio: false,
239
+ image: true,
240
+ video: false
241
+ },
242
+ output: {
243
+ text: true,
244
+ audio: false,
245
+ image: false,
246
+ video: false
247
+ }
248
+ },
249
+ deprecated: false,
250
+ isAvailable: true,
251
+ lastUpdated: '2026-01-02',
252
+ },
253
+ 'embedding-001': {
254
+ type: 'embedding',
255
+ provider: 'google',
256
+ displayName: 'Embedding 001',
257
+ description: 'Legacy embedding model for text embeddings',
258
+ pricing: { input: 0.15, output: 0 },
259
+ context: {
260
+ input: {
261
+ text: true,
262
+ audio: false,
263
+ image: false,
264
+ video: false
265
+ },
266
+ output: {
267
+ text: false,
268
+ audio: false,
269
+ image: false,
270
+ video: false
271
+ }
272
+ },
273
+ deprecated: false,
274
+ isAvailable: true,
275
+ lastUpdated: '2026-01-02',
276
+ },
277
+ 'gemini-2.0-flash': {
141
278
  type: 'chat',
142
- provider: 'openai',
143
- displayName: 'GPT 4 turbo 2024-04-09',
144
- pricing: { input: 0.01, output: 0.03 },
145
- benchmarks: {
146
- intelligence: 24.2,
147
- coding: 21.5,
148
- mmluPro: 0.694,
149
- },
150
- performance: {
151
- outputTokenPerSecond: 40.254,
152
- timeTofirstToken: 0.847,
153
- intelligenceScore: 24.2,
154
- },
155
- lastUpdated: '2025-12-24',
156
- },
157
- 'gpt-4': {
279
+ provider: 'google',
280
+ displayName: 'Gemini 2.0 Flash',
281
+ description: 'Second generation workhorse model with 1 million token context window, superior speed, native tool use, and next-gen features',
282
+ pricing: { input: 0.1, output: 0.4 },
283
+ benchmarks: {
284
+ intelligence: 12.8,
285
+ coding: 17.6,
286
+ },
287
+ performance: {
288
+ intelligenceScore: 12.8,
289
+ },
290
+ contextLength: 1048576,
291
+ context: {
292
+ input: {
293
+ text: true,
294
+ audio: true,
295
+ image: true,
296
+ video: true
297
+ },
298
+ output: {
299
+ text: true,
300
+ audio: false,
301
+ image: false,
302
+ video: false
303
+ }
304
+ },
305
+ deprecated: false,
306
+ isAvailable: true,
307
+ lastUpdated: '2026-01-02',
308
+ },
309
+ 'gemini-2.0-flash-exp-image-generation': {
158
310
  type: 'chat',
159
- provider: 'openai',
160
- displayName: 'GPT 4',
161
- pricing: { input: 0.03, output: 0.06 },
311
+ provider: 'google',
312
+ displayName: 'Gemini 2.0 Flash Image',
313
+ description: 'Second generation model with image generation capabilities',
314
+ contextLength: 32768,
315
+ context: {
316
+ input: {
317
+ text: true,
318
+ audio: true,
319
+ image: true,
320
+ video: true
321
+ },
322
+ output: {
323
+ text: true,
324
+ audio: false,
325
+ image: true,
326
+ video: false
327
+ }
328
+ },
329
+ deprecated: false,
330
+ isAvailable: true,
331
+ lastUpdated: '2026-01-02',
332
+ },
333
+ 'gemini-2.0-flash-lite': {
334
+ type: 'chat',
335
+ provider: 'google',
336
+ displayName: 'Gemini 2.0 Flash-Lite',
337
+ description: 'Second generation small and powerful model with 1 million token context window, optimized for cost efficiency and low latency',
338
+ pricing: { input: 0.075, output: 0.3 },
339
+ benchmarks: {
340
+ intelligence: 26.8,
341
+ mmluPro: 0.72,
342
+ gpqa: 0.54,
343
+ },
344
+ performance: {
345
+ intelligenceScore: 26.8,
346
+ },
347
+ contextLength: 1048576,
348
+ context: {
349
+ input: {
350
+ text: true,
351
+ audio: true,
352
+ image: true,
353
+ video: true
354
+ },
355
+ output: {
356
+ text: true,
357
+ audio: false,
358
+ image: false,
359
+ video: false
360
+ }
361
+ },
362
+ deprecated: false,
363
+ isAvailable: true,
364
+ lastUpdated: '2026-01-02',
365
+ },
366
+ 'gemini-2.5-flash': {
367
+ type: 'chat',
368
+ provider: 'google',
369
+ displayName: 'Gemini 2.5 Flash',
370
+ description: 'Fast and intelligent model with best price-performance, versatile features for high-volume tasks',
371
+ pricing: { input: 0.3, output: 2.5 },
372
+ benchmarks: {
373
+ intelligence: 54.4,
374
+ coding: 42.5,
375
+ math: 78.3,
376
+ mmluPro: 0.84,
377
+ gpqa: 0.79,
378
+ },
379
+ performance: {
380
+ intelligenceScore: 54.4,
381
+ },
382
+ contextLength: 1048576,
383
+ context: {
384
+ input: {
385
+ text: true,
386
+ audio: true,
387
+ image: true,
388
+ video: true
389
+ },
390
+ output: {
391
+ text: true,
392
+ audio: false,
393
+ image: false,
394
+ video: false
395
+ }
396
+ },
397
+ deprecated: false,
398
+ isAvailable: true,
399
+ lastUpdated: '2026-01-02',
400
+ },
401
+ 'gemini-2.5-flash-image': {
402
+ type: 'image-generation',
403
+ provider: 'google',
404
+ displayName: 'Gemini 2.5 Flash Image',
405
+ description: 'Image generation model for creating images from text and image inputs',
406
+ pricing: { input: 0.3, output: 30 },
407
+ contextLength: 65536,
408
+ context: {
409
+ input: {
410
+ text: true,
411
+ audio: false,
412
+ image: true,
413
+ video: false
414
+ },
415
+ output: {
416
+ text: true,
417
+ audio: false,
418
+ image: true,
419
+ video: false
420
+ }
421
+ },
422
+ deprecated: false,
423
+ isAvailable: true,
424
+ lastUpdated: '2026-01-02',
425
+ },
426
+ 'gemini-2.5-flash-lite': {
427
+ type: 'chat',
428
+ provider: 'google',
429
+ displayName: 'Gemini 2.5 Flash-Lite',
430
+ description: 'Ultra fast model optimized for cost efficiency and high throughput',
431
+ pricing: { input: 0.1, output: 0.4 },
432
+ benchmarks: {
433
+ intelligence: 40.1,
434
+ coding: 27.6,
435
+ math: 53.3,
436
+ mmluPro: 0.76,
437
+ gpqa: 0.63,
438
+ },
439
+ performance: {
440
+ intelligenceScore: 40.1,
441
+ },
442
+ contextLength: 1048576,
443
+ context: {
444
+ input: {
445
+ text: true,
446
+ audio: true,
447
+ image: true,
448
+ video: true
449
+ },
450
+ output: {
451
+ text: true,
452
+ audio: false,
453
+ image: false,
454
+ video: false
455
+ }
456
+ },
457
+ deprecated: false,
458
+ isAvailable: true,
459
+ lastUpdated: '2026-01-02',
460
+ },
461
+ 'gemini-2.5-flash-preview-tts': {
462
+ type: 'tts',
463
+ provider: 'google',
464
+ displayName: 'Gemini 2.5 Flash TTS',
465
+ description: 'Text-to-speech model for audio generation',
466
+ pricing: { input: 0.5, output: 100 },
467
+ contextLength: 8192,
468
+ context: {
469
+ input: {
470
+ text: true,
471
+ audio: false,
472
+ image: false,
473
+ video: false
474
+ },
475
+ output: {
476
+ text: false,
477
+ audio: true,
478
+ image: false,
479
+ video: false
480
+ }
481
+ },
482
+ deprecated: false,
483
+ isAvailable: true,
484
+ lastUpdated: '2026-01-02',
485
+ },
486
+ 'gemini-2.5-pro': {
487
+ type: 'chat',
488
+ provider: 'google',
489
+ displayName: 'Gemini 2.5 Pro',
490
+ description: 'Advanced thinking model for complex reasoning in code, math, and STEM, with long context for analyzing large datasets, codebases, and documents',
491
+ pricing: { input: 1.25, output: 10 },
492
+ benchmarks: {
493
+ intelligence: 53.2,
494
+ mmluPro: 0.84,
495
+ gpqa: 0.82,
496
+ },
497
+ performance: {
498
+ intelligenceScore: 53.2,
499
+ },
500
+ contextLength: 1048576,
501
+ context: {
502
+ input: {
503
+ pdf: true,
504
+ text: true,
505
+ audio: true,
506
+ image: true,
507
+ video: true
508
+ },
509
+ output: {
510
+ text: true,
511
+ audio: false,
512
+ image: false,
513
+ video: false
514
+ }
515
+ },
516
+ deprecated: false,
517
+ isAvailable: true,
518
+ lastUpdated: '2026-01-02',
519
+ },
520
+ 'gemini-2.5-pro-preview-tts': {
521
+ type: 'tts',
522
+ provider: 'google',
523
+ displayName: 'Gemini 2.5 Pro TTS',
524
+ description: 'Text-to-speech model for audio generation',
525
+ pricing: { input: 1, output: 20 },
526
+ contextLength: 8192,
527
+ context: {
528
+ input: {
529
+ text: true,
530
+ audio: false,
531
+ image: false,
532
+ video: false
533
+ },
534
+ output: {
535
+ text: false,
536
+ audio: true,
537
+ image: false,
538
+ video: false
539
+ }
540
+ },
541
+ deprecated: false,
542
+ isAvailable: true,
543
+ lastUpdated: '2026-01-02',
544
+ },
545
+ 'gemini-3-flash-preview': {
546
+ type: 'chat',
547
+ provider: 'google',
548
+ displayName: 'Gemini 3 Flash Preview',
549
+ description: 'Most balanced model designed for speed, scale and the latest AI',
550
+ pricing: { input: 0.5, output: 3 },
551
+ benchmarks: {
552
+ intelligence: 71.3,
553
+ coding: 59.2,
554
+ math: 97,
555
+ mmluPro: 0.89,
556
+ gpqa: 0.9,
557
+ },
558
+ performance: {
559
+ intelligenceScore: 71.3,
560
+ },
561
+ contextLength: 1048576,
562
+ context: {
563
+ input: {
564
+ text: true,
565
+ audio: true,
566
+ image: true,
567
+ video: true
568
+ },
569
+ output: {
570
+ text: true,
571
+ audio: false,
572
+ image: false,
573
+ video: false
574
+ }
575
+ },
576
+ deprecated: false,
577
+ isAvailable: true,
578
+ lastUpdated: '2026-01-02',
579
+ },
580
+ 'gemini-3-pro-image-preview': {
581
+ type: 'image-generation',
582
+ provider: 'google',
583
+ displayName: 'Gemini 3 Pro Image Preview',
584
+ description: 'Image generation model for creating images from text and image inputs',
585
+ pricing: { input: 2, output: 12 },
586
+ contextLength: 65536,
587
+ context: {
588
+ input: {
589
+ text: true,
590
+ audio: false,
591
+ image: true,
592
+ video: false
593
+ },
594
+ output: {
595
+ text: true,
596
+ audio: false,
597
+ image: true,
598
+ video: false
599
+ }
600
+ },
601
+ deprecated: false,
602
+ isAvailable: true,
603
+ lastUpdated: '2026-01-02',
604
+ },
605
+ 'gemini-3-pro-preview': {
606
+ type: 'chat',
607
+ provider: 'google',
608
+ displayName: 'Gemini 3 Pro Preview',
609
+ description: 'Most intelligent model with advanced reasoning, richer visuals and deeper interactions',
610
+ pricing: { input: 2, output: 12 },
611
+ benchmarks: {
612
+ intelligence: 64.5,
613
+ coding: 55.8,
614
+ math: 86.7,
615
+ mmluPro: 0.9,
616
+ gpqa: 0.89,
617
+ },
618
+ performance: {
619
+ intelligenceScore: 64.5,
620
+ },
621
+ contextLength: 1048576,
622
+ context: {
623
+ input: {
624
+ text: true,
625
+ audio: true,
626
+ image: true,
627
+ video: true
628
+ },
629
+ output: {
630
+ text: true,
631
+ audio: false,
632
+ image: false,
633
+ video: false
634
+ }
635
+ },
636
+ deprecated: false,
637
+ isAvailable: true,
638
+ lastUpdated: '2026-01-02',
639
+ },
640
+ 'gemini-robotics-er-1.5-preview': {
641
+ type: 'chat',
642
+ provider: 'google',
643
+ displayName: 'Gemini Robotics ER 1.5 Preview',
644
+ description: 'Robotics model for embodied reasoning and control tasks',
645
+ pricing: { input: 0.3, output: 2.5 },
646
+ context: {
647
+ input: {
648
+ text: true,
649
+ audio: false,
650
+ image: true,
651
+ video: true
652
+ },
653
+ output: {
654
+ text: true,
655
+ audio: false,
656
+ image: false,
657
+ video: false
658
+ }
659
+ },
660
+ deprecated: false,
661
+ isAvailable: true,
662
+ lastUpdated: '2026-01-02',
663
+ },
664
+ 'gemma-3-12b-it': {
665
+ type: 'chat',
666
+ provider: 'google',
667
+ displayName: 'Gemma 3 12B IT',
668
+ description: 'Medium instruction-tuned Gemma model',
669
+ pricing: { input: 0, output: 0 },
162
670
  benchmarks: {
163
- intelligence: 21.5,
164
- coding: 13.1,
671
+ intelligence: 20.4,
672
+ coding: 10.6,
673
+ math: 18.3,
674
+ mmluPro: 0.6,
675
+ gpqa: 0.35,
165
676
  },
166
677
  performance: {
167
- outputTokenPerSecond: 29.898,
168
- timeTofirstToken: 0.781,
169
- intelligenceScore: 21.5,
678
+ intelligenceScore: 20.4,
170
679
  },
171
- lastUpdated: '2025-12-24',
172
- },
173
- 'gpt-4-0125-preview': {
680
+ context: {
681
+ input: {
682
+ text: true,
683
+ audio: false,
684
+ image: false,
685
+ video: false
686
+ },
687
+ output: {
688
+ text: true,
689
+ audio: false,
690
+ image: false,
691
+ video: false
692
+ }
693
+ },
694
+ deprecated: false,
695
+ isAvailable: true,
696
+ lastUpdated: '2026-01-02',
697
+ },
698
+ 'gemma-3-1b-it': {
174
699
  type: 'chat',
175
- provider: 'openai',
176
- displayName: 'GPT 4 0125 preview',
177
- pricing: { input: 0.03, output: 0.06 },
700
+ provider: 'google',
701
+ displayName: 'Gemma 3 1B IT',
702
+ description: 'Compact instruction-tuned Gemma model',
703
+ pricing: { input: 0, output: 0 },
704
+ benchmarks: {
705
+ intelligence: 12.5,
706
+ mmluPro: 0.48,
707
+ gpqa: 0.28,
708
+ },
709
+ performance: {
710
+ intelligenceScore: 12.5,
711
+ },
712
+ context: {
713
+ input: {
714
+ text: true,
715
+ audio: false,
716
+ image: false,
717
+ video: false
718
+ },
719
+ output: {
720
+ text: true,
721
+ audio: false,
722
+ image: false,
723
+ video: false
724
+ }
725
+ },
726
+ deprecated: false,
727
+ isAvailable: true,
728
+ lastUpdated: '2026-01-02',
729
+ },
730
+ 'gemma-3-27b-it': {
731
+ type: 'chat',
732
+ provider: 'google',
733
+ displayName: 'Gemma 3 27B IT',
734
+ description: 'Large instruction-tuned Gemma model',
735
+ pricing: { input: 0, output: 0 },
178
736
  benchmarks: {
179
- intelligence: 21.5,
180
- coding: 13.1,
737
+ intelligence: 22.1,
738
+ coding: 12.8,
739
+ math: 20.7,
740
+ mmluPro: 0.67,
741
+ gpqa: 0.43,
181
742
  },
182
743
  performance: {
183
- outputTokenPerSecond: 29.898,
184
- timeTofirstToken: 0.781,
185
- intelligenceScore: 21.5,
744
+ intelligenceScore: 22.1,
186
745
  },
187
- lastUpdated: '2025-12-24',
188
- },
189
- 'gpt-4-1106-preview': {
746
+ context: {
747
+ input: {
748
+ text: true,
749
+ audio: false,
750
+ image: false,
751
+ video: false
752
+ },
753
+ output: {
754
+ text: true,
755
+ audio: false,
756
+ image: false,
757
+ video: false
758
+ }
759
+ },
760
+ deprecated: false,
761
+ isAvailable: true,
762
+ lastUpdated: '2026-01-02',
763
+ },
764
+ 'gemma-3-4b-it': {
190
765
  type: 'chat',
191
- provider: 'openai',
192
- displayName: 'GPT 4 1106 preview',
193
- pricing: { input: 0.03, output: 0.06 },
766
+ provider: 'google',
767
+ displayName: 'Gemma 3 4B IT',
768
+ description: 'Small instruction-tuned Gemma model',
769
+ pricing: { input: 0, output: 0 },
194
770
  benchmarks: {
195
- intelligence: 21.5,
196
- coding: 13.1,
771
+ intelligence: 15.5,
772
+ coding: 8.3,
773
+ math: 14.3,
774
+ mmluPro: 0.49,
775
+ gpqa: 0.3,
197
776
  },
198
777
  performance: {
199
- outputTokenPerSecond: 29.898,
200
- timeTofirstToken: 0.781,
201
- intelligenceScore: 21.5,
778
+ intelligenceScore: 15.5,
202
779
  },
203
- lastUpdated: '2025-12-24',
780
+ context: {
781
+ input: {
782
+ text: true,
783
+ audio: false,
784
+ image: false,
785
+ video: false
786
+ },
787
+ output: {
788
+ text: true,
789
+ audio: false,
790
+ image: false,
791
+ video: false
792
+ }
793
+ },
794
+ deprecated: false,
795
+ isAvailable: true,
796
+ lastUpdated: '2026-01-02',
797
+ },
798
+ 'imagen-4.0-fast-generate-001': {
799
+ type: 'image-generation',
800
+ provider: 'google',
801
+ displayName: 'Imagen 4.0 Fast',
802
+ description: 'Fast image generation model',
803
+ pricing: { input: 0, output: 0 },
804
+ context: {
805
+ input: {
806
+ text: true,
807
+ audio: false,
808
+ image: false,
809
+ video: false
810
+ },
811
+ output: {
812
+ text: false,
813
+ audio: false,
814
+ image: true,
815
+ video: false
816
+ }
817
+ },
818
+ deprecated: false,
819
+ isAvailable: true,
820
+ lastUpdated: '2026-01-02',
821
+ },
822
+ 'imagen-4.0-generate-001': {
823
+ type: 'image-generation',
824
+ provider: 'google',
825
+ displayName: 'Imagen 4.0',
826
+ description: 'Image generation model',
827
+ pricing: { input: 0, output: 0 },
828
+ context: {
829
+ input: {
830
+ text: true,
831
+ audio: false,
832
+ image: false,
833
+ video: false
834
+ },
835
+ output: {
836
+ text: false,
837
+ audio: false,
838
+ image: true,
839
+ video: false
840
+ }
841
+ },
842
+ deprecated: false,
843
+ isAvailable: true,
844
+ lastUpdated: '2026-01-02',
845
+ },
846
+ 'imagen-4.0-ultra-generate-001': {
847
+ type: 'image-generation',
848
+ provider: 'google',
849
+ displayName: 'Imagen 4.0 Ultra',
850
+ description: 'Ultra quality image generation model',
851
+ pricing: { input: 0, output: 0 },
852
+ context: {
853
+ input: {
854
+ text: true,
855
+ audio: false,
856
+ image: false,
857
+ video: false
858
+ },
859
+ output: {
860
+ text: false,
861
+ audio: false,
862
+ image: true,
863
+ video: false
864
+ }
865
+ },
866
+ deprecated: false,
867
+ isAvailable: true,
868
+ lastUpdated: '2026-01-02',
204
869
  },
205
- 'gpt-3.5-turbo': {
870
+ 'text-embedding-004': {
871
+ type: 'embedding',
872
+ provider: 'google',
873
+ displayName: 'Text Embedding 004',
874
+ description: 'Text embedding model for semantic similarity and retrieval',
875
+ pricing: { input: 0.6, output: 0 },
876
+ context: {
877
+ input: {
878
+ text: true,
879
+ audio: false,
880
+ image: false,
881
+ video: false
882
+ },
883
+ output: {
884
+ text: false,
885
+ audio: false,
886
+ image: false,
887
+ video: false
888
+ }
889
+ },
890
+ deprecated: false,
891
+ isAvailable: true,
892
+ lastUpdated: '2026-01-02',
893
+ },
894
+ 'veo-2.0-generate-001': {
895
+ type: 'video-generation',
896
+ provider: 'google',
897
+ displayName: 'Veo 2.0',
898
+ description: 'Video generation model',
899
+ pricing: { input: 0, output: 0 },
900
+ context: {
901
+ input: {
902
+ text: true,
903
+ audio: false,
904
+ image: false,
905
+ video: false
906
+ },
907
+ output: {
908
+ text: false,
909
+ audio: false,
910
+ image: false,
911
+ video: true
912
+ }
913
+ },
914
+ deprecated: false,
915
+ isAvailable: true,
916
+ lastUpdated: '2026-01-02',
917
+ },
918
+ 'veo-3.0-fast-generate-001': {
919
+ type: 'video-generation',
920
+ provider: 'google',
921
+ displayName: 'Veo 3.0 Fast',
922
+ description: 'Fast video generation model',
923
+ pricing: { input: 0, output: 0 },
924
+ context: {
925
+ input: {
926
+ text: true,
927
+ audio: false,
928
+ image: false,
929
+ video: false
930
+ },
931
+ output: {
932
+ text: false,
933
+ audio: false,
934
+ image: false,
935
+ video: true
936
+ }
937
+ },
938
+ deprecated: false,
939
+ isAvailable: true,
940
+ lastUpdated: '2026-01-02',
941
+ },
942
+ 'veo-3.0-generate-001': {
943
+ type: 'video-generation',
944
+ provider: 'google',
945
+ displayName: 'Veo 3.0',
946
+ description: 'Video generation model',
947
+ pricing: { input: 0, output: 0 },
948
+ context: {
949
+ input: {
950
+ text: true,
951
+ audio: false,
952
+ image: false,
953
+ video: false
954
+ },
955
+ output: {
956
+ text: false,
957
+ audio: false,
958
+ image: false,
959
+ video: true
960
+ }
961
+ },
962
+ deprecated: false,
963
+ isAvailable: true,
964
+ lastUpdated: '2026-01-02',
965
+ },
966
+ 'veo-3.1-fast-generate-preview': {
967
+ type: 'video-generation',
968
+ provider: 'google',
969
+ displayName: 'Veo 3.1 Fast',
970
+ description: 'Fast video generation model',
971
+ pricing: { input: 0, output: 0 },
972
+ context: {
973
+ input: {
974
+ text: true,
975
+ audio: false,
976
+ image: false,
977
+ video: false
978
+ },
979
+ output: {
980
+ text: false,
981
+ audio: false,
982
+ image: false,
983
+ video: true
984
+ }
985
+ },
986
+ deprecated: false,
987
+ isAvailable: true,
988
+ lastUpdated: '2026-01-02',
989
+ },
990
+ 'veo-3.1-generate-preview': {
991
+ type: 'video-generation',
992
+ provider: 'google',
993
+ displayName: 'Veo 3.1',
994
+ description: 'Video generation model',
995
+ pricing: { input: 0, output: 0 },
996
+ context: {
997
+ input: {
998
+ text: true,
999
+ audio: false,
1000
+ image: false,
1001
+ video: false
1002
+ },
1003
+ output: {
1004
+ text: false,
1005
+ audio: false,
1006
+ image: false,
1007
+ video: true
1008
+ }
1009
+ },
1010
+ deprecated: false,
1011
+ isAvailable: true,
1012
+ lastUpdated: '2026-01-02',
1013
+ },
1014
+ 'codestral-2412': {
206
1015
  type: 'chat',
207
- provider: 'openai',
208
- displayName: 'GPT 3.5 turbo',
209
- pricing: { input: 0.0005, output: 0.0015 },
1016
+ provider: 'mistral',
1017
+ displayName: 'Codestral',
1018
+ description: 'Our cutting-edge language model for code completion released end of July 2025.',
210
1019
  benchmarks: {
211
- intelligence: 8.3,
212
- coding: 10.7,
213
- mmluPro: 0.462,
214
- gpqa: 0.297,
1020
+ intelligence: 68.5,
1021
+ coding: 53.5,
1022
+ math: 98.7,
1023
+ mmluPro: 0.87,
1024
+ gpqa: 0.84,
215
1025
  },
216
1026
  performance: {
217
- outputTokenPerSecond: 129.872,
218
- timeTofirstToken: 0.68,
219
- intelligenceScore: 8.3,
1027
+ intelligenceScore: 68.5,
220
1028
  },
221
- lastUpdated: '2025-12-24',
222
- },
223
- 'gpt-3.5-turbo-0125': {
1029
+ context: {
1030
+ input: {
1031
+ text: true,
1032
+ audio: false,
1033
+ image: false,
1034
+ video: false
1035
+ },
1036
+ output: {
1037
+ text: true,
1038
+ audio: false,
1039
+ image: false,
1040
+ video: false
1041
+ }
1042
+ },
1043
+ deprecated: false,
1044
+ isAvailable: true,
1045
+ lastUpdated: '2026-01-02',
1046
+ },
1047
+ 'codestral-2508': {
224
1048
  type: 'chat',
225
- provider: 'openai',
226
- displayName: 'GPT 3.5 turbo 0125',
227
- pricing: { input: 0.0005, output: 0.0015 },
1049
+ provider: 'mistral',
1050
+ displayName: 'Codestral',
1051
+ description: 'Our cutting-edge language model for code completion released end of July 2025.',
1052
+ context: {
1053
+ input: {
1054
+ text: true,
1055
+ audio: false,
1056
+ image: false,
1057
+ video: false
1058
+ },
1059
+ output: {
1060
+ text: true,
1061
+ audio: false,
1062
+ image: false,
1063
+ video: false
1064
+ }
1065
+ },
1066
+ deprecated: false,
1067
+ isAvailable: true,
1068
+ lastUpdated: '2026-01-02',
1069
+ },
1070
+ 'codestral-embed-2505': {
1071
+ type: 'embedding',
1072
+ provider: 'mistral',
1073
+ displayName: 'Codestral Embed',
1074
+ description: 'Our state-of-the-art semantic for extracting representation of code extracts',
1075
+ pricing: { input: 0.15, output: 0 },
1076
+ context: {
1077
+ input: {
1078
+ text: true,
1079
+ audio: false,
1080
+ image: false,
1081
+ video: false
1082
+ },
1083
+ output: {
1084
+ text: false,
1085
+ audio: false,
1086
+ image: false,
1087
+ video: false
1088
+ }
1089
+ },
1090
+ deprecated: false,
1091
+ isAvailable: true,
1092
+ lastUpdated: '2026-01-02',
1093
+ },
1094
+ 'codestral-latest': {
1095
+ type: 'chat',
1096
+ provider: 'mistral',
1097
+ displayName: 'Codestral',
1098
+ description: 'Our cutting-edge language model for code completion',
1099
+ pricing: { input: 0.3, output: 0.9 },
1100
+ benchmarks: {
1101
+ intelligence: 12.2,
1102
+ mmluPro: 0.47,
1103
+ gpqa: 0.34,
1104
+ },
1105
+ performance: {
1106
+ intelligenceScore: 12.2,
1107
+ },
1108
+ context: {
1109
+ input: {
1110
+ text: true,
1111
+ audio: false,
1112
+ image: false,
1113
+ video: false
1114
+ },
1115
+ output: {
1116
+ text: true,
1117
+ audio: false,
1118
+ image: false,
1119
+ video: false
1120
+ }
1121
+ },
1122
+ deprecated: false,
1123
+ isAvailable: true,
1124
+ lastUpdated: '2026-01-02',
1125
+ },
1126
+ 'devstral-2512': {
1127
+ type: 'chat',
1128
+ provider: 'mistral',
1129
+ displayName: 'Devstral 2',
1130
+ description: 'Our frontier code agents model for solving software engineering tasks.',
1131
+ benchmarks: {
1132
+ intelligence: 19.6,
1133
+ mmluPro: 0.63,
1134
+ gpqa: 0.43,
1135
+ },
1136
+ performance: {
1137
+ intelligenceScore: 19.6,
1138
+ },
1139
+ context: {
1140
+ input: {
1141
+ text: true,
1142
+ audio: false,
1143
+ image: false,
1144
+ video: false
1145
+ },
1146
+ output: {
1147
+ text: true,
1148
+ audio: false,
1149
+ image: false,
1150
+ video: false
1151
+ }
1152
+ },
1153
+ deprecated: false,
1154
+ isAvailable: true,
1155
+ lastUpdated: '2026-01-02',
1156
+ },
1157
+ 'devstral-latest': {
1158
+ type: 'chat',
1159
+ provider: 'mistral',
1160
+ displayName: 'Devstral',
1161
+ description: 'Our frontier code agents model for solving software engineering tasks.',
1162
+ pricing: { input: 0, output: 0 },
1163
+ benchmarks: {
1164
+ intelligence: 27.2,
1165
+ coding: 18.5,
1166
+ math: 29.3,
1167
+ mmluPro: 0.62,
1168
+ gpqa: 0.41,
1169
+ },
1170
+ performance: {
1171
+ intelligenceScore: 27.2,
1172
+ },
1173
+ context: {
1174
+ input: {
1175
+ text: true,
1176
+ audio: false,
1177
+ image: false,
1178
+ video: false
1179
+ },
1180
+ output: {
1181
+ text: true,
1182
+ audio: false,
1183
+ image: false,
1184
+ video: false
1185
+ }
1186
+ },
1187
+ deprecated: false,
1188
+ isAvailable: true,
1189
+ lastUpdated: '2026-01-02',
1190
+ },
1191
+ 'magistral-medium-2509': {
1192
+ type: 'chat',
1193
+ provider: 'mistral',
1194
+ displayName: 'Magistral Medium 1.2',
1195
+ description: 'Our frontier-class multimodal reasoning model.',
1196
+ benchmarks: {
1197
+ intelligence: 33.2,
1198
+ coding: 30.3,
1199
+ math: 40.3,
1200
+ mmluPro: 0.75,
1201
+ gpqa: 0.68,
1202
+ },
1203
+ performance: {
1204
+ intelligenceScore: 33.2,
1205
+ },
1206
+ context: {
1207
+ input: {
1208
+ text: true,
1209
+ audio: false,
1210
+ image: true,
1211
+ video: false
1212
+ },
1213
+ output: {
1214
+ text: true,
1215
+ audio: false,
1216
+ image: false,
1217
+ video: false
1218
+ }
1219
+ },
1220
+ deprecated: false,
1221
+ isAvailable: true,
1222
+ lastUpdated: '2026-01-02',
1223
+ },
1224
+ 'magistral-medium-latest': {
1225
+ type: 'chat',
1226
+ provider: 'mistral',
1227
+ displayName: 'Magistral Medium',
1228
+ description: 'Our frontier-class multimodal reasoning model',
1229
+ pricing: { input: 2, output: 5 },
1230
+ benchmarks: {
1231
+ intelligence: 33.2,
1232
+ coding: 30.3,
1233
+ math: 40.3,
1234
+ mmluPro: 0.75,
1235
+ gpqa: 0.68,
1236
+ },
1237
+ performance: {
1238
+ intelligenceScore: 33.2,
1239
+ },
1240
+ context: {
1241
+ input: {
1242
+ text: true,
1243
+ audio: false,
1244
+ image: true,
1245
+ video: false
1246
+ },
1247
+ output: {
1248
+ text: true,
1249
+ audio: false,
1250
+ image: false,
1251
+ video: false
1252
+ }
1253
+ },
1254
+ deprecated: false,
1255
+ isAvailable: true,
1256
+ lastUpdated: '2026-01-02',
1257
+ },
1258
+ 'magistral-small-2509': {
1259
+ type: 'chat',
1260
+ provider: 'mistral',
1261
+ displayName: 'Magistral Small 1.2',
1262
+ description: 'Our small multimodal reasoning model.',
1263
+ benchmarks: {
1264
+ intelligence: 43,
1265
+ coding: 37.2,
1266
+ math: 80.3,
1267
+ mmluPro: 0.77,
1268
+ gpqa: 0.66,
1269
+ },
1270
+ performance: {
1271
+ intelligenceScore: 43,
1272
+ },
1273
+ context: {
1274
+ input: {
1275
+ text: true,
1276
+ audio: false,
1277
+ image: true,
1278
+ video: false
1279
+ },
1280
+ output: {
1281
+ text: true,
1282
+ audio: false,
1283
+ image: false,
1284
+ video: false
1285
+ }
1286
+ },
1287
+ deprecated: false,
1288
+ isAvailable: true,
1289
+ lastUpdated: '2026-01-02',
1290
+ },
1291
+ 'magistral-small-latest': {
1292
+ type: 'chat',
1293
+ provider: 'mistral',
1294
+ displayName: 'Magistral Small',
1295
+ description: 'Our small multimodal reasoning model',
1296
+ pricing: { input: 0.5, output: 1.5 },
1297
+ benchmarks: {
1298
+ intelligence: 31.9,
1299
+ coding: 26.6,
1300
+ math: 41.3,
1301
+ mmluPro: 0.75,
1302
+ gpqa: 0.64,
1303
+ },
1304
+ performance: {
1305
+ intelligenceScore: 31.9,
1306
+ },
1307
+ context: {
1308
+ input: {
1309
+ text: true,
1310
+ audio: false,
1311
+ image: true,
1312
+ video: false
1313
+ },
1314
+ output: {
1315
+ text: true,
1316
+ audio: false,
1317
+ image: false,
1318
+ video: false
1319
+ }
1320
+ },
1321
+ deprecated: false,
1322
+ isAvailable: true,
1323
+ lastUpdated: '2026-01-02',
1324
+ },
1325
+ 'ministral-14b-2512': {
1326
+ type: 'chat',
1327
+ provider: 'mistral',
1328
+ displayName: 'Ministral 3 14B',
1329
+ description: 'A powerful model offering best-in-class text and vision capabilities.',
1330
+ benchmarks: {
1331
+ intelligence: 30.5,
1332
+ coding: 21,
1333
+ math: 30,
1334
+ mmluPro: 0.69,
1335
+ gpqa: 0.57,
1336
+ },
1337
+ performance: {
1338
+ intelligenceScore: 30.5,
1339
+ },
1340
+ context: {
1341
+ input: {
1342
+ text: true,
1343
+ audio: false,
1344
+ image: true,
1345
+ video: false
1346
+ },
1347
+ output: {
1348
+ text: true,
1349
+ audio: false,
1350
+ image: false,
1351
+ video: false
1352
+ }
1353
+ },
1354
+ deprecated: false,
1355
+ isAvailable: true,
1356
+ lastUpdated: '2026-01-02',
1357
+ },
1358
+ 'ministral-14b-latest': {
1359
+ type: 'chat',
1360
+ provider: 'mistral',
1361
+ displayName: 'Ministral 3 14B',
1362
+ description: 'A powerful model offering best-in-class text and vision capabilities.',
1363
+ pricing: { input: 0.2, output: 0.2 },
228
1364
  benchmarks: {
229
- intelligence: 8.3,
230
- coding: 10.7,
231
- mmluPro: 0.462,
232
- gpqa: 0.297,
1365
+ intelligence: 1,
233
1366
  },
234
1367
  performance: {
235
- outputTokenPerSecond: 129.872,
236
- timeTofirstToken: 0.68,
237
- intelligenceScore: 8.3,
1368
+ intelligenceScore: 1,
238
1369
  },
239
- lastUpdated: '2025-12-24',
240
- },
241
- 'gpt-3.5-turbo-1106': {
1370
+ context: {
1371
+ input: {
1372
+ text: true,
1373
+ audio: false,
1374
+ image: true,
1375
+ video: false
1376
+ },
1377
+ output: {
1378
+ text: true,
1379
+ audio: false,
1380
+ image: false,
1381
+ video: false
1382
+ }
1383
+ },
1384
+ deprecated: false,
1385
+ isAvailable: true,
1386
+ lastUpdated: '2026-01-02',
1387
+ },
1388
+ 'ministral-3b-2512': {
242
1389
  type: 'chat',
243
- provider: 'openai',
244
- displayName: 'GPT 3.5 turbo 1106',
245
- pricing: { input: 0.0005, output: 0.0015 },
1390
+ provider: 'mistral',
1391
+ displayName: 'Ministral 3 3B',
1392
+ description: 'A tiny and efficient model offering best-in-class text and vision capabilities.',
1393
+ benchmarks: {
1394
+ intelligence: 21.8,
1395
+ coding: 13,
1396
+ math: 22,
1397
+ mmluPro: 0.52,
1398
+ gpqa: 0.36,
1399
+ },
1400
+ performance: {
1401
+ intelligenceScore: 21.8,
1402
+ },
1403
+ context: {
1404
+ input: {
1405
+ text: true,
1406
+ audio: false,
1407
+ image: true,
1408
+ video: false
1409
+ },
1410
+ output: {
1411
+ text: true,
1412
+ audio: false,
1413
+ image: false,
1414
+ video: false
1415
+ }
1416
+ },
1417
+ deprecated: false,
1418
+ isAvailable: true,
1419
+ lastUpdated: '2026-01-02',
1420
+ },
1421
+ 'ministral-3b-latest': {
1422
+ type: 'chat',
1423
+ provider: 'mistral',
1424
+ displayName: 'Ministral 3 3B',
1425
+ description: 'A tiny and efficient model offering best-in-class text and vision capabilities.',
1426
+ pricing: { input: 0.1, output: 0.1 },
1427
+ benchmarks: {
1428
+ intelligence: 12.7,
1429
+ coding: 6.9,
1430
+ math: 0.3,
1431
+ mmluPro: 0.44,
1432
+ gpqa: 0.32,
1433
+ },
1434
+ performance: {
1435
+ intelligenceScore: 12.7,
1436
+ },
1437
+ context: {
1438
+ input: {
1439
+ text: true,
1440
+ audio: false,
1441
+ image: true,
1442
+ video: false
1443
+ },
1444
+ output: {
1445
+ text: true,
1446
+ audio: false,
1447
+ image: false,
1448
+ video: false
1449
+ }
1450
+ },
1451
+ deprecated: false,
1452
+ isAvailable: true,
1453
+ lastUpdated: '2026-01-02',
1454
+ },
1455
+ 'ministral-8b-2512': {
1456
+ type: 'chat',
1457
+ provider: 'mistral',
1458
+ displayName: 'Ministral 3 8B',
1459
+ description: 'A powerful and efficient model offering best-in-class text and vision capabilities.',
1460
+ benchmarks: {
1461
+ intelligence: 28.2,
1462
+ coding: 18.4,
1463
+ math: 31.7,
1464
+ mmluPro: 0.64,
1465
+ gpqa: 0.47,
1466
+ },
1467
+ performance: {
1468
+ intelligenceScore: 28.2,
1469
+ },
1470
+ context: {
1471
+ input: {
1472
+ text: true,
1473
+ audio: false,
1474
+ image: true,
1475
+ video: false
1476
+ },
1477
+ output: {
1478
+ text: true,
1479
+ audio: false,
1480
+ image: false,
1481
+ video: false
1482
+ }
1483
+ },
1484
+ deprecated: false,
1485
+ isAvailable: true,
1486
+ lastUpdated: '2026-01-02',
1487
+ },
1488
+ 'ministral-8b-latest': {
1489
+ type: 'chat',
1490
+ provider: 'mistral',
1491
+ displayName: 'Ministral 3 8B',
1492
+ description: 'A powerful and efficient model offering best-in-class text and vision capabilities.',
1493
+ pricing: { input: 0.15, output: 0.15 },
1494
+ benchmarks: {
1495
+ intelligence: 7,
1496
+ mmluPro: 0.41,
1497
+ gpqa: 0.3,
1498
+ },
1499
+ performance: {
1500
+ intelligenceScore: 7,
1501
+ },
1502
+ context: {
1503
+ input: {
1504
+ text: true,
1505
+ audio: false,
1506
+ image: true,
1507
+ video: false
1508
+ },
1509
+ output: {
1510
+ text: true,
1511
+ audio: false,
1512
+ image: false,
1513
+ video: false
1514
+ }
1515
+ },
1516
+ deprecated: false,
1517
+ isAvailable: true,
1518
+ lastUpdated: '2026-01-02',
1519
+ },
1520
+ 'mistral-embed': {
1521
+ type: 'embedding',
1522
+ provider: 'mistral',
1523
+ displayName: 'Mistral Embed',
1524
+ description: 'Our state-of-the-art semantic for extracting representation of code extracts',
1525
+ pricing: { input: 0.1, output: 0 },
1526
+ context: {
1527
+ input: {
1528
+ text: true,
1529
+ audio: false,
1530
+ image: false,
1531
+ video: false
1532
+ },
1533
+ output: {
1534
+ text: false,
1535
+ audio: false,
1536
+ image: false,
1537
+ video: false
1538
+ }
1539
+ },
1540
+ deprecated: false,
1541
+ isAvailable: true,
1542
+ lastUpdated: '2026-01-02',
1543
+ },
1544
+ 'mistral-large-2512': {
1545
+ type: 'chat',
1546
+ provider: 'mistral',
1547
+ displayName: 'Mistral Large 3',
1548
+ description: 'A state-of-the-art, open-weight, general-purpose multimodal model.',
246
1549
  benchmarks: {
247
- intelligence: 8.3,
248
- coding: 10.7,
249
- mmluPro: 0.462,
250
- gpqa: 0.297,
1550
+ intelligence: 2.6,
1551
+ mmluPro: 0.39,
1552
+ gpqa: 0.29,
251
1553
  },
252
1554
  performance: {
253
- outputTokenPerSecond: 129.872,
254
- timeTofirstToken: 0.68,
255
- intelligenceScore: 8.3,
1555
+ intelligenceScore: 2.6,
256
1556
  },
257
- lastUpdated: '2025-12-24',
258
- },
259
- 'o3-mini': {
1557
+ context: {
1558
+ input: {
1559
+ text: true,
1560
+ audio: false,
1561
+ image: true,
1562
+ video: false
1563
+ },
1564
+ output: {
1565
+ text: true,
1566
+ audio: false,
1567
+ image: false,
1568
+ video: false
1569
+ }
1570
+ },
1571
+ deprecated: false,
1572
+ isAvailable: true,
1573
+ lastUpdated: '2026-01-02',
1574
+ },
1575
+ 'mistral-large-latest': {
260
1576
  type: 'chat',
261
- provider: 'openai',
262
- displayName: 'o3 mini',
263
- pricing: { input: 0.0011, output: 0.0044 },
1577
+ provider: 'mistral',
1578
+ displayName: 'Mistral Large',
1579
+ description: 'Top-tier large model for high-complexity tasks.',
1580
+ pricing: { input: 0.5, output: 1.5 },
1581
+ benchmarks: {
1582
+ intelligence: 11.9,
1583
+ mmluPro: 0.52,
1584
+ gpqa: 0.35,
1585
+ },
1586
+ performance: {
1587
+ intelligenceScore: 11.9,
1588
+ },
1589
+ context: {
1590
+ input: {
1591
+ text: true,
1592
+ audio: false,
1593
+ image: false,
1594
+ video: false
1595
+ },
1596
+ output: {
1597
+ text: true,
1598
+ audio: false,
1599
+ image: false,
1600
+ video: false
1601
+ }
1602
+ },
1603
+ deprecated: false,
1604
+ isAvailable: true,
1605
+ lastUpdated: '2026-01-02',
1606
+ },
1607
+ 'mistral-medium-2508': {
1608
+ type: 'chat',
1609
+ provider: 'mistral',
1610
+ displayName: 'Mistral Medium 3.1',
1611
+ description: 'Our frontier-class multimodal model released August 2025.',
264
1612
  benchmarks: {
265
- intelligence: 48.1,
266
- coding: 39.4,
267
- mmluPro: 0.791,
268
- gpqa: 0.748,
1613
+ intelligence: 33.6,
1614
+ coding: 25.6,
1615
+ math: 30.3,
1616
+ mmluPro: 0.76,
1617
+ gpqa: 0.58,
269
1618
  },
270
1619
  performance: {
271
- outputTokenPerSecond: 160.235,
272
- timeTofirstToken: 15.449,
273
- intelligenceScore: 48.1,
1620
+ intelligenceScore: 33.6,
274
1621
  },
275
- lastUpdated: '2025-12-24',
276
- },
277
- 'gpt-4o-audio-preview': {
1622
+ context: {
1623
+ input: {
1624
+ text: true,
1625
+ audio: false,
1626
+ image: true,
1627
+ video: false
1628
+ },
1629
+ output: {
1630
+ text: true,
1631
+ audio: false,
1632
+ image: false,
1633
+ video: false
1634
+ }
1635
+ },
1636
+ deprecated: false,
1637
+ isAvailable: true,
1638
+ lastUpdated: '2026-01-02',
1639
+ },
1640
+ 'mistral-medium-latest': {
278
1641
  type: 'chat',
279
- provider: 'openai',
280
- displayName: 'Chat GPT 4o audio preview',
281
- pricing: { input: 0.0025, output: 0.01 },
1642
+ provider: 'mistral',
1643
+ displayName: 'Mistral Medium 3.1',
1644
+ description: 'Our frontier-class multimodal model released August 2025.',
1645
+ pricing: { input: 0.4, output: 2 },
1646
+ benchmarks: {
1647
+ intelligence: 8.4,
1648
+ mmluPro: 0.49,
1649
+ gpqa: 0.35,
1650
+ },
1651
+ performance: {
1652
+ intelligenceScore: 8.4,
1653
+ },
1654
+ context: {
1655
+ input: {
1656
+ text: true,
1657
+ audio: false,
1658
+ image: true,
1659
+ video: false
1660
+ },
1661
+ output: {
1662
+ text: true,
1663
+ audio: false,
1664
+ image: false,
1665
+ video: false
1666
+ }
1667
+ },
1668
+ deprecated: false,
1669
+ isAvailable: true,
1670
+ lastUpdated: '2026-01-02',
1671
+ },
1672
+ 'mistral-small-2501': {
1673
+ type: 'chat',
1674
+ provider: 'mistral',
1675
+ displayName: 'Mistral Small',
1676
+ description: 'Efficient model for various tasks.',
1677
+ benchmarks: {
1678
+ intelligence: 8.5,
1679
+ mmluPro: 0.42,
1680
+ gpqa: 0.3,
1681
+ },
1682
+ performance: {
1683
+ intelligenceScore: 8.5,
1684
+ },
1685
+ context: {
1686
+ input: {
1687
+ text: true,
1688
+ audio: false,
1689
+ image: false,
1690
+ video: false
1691
+ },
1692
+ output: {
1693
+ text: true,
1694
+ audio: false,
1695
+ image: false,
1696
+ video: false
1697
+ }
1698
+ },
1699
+ deprecated: false,
1700
+ isAvailable: true,
1701
+ lastUpdated: '2026-01-02',
1702
+ },
1703
+ 'mistral-small-2506': {
1704
+ type: 'chat',
1705
+ provider: 'mistral',
1706
+ displayName: 'Mistral Small 3.2',
1707
+ description: 'An update to our previous small model, released June 2025.',
1708
+ benchmarks: {
1709
+ intelligence: 24.9,
1710
+ coding: 18.3,
1711
+ math: 3.7,
1712
+ mmluPro: 0.66,
1713
+ gpqa: 0.45,
1714
+ },
1715
+ performance: {
1716
+ intelligenceScore: 24.9,
1717
+ },
1718
+ context: {
1719
+ input: {
1720
+ text: true,
1721
+ audio: false,
1722
+ image: false,
1723
+ video: false
1724
+ },
1725
+ output: {
1726
+ text: true,
1727
+ audio: false,
1728
+ image: false,
1729
+ video: false
1730
+ }
1731
+ },
1732
+ deprecated: false,
1733
+ isAvailable: true,
1734
+ lastUpdated: '2026-01-02',
1735
+ },
1736
+ 'mistral-small-latest': {
1737
+ type: 'chat',
1738
+ provider: 'mistral',
1739
+ displayName: 'Mistral Small',
1740
+ description: 'An efficient model offering best-in-class text and vision capabilities',
1741
+ pricing: { input: 0.1, output: 0.3 },
1742
+ benchmarks: {
1743
+ intelligence: 24.9,
1744
+ coding: 18.3,
1745
+ math: 3.7,
1746
+ mmluPro: 0.66,
1747
+ gpqa: 0.45,
1748
+ },
1749
+ performance: {
1750
+ intelligenceScore: 24.9,
1751
+ },
1752
+ context: {
1753
+ input: {
1754
+ text: true,
1755
+ audio: false,
1756
+ image: true,
1757
+ video: false
1758
+ },
1759
+ output: {
1760
+ text: true,
1761
+ audio: false,
1762
+ image: false,
1763
+ video: false
1764
+ }
1765
+ },
1766
+ deprecated: false,
1767
+ isAvailable: true,
1768
+ lastUpdated: '2026-01-02',
1769
+ },
1770
+ 'mistral-tiny-2407': {
1771
+ type: 'chat',
1772
+ provider: 'mistral',
1773
+ displayName: 'Mistral Nemo 12B',
1774
+ description: 'Our best multilingual open source model released July 2024.',
1775
+ context: {
1776
+ input: {
1777
+ text: true,
1778
+ audio: false,
1779
+ image: false,
1780
+ video: false
1781
+ },
1782
+ output: {
1783
+ text: true,
1784
+ audio: false,
1785
+ image: false,
1786
+ video: false
1787
+ }
1788
+ },
1789
+ deprecated: false,
1790
+ isAvailable: true,
1791
+ lastUpdated: '2026-01-02',
1792
+ },
1793
+ 'mistral-tiny-latest': {
1794
+ type: 'chat',
1795
+ provider: 'mistral',
1796
+ displayName: 'Mistral Tiny',
1797
+ description: 'Compact model for efficient inference.',
1798
+ pricing: { input: 0.14, output: 0.42 },
1799
+ context: {
1800
+ input: {
1801
+ text: true,
1802
+ audio: false,
1803
+ image: false,
1804
+ video: false
1805
+ },
1806
+ output: {
1807
+ text: true,
1808
+ audio: false,
1809
+ image: false,
1810
+ video: false
1811
+ }
1812
+ },
1813
+ deprecated: false,
1814
+ isAvailable: true,
1815
+ lastUpdated: '2026-01-02',
1816
+ },
1817
+ 'open-mistral-7b': {
1818
+ type: 'chat',
1819
+ provider: 'mistral',
1820
+ displayName: 'Mistral 7B',
1821
+ description: 'Open source model for general purpose tasks.',
282
1822
  benchmarks: {
283
- intelligence: 27,
284
- coding: 24,
285
- math: 6,
286
- mmluPro: 0.748,
287
- gpqa: 0.543,
1823
+ intelligence: 1,
1824
+ mmluPro: 0.25,
1825
+ gpqa: 0.18,
288
1826
  },
289
1827
  performance: {
290
- outputTokenPerSecond: 235.657,
291
- timeTofirstToken: 0.323,
292
- intelligenceScore: 27,
1828
+ intelligenceScore: 1,
293
1829
  },
294
- lastUpdated: '2025-12-24',
295
- },
296
- 'gpt-4o-mini-audio-preview': {
1830
+ context: {
1831
+ input: {
1832
+ text: true,
1833
+ audio: false,
1834
+ image: false,
1835
+ video: false
1836
+ },
1837
+ output: {
1838
+ text: true,
1839
+ audio: false,
1840
+ image: false,
1841
+ video: false
1842
+ }
1843
+ },
1844
+ deprecated: false,
1845
+ isAvailable: true,
1846
+ lastUpdated: '2026-01-02',
1847
+ },
1848
+ 'open-mistral-nemo': {
297
1849
  type: 'chat',
298
- provider: 'openai',
299
- displayName: 'Chat GPT 4o mini audio preview',
300
- pricing: { input: 0.00015, output: 0.0006 },
1850
+ provider: 'mistral',
1851
+ displayName: 'Mistral Nemo 12B',
1852
+ description: 'Our best multilingual open source model released July 2024.',
1853
+ pricing: { input: 0.15, output: 0.15 },
301
1854
  benchmarks: {
302
- intelligence: 21.2,
303
- math: 14.7,
304
- mmluPro: 0.648,
305
- gpqa: 0.426,
1855
+ intelligence: 1,
1856
+ mmluPro: 0.25,
1857
+ gpqa: 0.18,
306
1858
  },
307
1859
  performance: {
308
- outputTokenPerSecond: 47.79,
309
- timeTofirstToken: 0.58,
310
- intelligenceScore: 21.2,
1860
+ intelligenceScore: 1,
311
1861
  },
312
- lastUpdated: '2025-12-24',
313
- },
314
- 'openai/gpt-audio': {
1862
+ context: {
1863
+ input: {
1864
+ text: true,
1865
+ audio: false,
1866
+ image: false,
1867
+ video: false
1868
+ },
1869
+ output: {
1870
+ text: true,
1871
+ audio: false,
1872
+ image: false,
1873
+ video: false
1874
+ }
1875
+ },
1876
+ deprecated: false,
1877
+ isAvailable: true,
1878
+ lastUpdated: '2026-01-02',
1879
+ },
1880
+ 'pixtral-12b-2409': {
1881
+ type: 'chat',
1882
+ provider: 'mistral',
1883
+ displayName: 'Pixtral 12B',
1884
+ description: 'Multimodal model with vision capabilities.',
1885
+ context: {
1886
+ input: {
1887
+ text: true,
1888
+ audio: false,
1889
+ image: true,
1890
+ video: false
1891
+ },
1892
+ output: {
1893
+ text: true,
1894
+ audio: false,
1895
+ image: false,
1896
+ video: false
1897
+ }
1898
+ },
1899
+ deprecated: false,
1900
+ isAvailable: true,
1901
+ lastUpdated: '2026-01-02',
1902
+ },
1903
+ 'pixtral-12b-latest': {
1904
+ type: 'chat',
1905
+ provider: 'mistral',
1906
+ displayName: 'Pixtral 12B',
1907
+ description: 'Multimodal model with vision capabilities.',
1908
+ pricing: { input: 0.15, output: 0.15 },
1909
+ context: {
1910
+ input: {
1911
+ text: true,
1912
+ audio: false,
1913
+ image: true,
1914
+ video: false
1915
+ },
1916
+ output: {
1917
+ text: true,
1918
+ audio: false,
1919
+ image: false,
1920
+ video: false
1921
+ }
1922
+ },
1923
+ deprecated: false,
1924
+ isAvailable: true,
1925
+ lastUpdated: '2026-01-02',
1926
+ },
1927
+ 'pixtral-large-2411': {
315
1928
  type: 'chat',
1929
+ provider: 'mistral',
1930
+ displayName: 'Pixtral Large',
1931
+ description: 'Our first frontier-class multimodal model released November 2024.',
1932
+ context: {
1933
+ input: {
1934
+ text: true,
1935
+ audio: false,
1936
+ image: true,
1937
+ video: false
1938
+ },
1939
+ output: {
1940
+ text: true,
1941
+ audio: false,
1942
+ image: false,
1943
+ video: false
1944
+ }
1945
+ },
1946
+ deprecated: false,
1947
+ isAvailable: true,
1948
+ lastUpdated: '2026-01-02',
1949
+ },
1950
+ 'pixtral-large-latest': {
1951
+ type: 'chat',
1952
+ provider: 'mistral',
1953
+ displayName: 'Pixtral Large',
1954
+ description: 'Our first frontier-class multimodal model released November 2024.',
1955
+ pricing: { input: 2, output: 6 },
1956
+ benchmarks: {
1957
+ intelligence: 25,
1958
+ math: 2.3,
1959
+ mmluPro: 0.7,
1960
+ gpqa: 0.51,
1961
+ },
1962
+ performance: {
1963
+ intelligenceScore: 25,
1964
+ },
1965
+ context: {
1966
+ input: {
1967
+ text: true,
1968
+ audio: false,
1969
+ image: true,
1970
+ video: false
1971
+ },
1972
+ output: {
1973
+ text: true,
1974
+ audio: false,
1975
+ image: false,
1976
+ video: false
1977
+ }
1978
+ },
1979
+ deprecated: false,
1980
+ isAvailable: true,
1981
+ lastUpdated: '2026-01-02',
1982
+ },
1983
+ 'voxtral-mini-2507': {
1984
+ type: 'chat',
1985
+ provider: 'mistral',
1986
+ displayName: 'Voxtral Mini',
1987
+ description: 'A mini version of our first audio input model.',
1988
+ context: {
1989
+ input: {
1990
+ text: true,
1991
+ audio: true,
1992
+ image: false,
1993
+ video: false
1994
+ },
1995
+ output: {
1996
+ text: true,
1997
+ audio: false,
1998
+ image: false,
1999
+ video: false
2000
+ }
2001
+ },
2002
+ deprecated: false,
2003
+ isAvailable: true,
2004
+ lastUpdated: '2026-01-02',
2005
+ },
2006
+ 'voxtral-mini-latest': {
2007
+ type: 'chat',
2008
+ provider: 'mistral',
2009
+ displayName: 'Voxtral Mini',
2010
+ description: 'A mini version of our first audio input model',
2011
+ pricing: { input: 0.04, output: 0.04 },
2012
+ context: {
2013
+ input: {
2014
+ text: true,
2015
+ audio: true,
2016
+ image: false,
2017
+ video: false
2018
+ },
2019
+ output: {
2020
+ text: true,
2021
+ audio: false,
2022
+ image: false,
2023
+ video: false
2024
+ }
2025
+ },
2026
+ deprecated: false,
2027
+ isAvailable: true,
2028
+ lastUpdated: '2026-01-02',
2029
+ },
2030
+ 'voxtral-small-2507': {
2031
+ type: 'chat',
2032
+ provider: 'mistral',
2033
+ displayName: 'Voxtral Small',
2034
+ description: 'Our first model with audio input capabilities for instruct use cases.',
2035
+ context: {
2036
+ input: {
2037
+ text: true,
2038
+ audio: true,
2039
+ image: false,
2040
+ video: false
2041
+ },
2042
+ output: {
2043
+ text: true,
2044
+ audio: false,
2045
+ image: false,
2046
+ video: false
2047
+ }
2048
+ },
2049
+ deprecated: false,
2050
+ isAvailable: true,
2051
+ lastUpdated: '2026-01-02',
2052
+ },
2053
+ 'voxtral-small-latest': {
2054
+ type: 'chat',
2055
+ provider: 'mistral',
2056
+ displayName: 'Voxtral Small',
2057
+ description: 'Our first model with audio input capabilities for instruct use cases',
2058
+ pricing: { input: 0.1, output: 0.3 },
2059
+ context: {
2060
+ input: {
2061
+ text: true,
2062
+ audio: true,
2063
+ image: false,
2064
+ video: false
2065
+ },
2066
+ output: {
2067
+ text: true,
2068
+ audio: false,
2069
+ image: false,
2070
+ video: false
2071
+ }
2072
+ },
2073
+ deprecated: false,
2074
+ isAvailable: true,
2075
+ lastUpdated: '2026-01-02',
2076
+ },
2077
+ 'dall-e-2': {
2078
+ type: 'image',
316
2079
  provider: 'openai',
317
- displayName: 'Chat GPT audio',
318
- pricing: { input: 0.0025, output: 0.01 },
319
- benchmarks: {
320
- intelligence: 27,
321
- coding: 24,
322
- math: 6,
323
- mmluPro: 0.748,
324
- gpqa: 0.543,
325
- },
326
- performance: {
327
- outputTokenPerSecond: 235.657,
328
- timeTofirstToken: 0.323,
329
- intelligenceScore: 27,
330
- },
331
- lastUpdated: '2025-12-24',
2080
+ displayName: 'DALL·E 2',
2081
+ description: 'Our first image generation model',
2082
+ pricing: { input: 0, output: 0 },
2083
+ context: {
2084
+ input: {
2085
+ text: true,
2086
+ audio: false,
2087
+ image: false,
2088
+ video: false
2089
+ },
2090
+ output: {
2091
+ text: false,
2092
+ audio: false,
2093
+ image: true,
2094
+ video: false
2095
+ }
2096
+ },
2097
+ deprecated: false,
2098
+ isAvailable: true,
2099
+ lastUpdated: '2026-01-02',
332
2100
  },
333
- 'openai/gpt-audio-mini': {
334
- type: 'chat',
2101
+ 'dall-e-3': {
2102
+ type: 'image',
335
2103
  provider: 'openai',
336
- displayName: 'Chat GPT mini audio',
337
- pricing: { input: 0.00015, output: 0.0006 },
338
- benchmarks: {
339
- intelligence: 21.2,
340
- math: 14.7,
341
- mmluPro: 0.648,
342
- gpqa: 0.426,
343
- },
344
- performance: {
345
- outputTokenPerSecond: 47.79,
346
- timeTofirstToken: 0.58,
347
- intelligenceScore: 21.2,
348
- },
349
- lastUpdated: '2025-12-24',
2104
+ displayName: 'DALL·E 3',
2105
+ description: 'Previous generation image generation model',
2106
+ pricing: { input: 0, output: 0 },
2107
+ context: {
2108
+ input: {
2109
+ text: true,
2110
+ audio: false,
2111
+ image: false,
2112
+ video: false
2113
+ },
2114
+ output: {
2115
+ text: false,
2116
+ audio: false,
2117
+ image: true,
2118
+ video: false
2119
+ }
2120
+ },
2121
+ deprecated: false,
2122
+ isAvailable: true,
2123
+ lastUpdated: '2026-01-02',
350
2124
  },
351
- 'gpt-4o-search-preview': {
2125
+ 'gpt-3.5-turbo': {
352
2126
  type: 'chat',
353
2127
  provider: 'openai',
354
- displayName: 'Chat GPT 4o search preview',
355
- pricing: { input: 0.0025, output: 0.01 },
356
- benchmarks: {
357
- intelligence: 27,
358
- coding: 24,
359
- math: 6,
360
- mmluPro: 0.748,
361
- gpqa: 0.543,
362
- },
363
- performance: {
364
- outputTokenPerSecond: 235.657,
365
- timeTofirstToken: 0.323,
366
- intelligenceScore: 27,
367
- },
368
- lastUpdated: '2025-12-24',
2128
+ displayName: 'GPT-3.5 Turbo',
2129
+ description: 'Legacy GPT model for cheaper chat and non-chat tasks',
2130
+ pricing: { input: 0.5, output: 1.5 },
2131
+ contextLength: 16385,
2132
+ context: {
2133
+ input: {
2134
+ text: true,
2135
+ audio: false,
2136
+ image: false,
2137
+ video: false
2138
+ },
2139
+ output: {
2140
+ text: true,
2141
+ audio: false,
2142
+ image: false,
2143
+ video: false
2144
+ }
2145
+ },
2146
+ deprecated: false,
2147
+ isAvailable: true,
2148
+ lastUpdated: '2026-01-02',
369
2149
  },
370
- 'gpt-4o-mini-search-preview': {
2150
+ 'gpt-4-turbo': {
371
2151
  type: 'chat',
372
2152
  provider: 'openai',
373
- displayName: 'Chat GPT 4o mini search preview',
374
- pricing: { input: 0.00015, output: 0.0006 },
2153
+ displayName: 'GPT-4 Turbo',
2154
+ description: 'An older high-intelligence GPT model',
2155
+ pricing: { input: 10, output: 30 },
375
2156
  benchmarks: {
376
- intelligence: 21.2,
377
- math: 14.7,
378
- mmluPro: 0.648,
379
- gpqa: 0.426,
2157
+ intelligence: 21.5,
2158
+ coding: 13.1,
380
2159
  },
381
2160
  performance: {
382
- outputTokenPerSecond: 47.79,
383
- timeTofirstToken: 0.58,
384
- intelligenceScore: 21.2,
2161
+ intelligenceScore: 21.5,
385
2162
  },
386
- lastUpdated: '2025-12-24',
387
- },
388
- 'openai/gpt-4.1-2025-04-14': {
2163
+ contextLength: 128000,
2164
+ context: {
2165
+ input: {
2166
+ text: true,
2167
+ audio: false,
2168
+ image: true,
2169
+ video: false
2170
+ },
2171
+ output: {
2172
+ text: true,
2173
+ audio: false,
2174
+ image: false,
2175
+ video: false
2176
+ }
2177
+ },
2178
+ deprecated: false,
2179
+ isAvailable: true,
2180
+ lastUpdated: '2026-01-02',
2181
+ },
2182
+ 'gpt-4.1': {
389
2183
  type: 'chat',
390
2184
  provider: 'openai',
391
- displayName: 'Chat GPT 4.1',
392
- pricing: { input: 0.002, output: 0.008 },
2185
+ displayName: 'GPT-4.1',
2186
+ description: 'Smartest non-reasoning model',
2187
+ pricing: { input: 2, output: 8 },
393
2188
  benchmarks: {
394
2189
  intelligence: 43.4,
395
2190
  coding: 32.2,
396
2191
  math: 34.7,
397
- mmluPro: 0.806,
398
- gpqa: 0.666,
2192
+ mmluPro: 0.81,
2193
+ gpqa: 0.67,
399
2194
  },
400
2195
  performance: {
401
- outputTokenPerSecond: 109.93,
402
- timeTofirstToken: 0.694,
403
2196
  intelligenceScore: 43.4,
404
2197
  },
405
- lastUpdated: '2025-12-24',
406
- },
407
- 'openai/gpt-4.1-mini-2025-04-14': {
2198
+ contextLength: 128000,
2199
+ context: {
2200
+ input: {
2201
+ text: true,
2202
+ audio: false,
2203
+ image: true,
2204
+ video: false
2205
+ },
2206
+ output: {
2207
+ text: true,
2208
+ audio: false,
2209
+ image: false,
2210
+ video: false
2211
+ }
2212
+ },
2213
+ deprecated: false,
2214
+ isAvailable: true,
2215
+ lastUpdated: '2026-01-02',
2216
+ },
2217
+ 'gpt-4.1-mini': {
408
2218
  type: 'chat',
409
2219
  provider: 'openai',
410
- displayName: 'Chat GPT 4.1 mini',
411
- pricing: { input: 0.0004, output: 0.0016 },
2220
+ displayName: 'GPT-4.1 mini',
2221
+ description: 'Smaller, faster version of GPT-4.1',
2222
+ pricing: { input: 0.4, output: 1.6 },
412
2223
  benchmarks: {
413
2224
  intelligence: 42.5,
414
2225
  coding: 31.9,
415
2226
  math: 46.3,
416
- mmluPro: 0.781,
417
- gpqa: 0.664,
2227
+ mmluPro: 0.78,
2228
+ gpqa: 0.66,
418
2229
  },
419
2230
  performance: {
420
- outputTokenPerSecond: 80.606,
421
- timeTofirstToken: 0.505,
422
2231
  intelligenceScore: 42.5,
423
2232
  },
424
- lastUpdated: '2025-12-24',
425
- },
426
- 'openai/gpt-4.1-nano-2025-04-14': {
2233
+ contextLength: 128000,
2234
+ context: {
2235
+ input: {
2236
+ text: true,
2237
+ audio: false,
2238
+ image: true,
2239
+ video: false
2240
+ },
2241
+ output: {
2242
+ text: true,
2243
+ audio: false,
2244
+ image: false,
2245
+ video: false
2246
+ }
2247
+ },
2248
+ deprecated: false,
2249
+ isAvailable: true,
2250
+ lastUpdated: '2026-01-02',
2251
+ },
2252
+ 'gpt-4.1-nano-2025-04-14': {
427
2253
  type: 'chat',
428
2254
  provider: 'openai',
429
- displayName: 'Chat GPT 4.1 nano',
430
- pricing: { input: 0.0001, output: 0.0004 },
2255
+ displayName: 'GPT-4.1 nano',
2256
+ description: 'Fastest, most cost-efficient version of GPT-4.1',
2257
+ pricing: { input: 0.1, output: 0.4 },
431
2258
  benchmarks: {
432
2259
  intelligence: 27.3,
433
2260
  coding: 20.7,
434
2261
  math: 24,
435
- mmluPro: 0.657,
436
- gpqa: 0.512,
2262
+ mmluPro: 0.66,
2263
+ gpqa: 0.51,
437
2264
  },
438
2265
  performance: {
439
- outputTokenPerSecond: 171.016,
440
- timeTofirstToken: 0.446,
441
2266
  intelligenceScore: 27.3,
442
2267
  },
443
- lastUpdated: '2025-12-24',
2268
+ contextLength: 128000,
2269
+ context: {
2270
+ input: {
2271
+ text: true,
2272
+ audio: false,
2273
+ image: true,
2274
+ video: false
2275
+ },
2276
+ output: {
2277
+ text: true,
2278
+ audio: false,
2279
+ image: false,
2280
+ video: false
2281
+ }
2282
+ },
2283
+ deprecated: false,
2284
+ isAvailable: true,
2285
+ lastUpdated: '2026-01-02',
2286
+ },
2287
+ 'gpt-4o': {
2288
+ type: 'chat',
2289
+ provider: 'openai',
2290
+ displayName: 'GPT-4o',
2291
+ description: 'Fast, intelligent, flexible GPT model',
2292
+ pricing: { input: 2.5, output: 10 },
2293
+ benchmarks: {
2294
+ intelligence: 26,
2295
+ coding: 20.1,
2296
+ math: 15.3,
2297
+ mmluPro: 0.75,
2298
+ gpqa: 0.57,
2299
+ },
2300
+ performance: {
2301
+ intelligenceScore: 26,
2302
+ },
2303
+ contextLength: 128000,
2304
+ context: {
2305
+ input: {
2306
+ text: true,
2307
+ audio: false,
2308
+ image: true,
2309
+ video: false
2310
+ },
2311
+ output: {
2312
+ text: true,
2313
+ audio: false,
2314
+ image: false,
2315
+ video: false
2316
+ }
2317
+ },
2318
+ deprecated: false,
2319
+ isAvailable: true,
2320
+ lastUpdated: '2026-01-02',
2321
+ },
2322
+ 'gpt-4o-audio-preview': {
2323
+ type: 'audio',
2324
+ provider: 'openai',
2325
+ displayName: 'GPT-4o Audio',
2326
+ description: 'GPT-4o models capable of audio inputs and outputs',
2327
+ pricing: { input: 2.5, output: 10 },
2328
+ contextLength: 128000,
2329
+ context: {
2330
+ input: {
2331
+ text: true,
2332
+ audio: true,
2333
+ image: false,
2334
+ video: false
2335
+ },
2336
+ output: {
2337
+ text: true,
2338
+ audio: true,
2339
+ image: false,
2340
+ video: false
2341
+ }
2342
+ },
2343
+ deprecated: false,
2344
+ isAvailable: true,
2345
+ lastUpdated: '2026-01-02',
444
2346
  },
445
- 'openai/o4-mini-2025-04-16': {
2347
+ 'gpt-4o-mini': {
446
2348
  type: 'chat',
447
2349
  provider: 'openai',
448
- displayName: 'o4-mini',
449
- pricing: { input: 0.0011, output: 0.0044 },
2350
+ displayName: 'GPT-4o mini',
2351
+ description: 'Fast, affordable small model for focused tasks',
2352
+ pricing: { input: 0.15, output: 0.6 },
450
2353
  benchmarks: {
451
- intelligence: 59.6,
452
- coding: 48.9,
453
- math: 90.7,
454
- mmluPro: 0.832,
455
- gpqa: 0.784,
2354
+ intelligence: 18.9,
456
2355
  },
457
2356
  performance: {
458
- outputTokenPerSecond: 169.795,
459
- timeTofirstToken: 33.795,
460
- intelligenceScore: 59.6,
2357
+ intelligenceScore: 18.9,
2358
+ },
2359
+ contextLength: 128000,
2360
+ context: {
2361
+ input: {
2362
+ text: true,
2363
+ audio: false,
2364
+ image: true,
2365
+ video: false
2366
+ },
2367
+ output: {
2368
+ text: true,
2369
+ audio: false,
2370
+ image: false,
2371
+ video: false
2372
+ }
461
2373
  },
462
- lastUpdated: '2025-12-24',
2374
+ deprecated: false,
2375
+ isAvailable: true,
2376
+ lastUpdated: '2026-01-02',
463
2377
  },
464
- 'openai/o3-2025-04-16': {
2378
+ 'gpt-4o-mini-search-preview': {
465
2379
  type: 'chat',
466
2380
  provider: 'openai',
467
- displayName: 'o3',
468
- pricing: { input: 0.002, output: 0.008 },
469
- benchmarks: {
470
- intelligence: 65.5,
471
- coding: 52.2,
472
- math: 88.3,
473
- mmluPro: 0.853,
474
- gpqa: 0.827,
475
- },
476
- performance: {
477
- outputTokenPerSecond: 359.632,
478
- timeTofirstToken: 8.936,
479
- intelligenceScore: 65.5,
480
- },
481
- lastUpdated: '2025-12-24',
482
- },
483
- 'o1': {
484
- type: 'chat',
2381
+ displayName: 'GPT-4o mini Search Preview',
2382
+ description: 'Fast, affordable small model for web search',
2383
+ pricing: { input: 0.15, output: 0.6 },
2384
+ contextLength: 128000,
2385
+ context: {
2386
+ input: {
2387
+ text: true,
2388
+ audio: false,
2389
+ image: false,
2390
+ video: false
2391
+ },
2392
+ output: {
2393
+ text: true,
2394
+ audio: false,
2395
+ image: false,
2396
+ video: false
2397
+ }
2398
+ },
2399
+ deprecated: false,
2400
+ isAvailable: true,
2401
+ lastUpdated: '2026-01-02',
2402
+ },
2403
+ 'gpt-4o-mini-transcribe': {
2404
+ type: 'audio',
485
2405
  provider: 'openai',
486
- displayName: 'o1',
487
- pricing: { input: 0.015, output: 0.06 },
488
- benchmarks: {
489
- intelligence: 47.2,
490
- coding: 38.6,
491
- mmluPro: 0.841,
492
- gpqa: 0.747,
493
- },
494
- performance: {
495
- outputTokenPerSecond: 200.717,
496
- timeTofirstToken: 15.318,
497
- intelligenceScore: 47.2,
498
- },
499
- lastUpdated: '2025-12-24',
500
- },
501
- 'openai/gpt-5-2025-08-07': {
502
- type: 'chat',
2406
+ displayName: 'GPT-4o mini Transcribe',
2407
+ description: 'Speech-to-text model powered by GPT-4o mini',
2408
+ pricing: { input: 1.25, output: 5 },
2409
+ context: {
2410
+ input: {
2411
+ text: false,
2412
+ audio: true,
2413
+ image: false,
2414
+ video: false
2415
+ },
2416
+ output: {
2417
+ text: true,
2418
+ audio: false,
2419
+ image: false,
2420
+ video: false
2421
+ }
2422
+ },
2423
+ deprecated: false,
2424
+ isAvailable: true,
2425
+ lastUpdated: '2026-01-02',
2426
+ },
2427
+ 'gpt-4o-mini-transcribe-2025-12-15': {
2428
+ type: 'audio',
503
2429
  provider: 'openai',
504
- displayName: 'GPT-5',
505
- pricing: { input: 0.00125, output: 0.01 },
506
- benchmarks: {
507
- intelligence: 68.5,
508
- coding: 52.7,
509
- math: 94.3,
510
- mmluPro: 0.871,
511
- gpqa: 0.854,
512
- },
513
- performance: {
514
- outputTokenPerSecond: 147.254,
515
- timeTofirstToken: 80.387,
516
- intelligenceScore: 68.5,
517
- },
518
- lastUpdated: '2025-12-24',
519
- },
520
- 'openai/gpt-5-mini-2025-08-07': {
521
- type: 'chat',
2430
+ displayName: 'GPT-4o mini Transcribe',
2431
+ description: 'Speech-to-text model powered by GPT-4o mini',
2432
+ pricing: { input: 1.25, output: 5 },
2433
+ context: {
2434
+ input: {
2435
+ text: false,
2436
+ audio: true,
2437
+ image: false,
2438
+ video: false
2439
+ },
2440
+ output: {
2441
+ text: true,
2442
+ audio: false,
2443
+ image: false,
2444
+ video: false
2445
+ }
2446
+ },
2447
+ deprecated: false,
2448
+ isAvailable: true,
2449
+ lastUpdated: '2026-01-02',
2450
+ },
2451
+ 'gpt-4o-mini-tts': {
2452
+ type: 'tts',
522
2453
  provider: 'openai',
523
- displayName: 'GPT-5 mini',
524
- pricing: { input: 0.00025, output: 0.002 },
525
- benchmarks: {
526
- intelligence: 64.3,
527
- coding: 51.4,
528
- math: 90.7,
529
- mmluPro: 0.837,
530
- gpqa: 0.828,
531
- },
532
- performance: {
533
- outputTokenPerSecond: 86.714,
534
- timeTofirstToken: 92.447,
535
- intelligenceScore: 64.3,
536
- },
537
- lastUpdated: '2025-12-24',
538
- },
539
- 'openai/gpt-5-nano-2025-08-07': {
540
- type: 'chat',
2454
+ displayName: 'GPT-4o mini TTS',
2455
+ description: 'Text-to-speech model powered by GPT-4o mini',
2456
+ pricing: { input: 0.6, output: 0 },
2457
+ context: {
2458
+ input: {
2459
+ text: true,
2460
+ audio: false,
2461
+ image: false,
2462
+ video: false
2463
+ },
2464
+ output: {
2465
+ text: false,
2466
+ audio: true,
2467
+ image: false,
2468
+ video: false
2469
+ }
2470
+ },
2471
+ deprecated: false,
2472
+ isAvailable: true,
2473
+ lastUpdated: '2026-01-02',
2474
+ },
2475
+ 'gpt-4o-realtime-preview-2025-06-03': {
2476
+ type: 'audio',
541
2477
  provider: 'openai',
542
- displayName: 'GPT-5 nano',
543
- pricing: { input: 0.00005, output: 0.0004 },
544
- benchmarks: {
545
- intelligence: 51,
546
- coding: 42.3,
547
- math: 83.7,
548
- mmluPro: 0.78,
549
- gpqa: 0.676,
550
- },
551
- performance: {
552
- outputTokenPerSecond: 157.197,
553
- timeTofirstToken: 102.322,
554
- intelligenceScore: 51,
555
- },
556
- lastUpdated: '2025-12-24',
2478
+ displayName: 'GPT-4o Realtime',
2479
+ description: 'Model capable of realtime text and audio inputs and outputs',
2480
+ pricing: { input: 5, output: 20 },
2481
+ contextLength: 128000,
2482
+ context: {
2483
+ input: {
2484
+ text: true,
2485
+ audio: true,
2486
+ image: false,
2487
+ video: false
2488
+ },
2489
+ output: {
2490
+ text: true,
2491
+ audio: true,
2492
+ image: false,
2493
+ video: false
2494
+ }
2495
+ },
2496
+ deprecated: false,
2497
+ isAvailable: true,
2498
+ lastUpdated: '2026-01-02',
557
2499
  },
558
- 'openai/gpt-5-chat-latest': {
2500
+ 'gpt-4o-search-preview': {
559
2501
  type: 'chat',
560
2502
  provider: 'openai',
561
- displayName: 'GPT-5 Chat',
562
- pricing: { input: 0.00125, output: 0.01 },
563
- benchmarks: {
564
- intelligence: 41.8,
565
- coding: 34.7,
566
- math: 48.3,
567
- mmluPro: 0.82,
568
- gpqa: 0.686,
569
- },
570
- performance: {
571
- outputTokenPerSecond: 192.431,
572
- timeTofirstToken: 0.677,
573
- intelligenceScore: 41.8,
574
- },
575
- lastUpdated: '2025-12-24',
576
- },
577
- 'openai/gpt-5-1': {
578
- type: 'chat',
2503
+ displayName: 'GPT-4o Search Preview',
2504
+ description: 'GPT model for web search in Chat Completions',
2505
+ pricing: { input: 2.5, output: 10 },
2506
+ context: {
2507
+ input: {
2508
+ text: true,
2509
+ audio: false,
2510
+ image: false,
2511
+ video: false
2512
+ },
2513
+ output: {
2514
+ text: true,
2515
+ audio: false,
2516
+ image: false,
2517
+ video: false
2518
+ }
2519
+ },
2520
+ deprecated: false,
2521
+ isAvailable: true,
2522
+ lastUpdated: '2026-01-02',
2523
+ },
2524
+ 'gpt-4o-transcribe': {
2525
+ type: 'audio',
579
2526
  provider: 'openai',
580
- displayName: 'GPT-5.1',
581
- pricing: { input: 0.00125, output: 0.01 },
582
- benchmarks: {
583
- intelligence: 69.7,
584
- coding: 57.5,
585
- math: 94,
586
- mmluPro: 0.87,
587
- gpqa: 0.873,
588
- },
589
- performance: {
590
- outputTokenPerSecond: 195.488,
591
- timeTofirstToken: 25.787,
592
- intelligenceScore: 69.7,
593
- },
594
- lastUpdated: '2025-12-24',
595
- },
596
- 'openai/gpt-5-1-chat-latest': {
597
- type: 'chat',
2527
+ displayName: 'GPT-4o Transcribe',
2528
+ description: 'Speech-to-text model powered by GPT-4o',
2529
+ pricing: { input: 2.5, output: 10 },
2530
+ context: {
2531
+ input: {
2532
+ text: false,
2533
+ audio: true,
2534
+ image: false,
2535
+ video: false
2536
+ },
2537
+ output: {
2538
+ text: true,
2539
+ audio: false,
2540
+ image: false,
2541
+ video: false
2542
+ }
2543
+ },
2544
+ deprecated: false,
2545
+ isAvailable: true,
2546
+ lastUpdated: '2026-01-02',
2547
+ },
2548
+ 'gpt-4o-transcribe-diarize': {
2549
+ type: 'audio',
598
2550
  provider: 'openai',
599
- displayName: 'GPT-5.1 Chat Latest',
600
- pricing: { input: 0.00125, output: 0.01 },
601
- benchmarks: {
602
- intelligence: 68.5,
603
- coding: 52.7,
604
- math: 94.3,
605
- mmluPro: 0.871,
606
- gpqa: 0.854,
607
- },
608
- performance: {
609
- outputTokenPerSecond: 147.254,
610
- timeTofirstToken: 80.387,
611
- intelligenceScore: 68.5,
612
- },
613
- lastUpdated: '2025-12-24',
614
- },
615
- 'openai/gpt-5-2': {
2551
+ displayName: 'GPT-4o Transcribe Diarize',
2552
+ description: 'Transcription model that identifies who\'s speaking when',
2553
+ pricing: { input: 2.5, output: 10 },
2554
+ context: {
2555
+ input: {
2556
+ text: false,
2557
+ audio: true,
2558
+ image: false,
2559
+ video: false
2560
+ },
2561
+ output: {
2562
+ text: true,
2563
+ audio: false,
2564
+ image: false,
2565
+ video: false
2566
+ }
2567
+ },
2568
+ deprecated: false,
2569
+ isAvailable: true,
2570
+ lastUpdated: '2026-01-02',
2571
+ },
2572
+ 'gpt-5-mini-2025-08-07': {
616
2573
  type: 'chat',
617
2574
  provider: 'openai',
618
- displayName: 'GPT-5.2',
619
- pricing: { input: 0.00175, output: 0.014 },
2575
+ displayName: 'GPT-5 mini',
2576
+ description: 'A faster, cost-efficient version of GPT-5 for well-defined tasks',
2577
+ pricing: { input: 0.25, output: 2 },
620
2578
  benchmarks: {
621
- intelligence: 72.6,
622
- coding: 61.8,
623
- math: 98.7,
624
- mmluPro: 0.874,
625
- gpqa: 0.903,
626
- },
627
- performance: {
628
- outputTokenPerSecond: 112.643,
629
- timeTofirstToken: 45.724,
630
- intelligenceScore: 72.6,
631
- },
632
- lastUpdated: '2025-12-24',
633
- },
634
- 'openai/gpt-5-2-chat-latest': {
2579
+ intelligence: 66.4,
2580
+ coding: 49.2,
2581
+ math: 91.7,
2582
+ mmluPro: 0.87,
2583
+ gpqa: 0.84,
2584
+ },
2585
+ performance: {
2586
+ intelligenceScore: 66.4,
2587
+ },
2588
+ contextLength: 128000,
2589
+ context: {
2590
+ input: {
2591
+ text: true,
2592
+ audio: false,
2593
+ image: true,
2594
+ video: false
2595
+ },
2596
+ output: {
2597
+ text: true,
2598
+ audio: false,
2599
+ image: false,
2600
+ video: false
2601
+ }
2602
+ },
2603
+ deprecated: false,
2604
+ isAvailable: true,
2605
+ lastUpdated: '2026-01-02',
2606
+ },
2607
+ 'gpt-5-nano-2025-08-07': {
635
2608
  type: 'chat',
636
2609
  provider: 'openai',
637
- displayName: 'GPT-5.2 Chat Latest',
638
- pricing: { input: 0.00125, output: 0.01 },
639
- benchmarks: {
640
- intelligence: 68.5,
641
- coding: 52.7,
642
- math: 94.3,
643
- mmluPro: 0.871,
644
- gpqa: 0.854,
645
- },
646
- performance: {
647
- outputTokenPerSecond: 147.254,
648
- timeTofirstToken: 80.387,
649
- intelligenceScore: 68.5,
650
- },
651
- lastUpdated: '2025-12-24',
652
- },
653
- 'openai/o3-pro': {
654
- type: 'responses',
655
- provider: 'openai',
656
- displayName: 'o3-pro',
657
- pricing: { input: 0.02, output: 0.08 },
658
- benchmarks: {
659
- intelligence: 65.3,
660
- gpqa: 0.845,
661
- },
662
- performance: {
663
- outputTokenPerSecond: 53.281,
664
- timeTofirstToken: 58.458,
665
- intelligenceScore: 65.3,
666
- },
667
- lastUpdated: '2025-12-24',
668
- },
669
- 'openai/gpt-5-pro': {
670
- type: 'responses',
2610
+ displayName: 'GPT-5 nano',
2611
+ description: 'Fastest, most cost-efficient version of GPT-5',
2612
+ pricing: { input: 0.05, output: 0.4 },
2613
+ benchmarks: {
2614
+ intelligence: 29.1,
2615
+ coding: 27.5,
2616
+ math: 27.3,
2617
+ mmluPro: 0.56,
2618
+ gpqa: 0.43,
2619
+ },
2620
+ performance: {
2621
+ intelligenceScore: 29.1,
2622
+ },
2623
+ contextLength: 128000,
2624
+ context: {
2625
+ input: {
2626
+ text: true,
2627
+ audio: false,
2628
+ image: true,
2629
+ video: false
2630
+ },
2631
+ output: {
2632
+ text: true,
2633
+ audio: false,
2634
+ image: false,
2635
+ video: false
2636
+ }
2637
+ },
2638
+ deprecated: false,
2639
+ isAvailable: true,
2640
+ lastUpdated: '2026-01-02',
2641
+ },
2642
+ 'gpt-5-search-api-2025-10-14': {
2643
+ type: 'chat',
671
2644
  provider: 'openai',
672
- displayName: 'GPT 5 Pro',
673
- pricing: { input: 0.00125, output: 0.01 },
2645
+ displayName: 'GPT-5 Search API',
2646
+ description: 'GPT-5 model optimized for web search capabilities',
2647
+ pricing: { input: 1.25, output: 10 },
674
2648
  benchmarks: {
675
2649
  intelligence: 68.5,
676
- coding: 52.7,
677
- math: 94.3,
678
- mmluPro: 0.871,
679
- gpqa: 0.854,
680
- },
681
- performance: {
682
- outputTokenPerSecond: 147.254,
683
- timeTofirstToken: 80.387,
684
- intelligenceScore: 68.5,
685
- },
686
- lastUpdated: '2025-12-24',
687
- },
688
- 'openai/gpt-5-1-codex': {
689
- type: 'responses',
690
- provider: 'openai',
691
- displayName: 'GPT-5.1 Codex',
692
- pricing: { input: 0.00125, output: 0.01 },
693
- benchmarks: {
694
- intelligence: 66.9,
695
- coding: 52.5,
696
- math: 95.7,
697
- mmluPro: 0.86,
698
- gpqa: 0.86,
699
- },
700
- performance: {
701
- outputTokenPerSecond: 264.603,
702
- timeTofirstToken: 12.24,
703
- intelligenceScore: 66.9,
704
- },
705
- lastUpdated: '2025-12-24',
706
- },
707
- 'openai/gpt-5-1-codex-mini': {
708
- type: 'responses',
709
- provider: 'openai',
710
- displayName: 'GPT-5.1 Codex Mini',
711
- pricing: { input: 0.00025, output: 0.002 },
712
- benchmarks: {
713
- intelligence: 62.3,
714
- coding: 52.5,
715
- math: 91.7,
716
- mmluPro: 0.82,
717
- gpqa: 0.813,
718
- },
719
- performance: {
720
- outputTokenPerSecond: 146.418,
721
- timeTofirstToken: 15.16,
722
- intelligenceScore: 62.3,
723
- },
724
- lastUpdated: '2025-12-24',
725
- },
726
- 'openai/gpt-5-2-pro': {
727
- type: 'responses',
728
- provider: 'openai',
729
- displayName: 'GPT-5.2 Pro',
730
- pricing: { input: 0.00175, output: 0.014 },
731
- benchmarks: {
732
- intelligence: 72.6,
733
- coding: 61.8,
2650
+ coding: 53.5,
734
2651
  math: 98.7,
735
- mmluPro: 0.874,
736
- gpqa: 0.903,
2652
+ mmluPro: 0.87,
2653
+ gpqa: 0.84,
737
2654
  },
738
2655
  performance: {
739
- outputTokenPerSecond: 112.643,
740
- timeTofirstToken: 45.724,
741
- intelligenceScore: 72.6,
2656
+ intelligenceScore: 68.5,
742
2657
  },
743
- lastUpdated: '2025-12-24',
744
- },
745
- 'openai/gpt-oss-120b': {
2658
+ contextLength: 128000,
2659
+ context: {
2660
+ input: {
2661
+ text: true,
2662
+ audio: false,
2663
+ image: true,
2664
+ video: false
2665
+ },
2666
+ output: {
2667
+ text: true,
2668
+ audio: false,
2669
+ image: false,
2670
+ video: false
2671
+ }
2672
+ },
2673
+ deprecated: false,
2674
+ isAvailable: true,
2675
+ lastUpdated: '2026-01-02',
2676
+ },
2677
+ 'gpt-5.1-2025-11-13': {
746
2678
  type: 'chat',
747
2679
  provider: 'openai',
748
- displayName: 'GPT OSS 120B',
749
- pricing: { input: 0.00015, output: 0.0006 },
750
- benchmarks: {
751
- intelligence: 60.5,
752
- coding: 49.6,
753
- math: 93.4,
754
- mmluPro: 0.808,
755
- gpqa: 0.782,
756
- },
757
- performance: {
758
- outputTokenPerSecond: 374.199,
759
- timeTofirstToken: 0.534,
760
- intelligenceScore: 60.5,
761
- },
762
- lastUpdated: '2025-12-24',
763
- },
764
- 'openai/gpt-oss-20b': {
765
- type: 'chat',
2680
+ displayName: 'GPT-5.1',
2681
+ description: 'The best model for coding and agentic tasks with configurable reasoning effort',
2682
+ pricing: { input: 1.25, output: 10 },
2683
+ benchmarks: {
2684
+ intelligence: 37,
2685
+ coding: 29.2,
2686
+ math: 73,
2687
+ mmluPro: 0.79,
2688
+ gpqa: 0.68,
2689
+ },
2690
+ performance: {
2691
+ intelligenceScore: 37,
2692
+ },
2693
+ contextLength: 200000,
2694
+ context: {
2695
+ input: {
2696
+ text: true,
2697
+ audio: false,
2698
+ image: true,
2699
+ video: false
2700
+ },
2701
+ output: {
2702
+ text: true,
2703
+ audio: false,
2704
+ image: false,
2705
+ video: false
2706
+ }
2707
+ },
2708
+ deprecated: false,
2709
+ isAvailable: true,
2710
+ lastUpdated: '2026-01-02',
2711
+ },
2712
+ 'gpt-audio-mini-2025-10-06': {
2713
+ type: 'audio',
766
2714
  provider: 'openai',
767
- displayName: 'GPT OSS 20B',
768
- pricing: { input: 0.00007000000000000001, output: 0.0002 },
769
- benchmarks: {
770
- intelligence: 52.1,
771
- coding: 40.7,
772
- math: 89.3,
773
- mmluPro: 0.748,
774
- gpqa: 0.688,
775
- },
776
- performance: {
777
- outputTokenPerSecond: 242.94,
778
- timeTofirstToken: 0.556,
779
- intelligenceScore: 52.1,
780
- },
781
- lastUpdated: '2025-12-24',
782
- },
783
- 'dall-e-3': {
784
- type: 'image',
2715
+ displayName: 'gpt-audio-mini',
2716
+ description: 'A cost-efficient version of GPT Audio',
2717
+ pricing: { input: 0.6, output: 2.4 },
2718
+ contextLength: 128000,
2719
+ context: {
2720
+ input: {
2721
+ text: true,
2722
+ audio: true,
2723
+ image: false,
2724
+ video: false
2725
+ },
2726
+ output: {
2727
+ text: true,
2728
+ audio: true,
2729
+ image: false,
2730
+ video: false
2731
+ }
2732
+ },
2733
+ deprecated: false,
2734
+ isAvailable: true,
2735
+ lastUpdated: '2026-01-02',
2736
+ },
2737
+ 'gpt-audio-mini-2025-12-15': {
2738
+ type: 'audio',
785
2739
  provider: 'openai',
786
- displayName: 'DALL-E 3',
787
- lastUpdated: '2025-12-24',
788
- },
789
- 'dall-e-2': {
2740
+ displayName: 'gpt-audio-mini',
2741
+ description: 'A cost-efficient version of GPT Audio',
2742
+ pricing: { input: 0.6, output: 2.4 },
2743
+ contextLength: 128000,
2744
+ context: {
2745
+ input: {
2746
+ text: true,
2747
+ audio: true,
2748
+ image: false,
2749
+ video: false
2750
+ },
2751
+ output: {
2752
+ text: true,
2753
+ audio: true,
2754
+ image: false,
2755
+ video: false
2756
+ }
2757
+ },
2758
+ deprecated: false,
2759
+ isAvailable: true,
2760
+ lastUpdated: '2026-01-02',
2761
+ },
2762
+ 'gpt-image-1.5': {
790
2763
  type: 'image',
791
2764
  provider: 'openai',
792
- displayName: 'DALL-E 2',
793
- lastUpdated: '2025-12-24',
794
- },
795
- 'openai/gpt-image-1': {
796
- type: 'image',
2765
+ displayName: 'GPT Image 1.5',
2766
+ description: 'State-of-the-art image generation model',
2767
+ pricing: { input: 5, output: 10 },
2768
+ context: {
2769
+ input: {
2770
+ text: true,
2771
+ audio: false,
2772
+ image: false,
2773
+ video: false
2774
+ },
2775
+ output: {
2776
+ text: false,
2777
+ audio: false,
2778
+ image: true,
2779
+ video: false
2780
+ }
2781
+ },
2782
+ deprecated: false,
2783
+ isAvailable: true,
2784
+ lastUpdated: '2026-01-02',
2785
+ },
2786
+ 'gpt-realtime-2025-08-28': {
2787
+ type: 'audio',
797
2788
  provider: 'openai',
798
- displayName: 'GPT Image 1',
799
- lastUpdated: '2025-12-24',
800
- },
801
- 'openai/gpt-image-1-mini': {
802
- type: 'image',
2789
+ displayName: 'gpt-realtime',
2790
+ description: 'Model capable of realtime text and audio inputs and outputs',
2791
+ pricing: { input: 4, output: 16 },
2792
+ contextLength: 128000,
2793
+ context: {
2794
+ input: {
2795
+ text: true,
2796
+ audio: true,
2797
+ image: false,
2798
+ video: false
2799
+ },
2800
+ output: {
2801
+ text: true,
2802
+ audio: true,
2803
+ image: false,
2804
+ video: false
2805
+ }
2806
+ },
2807
+ deprecated: false,
2808
+ isAvailable: true,
2809
+ lastUpdated: '2026-01-02',
2810
+ },
2811
+ 'gpt-realtime-mini-2025-10-06': {
2812
+ type: 'audio',
803
2813
  provider: 'openai',
804
- displayName: 'GPT Image 1 Mini',
805
- lastUpdated: '2025-12-24',
2814
+ displayName: 'gpt-realtime-mini',
2815
+ description: 'A cost-efficient version of GPT Realtime',
2816
+ pricing: { input: 0.6, output: 2.4 },
2817
+ contextLength: 128000,
2818
+ context: {
2819
+ input: {
2820
+ text: true,
2821
+ audio: true,
2822
+ image: false,
2823
+ video: false
2824
+ },
2825
+ output: {
2826
+ text: true,
2827
+ audio: true,
2828
+ image: false,
2829
+ video: false
2830
+ }
2831
+ },
2832
+ deprecated: false,
2833
+ isAvailable: true,
2834
+ lastUpdated: '2026-01-02',
806
2835
  },
807
- 'openai/gpt-image-1-5': {
808
- type: 'image',
809
- provider: 'openai',
810
- displayName: 'GPT-Image-1.5',
811
- lastUpdated: '2025-12-24',
2836
+ 'text-embedding-3-large': {
2837
+ type: 'embedding',
2838
+ provider: 'openai',
2839
+ displayName: 'text-embedding-3-large',
2840
+ description: 'Most capable embedding model',
2841
+ pricing: { input: 0.13, output: 0 },
2842
+ contextLength: 8191,
2843
+ context: {
2844
+ input: {
2845
+ text: true,
2846
+ audio: false,
2847
+ image: false,
2848
+ video: false
2849
+ },
2850
+ output: {
2851
+ text: false,
2852
+ audio: false,
2853
+ image: false,
2854
+ video: false
2855
+ }
2856
+ },
2857
+ deprecated: false,
2858
+ isAvailable: true,
2859
+ lastUpdated: '2026-01-02',
812
2860
  },
813
2861
  'text-embedding-3-small': {
814
- type: 'embeddings',
815
- provider: 'openai',
816
- displayName: 'Text embedding 3 small',
817
- contextLength: 8000,
818
- lastUpdated: '2025-12-24',
819
- },
820
- 'text-embedding-3-large': {
821
- type: 'embeddings',
822
- provider: 'openai',
823
- displayName: 'Text embedding 3 large',
824
- contextLength: 8000,
825
- lastUpdated: '2025-12-24',
2862
+ type: 'embedding',
2863
+ provider: 'openai',
2864
+ displayName: 'text-embedding-3-small',
2865
+ description: 'Small embedding model',
2866
+ pricing: { input: 0.02, output: 0 },
2867
+ contextLength: 8191,
2868
+ context: {
2869
+ input: {
2870
+ text: true,
2871
+ audio: false,
2872
+ image: false,
2873
+ video: false
2874
+ },
2875
+ output: {
2876
+ text: false,
2877
+ audio: false,
2878
+ image: false,
2879
+ video: false
2880
+ }
2881
+ },
2882
+ deprecated: false,
2883
+ isAvailable: true,
2884
+ lastUpdated: '2026-01-02',
826
2885
  },
827
2886
  'text-embedding-ada-002': {
828
- type: 'embeddings',
829
- provider: 'openai',
830
- displayName: 'Text embedding ada 002',
831
- contextLength: 8000,
832
- lastUpdated: '2025-12-24',
833
- },
834
- 'openai/gpt-4o-transcribe': {
835
- type: 'stt',
836
- provider: 'openai',
837
- displayName: 'GPT-4o Transcribe',
838
- lastUpdated: '2025-12-24',
839
- },
840
- 'openai/gpt-4o-mini-transcribe': {
841
- type: 'stt',
842
- provider: 'openai',
843
- displayName: 'GPT-4o Mini Transcribe',
844
- lastUpdated: '2025-12-24',
845
- },
846
- 'openai/gpt-4o-mini-tts': {
847
- type: 'tts',
848
- provider: 'openai',
849
- displayName: 'GPT-4o mini TTS',
850
- lastUpdated: '2025-12-24',
851
- },
852
- 'openai/tts-1': {
2887
+ type: 'embedding',
2888
+ provider: 'openai',
2889
+ displayName: 'text-embedding-ada-002',
2890
+ description: 'Older embedding model',
2891
+ pricing: { input: 0.1, output: 0 },
2892
+ contextLength: 8191,
2893
+ context: {
2894
+ input: {
2895
+ text: true,
2896
+ audio: false,
2897
+ image: false,
2898
+ video: false
2899
+ },
2900
+ output: {
2901
+ text: false,
2902
+ audio: false,
2903
+ image: false,
2904
+ video: false
2905
+ }
2906
+ },
2907
+ deprecated: false,
2908
+ isAvailable: true,
2909
+ lastUpdated: '2026-01-02',
2910
+ },
2911
+ 'tts-1': {
853
2912
  type: 'tts',
854
2913
  provider: 'openai',
855
2914
  displayName: 'TTS-1',
856
- lastUpdated: '2025-12-24',
857
- },
858
- 'openai/tts-1-hd': {
2915
+ description: 'Text-to-speech model optimized for speed',
2916
+ pricing: { input: 0, output: 0 },
2917
+ context: {
2918
+ input: {
2919
+ text: true,
2920
+ audio: false,
2921
+ image: false,
2922
+ video: false
2923
+ },
2924
+ output: {
2925
+ text: false,
2926
+ audio: true,
2927
+ image: false,
2928
+ video: false
2929
+ }
2930
+ },
2931
+ deprecated: false,
2932
+ isAvailable: true,
2933
+ lastUpdated: '2026-01-02',
2934
+ },
2935
+ 'tts-1-hd': {
859
2936
  type: 'tts',
860
2937
  provider: 'openai',
861
2938
  displayName: 'TTS-1 HD',
862
- lastUpdated: '2025-12-24',
863
- },
864
- 'gpt-3.5-turbo-instruct': {
865
- type: 'language-completion',
866
- provider: 'openai',
867
- displayName: 'Gpt 3.5 turbo instruct',
868
- pricing: { input: 0.0005, output: 0.0015 },
869
- benchmarks: {
870
- intelligence: 8.3,
871
- coding: 10.7,
872
- mmluPro: 0.462,
873
- gpqa: 0.297,
874
- },
875
- performance: {
876
- outputTokenPerSecond: 129.872,
877
- timeTofirstToken: 0.68,
878
- intelligenceScore: 8.3,
879
- },
880
- lastUpdated: '2025-12-24',
881
- },
882
- 'openai/sora-2-t2v': {
883
- type: 'video',
884
- provider: 'openai',
885
- displayName: 'Sora 2 Text to Video',
886
- lastUpdated: '2025-12-24',
887
- },
888
- 'openai/sora-2-i2v': {
889
- type: 'video',
890
- provider: 'openai',
891
- displayName: 'Sora 2 Image to Video',
892
- lastUpdated: '2025-12-24',
893
- },
894
- 'openai/sora-2-pro-i2v': {
895
- type: 'video',
896
- provider: 'openai',
897
- displayName: 'Sora 2 Pro Image to Video',
898
- lastUpdated: '2025-12-24',
899
- },
900
- 'openai/sora-2-pro-t2v': {
901
- type: 'video',
902
- provider: 'openai',
903
- displayName: 'Sora 2 Pro Text to Video',
904
- lastUpdated: '2025-12-24',
905
- },
906
- 'fallback-openai/sora-2-t2v': {
907
- type: 'video',
908
- provider: 'openai',
909
- displayName: 'Sora 2 Text to Video',
910
- lastUpdated: '2025-12-24',
911
- },
912
- 'fallback-openai/sora-2-i2v': {
913
- type: 'video',
914
- provider: 'openai',
915
- displayName: 'Sora 2 Image to Video',
916
- lastUpdated: '2025-12-24',
917
- },
918
- 'fallback-openai/sora-2-pro-i2v': {
919
- type: 'video',
920
- provider: 'openai',
921
- displayName: 'Sora 2 Pro Image to Video',
922
- lastUpdated: '2025-12-24',
923
- },
924
- 'fallback-openai/sora-2-pro-t2v': {
925
- type: 'video',
926
- provider: 'openai',
927
- displayName: 'Sora 2 Pro Text to Video',
928
- lastUpdated: '2025-12-24',
929
- },
930
- // Anthropic models
931
- 'claude-3-opus-20240229': {
932
- type: 'chat',
933
- provider: 'anthropic',
934
- displayName: 'Claude 3 Opus 2024-02-29',
935
- pricing: { input: 0.015, output: 0.075 },
936
- benchmarks: {
937
- intelligence: 20.6,
938
- coding: 19.5,
939
- mmluPro: 0.696,
940
- gpqa: 0.489,
941
- },
942
- performance: {
943
- outputTokenPerSecond: 0,
944
- timeTofirstToken: 0,
945
- intelligenceScore: 20.6,
946
- },
947
- lastUpdated: '2025-12-24',
948
- },
949
- 'claude-3-haiku-20240307': {
950
- type: 'chat',
951
- provider: 'anthropic',
952
- displayName: 'Claude 3 Haiku 2024-03-07',
953
- pricing: { input: 0.00025, output: 0.00125 },
954
- benchmarks: {
955
- intelligence: 9.6,
956
- },
957
- performance: {
958
- outputTokenPerSecond: 122.944,
959
- timeTofirstToken: 0.405,
960
- intelligenceScore: 9.6,
961
- },
962
- lastUpdated: '2025-12-24',
963
- },
964
- 'claude-3-5-haiku-20241022': {
965
- type: 'chat',
966
- provider: 'anthropic',
967
- displayName: 'Claude 3.5 Haiku 2024-10-22',
968
- pricing: { input: 0.0008, output: 0.004 },
969
- benchmarks: {
970
- intelligence: 20.2,
971
- mmluPro: 0.634,
972
- gpqa: 0.408,
973
- },
974
- performance: {
975
- outputTokenPerSecond: 47.836,
976
- timeTofirstToken: 0.667,
977
- intelligenceScore: 20.2,
978
- },
979
- lastUpdated: '2025-12-24',
980
- },
981
- 'claude-3-7-sonnet-20250219': {
982
- type: 'chat',
983
- provider: 'anthropic',
984
- displayName: 'Claude 3.7 Sonnet',
985
- pricing: { input: 0.003, output: 0.015 },
986
- benchmarks: {
987
- intelligence: 41.1,
988
- coding: 32.3,
989
- math: 21,
990
- mmluPro: 0.803,
991
- gpqa: 0.656,
992
- },
993
- performance: {
994
- outputTokenPerSecond: 0,
995
- timeTofirstToken: 0,
996
- intelligenceScore: 41.1,
997
- },
998
- lastUpdated: '2025-12-24',
999
- },
1000
- 'claude-sonnet-4-20250514': {
1001
- type: 'chat',
1002
- provider: 'anthropic',
1003
- displayName: 'Claude 4 Sonnet',
1004
- pricing: { input: 0.003, output: 0.015 },
1005
- benchmarks: {
1006
- intelligence: 44.4,
1007
- coding: 35.9,
1008
- math: 38,
1009
- mmluPro: 0.837,
1010
- gpqa: 0.683,
1011
- },
1012
- performance: {
1013
- outputTokenPerSecond: 59.339,
1014
- timeTofirstToken: 1.181,
1015
- intelligenceScore: 44.4,
1016
- },
1017
- lastUpdated: '2025-12-24',
1018
- },
1019
- 'claude-opus-4-20250514': {
1020
- type: 'chat',
1021
- provider: 'anthropic',
1022
- displayName: 'Claude 4 Opus',
1023
- pricing: { input: 0.015, output: 0.075 },
1024
- benchmarks: {
1025
- intelligence: 42.3,
1026
- math: 36.3,
1027
- mmluPro: 0.86,
1028
- gpqa: 0.701,
1029
- },
1030
- performance: {
1031
- outputTokenPerSecond: 40.647,
1032
- timeTofirstToken: 1.319,
1033
- intelligenceScore: 42.3,
1034
- },
1035
- lastUpdated: '2025-12-24',
1036
- },
1037
- 'claude-opus-4-1-20250805': {
1038
- type: 'chat',
1039
- provider: 'anthropic',
1040
- displayName: 'Claude 4.1 Opus',
1041
- pricing: { input: 0.015, output: 0.075 },
1042
- benchmarks: {
1043
- intelligence: 44.6,
1044
- },
1045
- performance: {
1046
- outputTokenPerSecond: 39.197,
1047
- timeTofirstToken: 1.41,
1048
- intelligenceScore: 44.6,
1049
- },
1050
- lastUpdated: '2025-12-24',
1051
- },
1052
- 'claude-sonnet-4-5-20250929': {
1053
- type: 'chat',
1054
- provider: 'anthropic',
1055
- displayName: 'Claude 4.5 Sonnet',
1056
- pricing: { input: 0.003, output: 0.015 },
1057
- benchmarks: {
1058
- intelligence: 49.6,
1059
- coding: 42.9,
1060
- math: 37,
1061
- mmluPro: 0.86,
1062
- gpqa: 0.727,
1063
- },
1064
- performance: {
1065
- outputTokenPerSecond: 69.532,
1066
- timeTofirstToken: 2.014,
1067
- intelligenceScore: 49.6,
1068
- },
1069
- lastUpdated: '2025-12-24',
1070
- },
1071
- 'claude-haiku-4-5-20251001': {
1072
- type: 'chat',
1073
- provider: 'anthropic',
1074
- displayName: 'Claude 4.5 Haiku',
1075
- pricing: { input: 0.001, output: 0.005 },
1076
- benchmarks: {
1077
- intelligence: 41.7,
1078
- coding: 37,
1079
- math: 39,
1080
- mmluPro: 0.8,
1081
- gpqa: 0.646,
1082
- },
1083
- performance: {
1084
- outputTokenPerSecond: 111.623,
1085
- timeTofirstToken: 0.39,
1086
- intelligenceScore: 41.7,
1087
- },
1088
- lastUpdated: '2025-12-24',
1089
- },
1090
- 'claude-opus-4-5-20251101': {
1091
- type: 'chat',
1092
- provider: 'anthropic',
1093
- displayName: 'Claude 4.5 Opus',
1094
- lastUpdated: '2025-12-24',
1095
- },
1096
- 'voyage-large-2-instruct': {
1097
- type: 'embeddings',
1098
- provider: 'anthropic',
1099
- displayName: 'Voyage large 2 instruct',
1100
- contextLength: 16000,
1101
- lastUpdated: '2025-12-24',
1102
- },
1103
- 'voyage-finance-2': {
1104
- type: 'embeddings',
1105
- provider: 'anthropic',
1106
- displayName: 'Voyage finance 2',
1107
- contextLength: 32000,
1108
- lastUpdated: '2025-12-24',
1109
- },
1110
- 'voyage-multilingual-2': {
1111
- type: 'embeddings',
1112
- provider: 'anthropic',
1113
- displayName: 'Voyage multilingual 2',
1114
- contextLength: 32000,
1115
- lastUpdated: '2025-12-24',
1116
- },
1117
- 'voyage-law-2': {
1118
- type: 'embeddings',
1119
- provider: 'anthropic',
1120
- displayName: 'Voyage law 2',
1121
- contextLength: 16000,
1122
- lastUpdated: '2025-12-24',
1123
- },
1124
- 'voyage-code-2': {
1125
- type: 'embeddings',
1126
- provider: 'anthropic',
1127
- displayName: 'Voyage code 2',
1128
- contextLength: 16000,
1129
- lastUpdated: '2025-12-24',
1130
- },
1131
- 'voyage-large-2': {
1132
- type: 'embeddings',
1133
- provider: 'anthropic',
1134
- displayName: 'Voyage large 2',
1135
- contextLength: 16000,
1136
- lastUpdated: '2025-12-24',
1137
- },
1138
- 'voyage-2': {
1139
- type: 'embeddings',
1140
- provider: 'anthropic',
1141
- displayName: 'Voyage 2',
1142
- contextLength: 4000,
1143
- lastUpdated: '2025-12-24',
1144
- },
1145
- // Google models
1146
- 'google/gemini-2.0-flash-exp': {
1147
- type: 'chat',
1148
- provider: 'google',
1149
- displayName: 'Gemini 2.0 Flash Experimental',
1150
- benchmarks: {
1151
- intelligence: 31.8,
1152
- mmluPro: 0.782,
1153
- gpqa: 0.636,
1154
- },
1155
- performance: {
1156
- outputTokenPerSecond: 166.706,
1157
- timeTofirstToken: 0.284,
1158
- intelligenceScore: 31.8,
1159
- },
1160
- lastUpdated: '2025-12-24',
1161
- },
1162
- 'google/gemini-2.0-flash': {
1163
- type: 'chat',
1164
- provider: 'google',
1165
- displayName: 'Gemini 2.0 Flash',
1166
- pricing: { input: 0.0001, output: 0.0004 },
1167
- benchmarks: {
1168
- intelligence: 33.6,
1169
- coding: 23.4,
1170
- math: 21.7,
1171
- mmluPro: 0.779,
1172
- gpqa: 0.623,
1173
- },
1174
- performance: {
1175
- outputTokenPerSecond: 0,
1176
- timeTofirstToken: 0,
1177
- intelligenceScore: 33.6,
1178
- },
1179
- lastUpdated: '2025-12-24',
1180
- },
1181
- 'google/gemini-2.5-pro': {
1182
- type: 'chat',
1183
- provider: 'google',
1184
- displayName: 'Gemini 2.5 Pro',
1185
- pricing: { input: 0.00125, output: 0.01 },
1186
- benchmarks: {
1187
- intelligence: 59.6,
1188
- coding: 49.3,
1189
- math: 87.7,
1190
- mmluPro: 0.862,
1191
- gpqa: 0.844,
1192
- },
1193
- performance: {
1194
- outputTokenPerSecond: 160.909,
1195
- timeTofirstToken: 34.11,
1196
- intelligenceScore: 59.6,
1197
- },
1198
- lastUpdated: '2025-12-24',
1199
- },
1200
- 'google/gemini-2.5-flash': {
1201
- type: 'chat',
1202
- provider: 'google',
1203
- displayName: 'Gemini 2.5 Flash',
1204
- pricing: { input: 0.0003, output: 0.0025 },
1205
- benchmarks: {
1206
- intelligence: 40.4,
1207
- coding: 30,
1208
- math: 60.3,
1209
- mmluPro: 0.809,
1210
- gpqa: 0.683,
1211
- },
1212
- performance: {
1213
- outputTokenPerSecond: 261.732,
1214
- timeTofirstToken: 0.421,
1215
- intelligenceScore: 40.4,
1216
- },
1217
- lastUpdated: '2025-12-24',
1218
- },
1219
- 'google/gemma-3-4b-it': {
1220
- type: 'chat',
1221
- provider: 'google',
1222
- displayName: 'Gemma 3 4B',
1223
- benchmarks: {
1224
- intelligence: 14.7,
1225
- coding: 6.4,
1226
- math: 12.7,
1227
- mmluPro: 0.417,
1228
- gpqa: 0.291,
1229
- },
1230
- performance: {
1231
- outputTokenPerSecond: 42.309,
1232
- timeTofirstToken: 0.976,
1233
- intelligenceScore: 14.7,
1234
- },
1235
- lastUpdated: '2025-12-24',
1236
- },
1237
- 'google/gemma-3-12b-it': {
1238
- type: 'chat',
1239
- provider: 'google',
1240
- displayName: 'Gemma 3 12B',
1241
- benchmarks: {
1242
- intelligence: 20.4,
1243
- coding: 10.6,
1244
- math: 18.3,
1245
- mmluPro: 0.595,
1246
- gpqa: 0.349,
1247
- },
1248
- performance: {
1249
- outputTokenPerSecond: 46.989,
1250
- timeTofirstToken: 7.926,
1251
- intelligenceScore: 20.4,
1252
- },
1253
- lastUpdated: '2025-12-24',
1254
- },
1255
- 'google/gemma-3-27b-it': {
1256
- type: 'chat',
1257
- provider: 'google',
1258
- displayName: 'Gemma 3 27B',
1259
- benchmarks: {
1260
- intelligence: 22.1,
1261
- coding: 12.8,
1262
- math: 20.7,
1263
- mmluPro: 0.669,
1264
- gpqa: 0.428,
1265
- },
1266
- performance: {
1267
- outputTokenPerSecond: 47.301,
1268
- timeTofirstToken: 0.781,
1269
- intelligenceScore: 22.1,
1270
- },
1271
- lastUpdated: '2025-12-24',
1272
- },
1273
- 'google/gemini-2.5-flash-lite-preview': {
1274
- type: 'chat',
1275
- provider: 'google',
1276
- displayName: 'Gemini 2.5 Flash Lite Preview',
1277
- pricing: { input: 0.0001, output: 0.0004 },
1278
- benchmarks: {
1279
- intelligence: 30.1,
1280
- coding: 19.9,
1281
- math: 35.3,
1282
- mmluPro: 0.724,
1283
- gpqa: 0.474,
1284
- },
1285
- performance: {
1286
- outputTokenPerSecond: 0,
1287
- timeTofirstToken: 0,
1288
- intelligenceScore: 30.1,
1289
- },
1290
- lastUpdated: '2025-12-24',
1291
- },
1292
- 'google/gemma-3n-e4b-it': {
1293
- type: 'chat',
1294
- provider: 'google',
1295
- displayName: 'Gemma 3n 4B',
1296
- pricing: { input: 0.00002, output: 0.00004 },
1297
- benchmarks: {
1298
- intelligence: 15.5,
1299
- coding: 8.3,
1300
- math: 14.3,
1301
- mmluPro: 0.488,
1302
- gpqa: 0.296,
1303
- },
1304
- performance: {
1305
- outputTokenPerSecond: 0,
1306
- timeTofirstToken: 0,
1307
- intelligenceScore: 15.5,
1308
- },
1309
- lastUpdated: '2025-12-24',
1310
- },
1311
- 'google/gemini-3-pro-preview': {
1312
- type: 'chat',
1313
- provider: 'google',
1314
- displayName: 'Gemini 3 Pro Preview',
1315
- pricing: { input: 0.002, output: 0.012 },
1316
- benchmarks: {
1317
- intelligence: 72.8,
1318
- coding: 62.3,
1319
- math: 95.7,
1320
- mmluPro: 0.898,
1321
- gpqa: 0.908,
1322
- },
1323
- performance: {
1324
- outputTokenPerSecond: 133.913,
1325
- timeTofirstToken: 29.692,
1326
- intelligenceScore: 72.8,
1327
- },
1328
- lastUpdated: '2025-12-24',
1329
- },
1330
- 'google/gemini-3-flash-preview': {
1331
- type: 'chat',
1332
- provider: 'google',
1333
- displayName: 'Gemini 3 Flash Preview',
1334
- pricing: { input: 0.0005, output: 0.003 },
1335
- benchmarks: {
1336
- intelligence: 54.5,
1337
- coding: 53.1,
1338
- math: 55.7,
1339
- mmluPro: 0.882,
1340
- gpqa: 0.812,
1341
- },
1342
- performance: {
1343
- outputTokenPerSecond: 191.798,
1344
- timeTofirstToken: 0.683,
1345
- intelligenceScore: 54.5,
1346
- },
1347
- lastUpdated: '2025-12-24',
1348
- },
1349
- 'google/gc-document-ai': {
1350
- type: 'document',
1351
- provider: 'google',
1352
- displayName: 'GC document AI',
1353
- lastUpdated: '2025-12-24',
1354
- },
1355
- 'imagen-3.0-generate-002': {
1356
- type: 'image',
1357
- provider: 'google',
1358
- displayName: 'Imagen 3.0',
1359
- lastUpdated: '2025-12-24',
1360
- },
1361
- 'imagen-4.0-ultra-generate-preview-06-06': {
1362
- type: 'image',
1363
- provider: 'google',
1364
- displayName: 'Imagen 4.0 Ultra',
1365
- lastUpdated: '2025-12-24',
1366
- },
1367
- 'google/imagen-4.0-generate-001': {
1368
- type: 'image',
1369
- provider: 'google',
1370
- displayName: 'Imagen 4.0 Generate',
1371
- lastUpdated: '2025-12-24',
1372
- },
1373
- 'google/imagen-4.0-fast-generate-001': {
1374
- type: 'image',
1375
- provider: 'google',
1376
- displayName: 'Imagen 4.0 Fast Generate',
1377
- lastUpdated: '2025-12-24',
1378
- },
1379
- 'google/imagen-4.0-ultra-generate-001': {
1380
- type: 'image',
1381
- provider: 'google',
1382
- displayName: 'Imagen 4.0 Ultra Generate',
1383
- lastUpdated: '2025-12-24',
1384
- },
1385
- 'google/imagen4/preview': {
1386
- type: 'image',
1387
- provider: 'google',
1388
- displayName: 'Imagen 4.0 Generate Preview',
1389
- lastUpdated: '2025-12-24',
1390
- },
1391
- 'google/gemini-2.5-flash-image': {
1392
- type: 'image',
1393
- provider: 'google',
1394
- displayName: 'Gemini 2.5 Flash Image',
1395
- lastUpdated: '2025-12-24',
1396
- },
1397
- 'google/gemini-2.5-flash-image-edit': {
1398
- type: 'image',
1399
- provider: 'google',
1400
- displayName: 'Gemini 2.5 Flash Image Edit',
1401
- lastUpdated: '2025-12-24',
1402
- },
1403
- 'google/gemini-3-pro-image-preview': {
1404
- type: 'image',
1405
- provider: 'google',
1406
- displayName: 'Gemini 3 Pro Image',
1407
- lastUpdated: '2025-12-24',
1408
- },
1409
- 'google/nano-banana-pro': {
1410
- type: 'image',
1411
- provider: 'google',
1412
- displayName: 'Nano Banana Pro',
1413
- lastUpdated: '2025-12-24',
1414
- },
1415
- 'google/gemini-3-pro-image-preview-edit': {
1416
- type: 'image',
1417
- provider: 'google',
1418
- displayName: 'Gemini 3 Pro Image Edit',
1419
- lastUpdated: '2025-12-24',
1420
- },
1421
- 'google/nano-banana-pro-edit': {
1422
- type: 'image',
1423
- provider: 'google',
1424
- displayName: 'Nano Banana Pro Edit',
1425
- lastUpdated: '2025-12-24',
1426
- },
1427
- 'text-embedding-004': {
1428
- type: 'embeddings',
1429
- provider: 'google',
1430
- displayName: 'Text embedding 004',
1431
- contextLength: 2000,
1432
- lastUpdated: '2025-12-24',
1433
- },
1434
- 'text-multilingual-embedding-002': {
1435
- type: 'embeddings',
1436
- provider: 'google',
1437
- displayName: 'Text multilingual embedding 002',
1438
- contextLength: 2000,
1439
- lastUpdated: '2025-12-24',
1440
- },
1441
- 'google/veo-3.1-t2v': {
1442
- type: 'video',
1443
- provider: 'google',
1444
- displayName: 'Veo3.1 Text-To-Video',
1445
- lastUpdated: '2025-12-24',
1446
- },
1447
- 'google/veo-3.1-i2v': {
1448
- type: 'video',
1449
- provider: 'google',
1450
- displayName: 'Veo3.1 Image-To-Video',
1451
- lastUpdated: '2025-12-24',
1452
- },
1453
- 'google/veo-3.1-first-last-image-to-video': {
1454
- type: 'video',
1455
- provider: 'google',
1456
- displayName: 'Veo3.1 First-Last-Frame-Image-To-Video',
1457
- lastUpdated: '2025-12-24',
1458
- },
1459
- 'google/veo-3.1-reference-to-video': {
1460
- type: 'video',
1461
- provider: 'google',
1462
- displayName: 'Veo3.1 Reference-To-Video',
1463
- lastUpdated: '2025-12-24',
1464
- },
1465
- 'google/veo-3.1-t2v-fast': {
1466
- type: 'video',
1467
- provider: 'google',
1468
- displayName: 'Veo3.1 Text-To-Video Fast',
1469
- lastUpdated: '2025-12-24',
1470
- },
1471
- 'google/veo-3.1-i2v-fast': {
1472
- type: 'video',
1473
- provider: 'google',
1474
- displayName: 'Veo3.1 Image-To-Video Fast',
1475
- lastUpdated: '2025-12-24',
1476
- },
1477
- 'google/veo-3.1-first-last-image-to-video-fast': {
1478
- type: 'video',
1479
- provider: 'google',
1480
- displayName: 'Veo3.1 First-Last-Frame-Image-To-Video Fast',
1481
- lastUpdated: '2025-12-24',
1482
- },
1483
- 'google/veo3-1-extend-video': {
1484
- type: 'video',
1485
- provider: 'google',
1486
- displayName: 'Veo 3.1 Extend Video',
1487
- lastUpdated: '2025-12-24',
1488
- },
1489
- 'google/veo3-1-fast-extend-video': {
1490
- type: 'video',
1491
- provider: 'google',
1492
- displayName: 'Veo 3.1 Fast Extend Video',
1493
- lastUpdated: '2025-12-24',
1494
- },
1495
- 'veo2/image-to-video': {
1496
- type: 'video',
1497
- provider: 'google',
1498
- displayName: 'Veo2 Image-to-Video',
1499
- lastUpdated: '2025-12-24',
1500
- },
1501
- 'veo2': {
1502
- type: 'video',
1503
- provider: 'google',
1504
- displayName: 'Veo2 Text-to-Video',
1505
- lastUpdated: '2025-12-24',
1506
- },
1507
- 'google/veo3': {
1508
- type: 'video',
1509
- provider: 'google',
1510
- displayName: 'Veo3 Text-to-Video',
1511
- lastUpdated: '2025-12-24',
1512
- },
1513
- 'google/veo-3.0-i2v': {
1514
- type: 'video',
1515
- provider: 'google',
1516
- displayName: 'Veo3 Image-to-Video',
1517
- lastUpdated: '2025-12-24',
1518
- },
1519
- 'google/veo-3.0-fast': {
1520
- type: 'video',
1521
- provider: 'google',
1522
- displayName: 'Veo3 Text-To-Video Fast',
1523
- lastUpdated: '2025-12-24',
1524
- },
1525
- 'google/veo-3.0-i2v-fast': {
1526
- type: 'video',
1527
- provider: 'google',
1528
- displayName: 'Veo3 Image-to-Video Fast',
1529
- lastUpdated: '2025-12-24',
1530
- },
1531
- 'google/lyria2': {
2939
+ description: 'Text-to-speech model optimized for quality',
2940
+ pricing: { input: 0, output: 0 },
2941
+ context: {
2942
+ input: {
2943
+ text: true,
2944
+ audio: false,
2945
+ image: false,
2946
+ video: false
2947
+ },
2948
+ output: {
2949
+ text: false,
2950
+ audio: true,
2951
+ image: false,
2952
+ video: false
2953
+ }
2954
+ },
2955
+ deprecated: false,
2956
+ isAvailable: true,
2957
+ lastUpdated: '2026-01-02',
2958
+ },
2959
+ 'whisper-1': {
1532
2960
  type: 'audio',
1533
- provider: 'google',
1534
- displayName: 'Lyria 2',
1535
- lastUpdated: '2025-12-24',
1536
- },
1537
- // Mistral models
1538
- 'mistralai/Mixtral-8x7B-Instruct-v0.1': {
1539
- type: 'chat',
1540
- provider: 'mistral',
1541
- displayName: 'Mixtral 8x7B Instruct v0.1',
1542
- pricing: { input: 0.00054, output: 0.0006 },
1543
- benchmarks: {
1544
- intelligence: 2.6,
1545
- mmluPro: 0.387,
1546
- gpqa: 0.292,
1547
- },
1548
- performance: {
1549
- outputTokenPerSecond: 0,
1550
- timeTofirstToken: 0,
1551
- intelligenceScore: 2.6,
1552
- },
1553
- lastUpdated: '2025-12-24',
1554
- },
1555
- 'mistralai/Mistral-7B-Instruct-v0.2': {
1556
- type: 'chat',
1557
- provider: 'mistral',
1558
- displayName: 'Mistral 7B Instruct v0.2',
1559
- pricing: { input: 0.00025, output: 0.00025 },
1560
- benchmarks: {
1561
- intelligence: 1,
1562
- mmluPro: 0.245,
1563
- gpqa: 0.177,
1564
- },
1565
- performance: {
1566
- outputTokenPerSecond: 123.408,
1567
- timeTofirstToken: 0.382,
1568
- intelligenceScore: 1,
1569
- },
1570
- lastUpdated: '2025-12-24',
1571
- },
1572
- 'mistralai/Mistral-7B-Instruct-v0.3': {
1573
- type: 'chat',
1574
- provider: 'mistral',
1575
- displayName: 'Mistral 7B Instruct v0.3',
1576
- pricing: { input: 0.00025, output: 0.00025 },
1577
- benchmarks: {
1578
- intelligence: 1,
1579
- mmluPro: 0.245,
1580
- gpqa: 0.177,
1581
- },
1582
- performance: {
1583
- outputTokenPerSecond: 123.408,
1584
- timeTofirstToken: 0.382,
1585
- intelligenceScore: 1,
1586
- },
1587
- lastUpdated: '2025-12-24',
1588
- },
1589
- 'mistralai/mistral-tiny': {
1590
- type: 'chat',
1591
- provider: 'mistral',
1592
- displayName: 'Mistral tiny',
1593
- pricing: { input: 0.0002, output: 0.0006 },
1594
- benchmarks: {
1595
- intelligence: 13,
1596
- mmluPro: 0.529,
1597
- gpqa: 0.381,
1598
- },
1599
- performance: {
1600
- outputTokenPerSecond: 115.713,
1601
- timeTofirstToken: 0.399,
1602
- intelligenceScore: 13,
1603
- },
1604
- lastUpdated: '2025-12-24',
1605
- },
1606
- 'mistralai/mistral-nemo': {
1607
- type: 'chat',
1608
- provider: 'mistral',
1609
- displayName: 'Mistral nemo',
1610
- pricing: { input: 0.0002, output: 0.0006 },
1611
- benchmarks: {
1612
- intelligence: 13,
1613
- mmluPro: 0.529,
1614
- gpqa: 0.381,
1615
- },
1616
- performance: {
1617
- outputTokenPerSecond: 115.713,
1618
- timeTofirstToken: 0.399,
1619
- intelligenceScore: 13,
1620
- },
1621
- lastUpdated: '2025-12-24',
1622
- },
1623
- 'mistral/mistral-ocr-latest': {
1624
- type: 'document',
1625
- provider: 'mistral',
1626
- displayName: 'Mistral OCR',
1627
- lastUpdated: '2025-12-24',
1628
- },
2961
+ provider: 'openai',
2962
+ displayName: 'Whisper',
2963
+ description: 'General-purpose speech recognition model',
2964
+ pricing: { input: 0, output: 0 },
2965
+ context: {
2966
+ input: {
2967
+ text: false,
2968
+ audio: true,
2969
+ image: false,
2970
+ video: false
2971
+ },
2972
+ output: {
2973
+ text: true,
2974
+ audio: false,
2975
+ image: false,
2976
+ video: false
2977
+ }
2978
+ },
2979
+ deprecated: false,
2980
+ isAvailable: true,
2981
+ lastUpdated: '2026-01-02',
2982
+ }
1629
2983
  };