@lov3kaizen/agentsea-costs 0.5.2 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.js CHANGED
@@ -6,17 +6,628 @@ import { Cron } from 'croner';
6
6
 
7
7
  // src/pricing/ModelPricingRegistry.ts
8
8
  var DEFAULT_PRICING = [
9
- // Anthropic Models
9
+ // ---- Anthropic Models ----
10
+ // Claude Fable 5 — most capable model. Adaptive thinking + effort param;
11
+ // no budget_tokens extended thinking, no assistant prefill;
12
+ // temperature/top_p removed at the API level.
13
+ {
14
+ model: "claude-fable-5",
15
+ provider: "anthropic",
16
+ displayName: "Claude Fable 5",
17
+ inputPricePerMillion: 10,
18
+ outputPricePerMillion: 50,
19
+ cacheReadPricePerMillion: 1,
20
+ cacheWritePricePerMillion: 12.5,
21
+ contextWindow: 1e6,
22
+ maxOutputTokens: 128e3,
23
+ currency: "USD",
24
+ capabilities: {
25
+ vision: true,
26
+ functionCalling: true,
27
+ streaming: true,
28
+ jsonMode: true,
29
+ systemMessage: true,
30
+ extendedThinking: true
31
+ }
32
+ },
33
+ // Claude Opus 4.8 — recommended default. Adaptive thinking + effort param;
34
+ // no budget_tokens extended thinking, no assistant prefill;
35
+ // temperature/top_p removed at the API level.
36
+ {
37
+ model: "claude-opus-4-8",
38
+ provider: "anthropic",
39
+ displayName: "Claude Opus 4.8",
40
+ inputPricePerMillion: 5,
41
+ outputPricePerMillion: 25,
42
+ cacheReadPricePerMillion: 0.5,
43
+ cacheWritePricePerMillion: 6.25,
44
+ contextWindow: 1e6,
45
+ maxOutputTokens: 128e3,
46
+ currency: "USD",
47
+ capabilities: {
48
+ vision: true,
49
+ functionCalling: true,
50
+ streaming: true,
51
+ jsonMode: true,
52
+ systemMessage: true,
53
+ extendedThinking: true
54
+ }
55
+ },
56
+ // Claude Opus 4.7 — previous-generation Opus. Adaptive thinking + effort
57
+ // param; no budget_tokens extended thinking, no assistant prefill;
58
+ // temperature/top_p removed at the API level.
59
+ {
60
+ model: "claude-opus-4-7",
61
+ provider: "anthropic",
62
+ displayName: "Claude Opus 4.7",
63
+ inputPricePerMillion: 5,
64
+ outputPricePerMillion: 25,
65
+ cacheReadPricePerMillion: 0.5,
66
+ cacheWritePricePerMillion: 6.25,
67
+ contextWindow: 1e6,
68
+ maxOutputTokens: 128e3,
69
+ currency: "USD",
70
+ capabilities: {
71
+ vision: true,
72
+ functionCalling: true,
73
+ streaming: true,
74
+ jsonMode: true,
75
+ systemMessage: true,
76
+ extendedThinking: true
77
+ }
78
+ },
79
+ // Claude Sonnet 4.6 — best speed/intelligence balance. Adaptive thinking +
80
+ // effort param; no budget_tokens extended thinking, no assistant prefill.
81
+ {
82
+ model: "claude-sonnet-4-6",
83
+ provider: "anthropic",
84
+ displayName: "Claude Sonnet 4.6",
85
+ inputPricePerMillion: 3,
86
+ outputPricePerMillion: 15,
87
+ cacheReadPricePerMillion: 0.3,
88
+ cacheWritePricePerMillion: 3.75,
89
+ contextWindow: 1e6,
90
+ maxOutputTokens: 64e3,
91
+ currency: "USD",
92
+ capabilities: {
93
+ vision: true,
94
+ functionCalling: true,
95
+ streaming: true,
96
+ jsonMode: true,
97
+ systemMessage: true,
98
+ extendedThinking: true
99
+ }
100
+ },
101
+ {
102
+ model: "claude-opus-4-6",
103
+ provider: "anthropic",
104
+ displayName: "Claude Opus 4.6",
105
+ inputPricePerMillion: 5,
106
+ outputPricePerMillion: 25,
107
+ cacheReadPricePerMillion: 0.5,
108
+ cacheWritePricePerMillion: 6.25,
109
+ contextWindow: 1e6,
110
+ maxOutputTokens: 128e3,
111
+ currency: "USD",
112
+ capabilities: {
113
+ vision: true,
114
+ functionCalling: true,
115
+ streaming: true,
116
+ jsonMode: true,
117
+ systemMessage: true,
118
+ extendedThinking: true
119
+ }
120
+ },
121
+ {
122
+ model: "claude-sonnet-4-5-20250929",
123
+ provider: "anthropic",
124
+ displayName: "Claude Sonnet 4.5",
125
+ inputPricePerMillion: 3,
126
+ outputPricePerMillion: 15,
127
+ cacheReadPricePerMillion: 0.3,
128
+ cacheWritePricePerMillion: 3.75,
129
+ contextWindow: 2e5,
130
+ maxOutputTokens: 16e3,
131
+ currency: "USD",
132
+ capabilities: {
133
+ vision: true,
134
+ functionCalling: true,
135
+ streaming: true,
136
+ jsonMode: true,
137
+ systemMessage: true,
138
+ extendedThinking: true
139
+ }
140
+ },
141
+ {
142
+ model: "claude-haiku-4-5-20251001",
143
+ provider: "anthropic",
144
+ displayName: "Claude Haiku 4.5",
145
+ inputPricePerMillion: 0.8,
146
+ outputPricePerMillion: 4,
147
+ cacheReadPricePerMillion: 0.08,
148
+ cacheWritePricePerMillion: 1,
149
+ contextWindow: 2e5,
150
+ maxOutputTokens: 8192,
151
+ currency: "USD",
152
+ capabilities: {
153
+ vision: true,
154
+ functionCalling: true,
155
+ streaming: true,
156
+ jsonMode: true,
157
+ systemMessage: true
158
+ }
159
+ },
160
+ {
161
+ model: "claude-opus-4-5-20251101",
162
+ provider: "anthropic",
163
+ displayName: "Claude Opus 4.5",
164
+ inputPricePerMillion: 15,
165
+ outputPricePerMillion: 75,
166
+ cacheReadPricePerMillion: 1.5,
167
+ cacheWritePricePerMillion: 18.75,
168
+ contextWindow: 2e5,
169
+ maxOutputTokens: 32e3,
170
+ currency: "USD",
171
+ capabilities: {
172
+ vision: true,
173
+ functionCalling: true,
174
+ streaming: true,
175
+ jsonMode: true,
176
+ systemMessage: true,
177
+ extendedThinking: true
178
+ }
179
+ },
180
+ /** @deprecated Retiring 2026-06-15. Use 'claude-opus-4-8' instead. */
181
+ {
182
+ model: "claude-opus-4-0-20250514",
183
+ provider: "anthropic",
184
+ displayName: "Claude Opus 4",
185
+ deprecated: true,
186
+ inputPricePerMillion: 15,
187
+ outputPricePerMillion: 75,
188
+ cacheReadPricePerMillion: 1.5,
189
+ cacheWritePricePerMillion: 18.75,
190
+ contextWindow: 2e5,
191
+ maxOutputTokens: 32e3,
192
+ currency: "USD",
193
+ capabilities: {
194
+ vision: true,
195
+ functionCalling: true,
196
+ streaming: true,
197
+ jsonMode: true,
198
+ systemMessage: true,
199
+ extendedThinking: true
200
+ }
201
+ },
202
+ /** @deprecated Retiring 2026-06-15. Use 'claude-sonnet-4-6' instead. */
203
+ {
204
+ model: "claude-sonnet-4-0-20250514",
205
+ provider: "anthropic",
206
+ displayName: "Claude Sonnet 4",
207
+ deprecated: true,
208
+ inputPricePerMillion: 3,
209
+ outputPricePerMillion: 15,
210
+ cacheReadPricePerMillion: 0.3,
211
+ cacheWritePricePerMillion: 3.75,
212
+ contextWindow: 2e5,
213
+ maxOutputTokens: 16e3,
214
+ currency: "USD",
215
+ capabilities: {
216
+ vision: true,
217
+ functionCalling: true,
218
+ streaming: true,
219
+ jsonMode: true,
220
+ systemMessage: true,
221
+ extendedThinking: true
222
+ }
223
+ },
224
+ /** @deprecated Retired 2026-02-19 (API returns 404). Use 'claude-sonnet-4-6' instead. */
225
+ {
226
+ model: "claude-3-7-sonnet-20250219",
227
+ provider: "anthropic",
228
+ displayName: "Claude 3.7 Sonnet",
229
+ deprecated: true,
230
+ inputPricePerMillion: 3,
231
+ outputPricePerMillion: 15,
232
+ cacheReadPricePerMillion: 0.3,
233
+ cacheWritePricePerMillion: 3.75,
234
+ contextWindow: 2e5,
235
+ maxOutputTokens: 128e3,
236
+ currency: "USD",
237
+ capabilities: {
238
+ vision: true,
239
+ functionCalling: true,
240
+ streaming: true,
241
+ jsonMode: true,
242
+ systemMessage: true,
243
+ extendedThinking: true,
244
+ computerUse: true
245
+ }
246
+ },
247
+ /** @deprecated Retired 2025-10-28 (API returns 404). Use 'claude-sonnet-4-6' instead. */
10
248
  {
11
249
  model: "claude-3-5-sonnet-20241022",
12
250
  provider: "anthropic",
13
251
  displayName: "Claude 3.5 Sonnet",
252
+ deprecated: true,
14
253
  inputPricePerMillion: 3,
15
254
  outputPricePerMillion: 15,
16
255
  cacheReadPricePerMillion: 0.3,
17
256
  cacheWritePricePerMillion: 3.75,
18
257
  contextWindow: 2e5,
19
- maxOutputTokens: 8192,
258
+ maxOutputTokens: 8192,
259
+ currency: "USD",
260
+ capabilities: {
261
+ vision: true,
262
+ functionCalling: true,
263
+ streaming: true,
264
+ jsonMode: true,
265
+ systemMessage: true,
266
+ computerUse: true
267
+ }
268
+ },
269
+ /** @deprecated Retired 2026-02-19 (API returns 404). Use 'claude-haiku-4-5' instead. */
270
+ {
271
+ model: "claude-3-5-haiku-20241022",
272
+ provider: "anthropic",
273
+ displayName: "Claude 3.5 Haiku",
274
+ deprecated: true,
275
+ inputPricePerMillion: 0.8,
276
+ outputPricePerMillion: 4,
277
+ cacheReadPricePerMillion: 0.08,
278
+ cacheWritePricePerMillion: 1,
279
+ contextWindow: 2e5,
280
+ maxOutputTokens: 8192,
281
+ currency: "USD",
282
+ capabilities: {
283
+ vision: true,
284
+ functionCalling: true,
285
+ streaming: true,
286
+ jsonMode: true,
287
+ systemMessage: true
288
+ }
289
+ },
290
+ /** @deprecated Retired 2026-01-05 (API returns 404). Use 'claude-opus-4-8' instead. */
291
+ {
292
+ model: "claude-3-opus-20240229",
293
+ provider: "anthropic",
294
+ displayName: "Claude 3 Opus",
295
+ deprecated: true,
296
+ inputPricePerMillion: 15,
297
+ outputPricePerMillion: 75,
298
+ cacheReadPricePerMillion: 1.5,
299
+ cacheWritePricePerMillion: 18.75,
300
+ contextWindow: 2e5,
301
+ maxOutputTokens: 4096,
302
+ currency: "USD",
303
+ capabilities: {
304
+ vision: true,
305
+ functionCalling: true,
306
+ streaming: true,
307
+ jsonMode: true,
308
+ systemMessage: true
309
+ }
310
+ },
311
+ /** @deprecated Retired 2026-04-19 (API returns 404). Use 'claude-haiku-4-5' instead. */
312
+ {
313
+ model: "claude-3-haiku-20240307",
314
+ provider: "anthropic",
315
+ displayName: "Claude 3 Haiku",
316
+ deprecated: true,
317
+ inputPricePerMillion: 0.25,
318
+ outputPricePerMillion: 1.25,
319
+ cacheReadPricePerMillion: 0.03,
320
+ cacheWritePricePerMillion: 0.3,
321
+ contextWindow: 2e5,
322
+ maxOutputTokens: 4096,
323
+ currency: "USD",
324
+ capabilities: {
325
+ vision: true,
326
+ functionCalling: true,
327
+ streaming: true,
328
+ jsonMode: true,
329
+ systemMessage: true
330
+ }
331
+ },
332
+ // ---- OpenAI Models ----
333
+ {
334
+ model: "gpt-4.1",
335
+ provider: "openai",
336
+ displayName: "GPT-4.1",
337
+ inputPricePerMillion: 2,
338
+ outputPricePerMillion: 8,
339
+ contextWindow: 1047576,
340
+ maxOutputTokens: 32768,
341
+ currency: "USD",
342
+ capabilities: {
343
+ vision: true,
344
+ functionCalling: true,
345
+ streaming: true,
346
+ jsonMode: true,
347
+ systemMessage: true
348
+ }
349
+ },
350
+ {
351
+ model: "gpt-4.1-mini",
352
+ provider: "openai",
353
+ displayName: "GPT-4.1 Mini",
354
+ inputPricePerMillion: 0.4,
355
+ outputPricePerMillion: 1.6,
356
+ contextWindow: 1047576,
357
+ maxOutputTokens: 16384,
358
+ currency: "USD",
359
+ capabilities: {
360
+ vision: true,
361
+ functionCalling: true,
362
+ streaming: true,
363
+ jsonMode: true,
364
+ systemMessage: true
365
+ }
366
+ },
367
+ {
368
+ model: "gpt-4.1-nano",
369
+ provider: "openai",
370
+ displayName: "GPT-4.1 Nano",
371
+ inputPricePerMillion: 0.1,
372
+ outputPricePerMillion: 0.4,
373
+ contextWindow: 1047576,
374
+ maxOutputTokens: 16384,
375
+ currency: "USD",
376
+ capabilities: {
377
+ vision: true,
378
+ functionCalling: true,
379
+ streaming: true,
380
+ jsonMode: true,
381
+ systemMessage: true
382
+ }
383
+ },
384
+ {
385
+ model: "gpt-5.5",
386
+ provider: "openai",
387
+ displayName: "GPT-5.5",
388
+ inputPricePerMillion: 5,
389
+ outputPricePerMillion: 30,
390
+ contextWindow: 105e4,
391
+ maxOutputTokens: 128e3,
392
+ currency: "USD",
393
+ capabilities: {
394
+ vision: true,
395
+ functionCalling: true,
396
+ streaming: true,
397
+ jsonMode: true,
398
+ systemMessage: true
399
+ }
400
+ },
401
+ {
402
+ model: "gpt-5.4-mini",
403
+ provider: "openai",
404
+ displayName: "GPT-5.4 Mini",
405
+ inputPricePerMillion: 0.75,
406
+ outputPricePerMillion: 4.5,
407
+ contextWindow: 4e5,
408
+ maxOutputTokens: 128e3,
409
+ currency: "USD",
410
+ capabilities: {
411
+ vision: true,
412
+ functionCalling: true,
413
+ streaming: true,
414
+ jsonMode: true,
415
+ systemMessage: true
416
+ }
417
+ },
418
+ {
419
+ model: "gpt-5.2",
420
+ provider: "openai",
421
+ displayName: "GPT-5.2",
422
+ inputPricePerMillion: 1.75,
423
+ outputPricePerMillion: 14,
424
+ contextWindow: 4e5,
425
+ maxOutputTokens: 128e3,
426
+ currency: "USD",
427
+ capabilities: {
428
+ vision: true,
429
+ functionCalling: true,
430
+ streaming: true,
431
+ jsonMode: true,
432
+ systemMessage: true
433
+ }
434
+ },
435
+ {
436
+ model: "gpt-5.2-pro",
437
+ provider: "openai",
438
+ displayName: "GPT-5.2 Pro",
439
+ inputPricePerMillion: 21,
440
+ outputPricePerMillion: 168,
441
+ contextWindow: 4e5,
442
+ maxOutputTokens: 128e3,
443
+ currency: "USD",
444
+ capabilities: {
445
+ vision: true,
446
+ functionCalling: true,
447
+ streaming: true,
448
+ jsonMode: true,
449
+ systemMessage: true
450
+ }
451
+ },
452
+ {
453
+ model: "gpt-5.2-codex",
454
+ provider: "openai",
455
+ displayName: "GPT-5.2 Codex",
456
+ inputPricePerMillion: 1.75,
457
+ outputPricePerMillion: 14,
458
+ contextWindow: 4e5,
459
+ maxOutputTokens: 128e3,
460
+ currency: "USD",
461
+ capabilities: {
462
+ vision: true,
463
+ functionCalling: true,
464
+ streaming: true,
465
+ jsonMode: true,
466
+ systemMessage: true
467
+ }
468
+ },
469
+ {
470
+ model: "gpt-5.1",
471
+ provider: "openai",
472
+ displayName: "GPT-5.1",
473
+ inputPricePerMillion: 1.25,
474
+ outputPricePerMillion: 10,
475
+ contextWindow: 4e5,
476
+ maxOutputTokens: 128e3,
477
+ currency: "USD",
478
+ capabilities: {
479
+ vision: true,
480
+ functionCalling: true,
481
+ streaming: true,
482
+ jsonMode: true,
483
+ systemMessage: true
484
+ }
485
+ },
486
+ {
487
+ model: "gpt-5.1-codex",
488
+ provider: "openai",
489
+ displayName: "GPT-5.1 Codex",
490
+ inputPricePerMillion: 1.25,
491
+ outputPricePerMillion: 10,
492
+ contextWindow: 4e5,
493
+ maxOutputTokens: 128e3,
494
+ currency: "USD",
495
+ capabilities: {
496
+ vision: true,
497
+ functionCalling: true,
498
+ streaming: true,
499
+ jsonMode: true,
500
+ systemMessage: true
501
+ }
502
+ },
503
+ {
504
+ model: "gpt-5.1-codex-mini",
505
+ provider: "openai",
506
+ displayName: "GPT-5.1 Codex Mini",
507
+ inputPricePerMillion: 0.25,
508
+ outputPricePerMillion: 2,
509
+ contextWindow: 4e5,
510
+ maxOutputTokens: 128e3,
511
+ currency: "USD",
512
+ capabilities: {
513
+ vision: true,
514
+ functionCalling: true,
515
+ streaming: true,
516
+ jsonMode: true,
517
+ systemMessage: true
518
+ }
519
+ },
520
+ {
521
+ model: "gpt-5.1-codex-max",
522
+ provider: "openai",
523
+ displayName: "GPT-5.1 Codex Max",
524
+ inputPricePerMillion: 1.25,
525
+ outputPricePerMillion: 10,
526
+ contextWindow: 4e5,
527
+ maxOutputTokens: 128e3,
528
+ currency: "USD",
529
+ capabilities: {
530
+ vision: true,
531
+ functionCalling: true,
532
+ streaming: true,
533
+ jsonMode: true,
534
+ systemMessage: true
535
+ }
536
+ },
537
+ {
538
+ model: "gpt-5",
539
+ provider: "openai",
540
+ displayName: "GPT-5",
541
+ inputPricePerMillion: 1.25,
542
+ outputPricePerMillion: 10,
543
+ contextWindow: 4e5,
544
+ maxOutputTokens: 128e3,
545
+ currency: "USD",
546
+ capabilities: {
547
+ vision: true,
548
+ functionCalling: true,
549
+ streaming: true,
550
+ jsonMode: true,
551
+ systemMessage: true
552
+ }
553
+ },
554
+ {
555
+ model: "gpt-5-mini",
556
+ provider: "openai",
557
+ displayName: "GPT-5 Mini",
558
+ inputPricePerMillion: 0.25,
559
+ outputPricePerMillion: 2,
560
+ contextWindow: 4e5,
561
+ maxOutputTokens: 128e3,
562
+ currency: "USD",
563
+ capabilities: {
564
+ vision: true,
565
+ functionCalling: true,
566
+ streaming: true,
567
+ jsonMode: true,
568
+ systemMessage: true
569
+ }
570
+ },
571
+ {
572
+ model: "gpt-5-nano",
573
+ provider: "openai",
574
+ displayName: "GPT-5 Nano",
575
+ inputPricePerMillion: 0.05,
576
+ outputPricePerMillion: 0.4,
577
+ contextWindow: 4e5,
578
+ maxOutputTokens: 128e3,
579
+ currency: "USD",
580
+ capabilities: {
581
+ vision: true,
582
+ functionCalling: true,
583
+ streaming: true,
584
+ jsonMode: true,
585
+ systemMessage: true
586
+ }
587
+ },
588
+ {
589
+ model: "gpt-5-pro",
590
+ provider: "openai",
591
+ displayName: "GPT-5 Pro",
592
+ inputPricePerMillion: 15,
593
+ outputPricePerMillion: 120,
594
+ contextWindow: 4e5,
595
+ maxOutputTokens: 272e3,
596
+ currency: "USD",
597
+ capabilities: {
598
+ vision: true,
599
+ functionCalling: true,
600
+ streaming: true,
601
+ jsonMode: true,
602
+ systemMessage: true
603
+ }
604
+ },
605
+ {
606
+ model: "gpt-4.5-preview",
607
+ provider: "openai",
608
+ displayName: "GPT-4.5 Preview",
609
+ inputPricePerMillion: 75,
610
+ outputPricePerMillion: 150,
611
+ contextWindow: 128e3,
612
+ maxOutputTokens: 16384,
613
+ currency: "USD",
614
+ deprecated: true,
615
+ capabilities: {
616
+ vision: true,
617
+ functionCalling: true,
618
+ streaming: true,
619
+ jsonMode: true,
620
+ systemMessage: true
621
+ }
622
+ },
623
+ {
624
+ model: "o3",
625
+ provider: "openai",
626
+ displayName: "o3",
627
+ inputPricePerMillion: 2,
628
+ outputPricePerMillion: 8,
629
+ contextWindow: 2e5,
630
+ maxOutputTokens: 1e5,
20
631
  currency: "USD",
21
632
  capabilities: {
22
633
  vision: true,
@@ -24,84 +635,97 @@ var DEFAULT_PRICING = [
24
635
  streaming: true,
25
636
  jsonMode: true,
26
637
  systemMessage: true,
27
- computerUse: true
638
+ extendedThinking: true
28
639
  }
29
640
  },
30
641
  {
31
- model: "claude-3-5-haiku-20241022",
32
- provider: "anthropic",
33
- displayName: "Claude 3.5 Haiku",
34
- inputPricePerMillion: 0.8,
35
- outputPricePerMillion: 4,
36
- cacheReadPricePerMillion: 0.08,
37
- cacheWritePricePerMillion: 1,
642
+ model: "o3-pro",
643
+ provider: "openai",
644
+ displayName: "o3 Pro",
645
+ inputPricePerMillion: 20,
646
+ outputPricePerMillion: 80,
38
647
  contextWindow: 2e5,
39
- maxOutputTokens: 8192,
648
+ maxOutputTokens: 1e5,
40
649
  currency: "USD",
41
650
  capabilities: {
42
651
  vision: true,
43
652
  functionCalling: true,
44
653
  streaming: true,
45
654
  jsonMode: true,
46
- systemMessage: true
655
+ systemMessage: true,
656
+ extendedThinking: true
47
657
  }
48
658
  },
49
659
  {
50
- model: "claude-3-opus-20240229",
51
- provider: "anthropic",
52
- displayName: "Claude 3 Opus",
53
- inputPricePerMillion: 15,
54
- outputPricePerMillion: 75,
55
- cacheReadPricePerMillion: 1.5,
56
- cacheWritePricePerMillion: 18.75,
660
+ model: "o4-mini",
661
+ provider: "openai",
662
+ displayName: "o4 Mini",
663
+ inputPricePerMillion: 1.1,
664
+ outputPricePerMillion: 4.4,
57
665
  contextWindow: 2e5,
58
- maxOutputTokens: 4096,
666
+ maxOutputTokens: 1e5,
59
667
  currency: "USD",
60
668
  capabilities: {
61
669
  vision: true,
62
670
  functionCalling: true,
63
671
  streaming: true,
64
672
  jsonMode: true,
65
- systemMessage: true
673
+ systemMessage: true,
674
+ extendedThinking: true
66
675
  }
67
676
  },
68
677
  {
69
- model: "claude-3-sonnet-20240229",
70
- provider: "anthropic",
71
- displayName: "Claude 3 Sonnet",
72
- inputPricePerMillion: 3,
73
- outputPricePerMillion: 15,
678
+ model: "o3-deep-research",
679
+ provider: "openai",
680
+ displayName: "o3 Deep Research",
681
+ inputPricePerMillion: 10,
682
+ outputPricePerMillion: 40,
74
683
  contextWindow: 2e5,
75
- maxOutputTokens: 4096,
684
+ maxOutputTokens: 1e5,
76
685
  currency: "USD",
77
686
  capabilities: {
78
687
  vision: true,
79
688
  functionCalling: true,
80
689
  streaming: true,
81
690
  jsonMode: true,
82
- systemMessage: true
691
+ systemMessage: true,
692
+ extendedThinking: true
83
693
  }
84
694
  },
85
695
  {
86
- model: "claude-3-haiku-20240307",
87
- provider: "anthropic",
88
- displayName: "Claude 3 Haiku",
89
- inputPricePerMillion: 0.25,
90
- outputPricePerMillion: 1.25,
91
- cacheReadPricePerMillion: 0.03,
92
- cacheWritePricePerMillion: 0.3,
696
+ model: "o4-mini-deep-research",
697
+ provider: "openai",
698
+ displayName: "o4 Mini Deep Research",
699
+ inputPricePerMillion: 2,
700
+ outputPricePerMillion: 8,
93
701
  contextWindow: 2e5,
94
- maxOutputTokens: 4096,
702
+ maxOutputTokens: 1e5,
95
703
  currency: "USD",
96
704
  capabilities: {
97
705
  vision: true,
98
706
  functionCalling: true,
99
707
  streaming: true,
100
708
  jsonMode: true,
101
- systemMessage: true
709
+ systemMessage: true,
710
+ extendedThinking: true
711
+ }
712
+ },
713
+ {
714
+ model: "o3-mini",
715
+ provider: "openai",
716
+ displayName: "o3 Mini",
717
+ inputPricePerMillion: 1.1,
718
+ outputPricePerMillion: 4.4,
719
+ contextWindow: 2e5,
720
+ maxOutputTokens: 1e5,
721
+ currency: "USD",
722
+ capabilities: {
723
+ functionCalling: true,
724
+ streaming: true,
725
+ jsonMode: true,
726
+ extendedThinking: true
102
727
  }
103
728
  },
104
- // OpenAI Models
105
729
  {
106
730
  model: "gpt-4o",
107
731
  provider: "openai",
@@ -136,6 +760,38 @@ var DEFAULT_PRICING = [
136
760
  systemMessage: true
137
761
  }
138
762
  },
763
+ {
764
+ model: "o1",
765
+ provider: "openai",
766
+ displayName: "o1",
767
+ inputPricePerMillion: 15,
768
+ outputPricePerMillion: 60,
769
+ contextWindow: 2e5,
770
+ maxOutputTokens: 1e5,
771
+ currency: "USD",
772
+ capabilities: {
773
+ vision: true,
774
+ functionCalling: true,
775
+ streaming: true,
776
+ jsonMode: true,
777
+ extendedThinking: true
778
+ }
779
+ },
780
+ {
781
+ model: "o1-mini",
782
+ provider: "openai",
783
+ displayName: "o1 Mini",
784
+ inputPricePerMillion: 3,
785
+ outputPricePerMillion: 12,
786
+ contextWindow: 128e3,
787
+ maxOutputTokens: 65536,
788
+ currency: "USD",
789
+ deprecated: true,
790
+ capabilities: {
791
+ streaming: true,
792
+ extendedThinking: true
793
+ }
794
+ },
139
795
  {
140
796
  model: "gpt-4-turbo",
141
797
  provider: "openai",
@@ -162,6 +818,7 @@ var DEFAULT_PRICING = [
162
818
  contextWindow: 16385,
163
819
  maxOutputTokens: 4096,
164
820
  currency: "USD",
821
+ deprecated: true,
165
822
  capabilities: {
166
823
  functionCalling: true,
167
824
  streaming: true,
@@ -169,42 +826,84 @@ var DEFAULT_PRICING = [
169
826
  systemMessage: true
170
827
  }
171
828
  },
829
+ // ---- Google Models ----
172
830
  {
173
- model: "o1-preview",
174
- provider: "openai",
175
- displayName: "o1 Preview",
176
- inputPricePerMillion: 15,
177
- outputPricePerMillion: 60,
178
- contextWindow: 128e3,
179
- maxOutputTokens: 32768,
831
+ model: "gemini-3.1-pro-preview",
832
+ provider: "google",
833
+ displayName: "Gemini 3.1 Pro Preview",
834
+ inputPricePerMillion: 2,
835
+ outputPricePerMillion: 12,
836
+ contextWindow: 1048576,
837
+ maxOutputTokens: 65536,
838
+ currency: "USD",
839
+ capabilities: {
840
+ vision: true,
841
+ functionCalling: true,
842
+ streaming: true,
843
+ jsonMode: true,
844
+ systemMessage: true
845
+ }
846
+ },
847
+ {
848
+ model: "gemini-3.5-flash",
849
+ provider: "google",
850
+ displayName: "Gemini 3.5 Flash",
851
+ inputPricePerMillion: 1.5,
852
+ outputPricePerMillion: 9,
853
+ contextWindow: 1048576,
854
+ maxOutputTokens: 65536,
855
+ currency: "USD",
856
+ capabilities: {
857
+ vision: true,
858
+ functionCalling: true,
859
+ streaming: true,
860
+ jsonMode: true,
861
+ systemMessage: true
862
+ }
863
+ },
864
+ {
865
+ model: "gemini-2.5-pro",
866
+ provider: "google",
867
+ displayName: "Gemini 2.5 Pro",
868
+ inputPricePerMillion: 1.25,
869
+ outputPricePerMillion: 10,
870
+ contextWindow: 1048576,
871
+ maxOutputTokens: 65536,
180
872
  currency: "USD",
181
873
  capabilities: {
874
+ vision: true,
875
+ functionCalling: true,
182
876
  streaming: true,
877
+ jsonMode: true,
878
+ systemMessage: true,
183
879
  extendedThinking: true
184
880
  }
185
881
  },
186
882
  {
187
- model: "o1-mini",
188
- provider: "openai",
189
- displayName: "o1 Mini",
190
- inputPricePerMillion: 3,
191
- outputPricePerMillion: 12,
192
- contextWindow: 128e3,
883
+ model: "gemini-2.5-flash",
884
+ provider: "google",
885
+ displayName: "Gemini 2.5 Flash",
886
+ inputPricePerMillion: 0.15,
887
+ outputPricePerMillion: 0.6,
888
+ contextWindow: 1048576,
193
889
  maxOutputTokens: 65536,
194
890
  currency: "USD",
195
891
  capabilities: {
892
+ vision: true,
893
+ functionCalling: true,
196
894
  streaming: true,
895
+ jsonMode: true,
896
+ systemMessage: true,
197
897
  extendedThinking: true
198
898
  }
199
899
  },
200
- // Google Models
201
900
  {
202
- model: "gemini-1.5-pro",
901
+ model: "gemini-2.0-flash",
203
902
  provider: "google",
204
- displayName: "Gemini 1.5 Pro",
205
- inputPricePerMillion: 1.25,
206
- outputPricePerMillion: 5,
207
- contextWindow: 2e6,
903
+ displayName: "Gemini 2.0 Flash",
904
+ inputPricePerMillion: 0.1,
905
+ outputPricePerMillion: 0.4,
906
+ contextWindow: 1048576,
208
907
  maxOutputTokens: 8192,
209
908
  currency: "USD",
210
909
  capabilities: {
@@ -216,12 +915,12 @@ var DEFAULT_PRICING = [
216
915
  }
217
916
  },
218
917
  {
219
- model: "gemini-1.5-flash",
918
+ model: "gemini-1.5-pro",
220
919
  provider: "google",
221
- displayName: "Gemini 1.5 Flash",
222
- inputPricePerMillion: 0.075,
223
- outputPricePerMillion: 0.3,
224
- contextWindow: 1e6,
920
+ displayName: "Gemini 1.5 Pro",
921
+ inputPricePerMillion: 1.25,
922
+ outputPricePerMillion: 5,
923
+ contextWindow: 2097152,
225
924
  maxOutputTokens: 8192,
226
925
  currency: "USD",
227
926
  capabilities: {
@@ -233,12 +932,12 @@ var DEFAULT_PRICING = [
233
932
  }
234
933
  },
235
934
  {
236
- model: "gemini-2.0-flash-exp",
935
+ model: "gemini-1.5-flash",
237
936
  provider: "google",
238
- displayName: "Gemini 2.0 Flash",
239
- inputPricePerMillion: 0,
240
- outputPricePerMillion: 0,
241
- contextWindow: 1e6,
937
+ displayName: "Gemini 1.5 Flash",
938
+ inputPricePerMillion: 0.075,
939
+ outputPricePerMillion: 0.3,
940
+ contextWindow: 1048576,
242
941
  maxOutputTokens: 8192,
243
942
  currency: "USD",
244
943
  capabilities: {
@@ -249,7 +948,7 @@ var DEFAULT_PRICING = [
249
948
  systemMessage: true
250
949
  }
251
950
  },
252
- // Mistral Models
951
+ // ---- Mistral Models ----
253
952
  {
254
953
  model: "mistral-large-latest",
255
954
  provider: "mistral",
@@ -260,6 +959,7 @@ var DEFAULT_PRICING = [
260
959
  maxOutputTokens: 4096,
261
960
  currency: "USD",
262
961
  capabilities: {
962
+ vision: true,
263
963
  functionCalling: true,
264
964
  streaming: true,
265
965
  jsonMode: true,
@@ -270,9 +970,9 @@ var DEFAULT_PRICING = [
270
970
  model: "mistral-small-latest",
271
971
  provider: "mistral",
272
972
  displayName: "Mistral Small",
273
- inputPricePerMillion: 0.2,
274
- outputPricePerMillion: 0.6,
275
- contextWindow: 32e3,
973
+ inputPricePerMillion: 0.1,
974
+ outputPricePerMillion: 0.3,
975
+ contextWindow: 128e3,
276
976
  maxOutputTokens: 4096,
277
977
  currency: "USD",
278
978
  capabilities: {
@@ -286,9 +986,9 @@ var DEFAULT_PRICING = [
286
986
  model: "codestral-latest",
287
987
  provider: "mistral",
288
988
  displayName: "Codestral",
289
- inputPricePerMillion: 0.2,
290
- outputPricePerMillion: 0.6,
291
- contextWindow: 32e3,
989
+ inputPricePerMillion: 0.3,
990
+ outputPricePerMillion: 0.9,
991
+ contextWindow: 256e3,
292
992
  maxOutputTokens: 4096,
293
993
  currency: "USD",
294
994
  capabilities: {
@@ -296,7 +996,78 @@ var DEFAULT_PRICING = [
296
996
  systemMessage: true
297
997
  }
298
998
  },
299
- // Cohere Models
999
+ // ---- DeepSeek Models ----
1000
+ {
1001
+ model: "deepseek-chat",
1002
+ provider: "deepseek",
1003
+ displayName: "DeepSeek V3.2",
1004
+ inputPricePerMillion: 0.28,
1005
+ outputPricePerMillion: 0.42,
1006
+ cacheReadPricePerMillion: 0.028,
1007
+ contextWindow: 128e3,
1008
+ maxOutputTokens: 8192,
1009
+ currency: "USD",
1010
+ capabilities: {
1011
+ functionCalling: true,
1012
+ streaming: true,
1013
+ jsonMode: true,
1014
+ systemMessage: true
1015
+ }
1016
+ },
1017
+ {
1018
+ model: "deepseek-reasoner",
1019
+ provider: "deepseek",
1020
+ displayName: "DeepSeek R1",
1021
+ inputPricePerMillion: 0.28,
1022
+ outputPricePerMillion: 0.42,
1023
+ cacheReadPricePerMillion: 0.028,
1024
+ contextWindow: 128e3,
1025
+ maxOutputTokens: 65536,
1026
+ currency: "USD",
1027
+ capabilities: {
1028
+ functionCalling: true,
1029
+ streaming: true,
1030
+ jsonMode: true,
1031
+ systemMessage: true,
1032
+ extendedThinking: true
1033
+ }
1034
+ },
1035
+ // ---- xAI (Grok) Models ----
1036
+ {
1037
+ model: "grok-3",
1038
+ provider: "xai",
1039
+ displayName: "Grok 3",
1040
+ inputPricePerMillion: 3,
1041
+ outputPricePerMillion: 15,
1042
+ contextWindow: 131072,
1043
+ maxOutputTokens: 16384,
1044
+ currency: "USD",
1045
+ capabilities: {
1046
+ vision: true,
1047
+ functionCalling: true,
1048
+ streaming: true,
1049
+ jsonMode: true,
1050
+ systemMessage: true
1051
+ }
1052
+ },
1053
+ {
1054
+ model: "grok-3-mini",
1055
+ provider: "xai",
1056
+ displayName: "Grok 3 Mini",
1057
+ inputPricePerMillion: 0.3,
1058
+ outputPricePerMillion: 0.5,
1059
+ contextWindow: 131072,
1060
+ maxOutputTokens: 16384,
1061
+ currency: "USD",
1062
+ capabilities: {
1063
+ functionCalling: true,
1064
+ streaming: true,
1065
+ jsonMode: true,
1066
+ systemMessage: true,
1067
+ extendedThinking: true
1068
+ }
1069
+ },
1070
+ // ---- Cohere Models ----
300
1071
  {
301
1072
  model: "command-r-plus",
302
1073
  provider: "cohere",
@@ -617,6 +1388,8 @@ var PROVIDER_STRATEGIES = {
617
1388
  bedrock: { encoding: "approximate", charsPerToken: 3.5 },
618
1389
  cohere: { encoding: "approximate", charsPerToken: 4 },
619
1390
  mistral: { encoding: "approximate", charsPerToken: 4 },
1391
+ deepseek: { encoding: "approximate", charsPerToken: 4 },
1392
+ xai: { encoding: "approximate", charsPerToken: 4 },
620
1393
  replicate: { encoding: "approximate", charsPerToken: 4 },
621
1394
  custom: { encoding: "approximate", charsPerToken: 4 }
622
1395
  };