@everworker/oneringai 0.4.5 → 0.4.7

This diff shows the changes between publicly available versions of this package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
@@ -24,18 +24,30 @@ function isVendor(value) {
24
24
  // src/domain/entities/Model.ts
25
25
  var LLM_MODELS = {
26
26
  [Vendor.OpenAI]: {
27
+ // GPT-5.3 Series
28
+ GPT_5_3_CODEX: "gpt-5.3-codex",
29
+ GPT_5_3_CHAT: "gpt-5.3-chat-latest",
27
30
  // GPT-5.2 Series (Current Flagship)
28
31
  GPT_5_2: "gpt-5.2",
29
32
  GPT_5_2_PRO: "gpt-5.2-pro",
33
+ GPT_5_2_CODEX: "gpt-5.2-codex",
34
+ GPT_5_2_CHAT: "gpt-5.2-chat-latest",
35
+ // GPT-5.1 Series
36
+ GPT_5_1: "gpt-5.1",
37
+ GPT_5_1_CODEX: "gpt-5.1-codex",
38
+ GPT_5_1_CODEX_MAX: "gpt-5.1-codex-max",
39
+ GPT_5_1_CODEX_MINI: "gpt-5.1-codex-mini",
40
+ GPT_5_1_CHAT: "gpt-5.1-chat-latest",
30
41
  // GPT-5 Series
31
42
  GPT_5: "gpt-5",
32
43
  GPT_5_MINI: "gpt-5-mini",
33
44
  GPT_5_NANO: "gpt-5-nano",
45
+ GPT_5_CHAT: "gpt-5-chat-latest",
34
46
  // GPT-4.1 Series
35
47
  GPT_4_1: "gpt-4.1",
36
48
  GPT_4_1_MINI: "gpt-4.1-mini",
37
49
  GPT_4_1_NANO: "gpt-4.1-nano",
38
- // GPT-4o Series (Legacy, Audio Capable)
50
+ // GPT-4o Series (Legacy)
39
51
  GPT_4O: "gpt-4o",
40
52
  GPT_4O_MINI: "gpt-4o-mini",
41
53
  // Reasoning Models (o-series)
@@ -43,18 +55,26 @@ var LLM_MODELS = {
43
55
  O1: "o1"
44
56
  },
45
57
  [Vendor.Anthropic]: {
46
- // Claude 4.5 Series (Current)
58
+ // Claude 4.6 Series (Current)
59
+ CLAUDE_OPUS_4_6: "claude-opus-4-6",
60
+ CLAUDE_SONNET_4_6: "claude-sonnet-4-6",
61
+ // Claude 4.5 Series
47
62
  CLAUDE_OPUS_4_5: "claude-opus-4-5-20251101",
48
63
  CLAUDE_SONNET_4_5: "claude-sonnet-4-5-20250929",
49
64
  CLAUDE_HAIKU_4_5: "claude-haiku-4-5-20251001",
50
65
  // Claude 4.x Legacy
51
66
  CLAUDE_OPUS_4_1: "claude-opus-4-1-20250805",
67
+ CLAUDE_OPUS_4: "claude-opus-4-20250514",
52
68
  CLAUDE_SONNET_4: "claude-sonnet-4-20250514",
53
69
  CLAUDE_SONNET_3_7: "claude-3-7-sonnet-20250219",
54
- // Claude 3.x Legacy
70
+ // Claude 3.x Legacy (Deprecated)
55
71
  CLAUDE_HAIKU_3: "claude-3-haiku-20240307"
56
72
  },
57
73
  [Vendor.Google]: {
74
+ // Gemini 3.1 Series (Preview)
75
+ GEMINI_3_1_PRO_PREVIEW: "gemini-3.1-pro-preview",
76
+ GEMINI_3_1_FLASH_LITE_PREVIEW: "gemini-3.1-flash-lite-preview",
77
+ GEMINI_3_1_FLASH_IMAGE_PREVIEW: "gemini-3.1-flash-image-preview",
58
78
  // Gemini 3 Series (Preview)
59
79
  GEMINI_3_FLASH_PREVIEW: "gemini-3-flash-preview",
60
80
  GEMINI_3_PRO_PREVIEW: "gemini-3-pro-preview",
@@ -86,12 +106,91 @@ var MODEL_REGISTRY = {
86
106
  // ============================================================================
87
107
  // OpenAI Models (Verified from platform.openai.com)
88
108
  // ============================================================================
109
+ // GPT-5.3 Series
110
+ "gpt-5.3-codex": {
111
+ name: "gpt-5.3-codex",
112
+ provider: Vendor.OpenAI,
113
+ description: "Latest codex model for coding and agentic tasks. Reasoning.effort: low, medium, high, xhigh",
114
+ isActive: true,
115
+ releaseDate: "2026-02-01",
116
+ knowledgeCutoff: "2025-08-31",
117
+ features: {
118
+ reasoning: true,
119
+ streaming: true,
120
+ structuredOutput: true,
121
+ functionCalling: true,
122
+ fineTuning: false,
123
+ predictedOutputs: false,
124
+ realtime: false,
125
+ vision: true,
126
+ audio: false,
127
+ video: false,
128
+ batchAPI: true,
129
+ promptCaching: true,
130
+ parameters: {
131
+ temperature: false,
132
+ topP: false,
133
+ frequencyPenalty: false,
134
+ presencePenalty: false
135
+ },
136
+ input: {
137
+ tokens: 4e5,
138
+ text: true,
139
+ image: true,
140
+ cpm: 1.75,
141
+ cpmCached: 0.175
142
+ },
143
+ output: {
144
+ tokens: 128e3,
145
+ text: true,
146
+ cpm: 14
147
+ }
148
+ }
149
+ },
150
+ "gpt-5.3-chat-latest": {
151
+ name: "gpt-5.3-chat-latest",
152
+ provider: Vendor.OpenAI,
153
+ description: "Latest GPT-5.3 chat model for general-purpose use",
154
+ isActive: true,
155
+ releaseDate: "2026-02-01",
156
+ knowledgeCutoff: "2025-08-31",
157
+ features: {
158
+ reasoning: false,
159
+ streaming: true,
160
+ structuredOutput: true,
161
+ functionCalling: true,
162
+ fineTuning: false,
163
+ predictedOutputs: false,
164
+ realtime: false,
165
+ vision: true,
166
+ audio: false,
167
+ video: false,
168
+ batchAPI: true,
169
+ promptCaching: true,
170
+ parameters: {
171
+ temperature: false
172
+ },
173
+ input: {
174
+ tokens: 128e3,
175
+ text: true,
176
+ image: true,
177
+ cpm: 1.75,
178
+ cpmCached: 0.175
179
+ },
180
+ output: {
181
+ tokens: 16e3,
182
+ text: true,
183
+ cpm: 14
184
+ }
185
+ }
186
+ },
89
187
  // GPT-5.2 Series (Current Flagship)
90
188
  "gpt-5.2": {
91
189
  name: "gpt-5.2",
92
190
  provider: Vendor.OpenAI,
93
191
  description: "Flagship model for coding and agentic tasks. Reasoning.effort: none, low, medium, high, xhigh",
94
192
  isActive: true,
193
+ preferred: true,
95
194
  releaseDate: "2025-12-01",
96
195
  knowledgeCutoff: "2025-08-31",
97
196
  features: {
@@ -117,7 +216,8 @@ var MODEL_REGISTRY = {
117
216
  tokens: 4e5,
118
217
  text: true,
119
218
  image: true,
120
- cpm: 1.75
219
+ cpm: 1.75,
220
+ cpmCached: 0.175
121
221
  },
122
222
  output: {
123
223
  tokens: 128e3,
@@ -136,7 +236,7 @@ var MODEL_REGISTRY = {
136
236
  features: {
137
237
  reasoning: true,
138
238
  streaming: true,
139
- structuredOutput: true,
239
+ structuredOutput: false,
140
240
  functionCalling: true,
141
241
  fineTuning: false,
142
242
  predictedOutputs: false,
@@ -165,6 +265,276 @@ var MODEL_REGISTRY = {
165
265
  }
166
266
  }
167
267
  },
268
+ "gpt-5.2-codex": {
269
+ name: "gpt-5.2-codex",
270
+ provider: Vendor.OpenAI,
271
+ description: "GPT-5.2 codex for coding and agentic tasks. Reasoning.effort: low, medium, high, xhigh",
272
+ isActive: true,
273
+ preferred: true,
274
+ releaseDate: "2025-12-01",
275
+ knowledgeCutoff: "2025-08-31",
276
+ features: {
277
+ reasoning: true,
278
+ streaming: true,
279
+ structuredOutput: true,
280
+ functionCalling: true,
281
+ fineTuning: false,
282
+ predictedOutputs: false,
283
+ realtime: false,
284
+ vision: true,
285
+ audio: false,
286
+ video: false,
287
+ batchAPI: true,
288
+ promptCaching: true,
289
+ parameters: {
290
+ temperature: false,
291
+ topP: false,
292
+ frequencyPenalty: false,
293
+ presencePenalty: false
294
+ },
295
+ input: {
296
+ tokens: 4e5,
297
+ text: true,
298
+ image: true,
299
+ cpm: 1.75,
300
+ cpmCached: 0.175
301
+ },
302
+ output: {
303
+ tokens: 128e3,
304
+ text: true,
305
+ cpm: 14
306
+ }
307
+ }
308
+ },
309
+ "gpt-5.2-chat-latest": {
310
+ name: "gpt-5.2-chat-latest",
311
+ provider: Vendor.OpenAI,
312
+ description: "GPT-5.2 chat model for general-purpose use",
313
+ isActive: true,
314
+ releaseDate: "2025-12-01",
315
+ knowledgeCutoff: "2025-08-31",
316
+ features: {
317
+ reasoning: false,
318
+ streaming: true,
319
+ structuredOutput: true,
320
+ functionCalling: true,
321
+ fineTuning: false,
322
+ predictedOutputs: false,
323
+ realtime: false,
324
+ vision: true,
325
+ audio: false,
326
+ video: false,
327
+ batchAPI: true,
328
+ promptCaching: true,
329
+ input: {
330
+ tokens: 128e3,
331
+ text: true,
332
+ image: true,
333
+ cpm: 1.75,
334
+ cpmCached: 0.175
335
+ },
336
+ output: {
337
+ tokens: 16e3,
338
+ text: true,
339
+ cpm: 14
340
+ }
341
+ }
342
+ },
343
+ // GPT-5.1 Series
344
+ "gpt-5.1": {
345
+ name: "gpt-5.1",
346
+ provider: Vendor.OpenAI,
347
+ description: "Intelligent reasoning model for coding and agentic tasks. Reasoning.effort: none, low, medium, high",
348
+ isActive: true,
349
+ releaseDate: "2025-10-01",
350
+ knowledgeCutoff: "2024-09-30",
351
+ features: {
352
+ reasoning: true,
353
+ streaming: true,
354
+ structuredOutput: true,
355
+ functionCalling: true,
356
+ fineTuning: false,
357
+ predictedOutputs: false,
358
+ realtime: false,
359
+ vision: true,
360
+ audio: false,
361
+ video: false,
362
+ batchAPI: true,
363
+ promptCaching: true,
364
+ parameters: {
365
+ temperature: false,
366
+ topP: false,
367
+ frequencyPenalty: false,
368
+ presencePenalty: false
369
+ },
370
+ input: {
371
+ tokens: 4e5,
372
+ text: true,
373
+ image: true,
374
+ cpm: 1.25,
375
+ cpmCached: 0.125
376
+ },
377
+ output: {
378
+ tokens: 128e3,
379
+ text: true,
380
+ cpm: 10
381
+ }
382
+ }
383
+ },
384
+ "gpt-5.1-codex": {
385
+ name: "gpt-5.1-codex",
386
+ provider: Vendor.OpenAI,
387
+ description: "GPT-5.1 codex for coding and agentic tasks with reasoning",
388
+ isActive: true,
389
+ releaseDate: "2025-10-01",
390
+ knowledgeCutoff: "2024-09-30",
391
+ features: {
392
+ reasoning: true,
393
+ streaming: true,
394
+ structuredOutput: true,
395
+ functionCalling: true,
396
+ fineTuning: false,
397
+ predictedOutputs: false,
398
+ realtime: false,
399
+ vision: true,
400
+ audio: false,
401
+ video: false,
402
+ batchAPI: true,
403
+ promptCaching: true,
404
+ parameters: {
405
+ temperature: false,
406
+ topP: false,
407
+ frequencyPenalty: false,
408
+ presencePenalty: false
409
+ },
410
+ input: {
411
+ tokens: 4e5,
412
+ text: true,
413
+ image: true,
414
+ cpm: 1.25,
415
+ cpmCached: 0.125
416
+ },
417
+ output: {
418
+ tokens: 128e3,
419
+ text: true,
420
+ cpm: 10
421
+ }
422
+ }
423
+ },
424
+ "gpt-5.1-codex-max": {
425
+ name: "gpt-5.1-codex-max",
426
+ provider: Vendor.OpenAI,
427
+ description: "GPT-5.1 codex max for maximum reasoning depth on coding tasks",
428
+ isActive: true,
429
+ releaseDate: "2025-10-01",
430
+ knowledgeCutoff: "2024-09-30",
431
+ features: {
432
+ reasoning: true,
433
+ streaming: true,
434
+ structuredOutput: true,
435
+ functionCalling: true,
436
+ fineTuning: false,
437
+ predictedOutputs: false,
438
+ realtime: false,
439
+ vision: true,
440
+ audio: false,
441
+ video: false,
442
+ batchAPI: true,
443
+ promptCaching: true,
444
+ parameters: {
445
+ temperature: false,
446
+ topP: false,
447
+ frequencyPenalty: false,
448
+ presencePenalty: false
449
+ },
450
+ input: {
451
+ tokens: 4e5,
452
+ text: true,
453
+ image: true,
454
+ cpm: 1.25,
455
+ cpmCached: 0.125
456
+ },
457
+ output: {
458
+ tokens: 128e3,
459
+ text: true,
460
+ cpm: 10
461
+ }
462
+ }
463
+ },
464
+ "gpt-5.1-codex-mini": {
465
+ name: "gpt-5.1-codex-mini",
466
+ provider: Vendor.OpenAI,
467
+ description: "GPT-5.1 codex mini for cost-efficient coding tasks",
468
+ isActive: true,
469
+ releaseDate: "2025-10-01",
470
+ knowledgeCutoff: "2024-09-30",
471
+ features: {
472
+ reasoning: true,
473
+ streaming: true,
474
+ structuredOutput: true,
475
+ functionCalling: true,
476
+ fineTuning: false,
477
+ predictedOutputs: false,
478
+ realtime: false,
479
+ vision: true,
480
+ audio: false,
481
+ video: false,
482
+ batchAPI: true,
483
+ promptCaching: true,
484
+ parameters: {
485
+ temperature: false,
486
+ topP: false,
487
+ frequencyPenalty: false,
488
+ presencePenalty: false
489
+ },
490
+ input: {
491
+ tokens: 4e5,
492
+ text: true,
493
+ image: true,
494
+ cpm: 0.25,
495
+ cpmCached: 0.025
496
+ },
497
+ output: {
498
+ tokens: 128e3,
499
+ text: true,
500
+ cpm: 2
501
+ }
502
+ }
503
+ },
504
+ "gpt-5.1-chat-latest": {
505
+ name: "gpt-5.1-chat-latest",
506
+ provider: Vendor.OpenAI,
507
+ description: "GPT-5.1 chat model for general-purpose use",
508
+ isActive: true,
509
+ releaseDate: "2025-10-01",
510
+ knowledgeCutoff: "2024-09-30",
511
+ features: {
512
+ reasoning: false,
513
+ streaming: true,
514
+ structuredOutput: true,
515
+ functionCalling: true,
516
+ fineTuning: false,
517
+ predictedOutputs: false,
518
+ realtime: false,
519
+ vision: true,
520
+ audio: false,
521
+ video: false,
522
+ batchAPI: true,
523
+ promptCaching: true,
524
+ input: {
525
+ tokens: 128e3,
526
+ text: true,
527
+ image: true,
528
+ cpm: 1.25,
529
+ cpmCached: 0.125
530
+ },
531
+ output: {
532
+ tokens: 16e3,
533
+ text: true,
534
+ cpm: 10
535
+ }
536
+ }
537
+ },
168
538
  // GPT-5 Series
169
539
  "gpt-5": {
170
540
  name: "gpt-5",
@@ -196,7 +566,8 @@ var MODEL_REGISTRY = {
196
566
  tokens: 4e5,
197
567
  text: true,
198
568
  image: true,
199
- cpm: 1.25
569
+ cpm: 1.25,
570
+ cpmCached: 0.125
200
571
  },
201
572
  output: {
202
573
  tokens: 128e3,
@@ -235,7 +606,8 @@ var MODEL_REGISTRY = {
235
606
  tokens: 4e5,
236
607
  text: true,
237
608
  image: true,
238
- cpm: 0.25
609
+ cpm: 0.25,
610
+ cpmCached: 0.025
239
611
  },
240
612
  output: {
241
613
  tokens: 128e3,
@@ -274,7 +646,8 @@ var MODEL_REGISTRY = {
274
646
  tokens: 4e5,
275
647
  text: true,
276
648
  image: true,
277
- cpm: 0.05
649
+ cpm: 0.05,
650
+ cpmCached: 5e-3
278
651
  },
279
652
  output: {
280
653
  tokens: 128e3,
@@ -283,6 +656,40 @@ var MODEL_REGISTRY = {
283
656
  }
284
657
  }
285
658
  },
659
+ "gpt-5-chat-latest": {
660
+ name: "gpt-5-chat-latest",
661
+ provider: Vendor.OpenAI,
662
+ description: "GPT-5 chat model for general-purpose use",
663
+ isActive: true,
664
+ releaseDate: "2025-08-01",
665
+ knowledgeCutoff: "2024-09-30",
666
+ features: {
667
+ reasoning: false,
668
+ streaming: true,
669
+ structuredOutput: true,
670
+ functionCalling: true,
671
+ fineTuning: false,
672
+ predictedOutputs: false,
673
+ realtime: false,
674
+ vision: true,
675
+ audio: false,
676
+ video: false,
677
+ batchAPI: true,
678
+ promptCaching: true,
679
+ input: {
680
+ tokens: 128e3,
681
+ text: true,
682
+ image: true,
683
+ cpm: 1.25,
684
+ cpmCached: 0.125
685
+ },
686
+ output: {
687
+ tokens: 16e3,
688
+ text: true,
689
+ cpm: 10
690
+ }
691
+ }
692
+ },
286
693
  // GPT-4.1 Series
287
694
  "gpt-4.1": {
288
695
  name: "gpt-4.1",
@@ -290,7 +697,7 @@ var MODEL_REGISTRY = {
290
697
  description: "GPT-4.1 specialized for coding with 1M token context window",
291
698
  isActive: true,
292
699
  releaseDate: "2025-04-14",
293
- knowledgeCutoff: "2025-04-01",
700
+ knowledgeCutoff: "2024-06-01",
294
701
  features: {
295
702
  reasoning: false,
296
703
  streaming: true,
@@ -308,7 +715,8 @@ var MODEL_REGISTRY = {
308
715
  tokens: 1e6,
309
716
  text: true,
310
717
  image: true,
311
- cpm: 2
718
+ cpm: 2,
719
+ cpmCached: 0.5
312
720
  },
313
721
  output: {
314
722
  tokens: 32768,
@@ -323,7 +731,7 @@ var MODEL_REGISTRY = {
323
731
  description: "Efficient GPT-4.1 model, beats GPT-4o in many benchmarks at 83% lower cost",
324
732
  isActive: true,
325
733
  releaseDate: "2025-04-14",
326
- knowledgeCutoff: "2025-04-01",
734
+ knowledgeCutoff: "2024-06-01",
327
735
  features: {
328
736
  reasoning: false,
329
737
  streaming: true,
@@ -341,7 +749,8 @@ var MODEL_REGISTRY = {
341
749
  tokens: 1e6,
342
750
  text: true,
343
751
  image: true,
344
- cpm: 0.4
752
+ cpm: 0.4,
753
+ cpmCached: 0.1
345
754
  },
346
755
  output: {
347
756
  tokens: 16384,
@@ -356,7 +765,7 @@ var MODEL_REGISTRY = {
356
765
  description: "Fastest and cheapest model with 1M context. 80.1% MMLU, ideal for classification/autocompletion",
357
766
  isActive: true,
358
767
  releaseDate: "2025-04-14",
359
- knowledgeCutoff: "2025-04-01",
768
+ knowledgeCutoff: "2024-06-01",
360
769
  features: {
361
770
  reasoning: false,
362
771
  streaming: true,
@@ -374,7 +783,8 @@ var MODEL_REGISTRY = {
374
783
  tokens: 1e6,
375
784
  text: true,
376
785
  image: true,
377
- cpm: 0.1
786
+ cpm: 0.1,
787
+ cpmCached: 0.025
378
788
  },
379
789
  output: {
380
790
  tokens: 16384,
@@ -383,14 +793,14 @@ var MODEL_REGISTRY = {
383
793
  }
384
794
  }
385
795
  },
386
- // GPT-4o Series (Legacy, Audio Capable)
796
+ // GPT-4o Series (Legacy)
387
797
  "gpt-4o": {
388
798
  name: "gpt-4o",
389
799
  provider: Vendor.OpenAI,
390
- description: "Versatile omni model with audio support. Legacy but still available",
800
+ description: "Versatile omni model. Legacy but still available",
391
801
  isActive: true,
392
802
  releaseDate: "2024-05-13",
393
- knowledgeCutoff: "2024-04-01",
803
+ knowledgeCutoff: "2023-10-01",
394
804
  features: {
395
805
  reasoning: false,
396
806
  streaming: true,
@@ -400,7 +810,7 @@ var MODEL_REGISTRY = {
400
810
  predictedOutputs: true,
401
811
  realtime: true,
402
812
  vision: true,
403
- audio: true,
813
+ audio: false,
404
814
  video: false,
405
815
  batchAPI: true,
406
816
  promptCaching: true,
@@ -408,13 +818,12 @@ var MODEL_REGISTRY = {
408
818
  tokens: 128e3,
409
819
  text: true,
410
820
  image: true,
411
- audio: true,
412
- cpm: 2.5
821
+ cpm: 2.5,
822
+ cpmCached: 1.25
413
823
  },
414
824
  output: {
415
825
  tokens: 16384,
416
826
  text: true,
417
- audio: true,
418
827
  cpm: 10
419
828
  }
420
829
  }
@@ -422,10 +831,10 @@ var MODEL_REGISTRY = {
422
831
  "gpt-4o-mini": {
423
832
  name: "gpt-4o-mini",
424
833
  provider: Vendor.OpenAI,
425
- description: "Fast, affordable omni model with audio support",
834
+ description: "Fast, affordable omni model",
426
835
  isActive: true,
427
836
  releaseDate: "2024-07-18",
428
- knowledgeCutoff: "2024-04-01",
837
+ knowledgeCutoff: "2023-10-01",
429
838
  features: {
430
839
  reasoning: false,
431
840
  streaming: true,
@@ -435,7 +844,7 @@ var MODEL_REGISTRY = {
435
844
  predictedOutputs: false,
436
845
  realtime: true,
437
846
  vision: true,
438
- audio: true,
847
+ audio: false,
439
848
  video: false,
440
849
  batchAPI: true,
441
850
  promptCaching: true,
@@ -443,13 +852,12 @@ var MODEL_REGISTRY = {
443
852
  tokens: 128e3,
444
853
  text: true,
445
854
  image: true,
446
- audio: true,
447
- cpm: 0.15
855
+ cpm: 0.15,
856
+ cpmCached: 0.075
448
857
  },
449
858
  output: {
450
859
  tokens: 16384,
451
860
  text: true,
452
- audio: true,
453
861
  cpm: 0.6
454
862
  }
455
863
  }
@@ -461,7 +869,46 @@ var MODEL_REGISTRY = {
461
869
  description: "Fast reasoning model tailored for coding, math, and science",
462
870
  isActive: true,
463
871
  releaseDate: "2025-01-31",
464
- knowledgeCutoff: "2024-10-01",
872
+ knowledgeCutoff: "2023-10-01",
873
+ features: {
874
+ reasoning: true,
875
+ streaming: true,
876
+ structuredOutput: true,
877
+ functionCalling: true,
878
+ fineTuning: false,
879
+ predictedOutputs: false,
880
+ realtime: false,
881
+ vision: false,
882
+ audio: false,
883
+ video: false,
884
+ batchAPI: true,
885
+ promptCaching: true,
886
+ parameters: {
887
+ temperature: false,
888
+ topP: false,
889
+ frequencyPenalty: false,
890
+ presencePenalty: false
891
+ },
892
+ input: {
893
+ tokens: 2e5,
894
+ text: true,
895
+ cpm: 1.1,
896
+ cpmCached: 0.55
897
+ },
898
+ output: {
899
+ tokens: 1e5,
900
+ text: true,
901
+ cpm: 4.4
902
+ }
903
+ }
904
+ },
905
+ "o1": {
906
+ name: "o1",
907
+ provider: Vendor.OpenAI,
908
+ description: "Advanced reasoning model for complex problems",
909
+ isActive: true,
910
+ releaseDate: "2024-12-17",
911
+ knowledgeCutoff: "2023-10-01",
465
912
  features: {
466
913
  reasoning: true,
467
914
  streaming: true,
@@ -474,35 +921,78 @@ var MODEL_REGISTRY = {
474
921
  audio: false,
475
922
  video: false,
476
923
  batchAPI: true,
477
- promptCaching: false,
478
- parameters: {
479
- temperature: false,
480
- topP: false,
481
- frequencyPenalty: false,
482
- presencePenalty: false
483
- },
924
+ promptCaching: true,
925
+ parameters: {
926
+ temperature: false,
927
+ topP: false,
928
+ frequencyPenalty: false,
929
+ presencePenalty: false
930
+ },
931
+ input: {
932
+ tokens: 2e5,
933
+ text: true,
934
+ image: true,
935
+ cpm: 15,
936
+ cpmCached: 7.5
937
+ },
938
+ output: {
939
+ tokens: 1e5,
940
+ text: true,
941
+ cpm: 60
942
+ }
943
+ }
944
+ },
945
+ // ============================================================================
946
+ // Anthropic Models (Verified from platform.claude.com - March 2026)
947
+ // ============================================================================
948
+ // Claude 4.6 Series (Current)
949
+ "claude-opus-4-6": {
950
+ name: "claude-opus-4-6",
951
+ provider: Vendor.Anthropic,
952
+ description: "The most intelligent model for building agents and coding. 128K output, adaptive thinking",
953
+ isActive: true,
954
+ preferred: true,
955
+ releaseDate: "2026-02-01",
956
+ knowledgeCutoff: "2025-05-01",
957
+ features: {
958
+ reasoning: false,
959
+ streaming: true,
960
+ structuredOutput: true,
961
+ functionCalling: true,
962
+ fineTuning: false,
963
+ predictedOutputs: false,
964
+ realtime: false,
965
+ vision: true,
966
+ audio: false,
967
+ video: false,
968
+ extendedThinking: true,
969
+ batchAPI: true,
970
+ promptCaching: true,
484
971
  input: {
485
972
  tokens: 2e5,
973
+ // 1M with beta header
486
974
  text: true,
487
975
  image: true,
488
- cpm: 1.1
976
+ cpm: 5,
977
+ cpmCached: 0.5
489
978
  },
490
979
  output: {
491
- tokens: 1e5,
980
+ tokens: 128e3,
492
981
  text: true,
493
- cpm: 4.4
982
+ cpm: 25
494
983
  }
495
984
  }
496
985
  },
497
- "o1": {
498
- name: "o1",
499
- provider: Vendor.OpenAI,
500
- description: "Advanced reasoning model for complex problems",
986
+ "claude-sonnet-4-6": {
987
+ name: "claude-sonnet-4-6",
988
+ provider: Vendor.Anthropic,
989
+ description: "Best combination of speed and intelligence. Adaptive thinking, 1M context beta",
501
990
  isActive: true,
502
- releaseDate: "2024-12-17",
503
- knowledgeCutoff: "2024-10-01",
991
+ preferred: true,
992
+ releaseDate: "2026-02-01",
993
+ knowledgeCutoff: "2025-08-01",
504
994
  features: {
505
- reasoning: true,
995
+ reasoning: false,
506
996
  streaming: true,
507
997
  structuredOutput: true,
508
998
  functionCalling: true,
@@ -512,35 +1002,29 @@ var MODEL_REGISTRY = {
512
1002
  vision: true,
513
1003
  audio: false,
514
1004
  video: false,
1005
+ extendedThinking: true,
515
1006
  batchAPI: true,
516
- promptCaching: false,
517
- parameters: {
518
- temperature: false,
519
- topP: false,
520
- frequencyPenalty: false,
521
- presencePenalty: false
522
- },
1007
+ promptCaching: true,
523
1008
  input: {
524
1009
  tokens: 2e5,
1010
+ // 1M with beta header
525
1011
  text: true,
526
1012
  image: true,
527
- cpm: 15
1013
+ cpm: 3,
1014
+ cpmCached: 0.3
528
1015
  },
529
1016
  output: {
530
- tokens: 1e5,
1017
+ tokens: 64e3,
531
1018
  text: true,
532
- cpm: 60
1019
+ cpm: 15
533
1020
  }
534
1021
  }
535
1022
  },
536
- // ============================================================================
537
- // Anthropic Models (Verified from platform.claude.com)
538
- // ============================================================================
539
- // Claude 4.5 Series (Current)
1023
+ // Claude 4.5 Series
540
1024
  "claude-opus-4-5-20251101": {
541
1025
  name: "claude-opus-4-5-20251101",
542
1026
  provider: Vendor.Anthropic,
543
- description: "Premium model combining maximum intelligence with practical performance",
1027
+ description: "Legacy Opus 4.5. Premium model combining maximum intelligence with practical performance",
544
1028
  isActive: true,
545
1029
  releaseDate: "2025-11-01",
546
1030
  knowledgeCutoff: "2025-05-01",
@@ -575,7 +1059,7 @@ var MODEL_REGISTRY = {
575
1059
  "claude-sonnet-4-5-20250929": {
576
1060
  name: "claude-sonnet-4-5-20250929",
577
1061
  provider: Vendor.Anthropic,
578
- description: "Smart model for complex agents and coding. Best balance of intelligence, speed, cost",
1062
+ description: "Legacy Sonnet 4.5. Smart model for complex agents and coding",
579
1063
  isActive: true,
580
1064
  releaseDate: "2025-09-29",
581
1065
  knowledgeCutoff: "2025-01-01",
@@ -595,6 +1079,7 @@ var MODEL_REGISTRY = {
595
1079
  promptCaching: true,
596
1080
  input: {
597
1081
  tokens: 2e5,
1082
+ // 1M with beta header
598
1083
  text: true,
599
1084
  image: true,
600
1085
  cpm: 3,
@@ -678,10 +1163,45 @@ var MODEL_REGISTRY = {
678
1163
  }
679
1164
  }
680
1165
  },
1166
+ "claude-opus-4-20250514": {
1167
+ name: "claude-opus-4-20250514",
1168
+ provider: Vendor.Anthropic,
1169
+ description: "Legacy Opus 4. Agentic tasks and reasoning",
1170
+ isActive: true,
1171
+ releaseDate: "2025-05-14",
1172
+ knowledgeCutoff: "2025-01-01",
1173
+ features: {
1174
+ reasoning: false,
1175
+ streaming: true,
1176
+ structuredOutput: true,
1177
+ functionCalling: true,
1178
+ fineTuning: false,
1179
+ predictedOutputs: false,
1180
+ realtime: false,
1181
+ vision: true,
1182
+ audio: false,
1183
+ video: false,
1184
+ extendedThinking: true,
1185
+ batchAPI: true,
1186
+ promptCaching: true,
1187
+ input: {
1188
+ tokens: 2e5,
1189
+ text: true,
1190
+ image: true,
1191
+ cpm: 15,
1192
+ cpmCached: 1.5
1193
+ },
1194
+ output: {
1195
+ tokens: 32e3,
1196
+ text: true,
1197
+ cpm: 75
1198
+ }
1199
+ }
1200
+ },
681
1201
  "claude-sonnet-4-20250514": {
682
1202
  name: "claude-sonnet-4-20250514",
683
1203
  provider: Vendor.Anthropic,
684
- description: "Legacy Sonnet 4. Default for most users, supports 1M context beta",
1204
+ description: "Legacy Sonnet 4. Supports 1M context beta",
685
1205
  isActive: true,
686
1206
  releaseDate: "2025-05-14",
687
1207
  knowledgeCutoff: "2025-01-01",
@@ -717,7 +1237,7 @@ var MODEL_REGISTRY = {
717
1237
  "claude-3-7-sonnet-20250219": {
718
1238
  name: "claude-3-7-sonnet-20250219",
719
1239
  provider: Vendor.Anthropic,
720
- description: "Claude 3.7 Sonnet with extended thinking, supports 128K output beta",
1240
+ description: "Deprecated. Claude 3.7 Sonnet with extended thinking",
721
1241
  isActive: true,
722
1242
  releaseDate: "2025-02-19",
723
1243
  knowledgeCutoff: "2024-10-01",
@@ -744,17 +1264,16 @@ var MODEL_REGISTRY = {
744
1264
  },
745
1265
  output: {
746
1266
  tokens: 64e3,
747
- // 128K with beta header
748
1267
  text: true,
749
1268
  cpm: 15
750
1269
  }
751
1270
  }
752
1271
  },
753
- // Claude 3.x Legacy
1272
+ // Claude 3.x Legacy (Deprecated - retiring April 19, 2026)
754
1273
  "claude-3-haiku-20240307": {
755
1274
  name: "claude-3-haiku-20240307",
756
1275
  provider: Vendor.Anthropic,
757
- description: "Fast legacy model. Recommend migrating to Haiku 4.5",
1276
+ description: "Deprecated. Retiring April 19, 2026. Migrate to Haiku 4.5",
758
1277
  isActive: true,
759
1278
  releaseDate: "2024-03-07",
760
1279
  knowledgeCutoff: "2023-08-01",
@@ -787,16 +1306,124 @@ var MODEL_REGISTRY = {
787
1306
  }
788
1307
  },
789
1308
  // ============================================================================
790
- // Google Models (Verified from ai.google.dev)
1309
+ // Google Models (Verified from ai.google.dev - March 2026)
791
1310
  // ============================================================================
1311
+ // Gemini 3.1 Series (Preview)
1312
+ "gemini-3.1-pro-preview": {
1313
+ name: "gemini-3.1-pro-preview",
1314
+ provider: Vendor.Google,
1315
+ description: "Advanced intelligence with powerful agentic and coding capabilities. Replaces gemini-3-pro-preview",
1316
+ isActive: true,
1317
+ preferred: true,
1318
+ releaseDate: "2026-02-01",
1319
+ knowledgeCutoff: "2025-01-01",
1320
+ features: {
1321
+ reasoning: true,
1322
+ streaming: true,
1323
+ structuredOutput: true,
1324
+ functionCalling: true,
1325
+ fineTuning: false,
1326
+ predictedOutputs: false,
1327
+ realtime: false,
1328
+ vision: true,
1329
+ audio: true,
1330
+ video: true,
1331
+ batchAPI: true,
1332
+ promptCaching: true,
1333
+ input: {
1334
+ tokens: 1048576,
1335
+ text: true,
1336
+ image: true,
1337
+ audio: true,
1338
+ video: true,
1339
+ cpm: 2,
1340
+ cpmCached: 0.2
1341
+ },
1342
+ output: {
1343
+ tokens: 65536,
1344
+ text: true,
1345
+ cpm: 12
1346
+ }
1347
+ }
1348
+ },
1349
+ "gemini-3.1-flash-lite-preview": {
1350
+ name: "gemini-3.1-flash-lite-preview",
1351
+ provider: Vendor.Google,
1352
+ description: "High performance, budget-friendly for high-volume agentic tasks and data extraction",
1353
+ isActive: true,
1354
+ releaseDate: "2026-03-01",
1355
+ knowledgeCutoff: "2025-01-01",
1356
+ features: {
1357
+ reasoning: true,
1358
+ streaming: true,
1359
+ structuredOutput: true,
1360
+ functionCalling: true,
1361
+ fineTuning: false,
1362
+ predictedOutputs: false,
1363
+ realtime: false,
1364
+ vision: true,
1365
+ audio: true,
1366
+ video: true,
1367
+ batchAPI: true,
1368
+ promptCaching: true,
1369
+ input: {
1370
+ tokens: 1048576,
1371
+ text: true,
1372
+ image: true,
1373
+ audio: true,
1374
+ video: true,
1375
+ cpm: 0.25
1376
+ },
1377
+ output: {
1378
+ tokens: 65536,
1379
+ text: true,
1380
+ cpm: 1.5
1381
+ }
1382
+ }
1383
+ },
1384
+ "gemini-3.1-flash-image-preview": {
1385
+ name: "gemini-3.1-flash-image-preview",
1386
+ provider: Vendor.Google,
1387
+ description: "High-efficiency image generation with up to 4K output, search grounding support",
1388
+ isActive: true,
1389
+ releaseDate: "2026-02-01",
1390
+ knowledgeCutoff: "2025-01-01",
1391
+ features: {
1392
+ reasoning: true,
1393
+ streaming: true,
1394
+ structuredOutput: false,
1395
+ functionCalling: false,
1396
+ fineTuning: false,
1397
+ predictedOutputs: false,
1398
+ realtime: false,
1399
+ vision: true,
1400
+ audio: false,
1401
+ video: false,
1402
+ batchAPI: true,
1403
+ promptCaching: false,
1404
+ input: {
1405
+ tokens: 131072,
1406
+ text: true,
1407
+ image: true,
1408
+ cpm: 0.25
1409
+ },
1410
+ output: {
1411
+ tokens: 32768,
1412
+ text: true,
1413
+ image: true,
1414
+ cpm: 1.5
1415
+ }
1416
+ }
1417
+ },
792
1418
  // Gemini 3 Series (Preview)
793
1419
  "gemini-3-flash-preview": {
794
1420
  name: "gemini-3-flash-preview",
795
1421
  provider: Vendor.Google,
796
- description: "Pro-grade reasoning with Flash-level latency and efficiency",
1422
+ description: "Most powerful agentic and coding model with frontier-class reasoning",
797
1423
  isActive: true,
798
- releaseDate: "2025-11-18",
799
- knowledgeCutoff: "2025-08-01",
1424
+ preferred: true,
1425
+ releaseDate: "2025-12-01",
1426
+ knowledgeCutoff: "2025-01-01",
800
1427
  features: {
801
1428
  reasoning: true,
802
1429
  streaming: true,
@@ -811,27 +1438,28 @@ var MODEL_REGISTRY = {
811
1438
  batchAPI: true,
812
1439
  promptCaching: true,
813
1440
  input: {
814
- tokens: 1e6,
1441
+ tokens: 1048576,
815
1442
  text: true,
816
1443
  image: true,
817
1444
  audio: true,
818
1445
  video: true,
819
- cpm: 0.15
1446
+ cpm: 0.5,
1447
+ cpmCached: 0.05
820
1448
  },
821
1449
  output: {
822
1450
  tokens: 65536,
823
1451
  text: true,
824
- cpm: 0.6
1452
+ cpm: 3
825
1453
  }
826
1454
  }
827
1455
  },
828
1456
  "gemini-3-pro-preview": {
829
1457
  name: "gemini-3-pro-preview",
830
1458
  provider: Vendor.Google,
831
- description: "Most advanced reasoning Gemini model for complex tasks",
1459
+ description: "Deprecated. Shutting down March 9, 2026. Migrate to gemini-3.1-pro-preview",
832
1460
  isActive: true,
833
1461
  releaseDate: "2025-11-18",
834
- knowledgeCutoff: "2025-08-01",
1462
+ knowledgeCutoff: "2025-01-01",
835
1463
  features: {
836
1464
  reasoning: true,
837
1465
  streaming: true,
@@ -846,7 +1474,7 @@ var MODEL_REGISTRY = {
846
1474
  batchAPI: true,
847
1475
  promptCaching: true,
848
1476
  input: {
849
- tokens: 1e6,
1477
+ tokens: 1048576,
850
1478
  text: true,
851
1479
  image: true,
852
1480
  audio: true,
@@ -863,14 +1491,14 @@ var MODEL_REGISTRY = {
863
1491
  "gemini-3-pro-image-preview": {
864
1492
  name: "gemini-3-pro-image-preview",
865
1493
  provider: Vendor.Google,
866
- description: "Highest quality image generation model",
1494
+ description: "Professional-grade image generation and editing with reasoning",
867
1495
  isActive: true,
868
1496
  releaseDate: "2025-11-18",
869
- knowledgeCutoff: "2025-08-01",
1497
+ knowledgeCutoff: "2025-01-01",
870
1498
  features: {
871
1499
  reasoning: true,
872
1500
  streaming: true,
873
- structuredOutput: false,
1501
+ structuredOutput: true,
874
1502
  functionCalling: false,
875
1503
  fineTuning: false,
876
1504
  predictedOutputs: false,
@@ -879,15 +1507,15 @@ var MODEL_REGISTRY = {
879
1507
  audio: false,
880
1508
  video: false,
881
1509
  batchAPI: true,
882
- promptCaching: true,
1510
+ promptCaching: false,
883
1511
  input: {
884
- tokens: 1e6,
1512
+ tokens: 65536,
885
1513
  text: true,
886
1514
  image: true,
887
1515
  cpm: 1.25
888
1516
  },
889
1517
  output: {
890
- tokens: 65536,
1518
+ tokens: 32768,
891
1519
  text: true,
892
1520
  image: true,
893
1521
  cpm: 10
@@ -898,7 +1526,7 @@ var MODEL_REGISTRY = {
898
1526
  "gemini-2.5-pro": {
899
1527
  name: "gemini-2.5-pro",
900
1528
  provider: Vendor.Google,
901
- description: "Advanced multimodal model built for deep reasoning and agents",
1529
+ description: "Most advanced model for complex tasks with deep reasoning and coding",
902
1530
  isActive: true,
903
1531
  releaseDate: "2025-03-01",
904
1532
  knowledgeCutoff: "2025-01-01",
@@ -916,12 +1544,13 @@ var MODEL_REGISTRY = {
916
1544
  batchAPI: true,
917
1545
  promptCaching: true,
918
1546
  input: {
919
- tokens: 1e6,
1547
+ tokens: 1048576,
920
1548
  text: true,
921
1549
  image: true,
922
1550
  audio: true,
923
1551
  video: true,
924
- cpm: 1.25
1552
+ cpm: 1.25,
1553
+ cpmCached: 0.125
925
1554
  },
926
1555
  output: {
927
1556
  tokens: 65536,
@@ -933,7 +1562,7 @@ var MODEL_REGISTRY = {
933
1562
  "gemini-2.5-flash": {
934
1563
  name: "gemini-2.5-flash",
935
1564
  provider: Vendor.Google,
936
- description: "Fast, cost-effective model with excellent reasoning",
1565
+ description: "Best price-performance for low-latency, high-volume tasks with reasoning",
937
1566
  isActive: true,
938
1567
  releaseDate: "2025-06-17",
939
1568
  knowledgeCutoff: "2025-01-01",
@@ -951,24 +1580,25 @@ var MODEL_REGISTRY = {
951
1580
  batchAPI: true,
952
1581
  promptCaching: true,
953
1582
  input: {
954
- tokens: 1e6,
1583
+ tokens: 1048576,
955
1584
  text: true,
956
1585
  image: true,
957
1586
  audio: true,
958
1587
  video: true,
959
- cpm: 0.15
1588
+ cpm: 0.3,
1589
+ cpmCached: 0.03
960
1590
  },
961
1591
  output: {
962
1592
  tokens: 65536,
963
1593
  text: true,
964
- cpm: 0.6
1594
+ cpm: 2.5
965
1595
  }
966
1596
  }
967
1597
  },
968
1598
  "gemini-2.5-flash-lite": {
969
1599
  name: "gemini-2.5-flash-lite",
970
1600
  provider: Vendor.Google,
971
- description: "Lowest latency for high-volume tasks, summarization, classification",
1601
+ description: "Fastest and most budget-friendly multimodal model in the 2.5 family",
972
1602
  isActive: true,
973
1603
  releaseDate: "2025-06-17",
974
1604
  knowledgeCutoff: "2025-01-01",
@@ -986,31 +1616,31 @@ var MODEL_REGISTRY = {
986
1616
  batchAPI: true,
987
1617
  promptCaching: true,
988
1618
  input: {
989
- tokens: 1e6,
1619
+ tokens: 1048576,
990
1620
  text: true,
991
1621
  image: true,
992
1622
  audio: true,
993
1623
  video: true,
994
- cpm: 0.075
1624
+ cpm: 0.1
995
1625
  },
996
1626
  output: {
997
1627
  tokens: 65536,
998
1628
  text: true,
999
- cpm: 0.3
1629
+ cpm: 0.4
1000
1630
  }
1001
1631
  }
1002
1632
  },
1003
1633
  "gemini-2.5-flash-image": {
1004
1634
  name: "gemini-2.5-flash-image",
1005
1635
  provider: Vendor.Google,
1006
- description: "Image generation and editing model",
1636
+ description: "Fast native image generation and editing (Nano Banana)",
1007
1637
  isActive: true,
1008
- releaseDate: "2025-09-01",
1009
- knowledgeCutoff: "2025-01-01",
1638
+ releaseDate: "2025-10-01",
1639
+ knowledgeCutoff: "2025-06-01",
1010
1640
  features: {
1011
- reasoning: true,
1641
+ reasoning: false,
1012
1642
  streaming: true,
1013
- structuredOutput: false,
1643
+ structuredOutput: true,
1014
1644
  functionCalling: false,
1015
1645
  fineTuning: false,
1016
1646
  predictedOutputs: false,
@@ -1021,13 +1651,13 @@ var MODEL_REGISTRY = {
1021
1651
  batchAPI: true,
1022
1652
  promptCaching: true,
1023
1653
  input: {
1024
- tokens: 1e6,
1654
+ tokens: 65536,
1025
1655
  text: true,
1026
1656
  image: true,
1027
1657
  cpm: 0.15
1028
1658
  },
1029
1659
  output: {
1030
- tokens: 65536,
1660
+ tokens: 32768,
1031
1661
  text: true,
1032
1662
  image: true,
1033
1663
  cpm: 0.6
@@ -1035,7 +1665,7 @@ var MODEL_REGISTRY = {
1035
1665
  }
1036
1666
  },
1037
1667
  // ============================================================================
1038
- // xAI Grok Models (Verified from docs.x.ai - January 2026)
1668
+ // xAI Grok Models (Verified from docs.x.ai - March 2026)
1039
1669
  // ============================================================================
1040
1670
  // Grok 4.1 Series (2M context, fast)
1041
1671
  "grok-4-1-fast-reasoning": {
@@ -1056,13 +1686,14 @@ var MODEL_REGISTRY = {
1056
1686
  vision: true,
1057
1687
  audio: false,
1058
1688
  video: false,
1059
- batchAPI: false,
1060
- promptCaching: false,
1689
+ batchAPI: true,
1690
+ promptCaching: true,
1061
1691
  input: {
1062
1692
  tokens: 2e6,
1063
1693
  text: true,
1064
1694
  image: true,
1065
- cpm: 0.2
1695
+ cpm: 0.2,
1696
+ cpmCached: 0.05
1066
1697
  },
1067
1698
  output: {
1068
1699
  tokens: 65536,
@@ -1089,13 +1720,14 @@ var MODEL_REGISTRY = {
1089
1720
  vision: true,
1090
1721
  audio: false,
1091
1722
  video: false,
1092
- batchAPI: false,
1093
- promptCaching: false,
1723
+ batchAPI: true,
1724
+ promptCaching: true,
1094
1725
  input: {
1095
1726
  tokens: 2e6,
1096
1727
  text: true,
1097
1728
  image: true,
1098
- cpm: 0.2
1729
+ cpm: 0.2,
1730
+ cpmCached: 0.05
1099
1731
  },
1100
1732
  output: {
1101
1733
  tokens: 65536,
@@ -1123,12 +1755,13 @@ var MODEL_REGISTRY = {
1123
1755
  vision: false,
1124
1756
  audio: false,
1125
1757
  video: false,
1126
- batchAPI: false,
1127
- promptCaching: false,
1758
+ batchAPI: true,
1759
+ promptCaching: true,
1128
1760
  input: {
1129
1761
  tokens: 256e3,
1130
1762
  text: true,
1131
- cpm: 0.2
1763
+ cpm: 0.2,
1764
+ cpmCached: 0.02
1132
1765
  },
1133
1766
  output: {
1134
1767
  tokens: 32768,
@@ -1141,7 +1774,7 @@ var MODEL_REGISTRY = {
1141
1774
  "grok-4-fast-reasoning": {
1142
1775
  name: "grok-4-fast-reasoning",
1143
1776
  provider: Vendor.Grok,
1144
- description: "Fast Grok 4 with reasoning capabilities, 2M context window",
1777
+ description: "Fast Grok 4 with reasoning capabilities, 2M context window, vision support",
1145
1778
  isActive: true,
1146
1779
  releaseDate: "2025-09-01",
1147
1780
  knowledgeCutoff: "2024-11-01",
@@ -1153,15 +1786,17 @@ var MODEL_REGISTRY = {
1153
1786
  fineTuning: false,
1154
1787
  predictedOutputs: false,
1155
1788
  realtime: false,
1156
- vision: false,
1789
+ vision: true,
1157
1790
  audio: false,
1158
1791
  video: false,
1159
- batchAPI: false,
1160
- promptCaching: false,
1792
+ batchAPI: true,
1793
+ promptCaching: true,
1161
1794
  input: {
1162
1795
  tokens: 2e6,
1163
1796
  text: true,
1164
- cpm: 0.2
1797
+ image: true,
1798
+ cpm: 0.2,
1799
+ cpmCached: 0.05
1165
1800
  },
1166
1801
  output: {
1167
1802
  tokens: 65536,
@@ -1188,13 +1823,14 @@ var MODEL_REGISTRY = {
1188
1823
  vision: true,
1189
1824
  audio: false,
1190
1825
  video: false,
1191
- batchAPI: false,
1192
- promptCaching: false,
1826
+ batchAPI: true,
1827
+ promptCaching: true,
1193
1828
  input: {
1194
1829
  tokens: 2e6,
1195
1830
  text: true,
1196
1831
  image: true,
1197
- cpm: 0.2
1832
+ cpm: 0.2,
1833
+ cpmCached: 0.05
1198
1834
  },
1199
1835
  output: {
1200
1836
  tokens: 65536,
@@ -1206,12 +1842,12 @@ var MODEL_REGISTRY = {
1206
1842
  "grok-4-0709": {
1207
1843
  name: "grok-4-0709",
1208
1844
  provider: Vendor.Grok,
1209
- description: "Grok 4 flagship model (July 2025 release), 256K context, vision support",
1845
+ description: "Grok 4 flagship model (July 2025 release), 256K context, vision support, reasoning",
1210
1846
  isActive: true,
1211
1847
  releaseDate: "2025-07-09",
1212
1848
  knowledgeCutoff: "2024-11-01",
1213
1849
  features: {
1214
- reasoning: false,
1850
+ reasoning: true,
1215
1851
  streaming: true,
1216
1852
  structuredOutput: true,
1217
1853
  functionCalling: true,
@@ -1221,13 +1857,14 @@ var MODEL_REGISTRY = {
1221
1857
  vision: true,
1222
1858
  audio: false,
1223
1859
  video: false,
1224
- batchAPI: false,
1225
- promptCaching: false,
1860
+ batchAPI: true,
1861
+ promptCaching: true,
1226
1862
  input: {
1227
1863
  tokens: 256e3,
1228
1864
  text: true,
1229
1865
  image: true,
1230
- cpm: 3
1866
+ cpm: 3,
1867
+ cpmCached: 0.75
1231
1868
  },
1232
1869
  output: {
1233
1870
  tokens: 32768,
@@ -1240,12 +1877,12 @@ var MODEL_REGISTRY = {
1240
1877
  "grok-3-mini": {
1241
1878
  name: "grok-3-mini",
1242
1879
  provider: Vendor.Grok,
1243
- description: "Lightweight, cost-efficient model for simpler tasks, 131K context",
1880
+ description: "Lightweight, cost-efficient model with reasoning, 131K context",
1244
1881
  isActive: true,
1245
1882
  releaseDate: "2025-06-01",
1246
1883
  knowledgeCutoff: "2024-11-01",
1247
1884
  features: {
1248
- reasoning: false,
1885
+ reasoning: true,
1249
1886
  streaming: true,
1250
1887
  structuredOutput: true,
1251
1888
  functionCalling: true,
@@ -1255,12 +1892,13 @@ var MODEL_REGISTRY = {
1255
1892
  vision: false,
1256
1893
  audio: false,
1257
1894
  video: false,
1258
- batchAPI: false,
1259
- promptCaching: false,
1895
+ batchAPI: true,
1896
+ promptCaching: true,
1260
1897
  input: {
1261
1898
  tokens: 131072,
1262
1899
  text: true,
1263
- cpm: 0.3
1900
+ cpm: 0.3,
1901
+ cpmCached: 0.07
1264
1902
  },
1265
1903
  output: {
1266
1904
  tokens: 32768,
@@ -1287,12 +1925,13 @@ var MODEL_REGISTRY = {
1287
1925
  vision: false,
1288
1926
  audio: false,
1289
1927
  video: false,
1290
- batchAPI: false,
1291
- promptCaching: false,
1928
+ batchAPI: true,
1929
+ promptCaching: true,
1292
1930
  input: {
1293
1931
  tokens: 131072,
1294
1932
  text: true,
1295
- cpm: 3
1933
+ cpm: 3,
1934
+ cpmCached: 0.75
1296
1935
  },
1297
1936
  output: {
1298
1937
  tokens: 32768,
@@ -1301,11 +1940,11 @@ var MODEL_REGISTRY = {
1301
1940
  }
1302
1941
  }
1303
1942
  },
1304
- // Grok 2 Series (Vision)
1943
+ // Grok 2 Series (Legacy - not in current docs)
1305
1944
  "grok-2-vision-1212": {
1306
1945
  name: "grok-2-vision-1212",
1307
1946
  provider: Vendor.Grok,
1308
- description: "Vision-capable model for image understanding, 32K context",
1947
+ description: "Legacy vision model for image understanding, 32K context. Not in current xAI docs",
1309
1948
  isActive: true,
1310
1949
  releaseDate: "2024-12-12",
1311
1950
  knowledgeCutoff: "2024-11-01",
@@ -1578,6 +2217,14 @@ var SERVICE_DEFINITIONS = [
1578
2217
  baseURL: "https://aws.amazon.com",
1579
2218
  docsURL: "https://docs.aws.amazon.com/"
1580
2219
  },
2220
+ {
2221
+ id: "cloudflare",
2222
+ name: "Cloudflare",
2223
+ category: "cloud",
2224
+ urlPattern: /api\.cloudflare\.com/i,
2225
+ baseURL: "https://api.cloudflare.com/client/v4",
2226
+ docsURL: "https://developers.cloudflare.com/api/"
2227
+ },
1581
2228
  // ============ Storage ============
1582
2229
  {
1583
2230
  id: "dropbox",
@@ -1621,6 +2268,14 @@ var SERVICE_DEFINITIONS = [
1621
2268
  baseURL: "https://api.postmarkapp.com",
1622
2269
  docsURL: "https://postmarkapp.com/developer"
1623
2270
  },
2271
+ {
2272
+ id: "mailgun",
2273
+ name: "Mailgun",
2274
+ category: "email",
2275
+ urlPattern: /api\.mailgun\.net|api\.eu\.mailgun\.net/i,
2276
+ baseURL: "https://api.mailgun.net/v3",
2277
+ docsURL: "https://documentation.mailgun.com/docs/mailgun/api-reference/"
2278
+ },
1624
2279
  // ============ Monitoring & Observability ============
1625
2280
  {
1626
2281
  id: "datadog",