@everworker/oneringai 0.4.5 → 0.4.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -22,18 +22,30 @@ function isVendor(value) {
22
22
  // src/domain/entities/Model.ts
23
23
  var LLM_MODELS = {
24
24
  [Vendor.OpenAI]: {
25
+ // GPT-5.3 Series
26
+ GPT_5_3_CODEX: "gpt-5.3-codex",
27
+ GPT_5_3_CHAT: "gpt-5.3-chat-latest",
25
28
  // GPT-5.2 Series (Current Flagship)
26
29
  GPT_5_2: "gpt-5.2",
27
30
  GPT_5_2_PRO: "gpt-5.2-pro",
31
+ GPT_5_2_CODEX: "gpt-5.2-codex",
32
+ GPT_5_2_CHAT: "gpt-5.2-chat-latest",
33
+ // GPT-5.1 Series
34
+ GPT_5_1: "gpt-5.1",
35
+ GPT_5_1_CODEX: "gpt-5.1-codex",
36
+ GPT_5_1_CODEX_MAX: "gpt-5.1-codex-max",
37
+ GPT_5_1_CODEX_MINI: "gpt-5.1-codex-mini",
38
+ GPT_5_1_CHAT: "gpt-5.1-chat-latest",
28
39
  // GPT-5 Series
29
40
  GPT_5: "gpt-5",
30
41
  GPT_5_MINI: "gpt-5-mini",
31
42
  GPT_5_NANO: "gpt-5-nano",
43
+ GPT_5_CHAT: "gpt-5-chat-latest",
32
44
  // GPT-4.1 Series
33
45
  GPT_4_1: "gpt-4.1",
34
46
  GPT_4_1_MINI: "gpt-4.1-mini",
35
47
  GPT_4_1_NANO: "gpt-4.1-nano",
36
- // GPT-4o Series (Legacy, Audio Capable)
48
+ // GPT-4o Series (Legacy)
37
49
  GPT_4O: "gpt-4o",
38
50
  GPT_4O_MINI: "gpt-4o-mini",
39
51
  // Reasoning Models (o-series)
@@ -41,18 +53,26 @@ var LLM_MODELS = {
41
53
  O1: "o1"
42
54
  },
43
55
  [Vendor.Anthropic]: {
44
- // Claude 4.5 Series (Current)
56
+ // Claude 4.6 Series (Current)
57
+ CLAUDE_OPUS_4_6: "claude-opus-4-6",
58
+ CLAUDE_SONNET_4_6: "claude-sonnet-4-6",
59
+ // Claude 4.5 Series
45
60
  CLAUDE_OPUS_4_5: "claude-opus-4-5-20251101",
46
61
  CLAUDE_SONNET_4_5: "claude-sonnet-4-5-20250929",
47
62
  CLAUDE_HAIKU_4_5: "claude-haiku-4-5-20251001",
48
63
  // Claude 4.x Legacy
49
64
  CLAUDE_OPUS_4_1: "claude-opus-4-1-20250805",
65
+ CLAUDE_OPUS_4: "claude-opus-4-20250514",
50
66
  CLAUDE_SONNET_4: "claude-sonnet-4-20250514",
51
67
  CLAUDE_SONNET_3_7: "claude-3-7-sonnet-20250219",
52
- // Claude 3.x Legacy
68
+ // Claude 3.x Legacy (Deprecated)
53
69
  CLAUDE_HAIKU_3: "claude-3-haiku-20240307"
54
70
  },
55
71
  [Vendor.Google]: {
72
+ // Gemini 3.1 Series (Preview)
73
+ GEMINI_3_1_PRO_PREVIEW: "gemini-3.1-pro-preview",
74
+ GEMINI_3_1_FLASH_LITE_PREVIEW: "gemini-3.1-flash-lite-preview",
75
+ GEMINI_3_1_FLASH_IMAGE_PREVIEW: "gemini-3.1-flash-image-preview",
56
76
  // Gemini 3 Series (Preview)
57
77
  GEMINI_3_FLASH_PREVIEW: "gemini-3-flash-preview",
58
78
  GEMINI_3_PRO_PREVIEW: "gemini-3-pro-preview",
@@ -84,12 +104,91 @@ var MODEL_REGISTRY = {
84
104
  // ============================================================================
85
105
  // OpenAI Models (Verified from platform.openai.com)
86
106
  // ============================================================================
107
+ // GPT-5.3 Series
108
+ "gpt-5.3-codex": {
109
+ name: "gpt-5.3-codex",
110
+ provider: Vendor.OpenAI,
111
+ description: "Latest codex model for coding and agentic tasks. Reasoning.effort: low, medium, high, xhigh",
112
+ isActive: true,
113
+ releaseDate: "2026-02-01",
114
+ knowledgeCutoff: "2025-08-31",
115
+ features: {
116
+ reasoning: true,
117
+ streaming: true,
118
+ structuredOutput: true,
119
+ functionCalling: true,
120
+ fineTuning: false,
121
+ predictedOutputs: false,
122
+ realtime: false,
123
+ vision: true,
124
+ audio: false,
125
+ video: false,
126
+ batchAPI: true,
127
+ promptCaching: true,
128
+ parameters: {
129
+ temperature: false,
130
+ topP: false,
131
+ frequencyPenalty: false,
132
+ presencePenalty: false
133
+ },
134
+ input: {
135
+ tokens: 4e5,
136
+ text: true,
137
+ image: true,
138
+ cpm: 1.75,
139
+ cpmCached: 0.175
140
+ },
141
+ output: {
142
+ tokens: 128e3,
143
+ text: true,
144
+ cpm: 14
145
+ }
146
+ }
147
+ },
148
+ "gpt-5.3-chat-latest": {
149
+ name: "gpt-5.3-chat-latest",
150
+ provider: Vendor.OpenAI,
151
+ description: "Latest GPT-5.3 chat model for general-purpose use",
152
+ isActive: true,
153
+ releaseDate: "2026-02-01",
154
+ knowledgeCutoff: "2025-08-31",
155
+ features: {
156
+ reasoning: false,
157
+ streaming: true,
158
+ structuredOutput: true,
159
+ functionCalling: true,
160
+ fineTuning: false,
161
+ predictedOutputs: false,
162
+ realtime: false,
163
+ vision: true,
164
+ audio: false,
165
+ video: false,
166
+ batchAPI: true,
167
+ promptCaching: true,
168
+ parameters: {
169
+ temperature: false
170
+ },
171
+ input: {
172
+ tokens: 128e3,
173
+ text: true,
174
+ image: true,
175
+ cpm: 1.75,
176
+ cpmCached: 0.175
177
+ },
178
+ output: {
179
+ tokens: 16e3,
180
+ text: true,
181
+ cpm: 14
182
+ }
183
+ }
184
+ },
87
185
  // GPT-5.2 Series (Current Flagship)
88
186
  "gpt-5.2": {
89
187
  name: "gpt-5.2",
90
188
  provider: Vendor.OpenAI,
91
189
  description: "Flagship model for coding and agentic tasks. Reasoning.effort: none, low, medium, high, xhigh",
92
190
  isActive: true,
191
+ preferred: true,
93
192
  releaseDate: "2025-12-01",
94
193
  knowledgeCutoff: "2025-08-31",
95
194
  features: {
@@ -115,7 +214,8 @@ var MODEL_REGISTRY = {
115
214
  tokens: 4e5,
116
215
  text: true,
117
216
  image: true,
118
- cpm: 1.75
217
+ cpm: 1.75,
218
+ cpmCached: 0.175
119
219
  },
120
220
  output: {
121
221
  tokens: 128e3,
@@ -134,7 +234,7 @@ var MODEL_REGISTRY = {
134
234
  features: {
135
235
  reasoning: true,
136
236
  streaming: true,
137
- structuredOutput: true,
237
+ structuredOutput: false,
138
238
  functionCalling: true,
139
239
  fineTuning: false,
140
240
  predictedOutputs: false,
@@ -163,6 +263,276 @@ var MODEL_REGISTRY = {
163
263
  }
164
264
  }
165
265
  },
266
+ "gpt-5.2-codex": {
267
+ name: "gpt-5.2-codex",
268
+ provider: Vendor.OpenAI,
269
+ description: "GPT-5.2 codex for coding and agentic tasks. Reasoning.effort: low, medium, high, xhigh",
270
+ isActive: true,
271
+ preferred: true,
272
+ releaseDate: "2025-12-01",
273
+ knowledgeCutoff: "2025-08-31",
274
+ features: {
275
+ reasoning: true,
276
+ streaming: true,
277
+ structuredOutput: true,
278
+ functionCalling: true,
279
+ fineTuning: false,
280
+ predictedOutputs: false,
281
+ realtime: false,
282
+ vision: true,
283
+ audio: false,
284
+ video: false,
285
+ batchAPI: true,
286
+ promptCaching: true,
287
+ parameters: {
288
+ temperature: false,
289
+ topP: false,
290
+ frequencyPenalty: false,
291
+ presencePenalty: false
292
+ },
293
+ input: {
294
+ tokens: 4e5,
295
+ text: true,
296
+ image: true,
297
+ cpm: 1.75,
298
+ cpmCached: 0.175
299
+ },
300
+ output: {
301
+ tokens: 128e3,
302
+ text: true,
303
+ cpm: 14
304
+ }
305
+ }
306
+ },
307
+ "gpt-5.2-chat-latest": {
308
+ name: "gpt-5.2-chat-latest",
309
+ provider: Vendor.OpenAI,
310
+ description: "GPT-5.2 chat model for general-purpose use",
311
+ isActive: true,
312
+ releaseDate: "2025-12-01",
313
+ knowledgeCutoff: "2025-08-31",
314
+ features: {
315
+ reasoning: false,
316
+ streaming: true,
317
+ structuredOutput: true,
318
+ functionCalling: true,
319
+ fineTuning: false,
320
+ predictedOutputs: false,
321
+ realtime: false,
322
+ vision: true,
323
+ audio: false,
324
+ video: false,
325
+ batchAPI: true,
326
+ promptCaching: true,
327
+ input: {
328
+ tokens: 128e3,
329
+ text: true,
330
+ image: true,
331
+ cpm: 1.75,
332
+ cpmCached: 0.175
333
+ },
334
+ output: {
335
+ tokens: 16e3,
336
+ text: true,
337
+ cpm: 14
338
+ }
339
+ }
340
+ },
341
+ // GPT-5.1 Series
342
+ "gpt-5.1": {
343
+ name: "gpt-5.1",
344
+ provider: Vendor.OpenAI,
345
+ description: "Intelligent reasoning model for coding and agentic tasks. Reasoning.effort: none, low, medium, high",
346
+ isActive: true,
347
+ releaseDate: "2025-10-01",
348
+ knowledgeCutoff: "2024-09-30",
349
+ features: {
350
+ reasoning: true,
351
+ streaming: true,
352
+ structuredOutput: true,
353
+ functionCalling: true,
354
+ fineTuning: false,
355
+ predictedOutputs: false,
356
+ realtime: false,
357
+ vision: true,
358
+ audio: false,
359
+ video: false,
360
+ batchAPI: true,
361
+ promptCaching: true,
362
+ parameters: {
363
+ temperature: false,
364
+ topP: false,
365
+ frequencyPenalty: false,
366
+ presencePenalty: false
367
+ },
368
+ input: {
369
+ tokens: 4e5,
370
+ text: true,
371
+ image: true,
372
+ cpm: 1.25,
373
+ cpmCached: 0.125
374
+ },
375
+ output: {
376
+ tokens: 128e3,
377
+ text: true,
378
+ cpm: 10
379
+ }
380
+ }
381
+ },
382
+ "gpt-5.1-codex": {
383
+ name: "gpt-5.1-codex",
384
+ provider: Vendor.OpenAI,
385
+ description: "GPT-5.1 codex for coding and agentic tasks with reasoning",
386
+ isActive: true,
387
+ releaseDate: "2025-10-01",
388
+ knowledgeCutoff: "2024-09-30",
389
+ features: {
390
+ reasoning: true,
391
+ streaming: true,
392
+ structuredOutput: true,
393
+ functionCalling: true,
394
+ fineTuning: false,
395
+ predictedOutputs: false,
396
+ realtime: false,
397
+ vision: true,
398
+ audio: false,
399
+ video: false,
400
+ batchAPI: true,
401
+ promptCaching: true,
402
+ parameters: {
403
+ temperature: false,
404
+ topP: false,
405
+ frequencyPenalty: false,
406
+ presencePenalty: false
407
+ },
408
+ input: {
409
+ tokens: 4e5,
410
+ text: true,
411
+ image: true,
412
+ cpm: 1.25,
413
+ cpmCached: 0.125
414
+ },
415
+ output: {
416
+ tokens: 128e3,
417
+ text: true,
418
+ cpm: 10
419
+ }
420
+ }
421
+ },
422
+ "gpt-5.1-codex-max": {
423
+ name: "gpt-5.1-codex-max",
424
+ provider: Vendor.OpenAI,
425
+ description: "GPT-5.1 codex max for maximum reasoning depth on coding tasks",
426
+ isActive: true,
427
+ releaseDate: "2025-10-01",
428
+ knowledgeCutoff: "2024-09-30",
429
+ features: {
430
+ reasoning: true,
431
+ streaming: true,
432
+ structuredOutput: true,
433
+ functionCalling: true,
434
+ fineTuning: false,
435
+ predictedOutputs: false,
436
+ realtime: false,
437
+ vision: true,
438
+ audio: false,
439
+ video: false,
440
+ batchAPI: true,
441
+ promptCaching: true,
442
+ parameters: {
443
+ temperature: false,
444
+ topP: false,
445
+ frequencyPenalty: false,
446
+ presencePenalty: false
447
+ },
448
+ input: {
449
+ tokens: 4e5,
450
+ text: true,
451
+ image: true,
452
+ cpm: 1.25,
453
+ cpmCached: 0.125
454
+ },
455
+ output: {
456
+ tokens: 128e3,
457
+ text: true,
458
+ cpm: 10
459
+ }
460
+ }
461
+ },
462
+ "gpt-5.1-codex-mini": {
463
+ name: "gpt-5.1-codex-mini",
464
+ provider: Vendor.OpenAI,
465
+ description: "GPT-5.1 codex mini for cost-efficient coding tasks",
466
+ isActive: true,
467
+ releaseDate: "2025-10-01",
468
+ knowledgeCutoff: "2024-09-30",
469
+ features: {
470
+ reasoning: true,
471
+ streaming: true,
472
+ structuredOutput: true,
473
+ functionCalling: true,
474
+ fineTuning: false,
475
+ predictedOutputs: false,
476
+ realtime: false,
477
+ vision: true,
478
+ audio: false,
479
+ video: false,
480
+ batchAPI: true,
481
+ promptCaching: true,
482
+ parameters: {
483
+ temperature: false,
484
+ topP: false,
485
+ frequencyPenalty: false,
486
+ presencePenalty: false
487
+ },
488
+ input: {
489
+ tokens: 4e5,
490
+ text: true,
491
+ image: true,
492
+ cpm: 0.25,
493
+ cpmCached: 0.025
494
+ },
495
+ output: {
496
+ tokens: 128e3,
497
+ text: true,
498
+ cpm: 2
499
+ }
500
+ }
501
+ },
502
+ "gpt-5.1-chat-latest": {
503
+ name: "gpt-5.1-chat-latest",
504
+ provider: Vendor.OpenAI,
505
+ description: "GPT-5.1 chat model for general-purpose use",
506
+ isActive: true,
507
+ releaseDate: "2025-10-01",
508
+ knowledgeCutoff: "2024-09-30",
509
+ features: {
510
+ reasoning: false,
511
+ streaming: true,
512
+ structuredOutput: true,
513
+ functionCalling: true,
514
+ fineTuning: false,
515
+ predictedOutputs: false,
516
+ realtime: false,
517
+ vision: true,
518
+ audio: false,
519
+ video: false,
520
+ batchAPI: true,
521
+ promptCaching: true,
522
+ input: {
523
+ tokens: 128e3,
524
+ text: true,
525
+ image: true,
526
+ cpm: 1.25,
527
+ cpmCached: 0.125
528
+ },
529
+ output: {
530
+ tokens: 16e3,
531
+ text: true,
532
+ cpm: 10
533
+ }
534
+ }
535
+ },
166
536
  // GPT-5 Series
167
537
  "gpt-5": {
168
538
  name: "gpt-5",
@@ -194,7 +564,8 @@ var MODEL_REGISTRY = {
194
564
  tokens: 4e5,
195
565
  text: true,
196
566
  image: true,
197
- cpm: 1.25
567
+ cpm: 1.25,
568
+ cpmCached: 0.125
198
569
  },
199
570
  output: {
200
571
  tokens: 128e3,
@@ -233,7 +604,8 @@ var MODEL_REGISTRY = {
233
604
  tokens: 4e5,
234
605
  text: true,
235
606
  image: true,
236
- cpm: 0.25
607
+ cpm: 0.25,
608
+ cpmCached: 0.025
237
609
  },
238
610
  output: {
239
611
  tokens: 128e3,
@@ -272,7 +644,8 @@ var MODEL_REGISTRY = {
272
644
  tokens: 4e5,
273
645
  text: true,
274
646
  image: true,
275
- cpm: 0.05
647
+ cpm: 0.05,
648
+ cpmCached: 5e-3
276
649
  },
277
650
  output: {
278
651
  tokens: 128e3,
@@ -281,6 +654,40 @@ var MODEL_REGISTRY = {
281
654
  }
282
655
  }
283
656
  },
657
+ "gpt-5-chat-latest": {
658
+ name: "gpt-5-chat-latest",
659
+ provider: Vendor.OpenAI,
660
+ description: "GPT-5 chat model for general-purpose use",
661
+ isActive: true,
662
+ releaseDate: "2025-08-01",
663
+ knowledgeCutoff: "2024-09-30",
664
+ features: {
665
+ reasoning: false,
666
+ streaming: true,
667
+ structuredOutput: true,
668
+ functionCalling: true,
669
+ fineTuning: false,
670
+ predictedOutputs: false,
671
+ realtime: false,
672
+ vision: true,
673
+ audio: false,
674
+ video: false,
675
+ batchAPI: true,
676
+ promptCaching: true,
677
+ input: {
678
+ tokens: 128e3,
679
+ text: true,
680
+ image: true,
681
+ cpm: 1.25,
682
+ cpmCached: 0.125
683
+ },
684
+ output: {
685
+ tokens: 16e3,
686
+ text: true,
687
+ cpm: 10
688
+ }
689
+ }
690
+ },
284
691
  // GPT-4.1 Series
285
692
  "gpt-4.1": {
286
693
  name: "gpt-4.1",
@@ -288,7 +695,7 @@ var MODEL_REGISTRY = {
288
695
  description: "GPT-4.1 specialized for coding with 1M token context window",
289
696
  isActive: true,
290
697
  releaseDate: "2025-04-14",
291
- knowledgeCutoff: "2025-04-01",
698
+ knowledgeCutoff: "2024-06-01",
292
699
  features: {
293
700
  reasoning: false,
294
701
  streaming: true,
@@ -306,7 +713,8 @@ var MODEL_REGISTRY = {
306
713
  tokens: 1e6,
307
714
  text: true,
308
715
  image: true,
309
- cpm: 2
716
+ cpm: 2,
717
+ cpmCached: 0.5
310
718
  },
311
719
  output: {
312
720
  tokens: 32768,
@@ -321,7 +729,7 @@ var MODEL_REGISTRY = {
321
729
  description: "Efficient GPT-4.1 model, beats GPT-4o in many benchmarks at 83% lower cost",
322
730
  isActive: true,
323
731
  releaseDate: "2025-04-14",
324
- knowledgeCutoff: "2025-04-01",
732
+ knowledgeCutoff: "2024-06-01",
325
733
  features: {
326
734
  reasoning: false,
327
735
  streaming: true,
@@ -339,7 +747,8 @@ var MODEL_REGISTRY = {
339
747
  tokens: 1e6,
340
748
  text: true,
341
749
  image: true,
342
- cpm: 0.4
750
+ cpm: 0.4,
751
+ cpmCached: 0.1
343
752
  },
344
753
  output: {
345
754
  tokens: 16384,
@@ -354,7 +763,7 @@ var MODEL_REGISTRY = {
354
763
  description: "Fastest and cheapest model with 1M context. 80.1% MMLU, ideal for classification/autocompletion",
355
764
  isActive: true,
356
765
  releaseDate: "2025-04-14",
357
- knowledgeCutoff: "2025-04-01",
766
+ knowledgeCutoff: "2024-06-01",
358
767
  features: {
359
768
  reasoning: false,
360
769
  streaming: true,
@@ -372,7 +781,8 @@ var MODEL_REGISTRY = {
372
781
  tokens: 1e6,
373
782
  text: true,
374
783
  image: true,
375
- cpm: 0.1
784
+ cpm: 0.1,
785
+ cpmCached: 0.025
376
786
  },
377
787
  output: {
378
788
  tokens: 16384,
@@ -381,14 +791,14 @@ var MODEL_REGISTRY = {
381
791
  }
382
792
  }
383
793
  },
384
- // GPT-4o Series (Legacy, Audio Capable)
794
+ // GPT-4o Series (Legacy)
385
795
  "gpt-4o": {
386
796
  name: "gpt-4o",
387
797
  provider: Vendor.OpenAI,
388
- description: "Versatile omni model with audio support. Legacy but still available",
798
+ description: "Versatile omni model. Legacy but still available",
389
799
  isActive: true,
390
800
  releaseDate: "2024-05-13",
391
- knowledgeCutoff: "2024-04-01",
801
+ knowledgeCutoff: "2023-10-01",
392
802
  features: {
393
803
  reasoning: false,
394
804
  streaming: true,
@@ -398,7 +808,7 @@ var MODEL_REGISTRY = {
398
808
  predictedOutputs: true,
399
809
  realtime: true,
400
810
  vision: true,
401
- audio: true,
811
+ audio: false,
402
812
  video: false,
403
813
  batchAPI: true,
404
814
  promptCaching: true,
@@ -406,13 +816,12 @@ var MODEL_REGISTRY = {
406
816
  tokens: 128e3,
407
817
  text: true,
408
818
  image: true,
409
- audio: true,
410
- cpm: 2.5
819
+ cpm: 2.5,
820
+ cpmCached: 1.25
411
821
  },
412
822
  output: {
413
823
  tokens: 16384,
414
824
  text: true,
415
- audio: true,
416
825
  cpm: 10
417
826
  }
418
827
  }
@@ -420,10 +829,10 @@ var MODEL_REGISTRY = {
420
829
  "gpt-4o-mini": {
421
830
  name: "gpt-4o-mini",
422
831
  provider: Vendor.OpenAI,
423
- description: "Fast, affordable omni model with audio support",
832
+ description: "Fast, affordable omni model",
424
833
  isActive: true,
425
834
  releaseDate: "2024-07-18",
426
- knowledgeCutoff: "2024-04-01",
835
+ knowledgeCutoff: "2023-10-01",
427
836
  features: {
428
837
  reasoning: false,
429
838
  streaming: true,
@@ -433,7 +842,7 @@ var MODEL_REGISTRY = {
433
842
  predictedOutputs: false,
434
843
  realtime: true,
435
844
  vision: true,
436
- audio: true,
845
+ audio: false,
437
846
  video: false,
438
847
  batchAPI: true,
439
848
  promptCaching: true,
@@ -441,13 +850,12 @@ var MODEL_REGISTRY = {
441
850
  tokens: 128e3,
442
851
  text: true,
443
852
  image: true,
444
- audio: true,
445
- cpm: 0.15
853
+ cpm: 0.15,
854
+ cpmCached: 0.075
446
855
  },
447
856
  output: {
448
857
  tokens: 16384,
449
858
  text: true,
450
- audio: true,
451
859
  cpm: 0.6
452
860
  }
453
861
  }
@@ -459,7 +867,46 @@ var MODEL_REGISTRY = {
459
867
  description: "Fast reasoning model tailored for coding, math, and science",
460
868
  isActive: true,
461
869
  releaseDate: "2025-01-31",
462
- knowledgeCutoff: "2024-10-01",
870
+ knowledgeCutoff: "2023-10-01",
871
+ features: {
872
+ reasoning: true,
873
+ streaming: true,
874
+ structuredOutput: true,
875
+ functionCalling: true,
876
+ fineTuning: false,
877
+ predictedOutputs: false,
878
+ realtime: false,
879
+ vision: false,
880
+ audio: false,
881
+ video: false,
882
+ batchAPI: true,
883
+ promptCaching: true,
884
+ parameters: {
885
+ temperature: false,
886
+ topP: false,
887
+ frequencyPenalty: false,
888
+ presencePenalty: false
889
+ },
890
+ input: {
891
+ tokens: 2e5,
892
+ text: true,
893
+ cpm: 1.1,
894
+ cpmCached: 0.55
895
+ },
896
+ output: {
897
+ tokens: 1e5,
898
+ text: true,
899
+ cpm: 4.4
900
+ }
901
+ }
902
+ },
903
+ "o1": {
904
+ name: "o1",
905
+ provider: Vendor.OpenAI,
906
+ description: "Advanced reasoning model for complex problems",
907
+ isActive: true,
908
+ releaseDate: "2024-12-17",
909
+ knowledgeCutoff: "2023-10-01",
463
910
  features: {
464
911
  reasoning: true,
465
912
  streaming: true,
@@ -472,35 +919,78 @@ var MODEL_REGISTRY = {
472
919
  audio: false,
473
920
  video: false,
474
921
  batchAPI: true,
475
- promptCaching: false,
476
- parameters: {
477
- temperature: false,
478
- topP: false,
479
- frequencyPenalty: false,
480
- presencePenalty: false
481
- },
922
+ promptCaching: true,
923
+ parameters: {
924
+ temperature: false,
925
+ topP: false,
926
+ frequencyPenalty: false,
927
+ presencePenalty: false
928
+ },
929
+ input: {
930
+ tokens: 2e5,
931
+ text: true,
932
+ image: true,
933
+ cpm: 15,
934
+ cpmCached: 7.5
935
+ },
936
+ output: {
937
+ tokens: 1e5,
938
+ text: true,
939
+ cpm: 60
940
+ }
941
+ }
942
+ },
943
+ // ============================================================================
944
+ // Anthropic Models (Verified from platform.claude.com - March 2026)
945
+ // ============================================================================
946
+ // Claude 4.6 Series (Current)
947
+ "claude-opus-4-6": {
948
+ name: "claude-opus-4-6",
949
+ provider: Vendor.Anthropic,
950
+ description: "The most intelligent model for building agents and coding. 128K output, adaptive thinking",
951
+ isActive: true,
952
+ preferred: true,
953
+ releaseDate: "2026-02-01",
954
+ knowledgeCutoff: "2025-05-01",
955
+ features: {
956
+ reasoning: false,
957
+ streaming: true,
958
+ structuredOutput: true,
959
+ functionCalling: true,
960
+ fineTuning: false,
961
+ predictedOutputs: false,
962
+ realtime: false,
963
+ vision: true,
964
+ audio: false,
965
+ video: false,
966
+ extendedThinking: true,
967
+ batchAPI: true,
968
+ promptCaching: true,
482
969
  input: {
483
970
  tokens: 2e5,
971
+ // 1M with beta header
484
972
  text: true,
485
973
  image: true,
486
- cpm: 1.1
974
+ cpm: 5,
975
+ cpmCached: 0.5
487
976
  },
488
977
  output: {
489
- tokens: 1e5,
978
+ tokens: 128e3,
490
979
  text: true,
491
- cpm: 4.4
980
+ cpm: 25
492
981
  }
493
982
  }
494
983
  },
495
- "o1": {
496
- name: "o1",
497
- provider: Vendor.OpenAI,
498
- description: "Advanced reasoning model for complex problems",
984
+ "claude-sonnet-4-6": {
985
+ name: "claude-sonnet-4-6",
986
+ provider: Vendor.Anthropic,
987
+ description: "Best combination of speed and intelligence. Adaptive thinking, 1M context beta",
499
988
  isActive: true,
500
- releaseDate: "2024-12-17",
501
- knowledgeCutoff: "2024-10-01",
989
+ preferred: true,
990
+ releaseDate: "2026-02-01",
991
+ knowledgeCutoff: "2025-08-01",
502
992
  features: {
503
- reasoning: true,
993
+ reasoning: false,
504
994
  streaming: true,
505
995
  structuredOutput: true,
506
996
  functionCalling: true,
@@ -510,35 +1000,29 @@ var MODEL_REGISTRY = {
510
1000
  vision: true,
511
1001
  audio: false,
512
1002
  video: false,
1003
+ extendedThinking: true,
513
1004
  batchAPI: true,
514
- promptCaching: false,
515
- parameters: {
516
- temperature: false,
517
- topP: false,
518
- frequencyPenalty: false,
519
- presencePenalty: false
520
- },
1005
+ promptCaching: true,
521
1006
  input: {
522
1007
  tokens: 2e5,
1008
+ // 1M with beta header
523
1009
  text: true,
524
1010
  image: true,
525
- cpm: 15
1011
+ cpm: 3,
1012
+ cpmCached: 0.3
526
1013
  },
527
1014
  output: {
528
- tokens: 1e5,
1015
+ tokens: 64e3,
529
1016
  text: true,
530
- cpm: 60
1017
+ cpm: 15
531
1018
  }
532
1019
  }
533
1020
  },
534
- // ============================================================================
535
- // Anthropic Models (Verified from platform.claude.com)
536
- // ============================================================================
537
- // Claude 4.5 Series (Current)
1021
+ // Claude 4.5 Series
538
1022
  "claude-opus-4-5-20251101": {
539
1023
  name: "claude-opus-4-5-20251101",
540
1024
  provider: Vendor.Anthropic,
541
- description: "Premium model combining maximum intelligence with practical performance",
1025
+ description: "Legacy Opus 4.5. Premium model combining maximum intelligence with practical performance",
542
1026
  isActive: true,
543
1027
  releaseDate: "2025-11-01",
544
1028
  knowledgeCutoff: "2025-05-01",
@@ -573,7 +1057,7 @@ var MODEL_REGISTRY = {
573
1057
  "claude-sonnet-4-5-20250929": {
574
1058
  name: "claude-sonnet-4-5-20250929",
575
1059
  provider: Vendor.Anthropic,
576
- description: "Smart model for complex agents and coding. Best balance of intelligence, speed, cost",
1060
+ description: "Legacy Sonnet 4.5. Smart model for complex agents and coding",
577
1061
  isActive: true,
578
1062
  releaseDate: "2025-09-29",
579
1063
  knowledgeCutoff: "2025-01-01",
@@ -593,6 +1077,7 @@ var MODEL_REGISTRY = {
593
1077
  promptCaching: true,
594
1078
  input: {
595
1079
  tokens: 2e5,
1080
+ // 1M with beta header
596
1081
  text: true,
597
1082
  image: true,
598
1083
  cpm: 3,
@@ -676,10 +1161,45 @@ var MODEL_REGISTRY = {
676
1161
  }
677
1162
  }
678
1163
  },
1164
+ "claude-opus-4-20250514": {
1165
+ name: "claude-opus-4-20250514",
1166
+ provider: Vendor.Anthropic,
1167
+ description: "Legacy Opus 4. Agentic tasks and reasoning",
1168
+ isActive: true,
1169
+ releaseDate: "2025-05-14",
1170
+ knowledgeCutoff: "2025-01-01",
1171
+ features: {
1172
+ reasoning: false,
1173
+ streaming: true,
1174
+ structuredOutput: true,
1175
+ functionCalling: true,
1176
+ fineTuning: false,
1177
+ predictedOutputs: false,
1178
+ realtime: false,
1179
+ vision: true,
1180
+ audio: false,
1181
+ video: false,
1182
+ extendedThinking: true,
1183
+ batchAPI: true,
1184
+ promptCaching: true,
1185
+ input: {
1186
+ tokens: 2e5,
1187
+ text: true,
1188
+ image: true,
1189
+ cpm: 15,
1190
+ cpmCached: 1.5
1191
+ },
1192
+ output: {
1193
+ tokens: 32e3,
1194
+ text: true,
1195
+ cpm: 75
1196
+ }
1197
+ }
1198
+ },
679
1199
  "claude-sonnet-4-20250514": {
680
1200
  name: "claude-sonnet-4-20250514",
681
1201
  provider: Vendor.Anthropic,
682
- description: "Legacy Sonnet 4. Default for most users, supports 1M context beta",
1202
+ description: "Legacy Sonnet 4. Supports 1M context beta",
683
1203
  isActive: true,
684
1204
  releaseDate: "2025-05-14",
685
1205
  knowledgeCutoff: "2025-01-01",
@@ -715,7 +1235,7 @@ var MODEL_REGISTRY = {
715
1235
  "claude-3-7-sonnet-20250219": {
716
1236
  name: "claude-3-7-sonnet-20250219",
717
1237
  provider: Vendor.Anthropic,
718
- description: "Claude 3.7 Sonnet with extended thinking, supports 128K output beta",
1238
+ description: "Deprecated. Claude 3.7 Sonnet with extended thinking",
719
1239
  isActive: true,
720
1240
  releaseDate: "2025-02-19",
721
1241
  knowledgeCutoff: "2024-10-01",
@@ -742,17 +1262,16 @@ var MODEL_REGISTRY = {
742
1262
  },
743
1263
  output: {
744
1264
  tokens: 64e3,
745
- // 128K with beta header
746
1265
  text: true,
747
1266
  cpm: 15
748
1267
  }
749
1268
  }
750
1269
  },
751
- // Claude 3.x Legacy
1270
+ // Claude 3.x Legacy (Deprecated - retiring April 19, 2026)
752
1271
  "claude-3-haiku-20240307": {
753
1272
  name: "claude-3-haiku-20240307",
754
1273
  provider: Vendor.Anthropic,
755
- description: "Fast legacy model. Recommend migrating to Haiku 4.5",
1274
+ description: "Deprecated. Retiring April 19, 2026. Migrate to Haiku 4.5",
756
1275
  isActive: true,
757
1276
  releaseDate: "2024-03-07",
758
1277
  knowledgeCutoff: "2023-08-01",
@@ -785,16 +1304,124 @@ var MODEL_REGISTRY = {
785
1304
  }
786
1305
  },
787
1306
  // ============================================================================
788
- // Google Models (Verified from ai.google.dev)
1307
+ // Google Models (Verified from ai.google.dev - March 2026)
789
1308
  // ============================================================================
1309
+ // Gemini 3.1 Series (Preview)
1310
+ "gemini-3.1-pro-preview": {
1311
+ name: "gemini-3.1-pro-preview",
1312
+ provider: Vendor.Google,
1313
+ description: "Advanced intelligence with powerful agentic and coding capabilities. Replaces gemini-3-pro-preview",
1314
+ isActive: true,
1315
+ preferred: true,
1316
+ releaseDate: "2026-02-01",
1317
+ knowledgeCutoff: "2025-01-01",
1318
+ features: {
1319
+ reasoning: true,
1320
+ streaming: true,
1321
+ structuredOutput: true,
1322
+ functionCalling: true,
1323
+ fineTuning: false,
1324
+ predictedOutputs: false,
1325
+ realtime: false,
1326
+ vision: true,
1327
+ audio: true,
1328
+ video: true,
1329
+ batchAPI: true,
1330
+ promptCaching: true,
1331
+ input: {
1332
+ tokens: 1048576,
1333
+ text: true,
1334
+ image: true,
1335
+ audio: true,
1336
+ video: true,
1337
+ cpm: 2,
1338
+ cpmCached: 0.2
1339
+ },
1340
+ output: {
1341
+ tokens: 65536,
1342
+ text: true,
1343
+ cpm: 12
1344
+ }
1345
+ }
1346
+ },
1347
+ "gemini-3.1-flash-lite-preview": {
1348
+ name: "gemini-3.1-flash-lite-preview",
1349
+ provider: Vendor.Google,
1350
+ description: "High performance, budget-friendly for high-volume agentic tasks and data extraction",
1351
+ isActive: true,
1352
+ releaseDate: "2026-03-01",
1353
+ knowledgeCutoff: "2025-01-01",
1354
+ features: {
1355
+ reasoning: true,
1356
+ streaming: true,
1357
+ structuredOutput: true,
1358
+ functionCalling: true,
1359
+ fineTuning: false,
1360
+ predictedOutputs: false,
1361
+ realtime: false,
1362
+ vision: true,
1363
+ audio: true,
1364
+ video: true,
1365
+ batchAPI: true,
1366
+ promptCaching: true,
1367
+ input: {
1368
+ tokens: 1048576,
1369
+ text: true,
1370
+ image: true,
1371
+ audio: true,
1372
+ video: true,
1373
+ cpm: 0.25
1374
+ },
1375
+ output: {
1376
+ tokens: 65536,
1377
+ text: true,
1378
+ cpm: 1.5
1379
+ }
1380
+ }
1381
+ },
1382
+ "gemini-3.1-flash-image-preview": {
1383
+ name: "gemini-3.1-flash-image-preview",
1384
+ provider: Vendor.Google,
1385
+ description: "High-efficiency image generation with up to 4K output, search grounding support",
1386
+ isActive: true,
1387
+ releaseDate: "2026-02-01",
1388
+ knowledgeCutoff: "2025-01-01",
1389
+ features: {
1390
+ reasoning: true,
1391
+ streaming: true,
1392
+ structuredOutput: false,
1393
+ functionCalling: false,
1394
+ fineTuning: false,
1395
+ predictedOutputs: false,
1396
+ realtime: false,
1397
+ vision: true,
1398
+ audio: false,
1399
+ video: false,
1400
+ batchAPI: true,
1401
+ promptCaching: false,
1402
+ input: {
1403
+ tokens: 131072,
1404
+ text: true,
1405
+ image: true,
1406
+ cpm: 0.25
1407
+ },
1408
+ output: {
1409
+ tokens: 32768,
1410
+ text: true,
1411
+ image: true,
1412
+ cpm: 1.5
1413
+ }
1414
+ }
1415
+ },
790
1416
  // Gemini 3 Series (Preview)
791
1417
  "gemini-3-flash-preview": {
792
1418
  name: "gemini-3-flash-preview",
793
1419
  provider: Vendor.Google,
794
- description: "Pro-grade reasoning with Flash-level latency and efficiency",
1420
+ description: "Most powerful agentic and coding model with frontier-class reasoning",
795
1421
  isActive: true,
796
- releaseDate: "2025-11-18",
797
- knowledgeCutoff: "2025-08-01",
1422
+ preferred: true,
1423
+ releaseDate: "2025-12-01",
1424
+ knowledgeCutoff: "2025-01-01",
798
1425
  features: {
799
1426
  reasoning: true,
800
1427
  streaming: true,
@@ -809,27 +1436,28 @@ var MODEL_REGISTRY = {
809
1436
  batchAPI: true,
810
1437
  promptCaching: true,
811
1438
  input: {
812
- tokens: 1e6,
1439
+ tokens: 1048576,
813
1440
  text: true,
814
1441
  image: true,
815
1442
  audio: true,
816
1443
  video: true,
817
- cpm: 0.15
1444
+ cpm: 0.5,
1445
+ cpmCached: 0.05
818
1446
  },
819
1447
  output: {
820
1448
  tokens: 65536,
821
1449
  text: true,
822
- cpm: 0.6
1450
+ cpm: 3
823
1451
  }
824
1452
  }
825
1453
  },
826
1454
  "gemini-3-pro-preview": {
827
1455
  name: "gemini-3-pro-preview",
828
1456
  provider: Vendor.Google,
829
- description: "Most advanced reasoning Gemini model for complex tasks",
1457
+ description: "Deprecated. Shutting down March 9, 2026. Migrate to gemini-3.1-pro-preview",
830
1458
  isActive: true,
831
1459
  releaseDate: "2025-11-18",
832
- knowledgeCutoff: "2025-08-01",
1460
+ knowledgeCutoff: "2025-01-01",
833
1461
  features: {
834
1462
  reasoning: true,
835
1463
  streaming: true,
@@ -844,7 +1472,7 @@ var MODEL_REGISTRY = {
844
1472
  batchAPI: true,
845
1473
  promptCaching: true,
846
1474
  input: {
847
- tokens: 1e6,
1475
+ tokens: 1048576,
848
1476
  text: true,
849
1477
  image: true,
850
1478
  audio: true,
@@ -861,14 +1489,14 @@ var MODEL_REGISTRY = {
861
1489
  "gemini-3-pro-image-preview": {
862
1490
  name: "gemini-3-pro-image-preview",
863
1491
  provider: Vendor.Google,
864
- description: "Highest quality image generation model",
1492
+ description: "Professional-grade image generation and editing with reasoning",
865
1493
  isActive: true,
866
1494
  releaseDate: "2025-11-18",
867
- knowledgeCutoff: "2025-08-01",
1495
+ knowledgeCutoff: "2025-01-01",
868
1496
  features: {
869
1497
  reasoning: true,
870
1498
  streaming: true,
871
- structuredOutput: false,
1499
+ structuredOutput: true,
872
1500
  functionCalling: false,
873
1501
  fineTuning: false,
874
1502
  predictedOutputs: false,
@@ -877,15 +1505,15 @@ var MODEL_REGISTRY = {
877
1505
  audio: false,
878
1506
  video: false,
879
1507
  batchAPI: true,
880
- promptCaching: true,
1508
+ promptCaching: false,
881
1509
  input: {
882
- tokens: 1e6,
1510
+ tokens: 65536,
883
1511
  text: true,
884
1512
  image: true,
885
1513
  cpm: 1.25
886
1514
  },
887
1515
  output: {
888
- tokens: 65536,
1516
+ tokens: 32768,
889
1517
  text: true,
890
1518
  image: true,
891
1519
  cpm: 10
@@ -896,7 +1524,7 @@ var MODEL_REGISTRY = {
896
1524
  "gemini-2.5-pro": {
897
1525
  name: "gemini-2.5-pro",
898
1526
  provider: Vendor.Google,
899
- description: "Advanced multimodal model built for deep reasoning and agents",
1527
+ description: "Most advanced model for complex tasks with deep reasoning and coding",
900
1528
  isActive: true,
901
1529
  releaseDate: "2025-03-01",
902
1530
  knowledgeCutoff: "2025-01-01",
@@ -914,12 +1542,13 @@ var MODEL_REGISTRY = {
914
1542
  batchAPI: true,
915
1543
  promptCaching: true,
916
1544
  input: {
917
- tokens: 1e6,
1545
+ tokens: 1048576,
918
1546
  text: true,
919
1547
  image: true,
920
1548
  audio: true,
921
1549
  video: true,
922
- cpm: 1.25
1550
+ cpm: 1.25,
1551
+ cpmCached: 0.125
923
1552
  },
924
1553
  output: {
925
1554
  tokens: 65536,
@@ -931,7 +1560,7 @@ var MODEL_REGISTRY = {
931
1560
  "gemini-2.5-flash": {
932
1561
  name: "gemini-2.5-flash",
933
1562
  provider: Vendor.Google,
934
- description: "Fast, cost-effective model with excellent reasoning",
1563
+ description: "Best price-performance for low-latency, high-volume tasks with reasoning",
935
1564
  isActive: true,
936
1565
  releaseDate: "2025-06-17",
937
1566
  knowledgeCutoff: "2025-01-01",
@@ -949,24 +1578,25 @@ var MODEL_REGISTRY = {
949
1578
  batchAPI: true,
950
1579
  promptCaching: true,
951
1580
  input: {
952
- tokens: 1e6,
1581
+ tokens: 1048576,
953
1582
  text: true,
954
1583
  image: true,
955
1584
  audio: true,
956
1585
  video: true,
957
- cpm: 0.15
1586
+ cpm: 0.3,
1587
+ cpmCached: 0.03
958
1588
  },
959
1589
  output: {
960
1590
  tokens: 65536,
961
1591
  text: true,
962
- cpm: 0.6
1592
+ cpm: 2.5
963
1593
  }
964
1594
  }
965
1595
  },
966
1596
  "gemini-2.5-flash-lite": {
967
1597
  name: "gemini-2.5-flash-lite",
968
1598
  provider: Vendor.Google,
969
- description: "Lowest latency for high-volume tasks, summarization, classification",
1599
+ description: "Fastest and most budget-friendly multimodal model in the 2.5 family",
970
1600
  isActive: true,
971
1601
  releaseDate: "2025-06-17",
972
1602
  knowledgeCutoff: "2025-01-01",
@@ -984,31 +1614,31 @@ var MODEL_REGISTRY = {
984
1614
  batchAPI: true,
985
1615
  promptCaching: true,
986
1616
  input: {
987
- tokens: 1e6,
1617
+ tokens: 1048576,
988
1618
  text: true,
989
1619
  image: true,
990
1620
  audio: true,
991
1621
  video: true,
992
- cpm: 0.075
1622
+ cpm: 0.1
993
1623
  },
994
1624
  output: {
995
1625
  tokens: 65536,
996
1626
  text: true,
997
- cpm: 0.3
1627
+ cpm: 0.4
998
1628
  }
999
1629
  }
1000
1630
  },
1001
1631
  "gemini-2.5-flash-image": {
1002
1632
  name: "gemini-2.5-flash-image",
1003
1633
  provider: Vendor.Google,
1004
- description: "Image generation and editing model",
1634
+ description: "Fast native image generation and editing (Nano Banana)",
1005
1635
  isActive: true,
1006
- releaseDate: "2025-09-01",
1007
- knowledgeCutoff: "2025-01-01",
1636
+ releaseDate: "2025-10-01",
1637
+ knowledgeCutoff: "2025-06-01",
1008
1638
  features: {
1009
- reasoning: true,
1639
+ reasoning: false,
1010
1640
  streaming: true,
1011
- structuredOutput: false,
1641
+ structuredOutput: true,
1012
1642
  functionCalling: false,
1013
1643
  fineTuning: false,
1014
1644
  predictedOutputs: false,
@@ -1019,13 +1649,13 @@ var MODEL_REGISTRY = {
1019
1649
  batchAPI: true,
1020
1650
  promptCaching: true,
1021
1651
  input: {
1022
- tokens: 1e6,
1652
+ tokens: 65536,
1023
1653
  text: true,
1024
1654
  image: true,
1025
1655
  cpm: 0.15
1026
1656
  },
1027
1657
  output: {
1028
- tokens: 65536,
1658
+ tokens: 32768,
1029
1659
  text: true,
1030
1660
  image: true,
1031
1661
  cpm: 0.6
@@ -1033,7 +1663,7 @@ var MODEL_REGISTRY = {
1033
1663
  }
1034
1664
  },
1035
1665
  // ============================================================================
1036
- // xAI Grok Models (Verified from docs.x.ai - January 2026)
1666
+ // xAI Grok Models (Verified from docs.x.ai - March 2026)
1037
1667
  // ============================================================================
1038
1668
  // Grok 4.1 Series (2M context, fast)
1039
1669
  "grok-4-1-fast-reasoning": {
@@ -1054,13 +1684,14 @@ var MODEL_REGISTRY = {
1054
1684
  vision: true,
1055
1685
  audio: false,
1056
1686
  video: false,
1057
- batchAPI: false,
1058
- promptCaching: false,
1687
+ batchAPI: true,
1688
+ promptCaching: true,
1059
1689
  input: {
1060
1690
  tokens: 2e6,
1061
1691
  text: true,
1062
1692
  image: true,
1063
- cpm: 0.2
1693
+ cpm: 0.2,
1694
+ cpmCached: 0.05
1064
1695
  },
1065
1696
  output: {
1066
1697
  tokens: 65536,
@@ -1087,13 +1718,14 @@ var MODEL_REGISTRY = {
1087
1718
  vision: true,
1088
1719
  audio: false,
1089
1720
  video: false,
1090
- batchAPI: false,
1091
- promptCaching: false,
1721
+ batchAPI: true,
1722
+ promptCaching: true,
1092
1723
  input: {
1093
1724
  tokens: 2e6,
1094
1725
  text: true,
1095
1726
  image: true,
1096
- cpm: 0.2
1727
+ cpm: 0.2,
1728
+ cpmCached: 0.05
1097
1729
  },
1098
1730
  output: {
1099
1731
  tokens: 65536,
@@ -1121,12 +1753,13 @@ var MODEL_REGISTRY = {
1121
1753
  vision: false,
1122
1754
  audio: false,
1123
1755
  video: false,
1124
- batchAPI: false,
1125
- promptCaching: false,
1756
+ batchAPI: true,
1757
+ promptCaching: true,
1126
1758
  input: {
1127
1759
  tokens: 256e3,
1128
1760
  text: true,
1129
- cpm: 0.2
1761
+ cpm: 0.2,
1762
+ cpmCached: 0.02
1130
1763
  },
1131
1764
  output: {
1132
1765
  tokens: 32768,
@@ -1139,7 +1772,7 @@ var MODEL_REGISTRY = {
1139
1772
  "grok-4-fast-reasoning": {
1140
1773
  name: "grok-4-fast-reasoning",
1141
1774
  provider: Vendor.Grok,
1142
- description: "Fast Grok 4 with reasoning capabilities, 2M context window",
1775
+ description: "Fast Grok 4 with reasoning capabilities, 2M context window, vision support",
1143
1776
  isActive: true,
1144
1777
  releaseDate: "2025-09-01",
1145
1778
  knowledgeCutoff: "2024-11-01",
@@ -1151,15 +1784,17 @@ var MODEL_REGISTRY = {
1151
1784
  fineTuning: false,
1152
1785
  predictedOutputs: false,
1153
1786
  realtime: false,
1154
- vision: false,
1787
+ vision: true,
1155
1788
  audio: false,
1156
1789
  video: false,
1157
- batchAPI: false,
1158
- promptCaching: false,
1790
+ batchAPI: true,
1791
+ promptCaching: true,
1159
1792
  input: {
1160
1793
  tokens: 2e6,
1161
1794
  text: true,
1162
- cpm: 0.2
1795
+ image: true,
1796
+ cpm: 0.2,
1797
+ cpmCached: 0.05
1163
1798
  },
1164
1799
  output: {
1165
1800
  tokens: 65536,
@@ -1186,13 +1821,14 @@ var MODEL_REGISTRY = {
1186
1821
  vision: true,
1187
1822
  audio: false,
1188
1823
  video: false,
1189
- batchAPI: false,
1190
- promptCaching: false,
1824
+ batchAPI: true,
1825
+ promptCaching: true,
1191
1826
  input: {
1192
1827
  tokens: 2e6,
1193
1828
  text: true,
1194
1829
  image: true,
1195
- cpm: 0.2
1830
+ cpm: 0.2,
1831
+ cpmCached: 0.05
1196
1832
  },
1197
1833
  output: {
1198
1834
  tokens: 65536,
@@ -1204,12 +1840,12 @@ var MODEL_REGISTRY = {
1204
1840
  "grok-4-0709": {
1205
1841
  name: "grok-4-0709",
1206
1842
  provider: Vendor.Grok,
1207
- description: "Grok 4 flagship model (July 2025 release), 256K context, vision support",
1843
+ description: "Grok 4 flagship model (July 2025 release), 256K context, vision support, reasoning",
1208
1844
  isActive: true,
1209
1845
  releaseDate: "2025-07-09",
1210
1846
  knowledgeCutoff: "2024-11-01",
1211
1847
  features: {
1212
- reasoning: false,
1848
+ reasoning: true,
1213
1849
  streaming: true,
1214
1850
  structuredOutput: true,
1215
1851
  functionCalling: true,
@@ -1219,13 +1855,14 @@ var MODEL_REGISTRY = {
1219
1855
  vision: true,
1220
1856
  audio: false,
1221
1857
  video: false,
1222
- batchAPI: false,
1223
- promptCaching: false,
1858
+ batchAPI: true,
1859
+ promptCaching: true,
1224
1860
  input: {
1225
1861
  tokens: 256e3,
1226
1862
  text: true,
1227
1863
  image: true,
1228
- cpm: 3
1864
+ cpm: 3,
1865
+ cpmCached: 0.75
1229
1866
  },
1230
1867
  output: {
1231
1868
  tokens: 32768,
@@ -1238,12 +1875,12 @@ var MODEL_REGISTRY = {
1238
1875
  "grok-3-mini": {
1239
1876
  name: "grok-3-mini",
1240
1877
  provider: Vendor.Grok,
1241
- description: "Lightweight, cost-efficient model for simpler tasks, 131K context",
1878
+ description: "Lightweight, cost-efficient model with reasoning, 131K context",
1242
1879
  isActive: true,
1243
1880
  releaseDate: "2025-06-01",
1244
1881
  knowledgeCutoff: "2024-11-01",
1245
1882
  features: {
1246
- reasoning: false,
1883
+ reasoning: true,
1247
1884
  streaming: true,
1248
1885
  structuredOutput: true,
1249
1886
  functionCalling: true,
@@ -1253,12 +1890,13 @@ var MODEL_REGISTRY = {
1253
1890
  vision: false,
1254
1891
  audio: false,
1255
1892
  video: false,
1256
- batchAPI: false,
1257
- promptCaching: false,
1893
+ batchAPI: true,
1894
+ promptCaching: true,
1258
1895
  input: {
1259
1896
  tokens: 131072,
1260
1897
  text: true,
1261
- cpm: 0.3
1898
+ cpm: 0.3,
1899
+ cpmCached: 0.07
1262
1900
  },
1263
1901
  output: {
1264
1902
  tokens: 32768,
@@ -1285,12 +1923,13 @@ var MODEL_REGISTRY = {
1285
1923
  vision: false,
1286
1924
  audio: false,
1287
1925
  video: false,
1288
- batchAPI: false,
1289
- promptCaching: false,
1926
+ batchAPI: true,
1927
+ promptCaching: true,
1290
1928
  input: {
1291
1929
  tokens: 131072,
1292
1930
  text: true,
1293
- cpm: 3
1931
+ cpm: 3,
1932
+ cpmCached: 0.75
1294
1933
  },
1295
1934
  output: {
1296
1935
  tokens: 32768,
@@ -1299,11 +1938,11 @@ var MODEL_REGISTRY = {
1299
1938
  }
1300
1939
  }
1301
1940
  },
1302
- // Grok 2 Series (Vision)
1941
+ // Grok 2 Series (Legacy - not in current docs)
1303
1942
  "grok-2-vision-1212": {
1304
1943
  name: "grok-2-vision-1212",
1305
1944
  provider: Vendor.Grok,
1306
- description: "Vision-capable model for image understanding, 32K context",
1945
+ description: "Legacy vision model for image understanding, 32K context. Not in current xAI docs",
1307
1946
  isActive: true,
1308
1947
  releaseDate: "2024-12-12",
1309
1948
  knowledgeCutoff: "2024-11-01",
@@ -1576,6 +2215,14 @@ var SERVICE_DEFINITIONS = [
1576
2215
  baseURL: "https://aws.amazon.com",
1577
2216
  docsURL: "https://docs.aws.amazon.com/"
1578
2217
  },
2218
+ {
2219
+ id: "cloudflare",
2220
+ name: "Cloudflare",
2221
+ category: "cloud",
2222
+ urlPattern: /api\.cloudflare\.com/i,
2223
+ baseURL: "https://api.cloudflare.com/client/v4",
2224
+ docsURL: "https://developers.cloudflare.com/api/"
2225
+ },
1579
2226
  // ============ Storage ============
1580
2227
  {
1581
2228
  id: "dropbox",
@@ -1619,6 +2266,14 @@ var SERVICE_DEFINITIONS = [
1619
2266
  baseURL: "https://api.postmarkapp.com",
1620
2267
  docsURL: "https://postmarkapp.com/developer"
1621
2268
  },
2269
+ {
2270
+ id: "mailgun",
2271
+ name: "Mailgun",
2272
+ category: "email",
2273
+ urlPattern: /api\.mailgun\.net|api\.eu\.mailgun\.net/i,
2274
+ baseURL: "https://api.mailgun.net/v3",
2275
+ docsURL: "https://documentation.mailgun.com/docs/mailgun/api-reference/"
2276
+ },
1622
2277
  // ============ Monitoring & Observability ============
1623
2278
  {
1624
2279
  id: "datadog",