@mariozechner/pi-ai 0.53.0 → 0.53.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -359,6 +359,23 @@ export const MODELS = {
359
359
  contextWindow: 200000,
360
360
  maxTokens: 64000,
361
361
  },
362
+ "anthropic.claude-sonnet-4-6": {
363
+ id: "anthropic.claude-sonnet-4-6",
364
+ name: "Claude Sonnet 4.6",
365
+ api: "bedrock-converse-stream",
366
+ provider: "amazon-bedrock",
367
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
368
+ reasoning: true,
369
+ input: ["text", "image"],
370
+ cost: {
371
+ input: 3,
372
+ output: 15,
373
+ cacheRead: 0.3,
374
+ cacheWrite: 3.75,
375
+ },
376
+ contextWindow: 200000,
377
+ maxTokens: 64000,
378
+ },
362
379
  "cohere.command-r-plus-v1:0": {
363
380
  id: "cohere.command-r-plus-v1:0",
364
381
  name: "Command R+",
@@ -529,6 +546,23 @@ export const MODELS = {
529
546
  contextWindow: 200000,
530
547
  maxTokens: 64000,
531
548
  },
549
+ "eu.anthropic.claude-sonnet-4-6": {
550
+ id: "eu.anthropic.claude-sonnet-4-6",
551
+ name: "Claude Sonnet 4.6 (EU)",
552
+ api: "bedrock-converse-stream",
553
+ provider: "amazon-bedrock",
554
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
555
+ reasoning: true,
556
+ input: ["text", "image"],
557
+ cost: {
558
+ input: 3,
559
+ output: 15,
560
+ cacheRead: 0.3,
561
+ cacheWrite: 3.75,
562
+ },
563
+ contextWindow: 200000,
564
+ maxTokens: 64000,
565
+ },
532
566
  "global.anthropic.claude-haiku-4-5-20251001-v1:0": {
533
567
  id: "global.anthropic.claude-haiku-4-5-20251001-v1:0",
534
568
  name: "Claude Haiku 4.5 (Global)",
@@ -614,6 +648,23 @@ export const MODELS = {
614
648
  contextWindow: 200000,
615
649
  maxTokens: 64000,
616
650
  },
651
+ "global.anthropic.claude-sonnet-4-6": {
652
+ id: "global.anthropic.claude-sonnet-4-6",
653
+ name: "Claude Sonnet 4.6 (Global)",
654
+ api: "bedrock-converse-stream",
655
+ provider: "amazon-bedrock",
656
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
657
+ reasoning: true,
658
+ input: ["text", "image"],
659
+ cost: {
660
+ input: 3,
661
+ output: 15,
662
+ cacheRead: 0.3,
663
+ cacheWrite: 3.75,
664
+ },
665
+ contextWindow: 200000,
666
+ maxTokens: 64000,
667
+ },
617
668
  "google.gemma-3-27b-it": {
618
669
  id: "google.gemma-3-27b-it",
619
670
  name: "Google Gemma 3 27B Instruct",
@@ -1277,6 +1328,23 @@ export const MODELS = {
1277
1328
  contextWindow: 200000,
1278
1329
  maxTokens: 64000,
1279
1330
  },
1331
+ "us.anthropic.claude-sonnet-4-6": {
1332
+ id: "us.anthropic.claude-sonnet-4-6",
1333
+ name: "Claude Sonnet 4.6 (US)",
1334
+ api: "bedrock-converse-stream",
1335
+ provider: "amazon-bedrock",
1336
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1337
+ reasoning: true,
1338
+ input: ["text", "image"],
1339
+ cost: {
1340
+ input: 3,
1341
+ output: 15,
1342
+ cacheRead: 0.3,
1343
+ cacheWrite: 3.75,
1344
+ },
1345
+ contextWindow: 200000,
1346
+ maxTokens: 64000,
1347
+ },
1280
1348
  "writer.palmyra-x4-v1:0": {
1281
1349
  id: "writer.palmyra-x4-v1:0",
1282
1350
  name: "Palmyra X4",
@@ -2514,6 +2582,24 @@ export const MODELS = {
2514
2582
  contextWindow: 128000,
2515
2583
  maxTokens: 32000,
2516
2584
  },
2585
+ "claude-sonnet-4.6": {
2586
+ id: "claude-sonnet-4.6",
2587
+ name: "Claude Sonnet 4.6",
2588
+ api: "anthropic-messages",
2589
+ provider: "github-copilot",
2590
+ baseUrl: "https://api.individual.githubcopilot.com",
2591
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
2592
+ reasoning: true,
2593
+ input: ["text", "image"],
2594
+ cost: {
2595
+ input: 0,
2596
+ output: 0,
2597
+ cacheRead: 0,
2598
+ cacheWrite: 0,
2599
+ },
2600
+ contextWindow: 128000,
2601
+ maxTokens: 32000,
2602
+ },
2517
2603
  "gemini-2.5-pro": {
2518
2604
  id: "gemini-2.5-pro",
2519
2605
  name: "Gemini 2.5 Pro",
@@ -3063,6 +3149,40 @@ export const MODELS = {
3063
3149
  contextWindow: 1000000,
3064
3150
  maxTokens: 64000,
3065
3151
  },
3152
+ "gemini-3.1-pro-preview": {
3153
+ id: "gemini-3.1-pro-preview",
3154
+ name: "Gemini 3.1 Pro Preview",
3155
+ api: "google-generative-ai",
3156
+ provider: "google",
3157
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3158
+ reasoning: true,
3159
+ input: ["text", "image"],
3160
+ cost: {
3161
+ input: 2,
3162
+ output: 12,
3163
+ cacheRead: 0.2,
3164
+ cacheWrite: 0,
3165
+ },
3166
+ contextWindow: 1048576,
3167
+ maxTokens: 65536,
3168
+ },
3169
+ "gemini-3.1-pro-preview-customtools": {
3170
+ id: "gemini-3.1-pro-preview-customtools",
3171
+ name: "Gemini 3.1 Pro Preview Custom Tools",
3172
+ api: "google-generative-ai",
3173
+ provider: "google",
3174
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3175
+ reasoning: true,
3176
+ input: ["text", "image"],
3177
+ cost: {
3178
+ input: 2,
3179
+ output: 12,
3180
+ cacheRead: 0.2,
3181
+ cacheWrite: 0,
3182
+ },
3183
+ contextWindow: 1048576,
3184
+ maxTokens: 65536,
3185
+ },
3066
3186
  "gemini-flash-latest": {
3067
3187
  id: "gemini-flash-latest",
3068
3188
  name: "Gemini Flash Latest",
@@ -3150,6 +3270,23 @@ export const MODELS = {
3150
3270
  contextWindow: 200000,
3151
3271
  maxTokens: 64000,
3152
3272
  },
3273
+ "claude-opus-4-6-thinking": {
3274
+ id: "claude-opus-4-6-thinking",
3275
+ name: "Claude Opus 4.6 Thinking (Antigravity)",
3276
+ api: "google-gemini-cli",
3277
+ provider: "google-antigravity",
3278
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
3279
+ reasoning: true,
3280
+ input: ["text", "image"],
3281
+ cost: {
3282
+ input: 5,
3283
+ output: 25,
3284
+ cacheRead: 0.5,
3285
+ cacheWrite: 6.25,
3286
+ },
3287
+ contextWindow: 200000,
3288
+ maxTokens: 128000,
3289
+ },
3153
3290
  "claude-sonnet-4-5": {
3154
3291
  id: "claude-sonnet-4-5",
3155
3292
  name: "Claude Sonnet 4.5 (Antigravity)",
@@ -3528,6 +3665,23 @@ export const MODELS = {
3528
3665
  contextWindow: 1000000,
3529
3666
  maxTokens: 64000,
3530
3667
  },
3668
+ "gemini-3.1-pro-preview": {
3669
+ id: "gemini-3.1-pro-preview",
3670
+ name: "Gemini 3.1 Pro Preview (Vertex)",
3671
+ api: "google-vertex",
3672
+ provider: "google-vertex",
3673
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
3674
+ reasoning: true,
3675
+ input: ["text", "image"],
3676
+ cost: {
3677
+ input: 2,
3678
+ output: 12,
3679
+ cacheRead: 0.2,
3680
+ cacheWrite: 0,
3681
+ },
3682
+ contextWindow: 1048576,
3683
+ maxTokens: 65536,
3684
+ },
3531
3685
  },
3532
3686
  "groq": {
3533
3687
  "deepseek-r1-distill-llama-70b": {
@@ -5454,9 +5608,9 @@ export const MODELS = {
5454
5608
  "big-pickle": {
5455
5609
  id: "big-pickle",
5456
5610
  name: "Big Pickle",
5457
- api: "openai-completions",
5611
+ api: "anthropic-messages",
5458
5612
  provider: "opencode",
5459
- baseUrl: "https://opencode.ai/zen/v1",
5613
+ baseUrl: "https://opencode.ai/zen",
5460
5614
  reasoning: true,
5461
5615
  input: ["text"],
5462
5616
  cost: {
@@ -5587,6 +5741,23 @@ export const MODELS = {
5587
5741
  contextWindow: 200000,
5588
5742
  maxTokens: 64000,
5589
5743
  },
5744
+ "claude-sonnet-4-6": {
5745
+ id: "claude-sonnet-4-6",
5746
+ name: "Claude Sonnet 4.6",
5747
+ api: "anthropic-messages",
5748
+ provider: "opencode",
5749
+ baseUrl: "https://opencode.ai/zen",
5750
+ reasoning: true,
5751
+ input: ["text", "image"],
5752
+ cost: {
5753
+ input: 3,
5754
+ output: 15,
5755
+ cacheRead: 0.3,
5756
+ cacheWrite: 3.75,
5757
+ },
5758
+ contextWindow: 1000000,
5759
+ maxTokens: 64000,
5760
+ },
5590
5761
  "gemini-3-flash": {
5591
5762
  id: "gemini-3-flash",
5592
5763
  name: "Gemini 3 Flash",
@@ -5621,6 +5792,23 @@ export const MODELS = {
5621
5792
  contextWindow: 1048576,
5622
5793
  maxTokens: 65536,
5623
5794
  },
5795
+ "gemini-3.1-pro": {
5796
+ id: "gemini-3.1-pro",
5797
+ name: "Gemini 3.1 Pro Preview",
5798
+ api: "google-generative-ai",
5799
+ provider: "opencode",
5800
+ baseUrl: "https://opencode.ai/zen/v1",
5801
+ reasoning: true,
5802
+ input: ["text", "image"],
5803
+ cost: {
5804
+ input: 2,
5805
+ output: 12,
5806
+ cacheRead: 0.2,
5807
+ cacheWrite: 0,
5808
+ },
5809
+ contextWindow: 1048576,
5810
+ maxTokens: 65536,
5811
+ },
5624
5812
  "glm-4.6": {
5625
5813
  id: "glm-4.6",
5626
5814
  name: "GLM-4.6",
@@ -5893,23 +6081,6 @@ export const MODELS = {
5893
6081
  contextWindow: 262144,
5894
6082
  maxTokens: 262144,
5895
6083
  },
5896
- "kimi-k2.5-free": {
5897
- id: "kimi-k2.5-free",
5898
- name: "Kimi K2.5 Free",
5899
- api: "openai-completions",
5900
- provider: "opencode",
5901
- baseUrl: "https://opencode.ai/zen/v1",
5902
- reasoning: true,
5903
- input: ["text", "image"],
5904
- cost: {
5905
- input: 0,
5906
- output: 0,
5907
- cacheRead: 0,
5908
- cacheWrite: 0,
5909
- },
5910
- contextWindow: 262144,
5911
- maxTokens: 262144,
5912
- },
5913
6084
  "minimax-m2.1": {
5914
6085
  id: "minimax-m2.1",
5915
6086
  name: "MiniMax M2.1",
@@ -5947,9 +6118,9 @@ export const MODELS = {
5947
6118
  "minimax-m2.5-free": {
5948
6119
  id: "minimax-m2.5-free",
5949
6120
  name: "MiniMax M2.5 Free",
5950
- api: "openai-completions",
6121
+ api: "anthropic-messages",
5951
6122
  provider: "opencode",
5952
- baseUrl: "https://opencode.ai/zen/v1",
6123
+ baseUrl: "https://opencode.ai/zen",
5953
6124
  reasoning: true,
5954
6125
  input: ["text"],
5955
6126
  cost: {
@@ -5961,6 +6132,23 @@ export const MODELS = {
5961
6132
  contextWindow: 204800,
5962
6133
  maxTokens: 131072,
5963
6134
  },
6135
+ "trinity-large-preview-free": {
6136
+ id: "trinity-large-preview-free",
6137
+ name: "Trinity Large Preview",
6138
+ api: "openai-completions",
6139
+ provider: "opencode",
6140
+ baseUrl: "https://opencode.ai/zen/v1",
6141
+ reasoning: false,
6142
+ input: ["text"],
6143
+ cost: {
6144
+ input: 0,
6145
+ output: 0,
6146
+ cacheRead: 0,
6147
+ cacheWrite: 0,
6148
+ },
6149
+ contextWindow: 131072,
6150
+ maxTokens: 131072,
6151
+ },
5964
6152
  },
5965
6153
  "openrouter": {
5966
6154
  "ai21/jamba-large-1.7": {
@@ -6144,8 +6332,8 @@ export const MODELS = {
6144
6332
  cost: {
6145
6333
  input: 6,
6146
6334
  output: 30,
6147
- cacheRead: 0,
6148
- cacheWrite: 0,
6335
+ cacheRead: 0.6,
6336
+ cacheWrite: 7.5,
6149
6337
  },
6150
6338
  contextWindow: 200000,
6151
6339
  maxTokens: 8192,
@@ -6516,9 +6704,9 @@ export const MODELS = {
6516
6704
  reasoning: false,
6517
6705
  input: ["text"],
6518
6706
  cost: {
6519
- input: 0.3,
6520
- output: 1.2,
6521
- cacheRead: 0.15,
6707
+ input: 0.32,
6708
+ output: 0.8899999999999999,
6709
+ cacheRead: 0,
6522
6710
  cacheWrite: 0,
6523
6711
  },
6524
6712
  contextWindow: 163840,
@@ -6745,23 +6933,6 @@ export const MODELS = {
6745
6933
  contextWindow: 1048576,
6746
6934
  maxTokens: 65535,
6747
6935
  },
6748
- "google/gemini-2.5-flash-preview-09-2025": {
6749
- id: "google/gemini-2.5-flash-preview-09-2025",
6750
- name: "Google: Gemini 2.5 Flash Preview 09-2025",
6751
- api: "openai-completions",
6752
- provider: "openrouter",
6753
- baseUrl: "https://openrouter.ai/api/v1",
6754
- reasoning: true,
6755
- input: ["text", "image"],
6756
- cost: {
6757
- input: 0.3,
6758
- output: 2.5,
6759
- cacheRead: 0.03,
6760
- cacheWrite: 0.08333333333333334,
6761
- },
6762
- contextWindow: 1048576,
6763
- maxTokens: 65536,
6764
- },
6765
6936
  "google/gemini-2.5-pro": {
6766
6937
  id: "google/gemini-2.5-pro",
6767
6938
  name: "Google: Gemini 2.5 Pro",
@@ -6847,6 +7018,23 @@ export const MODELS = {
6847
7018
  contextWindow: 1048576,
6848
7019
  maxTokens: 65536,
6849
7020
  },
7021
+ "google/gemini-3.1-pro-preview": {
7022
+ id: "google/gemini-3.1-pro-preview",
7023
+ name: "Google: Gemini 3.1 Pro Preview",
7024
+ api: "openai-completions",
7025
+ provider: "openrouter",
7026
+ baseUrl: "https://openrouter.ai/api/v1",
7027
+ reasoning: true,
7028
+ input: ["text", "image"],
7029
+ cost: {
7030
+ input: 2,
7031
+ output: 12,
7032
+ cacheRead: 0.19999999999999998,
7033
+ cacheWrite: 0.375,
7034
+ },
7035
+ contextWindow: 1048576,
7036
+ maxTokens: 65536,
7037
+ },
6850
7038
  "google/gemma-3-27b-it": {
6851
7039
  id: "google/gemma-3-27b-it",
6852
7040
  name: "Google: Gemma 3 27B",
@@ -7162,13 +7350,13 @@ export const MODELS = {
7162
7350
  reasoning: false,
7163
7351
  input: ["text"],
7164
7352
  cost: {
7165
- input: 0.049999999999999996,
7166
- output: 0.22,
7167
- cacheRead: 0.024999999999999998,
7353
+ input: 0.39999999999999997,
7354
+ output: 2,
7355
+ cacheRead: 0,
7168
7356
  cacheWrite: 0,
7169
7357
  },
7170
7358
  contextWindow: 262144,
7171
- maxTokens: 65536,
7359
+ maxTokens: 4096,
7172
7360
  },
7173
7361
  "mistralai/devstral-medium": {
7174
7362
  id: "mistralai/devstral-medium",
@@ -7408,23 +7596,6 @@ export const MODELS = {
7408
7596
  contextWindow: 32768,
7409
7597
  maxTokens: 16384,
7410
7598
  },
7411
- "mistralai/mistral-small-3.1-24b-instruct": {
7412
- id: "mistralai/mistral-small-3.1-24b-instruct",
7413
- name: "Mistral: Mistral Small 3.1 24B",
7414
- api: "openai-completions",
7415
- provider: "openrouter",
7416
- baseUrl: "https://openrouter.ai/api/v1",
7417
- reasoning: false,
7418
- input: ["text", "image"],
7419
- cost: {
7420
- input: 0.03,
7421
- output: 0.11,
7422
- cacheRead: 0.015,
7423
- cacheWrite: 0,
7424
- },
7425
- contextWindow: 131072,
7426
- maxTokens: 131072,
7427
- },
7428
7599
  "mistralai/mistral-small-3.1-24b-instruct:free": {
7429
7600
  id: "mistralai/mistral-small-3.1-24b-instruct:free",
7430
7601
  name: "Mistral: Mistral Small 3.1 24B (free)",
@@ -7604,13 +7775,13 @@ export const MODELS = {
7604
7775
  reasoning: true,
7605
7776
  input: ["text"],
7606
7777
  cost: {
7607
- input: 0.39999999999999997,
7608
- output: 1.75,
7609
- cacheRead: 0.19999999999999998,
7778
+ input: 0.47,
7779
+ output: 2,
7780
+ cacheRead: 0.14100000000000001,
7610
7781
  cacheWrite: 0,
7611
7782
  },
7612
- contextWindow: 262144,
7613
- maxTokens: 65535,
7783
+ contextWindow: 131072,
7784
+ maxTokens: 4096,
7614
7785
  },
7615
7786
  "moonshotai/kimi-k2.5": {
7616
7787
  id: "moonshotai/kimi-k2.5",
@@ -7646,40 +7817,6 @@ export const MODELS = {
7646
7817
  contextWindow: 131072,
7647
7818
  maxTokens: 163840,
7648
7819
  },
7649
- "nousresearch/deephermes-3-mistral-24b-preview": {
7650
- id: "nousresearch/deephermes-3-mistral-24b-preview",
7651
- name: "Nous: DeepHermes 3 Mistral 24B Preview",
7652
- api: "openai-completions",
7653
- provider: "openrouter",
7654
- baseUrl: "https://openrouter.ai/api/v1",
7655
- reasoning: true,
7656
- input: ["text"],
7657
- cost: {
7658
- input: 0.02,
7659
- output: 0.09999999999999999,
7660
- cacheRead: 0.01,
7661
- cacheWrite: 0,
7662
- },
7663
- contextWindow: 32768,
7664
- maxTokens: 32768,
7665
- },
7666
- "nousresearch/hermes-4-70b": {
7667
- id: "nousresearch/hermes-4-70b",
7668
- name: "Nous: Hermes 4 70B",
7669
- api: "openai-completions",
7670
- provider: "openrouter",
7671
- baseUrl: "https://openrouter.ai/api/v1",
7672
- reasoning: true,
7673
- input: ["text"],
7674
- cost: {
7675
- input: 0.11,
7676
- output: 0.38,
7677
- cacheRead: 0.055,
7678
- cacheWrite: 0,
7679
- },
7680
- contextWindow: 131072,
7681
- maxTokens: 131072,
7682
- },
7683
7820
  "nvidia/llama-3.1-nemotron-70b-instruct": {
7684
7821
  id: "nvidia/llama-3.1-nemotron-70b-instruct",
7685
7822
  name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
@@ -8862,9 +8999,9 @@ export const MODELS = {
8862
8999
  reasoning: true,
8863
9000
  input: ["text"],
8864
9001
  cost: {
8865
- input: 0.049999999999999996,
8866
- output: 0.22,
8867
- cacheRead: 0.024999999999999998,
9002
+ input: 0.06,
9003
+ output: 0.24,
9004
+ cacheRead: 0,
8868
9005
  cacheWrite: 0,
8869
9006
  },
8870
9007
  contextWindow: 40960,
@@ -8879,13 +9016,13 @@ export const MODELS = {
8879
9016
  reasoning: true,
8880
9017
  input: ["text"],
8881
9018
  cost: {
8882
- input: 0.3,
8883
- output: 1.2,
8884
- cacheRead: 0.15,
9019
+ input: 0.45499999999999996,
9020
+ output: 1.8199999999999998,
9021
+ cacheRead: 0,
8885
9022
  cacheWrite: 0,
8886
9023
  },
8887
- contextWindow: 40960,
8888
- maxTokens: 40960,
9024
+ contextWindow: 131072,
9025
+ maxTokens: 8192,
8889
9026
  },
8890
9027
  "qwen/qwen3-235b-a22b-2507": {
8891
9028
  id: "qwen/qwen3-235b-a22b-2507",
@@ -8930,9 +9067,9 @@ export const MODELS = {
8930
9067
  reasoning: true,
8931
9068
  input: ["text"],
8932
9069
  cost: {
8933
- input: 0.06,
8934
- output: 0.22,
8935
- cacheRead: 0.03,
9070
+ input: 0.08,
9071
+ output: 0.28,
9072
+ cacheRead: 0,
8936
9073
  cacheWrite: 0,
8937
9074
  },
8938
9075
  contextWindow: 40960,
@@ -8947,9 +9084,9 @@ export const MODELS = {
8947
9084
  reasoning: false,
8948
9085
  input: ["text"],
8949
9086
  cost: {
8950
- input: 0.08,
8951
- output: 0.33,
8952
- cacheRead: 0.04,
9087
+ input: 0.09,
9088
+ output: 0.3,
9089
+ cacheRead: 0,
8953
9090
  cacheWrite: 0,
8954
9091
  },
8955
9092
  contextWindow: 262144,
@@ -8989,23 +9126,6 @@ export const MODELS = {
8989
9126
  contextWindow: 40960,
8990
9127
  maxTokens: 40960,
8991
9128
  },
8992
- "qwen/qwen3-4b": {
8993
- id: "qwen/qwen3-4b",
8994
- name: "Qwen: Qwen3 4B",
8995
- api: "openai-completions",
8996
- provider: "openrouter",
8997
- baseUrl: "https://openrouter.ai/api/v1",
8998
- reasoning: true,
8999
- input: ["text"],
9000
- cost: {
9001
- input: 0.0715,
9002
- output: 0.273,
9003
- cacheRead: 0,
9004
- cacheWrite: 0,
9005
- },
9006
- contextWindow: 131072,
9007
- maxTokens: 8192,
9008
- },
9009
9129
  "qwen/qwen3-4b:free": {
9010
9130
  id: "qwen/qwen3-4b:free",
9011
9131
  name: "Qwen: Qwen3 4B (free)",
@@ -9550,23 +9670,6 @@ export const MODELS = {
9550
9670
  contextWindow: 163840,
9551
9671
  maxTokens: 163840,
9552
9672
  },
9553
- "tngtech/tng-r1t-chimera": {
9554
- id: "tngtech/tng-r1t-chimera",
9555
- name: "TNG: R1T Chimera",
9556
- api: "openai-completions",
9557
- provider: "openrouter",
9558
- baseUrl: "https://openrouter.ai/api/v1",
9559
- reasoning: true,
9560
- input: ["text"],
9561
- cost: {
9562
- input: 0.25,
9563
- output: 0.85,
9564
- cacheRead: 0.125,
9565
- cacheWrite: 0,
9566
- },
9567
- contextWindow: 163840,
9568
- maxTokens: 65536,
9569
- },
9570
9673
  "upstage/solar-pro-3:free": {
9571
9674
  id: "upstage/solar-pro-3:free",
9572
9675
  name: "Upstage: Solar Pro 3 (free)",
@@ -9763,13 +9866,13 @@ export const MODELS = {
9763
9866
  reasoning: true,
9764
9867
  input: ["text"],
9765
9868
  cost: {
9766
- input: 0.35,
9767
- output: 1.55,
9768
- cacheRead: 0.175,
9869
+ input: 0.55,
9870
+ output: 2,
9871
+ cacheRead: 0,
9769
9872
  cacheWrite: 0,
9770
9873
  },
9771
- contextWindow: 131072,
9772
- maxTokens: 65536,
9874
+ contextWindow: 131000,
9875
+ maxTokens: 131000,
9773
9876
  },
9774
9877
  "z-ai/glm-4.5-air": {
9775
9878
  id: "z-ai/glm-4.5-air",
@@ -9831,13 +9934,13 @@ export const MODELS = {
9831
9934
  reasoning: true,
9832
9935
  input: ["text"],
9833
9936
  cost: {
9834
- input: 0.33999999999999997,
9835
- output: 1.7,
9836
- cacheRead: 0.16999999999999998,
9937
+ input: 0.35,
9938
+ output: 1.71,
9939
+ cacheRead: 0,
9837
9940
  cacheWrite: 0,
9838
9941
  },
9839
9942
  contextWindow: 202752,
9840
- maxTokens: 65536,
9943
+ maxTokens: 131072,
9841
9944
  },
9842
9945
  "z-ai/glm-4.6:exacto": {
9843
9946
  id: "z-ai/glm-4.6:exacto",
@@ -10366,7 +10469,7 @@ export const MODELS = {
10366
10469
  cacheWrite: 3.75,
10367
10470
  },
10368
10471
  contextWindow: 1000000,
10369
- maxTokens: 64000,
10472
+ maxTokens: 128000,
10370
10473
  },
10371
10474
  "arcee-ai/trinity-large-preview": {
10372
10475
  id: "arcee-ai/trinity-large-preview",
@@ -10623,6 +10726,23 @@ export const MODELS = {
10623
10726
  contextWindow: 1000000,
10624
10727
  maxTokens: 64000,
10625
10728
  },
10729
+ "google/gemini-3.1-pro-preview": {
10730
+ id: "google/gemini-3.1-pro-preview",
10731
+ name: "Gemini 3.1 Pro Preview",
10732
+ api: "anthropic-messages",
10733
+ provider: "vercel-ai-gateway",
10734
+ baseUrl: "https://ai-gateway.vercel.sh",
10735
+ reasoning: true,
10736
+ input: ["text", "image"],
10737
+ cost: {
10738
+ input: 2,
10739
+ output: 12,
10740
+ cacheRead: 0.19999999999999998,
10741
+ cacheWrite: 0,
10742
+ },
10743
+ contextWindow: 1000000,
10744
+ maxTokens: 64000,
10745
+ },
10626
10746
  "inception/mercury-coder-small": {
10627
10747
  id: "inception/mercury-coder-small",
10628
10748
  name: "Mercury Coder Small Beta",