@earendil-works/pi-ai 0.74.1 → 0.74.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -908,8 +908,8 @@ export const MODELS = {
908
908
  cacheRead: 0,
909
909
  cacheWrite: 0,
910
910
  },
911
- contextWindow: 256000,
912
- maxTokens: 256000,
911
+ contextWindow: 262143,
912
+ maxTokens: 16000,
913
913
  },
914
914
  "moonshotai.kimi-k2.5": {
915
915
  id: "moonshotai.kimi-k2.5",
@@ -925,8 +925,8 @@ export const MODELS = {
925
925
  cacheRead: 0,
926
926
  cacheWrite: 0,
927
927
  },
928
- contextWindow: 256000,
929
- maxTokens: 256000,
928
+ contextWindow: 262143,
929
+ maxTokens: 16000,
930
930
  },
931
931
  "nvidia.nemotron-nano-12b-v2": {
932
932
  id: "nvidia.nemotron-nano-12b-v2",
@@ -3275,6 +3275,42 @@ export const MODELS = {
3275
3275
  contextWindow: 256000,
3276
3276
  maxTokens: 16384,
3277
3277
  },
3278
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3279
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3280
+ name: "Granite 4.0 H Micro",
3281
+ api: "openai-completions",
3282
+ provider: "cloudflare-workers-ai",
3283
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3284
+ compat: { "sendSessionAffinityHeaders": true },
3285
+ reasoning: false,
3286
+ input: ["text"],
3287
+ cost: {
3288
+ input: 0.017,
3289
+ output: 0.112,
3290
+ cacheRead: 0,
3291
+ cacheWrite: 0,
3292
+ },
3293
+ contextWindow: 131000,
3294
+ maxTokens: 131000,
3295
+ },
3296
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3297
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3298
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3299
+ api: "openai-completions",
3300
+ provider: "cloudflare-workers-ai",
3301
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3302
+ compat: { "sendSessionAffinityHeaders": true },
3303
+ reasoning: false,
3304
+ input: ["text"],
3305
+ cost: {
3306
+ input: 0.293,
3307
+ output: 2.253,
3308
+ cacheRead: 0,
3309
+ cacheWrite: 0,
3310
+ },
3311
+ contextWindow: 24000,
3312
+ maxTokens: 24000,
3313
+ },
3278
3314
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3315
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3316
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3326,27 @@ export const MODELS = {
3290
3326
  cacheRead: 0,
3291
3327
  cacheWrite: 0,
3292
3328
  },
3293
- contextWindow: 128000,
3329
+ contextWindow: 131000,
3294
3330
  maxTokens: 16384,
3295
3331
  },
3332
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3333
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3334
+ name: "Mistral Small 3.1 24B Instruct",
3335
+ api: "openai-completions",
3336
+ provider: "cloudflare-workers-ai",
3337
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3338
+ compat: { "sendSessionAffinityHeaders": true },
3339
+ reasoning: false,
3340
+ input: ["text"],
3341
+ cost: {
3342
+ input: 0.351,
3343
+ output: 0.555,
3344
+ cacheRead: 0,
3345
+ cacheWrite: 0,
3346
+ },
3347
+ contextWindow: 128000,
3348
+ maxTokens: 128000,
3349
+ },
3296
3350
  "@cf/moonshotai/kimi-k2.5": {
3297
3351
  id: "@cf/moonshotai/kimi-k2.5",
3298
3352
  name: "Kimi K2.5",
@@ -3326,7 +3380,7 @@ export const MODELS = {
3326
3380
  cacheRead: 0.16,
3327
3381
  cacheWrite: 0,
3328
3382
  },
3329
- contextWindow: 256000,
3383
+ contextWindow: 262144,
3330
3384
  maxTokens: 256000,
3331
3385
  },
3332
3386
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3437,24 @@ export const MODELS = {
3383
3437
  contextWindow: 128000,
3384
3438
  maxTokens: 16384,
3385
3439
  },
3440
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3441
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3442
+ name: "Qwen3 30B A3b fp8",
3443
+ api: "openai-completions",
3444
+ provider: "cloudflare-workers-ai",
3445
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3446
+ compat: { "sendSessionAffinityHeaders": true },
3447
+ reasoning: true,
3448
+ input: ["text"],
3449
+ cost: {
3450
+ input: 0.0509,
3451
+ output: 0.335,
3452
+ cacheRead: 0,
3453
+ cacheWrite: 0,
3454
+ },
3455
+ contextWindow: 32768,
3456
+ maxTokens: 32768,
3457
+ },
3386
3458
  "@cf/zai-org/glm-4.7-flash": {
3387
3459
  id: "@cf/zai-org/glm-4.7-flash",
3388
3460
  name: "GLM-4.7-Flash",
@@ -3393,7 +3465,7 @@ export const MODELS = {
3393
3465
  reasoning: true,
3394
3466
  input: ["text"],
3395
3467
  cost: {
3396
- input: 0.06,
3468
+ input: 0.0605,
3397
3469
  output: 0.4,
3398
3470
  cacheRead: 0,
3399
3471
  cacheWrite: 0,
@@ -3479,6 +3551,24 @@ export const MODELS = {
3479
3551
  contextWindow: 160000,
3480
3552
  maxTokens: 160000,
3481
3553
  },
3554
+ "accounts/fireworks/models/deepseek-v4-flash": {
3555
+ id: "accounts/fireworks/models/deepseek-v4-flash",
3556
+ name: "DeepSeek V4 Flash",
3557
+ api: "anthropic-messages",
3558
+ provider: "fireworks",
3559
+ baseUrl: "https://api.fireworks.ai/inference",
3560
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3561
+ reasoning: true,
3562
+ input: ["text"],
3563
+ cost: {
3564
+ input: 0.14,
3565
+ output: 0.28,
3566
+ cacheRead: 0.03,
3567
+ cacheWrite: 0,
3568
+ },
3569
+ contextWindow: 1000000,
3570
+ maxTokens: 384000,
3571
+ },
3482
3572
  "accounts/fireworks/models/deepseek-v4-pro": {
3483
3573
  id: "accounts/fireworks/models/deepseek-v4-pro",
3484
3574
  name: "DeepSeek V4 Pro",
@@ -4148,57 +4238,6 @@ export const MODELS = {
4148
4238
  },
4149
4239
  },
4150
4240
  "google": {
4151
- "gemini-1.5-flash": {
4152
- id: "gemini-1.5-flash",
4153
- name: "Gemini 1.5 Flash",
4154
- api: "google-generative-ai",
4155
- provider: "google",
4156
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4157
- reasoning: false,
4158
- input: ["text", "image"],
4159
- cost: {
4160
- input: 0.075,
4161
- output: 0.3,
4162
- cacheRead: 0.01875,
4163
- cacheWrite: 0,
4164
- },
4165
- contextWindow: 1000000,
4166
- maxTokens: 8192,
4167
- },
4168
- "gemini-1.5-flash-8b": {
4169
- id: "gemini-1.5-flash-8b",
4170
- name: "Gemini 1.5 Flash-8B",
4171
- api: "google-generative-ai",
4172
- provider: "google",
4173
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4174
- reasoning: false,
4175
- input: ["text", "image"],
4176
- cost: {
4177
- input: 0.0375,
4178
- output: 0.15,
4179
- cacheRead: 0.01,
4180
- cacheWrite: 0,
4181
- },
4182
- contextWindow: 1000000,
4183
- maxTokens: 8192,
4184
- },
4185
- "gemini-1.5-pro": {
4186
- id: "gemini-1.5-pro",
4187
- name: "Gemini 1.5 Pro",
4188
- api: "google-generative-ai",
4189
- provider: "google",
4190
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4191
- reasoning: false,
4192
- input: ["text", "image"],
4193
- cost: {
4194
- input: 1.25,
4195
- output: 5,
4196
- cacheRead: 0.3125,
4197
- cacheWrite: 0,
4198
- },
4199
- contextWindow: 1000000,
4200
- maxTokens: 8192,
4201
- },
4202
4241
  "gemini-2.0-flash": {
4203
4242
  id: "gemini-2.0-flash",
4204
4243
  name: "Gemini 2.0 Flash",
@@ -4218,7 +4257,7 @@ export const MODELS = {
4218
4257
  },
4219
4258
  "gemini-2.0-flash-lite": {
4220
4259
  id: "gemini-2.0-flash-lite",
4221
- name: "Gemini 2.0 Flash Lite",
4260
+ name: "Gemini 2.0 Flash-Lite",
4222
4261
  api: "google-generative-ai",
4223
4262
  provider: "google",
4224
4263
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4252,7 +4291,7 @@ export const MODELS = {
4252
4291
  },
4253
4292
  "gemini-2.5-flash-lite": {
4254
4293
  id: "gemini-2.5-flash-lite",
4255
- name: "Gemini 2.5 Flash Lite",
4294
+ name: "Gemini 2.5 Flash-Lite",
4256
4295
  api: "google-generative-ai",
4257
4296
  provider: "google",
4258
4297
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4267,91 +4306,6 @@ export const MODELS = {
4267
4306
  contextWindow: 1048576,
4268
4307
  maxTokens: 65536,
4269
4308
  },
4270
- "gemini-2.5-flash-lite-preview-06-17": {
4271
- id: "gemini-2.5-flash-lite-preview-06-17",
4272
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4273
- api: "google-generative-ai",
4274
- provider: "google",
4275
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4276
- reasoning: true,
4277
- input: ["text", "image"],
4278
- cost: {
4279
- input: 0.1,
4280
- output: 0.4,
4281
- cacheRead: 0.025,
4282
- cacheWrite: 0,
4283
- },
4284
- contextWindow: 1048576,
4285
- maxTokens: 65536,
4286
- },
4287
- "gemini-2.5-flash-lite-preview-09-2025": {
4288
- id: "gemini-2.5-flash-lite-preview-09-2025",
4289
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4290
- api: "google-generative-ai",
4291
- provider: "google",
4292
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4293
- reasoning: true,
4294
- input: ["text", "image"],
4295
- cost: {
4296
- input: 0.1,
4297
- output: 0.4,
4298
- cacheRead: 0.025,
4299
- cacheWrite: 0,
4300
- },
4301
- contextWindow: 1048576,
4302
- maxTokens: 65536,
4303
- },
4304
- "gemini-2.5-flash-preview-04-17": {
4305
- id: "gemini-2.5-flash-preview-04-17",
4306
- name: "Gemini 2.5 Flash Preview 04-17",
4307
- api: "google-generative-ai",
4308
- provider: "google",
4309
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4310
- reasoning: true,
4311
- input: ["text", "image"],
4312
- cost: {
4313
- input: 0.15,
4314
- output: 0.6,
4315
- cacheRead: 0.0375,
4316
- cacheWrite: 0,
4317
- },
4318
- contextWindow: 1048576,
4319
- maxTokens: 65536,
4320
- },
4321
- "gemini-2.5-flash-preview-05-20": {
4322
- id: "gemini-2.5-flash-preview-05-20",
4323
- name: "Gemini 2.5 Flash Preview 05-20",
4324
- api: "google-generative-ai",
4325
- provider: "google",
4326
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4327
- reasoning: true,
4328
- input: ["text", "image"],
4329
- cost: {
4330
- input: 0.15,
4331
- output: 0.6,
4332
- cacheRead: 0.0375,
4333
- cacheWrite: 0,
4334
- },
4335
- contextWindow: 1048576,
4336
- maxTokens: 65536,
4337
- },
4338
- "gemini-2.5-flash-preview-09-2025": {
4339
- id: "gemini-2.5-flash-preview-09-2025",
4340
- name: "Gemini 2.5 Flash Preview 09-25",
4341
- api: "google-generative-ai",
4342
- provider: "google",
4343
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4344
- reasoning: true,
4345
- input: ["text", "image"],
4346
- cost: {
4347
- input: 0.3,
4348
- output: 2.5,
4349
- cacheRead: 0.075,
4350
- cacheWrite: 0,
4351
- },
4352
- contextWindow: 1048576,
4353
- maxTokens: 65536,
4354
- },
4355
4309
  "gemini-2.5-pro": {
4356
4310
  id: "gemini-2.5-pro",
4357
4311
  name: "Gemini 2.5 Pro",
@@ -4369,40 +4323,6 @@ export const MODELS = {
4369
4323
  contextWindow: 1048576,
4370
4324
  maxTokens: 65536,
4371
4325
  },
4372
- "gemini-2.5-pro-preview-05-06": {
4373
- id: "gemini-2.5-pro-preview-05-06",
4374
- name: "Gemini 2.5 Pro Preview 05-06",
4375
- api: "google-generative-ai",
4376
- provider: "google",
4377
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4378
- reasoning: true,
4379
- input: ["text", "image"],
4380
- cost: {
4381
- input: 1.25,
4382
- output: 10,
4383
- cacheRead: 0.31,
4384
- cacheWrite: 0,
4385
- },
4386
- contextWindow: 1048576,
4387
- maxTokens: 65536,
4388
- },
4389
- "gemini-2.5-pro-preview-06-05": {
4390
- id: "gemini-2.5-pro-preview-06-05",
4391
- name: "Gemini 2.5 Pro Preview 06-05",
4392
- api: "google-generative-ai",
4393
- provider: "google",
4394
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4395
- reasoning: true,
4396
- input: ["text", "image"],
4397
- cost: {
4398
- input: 1.25,
4399
- output: 10,
4400
- cacheRead: 0.31,
4401
- cacheWrite: 0,
4402
- },
4403
- contextWindow: 1048576,
4404
- maxTokens: 65536,
4405
- },
4406
4326
  "gemini-3-flash-preview": {
4407
4327
  id: "gemini-3-flash-preview",
4408
4328
  name: "Gemini 3 Flash Preview",
@@ -4436,8 +4356,8 @@ export const MODELS = {
4436
4356
  cacheRead: 0.2,
4437
4357
  cacheWrite: 0,
4438
4358
  },
4439
- contextWindow: 1000000,
4440
- maxTokens: 64000,
4359
+ contextWindow: 1048576,
4360
+ maxTokens: 65536,
4441
4361
  },
4442
4362
  "gemini-3.1-flash-lite": {
4443
4363
  id: "gemini-3.1-flash-lite",
@@ -4511,6 +4431,24 @@ export const MODELS = {
4511
4431
  contextWindow: 1048576,
4512
4432
  maxTokens: 65536,
4513
4433
  },
4434
+ "gemini-3.5-flash": {
4435
+ id: "gemini-3.5-flash",
4436
+ name: "Gemini 3.5 Flash",
4437
+ api: "google-generative-ai",
4438
+ provider: "google",
4439
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4440
+ reasoning: true,
4441
+ thinkingLevelMap: { "off": null },
4442
+ input: ["text", "image"],
4443
+ cost: {
4444
+ input: 1.5,
4445
+ output: 9,
4446
+ cacheRead: 0.15,
4447
+ cacheWrite: 0,
4448
+ },
4449
+ contextWindow: 1048576,
4450
+ maxTokens: 65536,
4451
+ },
4514
4452
  "gemini-flash-latest": {
4515
4453
  id: "gemini-flash-latest",
4516
4454
  name: "Gemini Flash Latest",
@@ -4545,60 +4483,9 @@ export const MODELS = {
4545
4483
  contextWindow: 1048576,
4546
4484
  maxTokens: 65536,
4547
4485
  },
4548
- "gemini-live-2.5-flash": {
4549
- id: "gemini-live-2.5-flash",
4550
- name: "Gemini Live 2.5 Flash",
4551
- api: "google-generative-ai",
4552
- provider: "google",
4553
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4554
- reasoning: true,
4555
- input: ["text", "image"],
4556
- cost: {
4557
- input: 0.5,
4558
- output: 2,
4559
- cacheRead: 0,
4560
- cacheWrite: 0,
4561
- },
4562
- contextWindow: 128000,
4563
- maxTokens: 8000,
4564
- },
4565
- "gemini-live-2.5-flash-preview-native-audio": {
4566
- id: "gemini-live-2.5-flash-preview-native-audio",
4567
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4568
- api: "google-generative-ai",
4569
- provider: "google",
4570
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4571
- reasoning: true,
4572
- input: ["text"],
4573
- cost: {
4574
- input: 0.5,
4575
- output: 2,
4576
- cacheRead: 0,
4577
- cacheWrite: 0,
4578
- },
4579
- contextWindow: 131072,
4580
- maxTokens: 65536,
4581
- },
4582
- "gemma-3-27b-it": {
4583
- id: "gemma-3-27b-it",
4584
- name: "Gemma 3 27B",
4585
- api: "google-generative-ai",
4586
- provider: "google",
4587
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4588
- reasoning: false,
4589
- input: ["text", "image"],
4590
- cost: {
4591
- input: 0,
4592
- output: 0,
4593
- cacheRead: 0,
4594
- cacheWrite: 0,
4595
- },
4596
- contextWindow: 131072,
4597
- maxTokens: 8192,
4598
- },
4599
4486
  "gemma-4-26b-a4b-it": {
4600
4487
  id: "gemma-4-26b-a4b-it",
4601
- name: "Gemma 4 26B",
4488
+ name: "Gemma 4 26B A4B IT",
4602
4489
  api: "google-generative-ai",
4603
4490
  provider: "google",
4604
4491
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4611,12 +4498,12 @@ export const MODELS = {
4611
4498
  cacheRead: 0,
4612
4499
  cacheWrite: 0,
4613
4500
  },
4614
- contextWindow: 256000,
4615
- maxTokens: 8192,
4501
+ contextWindow: 262144,
4502
+ maxTokens: 32768,
4616
4503
  },
4617
4504
  "gemma-4-31b-it": {
4618
4505
  id: "gemma-4-31b-it",
4619
- name: "Gemma 4 31B",
4506
+ name: "Gemma 4 31B IT",
4620
4507
  api: "google-generative-ai",
4621
4508
  provider: "google",
4622
4509
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4629,8 +4516,8 @@ export const MODELS = {
4629
4516
  cacheRead: 0,
4630
4517
  cacheWrite: 0,
4631
4518
  },
4632
- contextWindow: 256000,
4633
- maxTokens: 8192,
4519
+ contextWindow: 262144,
4520
+ maxTokens: 32768,
4634
4521
  },
4635
4522
  },
4636
4523
  "google-vertex": {
@@ -7542,6 +7429,24 @@ export const MODELS = {
7542
7429
  contextWindow: 1048576,
7543
7430
  maxTokens: 65536,
7544
7431
  },
7432
+ "gemini-3.5-flash": {
7433
+ id: "gemini-3.5-flash",
7434
+ name: "Gemini 3.5 Flash",
7435
+ api: "google-generative-ai",
7436
+ provider: "opencode",
7437
+ baseUrl: "https://opencode.ai/zen/v1",
7438
+ reasoning: true,
7439
+ thinkingLevelMap: { "off": null },
7440
+ input: ["text", "image"],
7441
+ cost: {
7442
+ input: 1.5,
7443
+ output: 9,
7444
+ cacheRead: 0.15,
7445
+ cacheWrite: 0,
7446
+ },
7447
+ contextWindow: 1048576,
7448
+ maxTokens: 65536,
7449
+ },
7545
7450
  "glm-5": {
7546
7451
  id: "glm-5",
7547
7452
  name: "GLM-5",
@@ -7864,6 +7769,23 @@ export const MODELS = {
7864
7769
  contextWindow: 1050000,
7865
7770
  maxTokens: 128000,
7866
7771
  },
7772
+ "grok-build-0.1": {
7773
+ id: "grok-build-0.1",
7774
+ name: "Grok Build 0.1",
7775
+ api: "openai-completions",
7776
+ provider: "opencode",
7777
+ baseUrl: "https://opencode.ai/zen/v1",
7778
+ reasoning: true,
7779
+ input: ["text", "image"],
7780
+ cost: {
7781
+ input: 1,
7782
+ output: 2,
7783
+ cacheRead: 0.2,
7784
+ cacheWrite: 0,
7785
+ },
7786
+ contextWindow: 256000,
7787
+ maxTokens: 256000,
7788
+ },
7867
7789
  "kimi-k2.5": {
7868
7790
  id: "kimi-k2.5",
7869
7791
  name: "Kimi K2.5",
@@ -7915,23 +7837,6 @@ export const MODELS = {
7915
7837
  contextWindow: 204800,
7916
7838
  maxTokens: 131072,
7917
7839
  },
7918
- "minimax-m2.5-free": {
7919
- id: "minimax-m2.5-free",
7920
- name: "MiniMax M2.5 Free",
7921
- api: "anthropic-messages",
7922
- provider: "opencode",
7923
- baseUrl: "https://opencode.ai/zen",
7924
- reasoning: true,
7925
- input: ["text"],
7926
- cost: {
7927
- input: 0,
7928
- output: 0,
7929
- cacheRead: 0,
7930
- cacheWrite: 0,
7931
- },
7932
- contextWindow: 204800,
7933
- maxTokens: 131072,
7934
- },
7935
7840
  "minimax-m2.7": {
7936
7841
  id: "minimax-m2.7",
7937
7842
  name: "MiniMax M2.7",
@@ -8567,30 +8472,13 @@ export const MODELS = {
8567
8472
  reasoning: true,
8568
8473
  input: ["text", "image"],
8569
8474
  cost: {
8570
- input: 3,
8571
- output: 15,
8572
- cacheRead: 0.3,
8573
- cacheWrite: 3.75,
8574
- },
8575
- contextWindow: 1000000,
8576
- maxTokens: 128000,
8577
- },
8578
- "arcee-ai/trinity-large-preview": {
8579
- id: "arcee-ai/trinity-large-preview",
8580
- name: "Arcee AI: Trinity Large Preview",
8581
- api: "openai-completions",
8582
- provider: "openrouter",
8583
- baseUrl: "https://openrouter.ai/api/v1",
8584
- reasoning: false,
8585
- input: ["text"],
8586
- cost: {
8587
- input: 0.15,
8588
- output: 0.44999999999999996,
8589
- cacheRead: 0,
8590
- cacheWrite: 0,
8475
+ input: 3,
8476
+ output: 15,
8477
+ cacheRead: 0.3,
8478
+ cacheWrite: 3.75,
8591
8479
  },
8592
- contextWindow: 131000,
8593
- maxTokens: 4096,
8480
+ contextWindow: 1000000,
8481
+ maxTokens: 128000,
8594
8482
  },
8595
8483
  "arcee-ai/trinity-large-thinking": {
8596
8484
  id: "arcee-ai/trinity-large-thinking",
@@ -9054,7 +8942,7 @@ export const MODELS = {
9054
8942
  cacheRead: 0.024999999999999998,
9055
8943
  cacheWrite: 0.08333333333333334,
9056
8944
  },
9057
- contextWindow: 1048576,
8945
+ contextWindow: 1000000,
9058
8946
  maxTokens: 8192,
9059
8947
  },
9060
8948
  "google/gemini-2.0-flash-lite-001": {
@@ -9261,6 +9149,23 @@ export const MODELS = {
9261
9149
  contextWindow: 1048756,
9262
9150
  maxTokens: 65536,
9263
9151
  },
9152
+ "google/gemini-3.5-flash": {
9153
+ id: "google/gemini-3.5-flash",
9154
+ name: "Google: Gemini 3.5 Flash",
9155
+ api: "openai-completions",
9156
+ provider: "openrouter",
9157
+ baseUrl: "https://openrouter.ai/api/v1",
9158
+ reasoning: true,
9159
+ input: ["text", "image"],
9160
+ cost: {
9161
+ input: 1.5,
9162
+ output: 9,
9163
+ cacheRead: 0.15,
9164
+ cacheWrite: 0.08333333333333334,
9165
+ },
9166
+ contextWindow: 1048576,
9167
+ maxTokens: 65536,
9168
+ },
9264
9169
  "google/gemma-3-12b-it": {
9265
9170
  id: "google/gemma-3-12b-it",
9266
9171
  name: "Google: Gemma 3 12B",
@@ -9304,13 +9209,13 @@ export const MODELS = {
9304
9209
  reasoning: true,
9305
9210
  input: ["text", "image"],
9306
9211
  cost: {
9307
- input: 0.07,
9308
- output: 0.33999999999999997,
9212
+ input: 0.06,
9213
+ output: 0.33,
9309
9214
  cacheRead: 0,
9310
9215
  cacheWrite: 0,
9311
9216
  },
9312
9217
  contextWindow: 262144,
9313
- maxTokens: 16384,
9218
+ maxTokens: 4096,
9314
9219
  },
9315
9220
  "google/gemma-4-26b-a4b-it:free": {
9316
9221
  id: "google/gemma-4-26b-a4b-it:free",
@@ -9407,9 +9312,9 @@ export const MODELS = {
9407
9312
  reasoning: false,
9408
9313
  input: ["text"],
9409
9314
  cost: {
9410
- input: 0.3,
9411
- output: 2.5,
9412
- cacheRead: 0.06,
9315
+ input: 0.075,
9316
+ output: 0.625,
9317
+ cacheRead: 0.015,
9413
9318
  cacheWrite: 0,
9414
9319
  },
9415
9320
  contextWindow: 262144,
@@ -9901,12 +9806,12 @@ export const MODELS = {
9901
9806
  input: ["text"],
9902
9807
  cost: {
9903
9808
  input: 0.02,
9904
- output: 0.04,
9809
+ output: 0.03,
9905
9810
  cacheRead: 0,
9906
9811
  cacheWrite: 0,
9907
9812
  },
9908
9813
  contextWindow: 131072,
9909
- maxTokens: 16384,
9814
+ maxTokens: 4096,
9910
9815
  },
9911
9816
  "mistralai/mistral-saba": {
9912
9817
  id: "mistralai/mistral-saba",
@@ -10189,13 +10094,13 @@ export const MODELS = {
10189
10094
  reasoning: true,
10190
10095
  input: ["text"],
10191
10096
  cost: {
10192
- input: 0.09999999999999999,
10193
- output: 0.5,
10097
+ input: 0.09,
10098
+ output: 0.44999999999999996,
10194
10099
  cacheRead: 0,
10195
10100
  cacheWrite: 0,
10196
10101
  },
10197
10102
  contextWindow: 1000000,
10198
- maxTokens: 16384,
10103
+ maxTokens: 4096,
10199
10104
  },
10200
10105
  "nvidia/nemotron-3-super-120b-a12b:free": {
10201
10106
  id: "nvidia/nemotron-3-super-120b-a12b:free",
@@ -11018,12 +10923,12 @@ export const MODELS = {
11018
10923
  input: ["text"],
11019
10924
  cost: {
11020
10925
  input: 0.039,
11021
- output: 0.19,
10926
+ output: 0.18,
11022
10927
  cacheRead: 0,
11023
10928
  cacheWrite: 0,
11024
10929
  },
11025
10930
  contextWindow: 131072,
11026
- maxTokens: 131072,
10931
+ maxTokens: 4096,
11027
10932
  },
11028
10933
  "openai/gpt-oss-120b:free": {
11029
10934
  id: "openai/gpt-oss-120b:free",
@@ -11935,13 +11840,13 @@ export const MODELS = {
11935
11840
  reasoning: true,
11936
11841
  input: ["text", "image"],
11937
11842
  cost: {
11938
- input: 0.14,
11843
+ input: 0.13899999999999998,
11939
11844
  output: 1,
11940
- cacheRead: 0.049999999999999996,
11845
+ cacheRead: 0,
11941
11846
  cacheWrite: 0,
11942
11847
  },
11943
11848
  contextWindow: 262144,
11944
- maxTokens: 81920,
11849
+ maxTokens: 4096,
11945
11850
  },
11946
11851
  "qwen/qwen3.5-397b-a17b": {
11947
11852
  id: "qwen/qwen3.5-397b-a17b",
@@ -11954,7 +11859,7 @@ export const MODELS = {
11954
11859
  cost: {
11955
11860
  input: 0.39,
11956
11861
  output: 2.34,
11957
- cacheRead: 0.195,
11862
+ cacheRead: 0,
11958
11863
  cacheWrite: 0,
11959
11864
  },
11960
11865
  contextWindow: 262144,
@@ -12037,13 +11942,13 @@ export const MODELS = {
12037
11942
  reasoning: true,
12038
11943
  input: ["text", "image"],
12039
11944
  cost: {
12040
- input: 0.32,
11945
+ input: 0.317,
12041
11946
  output: 3.1999999999999997,
12042
11947
  cacheRead: 0,
12043
11948
  cacheWrite: 0,
12044
11949
  },
12045
11950
  contextWindow: 262144,
12046
- maxTokens: 81920,
11951
+ maxTokens: 262140,
12047
11952
  },
12048
11953
  "qwen/qwen3.6-35b-a3b": {
12049
11954
  id: "qwen/qwen3.6-35b-a3b",
@@ -12113,6 +12018,23 @@ export const MODELS = {
12113
12018
  contextWindow: 1000000,
12114
12019
  maxTokens: 65536,
12115
12020
  },
12021
+ "qwen/qwen3.7-max": {
12022
+ id: "qwen/qwen3.7-max",
12023
+ name: "Qwen: Qwen3.7 Max",
12024
+ api: "openai-completions",
12025
+ provider: "openrouter",
12026
+ baseUrl: "https://openrouter.ai/api/v1",
12027
+ reasoning: true,
12028
+ input: ["text"],
12029
+ cost: {
12030
+ input: 2.5,
12031
+ output: 7.5,
12032
+ cacheRead: 0,
12033
+ cacheWrite: 3.125,
12034
+ },
12035
+ contextWindow: 1000000,
12036
+ maxTokens: 65536,
12037
+ },
12116
12038
  "rekaai/reka-edge": {
12117
12039
  id: "rekaai/reka-edge",
12118
12040
  name: "Reka Edge",
@@ -12190,13 +12112,13 @@ export const MODELS = {
12190
12112
  reasoning: true,
12191
12113
  input: ["text"],
12192
12114
  cost: {
12193
- input: 0.09999999999999999,
12115
+ input: 0.09,
12194
12116
  output: 0.3,
12195
- cacheRead: 0,
12117
+ cacheRead: 0.02,
12196
12118
  cacheWrite: 0,
12197
12119
  },
12198
12120
  contextWindow: 262144,
12199
- maxTokens: 65536,
12121
+ maxTokens: 16384,
12200
12122
  },
12201
12123
  "tencent/hy3-preview": {
12202
12124
  id: "tencent/hy3-preview",
@@ -12300,6 +12222,23 @@ export const MODELS = {
12300
12222
  contextWindow: 1000000,
12301
12223
  maxTokens: 4096,
12302
12224
  },
12225
+ "x-ai/grok-build-0.1": {
12226
+ id: "x-ai/grok-build-0.1",
12227
+ name: "xAI: Grok Build 0.1",
12228
+ api: "openai-completions",
12229
+ provider: "openrouter",
12230
+ baseUrl: "https://openrouter.ai/api/v1",
12231
+ reasoning: true,
12232
+ input: ["text", "image"],
12233
+ cost: {
12234
+ input: 1,
12235
+ output: 2,
12236
+ cacheRead: 0.19999999999999998,
12237
+ cacheWrite: 0,
12238
+ },
12239
+ contextWindow: 256000,
12240
+ maxTokens: 4096,
12241
+ },
12303
12242
  "xiaomi/mimo-v2-flash": {
12304
12243
  id: "xiaomi/mimo-v2-flash",
12305
12244
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12666,9 +12605,9 @@ export const MODELS = {
12666
12605
  reasoning: true,
12667
12606
  input: ["text", "image"],
12668
12607
  cost: {
12669
- input: 0.5,
12670
- output: 3,
12671
- cacheRead: 0.049999999999999996,
12608
+ input: 1.5,
12609
+ output: 9,
12610
+ cacheRead: 0.15,
12672
12611
  cacheWrite: 0.08333333333333334,
12673
12612
  },
12674
12613
  contextWindow: 1048576,
@@ -13372,6 +13311,23 @@ export const MODELS = {
13372
13311
  contextWindow: 1000000,
13373
13312
  maxTokens: 64000,
13374
13313
  },
13314
+ "alibaba/qwen3.7-max": {
13315
+ id: "alibaba/qwen3.7-max",
13316
+ name: "Qwen 3.7 Max",
13317
+ api: "anthropic-messages",
13318
+ provider: "vercel-ai-gateway",
13319
+ baseUrl: "https://ai-gateway.vercel.sh",
13320
+ reasoning: true,
13321
+ input: ["text", "image"],
13322
+ cost: {
13323
+ input: 2.5,
13324
+ output: 7.5,
13325
+ cacheRead: 0.5,
13326
+ cacheWrite: 3.125,
13327
+ },
13328
+ contextWindow: 991000,
13329
+ maxTokens: 64000,
13330
+ },
13375
13331
  "anthropic/claude-3-haiku": {
13376
13332
  id: "anthropic/claude-3-haiku",
13377
13333
  name: "Claude 3 Haiku",
@@ -13935,6 +13891,23 @@ export const MODELS = {
13935
13891
  contextWindow: 1000000,
13936
13892
  maxTokens: 64000,
13937
13893
  },
13894
+ "google/gemini-3.5-flash": {
13895
+ id: "google/gemini-3.5-flash",
13896
+ name: "Gemini 3.5 Flash",
13897
+ api: "anthropic-messages",
13898
+ provider: "vercel-ai-gateway",
13899
+ baseUrl: "https://ai-gateway.vercel.sh",
13900
+ reasoning: true,
13901
+ input: ["text", "image"],
13902
+ cost: {
13903
+ input: 1.5,
13904
+ output: 9,
13905
+ cacheRead: 0.15,
13906
+ cacheWrite: 0,
13907
+ },
13908
+ contextWindow: 1000000,
13909
+ maxTokens: 64000,
13910
+ },
13938
13911
  "google/gemma-4-26b-a4b-it": {
13939
13912
  id: "google/gemma-4-26b-a4b-it",
13940
13913
  name: "Gemma 4 26B A4B IT",
@@ -14394,6 +14367,23 @@ export const MODELS = {
14394
14367
  contextWindow: 128000,
14395
14368
  maxTokens: 64000,
14396
14369
  },
14370
+ "mistral/mistral-medium-3.5": {
14371
+ id: "mistral/mistral-medium-3.5",
14372
+ name: "Mistral Medium Latest",
14373
+ api: "anthropic-messages",
14374
+ provider: "vercel-ai-gateway",
14375
+ baseUrl: "https://ai-gateway.vercel.sh",
14376
+ reasoning: true,
14377
+ input: ["text"],
14378
+ cost: {
14379
+ input: 1.5,
14380
+ output: 7.5,
14381
+ cacheRead: 0,
14382
+ cacheWrite: 0,
14383
+ },
14384
+ contextWindow: 256000,
14385
+ maxTokens: 256000,
14386
+ },
14397
14387
  "mistral/mistral-small": {
14398
14388
  id: "mistral/mistral-small",
14399
14389
  name: "Mistral Small",
@@ -15409,6 +15399,23 @@ export const MODELS = {
15409
15399
  contextWindow: 1000000,
15410
15400
  maxTokens: 1000000,
15411
15401
  },
15402
+ "xai/grok-build-0.1": {
15403
+ id: "xai/grok-build-0.1",
15404
+ name: "Grok Build 0.1",
15405
+ api: "anthropic-messages",
15406
+ provider: "vercel-ai-gateway",
15407
+ baseUrl: "https://ai-gateway.vercel.sh",
15408
+ reasoning: true,
15409
+ input: ["text", "image"],
15410
+ cost: {
15411
+ input: 1,
15412
+ output: 2,
15413
+ cacheRead: 0.19999999999999998,
15414
+ cacheWrite: 0,
15415
+ },
15416
+ contextWindow: 256000,
15417
+ maxTokens: 256000,
15418
+ },
15412
15419
  "xiaomi/mimo-v2-flash": {
15413
15420
  id: "xiaomi/mimo-v2-flash",
15414
15421
  name: "MiMo V2 Flash",
@@ -15700,108 +15707,6 @@ export const MODELS = {
15700
15707
  },
15701
15708
  },
15702
15709
  "xai": {
15703
- "grok-2": {
15704
- id: "grok-2",
15705
- name: "Grok 2",
15706
- api: "openai-completions",
15707
- provider: "xai",
15708
- baseUrl: "https://api.x.ai/v1",
15709
- reasoning: false,
15710
- input: ["text"],
15711
- cost: {
15712
- input: 2,
15713
- output: 10,
15714
- cacheRead: 2,
15715
- cacheWrite: 0,
15716
- },
15717
- contextWindow: 131072,
15718
- maxTokens: 8192,
15719
- },
15720
- "grok-2-1212": {
15721
- id: "grok-2-1212",
15722
- name: "Grok 2 (1212)",
15723
- api: "openai-completions",
15724
- provider: "xai",
15725
- baseUrl: "https://api.x.ai/v1",
15726
- reasoning: false,
15727
- input: ["text"],
15728
- cost: {
15729
- input: 2,
15730
- output: 10,
15731
- cacheRead: 2,
15732
- cacheWrite: 0,
15733
- },
15734
- contextWindow: 131072,
15735
- maxTokens: 8192,
15736
- },
15737
- "grok-2-latest": {
15738
- id: "grok-2-latest",
15739
- name: "Grok 2 Latest",
15740
- api: "openai-completions",
15741
- provider: "xai",
15742
- baseUrl: "https://api.x.ai/v1",
15743
- reasoning: false,
15744
- input: ["text"],
15745
- cost: {
15746
- input: 2,
15747
- output: 10,
15748
- cacheRead: 2,
15749
- cacheWrite: 0,
15750
- },
15751
- contextWindow: 131072,
15752
- maxTokens: 8192,
15753
- },
15754
- "grok-2-vision": {
15755
- id: "grok-2-vision",
15756
- name: "Grok 2 Vision",
15757
- api: "openai-completions",
15758
- provider: "xai",
15759
- baseUrl: "https://api.x.ai/v1",
15760
- reasoning: false,
15761
- input: ["text", "image"],
15762
- cost: {
15763
- input: 2,
15764
- output: 10,
15765
- cacheRead: 2,
15766
- cacheWrite: 0,
15767
- },
15768
- contextWindow: 8192,
15769
- maxTokens: 4096,
15770
- },
15771
- "grok-2-vision-1212": {
15772
- id: "grok-2-vision-1212",
15773
- name: "Grok 2 Vision (1212)",
15774
- api: "openai-completions",
15775
- provider: "xai",
15776
- baseUrl: "https://api.x.ai/v1",
15777
- reasoning: false,
15778
- input: ["text", "image"],
15779
- cost: {
15780
- input: 2,
15781
- output: 10,
15782
- cacheRead: 2,
15783
- cacheWrite: 0,
15784
- },
15785
- contextWindow: 8192,
15786
- maxTokens: 4096,
15787
- },
15788
- "grok-2-vision-latest": {
15789
- id: "grok-2-vision-latest",
15790
- name: "Grok 2 Vision Latest",
15791
- api: "openai-completions",
15792
- provider: "xai",
15793
- baseUrl: "https://api.x.ai/v1",
15794
- reasoning: false,
15795
- input: ["text", "image"],
15796
- cost: {
15797
- input: 2,
15798
- output: 10,
15799
- cacheRead: 2,
15800
- cacheWrite: 0,
15801
- },
15802
- contextWindow: 8192,
15803
- maxTokens: 4096,
15804
- },
15805
15710
  "grok-3": {
15806
15711
  id: "grok-3",
15807
15712
  name: "Grok 3",
@@ -15845,8 +15750,8 @@ export const MODELS = {
15845
15750
  reasoning: false,
15846
15751
  input: ["text", "image"],
15847
15752
  cost: {
15848
- input: 2,
15849
- output: 6,
15753
+ input: 1.25,
15754
+ output: 2.5,
15850
15755
  cacheRead: 0.2,
15851
15756
  cacheWrite: 0,
15852
15757
  },
@@ -15862,8 +15767,8 @@ export const MODELS = {
15862
15767
  reasoning: true,
15863
15768
  input: ["text", "image"],
15864
15769
  cost: {
15865
- input: 2,
15866
- output: 6,
15770
+ input: 1.25,
15771
+ output: 2.5,
15867
15772
  cacheRead: 0.2,
15868
15773
  cacheWrite: 0,
15869
15774
  },
@@ -15887,22 +15792,22 @@ export const MODELS = {
15887
15792
  contextWindow: 1000000,
15888
15793
  maxTokens: 30000,
15889
15794
  },
15890
- "grok-beta": {
15891
- id: "grok-beta",
15892
- name: "Grok Beta",
15795
+ "grok-build-0.1": {
15796
+ id: "grok-build-0.1",
15797
+ name: "Grok Build 0.1",
15893
15798
  api: "openai-completions",
15894
15799
  provider: "xai",
15895
15800
  baseUrl: "https://api.x.ai/v1",
15896
- reasoning: false,
15897
- input: ["text"],
15801
+ reasoning: true,
15802
+ input: ["text", "image"],
15898
15803
  cost: {
15899
- input: 5,
15900
- output: 15,
15901
- cacheRead: 5,
15804
+ input: 1,
15805
+ output: 2,
15806
+ cacheRead: 0.2,
15902
15807
  cacheWrite: 0,
15903
15808
  },
15904
- contextWindow: 131072,
15905
- maxTokens: 4096,
15809
+ contextWindow: 256000,
15810
+ maxTokens: 256000,
15906
15811
  },
15907
15812
  "grok-code-fast-1": {
15908
15813
  id: "grok-code-fast-1",
@@ -15921,23 +15826,6 @@ export const MODELS = {
15921
15826
  contextWindow: 32768,
15922
15827
  maxTokens: 8192,
15923
15828
  },
15924
- "grok-vision-beta": {
15925
- id: "grok-vision-beta",
15926
- name: "Grok Vision Beta",
15927
- api: "openai-completions",
15928
- provider: "xai",
15929
- baseUrl: "https://api.x.ai/v1",
15930
- reasoning: false,
15931
- input: ["text", "image"],
15932
- cost: {
15933
- input: 5,
15934
- output: 15,
15935
- cacheRead: 5,
15936
- cacheWrite: 0,
15937
- },
15938
- contextWindow: 8192,
15939
- maxTokens: 4096,
15940
- },
15941
15829
  },
15942
15830
  "xiaomi": {
15943
15831
  "mimo-v2-flash": {