@earendil-works/pi-ai 0.79.2 → 0.79.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -3942,9 +3942,9 @@ export const MODELS = {
3942
3942
  contextWindow: 131072,
3943
3943
  maxTokens: 32768,
3944
3944
  },
3945
- "accounts/fireworks/models/kimi-k2p5": {
3946
- id: "accounts/fireworks/models/kimi-k2p5",
3947
- name: "Kimi K2.5",
3945
+ "accounts/fireworks/models/kimi-k2p6": {
3946
+ id: "accounts/fireworks/models/kimi-k2p6",
3947
+ name: "Kimi K2.6",
3948
3948
  api: "anthropic-messages",
3949
3949
  provider: "fireworks",
3950
3950
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3952,17 +3952,17 @@ export const MODELS = {
3952
3952
  reasoning: true,
3953
3953
  input: ["text", "image"],
3954
3954
  cost: {
3955
- input: 0.6,
3956
- output: 3,
3957
- cacheRead: 0.1,
3955
+ input: 0.95,
3956
+ output: 4,
3957
+ cacheRead: 0.16,
3958
3958
  cacheWrite: 0,
3959
3959
  },
3960
- contextWindow: 256000,
3961
- maxTokens: 256000,
3960
+ contextWindow: 262000,
3961
+ maxTokens: 262000,
3962
3962
  },
3963
- "accounts/fireworks/models/kimi-k2p6": {
3964
- id: "accounts/fireworks/models/kimi-k2p6",
3965
- name: "Kimi K2.6",
3963
+ "accounts/fireworks/models/kimi-k2p7-code": {
3964
+ id: "accounts/fireworks/models/kimi-k2p7-code",
3965
+ name: "Kimi K2.7 Code",
3966
3966
  api: "anthropic-messages",
3967
3967
  provider: "fireworks",
3968
3968
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3972,15 +3972,15 @@ export const MODELS = {
3972
3972
  cost: {
3973
3973
  input: 0.95,
3974
3974
  output: 4,
3975
- cacheRead: 0.16,
3975
+ cacheRead: 0.19,
3976
3976
  cacheWrite: 0,
3977
3977
  },
3978
3978
  contextWindow: 262000,
3979
3979
  maxTokens: 262000,
3980
3980
  },
3981
- "accounts/fireworks/models/minimax-m2p5": {
3982
- id: "accounts/fireworks/models/minimax-m2p5",
3983
- name: "MiniMax-M2.5",
3981
+ "accounts/fireworks/models/minimax-m2p7": {
3982
+ id: "accounts/fireworks/models/minimax-m2p7",
3983
+ name: "MiniMax-M2.7",
3984
3984
  api: "anthropic-messages",
3985
3985
  provider: "fireworks",
3986
3986
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3990,15 +3990,15 @@ export const MODELS = {
3990
3990
  cost: {
3991
3991
  input: 0.3,
3992
3992
  output: 1.2,
3993
- cacheRead: 0.03,
3993
+ cacheRead: 0.06,
3994
3994
  cacheWrite: 0,
3995
3995
  },
3996
3996
  contextWindow: 196608,
3997
3997
  maxTokens: 196608,
3998
3998
  },
3999
- "accounts/fireworks/models/minimax-m2p7": {
4000
- id: "accounts/fireworks/models/minimax-m2p7",
4001
- name: "MiniMax-M2.7",
3999
+ "accounts/fireworks/models/minimax-m3": {
4000
+ id: "accounts/fireworks/models/minimax-m3",
4001
+ name: "MiniMax-M3",
4002
4002
  api: "anthropic-messages",
4003
4003
  provider: "fireworks",
4004
4004
  baseUrl: "https://api.fireworks.ai/inference",
@@ -4011,12 +4011,12 @@ export const MODELS = {
4011
4011
  cacheRead: 0.06,
4012
4012
  cacheWrite: 0,
4013
4013
  },
4014
- contextWindow: 196608,
4015
- maxTokens: 196608,
4014
+ contextWindow: 512000,
4015
+ maxTokens: 512000,
4016
4016
  },
4017
- "accounts/fireworks/models/qwen3p6-plus": {
4018
- id: "accounts/fireworks/models/qwen3p6-plus",
4019
- name: "Qwen 3.6 Plus",
4017
+ "accounts/fireworks/models/qwen3p7-plus": {
4018
+ id: "accounts/fireworks/models/qwen3p7-plus",
4019
+ name: "Qwen 3.7 Plus",
4020
4020
  api: "anthropic-messages",
4021
4021
  provider: "fireworks",
4022
4022
  baseUrl: "https://api.fireworks.ai/inference",
@@ -4024,9 +4024,9 @@ export const MODELS = {
4024
4024
  reasoning: true,
4025
4025
  input: ["text", "image"],
4026
4026
  cost: {
4027
- input: 0.5,
4028
- output: 3,
4029
- cacheRead: 0.1,
4027
+ input: 0.4,
4028
+ output: 1.6,
4029
+ cacheRead: 0.08,
4030
4030
  cacheWrite: 0,
4031
4031
  },
4032
4032
  contextWindow: 262144,
@@ -4086,6 +4086,24 @@ export const MODELS = {
4086
4086
  contextWindow: 262000,
4087
4087
  maxTokens: 262000,
4088
4088
  },
4089
+ "accounts/fireworks/routers/kimi-k2p7-code-fast": {
4090
+ id: "accounts/fireworks/routers/kimi-k2p7-code-fast",
4091
+ name: "Kimi K2.7 Code Fast",
4092
+ api: "anthropic-messages",
4093
+ provider: "fireworks",
4094
+ baseUrl: "https://api.fireworks.ai/inference",
4095
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
4096
+ reasoning: true,
4097
+ input: ["text", "image"],
4098
+ cost: {
4099
+ input: 2,
4100
+ output: 8,
4101
+ cacheRead: 0.38,
4102
+ cacheWrite: 0,
4103
+ },
4104
+ contextWindow: 262000,
4105
+ maxTokens: 262000,
4106
+ },
4089
4107
  },
4090
4108
  "github-copilot": {
4091
4109
  "claude-fable-5": {
@@ -4173,7 +4191,7 @@ export const MODELS = {
4173
4191
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4174
4192
  compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
4175
4193
  reasoning: true,
4176
- thinkingLevelMap: { "xhigh": "xhigh" },
4194
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
4177
4195
  input: ["text", "image"],
4178
4196
  cost: {
4179
4197
  input: 5,
@@ -4193,7 +4211,7 @@ export const MODELS = {
4193
4211
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4194
4212
  compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
4195
4213
  reasoning: true,
4196
- thinkingLevelMap: { "xhigh": "xhigh" },
4214
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
4197
4215
  input: ["text", "image"],
4198
4216
  cost: {
4199
4217
  input: 5,
@@ -4251,6 +4269,7 @@ export const MODELS = {
4251
4269
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4252
4270
  compat: { "forceAdaptiveThinking": true },
4253
4271
  reasoning: true,
4272
+ thinkingLevelMap: { "minimal": "low", "xhigh": "max" },
4254
4273
  input: ["text", "image"],
4255
4274
  cost: {
4256
4275
  input: 3,
@@ -4810,6 +4829,42 @@ export const MODELS = {
4810
4829
  contextWindow: 262144,
4811
4830
  maxTokens: 32768,
4812
4831
  },
4832
+ "gemma-4-E2B-it": {
4833
+ id: "gemma-4-E2B-it",
4834
+ name: "Gemma 4 E2B IT",
4835
+ api: "google-generative-ai",
4836
+ provider: "google",
4837
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4838
+ reasoning: true,
4839
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4840
+ input: ["text", "image"],
4841
+ cost: {
4842
+ input: 0,
4843
+ output: 0,
4844
+ cacheRead: 0,
4845
+ cacheWrite: 0,
4846
+ },
4847
+ contextWindow: 131072,
4848
+ maxTokens: 8192,
4849
+ },
4850
+ "gemma-4-E4B-it": {
4851
+ id: "gemma-4-E4B-it",
4852
+ name: "Gemma 4 E4B IT",
4853
+ api: "google-generative-ai",
4854
+ provider: "google",
4855
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4856
+ reasoning: true,
4857
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4858
+ input: ["text", "image"],
4859
+ cost: {
4860
+ input: 0,
4861
+ output: 0,
4862
+ cacheRead: 0,
4863
+ cacheWrite: 0,
4864
+ },
4865
+ contextWindow: 131072,
4866
+ maxTokens: 8192,
4867
+ },
4813
4868
  },
4814
4869
  "google-vertex": {
4815
4870
  "gemini-1.5-flash": {
@@ -7379,7 +7434,7 @@ export const MODELS = {
7379
7434
  cacheRead: 0.25,
7380
7435
  cacheWrite: 0,
7381
7436
  },
7382
- contextWindow: 1050000,
7437
+ contextWindow: 272000,
7383
7438
  maxTokens: 128000,
7384
7439
  },
7385
7440
  "gpt-5.4-mini": {
@@ -7451,7 +7506,7 @@ export const MODELS = {
7451
7506
  cacheRead: 0.5,
7452
7507
  cacheWrite: 0,
7453
7508
  },
7454
- contextWindow: 1050000,
7509
+ contextWindow: 272000,
7455
7510
  maxTokens: 128000,
7456
7511
  },
7457
7512
  "gpt-5.5-pro": {
@@ -7643,7 +7698,7 @@ export const MODELS = {
7643
7698
  cacheRead: 0.25,
7644
7699
  cacheWrite: 0,
7645
7700
  },
7646
- contextWindow: 1000000,
7701
+ contextWindow: 272000,
7647
7702
  maxTokens: 128000,
7648
7703
  },
7649
7704
  "gpt-5.4-mini": {
@@ -7661,7 +7716,7 @@ export const MODELS = {
7661
7716
  cacheRead: 0.075,
7662
7717
  cacheWrite: 0,
7663
7718
  },
7664
- contextWindow: 400000,
7719
+ contextWindow: 272000,
7665
7720
  maxTokens: 128000,
7666
7721
  },
7667
7722
  "gpt-5.5": {
@@ -7679,7 +7734,7 @@ export const MODELS = {
7679
7734
  cacheRead: 0.5,
7680
7735
  cacheWrite: 0,
7681
7736
  },
7682
- contextWindow: 400000,
7737
+ contextWindow: 272000,
7683
7738
  maxTokens: 128000,
7684
7739
  },
7685
7740
  },
@@ -7702,25 +7757,6 @@ export const MODELS = {
7702
7757
  contextWindow: 200000,
7703
7758
  maxTokens: 32000,
7704
7759
  },
7705
- "claude-fable-5": {
7706
- id: "claude-fable-5",
7707
- name: "Claude Fable 5",
7708
- api: "anthropic-messages",
7709
- provider: "opencode",
7710
- baseUrl: "https://opencode.ai/zen",
7711
- compat: { "forceAdaptiveThinking": true },
7712
- reasoning: true,
7713
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7714
- input: ["text", "image"],
7715
- cost: {
7716
- input: 10,
7717
- output: 50,
7718
- cacheRead: 1,
7719
- cacheWrite: 12.5,
7720
- },
7721
- contextWindow: 1000000,
7722
- maxTokens: 128000,
7723
- },
7724
7760
  "claude-haiku-4-5": {
7725
7761
  id: "claude-haiku-4-5",
7726
7762
  name: "Claude Haiku 4.5",
@@ -7887,7 +7923,7 @@ export const MODELS = {
7887
7923
  api: "openai-completions",
7888
7924
  provider: "opencode",
7889
7925
  baseUrl: "https://opencode.ai/zen/v1",
7890
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7926
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7891
7927
  reasoning: true,
7892
7928
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7893
7929
  input: ["text"],
@@ -7925,7 +7961,7 @@ export const MODELS = {
7925
7961
  api: "openai-completions",
7926
7962
  provider: "opencode",
7927
7963
  baseUrl: "https://opencode.ai/zen/v1",
7928
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7964
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7929
7965
  reasoning: true,
7930
7966
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7931
7967
  input: ["text"],
@@ -8341,7 +8377,7 @@ export const MODELS = {
8341
8377
  api: "openai-completions",
8342
8378
  provider: "opencode",
8343
8379
  baseUrl: "https://opencode.ai/zen/v1",
8344
- compat: { "maxTokensField": "max_tokens" },
8380
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8345
8381
  reasoning: true,
8346
8382
  input: ["text", "image"],
8347
8383
  cost: {
@@ -8359,7 +8395,7 @@ export const MODELS = {
8359
8395
  api: "openai-completions",
8360
8396
  provider: "opencode",
8361
8397
  baseUrl: "https://opencode.ai/zen/v1",
8362
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8398
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8363
8399
  reasoning: true,
8364
8400
  input: ["text", "image"],
8365
8401
  cost: {
@@ -8413,7 +8449,7 @@ export const MODELS = {
8413
8449
  api: "openai-completions",
8414
8450
  provider: "opencode",
8415
8451
  baseUrl: "https://opencode.ai/zen/v1",
8416
- compat: { "maxTokensField": "max_tokens" },
8452
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8417
8453
  reasoning: true,
8418
8454
  input: ["text"],
8419
8455
  cost: {
@@ -8577,7 +8613,7 @@ export const MODELS = {
8577
8613
  api: "openai-completions",
8578
8614
  provider: "opencode-go",
8579
8615
  baseUrl: "https://opencode.ai/zen/go/v1",
8580
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8616
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8581
8617
  reasoning: true,
8582
8618
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8583
8619
  input: ["text", "image"],
@@ -9430,13 +9466,13 @@ export const MODELS = {
9430
9466
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
9431
9467
  input: ["text"],
9432
9468
  cost: {
9433
- input: 0.098,
9434
- output: 0.196,
9469
+ input: 0.09,
9470
+ output: 0.18,
9435
9471
  cacheRead: 0.02,
9436
9472
  cacheWrite: 0,
9437
9473
  },
9438
9474
  contextWindow: 1048576,
9439
- maxTokens: 4096,
9475
+ maxTokens: 65536,
9440
9476
  },
9441
9477
  "deepseek/deepseek-v4-pro": {
9442
9478
  id: "deepseek/deepseek-v4-pro",
@@ -10471,13 +10507,13 @@ export const MODELS = {
10471
10507
  reasoning: true,
10472
10508
  input: ["text", "image"],
10473
10509
  cost: {
10474
- input: 0.95,
10475
- output: 4,
10476
- cacheRead: 0.19,
10510
+ input: 0.75,
10511
+ output: 3.5,
10512
+ cacheRead: 0.16,
10477
10513
  cacheWrite: 0,
10478
10514
  },
10479
10515
  contextWindow: 262144,
10480
- maxTokens: 4096,
10516
+ maxTokens: 262144,
10481
10517
  },
10482
10518
  "nex-agi/nex-n2-pro:free": {
10483
10519
  id: "nex-agi/nex-n2-pro:free",
@@ -13079,6 +13115,25 @@ export const MODELS = {
13079
13115
  contextWindow: 202752,
13080
13116
  maxTokens: 131072,
13081
13117
  },
13118
+ "MiniMaxAI/MiniMax-M3": {
13119
+ id: "MiniMaxAI/MiniMax-M3",
13120
+ name: "MiniMax-M3",
13121
+ api: "openai-completions",
13122
+ provider: "together",
13123
+ baseUrl: "https://api.together.ai/v1",
13124
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13125
+ reasoning: true,
13126
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13127
+ input: ["text", "image"],
13128
+ cost: {
13129
+ input: 0.3,
13130
+ output: 1.2,
13131
+ cacheRead: 0.06,
13132
+ cacheWrite: 0,
13133
+ },
13134
+ contextWindow: 524288,
13135
+ maxTokens: 250000,
13136
+ },
13082
13137
  "Qwen/Qwen2.5-7B-Instruct-Turbo": {
13083
13138
  id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
13084
13139
  name: "Qwen 2.5 7B Instruct Turbo",
@@ -13283,6 +13338,25 @@ export const MODELS = {
13283
13338
  contextWindow: 262144,
13284
13339
  maxTokens: 131000,
13285
13340
  },
13341
+ "moonshotai/Kimi-K2.7-Code": {
13342
+ id: "moonshotai/Kimi-K2.7-Code",
13343
+ name: "Kimi K2.7 Code",
13344
+ api: "openai-completions",
13345
+ provider: "together",
13346
+ baseUrl: "https://api.together.ai/v1",
13347
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13348
+ reasoning: true,
13349
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13350
+ input: ["text"],
13351
+ cost: {
13352
+ input: 0.95,
13353
+ output: 4,
13354
+ cacheRead: 0.19,
13355
+ cacheWrite: 0,
13356
+ },
13357
+ contextWindow: 262144,
13358
+ maxTokens: 131072,
13359
+ },
13286
13360
  "nvidia/nemotron-3-ultra-550b-a55b": {
13287
13361
  id: "nvidia/nemotron-3-ultra-550b-a55b",
13288
13362
  name: "Nemotron 3 Ultra 550B A55B",
@@ -13788,25 +13862,6 @@ export const MODELS = {
13788
13862
  contextWindow: 200000,
13789
13863
  maxTokens: 8192,
13790
13864
  },
13791
- "anthropic/claude-fable-5": {
13792
- id: "anthropic/claude-fable-5",
13793
- name: "Claude Fable 5",
13794
- api: "anthropic-messages",
13795
- provider: "vercel-ai-gateway",
13796
- baseUrl: "https://ai-gateway.vercel.sh",
13797
- compat: { "forceAdaptiveThinking": true },
13798
- reasoning: true,
13799
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
13800
- input: ["text", "image"],
13801
- cost: {
13802
- input: 10,
13803
- output: 50,
13804
- cacheRead: 1,
13805
- cacheWrite: 12.5,
13806
- },
13807
- contextWindow: 1000000,
13808
- maxTokens: 128000,
13809
- },
13810
13865
  "anthropic/claude-haiku-4.5": {
13811
13866
  id: "anthropic/claude-haiku-4.5",
13812
13867
  name: "Claude Haiku 4.5",
@@ -16821,6 +16876,24 @@ export const MODELS = {
16821
16876
  contextWindow: 200000,
16822
16877
  maxTokens: 131072,
16823
16878
  },
16879
+ "glm-5.2": {
16880
+ id: "glm-5.2",
16881
+ name: "GLM-5.2",
16882
+ api: "openai-completions",
16883
+ provider: "zai",
16884
+ baseUrl: "https://api.z.ai/api/coding/paas/v4",
16885
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16886
+ reasoning: true,
16887
+ input: ["text"],
16888
+ cost: {
16889
+ input: 0,
16890
+ output: 0,
16891
+ cacheRead: 0,
16892
+ cacheWrite: 0,
16893
+ },
16894
+ contextWindow: 1000000,
16895
+ maxTokens: 131072,
16896
+ },
16824
16897
  "glm-5v-turbo": {
16825
16898
  id: "glm-5v-turbo",
16826
16899
  name: "GLM-5V-Turbo",
@@ -16913,6 +16986,24 @@ export const MODELS = {
16913
16986
  contextWindow: 200000,
16914
16987
  maxTokens: 131072,
16915
16988
  },
16989
+ "glm-5.2": {
16990
+ id: "glm-5.2",
16991
+ name: "GLM-5.2",
16992
+ api: "openai-completions",
16993
+ provider: "zai-coding-cn",
16994
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16995
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16996
+ reasoning: true,
16997
+ input: ["text"],
16998
+ cost: {
16999
+ input: 0,
17000
+ output: 0,
17001
+ cacheRead: 0,
17002
+ cacheWrite: 0,
17003
+ },
17004
+ contextWindow: 1000000,
17005
+ maxTokens: 131072,
17006
+ },
16916
17007
  "glm-5v-turbo": {
16917
17008
  id: "glm-5v-turbo",
16918
17009
  name: "GLM-5V-Turbo",