@earendil-works/pi-ai 0.79.3 → 0.79.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (67) hide show
  1. package/README.md +19 -0
  2. package/dist/env-api-keys.d.ts +5 -5
  3. package/dist/env-api-keys.d.ts.map +1 -1
  4. package/dist/env-api-keys.js +21 -57
  5. package/dist/env-api-keys.js.map +1 -1
  6. package/dist/models.d.ts.map +1 -1
  7. package/dist/models.generated.d.ts +316 -52
  8. package/dist/models.generated.d.ts.map +1 -1
  9. package/dist/models.generated.js +317 -142
  10. package/dist/models.generated.js.map +1 -1
  11. package/dist/models.js +4 -1
  12. package/dist/models.js.map +1 -1
  13. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  14. package/dist/providers/amazon-bedrock.js +52 -34
  15. package/dist/providers/amazon-bedrock.js.map +1 -1
  16. package/dist/providers/anthropic.d.ts.map +1 -1
  17. package/dist/providers/anthropic.js +11 -9
  18. package/dist/providers/anthropic.js.map +1 -1
  19. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  20. package/dist/providers/azure-openai-responses.js +7 -4
  21. package/dist/providers/azure-openai-responses.js.map +1 -1
  22. package/dist/providers/cloudflare.d.ts +3 -3
  23. package/dist/providers/cloudflare.d.ts.map +1 -1
  24. package/dist/providers/cloudflare.js +4 -3
  25. package/dist/providers/cloudflare.js.map +1 -1
  26. package/dist/providers/google-vertex.d.ts.map +1 -1
  27. package/dist/providers/google-vertex.js +15 -5
  28. package/dist/providers/google-vertex.js.map +1 -1
  29. package/dist/providers/google.d.ts.map +1 -1
  30. package/dist/providers/google.js +2 -1
  31. package/dist/providers/google.js.map +1 -1
  32. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  33. package/dist/providers/openai-codex-responses.js +18 -17
  34. package/dist/providers/openai-codex-responses.js.map +1 -1
  35. package/dist/providers/openai-completions.d.ts.map +1 -1
  36. package/dist/providers/openai-completions.js +21 -8
  37. package/dist/providers/openai-completions.js.map +1 -1
  38. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  39. package/dist/providers/openai-responses-shared.js +2 -1
  40. package/dist/providers/openai-responses-shared.js.map +1 -1
  41. package/dist/providers/openai-responses.d.ts.map +1 -1
  42. package/dist/providers/openai-responses.js +8 -7
  43. package/dist/providers/openai-responses.js.map +1 -1
  44. package/dist/providers/simple-options.d.ts.map +1 -1
  45. package/dist/providers/simple-options.js +1 -0
  46. package/dist/providers/simple-options.js.map +1 -1
  47. package/dist/stream.d.ts.map +1 -1
  48. package/dist/stream.js +1 -1
  49. package/dist/stream.js.map +1 -1
  50. package/dist/types.d.ts +10 -0
  51. package/dist/types.d.ts.map +1 -1
  52. package/dist/types.js.map +1 -1
  53. package/dist/utils/node-http-proxy.d.ts +2 -8
  54. package/dist/utils/node-http-proxy.d.ts.map +1 -1
  55. package/dist/utils/node-http-proxy.js +17 -22
  56. package/dist/utils/node-http-proxy.js.map +1 -1
  57. package/dist/utils/oauth/anthropic.d.ts.map +1 -1
  58. package/dist/utils/oauth/anthropic.js +2 -1
  59. package/dist/utils/oauth/anthropic.js.map +1 -1
  60. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  61. package/dist/utils/oauth/openai-codex.js +2 -1
  62. package/dist/utils/oauth/openai-codex.js.map +1 -1
  63. package/dist/utils/provider-env.d.ts +7 -0
  64. package/dist/utils/provider-env.d.ts.map +1 -0
  65. package/dist/utils/provider-env.js +44 -0
  66. package/dist/utils/provider-env.js.map +1 -0
  67. package/package.json +1 -1
@@ -3810,6 +3810,24 @@ export const MODELS = {
3810
3810
  contextWindow: 131072,
3811
3811
  maxTokens: 131072,
3812
3812
  },
3813
+ "@cf/zai-org/glm-5.2": {
3814
+ id: "@cf/zai-org/glm-5.2",
3815
+ name: "Glm 5.2",
3816
+ api: "openai-completions",
3817
+ provider: "cloudflare-workers-ai",
3818
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3819
+ compat: { "sendSessionAffinityHeaders": true },
3820
+ reasoning: true,
3821
+ input: ["text"],
3822
+ cost: {
3823
+ input: 1.4,
3824
+ output: 4.4,
3825
+ cacheRead: 0.26,
3826
+ cacheWrite: 0,
3827
+ },
3828
+ contextWindow: 262144,
3829
+ maxTokens: 262144,
3830
+ },
3813
3831
  },
3814
3832
  "deepseek": {
3815
3833
  "deepseek-v4-flash": {
@@ -3918,7 +3936,7 @@ export const MODELS = {
3918
3936
  cost: {
3919
3937
  input: 0.15,
3920
3938
  output: 0.6,
3921
- cacheRead: 0.015,
3939
+ cacheRead: 0.01,
3922
3940
  cacheWrite: 0,
3923
3941
  },
3924
3942
  contextWindow: 131072,
@@ -4191,7 +4209,7 @@ export const MODELS = {
4191
4209
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4192
4210
  compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
4193
4211
  reasoning: true,
4194
- thinkingLevelMap: { "xhigh": "xhigh" },
4212
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
4195
4213
  input: ["text", "image"],
4196
4214
  cost: {
4197
4215
  input: 5,
@@ -4211,7 +4229,7 @@ export const MODELS = {
4211
4229
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4212
4230
  compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
4213
4231
  reasoning: true,
4214
- thinkingLevelMap: { "xhigh": "xhigh" },
4232
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
4215
4233
  input: ["text", "image"],
4216
4234
  cost: {
4217
4235
  input: 5,
@@ -4269,6 +4287,7 @@ export const MODELS = {
4269
4287
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4270
4288
  compat: { "forceAdaptiveThinking": true },
4271
4289
  reasoning: true,
4290
+ thinkingLevelMap: { "minimal": "low", "xhigh": "max" },
4272
4291
  input: ["text", "image"],
4273
4292
  cost: {
4274
4293
  input: 3,
@@ -4765,11 +4784,12 @@ export const MODELS = {
4765
4784
  provider: "google",
4766
4785
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4767
4786
  reasoning: true,
4787
+ thinkingLevelMap: { "off": null },
4768
4788
  input: ["text", "image"],
4769
4789
  cost: {
4770
- input: 0.3,
4771
- output: 2.5,
4772
- cacheRead: 0.075,
4790
+ input: 1.5,
4791
+ output: 9,
4792
+ cacheRead: 0.15,
4773
4793
  cacheWrite: 0,
4774
4794
  },
4775
4795
  contextWindow: 1048576,
@@ -4782,10 +4802,11 @@ export const MODELS = {
4782
4802
  provider: "google",
4783
4803
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4784
4804
  reasoning: true,
4805
+ thinkingLevelMap: { "off": null },
4785
4806
  input: ["text", "image"],
4786
4807
  cost: {
4787
- input: 0.1,
4788
- output: 0.4,
4808
+ input: 0.25,
4809
+ output: 1.5,
4789
4810
  cacheRead: 0.025,
4790
4811
  cacheWrite: 0,
4791
4812
  },
@@ -4828,96 +4849,47 @@ export const MODELS = {
4828
4849
  contextWindow: 262144,
4829
4850
  maxTokens: 32768,
4830
4851
  },
4831
- },
4832
- "google-vertex": {
4833
- "gemini-1.5-flash": {
4834
- id: "gemini-1.5-flash",
4835
- name: "Gemini 1.5 Flash (Vertex)",
4836
- api: "google-vertex",
4837
- provider: "google-vertex",
4838
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4839
- reasoning: false,
4840
- input: ["text", "image"],
4841
- cost: {
4842
- input: 0.075,
4843
- output: 0.3,
4844
- cacheRead: 0.01875,
4845
- cacheWrite: 0,
4846
- },
4847
- contextWindow: 1000000,
4848
- maxTokens: 8192,
4849
- },
4850
- "gemini-1.5-flash-8b": {
4851
- id: "gemini-1.5-flash-8b",
4852
- name: "Gemini 1.5 Flash-8B (Vertex)",
4853
- api: "google-vertex",
4854
- provider: "google-vertex",
4855
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4856
- reasoning: false,
4857
- input: ["text", "image"],
4858
- cost: {
4859
- input: 0.0375,
4860
- output: 0.15,
4861
- cacheRead: 0.01,
4862
- cacheWrite: 0,
4863
- },
4864
- contextWindow: 1000000,
4865
- maxTokens: 8192,
4866
- },
4867
- "gemini-1.5-pro": {
4868
- id: "gemini-1.5-pro",
4869
- name: "Gemini 1.5 Pro (Vertex)",
4870
- api: "google-vertex",
4871
- provider: "google-vertex",
4872
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4873
- reasoning: false,
4874
- input: ["text", "image"],
4875
- cost: {
4876
- input: 1.25,
4877
- output: 5,
4878
- cacheRead: 0.3125,
4879
- cacheWrite: 0,
4880
- },
4881
- contextWindow: 1000000,
4882
- maxTokens: 8192,
4883
- },
4884
- "gemini-2.0-flash": {
4885
- id: "gemini-2.0-flash",
4886
- name: "Gemini 2.0 Flash (Vertex)",
4887
- api: "google-vertex",
4888
- provider: "google-vertex",
4889
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4890
- reasoning: false,
4852
+ "gemma-4-E2B-it": {
4853
+ id: "gemma-4-E2B-it",
4854
+ name: "Gemma 4 E2B IT",
4855
+ api: "google-generative-ai",
4856
+ provider: "google",
4857
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4858
+ reasoning: true,
4859
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4891
4860
  input: ["text", "image"],
4892
4861
  cost: {
4893
- input: 0.15,
4894
- output: 0.6,
4895
- cacheRead: 0.0375,
4862
+ input: 0,
4863
+ output: 0,
4864
+ cacheRead: 0,
4896
4865
  cacheWrite: 0,
4897
4866
  },
4898
- contextWindow: 1048576,
4867
+ contextWindow: 131072,
4899
4868
  maxTokens: 8192,
4900
4869
  },
4901
- "gemini-2.0-flash-lite": {
4902
- id: "gemini-2.0-flash-lite",
4903
- name: "Gemini 2.0 Flash Lite (Vertex)",
4904
- api: "google-vertex",
4905
- provider: "google-vertex",
4906
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4870
+ "gemma-4-E4B-it": {
4871
+ id: "gemma-4-E4B-it",
4872
+ name: "Gemma 4 E4B IT",
4873
+ api: "google-generative-ai",
4874
+ provider: "google",
4875
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4907
4876
  reasoning: true,
4877
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4908
4878
  input: ["text", "image"],
4909
4879
  cost: {
4910
- input: 0.075,
4911
- output: 0.3,
4912
- cacheRead: 0.01875,
4880
+ input: 0,
4881
+ output: 0,
4882
+ cacheRead: 0,
4913
4883
  cacheWrite: 0,
4914
4884
  },
4915
- contextWindow: 1048576,
4916
- maxTokens: 65536,
4885
+ contextWindow: 131072,
4886
+ maxTokens: 8192,
4917
4887
  },
4888
+ },
4889
+ "google-vertex": {
4918
4890
  "gemini-2.5-flash": {
4919
4891
  id: "gemini-2.5-flash",
4920
- name: "Gemini 2.5 Flash (Vertex)",
4892
+ name: "Gemini 2.5 Flash",
4921
4893
  api: "google-vertex",
4922
4894
  provider: "google-vertex",
4923
4895
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -4934,24 +4906,7 @@ export const MODELS = {
4934
4906
  },
4935
4907
  "gemini-2.5-flash-lite": {
4936
4908
  id: "gemini-2.5-flash-lite",
4937
- name: "Gemini 2.5 Flash Lite (Vertex)",
4938
- api: "google-vertex",
4939
- provider: "google-vertex",
4940
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4941
- reasoning: true,
4942
- input: ["text", "image"],
4943
- cost: {
4944
- input: 0.1,
4945
- output: 0.4,
4946
- cacheRead: 0.01,
4947
- cacheWrite: 0,
4948
- },
4949
- contextWindow: 1048576,
4950
- maxTokens: 65536,
4951
- },
4952
- "gemini-2.5-flash-lite-preview-09-2025": {
4953
- id: "gemini-2.5-flash-lite-preview-09-2025",
4954
- name: "Gemini 2.5 Flash Lite Preview 09-25 (Vertex)",
4909
+ name: "Gemini 2.5 Flash-Lite",
4955
4910
  api: "google-vertex",
4956
4911
  provider: "google-vertex",
4957
4912
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -4968,7 +4923,7 @@ export const MODELS = {
4968
4923
  },
4969
4924
  "gemini-2.5-pro": {
4970
4925
  id: "gemini-2.5-pro",
4971
- name: "Gemini 2.5 Pro (Vertex)",
4926
+ name: "Gemini 2.5 Pro",
4972
4927
  api: "google-vertex",
4973
4928
  provider: "google-vertex",
4974
4929
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -4985,7 +4940,7 @@ export const MODELS = {
4985
4940
  },
4986
4941
  "gemini-3-flash-preview": {
4987
4942
  id: "gemini-3-flash-preview",
4988
- name: "Gemini 3 Flash Preview (Vertex)",
4943
+ name: "Gemini 3 Flash Preview",
4989
4944
  api: "google-vertex",
4990
4945
  provider: "google-vertex",
4991
4946
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5001,27 +4956,27 @@ export const MODELS = {
5001
4956
  contextWindow: 1048576,
5002
4957
  maxTokens: 65536,
5003
4958
  },
5004
- "gemini-3-pro-preview": {
5005
- id: "gemini-3-pro-preview",
5006
- name: "Gemini 3 Pro Preview (Vertex)",
4959
+ "gemini-3.1-flash-lite": {
4960
+ id: "gemini-3.1-flash-lite",
4961
+ name: "Gemini 3.1 Flash Lite",
5007
4962
  api: "google-vertex",
5008
4963
  provider: "google-vertex",
5009
4964
  baseUrl: "https://{location}-aiplatform.googleapis.com",
5010
4965
  reasoning: true,
5011
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4966
+ thinkingLevelMap: { "off": null },
5012
4967
  input: ["text", "image"],
5013
4968
  cost: {
5014
- input: 2,
5015
- output: 12,
5016
- cacheRead: 0.2,
4969
+ input: 0.25,
4970
+ output: 1.5,
4971
+ cacheRead: 0.025,
5017
4972
  cacheWrite: 0,
5018
4973
  },
5019
- contextWindow: 1000000,
5020
- maxTokens: 64000,
4974
+ contextWindow: 1048576,
4975
+ maxTokens: 65536,
5021
4976
  },
5022
4977
  "gemini-3.1-pro-preview": {
5023
4978
  id: "gemini-3.1-pro-preview",
5024
- name: "Gemini 3.1 Pro Preview (Vertex)",
4979
+ name: "Gemini 3.1 Pro Preview",
5025
4980
  api: "google-vertex",
5026
4981
  provider: "google-vertex",
5027
4982
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5039,7 +4994,7 @@ export const MODELS = {
5039
4994
  },
5040
4995
  "gemini-3.1-pro-preview-customtools": {
5041
4996
  id: "gemini-3.1-pro-preview-customtools",
5042
- name: "Gemini 3.1 Pro Preview Custom Tools (Vertex)",
4997
+ name: "Gemini 3.1 Pro Preview Custom Tools",
5043
4998
  api: "google-vertex",
5044
4999
  provider: "google-vertex",
5045
5000
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5055,6 +5010,60 @@ export const MODELS = {
5055
5010
  contextWindow: 1048576,
5056
5011
  maxTokens: 65536,
5057
5012
  },
5013
+ "gemini-3.5-flash": {
5014
+ id: "gemini-3.5-flash",
5015
+ name: "Gemini 3.5 Flash",
5016
+ api: "google-vertex",
5017
+ provider: "google-vertex",
5018
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5019
+ reasoning: true,
5020
+ thinkingLevelMap: { "off": null },
5021
+ input: ["text", "image"],
5022
+ cost: {
5023
+ input: 1.5,
5024
+ output: 9,
5025
+ cacheRead: 0.15,
5026
+ cacheWrite: 0,
5027
+ },
5028
+ contextWindow: 1048576,
5029
+ maxTokens: 65536,
5030
+ },
5031
+ "gemini-flash-latest": {
5032
+ id: "gemini-flash-latest",
5033
+ name: "Gemini Flash Latest",
5034
+ api: "google-vertex",
5035
+ provider: "google-vertex",
5036
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5037
+ reasoning: true,
5038
+ thinkingLevelMap: { "off": null },
5039
+ input: ["text", "image"],
5040
+ cost: {
5041
+ input: 1.5,
5042
+ output: 9,
5043
+ cacheRead: 0.15,
5044
+ cacheWrite: 0,
5045
+ },
5046
+ contextWindow: 1048576,
5047
+ maxTokens: 65536,
5048
+ },
5049
+ "gemini-flash-lite-latest": {
5050
+ id: "gemini-flash-lite-latest",
5051
+ name: "Gemini Flash-Lite Latest",
5052
+ api: "google-vertex",
5053
+ provider: "google-vertex",
5054
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5055
+ reasoning: true,
5056
+ thinkingLevelMap: { "off": null },
5057
+ input: ["text", "image"],
5058
+ cost: {
5059
+ input: 0.25,
5060
+ output: 1.5,
5061
+ cacheRead: 0.025,
5062
+ cacheWrite: 0,
5063
+ },
5064
+ contextWindow: 1048576,
5065
+ maxTokens: 65536,
5066
+ },
5058
5067
  },
5059
5068
  "groq": {
5060
5069
  "llama-3.1-8b-instant": {
@@ -6385,6 +6394,7 @@ export const MODELS = {
6385
6394
  baseUrl: "https://api.moonshot.ai/v1",
6386
6395
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6387
6396
  reasoning: true,
6397
+ thinkingLevelMap: { "off": null },
6388
6398
  input: ["text", "image"],
6389
6399
  cost: {
6390
6400
  input: 0.95,
@@ -6395,6 +6405,25 @@ export const MODELS = {
6395
6405
  contextWindow: 262144,
6396
6406
  maxTokens: 262144,
6397
6407
  },
6408
+ "kimi-k2.7-code-highspeed": {
6409
+ id: "kimi-k2.7-code-highspeed",
6410
+ name: "Kimi K2.7 Code HighSpeed",
6411
+ api: "openai-completions",
6412
+ provider: "moonshotai",
6413
+ baseUrl: "https://api.moonshot.ai/v1",
6414
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6415
+ reasoning: true,
6416
+ thinkingLevelMap: { "off": null },
6417
+ input: ["text", "image"],
6418
+ cost: {
6419
+ input: 1.9,
6420
+ output: 8,
6421
+ cacheRead: 0.38,
6422
+ cacheWrite: 0,
6423
+ },
6424
+ contextWindow: 262144,
6425
+ maxTokens: 262144,
6426
+ },
6398
6427
  },
6399
6428
  "moonshotai-cn": {
6400
6429
  "kimi-k2-0711-preview": {
@@ -6523,6 +6552,44 @@ export const MODELS = {
6523
6552
  contextWindow: 262144,
6524
6553
  maxTokens: 262144,
6525
6554
  },
6555
+ "kimi-k2.7-code": {
6556
+ id: "kimi-k2.7-code",
6557
+ name: "Kimi K2.7 Code",
6558
+ api: "openai-completions",
6559
+ provider: "moonshotai-cn",
6560
+ baseUrl: "https://api.moonshot.cn/v1",
6561
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6562
+ reasoning: true,
6563
+ thinkingLevelMap: { "off": null },
6564
+ input: ["text", "image"],
6565
+ cost: {
6566
+ input: 0.95,
6567
+ output: 4,
6568
+ cacheRead: 0.19,
6569
+ cacheWrite: 0,
6570
+ },
6571
+ contextWindow: 262144,
6572
+ maxTokens: 262144,
6573
+ },
6574
+ "kimi-k2.7-code-highspeed": {
6575
+ id: "kimi-k2.7-code-highspeed",
6576
+ name: "Kimi K2.7 Code HighSpeed",
6577
+ api: "openai-completions",
6578
+ provider: "moonshotai-cn",
6579
+ baseUrl: "https://api.moonshot.cn/v1",
6580
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6581
+ reasoning: true,
6582
+ thinkingLevelMap: { "off": null },
6583
+ input: ["text", "image"],
6584
+ cost: {
6585
+ input: 1.9,
6586
+ output: 8,
6587
+ cacheRead: 0.38,
6588
+ cacheWrite: 0,
6589
+ },
6590
+ contextWindow: 262144,
6591
+ maxTokens: 262144,
6592
+ },
6526
6593
  },
6527
6594
  "nvidia": {
6528
6595
  "meta/llama-3.1-70b-instruct": {
@@ -7886,7 +7953,7 @@ export const MODELS = {
7886
7953
  api: "openai-completions",
7887
7954
  provider: "opencode",
7888
7955
  baseUrl: "https://opencode.ai/zen/v1",
7889
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7956
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true },
7890
7957
  reasoning: true,
7891
7958
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7892
7959
  input: ["text"],
@@ -7905,7 +7972,7 @@ export const MODELS = {
7905
7972
  api: "openai-completions",
7906
7973
  provider: "opencode",
7907
7974
  baseUrl: "https://opencode.ai/zen/v1",
7908
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7975
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
7909
7976
  reasoning: true,
7910
7977
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7911
7978
  input: ["text"],
@@ -7924,7 +7991,7 @@ export const MODELS = {
7924
7991
  api: "openai-completions",
7925
7992
  provider: "opencode",
7926
7993
  baseUrl: "https://opencode.ai/zen/v1",
7927
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7994
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true },
7928
7995
  reasoning: true,
7929
7996
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7930
7997
  input: ["text"],
@@ -8340,7 +8407,7 @@ export const MODELS = {
8340
8407
  api: "openai-completions",
8341
8408
  provider: "opencode",
8342
8409
  baseUrl: "https://opencode.ai/zen/v1",
8343
- compat: { "maxTokensField": "max_tokens" },
8410
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8344
8411
  reasoning: true,
8345
8412
  input: ["text", "image"],
8346
8413
  cost: {
@@ -8358,7 +8425,7 @@ export const MODELS = {
8358
8425
  api: "openai-completions",
8359
8426
  provider: "opencode",
8360
8427
  baseUrl: "https://opencode.ai/zen/v1",
8361
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8428
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8362
8429
  reasoning: true,
8363
8430
  input: ["text", "image"],
8364
8431
  cost: {
@@ -8412,7 +8479,7 @@ export const MODELS = {
8412
8479
  api: "openai-completions",
8413
8480
  provider: "opencode",
8414
8481
  baseUrl: "https://opencode.ai/zen/v1",
8415
- compat: { "maxTokensField": "max_tokens" },
8482
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8416
8483
  reasoning: true,
8417
8484
  input: ["text"],
8418
8485
  cost: {
@@ -8502,7 +8569,7 @@ export const MODELS = {
8502
8569
  api: "openai-completions",
8503
8570
  provider: "opencode-go",
8504
8571
  baseUrl: "https://opencode.ai/zen/go/v1",
8505
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8572
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
8506
8573
  reasoning: true,
8507
8574
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8508
8575
  input: ["text"],
@@ -8521,7 +8588,7 @@ export const MODELS = {
8521
8588
  api: "openai-completions",
8522
8589
  provider: "opencode-go",
8523
8590
  baseUrl: "https://opencode.ai/zen/go/v1",
8524
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8591
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
8525
8592
  reasoning: true,
8526
8593
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8527
8594
  input: ["text"],
@@ -8576,7 +8643,7 @@ export const MODELS = {
8576
8643
  api: "openai-completions",
8577
8644
  provider: "opencode-go",
8578
8645
  baseUrl: "https://opencode.ai/zen/go/v1",
8579
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8646
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
8580
8647
  reasoning: true,
8581
8648
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8582
8649
  input: ["text", "image"],
@@ -10470,13 +10537,13 @@ export const MODELS = {
10470
10537
  reasoning: true,
10471
10538
  input: ["text", "image"],
10472
10539
  cost: {
10473
- input: 0.95,
10474
- output: 4,
10475
- cacheRead: 0.19,
10540
+ input: 0.75,
10541
+ output: 3.5,
10542
+ cacheRead: 0.16,
10476
10543
  cacheWrite: 0,
10477
10544
  },
10478
10545
  contextWindow: 262144,
10479
- maxTokens: 4096,
10546
+ maxTokens: 262144,
10480
10547
  },
10481
10548
  "nex-agi/nex-n2-pro:free": {
10482
10549
  id: "nex-agi/nex-n2-pro:free",
@@ -12273,7 +12340,7 @@ export const MODELS = {
12273
12340
  cacheWrite: 0,
12274
12341
  },
12275
12342
  contextWindow: 262144,
12276
- maxTokens: 262144,
12343
+ maxTokens: 81920,
12277
12344
  },
12278
12345
  "qwen/qwen3.5-397b-a17b": {
12279
12346
  id: "qwen/qwen3.5-397b-a17b",
@@ -12284,13 +12351,13 @@ export const MODELS = {
12284
12351
  reasoning: true,
12285
12352
  input: ["text", "image"],
12286
12353
  cost: {
12287
- input: 0.39,
12288
- output: 2.34,
12354
+ input: 0.385,
12355
+ output: 2.45,
12289
12356
  cacheRead: 0,
12290
12357
  cacheWrite: 0,
12291
12358
  },
12292
- contextWindow: 262144,
12293
- maxTokens: 65536,
12359
+ contextWindow: 256000,
12360
+ maxTokens: 4096,
12294
12361
  },
12295
12362
  "qwen/qwen3.5-9b": {
12296
12363
  id: "qwen/qwen3.5-9b",
@@ -12573,13 +12640,13 @@ export const MODELS = {
12573
12640
  reasoning: true,
12574
12641
  input: ["text"],
12575
12642
  cost: {
12576
- input: 0.063,
12577
- output: 0.21,
12578
- cacheRead: 0.021,
12643
+ input: 0.066,
12644
+ output: 0.26,
12645
+ cacheRead: 0.029,
12579
12646
  cacheWrite: 0,
12580
12647
  },
12581
12648
  contextWindow: 262144,
12582
- maxTokens: 4096,
12649
+ maxTokens: 262144,
12583
12650
  },
12584
12651
  "thedrummer/rocinante-12b": {
12585
12652
  id: "thedrummer/rocinante-12b",
@@ -12760,13 +12827,13 @@ export const MODELS = {
12760
12827
  reasoning: true,
12761
12828
  input: ["text"],
12762
12829
  cost: {
12763
- input: 0.125,
12830
+ input: 0.13,
12764
12831
  output: 0.85,
12765
- cacheRead: 0.06,
12832
+ cacheRead: 0.025,
12766
12833
  cacheWrite: 0,
12767
12834
  },
12768
12835
  contextWindow: 131072,
12769
- maxTokens: 131070,
12836
+ maxTokens: 98304,
12770
12837
  },
12771
12838
  "z-ai/glm-4.5v": {
12772
12839
  id: "z-ai/glm-4.5v",
@@ -12904,6 +12971,23 @@ export const MODELS = {
12904
12971
  contextWindow: 202752,
12905
12972
  maxTokens: 4096,
12906
12973
  },
12974
+ "z-ai/glm-5.2": {
12975
+ id: "z-ai/glm-5.2",
12976
+ name: "Z.ai: GLM 5.2",
12977
+ api: "openai-completions",
12978
+ provider: "openrouter",
12979
+ baseUrl: "https://openrouter.ai/api/v1",
12980
+ reasoning: true,
12981
+ input: ["text"],
12982
+ cost: {
12983
+ input: 1.4,
12984
+ output: 4.4,
12985
+ cacheRead: 0.26,
12986
+ cacheWrite: 0,
12987
+ },
12988
+ contextWindow: 1048576,
12989
+ maxTokens: 131072,
12990
+ },
12907
12991
  "~anthropic/claude-fable-latest": {
12908
12992
  id: "~anthropic/claude-fable-latest",
12909
12993
  name: "Anthropic: Claude Fable Latest",
@@ -13200,8 +13284,8 @@ export const MODELS = {
13200
13284
  reasoning: false,
13201
13285
  input: ["text"],
13202
13286
  cost: {
13203
- input: 2.5,
13204
- output: 7.5,
13287
+ input: 1.25,
13288
+ output: 3.75,
13205
13289
  cacheRead: 0,
13206
13290
  cacheWrite: 0,
13207
13291
  },
@@ -13301,6 +13385,25 @@ export const MODELS = {
13301
13385
  contextWindow: 262144,
13302
13386
  maxTokens: 131000,
13303
13387
  },
13388
+ "moonshotai/Kimi-K2.7-Code": {
13389
+ id: "moonshotai/Kimi-K2.7-Code",
13390
+ name: "Kimi K2.7 Code",
13391
+ api: "openai-completions",
13392
+ provider: "together",
13393
+ baseUrl: "https://api.together.ai/v1",
13394
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13395
+ reasoning: true,
13396
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13397
+ input: ["text"],
13398
+ cost: {
13399
+ input: 0.95,
13400
+ output: 4,
13401
+ cacheRead: 0.19,
13402
+ cacheWrite: 0,
13403
+ },
13404
+ contextWindow: 262144,
13405
+ maxTokens: 131072,
13406
+ },
13304
13407
  "nvidia/nemotron-3-ultra-550b-a55b": {
13305
13408
  id: "nvidia/nemotron-3-ultra-550b-a55b",
13306
13409
  name: "Nemotron 3 Ultra 550B A55B",
@@ -14986,6 +15089,23 @@ export const MODELS = {
14986
15089
  contextWindow: 256000,
14987
15090
  maxTokens: 32768,
14988
15091
  },
15092
+ "moonshotai/kimi-k2.7-code-highspeed": {
15093
+ id: "moonshotai/kimi-k2.7-code-highspeed",
15094
+ name: "Kimi K2.7 Code High Speed",
15095
+ api: "anthropic-messages",
15096
+ provider: "vercel-ai-gateway",
15097
+ baseUrl: "https://ai-gateway.vercel.sh",
15098
+ reasoning: true,
15099
+ input: ["text", "image"],
15100
+ cost: {
15101
+ input: 1.9,
15102
+ output: 8,
15103
+ cacheRead: 0.38,
15104
+ cacheWrite: 0,
15105
+ },
15106
+ contextWindow: 262144,
15107
+ maxTokens: 4096,
15108
+ },
14989
15109
  "nvidia/nemotron-3-super-120b-a12b": {
14990
15110
  id: "nvidia/nemotron-3-super-120b-a12b",
14991
15111
  name: "NVIDIA Nemotron 3 Super 120B A12B",
@@ -16222,6 +16342,23 @@ export const MODELS = {
16222
16342
  contextWindow: 202800,
16223
16343
  maxTokens: 64000,
16224
16344
  },
16345
+ "zai/glm-5.2": {
16346
+ id: "zai/glm-5.2",
16347
+ name: "GLM 5.2",
16348
+ api: "anthropic-messages",
16349
+ provider: "vercel-ai-gateway",
16350
+ baseUrl: "https://ai-gateway.vercel.sh",
16351
+ reasoning: true,
16352
+ input: ["text"],
16353
+ cost: {
16354
+ input: 1.4,
16355
+ output: 4.4,
16356
+ cacheRead: 0.26,
16357
+ cacheWrite: 0,
16358
+ },
16359
+ contextWindow: 1000000,
16360
+ maxTokens: 128000,
16361
+ },
16225
16362
  "zai/glm-5v-turbo": {
16226
16363
  id: "zai/glm-5v-turbo",
16227
16364
  name: "GLM 5V Turbo",
@@ -16820,6 +16957,25 @@ export const MODELS = {
16820
16957
  contextWindow: 200000,
16821
16958
  maxTokens: 131072,
16822
16959
  },
16960
+ "glm-5.2": {
16961
+ id: "glm-5.2",
16962
+ name: "GLM-5.2",
16963
+ api: "openai-completions",
16964
+ provider: "zai",
16965
+ baseUrl: "https://api.z.ai/api/coding/paas/v4",
16966
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "supportsReasoningEffort": true, "zaiToolStream": true },
16967
+ reasoning: true,
16968
+ thinkingLevelMap: { "minimal": null, "low": "high", "medium": "high", "high": "high", "xhigh": "max" },
16969
+ input: ["text"],
16970
+ cost: {
16971
+ input: 0,
16972
+ output: 0,
16973
+ cacheRead: 0,
16974
+ cacheWrite: 0,
16975
+ },
16976
+ contextWindow: 1000000,
16977
+ maxTokens: 131072,
16978
+ },
16823
16979
  "glm-5v-turbo": {
16824
16980
  id: "glm-5v-turbo",
16825
16981
  name: "GLM-5V-Turbo",
@@ -16912,6 +17068,25 @@ export const MODELS = {
16912
17068
  contextWindow: 200000,
16913
17069
  maxTokens: 131072,
16914
17070
  },
17071
+ "glm-5.2": {
17072
+ id: "glm-5.2",
17073
+ name: "GLM-5.2",
17074
+ api: "openai-completions",
17075
+ provider: "zai-coding-cn",
17076
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
17077
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "supportsReasoningEffort": true, "zaiToolStream": true },
17078
+ reasoning: true,
17079
+ thinkingLevelMap: { "minimal": null, "low": "high", "medium": "high", "high": "high", "xhigh": "max" },
17080
+ input: ["text"],
17081
+ cost: {
17082
+ input: 0,
17083
+ output: 0,
17084
+ cacheRead: 0,
17085
+ cacheWrite: 0,
17086
+ },
17087
+ contextWindow: 1000000,
17088
+ maxTokens: 131072,
17089
+ },
16915
17090
  "glm-5v-turbo": {
16916
17091
  id: "glm-5v-turbo",
16917
17092
  name: "GLM-5V-Turbo",