@earendil-works/pi-ai 0.79.4 → 0.79.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (64) hide show
  1. package/README.md +19 -0
  2. package/dist/env-api-keys.d.ts +5 -5
  3. package/dist/env-api-keys.d.ts.map +1 -1
  4. package/dist/env-api-keys.js +21 -57
  5. package/dist/env-api-keys.js.map +1 -1
  6. package/dist/models.generated.d.ts +208 -79
  7. package/dist/models.generated.d.ts.map +1 -1
  8. package/dist/models.generated.js +230 -147
  9. package/dist/models.generated.js.map +1 -1
  10. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  11. package/dist/providers/amazon-bedrock.js +52 -34
  12. package/dist/providers/amazon-bedrock.js.map +1 -1
  13. package/dist/providers/anthropic.d.ts.map +1 -1
  14. package/dist/providers/anthropic.js +10 -9
  15. package/dist/providers/anthropic.js.map +1 -1
  16. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  17. package/dist/providers/azure-openai-responses.js +7 -4
  18. package/dist/providers/azure-openai-responses.js.map +1 -1
  19. package/dist/providers/cloudflare.d.ts +3 -3
  20. package/dist/providers/cloudflare.d.ts.map +1 -1
  21. package/dist/providers/cloudflare.js +4 -3
  22. package/dist/providers/cloudflare.js.map +1 -1
  23. package/dist/providers/google-vertex.d.ts.map +1 -1
  24. package/dist/providers/google-vertex.js +15 -5
  25. package/dist/providers/google-vertex.js.map +1 -1
  26. package/dist/providers/google.d.ts.map +1 -1
  27. package/dist/providers/google.js +2 -1
  28. package/dist/providers/google.js.map +1 -1
  29. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  30. package/dist/providers/openai-codex-responses.js +18 -17
  31. package/dist/providers/openai-codex-responses.js.map +1 -1
  32. package/dist/providers/openai-completions.d.ts.map +1 -1
  33. package/dist/providers/openai-completions.js +21 -8
  34. package/dist/providers/openai-completions.js.map +1 -1
  35. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  36. package/dist/providers/openai-responses-shared.js +2 -1
  37. package/dist/providers/openai-responses-shared.js.map +1 -1
  38. package/dist/providers/openai-responses.d.ts.map +1 -1
  39. package/dist/providers/openai-responses.js +8 -7
  40. package/dist/providers/openai-responses.js.map +1 -1
  41. package/dist/providers/simple-options.d.ts.map +1 -1
  42. package/dist/providers/simple-options.js +1 -0
  43. package/dist/providers/simple-options.js.map +1 -1
  44. package/dist/stream.d.ts.map +1 -1
  45. package/dist/stream.js +1 -1
  46. package/dist/stream.js.map +1 -1
  47. package/dist/types.d.ts +8 -0
  48. package/dist/types.d.ts.map +1 -1
  49. package/dist/types.js.map +1 -1
  50. package/dist/utils/node-http-proxy.d.ts +2 -8
  51. package/dist/utils/node-http-proxy.d.ts.map +1 -1
  52. package/dist/utils/node-http-proxy.js +17 -22
  53. package/dist/utils/node-http-proxy.js.map +1 -1
  54. package/dist/utils/oauth/anthropic.d.ts.map +1 -1
  55. package/dist/utils/oauth/anthropic.js +2 -1
  56. package/dist/utils/oauth/anthropic.js.map +1 -1
  57. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  58. package/dist/utils/oauth/openai-codex.js +2 -1
  59. package/dist/utils/oauth/openai-codex.js.map +1 -1
  60. package/dist/utils/provider-env.d.ts +7 -0
  61. package/dist/utils/provider-env.d.ts.map +1 -0
  62. package/dist/utils/provider-env.js +44 -0
  63. package/dist/utils/provider-env.js.map +1 -0
  64. package/package.json +1 -1
@@ -3810,6 +3810,24 @@ export const MODELS = {
3810
3810
  contextWindow: 131072,
3811
3811
  maxTokens: 131072,
3812
3812
  },
3813
+ "@cf/zai-org/glm-5.2": {
3814
+ id: "@cf/zai-org/glm-5.2",
3815
+ name: "Glm 5.2",
3816
+ api: "openai-completions",
3817
+ provider: "cloudflare-workers-ai",
3818
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3819
+ compat: { "sendSessionAffinityHeaders": true },
3820
+ reasoning: true,
3821
+ input: ["text"],
3822
+ cost: {
3823
+ input: 1.4,
3824
+ output: 4.4,
3825
+ cacheRead: 0.26,
3826
+ cacheWrite: 0,
3827
+ },
3828
+ contextWindow: 262144,
3829
+ maxTokens: 262144,
3830
+ },
3813
3831
  },
3814
3832
  "deepseek": {
3815
3833
  "deepseek-v4-flash": {
@@ -3918,7 +3936,7 @@ export const MODELS = {
3918
3936
  cost: {
3919
3937
  input: 0.15,
3920
3938
  output: 0.6,
3921
- cacheRead: 0.015,
3939
+ cacheRead: 0.01,
3922
3940
  cacheWrite: 0,
3923
3941
  },
3924
3942
  contextWindow: 131072,
@@ -4766,11 +4784,12 @@ export const MODELS = {
4766
4784
  provider: "google",
4767
4785
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4768
4786
  reasoning: true,
4787
+ thinkingLevelMap: { "off": null },
4769
4788
  input: ["text", "image"],
4770
4789
  cost: {
4771
- input: 0.3,
4772
- output: 2.5,
4773
- cacheRead: 0.075,
4790
+ input: 1.5,
4791
+ output: 9,
4792
+ cacheRead: 0.15,
4774
4793
  cacheWrite: 0,
4775
4794
  },
4776
4795
  contextWindow: 1048576,
@@ -4783,10 +4802,11 @@ export const MODELS = {
4783
4802
  provider: "google",
4784
4803
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4785
4804
  reasoning: true,
4805
+ thinkingLevelMap: { "off": null },
4786
4806
  input: ["text", "image"],
4787
4807
  cost: {
4788
- input: 0.1,
4789
- output: 0.4,
4808
+ input: 0.25,
4809
+ output: 1.5,
4790
4810
  cacheRead: 0.025,
4791
4811
  cacheWrite: 0,
4792
4812
  },
@@ -4867,94 +4887,9 @@ export const MODELS = {
4867
4887
  },
4868
4888
  },
4869
4889
  "google-vertex": {
4870
- "gemini-1.5-flash": {
4871
- id: "gemini-1.5-flash",
4872
- name: "Gemini 1.5 Flash (Vertex)",
4873
- api: "google-vertex",
4874
- provider: "google-vertex",
4875
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4876
- reasoning: false,
4877
- input: ["text", "image"],
4878
- cost: {
4879
- input: 0.075,
4880
- output: 0.3,
4881
- cacheRead: 0.01875,
4882
- cacheWrite: 0,
4883
- },
4884
- contextWindow: 1000000,
4885
- maxTokens: 8192,
4886
- },
4887
- "gemini-1.5-flash-8b": {
4888
- id: "gemini-1.5-flash-8b",
4889
- name: "Gemini 1.5 Flash-8B (Vertex)",
4890
- api: "google-vertex",
4891
- provider: "google-vertex",
4892
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4893
- reasoning: false,
4894
- input: ["text", "image"],
4895
- cost: {
4896
- input: 0.0375,
4897
- output: 0.15,
4898
- cacheRead: 0.01,
4899
- cacheWrite: 0,
4900
- },
4901
- contextWindow: 1000000,
4902
- maxTokens: 8192,
4903
- },
4904
- "gemini-1.5-pro": {
4905
- id: "gemini-1.5-pro",
4906
- name: "Gemini 1.5 Pro (Vertex)",
4907
- api: "google-vertex",
4908
- provider: "google-vertex",
4909
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4910
- reasoning: false,
4911
- input: ["text", "image"],
4912
- cost: {
4913
- input: 1.25,
4914
- output: 5,
4915
- cacheRead: 0.3125,
4916
- cacheWrite: 0,
4917
- },
4918
- contextWindow: 1000000,
4919
- maxTokens: 8192,
4920
- },
4921
- "gemini-2.0-flash": {
4922
- id: "gemini-2.0-flash",
4923
- name: "Gemini 2.0 Flash (Vertex)",
4924
- api: "google-vertex",
4925
- provider: "google-vertex",
4926
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4927
- reasoning: false,
4928
- input: ["text", "image"],
4929
- cost: {
4930
- input: 0.15,
4931
- output: 0.6,
4932
- cacheRead: 0.0375,
4933
- cacheWrite: 0,
4934
- },
4935
- contextWindow: 1048576,
4936
- maxTokens: 8192,
4937
- },
4938
- "gemini-2.0-flash-lite": {
4939
- id: "gemini-2.0-flash-lite",
4940
- name: "Gemini 2.0 Flash Lite (Vertex)",
4941
- api: "google-vertex",
4942
- provider: "google-vertex",
4943
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4944
- reasoning: true,
4945
- input: ["text", "image"],
4946
- cost: {
4947
- input: 0.075,
4948
- output: 0.3,
4949
- cacheRead: 0.01875,
4950
- cacheWrite: 0,
4951
- },
4952
- contextWindow: 1048576,
4953
- maxTokens: 65536,
4954
- },
4955
4890
  "gemini-2.5-flash": {
4956
4891
  id: "gemini-2.5-flash",
4957
- name: "Gemini 2.5 Flash (Vertex)",
4892
+ name: "Gemini 2.5 Flash",
4958
4893
  api: "google-vertex",
4959
4894
  provider: "google-vertex",
4960
4895
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -4971,24 +4906,7 @@ export const MODELS = {
4971
4906
  },
4972
4907
  "gemini-2.5-flash-lite": {
4973
4908
  id: "gemini-2.5-flash-lite",
4974
- name: "Gemini 2.5 Flash Lite (Vertex)",
4975
- api: "google-vertex",
4976
- provider: "google-vertex",
4977
- baseUrl: "https://{location}-aiplatform.googleapis.com",
4978
- reasoning: true,
4979
- input: ["text", "image"],
4980
- cost: {
4981
- input: 0.1,
4982
- output: 0.4,
4983
- cacheRead: 0.01,
4984
- cacheWrite: 0,
4985
- },
4986
- contextWindow: 1048576,
4987
- maxTokens: 65536,
4988
- },
4989
- "gemini-2.5-flash-lite-preview-09-2025": {
4990
- id: "gemini-2.5-flash-lite-preview-09-2025",
4991
- name: "Gemini 2.5 Flash Lite Preview 09-25 (Vertex)",
4909
+ name: "Gemini 2.5 Flash-Lite",
4992
4910
  api: "google-vertex",
4993
4911
  provider: "google-vertex",
4994
4912
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5005,7 +4923,7 @@ export const MODELS = {
5005
4923
  },
5006
4924
  "gemini-2.5-pro": {
5007
4925
  id: "gemini-2.5-pro",
5008
- name: "Gemini 2.5 Pro (Vertex)",
4926
+ name: "Gemini 2.5 Pro",
5009
4927
  api: "google-vertex",
5010
4928
  provider: "google-vertex",
5011
4929
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5022,7 +4940,7 @@ export const MODELS = {
5022
4940
  },
5023
4941
  "gemini-3-flash-preview": {
5024
4942
  id: "gemini-3-flash-preview",
5025
- name: "Gemini 3 Flash Preview (Vertex)",
4943
+ name: "Gemini 3 Flash Preview",
5026
4944
  api: "google-vertex",
5027
4945
  provider: "google-vertex",
5028
4946
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5038,27 +4956,27 @@ export const MODELS = {
5038
4956
  contextWindow: 1048576,
5039
4957
  maxTokens: 65536,
5040
4958
  },
5041
- "gemini-3-pro-preview": {
5042
- id: "gemini-3-pro-preview",
5043
- name: "Gemini 3 Pro Preview (Vertex)",
4959
+ "gemini-3.1-flash-lite": {
4960
+ id: "gemini-3.1-flash-lite",
4961
+ name: "Gemini 3.1 Flash Lite",
5044
4962
  api: "google-vertex",
5045
4963
  provider: "google-vertex",
5046
4964
  baseUrl: "https://{location}-aiplatform.googleapis.com",
5047
4965
  reasoning: true,
5048
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4966
+ thinkingLevelMap: { "off": null },
5049
4967
  input: ["text", "image"],
5050
4968
  cost: {
5051
- input: 2,
5052
- output: 12,
5053
- cacheRead: 0.2,
4969
+ input: 0.25,
4970
+ output: 1.5,
4971
+ cacheRead: 0.025,
5054
4972
  cacheWrite: 0,
5055
4973
  },
5056
- contextWindow: 1000000,
5057
- maxTokens: 64000,
4974
+ contextWindow: 1048576,
4975
+ maxTokens: 65536,
5058
4976
  },
5059
4977
  "gemini-3.1-pro-preview": {
5060
4978
  id: "gemini-3.1-pro-preview",
5061
- name: "Gemini 3.1 Pro Preview (Vertex)",
4979
+ name: "Gemini 3.1 Pro Preview",
5062
4980
  api: "google-vertex",
5063
4981
  provider: "google-vertex",
5064
4982
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5076,7 +4994,7 @@ export const MODELS = {
5076
4994
  },
5077
4995
  "gemini-3.1-pro-preview-customtools": {
5078
4996
  id: "gemini-3.1-pro-preview-customtools",
5079
- name: "Gemini 3.1 Pro Preview Custom Tools (Vertex)",
4997
+ name: "Gemini 3.1 Pro Preview Custom Tools",
5080
4998
  api: "google-vertex",
5081
4999
  provider: "google-vertex",
5082
5000
  baseUrl: "https://{location}-aiplatform.googleapis.com",
@@ -5092,6 +5010,60 @@ export const MODELS = {
5092
5010
  contextWindow: 1048576,
5093
5011
  maxTokens: 65536,
5094
5012
  },
5013
+ "gemini-3.5-flash": {
5014
+ id: "gemini-3.5-flash",
5015
+ name: "Gemini 3.5 Flash",
5016
+ api: "google-vertex",
5017
+ provider: "google-vertex",
5018
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5019
+ reasoning: true,
5020
+ thinkingLevelMap: { "off": null },
5021
+ input: ["text", "image"],
5022
+ cost: {
5023
+ input: 1.5,
5024
+ output: 9,
5025
+ cacheRead: 0.15,
5026
+ cacheWrite: 0,
5027
+ },
5028
+ contextWindow: 1048576,
5029
+ maxTokens: 65536,
5030
+ },
5031
+ "gemini-flash-latest": {
5032
+ id: "gemini-flash-latest",
5033
+ name: "Gemini Flash Latest",
5034
+ api: "google-vertex",
5035
+ provider: "google-vertex",
5036
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5037
+ reasoning: true,
5038
+ thinkingLevelMap: { "off": null },
5039
+ input: ["text", "image"],
5040
+ cost: {
5041
+ input: 1.5,
5042
+ output: 9,
5043
+ cacheRead: 0.15,
5044
+ cacheWrite: 0,
5045
+ },
5046
+ contextWindow: 1048576,
5047
+ maxTokens: 65536,
5048
+ },
5049
+ "gemini-flash-lite-latest": {
5050
+ id: "gemini-flash-lite-latest",
5051
+ name: "Gemini Flash-Lite Latest",
5052
+ api: "google-vertex",
5053
+ provider: "google-vertex",
5054
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
5055
+ reasoning: true,
5056
+ thinkingLevelMap: { "off": null },
5057
+ input: ["text", "image"],
5058
+ cost: {
5059
+ input: 0.25,
5060
+ output: 1.5,
5061
+ cacheRead: 0.025,
5062
+ cacheWrite: 0,
5063
+ },
5064
+ contextWindow: 1048576,
5065
+ maxTokens: 65536,
5066
+ },
5095
5067
  },
5096
5068
  "groq": {
5097
5069
  "llama-3.1-8b-instant": {
@@ -6422,6 +6394,7 @@ export const MODELS = {
6422
6394
  baseUrl: "https://api.moonshot.ai/v1",
6423
6395
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6424
6396
  reasoning: true,
6397
+ thinkingLevelMap: { "off": null },
6425
6398
  input: ["text", "image"],
6426
6399
  cost: {
6427
6400
  input: 0.95,
@@ -6432,6 +6405,25 @@ export const MODELS = {
6432
6405
  contextWindow: 262144,
6433
6406
  maxTokens: 262144,
6434
6407
  },
6408
+ "kimi-k2.7-code-highspeed": {
6409
+ id: "kimi-k2.7-code-highspeed",
6410
+ name: "Kimi K2.7 Code HighSpeed",
6411
+ api: "openai-completions",
6412
+ provider: "moonshotai",
6413
+ baseUrl: "https://api.moonshot.ai/v1",
6414
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6415
+ reasoning: true,
6416
+ thinkingLevelMap: { "off": null },
6417
+ input: ["text", "image"],
6418
+ cost: {
6419
+ input: 1.9,
6420
+ output: 8,
6421
+ cacheRead: 0.38,
6422
+ cacheWrite: 0,
6423
+ },
6424
+ contextWindow: 262144,
6425
+ maxTokens: 262144,
6426
+ },
6435
6427
  },
6436
6428
  "moonshotai-cn": {
6437
6429
  "kimi-k2-0711-preview": {
@@ -6560,6 +6552,44 @@ export const MODELS = {
6560
6552
  contextWindow: 262144,
6561
6553
  maxTokens: 262144,
6562
6554
  },
6555
+ "kimi-k2.7-code": {
6556
+ id: "kimi-k2.7-code",
6557
+ name: "Kimi K2.7 Code",
6558
+ api: "openai-completions",
6559
+ provider: "moonshotai-cn",
6560
+ baseUrl: "https://api.moonshot.cn/v1",
6561
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6562
+ reasoning: true,
6563
+ thinkingLevelMap: { "off": null },
6564
+ input: ["text", "image"],
6565
+ cost: {
6566
+ input: 0.95,
6567
+ output: 4,
6568
+ cacheRead: 0.19,
6569
+ cacheWrite: 0,
6570
+ },
6571
+ contextWindow: 262144,
6572
+ maxTokens: 262144,
6573
+ },
6574
+ "kimi-k2.7-code-highspeed": {
6575
+ id: "kimi-k2.7-code-highspeed",
6576
+ name: "Kimi K2.7 Code HighSpeed",
6577
+ api: "openai-completions",
6578
+ provider: "moonshotai-cn",
6579
+ baseUrl: "https://api.moonshot.cn/v1",
6580
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6581
+ reasoning: true,
6582
+ thinkingLevelMap: { "off": null },
6583
+ input: ["text", "image"],
6584
+ cost: {
6585
+ input: 1.9,
6586
+ output: 8,
6587
+ cacheRead: 0.38,
6588
+ cacheWrite: 0,
6589
+ },
6590
+ contextWindow: 262144,
6591
+ maxTokens: 262144,
6592
+ },
6563
6593
  },
6564
6594
  "nvidia": {
6565
6595
  "meta/llama-3.1-70b-instruct": {
@@ -7923,7 +7953,7 @@ export const MODELS = {
7923
7953
  api: "openai-completions",
7924
7954
  provider: "opencode",
7925
7955
  baseUrl: "https://opencode.ai/zen/v1",
7926
- compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7956
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true },
7927
7957
  reasoning: true,
7928
7958
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7929
7959
  input: ["text"],
@@ -7942,7 +7972,7 @@ export const MODELS = {
7942
7972
  api: "openai-completions",
7943
7973
  provider: "opencode",
7944
7974
  baseUrl: "https://opencode.ai/zen/v1",
7945
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7975
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
7946
7976
  reasoning: true,
7947
7977
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7948
7978
  input: ["text"],
@@ -7961,7 +7991,7 @@ export const MODELS = {
7961
7991
  api: "openai-completions",
7962
7992
  provider: "opencode",
7963
7993
  baseUrl: "https://opencode.ai/zen/v1",
7964
- compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7994
+ compat: { "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "requiresReasoningContentOnAssistantMessages": true },
7965
7995
  reasoning: true,
7966
7996
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7967
7997
  input: ["text"],
@@ -8539,7 +8569,7 @@ export const MODELS = {
8539
8569
  api: "openai-completions",
8540
8570
  provider: "opencode-go",
8541
8571
  baseUrl: "https://opencode.ai/zen/go/v1",
8542
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8572
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
8543
8573
  reasoning: true,
8544
8574
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8545
8575
  input: ["text"],
@@ -8558,7 +8588,7 @@ export const MODELS = {
8558
8588
  api: "openai-completions",
8559
8589
  provider: "opencode-go",
8560
8590
  baseUrl: "https://opencode.ai/zen/go/v1",
8561
- compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8591
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true },
8562
8592
  reasoning: true,
8563
8593
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8564
8594
  input: ["text"],
@@ -9466,13 +9496,13 @@ export const MODELS = {
9466
9496
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
9467
9497
  input: ["text"],
9468
9498
  cost: {
9469
- input: 0.09,
9470
- output: 0.18,
9499
+ input: 0.098,
9500
+ output: 0.196,
9471
9501
  cacheRead: 0.02,
9472
9502
  cacheWrite: 0,
9473
9503
  },
9474
9504
  contextWindow: 1048576,
9475
- maxTokens: 65536,
9505
+ maxTokens: 4096,
9476
9506
  },
9477
9507
  "deepseek/deepseek-v4-pro": {
9478
9508
  id: "deepseek/deepseek-v4-pro",
@@ -12310,7 +12340,7 @@ export const MODELS = {
12310
12340
  cacheWrite: 0,
12311
12341
  },
12312
12342
  contextWindow: 262144,
12313
- maxTokens: 262144,
12343
+ maxTokens: 81920,
12314
12344
  },
12315
12345
  "qwen/qwen3.5-397b-a17b": {
12316
12346
  id: "qwen/qwen3.5-397b-a17b",
@@ -12321,13 +12351,13 @@ export const MODELS = {
12321
12351
  reasoning: true,
12322
12352
  input: ["text", "image"],
12323
12353
  cost: {
12324
- input: 0.39,
12325
- output: 2.34,
12354
+ input: 0.385,
12355
+ output: 2.45,
12326
12356
  cacheRead: 0,
12327
12357
  cacheWrite: 0,
12328
12358
  },
12329
- contextWindow: 262144,
12330
- maxTokens: 65536,
12359
+ contextWindow: 256000,
12360
+ maxTokens: 4096,
12331
12361
  },
12332
12362
  "qwen/qwen3.5-9b": {
12333
12363
  id: "qwen/qwen3.5-9b",
@@ -12610,13 +12640,13 @@ export const MODELS = {
12610
12640
  reasoning: true,
12611
12641
  input: ["text"],
12612
12642
  cost: {
12613
- input: 0.063,
12614
- output: 0.21,
12615
- cacheRead: 0.021,
12643
+ input: 0.066,
12644
+ output: 0.26,
12645
+ cacheRead: 0.029,
12616
12646
  cacheWrite: 0,
12617
12647
  },
12618
12648
  contextWindow: 262144,
12619
- maxTokens: 4096,
12649
+ maxTokens: 262144,
12620
12650
  },
12621
12651
  "thedrummer/rocinante-12b": {
12622
12652
  id: "thedrummer/rocinante-12b",
@@ -12797,13 +12827,13 @@ export const MODELS = {
12797
12827
  reasoning: true,
12798
12828
  input: ["text"],
12799
12829
  cost: {
12800
- input: 0.125,
12830
+ input: 0.13,
12801
12831
  output: 0.85,
12802
- cacheRead: 0.06,
12832
+ cacheRead: 0.025,
12803
12833
  cacheWrite: 0,
12804
12834
  },
12805
12835
  contextWindow: 131072,
12806
- maxTokens: 131070,
12836
+ maxTokens: 98304,
12807
12837
  },
12808
12838
  "z-ai/glm-4.5v": {
12809
12839
  id: "z-ai/glm-4.5v",
@@ -12941,6 +12971,23 @@ export const MODELS = {
12941
12971
  contextWindow: 202752,
12942
12972
  maxTokens: 4096,
12943
12973
  },
12974
+ "z-ai/glm-5.2": {
12975
+ id: "z-ai/glm-5.2",
12976
+ name: "Z.ai: GLM 5.2",
12977
+ api: "openai-completions",
12978
+ provider: "openrouter",
12979
+ baseUrl: "https://openrouter.ai/api/v1",
12980
+ reasoning: true,
12981
+ input: ["text"],
12982
+ cost: {
12983
+ input: 1.4,
12984
+ output: 4.4,
12985
+ cacheRead: 0.26,
12986
+ cacheWrite: 0,
12987
+ },
12988
+ contextWindow: 1048576,
12989
+ maxTokens: 131072,
12990
+ },
12944
12991
  "~anthropic/claude-fable-latest": {
12945
12992
  id: "~anthropic/claude-fable-latest",
12946
12993
  name: "Anthropic: Claude Fable Latest",
@@ -13237,8 +13284,8 @@ export const MODELS = {
13237
13284
  reasoning: false,
13238
13285
  input: ["text"],
13239
13286
  cost: {
13240
- input: 2.5,
13241
- output: 7.5,
13287
+ input: 1.25,
13288
+ output: 3.75,
13242
13289
  cacheRead: 0,
13243
13290
  cacheWrite: 0,
13244
13291
  },
@@ -15042,6 +15089,23 @@ export const MODELS = {
15042
15089
  contextWindow: 256000,
15043
15090
  maxTokens: 32768,
15044
15091
  },
15092
+ "moonshotai/kimi-k2.7-code-highspeed": {
15093
+ id: "moonshotai/kimi-k2.7-code-highspeed",
15094
+ name: "Kimi K2.7 Code High Speed",
15095
+ api: "anthropic-messages",
15096
+ provider: "vercel-ai-gateway",
15097
+ baseUrl: "https://ai-gateway.vercel.sh",
15098
+ reasoning: true,
15099
+ input: ["text", "image"],
15100
+ cost: {
15101
+ input: 1.9,
15102
+ output: 8,
15103
+ cacheRead: 0.38,
15104
+ cacheWrite: 0,
15105
+ },
15106
+ contextWindow: 262144,
15107
+ maxTokens: 4096,
15108
+ },
15045
15109
  "nvidia/nemotron-3-super-120b-a12b": {
15046
15110
  id: "nvidia/nemotron-3-super-120b-a12b",
15047
15111
  name: "NVIDIA Nemotron 3 Super 120B A12B",
@@ -16278,6 +16342,23 @@ export const MODELS = {
16278
16342
  contextWindow: 202800,
16279
16343
  maxTokens: 64000,
16280
16344
  },
16345
+ "zai/glm-5.2": {
16346
+ id: "zai/glm-5.2",
16347
+ name: "GLM 5.2",
16348
+ api: "anthropic-messages",
16349
+ provider: "vercel-ai-gateway",
16350
+ baseUrl: "https://ai-gateway.vercel.sh",
16351
+ reasoning: true,
16352
+ input: ["text"],
16353
+ cost: {
16354
+ input: 1.4,
16355
+ output: 4.4,
16356
+ cacheRead: 0.26,
16357
+ cacheWrite: 0,
16358
+ },
16359
+ contextWindow: 1000000,
16360
+ maxTokens: 128000,
16361
+ },
16281
16362
  "zai/glm-5v-turbo": {
16282
16363
  id: "zai/glm-5v-turbo",
16283
16364
  name: "GLM 5V Turbo",
@@ -16882,8 +16963,9 @@ export const MODELS = {
16882
16963
  api: "openai-completions",
16883
16964
  provider: "zai",
16884
16965
  baseUrl: "https://api.z.ai/api/coding/paas/v4",
16885
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16966
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "supportsReasoningEffort": true, "zaiToolStream": true },
16886
16967
  reasoning: true,
16968
+ thinkingLevelMap: { "minimal": null, "low": "high", "medium": "high", "high": "high", "xhigh": "max" },
16887
16969
  input: ["text"],
16888
16970
  cost: {
16889
16971
  input: 0,
@@ -16992,8 +17074,9 @@ export const MODELS = {
16992
17074
  api: "openai-completions",
16993
17075
  provider: "zai-coding-cn",
16994
17076
  baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16995
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
17077
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "supportsReasoningEffort": true, "zaiToolStream": true },
16996
17078
  reasoning: true,
17079
+ thinkingLevelMap: { "minimal": null, "low": "high", "medium": "high", "high": "high", "xhigh": "max" },
16997
17080
  input: ["text"],
16998
17081
  cost: {
16999
17082
  input: 0,