gsd-pi 2.72.0-dev.3159350 → 2.72.0-dev.4f3264a

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (189) hide show
  1. package/dist/resources/extensions/async-jobs/await-tool.js +4 -7
  2. package/dist/resources/extensions/async-jobs/job-manager.js +3 -28
  3. package/dist/resources/extensions/claude-code-cli/stream-adapter.js +26 -27
  4. package/dist/resources/extensions/gsd/auto/loop.js +1 -84
  5. package/dist/resources/extensions/gsd/auto-observability.js +54 -0
  6. package/dist/resources/extensions/gsd/auto-post-unit.js +0 -6
  7. package/dist/resources/extensions/gsd/auto.js +19 -25
  8. package/dist/resources/extensions/gsd/bootstrap/register-hooks.js +11 -9
  9. package/dist/resources/extensions/gsd/commands-handlers.js +1 -4
  10. package/dist/resources/extensions/gsd/context-injector.js +1 -1
  11. package/dist/resources/extensions/gsd/custom-workflow-engine.js +7 -3
  12. package/dist/resources/extensions/gsd/file-watcher.js +80 -0
  13. package/dist/resources/extensions/gsd/gsd-db.js +5 -47
  14. package/dist/resources/extensions/gsd/key-manager.js +0 -2
  15. package/dist/resources/extensions/gsd/preferences-skills.js +34 -2
  16. package/dist/resources/extensions/gsd/preferences-types.js +0 -15
  17. package/dist/resources/extensions/gsd/preferences.js +3 -16
  18. package/dist/resources/extensions/gsd/prompt-loader.js +1 -4
  19. package/dist/resources/extensions/gsd/rtk-status.js +43 -0
  20. package/dist/resources/extensions/gsd/state.js +1 -21
  21. package/dist/resources/extensions/gsd/write-intercept.js +1 -10
  22. package/dist/resources/extensions/ollama/index.js +5 -4
  23. package/dist/resources/extensions/ollama/ollama-client.js +6 -35
  24. package/dist/resources/extensions/ollama/ollama-discovery.js +6 -32
  25. package/dist/web/standalone/.next/BUILD_ID +1 -1
  26. package/dist/web/standalone/.next/app-path-routes-manifest.json +11 -11
  27. package/dist/web/standalone/.next/build-manifest.json +2 -2
  28. package/dist/web/standalone/.next/prerender-manifest.json +3 -3
  29. package/dist/web/standalone/.next/server/app/_global-error/page.js +3 -3
  30. package/dist/web/standalone/.next/server/app/_global-error/page_client-reference-manifest.js +1 -1
  31. package/dist/web/standalone/.next/server/app/_global-error.html +1 -1
  32. package/dist/web/standalone/.next/server/app/_global-error.rsc +1 -1
  33. package/dist/web/standalone/.next/server/app/_global-error.segments/_full.segment.rsc +1 -1
  34. package/dist/web/standalone/.next/server/app/_global-error.segments/_global-error/__PAGE__.segment.rsc +1 -1
  35. package/dist/web/standalone/.next/server/app/_global-error.segments/_global-error.segment.rsc +1 -1
  36. package/dist/web/standalone/.next/server/app/_global-error.segments/_head.segment.rsc +1 -1
  37. package/dist/web/standalone/.next/server/app/_global-error.segments/_index.segment.rsc +1 -1
  38. package/dist/web/standalone/.next/server/app/_global-error.segments/_tree.segment.rsc +1 -1
  39. package/dist/web/standalone/.next/server/app/_not-found/page.js +2 -2
  40. package/dist/web/standalone/.next/server/app/_not-found/page_client-reference-manifest.js +1 -1
  41. package/dist/web/standalone/.next/server/app/_not-found.html +1 -1
  42. package/dist/web/standalone/.next/server/app/_not-found.rsc +1 -1
  43. package/dist/web/standalone/.next/server/app/_not-found.segments/_full.segment.rsc +1 -1
  44. package/dist/web/standalone/.next/server/app/_not-found.segments/_head.segment.rsc +1 -1
  45. package/dist/web/standalone/.next/server/app/_not-found.segments/_index.segment.rsc +1 -1
  46. package/dist/web/standalone/.next/server/app/_not-found.segments/_not-found/__PAGE__.segment.rsc +1 -1
  47. package/dist/web/standalone/.next/server/app/_not-found.segments/_not-found.segment.rsc +1 -1
  48. package/dist/web/standalone/.next/server/app/_not-found.segments/_tree.segment.rsc +1 -1
  49. package/dist/web/standalone/.next/server/app/api/boot/route.js +1 -1
  50. package/dist/web/standalone/.next/server/app/api/bridge-terminal/input/route.js +1 -1
  51. package/dist/web/standalone/.next/server/app/api/bridge-terminal/resize/route.js +1 -1
  52. package/dist/web/standalone/.next/server/app/api/bridge-terminal/stream/route.js +2 -2
  53. package/dist/web/standalone/.next/server/app/api/browse-directories/route.js +1 -1
  54. package/dist/web/standalone/.next/server/app/api/captures/route.js +1 -1
  55. package/dist/web/standalone/.next/server/app/api/cleanup/route.js +1 -1
  56. package/dist/web/standalone/.next/server/app/api/dev-mode/route.js +1 -1
  57. package/dist/web/standalone/.next/server/app/api/doctor/route.js +1 -1
  58. package/dist/web/standalone/.next/server/app/api/experimental/route.js +2 -2
  59. package/dist/web/standalone/.next/server/app/api/export-data/route.js +1 -1
  60. package/dist/web/standalone/.next/server/app/api/files/route.js +1 -1
  61. package/dist/web/standalone/.next/server/app/api/forensics/route.js +1 -1
  62. package/dist/web/standalone/.next/server/app/api/git/route.js +1 -1
  63. package/dist/web/standalone/.next/server/app/api/history/route.js +1 -1
  64. package/dist/web/standalone/.next/server/app/api/hooks/route.js +1 -1
  65. package/dist/web/standalone/.next/server/app/api/inspect/route.js +1 -1
  66. package/dist/web/standalone/.next/server/app/api/knowledge/route.js +1 -1
  67. package/dist/web/standalone/.next/server/app/api/live-state/route.js +1 -1
  68. package/dist/web/standalone/.next/server/app/api/notifications/route.js +2 -2
  69. package/dist/web/standalone/.next/server/app/api/onboarding/route.js +1 -1
  70. package/dist/web/standalone/.next/server/app/api/preferences/route.js +1 -1
  71. package/dist/web/standalone/.next/server/app/api/projects/route.js +1 -1
  72. package/dist/web/standalone/.next/server/app/api/recovery/route.js +1 -1
  73. package/dist/web/standalone/.next/server/app/api/remote-questions/route.js +2 -2
  74. package/dist/web/standalone/.next/server/app/api/session/browser/route.js +1 -1
  75. package/dist/web/standalone/.next/server/app/api/session/command/route.js +1 -1
  76. package/dist/web/standalone/.next/server/app/api/session/events/route.js +2 -2
  77. package/dist/web/standalone/.next/server/app/api/session/manage/route.js +1 -1
  78. package/dist/web/standalone/.next/server/app/api/settings-data/route.js +1 -1
  79. package/dist/web/standalone/.next/server/app/api/shutdown/route.js +1 -1
  80. package/dist/web/standalone/.next/server/app/api/skill-health/route.js +1 -1
  81. package/dist/web/standalone/.next/server/app/api/steer/route.js +1 -1
  82. package/dist/web/standalone/.next/server/app/api/switch-root/route.js +1 -1
  83. package/dist/web/standalone/.next/server/app/api/terminal/input/route.js +2 -2
  84. package/dist/web/standalone/.next/server/app/api/terminal/resize/route.js +2 -2
  85. package/dist/web/standalone/.next/server/app/api/terminal/sessions/route.js +2 -2
  86. package/dist/web/standalone/.next/server/app/api/terminal/stream/route.js +3 -3
  87. package/dist/web/standalone/.next/server/app/api/terminal/upload/route.js +1 -1
  88. package/dist/web/standalone/.next/server/app/api/undo/route.js +1 -1
  89. package/dist/web/standalone/.next/server/app/api/update/route.js +1 -1
  90. package/dist/web/standalone/.next/server/app/api/visualizer/route.js +1 -1
  91. package/dist/web/standalone/.next/server/app/index.html +1 -1
  92. package/dist/web/standalone/.next/server/app/index.rsc +1 -1
  93. package/dist/web/standalone/.next/server/app/index.segments/__PAGE__.segment.rsc +1 -1
  94. package/dist/web/standalone/.next/server/app/index.segments/_full.segment.rsc +1 -1
  95. package/dist/web/standalone/.next/server/app/index.segments/_head.segment.rsc +1 -1
  96. package/dist/web/standalone/.next/server/app/index.segments/_index.segment.rsc +1 -1
  97. package/dist/web/standalone/.next/server/app/index.segments/_tree.segment.rsc +1 -1
  98. package/dist/web/standalone/.next/server/app/page.js +2 -2
  99. package/dist/web/standalone/.next/server/app/page_client-reference-manifest.js +1 -1
  100. package/dist/web/standalone/.next/server/app-paths-manifest.json +11 -11
  101. package/dist/web/standalone/.next/server/chunks/2331.js +16 -16
  102. package/dist/web/standalone/.next/server/chunks/4741.js +12 -12
  103. package/dist/web/standalone/.next/server/chunks/5822.js +2 -2
  104. package/dist/web/standalone/.next/server/chunks/63.js +8 -8
  105. package/dist/web/standalone/.next/server/chunks/6897.js +3 -3
  106. package/dist/web/standalone/.next/server/functions-config-manifest.json +9 -0
  107. package/dist/web/standalone/.next/server/middleware-build-manifest.js +1 -1
  108. package/dist/web/standalone/.next/server/middleware-manifest.json +2 -29
  109. package/dist/web/standalone/.next/server/middleware.js +12 -4
  110. package/dist/web/standalone/.next/server/pages/404.html +1 -1
  111. package/dist/web/standalone/.next/server/pages/500.html +1 -1
  112. package/dist/web/standalone/.next/server/server-reference-manifest.json +1 -1
  113. package/dist/web/standalone/.next/server/webpack-runtime.js +1 -1
  114. package/package.json +1 -1
  115. package/packages/pi-ai/dist/env-api-keys.js +0 -1
  116. package/packages/pi-ai/dist/env-api-keys.js.map +1 -1
  117. package/packages/pi-ai/dist/models.custom.d.ts +0 -105
  118. package/packages/pi-ai/dist/models.custom.d.ts.map +1 -1
  119. package/packages/pi-ai/dist/models.custom.js +0 -97
  120. package/packages/pi-ai/dist/models.custom.js.map +1 -1
  121. package/packages/pi-ai/dist/models.generated.d.ts +140 -648
  122. package/packages/pi-ai/dist/models.generated.d.ts.map +1 -1
  123. package/packages/pi-ai/dist/models.generated.js +364 -861
  124. package/packages/pi-ai/dist/models.generated.js.map +1 -1
  125. package/packages/pi-ai/dist/models.test.js +0 -105
  126. package/packages/pi-ai/dist/models.test.js.map +1 -1
  127. package/packages/pi-ai/dist/types.d.ts +1 -1
  128. package/packages/pi-ai/dist/types.d.ts.map +1 -1
  129. package/packages/pi-ai/dist/types.js.map +1 -1
  130. package/packages/pi-ai/src/env-api-keys.ts +0 -1
  131. package/packages/pi-ai/src/models.custom.ts +0 -98
  132. package/packages/pi-ai/src/models.generated.ts +364 -861
  133. package/packages/pi-ai/src/models.test.ts +0 -135
  134. package/packages/pi-ai/src/types.ts +0 -1
  135. package/packages/pi-coding-agent/dist/core/model-resolver.d.ts.map +1 -1
  136. package/packages/pi-coding-agent/dist/core/model-resolver.js +0 -1
  137. package/packages/pi-coding-agent/dist/core/model-resolver.js.map +1 -1
  138. package/packages/pi-coding-agent/src/core/model-resolver.ts +0 -1
  139. package/src/resources/extensions/async-jobs/await-tool.test.ts +7 -40
  140. package/src/resources/extensions/async-jobs/await-tool.ts +4 -7
  141. package/src/resources/extensions/async-jobs/job-manager.ts +3 -33
  142. package/src/resources/extensions/claude-code-cli/stream-adapter.ts +26 -27
  143. package/src/resources/extensions/claude-code-cli/tests/stream-adapter.test.ts +2 -20
  144. package/src/resources/extensions/gsd/auto/loop.ts +1 -89
  145. package/src/resources/extensions/gsd/auto-observability.ts +72 -0
  146. package/src/resources/extensions/gsd/auto-post-unit.ts +0 -7
  147. package/src/resources/extensions/gsd/auto.ts +20 -25
  148. package/src/resources/extensions/gsd/bootstrap/register-hooks.ts +10 -8
  149. package/src/resources/extensions/gsd/commands-handlers.ts +1 -5
  150. package/src/resources/extensions/gsd/context-injector.ts +1 -1
  151. package/src/resources/extensions/gsd/custom-workflow-engine.ts +8 -4
  152. package/src/resources/extensions/gsd/file-watcher.ts +100 -0
  153. package/src/resources/extensions/gsd/gsd-db.ts +5 -52
  154. package/src/resources/extensions/gsd/key-manager.ts +0 -2
  155. package/src/resources/extensions/gsd/preferences-skills.ts +36 -2
  156. package/src/resources/extensions/gsd/preferences-types.ts +0 -16
  157. package/src/resources/extensions/gsd/preferences.ts +6 -19
  158. package/src/resources/extensions/gsd/prompt-loader.ts +1 -6
  159. package/src/resources/extensions/gsd/rtk-status.ts +53 -0
  160. package/src/resources/extensions/gsd/state.ts +0 -20
  161. package/src/resources/extensions/gsd/tests/gsd-db.test.ts +0 -74
  162. package/src/resources/extensions/gsd/tests/key-manager.test.ts +0 -63
  163. package/src/resources/extensions/gsd/tests/preferences.test.ts +0 -53
  164. package/src/resources/extensions/gsd/write-intercept.ts +1 -10
  165. package/src/resources/extensions/ollama/index.ts +5 -4
  166. package/src/resources/extensions/ollama/ollama-client.ts +6 -35
  167. package/src/resources/extensions/ollama/ollama-discovery.ts +6 -37
  168. package/src/resources/extensions/ollama/tests/ollama-discovery.test.ts +0 -54
  169. package/dist/resources/extensions/gsd/definition-io.js +0 -15
  170. package/dist/web/standalone/.next/server/edge-runtime-webpack.js +0 -2
  171. package/packages/pi-ai/dist/models.generated.test.d.ts +0 -2
  172. package/packages/pi-ai/dist/models.generated.test.d.ts.map +0 -1
  173. package/packages/pi-ai/dist/models.generated.test.js +0 -334
  174. package/packages/pi-ai/dist/models.generated.test.js.map +0 -1
  175. package/packages/pi-ai/src/models.generated.test.ts +0 -373
  176. package/src/resources/extensions/gsd/definition-io.ts +0 -18
  177. package/src/resources/extensions/gsd/tests/auto-paused-ui-cleanup.test.ts +0 -27
  178. package/src/resources/extensions/gsd/tests/block-db-writes.test.ts +0 -63
  179. package/src/resources/extensions/gsd/tests/definition-io.test.ts +0 -57
  180. package/src/resources/extensions/gsd/tests/doctor-heal-fixable-warnings.test.ts +0 -14
  181. package/src/resources/extensions/gsd/tests/false-degraded-mode-warning.test.ts +0 -104
  182. package/src/resources/extensions/gsd/tests/memory-pressure-stuck-state.test.ts +0 -54
  183. package/src/resources/extensions/gsd/tests/post-unit-state-rebuild.test.ts +0 -34
  184. package/src/resources/extensions/gsd/tests/preferences-formatting.test.ts +0 -87
  185. package/src/resources/extensions/gsd/tests/prompt-loader-working-directory.test.ts +0 -19
  186. package/src/resources/extensions/gsd/tests/register-hooks-depth-verification.test.ts +0 -97
  187. package/src/resources/extensions/gsd/tests/stale-slice-rows.test.ts +0 -41
  188. /package/dist/web/standalone/.next/static/{eR2tLKungpmiiOyUIhqjF → vr6Pbde48w4rMUplqDdh_}/_buildManifest.js +0 -0
  189. /package/dist/web/standalone/.next/static/{eR2tLKungpmiiOyUIhqjF → vr6Pbde48w4rMUplqDdh_}/_ssgManifest.js +0 -0
@@ -804,23 +804,6 @@ export const MODELS = {
804
804
  contextWindow: 204800,
805
805
  maxTokens: 131072,
806
806
  } satisfies Model<"bedrock-converse-stream">,
807
- "minimax.minimax-m2.5": {
808
- id: "minimax.minimax-m2.5",
809
- name: "MiniMax M2.5",
810
- api: "bedrock-converse-stream",
811
- provider: "amazon-bedrock",
812
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
813
- reasoning: true,
814
- input: ["text"],
815
- cost: {
816
- input: 0.3,
817
- output: 1.2,
818
- cacheRead: 0,
819
- cacheWrite: 0,
820
- },
821
- contextWindow: 196608,
822
- maxTokens: 98304,
823
- } satisfies Model<"bedrock-converse-stream">,
824
807
  "mistral.devstral-2-123b": {
825
808
  id: "mistral.devstral-2-123b",
826
809
  name: "Devstral 2 123B",
@@ -1059,23 +1042,6 @@ export const MODELS = {
1059
1042
  contextWindow: 128000,
1060
1043
  maxTokens: 4096,
1061
1044
  } satisfies Model<"bedrock-converse-stream">,
1062
- "nvidia.nemotron-super-3-120b": {
1063
- id: "nvidia.nemotron-super-3-120b",
1064
- name: "NVIDIA Nemotron 3 Super 120B A12B",
1065
- api: "bedrock-converse-stream",
1066
- provider: "amazon-bedrock",
1067
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1068
- reasoning: true,
1069
- input: ["text"],
1070
- cost: {
1071
- input: 0.15,
1072
- output: 0.65,
1073
- cacheRead: 0,
1074
- cacheWrite: 0,
1075
- },
1076
- contextWindow: 262144,
1077
- maxTokens: 131072,
1078
- } satisfies Model<"bedrock-converse-stream">,
1079
1045
  "openai.gpt-oss-120b-1:0": {
1080
1046
  id: "openai.gpt-oss-120b-1:0",
1081
1047
  name: "gpt-oss-120b",
@@ -1212,23 +1178,6 @@ export const MODELS = {
1212
1178
  contextWindow: 131072,
1213
1179
  maxTokens: 65536,
1214
1180
  } satisfies Model<"bedrock-converse-stream">,
1215
- "qwen.qwen3-coder-next": {
1216
- id: "qwen.qwen3-coder-next",
1217
- name: "Qwen3 Coder Next",
1218
- api: "bedrock-converse-stream",
1219
- provider: "amazon-bedrock",
1220
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1221
- reasoning: true,
1222
- input: ["text"],
1223
- cost: {
1224
- input: 0.22,
1225
- output: 1.8,
1226
- cacheRead: 0,
1227
- cacheWrite: 0,
1228
- },
1229
- contextWindow: 131072,
1230
- maxTokens: 65536,
1231
- } satisfies Model<"bedrock-converse-stream">,
1232
1181
  "qwen.qwen3-next-80b-a3b": {
1233
1182
  id: "qwen.qwen3-next-80b-a3b",
1234
1183
  name: "Qwen/Qwen3-Next-80B-A3B-Instruct",
@@ -1467,23 +1416,6 @@ export const MODELS = {
1467
1416
  contextWindow: 200000,
1468
1417
  maxTokens: 131072,
1469
1418
  } satisfies Model<"bedrock-converse-stream">,
1470
- "zai.glm-5": {
1471
- id: "zai.glm-5",
1472
- name: "GLM-5",
1473
- api: "bedrock-converse-stream",
1474
- provider: "amazon-bedrock",
1475
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1476
- reasoning: true,
1477
- input: ["text"],
1478
- cost: {
1479
- input: 1,
1480
- output: 3.2,
1481
- cacheRead: 0,
1482
- cacheWrite: 0,
1483
- },
1484
- contextWindow: 202752,
1485
- maxTokens: 101376,
1486
- } satisfies Model<"bedrock-converse-stream">,
1487
1419
  },
1488
1420
  "anthropic": {
1489
1421
  "claude-3-5-haiku-20241022": {
@@ -1571,6 +1503,23 @@ export const MODELS = {
1571
1503
  contextWindow: 200000,
1572
1504
  maxTokens: 64000,
1573
1505
  } satisfies Model<"anthropic-messages">,
1506
+ "claude-3-7-sonnet-latest": {
1507
+ id: "claude-3-7-sonnet-latest",
1508
+ name: "Claude Sonnet 3.7 (latest)",
1509
+ api: "anthropic-messages",
1510
+ provider: "anthropic",
1511
+ baseUrl: "https://api.anthropic.com",
1512
+ reasoning: true,
1513
+ input: ["text", "image"],
1514
+ cost: {
1515
+ input: 3,
1516
+ output: 15,
1517
+ cacheRead: 0.3,
1518
+ cacheWrite: 3.75,
1519
+ },
1520
+ contextWindow: 200000,
1521
+ maxTokens: 64000,
1522
+ } satisfies Model<"anthropic-messages">,
1574
1523
  "claude-3-haiku-20240307": {
1575
1524
  id: "claude-3-haiku-20240307",
1576
1525
  name: "Claude Haiku 3",
@@ -2304,23 +2253,6 @@ export const MODELS = {
2304
2253
  contextWindow: 400000,
2305
2254
  maxTokens: 128000,
2306
2255
  } satisfies Model<"azure-openai-responses">,
2307
- "gpt-5.3-chat-latest": {
2308
- id: "gpt-5.3-chat-latest",
2309
- name: "GPT-5.3 Chat (latest)",
2310
- api: "azure-openai-responses",
2311
- provider: "azure-openai-responses",
2312
- baseUrl: "",
2313
- reasoning: false,
2314
- input: ["text", "image"],
2315
- cost: {
2316
- input: 1.75,
2317
- output: 14,
2318
- cacheRead: 0.175,
2319
- cacheWrite: 0,
2320
- },
2321
- contextWindow: 128000,
2322
- maxTokens: 16384,
2323
- } satisfies Model<"azure-openai-responses">,
2324
2256
  "gpt-5.3-codex": {
2325
2257
  id: "gpt-5.3-codex",
2326
2258
  name: "GPT-5.3 Codex",
@@ -3035,7 +2967,7 @@ export const MODELS = {
3035
2967
  } satisfies Model<"openai-responses">,
3036
2968
  "gpt-5.4-mini": {
3037
2969
  id: "gpt-5.4-mini",
3038
- name: "GPT-5.4 Mini",
2970
+ name: "GPT-5.4 mini",
3039
2971
  api: "openai-responses",
3040
2972
  provider: "github-copilot",
3041
2973
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3480,57 +3412,6 @@ export const MODELS = {
3480
3412
  contextWindow: 131072,
3481
3413
  maxTokens: 65536,
3482
3414
  } satisfies Model<"google-generative-ai">,
3483
- "gemma-3-27b-it": {
3484
- id: "gemma-3-27b-it",
3485
- name: "Gemma 3 27B",
3486
- api: "google-generative-ai",
3487
- provider: "google",
3488
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3489
- reasoning: false,
3490
- input: ["text", "image"],
3491
- cost: {
3492
- input: 0,
3493
- output: 0,
3494
- cacheRead: 0,
3495
- cacheWrite: 0,
3496
- },
3497
- contextWindow: 131072,
3498
- maxTokens: 8192,
3499
- } satisfies Model<"google-generative-ai">,
3500
- "gemma-4-26b-it": {
3501
- id: "gemma-4-26b-it",
3502
- name: "Gemma 4 26B",
3503
- api: "google-generative-ai",
3504
- provider: "google",
3505
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3506
- reasoning: true,
3507
- input: ["text", "image"],
3508
- cost: {
3509
- input: 0,
3510
- output: 0,
3511
- cacheRead: 0,
3512
- cacheWrite: 0,
3513
- },
3514
- contextWindow: 256000,
3515
- maxTokens: 8192,
3516
- } satisfies Model<"google-generative-ai">,
3517
- "gemma-4-31b-it": {
3518
- id: "gemma-4-31b-it",
3519
- name: "Gemma 4 31B",
3520
- api: "google-generative-ai",
3521
- provider: "google",
3522
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3523
- reasoning: true,
3524
- input: ["text", "image"],
3525
- cost: {
3526
- input: 0,
3527
- output: 0,
3528
- cacheRead: 0,
3529
- cacheWrite: 0,
3530
- },
3531
- contextWindow: 256000,
3532
- maxTokens: 8192,
3533
- } satisfies Model<"google-generative-ai">,
3534
3415
  },
3535
3416
  "google-antigravity": {
3536
3417
  "claude-opus-4-5-thinking": {
@@ -4032,40 +3913,6 @@ export const MODELS = {
4032
3913
  contextWindow: 8192,
4033
3914
  maxTokens: 8192,
4034
3915
  } satisfies Model<"openai-completions">,
4035
- "groq/compound": {
4036
- id: "groq/compound",
4037
- name: "Compound",
4038
- api: "openai-completions",
4039
- provider: "groq",
4040
- baseUrl: "https://api.groq.com/openai/v1",
4041
- reasoning: true,
4042
- input: ["text"],
4043
- cost: {
4044
- input: 0,
4045
- output: 0,
4046
- cacheRead: 0,
4047
- cacheWrite: 0,
4048
- },
4049
- contextWindow: 131072,
4050
- maxTokens: 8192,
4051
- } satisfies Model<"openai-completions">,
4052
- "groq/compound-mini": {
4053
- id: "groq/compound-mini",
4054
- name: "Compound Mini",
4055
- api: "openai-completions",
4056
- provider: "groq",
4057
- baseUrl: "https://api.groq.com/openai/v1",
4058
- reasoning: true,
4059
- input: ["text"],
4060
- cost: {
4061
- input: 0,
4062
- output: 0,
4063
- cacheRead: 0,
4064
- cacheWrite: 0,
4065
- },
4066
- contextWindow: 131072,
4067
- maxTokens: 8192,
4068
- } satisfies Model<"openai-completions">,
4069
3916
  "llama-3.1-8b-instant": {
4070
3917
  id: "llama-3.1-8b-instant",
4071
3918
  name: "Llama 3.1 8B Instant",
@@ -4253,23 +4100,6 @@ export const MODELS = {
4253
4100
  contextWindow: 131072,
4254
4101
  maxTokens: 65536,
4255
4102
  } satisfies Model<"openai-completions">,
4256
- "openai/gpt-oss-safeguard-20b": {
4257
- id: "openai/gpt-oss-safeguard-20b",
4258
- name: "Safety GPT OSS 20B",
4259
- api: "openai-completions",
4260
- provider: "groq",
4261
- baseUrl: "https://api.groq.com/openai/v1",
4262
- reasoning: true,
4263
- input: ["text"],
4264
- cost: {
4265
- input: 0.075,
4266
- output: 0.3,
4267
- cacheRead: 0.037,
4268
- cacheWrite: 0,
4269
- },
4270
- contextWindow: 131072,
4271
- maxTokens: 65536,
4272
- } satisfies Model<"openai-completions">,
4273
4103
  "qwen-qwq-32b": {
4274
4104
  id: "qwen-qwq-32b",
4275
4105
  name: "Qwen QwQ 32B",
@@ -4302,7 +4132,7 @@ export const MODELS = {
4302
4132
  cacheWrite: 0,
4303
4133
  },
4304
4134
  contextWindow: 131072,
4305
- maxTokens: 40960,
4135
+ maxTokens: 16384,
4306
4136
  } satisfies Model<"openai-completions">,
4307
4137
  },
4308
4138
  "huggingface": {
@@ -4630,24 +4460,6 @@ export const MODELS = {
4630
4460
  contextWindow: 202752,
4631
4461
  maxTokens: 131072,
4632
4462
  } satisfies Model<"openai-completions">,
4633
- "zai-org/GLM-5.1": {
4634
- id: "zai-org/GLM-5.1",
4635
- name: "GLM-5.1",
4636
- api: "openai-completions",
4637
- provider: "huggingface",
4638
- baseUrl: "https://router.huggingface.co/v1",
4639
- compat: {"supportsDeveloperRole":false},
4640
- reasoning: true,
4641
- input: ["text"],
4642
- cost: {
4643
- input: 1,
4644
- output: 3.2,
4645
- cacheRead: 0.2,
4646
- cacheWrite: 0,
4647
- },
4648
- contextWindow: 202752,
4649
- maxTokens: 131072,
4650
- } satisfies Model<"openai-completions">,
4651
4463
  },
4652
4464
  "kimi-coding": {
4653
4465
  "k2p5": {
@@ -5217,39 +5029,22 @@ export const MODELS = {
5217
5029
  contextWindow: 128000,
5218
5030
  maxTokens: 16384,
5219
5031
  } satisfies Model<"mistral-conversations">,
5220
- "mistral-small-2603": {
5221
- id: "mistral-small-2603",
5222
- name: "Mistral Small 4",
5223
- api: "mistral-conversations",
5224
- provider: "mistral",
5225
- baseUrl: "https://api.mistral.ai",
5226
- reasoning: true,
5227
- input: ["text", "image"],
5228
- cost: {
5229
- input: 0.15,
5230
- output: 0.6,
5231
- cacheRead: 0,
5232
- cacheWrite: 0,
5233
- },
5234
- contextWindow: 256000,
5235
- maxTokens: 256000,
5236
- } satisfies Model<"mistral-conversations">,
5237
5032
  "mistral-small-latest": {
5238
5033
  id: "mistral-small-latest",
5239
5034
  name: "Mistral Small (latest)",
5240
5035
  api: "mistral-conversations",
5241
5036
  provider: "mistral",
5242
5037
  baseUrl: "https://api.mistral.ai",
5243
- reasoning: true,
5038
+ reasoning: false,
5244
5039
  input: ["text", "image"],
5245
5040
  cost: {
5246
- input: 0.15,
5247
- output: 0.6,
5041
+ input: 0.1,
5042
+ output: 0.3,
5248
5043
  cacheRead: 0,
5249
5044
  cacheWrite: 0,
5250
5045
  },
5251
- contextWindow: 256000,
5252
- maxTokens: 256000,
5046
+ contextWindow: 128000,
5047
+ maxTokens: 16384,
5253
5048
  } satisfies Model<"mistral-conversations">,
5254
5049
  "open-mistral-7b": {
5255
5050
  id: "open-mistral-7b",
@@ -5780,23 +5575,6 @@ export const MODELS = {
5780
5575
  contextWindow: 400000,
5781
5576
  maxTokens: 128000,
5782
5577
  } satisfies Model<"openai-responses">,
5783
- "gpt-5.3-chat-latest": {
5784
- id: "gpt-5.3-chat-latest",
5785
- name: "GPT-5.3 Chat (latest)",
5786
- api: "openai-responses",
5787
- provider: "openai",
5788
- baseUrl: "https://api.openai.com/v1",
5789
- reasoning: false,
5790
- input: ["text", "image"],
5791
- cost: {
5792
- input: 1.75,
5793
- output: 14,
5794
- cacheRead: 0.175,
5795
- cacheWrite: 0,
5796
- },
5797
- contextWindow: 128000,
5798
- maxTokens: 16384,
5799
- } satisfies Model<"openai-responses">,
5800
5578
  "gpt-5.3-codex": {
5801
5579
  id: "gpt-5.3-codex",
5802
5580
  name: "GPT-5.3 Codex",
@@ -6379,23 +6157,6 @@ export const MODELS = {
6379
6157
  contextWindow: 204800,
6380
6158
  maxTokens: 131072,
6381
6159
  } satisfies Model<"openai-completions">,
6382
- "glm-5.1": {
6383
- id: "glm-5.1",
6384
- name: "GLM-5.1",
6385
- api: "openai-completions",
6386
- provider: "opencode",
6387
- baseUrl: "https://opencode.ai/zen/v1",
6388
- reasoning: true,
6389
- input: ["text"],
6390
- cost: {
6391
- input: 1.4,
6392
- output: 4.4,
6393
- cacheRead: 0.26,
6394
- cacheWrite: 0,
6395
- },
6396
- contextWindow: 204800,
6397
- maxTokens: 131072,
6398
- } satisfies Model<"openai-completions">,
6399
6160
  "gpt-5": {
6400
6161
  id: "gpt-5",
6401
6162
  name: "GPT-5",
@@ -6651,24 +6412,58 @@ export const MODELS = {
6651
6412
  contextWindow: 262144,
6652
6413
  maxTokens: 65536,
6653
6414
  } satisfies Model<"openai-completions">,
6654
- "minimax-m2.5": {
6655
- id: "minimax-m2.5",
6656
- name: "MiniMax M2.5",
6415
+ "mimo-v2-omni-free": {
6416
+ id: "mimo-v2-omni-free",
6417
+ name: "MiMo V2 Omni Free",
6657
6418
  api: "openai-completions",
6658
6419
  provider: "opencode",
6659
6420
  baseUrl: "https://opencode.ai/zen/v1",
6660
6421
  reasoning: true,
6661
- input: ["text"],
6422
+ input: ["text", "image"],
6662
6423
  cost: {
6663
- input: 0.3,
6664
- output: 1.2,
6665
- cacheRead: 0.06,
6424
+ input: 0,
6425
+ output: 0,
6426
+ cacheRead: 0,
6666
6427
  cacheWrite: 0,
6667
6428
  },
6668
- contextWindow: 204800,
6669
- maxTokens: 131072,
6429
+ contextWindow: 262144,
6430
+ maxTokens: 64000,
6670
6431
  } satisfies Model<"openai-completions">,
6671
- "minimax-m2.5-free": {
6432
+ "mimo-v2-pro-free": {
6433
+ id: "mimo-v2-pro-free",
6434
+ name: "MiMo V2 Pro Free",
6435
+ api: "openai-completions",
6436
+ provider: "opencode",
6437
+ baseUrl: "https://opencode.ai/zen/v1",
6438
+ reasoning: true,
6439
+ input: ["text"],
6440
+ cost: {
6441
+ input: 0,
6442
+ output: 0,
6443
+ cacheRead: 0,
6444
+ cacheWrite: 0,
6445
+ },
6446
+ contextWindow: 1048576,
6447
+ maxTokens: 64000,
6448
+ } satisfies Model<"openai-completions">,
6449
+ "minimax-m2.5": {
6450
+ id: "minimax-m2.5",
6451
+ name: "MiniMax M2.5",
6452
+ api: "openai-completions",
6453
+ provider: "opencode",
6454
+ baseUrl: "https://opencode.ai/zen/v1",
6455
+ reasoning: true,
6456
+ input: ["text"],
6457
+ cost: {
6458
+ input: 0.3,
6459
+ output: 1.2,
6460
+ cacheRead: 0.06,
6461
+ cacheWrite: 0,
6462
+ },
6463
+ contextWindow: 204800,
6464
+ maxTokens: 131072,
6465
+ } satisfies Model<"openai-completions">,
6466
+ "minimax-m2.5-free": {
6672
6467
  id: "minimax-m2.5-free",
6673
6468
  name: "MiniMax M2.5 Free",
6674
6469
  api: "anthropic-messages",
@@ -6699,7 +6494,7 @@ export const MODELS = {
6699
6494
  cacheRead: 0,
6700
6495
  cacheWrite: 0,
6701
6496
  },
6702
- contextWindow: 204800,
6497
+ contextWindow: 1000000,
6703
6498
  maxTokens: 128000,
6704
6499
  } satisfies Model<"openai-completions">,
6705
6500
  },
@@ -6721,23 +6516,6 @@ export const MODELS = {
6721
6516
  contextWindow: 204800,
6722
6517
  maxTokens: 131072,
6723
6518
  } satisfies Model<"openai-completions">,
6724
- "glm-5.1": {
6725
- id: "glm-5.1",
6726
- name: "GLM-5.1",
6727
- api: "openai-completions",
6728
- provider: "opencode-go",
6729
- baseUrl: "https://opencode.ai/zen/go/v1",
6730
- reasoning: true,
6731
- input: ["text"],
6732
- cost: {
6733
- input: 1.4,
6734
- output: 4.4,
6735
- cacheRead: 0.26,
6736
- cacheWrite: 0,
6737
- },
6738
- contextWindow: 204800,
6739
- maxTokens: 131072,
6740
- } satisfies Model<"openai-completions">,
6741
6519
  "kimi-k2.5": {
6742
6520
  id: "kimi-k2.5",
6743
6521
  name: "Kimi K2.5",
@@ -6755,40 +6533,6 @@ export const MODELS = {
6755
6533
  contextWindow: 262144,
6756
6534
  maxTokens: 65536,
6757
6535
  } satisfies Model<"openai-completions">,
6758
- "mimo-v2-omni": {
6759
- id: "mimo-v2-omni",
6760
- name: "MiMo V2 Omni",
6761
- api: "openai-completions",
6762
- provider: "opencode-go",
6763
- baseUrl: "https://opencode.ai/zen/go/v1",
6764
- reasoning: true,
6765
- input: ["text", "image"],
6766
- cost: {
6767
- input: 0.4,
6768
- output: 2,
6769
- cacheRead: 0.08,
6770
- cacheWrite: 0,
6771
- },
6772
- contextWindow: 262144,
6773
- maxTokens: 64000,
6774
- } satisfies Model<"openai-completions">,
6775
- "mimo-v2-pro": {
6776
- id: "mimo-v2-pro",
6777
- name: "MiMo V2 Pro",
6778
- api: "openai-completions",
6779
- provider: "opencode-go",
6780
- baseUrl: "https://opencode.ai/zen/go/v1",
6781
- reasoning: true,
6782
- input: ["text"],
6783
- cost: {
6784
- input: 1,
6785
- output: 3,
6786
- cacheRead: 0.2,
6787
- cacheWrite: 0,
6788
- },
6789
- contextWindow: 1048576,
6790
- maxTokens: 64000,
6791
- } satisfies Model<"openai-completions">,
6792
6536
  "minimax-m2.5": {
6793
6537
  id: "minimax-m2.5",
6794
6538
  name: "MiniMax M2.5",
@@ -6995,6 +6739,23 @@ export const MODELS = {
6995
6739
  contextWindow: 200000,
6996
6740
  maxTokens: 8192,
6997
6741
  } satisfies Model<"openai-completions">,
6742
+ "anthropic/claude-3.5-sonnet": {
6743
+ id: "anthropic/claude-3.5-sonnet",
6744
+ name: "Anthropic: Claude 3.5 Sonnet",
6745
+ api: "openai-completions",
6746
+ provider: "openrouter",
6747
+ baseUrl: "https://openrouter.ai/api/v1",
6748
+ reasoning: false,
6749
+ input: ["text", "image"],
6750
+ cost: {
6751
+ input: 6,
6752
+ output: 30,
6753
+ cacheRead: 0.6,
6754
+ cacheWrite: 7.5,
6755
+ },
6756
+ contextWindow: 200000,
6757
+ maxTokens: 8192,
6758
+ } satisfies Model<"openai-completions">,
6998
6759
  "anthropic/claude-3.7-sonnet": {
6999
6760
  id: "anthropic/claude-3.7-sonnet",
7000
6761
  name: "Anthropic: Claude 3.7 Sonnet",
@@ -7010,7 +6771,7 @@ export const MODELS = {
7010
6771
  cacheWrite: 3.75,
7011
6772
  },
7012
6773
  contextWindow: 200000,
7013
- maxTokens: 128000,
6774
+ maxTokens: 64000,
7014
6775
  } satisfies Model<"openai-completions">,
7015
6776
  "anthropic/claude-3.7-sonnet:thinking": {
7016
6777
  id: "anthropic/claude-3.7-sonnet:thinking",
@@ -7114,23 +6875,6 @@ export const MODELS = {
7114
6875
  contextWindow: 1000000,
7115
6876
  maxTokens: 128000,
7116
6877
  } satisfies Model<"openai-completions">,
7117
- "anthropic/claude-opus-4.6-fast": {
7118
- id: "anthropic/claude-opus-4.6-fast",
7119
- name: "Anthropic: Claude Opus 4.6 (Fast)",
7120
- api: "openai-completions",
7121
- provider: "openrouter",
7122
- baseUrl: "https://openrouter.ai/api/v1",
7123
- reasoning: true,
7124
- input: ["text", "image"],
7125
- cost: {
7126
- input: 30,
7127
- output: 150,
7128
- cacheRead: 3,
7129
- cacheWrite: 37.5,
7130
- },
7131
- contextWindow: 1000000,
7132
- maxTokens: 128000,
7133
- } satisfies Model<"openai-completions">,
7134
6878
  "anthropic/claude-sonnet-4": {
7135
6879
  id: "anthropic/claude-sonnet-4",
7136
6880
  name: "Anthropic: Claude Sonnet 4",
@@ -7145,7 +6889,7 @@ export const MODELS = {
7145
6889
  cacheRead: 0.3,
7146
6890
  cacheWrite: 3.75,
7147
6891
  },
7148
- contextWindow: 1000000,
6892
+ contextWindow: 200000,
7149
6893
  maxTokens: 64000,
7150
6894
  } satisfies Model<"openai-completions">,
7151
6895
  "anthropic/claude-sonnet-4.5": {
@@ -7199,39 +6943,39 @@ export const MODELS = {
7199
6943
  contextWindow: 131000,
7200
6944
  maxTokens: 4096,
7201
6945
  } satisfies Model<"openai-completions">,
7202
- "arcee-ai/trinity-large-thinking": {
7203
- id: "arcee-ai/trinity-large-thinking",
7204
- name: "Arcee AI: Trinity Large Thinking",
6946
+ "arcee-ai/trinity-mini": {
6947
+ id: "arcee-ai/trinity-mini",
6948
+ name: "Arcee AI: Trinity Mini",
7205
6949
  api: "openai-completions",
7206
6950
  provider: "openrouter",
7207
6951
  baseUrl: "https://openrouter.ai/api/v1",
7208
6952
  reasoning: true,
7209
6953
  input: ["text"],
7210
6954
  cost: {
7211
- input: 0.22,
7212
- output: 0.85,
6955
+ input: 0.045,
6956
+ output: 0.15,
7213
6957
  cacheRead: 0,
7214
6958
  cacheWrite: 0,
7215
6959
  },
7216
- contextWindow: 262144,
7217
- maxTokens: 262144,
6960
+ contextWindow: 131072,
6961
+ maxTokens: 131072,
7218
6962
  } satisfies Model<"openai-completions">,
7219
- "arcee-ai/trinity-mini": {
7220
- id: "arcee-ai/trinity-mini",
7221
- name: "Arcee AI: Trinity Mini",
6963
+ "arcee-ai/trinity-mini:free": {
6964
+ id: "arcee-ai/trinity-mini:free",
6965
+ name: "Arcee AI: Trinity Mini (free)",
7222
6966
  api: "openai-completions",
7223
6967
  provider: "openrouter",
7224
6968
  baseUrl: "https://openrouter.ai/api/v1",
7225
6969
  reasoning: true,
7226
6970
  input: ["text"],
7227
6971
  cost: {
7228
- input: 0.045,
7229
- output: 0.15,
6972
+ input: 0,
6973
+ output: 0,
7230
6974
  cacheRead: 0,
7231
6975
  cacheWrite: 0,
7232
6976
  },
7233
6977
  contextWindow: 131072,
7234
- maxTokens: 131072,
6978
+ maxTokens: 4096,
7235
6979
  } satisfies Model<"openai-completions">,
7236
6980
  "arcee-ai/virtuoso-large": {
7237
6981
  id: "arcee-ai/virtuoso-large",
@@ -7480,13 +7224,13 @@ export const MODELS = {
7480
7224
  reasoning: true,
7481
7225
  input: ["text"],
7482
7226
  cost: {
7483
- input: 0.5,
7227
+ input: 0.44999999999999996,
7484
7228
  output: 2.1500000000000004,
7485
- cacheRead: 0.35,
7229
+ cacheRead: 0.22499999999999998,
7486
7230
  cacheWrite: 0,
7487
7231
  },
7488
7232
  contextWindow: 163840,
7489
- maxTokens: 4096,
7233
+ maxTokens: 65536,
7490
7234
  } satisfies Model<"openai-completions">,
7491
7235
  "deepseek/deepseek-v3.1-terminus": {
7492
7236
  id: "deepseek/deepseek-v3.1-terminus",
@@ -7639,7 +7383,7 @@ export const MODELS = {
7639
7383
  cacheWrite: 0.08333333333333334,
7640
7384
  },
7641
7385
  contextWindow: 1048576,
7642
- maxTokens: 65535,
7386
+ maxTokens: 65536,
7643
7387
  } satisfies Model<"openai-completions">,
7644
7388
  "google/gemini-2.5-pro": {
7645
7389
  id: "google/gemini-2.5-pro",
@@ -7709,6 +7453,23 @@ export const MODELS = {
7709
7453
  contextWindow: 1048576,
7710
7454
  maxTokens: 65536,
7711
7455
  } satisfies Model<"openai-completions">,
7456
+ "google/gemini-3-pro-preview": {
7457
+ id: "google/gemini-3-pro-preview",
7458
+ name: "Google: Gemini 3 Pro Preview",
7459
+ api: "openai-completions",
7460
+ provider: "openrouter",
7461
+ baseUrl: "https://openrouter.ai/api/v1",
7462
+ reasoning: true,
7463
+ input: ["text", "image"],
7464
+ cost: {
7465
+ input: 2,
7466
+ output: 12,
7467
+ cacheRead: 0.19999999999999998,
7468
+ cacheWrite: 0.375,
7469
+ },
7470
+ contextWindow: 1048576,
7471
+ maxTokens: 65536,
7472
+ } satisfies Model<"openai-completions">,
7712
7473
  "google/gemini-3.1-flash-lite-preview": {
7713
7474
  id: "google/gemini-3.1-flash-lite-preview",
7714
7475
  name: "Google: Gemini 3.1 Flash Lite Preview",
@@ -7760,74 +7521,6 @@ export const MODELS = {
7760
7521
  contextWindow: 1048576,
7761
7522
  maxTokens: 65536,
7762
7523
  } satisfies Model<"openai-completions">,
7763
- "google/gemma-4-26b-a4b-it": {
7764
- id: "google/gemma-4-26b-a4b-it",
7765
- name: "Google: Gemma 4 26B A4B ",
7766
- api: "openai-completions",
7767
- provider: "openrouter",
7768
- baseUrl: "https://openrouter.ai/api/v1",
7769
- reasoning: true,
7770
- input: ["text", "image"],
7771
- cost: {
7772
- input: 0.12,
7773
- output: 0.39999999999999997,
7774
- cacheRead: 0,
7775
- cacheWrite: 0,
7776
- },
7777
- contextWindow: 262144,
7778
- maxTokens: 262144,
7779
- } satisfies Model<"openai-completions">,
7780
- "google/gemma-4-26b-a4b-it:free": {
7781
- id: "google/gemma-4-26b-a4b-it:free",
7782
- name: "Google: Gemma 4 26B A4B (free)",
7783
- api: "openai-completions",
7784
- provider: "openrouter",
7785
- baseUrl: "https://openrouter.ai/api/v1",
7786
- reasoning: true,
7787
- input: ["text", "image"],
7788
- cost: {
7789
- input: 0,
7790
- output: 0,
7791
- cacheRead: 0,
7792
- cacheWrite: 0,
7793
- },
7794
- contextWindow: 262144,
7795
- maxTokens: 32768,
7796
- } satisfies Model<"openai-completions">,
7797
- "google/gemma-4-31b-it": {
7798
- id: "google/gemma-4-31b-it",
7799
- name: "Google: Gemma 4 31B",
7800
- api: "openai-completions",
7801
- provider: "openrouter",
7802
- baseUrl: "https://openrouter.ai/api/v1",
7803
- reasoning: true,
7804
- input: ["text", "image"],
7805
- cost: {
7806
- input: 0.14,
7807
- output: 0.39999999999999997,
7808
- cacheRead: 0,
7809
- cacheWrite: 0,
7810
- },
7811
- contextWindow: 262144,
7812
- maxTokens: 131072,
7813
- } satisfies Model<"openai-completions">,
7814
- "google/gemma-4-31b-it:free": {
7815
- id: "google/gemma-4-31b-it:free",
7816
- name: "Google: Gemma 4 31B (free)",
7817
- api: "openai-completions",
7818
- provider: "openrouter",
7819
- baseUrl: "https://openrouter.ai/api/v1",
7820
- reasoning: true,
7821
- input: ["text", "image"],
7822
- cost: {
7823
- input: 0,
7824
- output: 0,
7825
- cacheRead: 0,
7826
- cacheWrite: 0,
7827
- },
7828
- contextWindow: 262144,
7829
- maxTokens: 32768,
7830
- } satisfies Model<"openai-completions">,
7831
7524
  "inception/mercury": {
7832
7525
  id: "inception/mercury",
7833
7526
  name: "Inception: Mercury",
@@ -7879,22 +7572,22 @@ export const MODELS = {
7879
7572
  contextWindow: 128000,
7880
7573
  maxTokens: 32000,
7881
7574
  } satisfies Model<"openai-completions">,
7882
- "kwaipilot/kat-coder-pro-v2": {
7883
- id: "kwaipilot/kat-coder-pro-v2",
7884
- name: "Kwaipilot: KAT-Coder-Pro V2",
7575
+ "kwaipilot/kat-coder-pro": {
7576
+ id: "kwaipilot/kat-coder-pro",
7577
+ name: "Kwaipilot: KAT-Coder-Pro V1",
7885
7578
  api: "openai-completions",
7886
7579
  provider: "openrouter",
7887
7580
  baseUrl: "https://openrouter.ai/api/v1",
7888
7581
  reasoning: false,
7889
7582
  input: ["text"],
7890
7583
  cost: {
7891
- input: 0.3,
7892
- output: 1.2,
7893
- cacheRead: 0.06,
7584
+ input: 0.207,
7585
+ output: 0.828,
7586
+ cacheRead: 0.0414,
7894
7587
  cacheWrite: 0,
7895
7588
  },
7896
7589
  contextWindow: 256000,
7897
- maxTokens: 80000,
7590
+ maxTokens: 128000,
7898
7591
  } satisfies Model<"openai-completions">,
7899
7592
  "meituan/longcat-flash-chat": {
7900
7593
  id: "meituan/longcat-flash-chat",
@@ -8075,13 +7768,13 @@ export const MODELS = {
8075
7768
  reasoning: true,
8076
7769
  input: ["text"],
8077
7770
  cost: {
8078
- input: 0.29,
7771
+ input: 0.27,
8079
7772
  output: 0.95,
8080
- cacheRead: 0.03,
7773
+ cacheRead: 0.0290000007,
8081
7774
  cacheWrite: 0,
8082
7775
  },
8083
7776
  contextWindow: 196608,
8084
- maxTokens: 196608,
7777
+ maxTokens: 4096,
8085
7778
  } satisfies Model<"openai-completions">,
8086
7779
  "minimax/minimax-m2.5": {
8087
7780
  id: "minimax/minimax-m2.5",
@@ -8092,9 +7785,9 @@ export const MODELS = {
8092
7785
  reasoning: true,
8093
7786
  input: ["text"],
8094
7787
  cost: {
8095
- input: 0.118,
8096
- output: 0.9900000000000001,
8097
- cacheRead: 0.059,
7788
+ input: 0.19999999999999998,
7789
+ output: 1.17,
7790
+ cacheRead: 0.09999999999999999,
8098
7791
  cacheWrite: 0,
8099
7792
  },
8100
7793
  contextWindow: 196608,
@@ -8115,7 +7808,7 @@ export const MODELS = {
8115
7808
  cacheWrite: 0,
8116
7809
  },
8117
7810
  contextWindow: 196608,
8118
- maxTokens: 8192,
7811
+ maxTokens: 196608,
8119
7812
  } satisfies Model<"openai-completions">,
8120
7813
  "minimax/minimax-m2.7": {
8121
7814
  id: "minimax/minimax-m2.7",
@@ -8128,11 +7821,11 @@ export const MODELS = {
8128
7821
  cost: {
8129
7822
  input: 0.3,
8130
7823
  output: 1.2,
8131
- cacheRead: 0.059,
7824
+ cacheRead: 0.06,
8132
7825
  cacheWrite: 0,
8133
7826
  },
8134
- contextWindow: 196608,
8135
- maxTokens: 4096,
7827
+ contextWindow: 204800,
7828
+ maxTokens: 131072,
8136
7829
  } satisfies Model<"openai-completions">,
8137
7830
  "mistralai/codestral-2508": {
8138
7831
  id: "mistralai/codestral-2508",
@@ -8389,6 +8082,23 @@ export const MODELS = {
8389
8082
  contextWindow: 32768,
8390
8083
  maxTokens: 4096,
8391
8084
  } satisfies Model<"openai-completions">,
8085
+ "mistralai/mistral-small-24b-instruct-2501": {
8086
+ id: "mistralai/mistral-small-24b-instruct-2501",
8087
+ name: "Mistral: Mistral Small 3",
8088
+ api: "openai-completions",
8089
+ provider: "openrouter",
8090
+ baseUrl: "https://openrouter.ai/api/v1",
8091
+ reasoning: false,
8092
+ input: ["text"],
8093
+ cost: {
8094
+ input: 0.049999999999999996,
8095
+ output: 0.08,
8096
+ cacheRead: 0,
8097
+ cacheWrite: 0,
8098
+ },
8099
+ contextWindow: 32768,
8100
+ maxTokens: 16384,
8101
+ } satisfies Model<"openai-completions">,
8392
8102
  "mistralai/mistral-small-2603": {
8393
8103
  id: "mistralai/mistral-small-2603",
8394
8104
  name: "Mistral: Mistral Small 4",
@@ -8406,6 +8116,23 @@ export const MODELS = {
8406
8116
  contextWindow: 262144,
8407
8117
  maxTokens: 4096,
8408
8118
  } satisfies Model<"openai-completions">,
8119
+ "mistralai/mistral-small-3.1-24b-instruct:free": {
8120
+ id: "mistralai/mistral-small-3.1-24b-instruct:free",
8121
+ name: "Mistral: Mistral Small 3.1 24B (free)",
8122
+ api: "openai-completions",
8123
+ provider: "openrouter",
8124
+ baseUrl: "https://openrouter.ai/api/v1",
8125
+ reasoning: false,
8126
+ input: ["text", "image"],
8127
+ cost: {
8128
+ input: 0,
8129
+ output: 0,
8130
+ cacheRead: 0,
8131
+ cacheWrite: 0,
8132
+ },
8133
+ contextWindow: 128000,
8134
+ maxTokens: 4096,
8135
+ } satisfies Model<"openai-completions">,
8409
8136
  "mistralai/mistral-small-3.2-24b-instruct": {
8410
8137
  id: "mistralai/mistral-small-3.2-24b-instruct",
8411
8138
  name: "Mistral: Mistral Small 3.2 24B",
@@ -8517,13 +8244,13 @@ export const MODELS = {
8517
8244
  reasoning: false,
8518
8245
  input: ["text"],
8519
8246
  cost: {
8520
- input: 0.5700000000000001,
8521
- output: 2.3,
8247
+ input: 0.55,
8248
+ output: 2.2,
8522
8249
  cacheRead: 0,
8523
8250
  cacheWrite: 0,
8524
8251
  },
8525
- contextWindow: 131072,
8526
- maxTokens: 131072,
8252
+ contextWindow: 131000,
8253
+ maxTokens: 4096,
8527
8254
  } satisfies Model<"openai-completions">,
8528
8255
  "moonshotai/kimi-k2-0905": {
8529
8256
  id: "moonshotai/kimi-k2-0905",
@@ -8536,11 +8263,11 @@ export const MODELS = {
8536
8263
  cost: {
8537
8264
  input: 0.39999999999999997,
8538
8265
  output: 2,
8539
- cacheRead: 0,
8266
+ cacheRead: 0.15,
8540
8267
  cacheWrite: 0,
8541
8268
  },
8542
- contextWindow: 262144,
8543
- maxTokens: 262144,
8269
+ contextWindow: 131072,
8270
+ maxTokens: 4096,
8544
8271
  } satisfies Model<"openai-completions">,
8545
8272
  "moonshotai/kimi-k2-thinking": {
8546
8273
  id: "moonshotai/kimi-k2-thinking",
@@ -8551,12 +8278,12 @@ export const MODELS = {
8551
8278
  reasoning: true,
8552
8279
  input: ["text"],
8553
8280
  cost: {
8554
- input: 0.6,
8555
- output: 2.5,
8556
- cacheRead: 0,
8281
+ input: 0.47,
8282
+ output: 2,
8283
+ cacheRead: 0.14100000000000001,
8557
8284
  cacheWrite: 0,
8558
8285
  },
8559
- contextWindow: 262144,
8286
+ contextWindow: 131072,
8560
8287
  maxTokens: 4096,
8561
8288
  } satisfies Model<"openai-completions">,
8562
8289
  "moonshotai/kimi-k2.5": {
@@ -8585,8 +8312,8 @@ export const MODELS = {
8585
8312
  reasoning: false,
8586
8313
  input: ["text"],
8587
8314
  cost: {
8588
- input: 0.135,
8589
- output: 0.5,
8315
+ input: 0.27,
8316
+ output: 1,
8590
8317
  cacheRead: 0,
8591
8318
  cacheWrite: 0,
8592
8319
  },
@@ -8672,7 +8399,7 @@ export const MODELS = {
8672
8399
  cost: {
8673
8400
  input: 0.09999999999999999,
8674
8401
  output: 0.5,
8675
- cacheRead: 0.09999999999999999,
8402
+ cacheRead: 0.04,
8676
8403
  cacheWrite: 0,
8677
8404
  },
8678
8405
  contextWindow: 262144,
@@ -8897,7 +8624,7 @@ export const MODELS = {
8897
8624
  cacheWrite: 0,
8898
8625
  },
8899
8626
  contextWindow: 1047576,
8900
- maxTokens: 4096,
8627
+ maxTokens: 32768,
8901
8628
  } satisfies Model<"openai-completions">,
8902
8629
  "openai/gpt-4.1-mini": {
8903
8630
  id: "openai/gpt-4.1-mini",
@@ -8944,7 +8671,7 @@ export const MODELS = {
8944
8671
  cost: {
8945
8672
  input: 2.5,
8946
8673
  output: 10,
8947
- cacheRead: 0,
8674
+ cacheRead: 1.25,
8948
8675
  cacheWrite: 0,
8949
8676
  },
8950
8677
  contextWindow: 128000,
@@ -9165,11 +8892,11 @@ export const MODELS = {
9165
8892
  cost: {
9166
8893
  input: 0.049999999999999996,
9167
8894
  output: 0.39999999999999997,
9168
- cacheRead: 0.01,
8895
+ cacheRead: 0.005,
9169
8896
  cacheWrite: 0,
9170
8897
  },
9171
8898
  contextWindow: 400000,
9172
- maxTokens: 4096,
8899
+ maxTokens: 128000,
9173
8900
  } satisfies Model<"openai-completions">,
9174
8901
  "openai/gpt-5-pro": {
9175
8902
  id: "openai/gpt-5-pro",
@@ -9199,7 +8926,7 @@ export const MODELS = {
9199
8926
  cost: {
9200
8927
  input: 1.25,
9201
8928
  output: 10,
9202
- cacheRead: 0.13,
8929
+ cacheRead: 0.125,
9203
8930
  cacheWrite: 0,
9204
8931
  },
9205
8932
  contextWindow: 400000,
@@ -9267,11 +8994,11 @@ export const MODELS = {
9267
8994
  cost: {
9268
8995
  input: 0.25,
9269
8996
  output: 2,
9270
- cacheRead: 0.03,
8997
+ cacheRead: 0.024999999999999998,
9271
8998
  cacheWrite: 0,
9272
8999
  },
9273
9000
  contextWindow: 400000,
9274
- maxTokens: 128000,
9001
+ maxTokens: 100000,
9275
9002
  } satisfies Model<"openai-completions">,
9276
9003
  "openai/gpt-5.2": {
9277
9004
  id: "openai/gpt-5.2",
@@ -9305,7 +9032,7 @@ export const MODELS = {
9305
9032
  cacheWrite: 0,
9306
9033
  },
9307
9034
  contextWindow: 128000,
9308
- maxTokens: 32000,
9035
+ maxTokens: 16384,
9309
9036
  } satisfies Model<"openai-completions">,
9310
9037
  "openai/gpt-5.2-codex": {
9311
9038
  id: "openai/gpt-5.2-codex",
@@ -9443,40 +9170,6 @@ export const MODELS = {
9443
9170
  contextWindow: 1050000,
9444
9171
  maxTokens: 128000,
9445
9172
  } satisfies Model<"openai-completions">,
9446
- "openai/gpt-audio": {
9447
- id: "openai/gpt-audio",
9448
- name: "OpenAI: GPT Audio",
9449
- api: "openai-completions",
9450
- provider: "openrouter",
9451
- baseUrl: "https://openrouter.ai/api/v1",
9452
- reasoning: false,
9453
- input: ["text"],
9454
- cost: {
9455
- input: 2.5,
9456
- output: 10,
9457
- cacheRead: 0,
9458
- cacheWrite: 0,
9459
- },
9460
- contextWindow: 128000,
9461
- maxTokens: 16384,
9462
- } satisfies Model<"openai-completions">,
9463
- "openai/gpt-audio-mini": {
9464
- id: "openai/gpt-audio-mini",
9465
- name: "OpenAI: GPT Audio Mini",
9466
- api: "openai-completions",
9467
- provider: "openrouter",
9468
- baseUrl: "https://openrouter.ai/api/v1",
9469
- reasoning: false,
9470
- input: ["text"],
9471
- cost: {
9472
- input: 0.6,
9473
- output: 2.4,
9474
- cacheRead: 0,
9475
- cacheWrite: 0,
9476
- },
9477
- contextWindow: 128000,
9478
- maxTokens: 16384,
9479
- } satisfies Model<"openai-completions">,
9480
9173
  "openai/gpt-oss-120b": {
9481
9174
  id: "openai/gpt-oss-120b",
9482
9175
  name: "OpenAI: gpt-oss-120b",
@@ -9521,12 +9214,12 @@ export const MODELS = {
9521
9214
  input: ["text"],
9522
9215
  cost: {
9523
9216
  input: 0.03,
9524
- output: 0.14,
9525
- cacheRead: 0,
9217
+ output: 0.11,
9218
+ cacheRead: 0.015,
9526
9219
  cacheWrite: 0,
9527
9220
  },
9528
9221
  contextWindow: 131072,
9529
- maxTokens: 4096,
9222
+ maxTokens: 131072,
9530
9223
  } satisfies Model<"openai-completions">,
9531
9224
  "openai/gpt-oss-20b:free": {
9532
9225
  id: "openai/gpt-oss-20b:free",
@@ -9543,7 +9236,7 @@ export const MODELS = {
9543
9236
  cacheWrite: 0,
9544
9237
  },
9545
9238
  contextWindow: 131072,
9546
- maxTokens: 8192,
9239
+ maxTokens: 131072,
9547
9240
  } satisfies Model<"openai-completions">,
9548
9241
  "openai/gpt-oss-safeguard-20b": {
9549
9242
  id: "openai/gpt-oss-safeguard-20b",
@@ -9798,7 +9491,7 @@ export const MODELS = {
9798
9491
  cacheWrite: 0,
9799
9492
  },
9800
9493
  contextWindow: 32768,
9801
- maxTokens: 32768,
9494
+ maxTokens: 4096,
9802
9495
  } satisfies Model<"openai-completions">,
9803
9496
  "qwen/qwen-max": {
9804
9497
  id: "qwen/qwen-max",
@@ -10038,6 +9731,23 @@ export const MODELS = {
10038
9731
  contextWindow: 40960,
10039
9732
  maxTokens: 40960,
10040
9733
  } satisfies Model<"openai-completions">,
9734
+ "qwen/qwen3-4b:free": {
9735
+ id: "qwen/qwen3-4b:free",
9736
+ name: "Qwen: Qwen3 4B (free)",
9737
+ api: "openai-completions",
9738
+ provider: "openrouter",
9739
+ baseUrl: "https://openrouter.ai/api/v1",
9740
+ reasoning: true,
9741
+ input: ["text"],
9742
+ cost: {
9743
+ input: 0,
9744
+ output: 0,
9745
+ cacheRead: 0,
9746
+ cacheWrite: 0,
9747
+ },
9748
+ contextWindow: 40960,
9749
+ maxTokens: 4096,
9750
+ } satisfies Model<"openai-completions">,
10041
9751
  "qwen/qwen3-8b": {
10042
9752
  id: "qwen/qwen3-8b",
10043
9753
  name: "Qwen: Qwen3 8B",
@@ -10115,13 +9825,13 @@ export const MODELS = {
10115
9825
  reasoning: false,
10116
9826
  input: ["text"],
10117
9827
  cost: {
10118
- input: 0.15,
10119
- output: 0.7999999999999999,
10120
- cacheRead: 0.12,
9828
+ input: 0.12,
9829
+ output: 0.75,
9830
+ cacheRead: 0.06,
10121
9831
  cacheWrite: 0,
10122
9832
  },
10123
9833
  contextWindow: 262144,
10124
- maxTokens: 262144,
9834
+ maxTokens: 65536,
10125
9835
  } satisfies Model<"openai-completions">,
10126
9836
  "qwen/qwen3-coder-plus": {
10127
9837
  id: "qwen/qwen3-coder-plus",
@@ -10444,7 +10154,7 @@ export const MODELS = {
10444
10154
  cacheWrite: 0,
10445
10155
  },
10446
10156
  contextWindow: 256000,
10447
- maxTokens: 32768,
10157
+ maxTokens: 4096,
10448
10158
  } satisfies Model<"openai-completions">,
10449
10159
  "qwen/qwen3.5-flash-02-23": {
10450
10160
  id: "qwen/qwen3.5-flash-02-23",
@@ -10480,23 +10190,6 @@ export const MODELS = {
10480
10190
  contextWindow: 1000000,
10481
10191
  maxTokens: 65536,
10482
10192
  } satisfies Model<"openai-completions">,
10483
- "qwen/qwen3.6-plus": {
10484
- id: "qwen/qwen3.6-plus",
10485
- name: "Qwen: Qwen3.6 Plus",
10486
- api: "openai-completions",
10487
- provider: "openrouter",
10488
- baseUrl: "https://openrouter.ai/api/v1",
10489
- reasoning: true,
10490
- input: ["text", "image"],
10491
- cost: {
10492
- input: 0.325,
10493
- output: 1.95,
10494
- cacheRead: 0,
10495
- cacheWrite: 0,
10496
- },
10497
- contextWindow: 1000000,
10498
- maxTokens: 65536,
10499
- } satisfies Model<"openai-completions">,
10500
10193
  "qwen/qwq-32b": {
10501
10194
  id: "qwen/qwq-32b",
10502
10195
  name: "Qwen: QwQ 32B",
@@ -10514,23 +10207,6 @@ export const MODELS = {
10514
10207
  contextWindow: 131072,
10515
10208
  maxTokens: 131072,
10516
10209
  } satisfies Model<"openai-completions">,
10517
- "rekaai/reka-edge": {
10518
- id: "rekaai/reka-edge",
10519
- name: "Reka Edge",
10520
- api: "openai-completions",
10521
- provider: "openrouter",
10522
- baseUrl: "https://openrouter.ai/api/v1",
10523
- reasoning: false,
10524
- input: ["text", "image"],
10525
- cost: {
10526
- input: 0.09999999999999999,
10527
- output: 0.09999999999999999,
10528
- cacheRead: 0,
10529
- cacheWrite: 0,
10530
- },
10531
- contextWindow: 16384,
10532
- maxTokens: 16384,
10533
- } satisfies Model<"openai-completions">,
10534
10210
  "relace/relace-search": {
10535
10211
  id: "relace/relace-search",
10536
10212
  name: "Relace: Relace Search",
@@ -10593,11 +10269,28 @@ export const MODELS = {
10593
10269
  cost: {
10594
10270
  input: 0.09999999999999999,
10595
10271
  output: 0.3,
10272
+ cacheRead: 0.02,
10273
+ cacheWrite: 0,
10274
+ },
10275
+ contextWindow: 256000,
10276
+ maxTokens: 256000,
10277
+ } satisfies Model<"openai-completions">,
10278
+ "stepfun/step-3.5-flash:free": {
10279
+ id: "stepfun/step-3.5-flash:free",
10280
+ name: "StepFun: Step 3.5 Flash (free)",
10281
+ api: "openai-completions",
10282
+ provider: "openrouter",
10283
+ baseUrl: "https://openrouter.ai/api/v1",
10284
+ reasoning: true,
10285
+ input: ["text"],
10286
+ cost: {
10287
+ input: 0,
10288
+ output: 0,
10596
10289
  cacheRead: 0,
10597
10290
  cacheWrite: 0,
10598
10291
  },
10599
- contextWindow: 262144,
10600
- maxTokens: 65536,
10292
+ contextWindow: 256000,
10293
+ maxTokens: 256000,
10601
10294
  } satisfies Model<"openai-completions">,
10602
10295
  "thedrummer/rocinante-12b": {
10603
10296
  id: "thedrummer/rocinante-12b",
@@ -10786,9 +10479,9 @@ export const MODELS = {
10786
10479
  contextWindow: 2000000,
10787
10480
  maxTokens: 30000,
10788
10481
  } satisfies Model<"openai-completions">,
10789
- "x-ai/grok-4.20": {
10790
- id: "x-ai/grok-4.20",
10791
- name: "xAI: Grok 4.20",
10482
+ "x-ai/grok-4.20-beta": {
10483
+ id: "x-ai/grok-4.20-beta",
10484
+ name: "xAI: Grok 4.20 Beta",
10792
10485
  api: "openai-completions",
10793
10486
  provider: "openrouter",
10794
10487
  baseUrl: "https://openrouter.ai/api/v1",
@@ -11050,43 +10743,9 @@ export const MODELS = {
11050
10743
  reasoning: true,
11051
10744
  input: ["text"],
11052
10745
  cost: {
11053
- input: 1.2,
11054
- output: 4,
11055
- cacheRead: 0.24,
11056
- cacheWrite: 0,
11057
- },
11058
- contextWindow: 202752,
11059
- maxTokens: 131072,
11060
- } satisfies Model<"openai-completions">,
11061
- "z-ai/glm-5.1": {
11062
- id: "z-ai/glm-5.1",
11063
- name: "Z.ai: GLM 5.1",
11064
- api: "openai-completions",
11065
- provider: "openrouter",
11066
- baseUrl: "https://openrouter.ai/api/v1",
11067
- reasoning: true,
11068
- input: ["text"],
11069
- cost: {
11070
- input: 0.95,
11071
- output: 3.15,
11072
- cacheRead: 0.475,
11073
- cacheWrite: 0,
11074
- },
11075
- contextWindow: 202752,
11076
- maxTokens: 65535,
11077
- } satisfies Model<"openai-completions">,
11078
- "z-ai/glm-5v-turbo": {
11079
- id: "z-ai/glm-5v-turbo",
11080
- name: "Z.ai: GLM 5V Turbo",
11081
- api: "openai-completions",
11082
- provider: "openrouter",
11083
- baseUrl: "https://openrouter.ai/api/v1",
11084
- reasoning: true,
11085
- input: ["text", "image"],
11086
- cost: {
11087
- input: 1.2,
11088
- output: 4,
11089
- cacheRead: 0.24,
10746
+ input: 0.96,
10747
+ output: 3.1999999999999997,
10748
+ cacheRead: 0.192,
11090
10749
  cacheWrite: 0,
11091
10750
  },
11092
10751
  contextWindow: 202752,
@@ -11113,20 +10772,20 @@ export const MODELS = {
11113
10772
  } satisfies Model<"anthropic-messages">,
11114
10773
  "alibaba/qwen-3-235b": {
11115
10774
  id: "alibaba/qwen-3-235b",
11116
- name: "Qwen3 235B A22b Instruct 2507",
10775
+ name: "Qwen3-235B-A22B",
11117
10776
  api: "anthropic-messages",
11118
10777
  provider: "vercel-ai-gateway",
11119
10778
  baseUrl: "https://ai-gateway.vercel.sh",
11120
10779
  reasoning: false,
11121
10780
  input: ["text"],
11122
10781
  cost: {
11123
- input: 0.6,
11124
- output: 1.2,
11125
- cacheRead: 0.6,
10782
+ input: 0.071,
10783
+ output: 0.463,
10784
+ cacheRead: 0,
11126
10785
  cacheWrite: 0,
11127
10786
  },
11128
- contextWindow: 131000,
11129
- maxTokens: 40000,
10787
+ contextWindow: 40960,
10788
+ maxTokens: 16384,
11130
10789
  } satisfies Model<"anthropic-messages">,
11131
10790
  "alibaba/qwen-3-30b": {
11132
10791
  id: "alibaba/qwen-3-30b",
@@ -11154,13 +10813,13 @@ export const MODELS = {
11154
10813
  reasoning: true,
11155
10814
  input: ["text"],
11156
10815
  cost: {
11157
- input: 0.16,
11158
- output: 0.64,
11159
- cacheRead: 0,
10816
+ input: 0.29,
10817
+ output: 0.59,
10818
+ cacheRead: 0.145,
11160
10819
  cacheWrite: 0,
11161
10820
  },
11162
- contextWindow: 128000,
11163
- maxTokens: 8192,
10821
+ contextWindow: 131072,
10822
+ maxTokens: 40960,
11164
10823
  } satisfies Model<"anthropic-messages">,
11165
10824
  "alibaba/qwen3-235b-a22b-thinking": {
11166
10825
  id: "alibaba/qwen3-235b-a22b-thinking",
@@ -11188,13 +10847,13 @@ export const MODELS = {
11188
10847
  reasoning: false,
11189
10848
  input: ["text"],
11190
10849
  cost: {
11191
- input: 1.5,
11192
- output: 7.5,
11193
- cacheRead: 0.3,
10850
+ input: 0.39999999999999997,
10851
+ output: 1.5999999999999999,
10852
+ cacheRead: 0.022,
11194
10853
  cacheWrite: 0,
11195
10854
  },
11196
10855
  contextWindow: 262144,
11197
- maxTokens: 65536,
10856
+ maxTokens: 66536,
11198
10857
  } satisfies Model<"anthropic-messages">,
11199
10858
  "alibaba/qwen3-coder-30b-a3b": {
11200
10859
  id: "alibaba/qwen3-coder-30b-a3b",
@@ -11307,13 +10966,13 @@ export const MODELS = {
11307
10966
  reasoning: true,
11308
10967
  input: ["text", "image"],
11309
10968
  cost: {
11310
- input: 0.39999999999999997,
11311
- output: 4,
10969
+ input: 0.22,
10970
+ output: 0.88,
11312
10971
  cacheRead: 0,
11313
10972
  cacheWrite: 0,
11314
10973
  },
11315
- contextWindow: 131072,
11316
- maxTokens: 32768,
10974
+ contextWindow: 256000,
10975
+ maxTokens: 256000,
11317
10976
  } satisfies Model<"anthropic-messages">,
11318
10977
  "alibaba/qwen3.5-flash": {
11319
10978
  id: "alibaba/qwen3.5-flash",
@@ -11349,23 +11008,6 @@ export const MODELS = {
11349
11008
  contextWindow: 1000000,
11350
11009
  maxTokens: 64000,
11351
11010
  } satisfies Model<"anthropic-messages">,
11352
- "alibaba/qwen3.6-plus": {
11353
- id: "alibaba/qwen3.6-plus",
11354
- name: "Qwen 3.6 Plus",
11355
- api: "anthropic-messages",
11356
- provider: "vercel-ai-gateway",
11357
- baseUrl: "https://ai-gateway.vercel.sh",
11358
- reasoning: true,
11359
- input: ["text", "image"],
11360
- cost: {
11361
- input: 0.5,
11362
- output: 3,
11363
- cacheRead: 0.09999999999999999,
11364
- cacheWrite: 0,
11365
- },
11366
- contextWindow: 1000000,
11367
- maxTokens: 64000,
11368
- } satisfies Model<"anthropic-messages">,
11369
11011
  "anthropic/claude-3-haiku": {
11370
11012
  id: "anthropic/claude-3-haiku",
11371
11013
  name: "Claude 3 Haiku",
@@ -11400,6 +11042,40 @@ export const MODELS = {
11400
11042
  contextWindow: 200000,
11401
11043
  maxTokens: 8192,
11402
11044
  } satisfies Model<"anthropic-messages">,
11045
+ "anthropic/claude-3.5-sonnet": {
11046
+ id: "anthropic/claude-3.5-sonnet",
11047
+ name: "Claude 3.5 Sonnet",
11048
+ api: "anthropic-messages",
11049
+ provider: "vercel-ai-gateway",
11050
+ baseUrl: "https://ai-gateway.vercel.sh",
11051
+ reasoning: false,
11052
+ input: ["text", "image"],
11053
+ cost: {
11054
+ input: 3,
11055
+ output: 15,
11056
+ cacheRead: 0.3,
11057
+ cacheWrite: 3.75,
11058
+ },
11059
+ contextWindow: 200000,
11060
+ maxTokens: 8192,
11061
+ } satisfies Model<"anthropic-messages">,
11062
+ "anthropic/claude-3.5-sonnet-20240620": {
11063
+ id: "anthropic/claude-3.5-sonnet-20240620",
11064
+ name: "Claude 3.5 Sonnet (2024-06-20)",
11065
+ api: "anthropic-messages",
11066
+ provider: "vercel-ai-gateway",
11067
+ baseUrl: "https://ai-gateway.vercel.sh",
11068
+ reasoning: false,
11069
+ input: ["text", "image"],
11070
+ cost: {
11071
+ input: 3,
11072
+ output: 15,
11073
+ cacheRead: 0.3,
11074
+ cacheWrite: 3.75,
11075
+ },
11076
+ contextWindow: 200000,
11077
+ maxTokens: 8192,
11078
+ } satisfies Model<"anthropic-messages">,
11403
11079
  "anthropic/claude-3.7-sonnet": {
11404
11080
  id: "anthropic/claude-3.7-sonnet",
11405
11081
  name: "Claude 3.7 Sonnet",
@@ -11570,23 +11246,6 @@ export const MODELS = {
11570
11246
  contextWindow: 131000,
11571
11247
  maxTokens: 131000,
11572
11248
  } satisfies Model<"anthropic-messages">,
11573
- "arcee-ai/trinity-large-thinking": {
11574
- id: "arcee-ai/trinity-large-thinking",
11575
- name: "Trinity Large Thinking",
11576
- api: "anthropic-messages",
11577
- provider: "vercel-ai-gateway",
11578
- baseUrl: "https://ai-gateway.vercel.sh",
11579
- reasoning: true,
11580
- input: ["text"],
11581
- cost: {
11582
- input: 0.25,
11583
- output: 0.8999999999999999,
11584
- cacheRead: 0,
11585
- cacheWrite: 0,
11586
- },
11587
- contextWindow: 262100,
11588
- maxTokens: 80000,
11589
- } satisfies Model<"anthropic-messages">,
11590
11249
  "bytedance/seed-1.6": {
11591
11250
  id: "bytedance/seed-1.6",
11592
11251
  name: "Seed 1.6",
@@ -11664,13 +11323,13 @@ export const MODELS = {
11664
11323
  reasoning: true,
11665
11324
  input: ["text"],
11666
11325
  cost: {
11667
- input: 0.56,
11668
- output: 1.68,
11669
- cacheRead: 0.28,
11326
+ input: 0.5,
11327
+ output: 1.5,
11328
+ cacheRead: 0,
11670
11329
  cacheWrite: 0,
11671
11330
  },
11672
11331
  contextWindow: 163840,
11673
- maxTokens: 8192,
11332
+ maxTokens: 16384,
11674
11333
  } satisfies Model<"anthropic-messages">,
11675
11334
  "deepseek/deepseek-v3.1-terminus": {
11676
11335
  id: "deepseek/deepseek-v3.1-terminus",
@@ -11853,7 +11512,7 @@ export const MODELS = {
11853
11512
  cost: {
11854
11513
  input: 0.25,
11855
11514
  output: 1.5,
11856
- cacheRead: 0.03,
11515
+ cacheRead: 0,
11857
11516
  cacheWrite: 0,
11858
11517
  },
11859
11518
  contextWindow: 1000000,
@@ -11876,40 +11535,6 @@ export const MODELS = {
11876
11535
  contextWindow: 1000000,
11877
11536
  maxTokens: 64000,
11878
11537
  } satisfies Model<"anthropic-messages">,
11879
- "google/gemma-4-26b-a4b-it": {
11880
- id: "google/gemma-4-26b-a4b-it",
11881
- name: "Gemma 4 26B A4B IT",
11882
- api: "anthropic-messages",
11883
- provider: "vercel-ai-gateway",
11884
- baseUrl: "https://ai-gateway.vercel.sh",
11885
- reasoning: false,
11886
- input: ["text", "image"],
11887
- cost: {
11888
- input: 0.13,
11889
- output: 0.39999999999999997,
11890
- cacheRead: 0,
11891
- cacheWrite: 0,
11892
- },
11893
- contextWindow: 262144,
11894
- maxTokens: 131072,
11895
- } satisfies Model<"anthropic-messages">,
11896
- "google/gemma-4-31b-it": {
11897
- id: "google/gemma-4-31b-it",
11898
- name: "Gemma 4 31B IT",
11899
- api: "anthropic-messages",
11900
- provider: "vercel-ai-gateway",
11901
- baseUrl: "https://ai-gateway.vercel.sh",
11902
- reasoning: false,
11903
- input: ["text", "image"],
11904
- cost: {
11905
- input: 0.14,
11906
- output: 0.39999999999999997,
11907
- cacheRead: 0,
11908
- cacheWrite: 0,
11909
- },
11910
- contextWindow: 262144,
11911
- maxTokens: 131072,
11912
- } satisfies Model<"anthropic-messages">,
11913
11538
  "inception/mercury-2": {
11914
11539
  id: "inception/mercury-2",
11915
11540
  name: "Mercury 2",
@@ -11944,39 +11569,39 @@ export const MODELS = {
11944
11569
  contextWindow: 32000,
11945
11570
  maxTokens: 16384,
11946
11571
  } satisfies Model<"anthropic-messages">,
11947
- "kwaipilot/kat-coder-pro-v2": {
11948
- id: "kwaipilot/kat-coder-pro-v2",
11949
- name: "Kat Coder Pro V2",
11572
+ "meituan/longcat-flash-chat": {
11573
+ id: "meituan/longcat-flash-chat",
11574
+ name: "LongCat Flash Chat",
11950
11575
  api: "anthropic-messages",
11951
11576
  provider: "vercel-ai-gateway",
11952
11577
  baseUrl: "https://ai-gateway.vercel.sh",
11953
- reasoning: true,
11578
+ reasoning: false,
11954
11579
  input: ["text"],
11955
11580
  cost: {
11956
- input: 0.3,
11957
- output: 1.2,
11958
- cacheRead: 0.06,
11581
+ input: 0,
11582
+ output: 0,
11583
+ cacheRead: 0,
11959
11584
  cacheWrite: 0,
11960
11585
  },
11961
- contextWindow: 256000,
11962
- maxTokens: 256000,
11586
+ contextWindow: 128000,
11587
+ maxTokens: 100000,
11963
11588
  } satisfies Model<"anthropic-messages">,
11964
- "meituan/longcat-flash-chat": {
11965
- id: "meituan/longcat-flash-chat",
11966
- name: "LongCat Flash Chat",
11589
+ "meituan/longcat-flash-thinking": {
11590
+ id: "meituan/longcat-flash-thinking",
11591
+ name: "LongCat Flash Thinking",
11967
11592
  api: "anthropic-messages",
11968
11593
  provider: "vercel-ai-gateway",
11969
11594
  baseUrl: "https://ai-gateway.vercel.sh",
11970
- reasoning: false,
11595
+ reasoning: true,
11971
11596
  input: ["text"],
11972
11597
  cost: {
11973
- input: 0,
11974
- output: 0,
11598
+ input: 0.15,
11599
+ output: 1.5,
11975
11600
  cacheRead: 0,
11976
11601
  cacheWrite: 0,
11977
11602
  },
11978
11603
  contextWindow: 128000,
11979
- maxTokens: 100000,
11604
+ maxTokens: 8192,
11980
11605
  } satisfies Model<"anthropic-messages">,
11981
11606
  "meta/llama-3.1-70b": {
11982
11607
  id: "meta/llama-3.1-70b",
@@ -12004,13 +11629,13 @@ export const MODELS = {
12004
11629
  reasoning: false,
12005
11630
  input: ["text"],
12006
11631
  cost: {
12007
- input: 0.22,
12008
- output: 0.22,
12009
- cacheRead: 0,
11632
+ input: 0.09999999999999999,
11633
+ output: 0.09999999999999999,
11634
+ cacheRead: 0.09999999999999999,
12010
11635
  cacheWrite: 0,
12011
11636
  },
12012
11637
  contextWindow: 128000,
12013
- maxTokens: 8192,
11638
+ maxTokens: 16384,
12014
11639
  } satisfies Model<"anthropic-messages">,
12015
11640
  "meta/llama-3.2-11b": {
12016
11641
  id: "meta/llama-3.2-11b",
@@ -12388,20 +12013,20 @@ export const MODELS = {
12388
12013
  } satisfies Model<"anthropic-messages">,
12389
12014
  "moonshotai/kimi-k2": {
12390
12015
  id: "moonshotai/kimi-k2",
12391
- name: "Kimi K2 Instruct",
12016
+ name: "Kimi K2",
12392
12017
  api: "anthropic-messages",
12393
12018
  provider: "vercel-ai-gateway",
12394
12019
  baseUrl: "https://ai-gateway.vercel.sh",
12395
12020
  reasoning: false,
12396
12021
  input: ["text"],
12397
12022
  cost: {
12398
- input: 0.5700000000000001,
12399
- output: 2.3,
12400
- cacheRead: 0,
12023
+ input: 0.6,
12024
+ output: 2.5,
12025
+ cacheRead: 0.15,
12401
12026
  cacheWrite: 0,
12402
12027
  },
12403
12028
  contextWindow: 131072,
12404
- maxTokens: 131072,
12029
+ maxTokens: 16384,
12405
12030
  } satisfies Model<"anthropic-messages">,
12406
12031
  "moonshotai/kimi-k2-0905": {
12407
12032
  id: "moonshotai/kimi-k2-0905",
@@ -12414,11 +12039,11 @@ export const MODELS = {
12414
12039
  cost: {
12415
12040
  input: 0.6,
12416
12041
  output: 2.5,
12417
- cacheRead: 0.3,
12042
+ cacheRead: 0.15,
12418
12043
  cacheWrite: 0,
12419
12044
  },
12420
12045
  contextWindow: 256000,
12421
- maxTokens: 128000,
12046
+ maxTokens: 16384,
12422
12047
  } satisfies Model<"anthropic-messages">,
12423
12048
  "moonshotai/kimi-k2-thinking": {
12424
12049
  id: "moonshotai/kimi-k2-thinking",
@@ -12990,12 +12615,12 @@ export const MODELS = {
12990
12615
  reasoning: true,
12991
12616
  input: ["text"],
12992
12617
  cost: {
12993
- input: 0.049999999999999996,
12994
- output: 0.19999999999999998,
12618
+ input: 0.07,
12619
+ output: 0.3,
12995
12620
  cacheRead: 0,
12996
12621
  cacheWrite: 0,
12997
12622
  },
12998
- contextWindow: 131072,
12623
+ contextWindow: 128000,
12999
12624
  maxTokens: 8192,
13000
12625
  } satisfies Model<"anthropic-messages">,
13001
12626
  "openai/gpt-oss-safeguard-20b": {
@@ -13126,8 +12751,8 @@ export const MODELS = {
13126
12751
  reasoning: false,
13127
12752
  input: ["text", "image"],
13128
12753
  cost: {
13129
- input: 0,
13130
- output: 0,
12754
+ input: 1,
12755
+ output: 1,
13131
12756
  cacheRead: 0,
13132
12757
  cacheWrite: 0,
13133
12758
  },
@@ -13143,8 +12768,8 @@ export const MODELS = {
13143
12768
  reasoning: false,
13144
12769
  input: ["text", "image"],
13145
12770
  cost: {
13146
- input: 0,
13147
- output: 0,
12771
+ input: 3,
12772
+ output: 15,
13148
12773
  cacheRead: 0,
13149
12774
  cacheWrite: 0,
13150
12775
  },
@@ -13168,6 +12793,23 @@ export const MODELS = {
13168
12793
  contextWindow: 131072,
13169
12794
  maxTokens: 131072,
13170
12795
  } satisfies Model<"anthropic-messages">,
12796
+ "xai/grok-2-vision": {
12797
+ id: "xai/grok-2-vision",
12798
+ name: "Grok 2 Vision",
12799
+ api: "anthropic-messages",
12800
+ provider: "vercel-ai-gateway",
12801
+ baseUrl: "https://ai-gateway.vercel.sh",
12802
+ reasoning: false,
12803
+ input: ["text", "image"],
12804
+ cost: {
12805
+ input: 2,
12806
+ output: 10,
12807
+ cacheRead: 0,
12808
+ cacheWrite: 0,
12809
+ },
12810
+ contextWindow: 32768,
12811
+ maxTokens: 32768,
12812
+ } satisfies Model<"anthropic-messages">,
13171
12813
  "xai/grok-3": {
13172
12814
  id: "xai/grok-3",
13173
12815
  name: "Grok 3 Beta",
@@ -13321,23 +12963,6 @@ export const MODELS = {
13321
12963
  contextWindow: 2000000,
13322
12964
  maxTokens: 30000,
13323
12965
  } satisfies Model<"anthropic-messages">,
13324
- "xai/grok-4.20-multi-agent": {
13325
- id: "xai/grok-4.20-multi-agent",
13326
- name: "Grok 4.20 Multi-Agent",
13327
- api: "anthropic-messages",
13328
- provider: "vercel-ai-gateway",
13329
- baseUrl: "https://ai-gateway.vercel.sh",
13330
- reasoning: true,
13331
- input: ["text"],
13332
- cost: {
13333
- input: 2,
13334
- output: 6,
13335
- cacheRead: 0.19999999999999998,
13336
- cacheWrite: 0,
13337
- },
13338
- contextWindow: 2000000,
13339
- maxTokens: 2000000,
13340
- } satisfies Model<"anthropic-messages">,
13341
12966
  "xai/grok-4.20-multi-agent-beta": {
13342
12967
  id: "xai/grok-4.20-multi-agent-beta",
13343
12968
  name: "Grok 4.20 Multi Agent Beta",
@@ -13355,23 +12980,6 @@ export const MODELS = {
13355
12980
  contextWindow: 2000000,
13356
12981
  maxTokens: 2000000,
13357
12982
  } satisfies Model<"anthropic-messages">,
13358
- "xai/grok-4.20-non-reasoning": {
13359
- id: "xai/grok-4.20-non-reasoning",
13360
- name: "Grok 4.20 Non-Reasoning",
13361
- api: "anthropic-messages",
13362
- provider: "vercel-ai-gateway",
13363
- baseUrl: "https://ai-gateway.vercel.sh",
13364
- reasoning: false,
13365
- input: ["text", "image"],
13366
- cost: {
13367
- input: 2,
13368
- output: 6,
13369
- cacheRead: 0.19999999999999998,
13370
- cacheWrite: 0,
13371
- },
13372
- contextWindow: 2000000,
13373
- maxTokens: 2000000,
13374
- } satisfies Model<"anthropic-messages">,
13375
12983
  "xai/grok-4.20-non-reasoning-beta": {
13376
12984
  id: "xai/grok-4.20-non-reasoning-beta",
13377
12985
  name: "Grok 4.20 Beta Non-Reasoning",
@@ -13389,23 +12997,6 @@ export const MODELS = {
13389
12997
  contextWindow: 2000000,
13390
12998
  maxTokens: 2000000,
13391
12999
  } satisfies Model<"anthropic-messages">,
13392
- "xai/grok-4.20-reasoning": {
13393
- id: "xai/grok-4.20-reasoning",
13394
- name: "Grok 4.20 Reasoning",
13395
- api: "anthropic-messages",
13396
- provider: "vercel-ai-gateway",
13397
- baseUrl: "https://ai-gateway.vercel.sh",
13398
- reasoning: true,
13399
- input: ["text", "image"],
13400
- cost: {
13401
- input: 2,
13402
- output: 6,
13403
- cacheRead: 0.19999999999999998,
13404
- cacheWrite: 0,
13405
- },
13406
- contextWindow: 2000000,
13407
- maxTokens: 2000000,
13408
- } satisfies Model<"anthropic-messages">,
13409
13000
  "xai/grok-4.20-reasoning-beta": {
13410
13001
  id: "xai/grok-4.20-reasoning-beta",
13411
13002
  name: "Grok 4.20 Beta Reasoning",
@@ -13449,9 +13040,9 @@ export const MODELS = {
13449
13040
  reasoning: true,
13450
13041
  input: ["text"],
13451
13042
  cost: {
13452
- input: 0.09,
13453
- output: 0.29,
13454
- cacheRead: 0.045,
13043
+ input: 0.09999999999999999,
13044
+ output: 0.3,
13045
+ cacheRead: 0.02,
13455
13046
  cacheWrite: 0,
13456
13047
  },
13457
13048
  contextWindow: 262144,
@@ -13585,13 +13176,13 @@ export const MODELS = {
13585
13176
  reasoning: true,
13586
13177
  input: ["text"],
13587
13178
  cost: {
13588
- input: 2.25,
13589
- output: 2.75,
13590
- cacheRead: 2.25,
13179
+ input: 0.6,
13180
+ output: 2.2,
13181
+ cacheRead: 0,
13591
13182
  cacheWrite: 0,
13592
13183
  },
13593
- contextWindow: 131000,
13594
- maxTokens: 40000,
13184
+ contextWindow: 200000,
13185
+ maxTokens: 120000,
13595
13186
  } satisfies Model<"anthropic-messages">,
13596
13187
  "zai/glm-4.7-flash": {
13597
13188
  id: "zai/glm-4.7-flash",
@@ -13661,40 +13252,6 @@ export const MODELS = {
13661
13252
  contextWindow: 202800,
13662
13253
  maxTokens: 131100,
13663
13254
  } satisfies Model<"anthropic-messages">,
13664
- "zai/glm-5.1": {
13665
- id: "zai/glm-5.1",
13666
- name: "GLM 5.1",
13667
- api: "anthropic-messages",
13668
- provider: "vercel-ai-gateway",
13669
- baseUrl: "https://ai-gateway.vercel.sh",
13670
- reasoning: true,
13671
- input: ["text"],
13672
- cost: {
13673
- input: 1.4,
13674
- output: 4.4,
13675
- cacheRead: 0.26,
13676
- cacheWrite: 0,
13677
- },
13678
- contextWindow: 202800,
13679
- maxTokens: 64000,
13680
- } satisfies Model<"anthropic-messages">,
13681
- "zai/glm-5v-turbo": {
13682
- id: "zai/glm-5v-turbo",
13683
- name: "GLM 5V Turbo",
13684
- api: "anthropic-messages",
13685
- provider: "vercel-ai-gateway",
13686
- baseUrl: "https://ai-gateway.vercel.sh",
13687
- reasoning: true,
13688
- input: ["text", "image"],
13689
- cost: {
13690
- input: 1.2,
13691
- output: 4,
13692
- cacheRead: 0.24,
13693
- cacheWrite: 0,
13694
- },
13695
- contextWindow: 200000,
13696
- maxTokens: 128000,
13697
- } satisfies Model<"anthropic-messages">,
13698
13255
  },
13699
13256
  "xai": {
13700
13257
  "grok-2": {
@@ -14251,24 +13808,6 @@ export const MODELS = {
14251
13808
  contextWindow: 200000,
14252
13809
  maxTokens: 131072,
14253
13810
  } satisfies Model<"openai-completions">,
14254
- "glm-4.7-flashx": {
14255
- id: "glm-4.7-flashx",
14256
- name: "GLM-4.7-FlashX",
14257
- api: "openai-completions",
14258
- provider: "zai",
14259
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14260
- compat: {"supportsDeveloperRole":false,"thinkingFormat":"zai"},
14261
- reasoning: true,
14262
- input: ["text"],
14263
- cost: {
14264
- input: 0.07,
14265
- output: 0.4,
14266
- cacheRead: 0.01,
14267
- cacheWrite: 0,
14268
- },
14269
- contextWindow: 200000,
14270
- maxTokens: 131072,
14271
- } satisfies Model<"openai-completions">,
14272
13811
  "glm-5": {
14273
13812
  id: "glm-5",
14274
13813
  name: "GLM-5",
@@ -14305,41 +13844,5 @@ export const MODELS = {
14305
13844
  contextWindow: 200000,
14306
13845
  maxTokens: 131072,
14307
13846
  } satisfies Model<"openai-completions">,
14308
- "glm-5.1": {
14309
- id: "glm-5.1",
14310
- name: "GLM-5.1",
14311
- api: "openai-completions",
14312
- provider: "zai",
14313
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14314
- compat: {"supportsDeveloperRole":false,"thinkingFormat":"zai"},
14315
- reasoning: true,
14316
- input: ["text"],
14317
- cost: {
14318
- input: 1.4,
14319
- output: 4.4,
14320
- cacheRead: 0.26,
14321
- cacheWrite: 0,
14322
- },
14323
- contextWindow: 200000,
14324
- maxTokens: 131072,
14325
- } satisfies Model<"openai-completions">,
14326
- "glm-5v-turbo": {
14327
- id: "glm-5v-turbo",
14328
- name: "glm-5v-turbo",
14329
- api: "openai-completions",
14330
- provider: "zai",
14331
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14332
- compat: {"supportsDeveloperRole":false,"thinkingFormat":"zai"},
14333
- reasoning: true,
14334
- input: ["text", "image"],
14335
- cost: {
14336
- input: 1.2,
14337
- output: 4,
14338
- cacheRead: 0.24,
14339
- cacheWrite: 0,
14340
- },
14341
- contextWindow: 200000,
14342
- maxTokens: 131072,
14343
- } satisfies Model<"openai-completions">,
14344
13847
  },
14345
13848
  } as const;