@mastra/core 0.21.1 → 0.21.2-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (212) hide show
  1. package/CHANGELOG.md +44 -0
  2. package/dist/agent/__tests__/mock-model.d.ts +6 -0
  3. package/dist/agent/__tests__/mock-model.d.ts.map +1 -0
  4. package/dist/agent/agent.d.ts +9 -4
  5. package/dist/agent/agent.d.ts.map +1 -1
  6. package/dist/agent/agent.types.d.ts +4 -3
  7. package/dist/agent/agent.types.d.ts.map +1 -1
  8. package/dist/agent/index.cjs +13 -13
  9. package/dist/agent/index.js +2 -2
  10. package/dist/agent/input-processor/index.cjs +6 -6
  11. package/dist/agent/input-processor/index.js +1 -1
  12. package/dist/agent/message-list/index.d.ts.map +1 -1
  13. package/dist/agent/message-list/utils/ai-v5/gemini-compatibility.d.ts +22 -0
  14. package/dist/agent/message-list/utils/ai-v5/gemini-compatibility.d.ts.map +1 -0
  15. package/dist/agent/types.d.ts +5 -0
  16. package/dist/agent/types.d.ts.map +1 -1
  17. package/dist/agent/utils.d.ts.map +1 -1
  18. package/dist/agent/workflows/prepare-stream/index.d.ts +7 -4
  19. package/dist/agent/workflows/prepare-stream/index.d.ts.map +1 -1
  20. package/dist/agent/workflows/prepare-stream/prepare-memory-step.d.ts +7 -4
  21. package/dist/agent/workflows/prepare-stream/prepare-memory-step.d.ts.map +1 -1
  22. package/dist/agent/workflows/prepare-stream/schema.d.ts +4 -4
  23. package/dist/agent/workflows/prepare-stream/stream-step.d.ts +3 -0
  24. package/dist/agent/workflows/prepare-stream/stream-step.d.ts.map +1 -1
  25. package/dist/ai-tracing/index.cjs +32 -32
  26. package/dist/ai-tracing/index.js +1 -1
  27. package/dist/{chunk-NHKXTGR6.js → chunk-4ZFVJA3A.js} +3 -3
  28. package/dist/{chunk-NHKXTGR6.js.map → chunk-4ZFVJA3A.js.map} +1 -1
  29. package/dist/{chunk-XVREJCOW.cjs → chunk-7P5FMQQK.cjs} +6 -6
  30. package/dist/{chunk-XVREJCOW.cjs.map → chunk-7P5FMQQK.cjs.map} +1 -1
  31. package/dist/{chunk-3V4O35FO.js → chunk-BLVB2IJK.js} +3 -3
  32. package/dist/{chunk-3V4O35FO.js.map → chunk-BLVB2IJK.js.map} +1 -1
  33. package/dist/{chunk-FESSBG5D.cjs → chunk-D3IOLHNB.cjs} +12 -12
  34. package/dist/{chunk-FESSBG5D.cjs.map → chunk-D3IOLHNB.cjs.map} +1 -1
  35. package/dist/{chunk-KAV4EP3T.cjs → chunk-EGNHIPGJ.cjs} +4 -4
  36. package/dist/{chunk-KAV4EP3T.cjs.map → chunk-EGNHIPGJ.cjs.map} +1 -1
  37. package/dist/{chunk-5NR2GY4U.js → chunk-GB5BIA4V.js} +5 -3
  38. package/dist/chunk-GB5BIA4V.js.map +1 -0
  39. package/dist/{chunk-J2OKI2L3.js → chunk-GKTRUHKB.js} +10 -5
  40. package/dist/chunk-GKTRUHKB.js.map +1 -0
  41. package/dist/{chunk-A3QHQYMC.js → chunk-HGNRQ3OG.js} +12 -2
  42. package/dist/chunk-HGNRQ3OG.js.map +1 -0
  43. package/dist/{chunk-MUAFIPD7.js → chunk-KLWDUSBX.js} +4 -4
  44. package/dist/{chunk-MUAFIPD7.js.map → chunk-KLWDUSBX.js.map} +1 -1
  45. package/dist/chunk-LJFJTTZQ.cjs +4 -0
  46. package/dist/chunk-LJFJTTZQ.cjs.map +1 -0
  47. package/dist/{chunk-T3PBU7JK.js → chunk-LMP5KMU3.js} +34 -45
  48. package/dist/chunk-LMP5KMU3.js.map +1 -0
  49. package/dist/{chunk-OXAN5SM7.cjs → chunk-LRSB62Z6.cjs} +12 -2
  50. package/dist/chunk-LRSB62Z6.cjs.map +1 -0
  51. package/dist/{chunk-3ORA5EFD.cjs → chunk-LZUSZT7R.cjs} +5 -3
  52. package/dist/chunk-LZUSZT7R.cjs.map +1 -0
  53. package/dist/{chunk-XHPBKALR.cjs → chunk-MVVMHOAC.cjs} +15 -12
  54. package/dist/chunk-MVVMHOAC.cjs.map +1 -0
  55. package/dist/{chunk-HBJVAMCS.js → chunk-N3ZSX5OS.js} +31 -32
  56. package/dist/chunk-N3ZSX5OS.js.map +1 -0
  57. package/dist/{chunk-HP7B2TQQ.js → chunk-NIESGYOH.js} +1654 -1469
  58. package/dist/chunk-NIESGYOH.js.map +1 -0
  59. package/dist/{chunk-F6BMIPYW.js → chunk-NL3P7IFI.js} +3 -3
  60. package/dist/{chunk-F6BMIPYW.js.map → chunk-NL3P7IFI.js.map} +1 -1
  61. package/dist/{chunk-U6CUPKV2.js → chunk-R35PINKN.js} +5 -5
  62. package/dist/{chunk-U6CUPKV2.js.map → chunk-R35PINKN.js.map} +1 -1
  63. package/dist/{chunk-W3DS6F6G.cjs → chunk-UN653TND.cjs} +4 -4
  64. package/dist/{chunk-W3DS6F6G.cjs.map → chunk-UN653TND.cjs.map} +1 -1
  65. package/dist/{chunk-44ODA6L3.cjs → chunk-URQI7RJ3.cjs} +4 -4
  66. package/dist/{chunk-44ODA6L3.cjs.map → chunk-URQI7RJ3.cjs.map} +1 -1
  67. package/dist/{chunk-APY2BE4K.cjs → chunk-URVM3Y4T.cjs} +35 -46
  68. package/dist/chunk-URVM3Y4T.cjs.map +1 -0
  69. package/dist/{chunk-AJK7QPSD.cjs → chunk-V5WDWSQ5.cjs} +11 -11
  70. package/dist/{chunk-AJK7QPSD.cjs.map → chunk-V5WDWSQ5.cjs.map} +1 -1
  71. package/dist/{chunk-FLXB6WXO.js → chunk-VQLW7LPO.js} +5 -3
  72. package/dist/chunk-VQLW7LPO.js.map +1 -0
  73. package/dist/{chunk-462DRETM.cjs → chunk-WI2YMBNG.cjs} +64 -66
  74. package/dist/chunk-WI2YMBNG.cjs.map +1 -0
  75. package/dist/{chunk-NUURZ3AY.js → chunk-XBJP7THY.js} +6 -3
  76. package/dist/chunk-XBJP7THY.js.map +1 -0
  77. package/dist/{chunk-5DZ4RYWL.js → chunk-XYNSPEJO.js} +3 -3
  78. package/dist/{chunk-5DZ4RYWL.js.map → chunk-XYNSPEJO.js.map} +1 -1
  79. package/dist/{chunk-OY6UJ3QL.cjs → chunk-YGL6E6PD.cjs} +5 -3
  80. package/dist/chunk-YGL6E6PD.cjs.map +1 -0
  81. package/dist/{chunk-BV6CD4IZ.cjs → chunk-YKVVW65D.cjs} +12 -7
  82. package/dist/chunk-YKVVW65D.cjs.map +1 -0
  83. package/dist/{chunk-DGQW5VRR.cjs → chunk-ZMPSVDDO.cjs} +1658 -1472
  84. package/dist/chunk-ZMPSVDDO.cjs.map +1 -0
  85. package/dist/chunk-ZV5CC35D.js +3 -0
  86. package/dist/chunk-ZV5CC35D.js.map +1 -0
  87. package/dist/index.cjs +50 -46
  88. package/dist/index.js +8 -8
  89. package/dist/llm/index.cjs +10 -6
  90. package/dist/llm/index.d.ts +1 -0
  91. package/dist/llm/index.d.ts.map +1 -1
  92. package/dist/llm/index.js +1 -1
  93. package/dist/llm/model/embedding-router.d.ts +50 -0
  94. package/dist/llm/model/embedding-router.d.ts.map +1 -0
  95. package/dist/llm/model/gateways/models-dev.d.ts.map +1 -1
  96. package/dist/llm/model/gateways/netlify.d.ts.map +1 -1
  97. package/dist/llm/model/index.d.ts +1 -0
  98. package/dist/llm/model/index.d.ts.map +1 -1
  99. package/dist/llm/model/model.loop.d.ts +1 -1
  100. package/dist/llm/model/model.loop.d.ts.map +1 -1
  101. package/dist/llm/model/provider-options.d.ts +42 -0
  102. package/dist/llm/model/provider-options.d.ts.map +1 -0
  103. package/dist/llm/model/provider-types.generated.d.ts +629 -590
  104. package/dist/llm/model/router.d.ts.map +1 -1
  105. package/dist/loop/index.cjs +2 -2
  106. package/dist/loop/index.js +1 -1
  107. package/dist/loop/network/index.d.ts +4 -1
  108. package/dist/loop/network/index.d.ts.map +1 -1
  109. package/dist/loop/test-utils/fullStream.d.ts.map +1 -1
  110. package/dist/loop/test-utils/generateText.d.ts.map +1 -1
  111. package/dist/loop/test-utils/options.d.ts.map +1 -1
  112. package/dist/loop/test-utils/resultObject.d.ts.map +1 -1
  113. package/dist/loop/test-utils/streamObject.d.ts.map +1 -1
  114. package/dist/loop/test-utils/telemetry.d.ts.map +1 -1
  115. package/dist/loop/test-utils/textStream.d.ts.map +1 -1
  116. package/dist/loop/test-utils/toUIMessageStream.d.ts.map +1 -1
  117. package/dist/loop/test-utils/tools.d.ts.map +1 -1
  118. package/dist/loop/test-utils/utils.d.ts +2 -0
  119. package/dist/loop/test-utils/utils.d.ts.map +1 -1
  120. package/dist/loop/workflows/agentic-execution/index.d.ts +42 -42
  121. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts +28 -28
  122. package/dist/loop/workflows/agentic-execution/llm-mapping-step.d.ts +14 -14
  123. package/dist/loop/workflows/agentic-loop/index.d.ts +42 -42
  124. package/dist/loop/workflows/schema.d.ts +14 -14
  125. package/dist/mastra/index.cjs +2 -2
  126. package/dist/mastra/index.js +1 -1
  127. package/dist/memory/index.cjs +4 -4
  128. package/dist/memory/index.js +1 -1
  129. package/dist/memory/memory.d.ts.map +1 -1
  130. package/dist/memory/types.d.ts +10 -1
  131. package/dist/memory/types.d.ts.map +1 -1
  132. package/dist/models-dev-4VGIWYS3.js +3 -0
  133. package/dist/{models-dev-3VEABUH4.js.map → models-dev-4VGIWYS3.js.map} +1 -1
  134. package/dist/models-dev-AXZASLL2.cjs +12 -0
  135. package/dist/{models-dev-L42ORGVT.cjs.map → models-dev-AXZASLL2.cjs.map} +1 -1
  136. package/dist/netlify-26MMY5X4.js +3 -0
  137. package/dist/{netlify-NYFKA6UB.js.map → netlify-26MMY5X4.js.map} +1 -1
  138. package/dist/netlify-F3MVGV4Y.cjs +12 -0
  139. package/dist/{netlify-3B6HDHRP.cjs.map → netlify-F3MVGV4Y.cjs.map} +1 -1
  140. package/dist/processors/index.cjs +11 -11
  141. package/dist/processors/index.js +1 -1
  142. package/dist/provider-registry.json +1542 -1464
  143. package/dist/relevance/index.cjs +4 -4
  144. package/dist/relevance/index.js +1 -1
  145. package/dist/scores/index.cjs +9 -9
  146. package/dist/scores/index.js +2 -2
  147. package/dist/scores/scoreTraces/index.cjs +8 -8
  148. package/dist/scores/scoreTraces/index.js +3 -3
  149. package/dist/storage/domains/workflows/inmemory.d.ts.map +1 -1
  150. package/dist/storage/index.cjs +5 -3
  151. package/dist/storage/index.cjs.map +1 -1
  152. package/dist/storage/index.js +3 -1
  153. package/dist/storage/index.js.map +1 -1
  154. package/dist/stream/aisdk/v5/execute.d.ts.map +1 -1
  155. package/dist/stream/aisdk/v5/output.d.ts +9 -10
  156. package/dist/stream/aisdk/v5/output.d.ts.map +1 -1
  157. package/dist/stream/base/output-format-handlers.d.ts +1 -2
  158. package/dist/stream/base/output-format-handlers.d.ts.map +1 -1
  159. package/dist/stream/base/output.d.ts.map +1 -1
  160. package/dist/stream/index.cjs +10 -10
  161. package/dist/stream/index.d.ts +1 -1
  162. package/dist/stream/index.d.ts.map +1 -1
  163. package/dist/stream/index.js +2 -2
  164. package/dist/stream/types.d.ts +17 -1
  165. package/dist/stream/types.d.ts.map +1 -1
  166. package/dist/test-utils/llm-mock.cjs +2 -2
  167. package/dist/test-utils/llm-mock.js +1 -1
  168. package/dist/tools/index.cjs +2 -2
  169. package/dist/tools/index.js +1 -1
  170. package/dist/tools/stream.d.ts +7 -0
  171. package/dist/tools/stream.d.ts.map +1 -1
  172. package/dist/utils.cjs +17 -17
  173. package/dist/utils.js +1 -1
  174. package/dist/workflows/default.d.ts +1 -0
  175. package/dist/workflows/default.d.ts.map +1 -1
  176. package/dist/workflows/evented/index.cjs +10 -10
  177. package/dist/workflows/evented/index.js +1 -1
  178. package/dist/workflows/evented/workflow-event-processor/index.d.ts.map +1 -1
  179. package/dist/workflows/evented/workflow.d.ts.map +1 -1
  180. package/dist/workflows/index.cjs +12 -12
  181. package/dist/workflows/index.js +1 -1
  182. package/dist/workflows/legacy/index.cjs +22 -22
  183. package/dist/workflows/legacy/index.js +1 -1
  184. package/dist/workflows/legacy/machine.d.ts +1 -1
  185. package/dist/workflows/step.d.ts +4 -1
  186. package/dist/workflows/step.d.ts.map +1 -1
  187. package/dist/workflows/types.d.ts +1 -0
  188. package/dist/workflows/types.d.ts.map +1 -1
  189. package/dist/workflows/workflow.d.ts +3 -1
  190. package/dist/workflows/workflow.d.ts.map +1 -1
  191. package/package.json +11 -10
  192. package/src/llm/model/provider-types.generated.d.ts +629 -590
  193. package/dist/chunk-3ORA5EFD.cjs.map +0 -1
  194. package/dist/chunk-462DRETM.cjs.map +0 -1
  195. package/dist/chunk-5NR2GY4U.js.map +0 -1
  196. package/dist/chunk-A3QHQYMC.js.map +0 -1
  197. package/dist/chunk-APY2BE4K.cjs.map +0 -1
  198. package/dist/chunk-BV6CD4IZ.cjs.map +0 -1
  199. package/dist/chunk-DGQW5VRR.cjs.map +0 -1
  200. package/dist/chunk-FLXB6WXO.js.map +0 -1
  201. package/dist/chunk-HBJVAMCS.js.map +0 -1
  202. package/dist/chunk-HP7B2TQQ.js.map +0 -1
  203. package/dist/chunk-J2OKI2L3.js.map +0 -1
  204. package/dist/chunk-NUURZ3AY.js.map +0 -1
  205. package/dist/chunk-OXAN5SM7.cjs.map +0 -1
  206. package/dist/chunk-OY6UJ3QL.cjs.map +0 -1
  207. package/dist/chunk-T3PBU7JK.js.map +0 -1
  208. package/dist/chunk-XHPBKALR.cjs.map +0 -1
  209. package/dist/models-dev-3VEABUH4.js +0 -3
  210. package/dist/models-dev-L42ORGVT.cjs +0 -12
  211. package/dist/netlify-3B6HDHRP.cjs +0 -12
  212. package/dist/netlify-NYFKA6UB.js +0 -3
@@ -1,15 +1,17 @@
1
1
  'use strict';
2
2
 
3
- var chunk3ORA5EFD_cjs = require('./chunk-3ORA5EFD.cjs');
4
- var chunkOY6UJ3QL_cjs = require('./chunk-OY6UJ3QL.cjs');
3
+ var chunkLZUSZT7R_cjs = require('./chunk-LZUSZT7R.cjs');
4
+ var chunkYGL6E6PD_cjs = require('./chunk-YGL6E6PD.cjs');
5
5
  var chunkGPWMM745_cjs = require('./chunk-GPWMM745.cjs');
6
6
  var chunkWM4VQWOZ_cjs = require('./chunk-WM4VQWOZ.cjs');
7
- var crypto = require('crypto');
8
- var openaiCompatibleV5 = require('@ai-sdk/openai-compatible-v5');
9
7
  var fs = require('fs');
10
8
  var module$1 = require('module');
11
9
  var os = require('os');
12
10
  var path = require('path');
11
+ var crypto = require('crypto');
12
+ var openaiCompatibleV5 = require('@ai-sdk/openai-compatible-v5');
13
+ var googleV5 = require('@ai-sdk/google-v5');
14
+ var openaiV5 = require('@ai-sdk/openai-v5');
13
15
 
14
16
  var _documentCurrentScript = typeof document !== 'undefined' ? document.currentScript : null;
15
17
  function _interopDefault (e) { return e && e.__esModule ? e : { default: e }; }
@@ -18,110 +20,91 @@ var fs__default = /*#__PURE__*/_interopDefault(fs);
18
20
  var os__default = /*#__PURE__*/_interopDefault(os);
19
21
  var path__default = /*#__PURE__*/_interopDefault(path);
20
22
 
21
- // src/llm/model/gateways/index.ts
22
- function findGatewayForModel(gatewayId, gateways2) {
23
- const prefixedGateway = gateways2.find((g) => g.prefix && gatewayId.startsWith(`${g.prefix}/`));
24
- if (prefixedGateway) {
25
- return prefixedGateway;
26
- }
27
- const unprefixedGateways = gateways2.filter((g) => !g.prefix);
28
- for (const gateway of unprefixedGateways) {
29
- return gateway;
30
- }
31
- throw new chunkWM4VQWOZ_cjs.MastraError({
32
- id: "MODEL_ROUTER_NO_GATEWAY_FOUND",
33
- category: "USER",
34
- domain: "MODEL_ROUTER",
35
- text: `No Mastra model router gateway found for model id ${gatewayId}`
36
- });
37
- }
38
-
39
23
  // src/llm/model/provider-registry.json
40
24
  var provider_registry_default = {
41
25
  providers: {
42
- "moonshotai-cn": {
43
- url: "https://api.moonshot.cn/v1",
44
- apiKeyEnvVar: "MOONSHOT_API_KEY",
45
- apiKeyHeader: "Authorization",
46
- name: "Moonshot AI (China)",
47
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
48
- docUrl: "https://platform.moonshot.cn/docs/api/chat",
49
- gateway: "models.dev"
50
- },
51
- lucidquery: {
52
- url: "https://lucidquery.com/api/v1",
53
- apiKeyEnvVar: "LUCIDQUERY_API_KEY",
26
+ nvidia: {
27
+ url: "https://integrate.api.nvidia.com/v1",
28
+ apiKeyEnvVar: "NVIDIA_API_KEY",
54
29
  apiKeyHeader: "Authorization",
55
- name: "LucidQuery AI",
56
- models: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
57
- docUrl: "https://lucidquery.com/api/docs",
30
+ name: "Nvidia",
31
+ models: [
32
+ "black-forest-labs/flux.1-dev",
33
+ "deepseek-ai/deepseek-v3.1",
34
+ "deepseek-ai/deepseek-v3.1-terminus",
35
+ "google/gemma-3-27b-it",
36
+ "microsoft/phi-4-mini-instruct",
37
+ "moonshotai/kimi-k2-instruct",
38
+ "moonshotai/kimi-k2-instruct-0905",
39
+ "nvidia/cosmos-nemotron-34b",
40
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
41
+ "nvidia/nemoretriever-ocr-v1",
42
+ "nvidia/parakeet-tdt-0.6b-v2",
43
+ "openai/gpt-oss-120b",
44
+ "openai/whisper-large-v3",
45
+ "qwen/qwen3-235b-a22b",
46
+ "qwen/qwen3-coder-480b-a35b-instruct"
47
+ ],
48
+ docUrl: "https://docs.api.nvidia.com/nim/",
58
49
  gateway: "models.dev"
59
50
  },
60
- moonshotai: {
61
- url: "https://api.moonshot.ai/v1",
62
- apiKeyEnvVar: "MOONSHOT_API_KEY",
51
+ modelscope: {
52
+ url: "https://api-inference.modelscope.cn/v1",
53
+ apiKeyEnvVar: "MODELSCOPE_API_KEY",
63
54
  apiKeyHeader: "Authorization",
64
- name: "Moonshot AI",
65
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
66
- docUrl: "https://platform.moonshot.ai/docs/api/chat",
55
+ name: "ModelScope",
56
+ models: [
57
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
58
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
59
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
60
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
61
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
62
+ "ZhipuAI/GLM-4.5",
63
+ "ZhipuAI/GLM-4.6"
64
+ ],
65
+ docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
67
66
  gateway: "models.dev"
68
67
  },
69
- "zai-coding-plan": {
70
- url: "https://api.z.ai/api/coding/paas/v4",
71
- apiKeyEnvVar: "ZHIPU_API_KEY",
68
+ aihubmix: {
69
+ url: "https://api.aihubmix.com/v1",
70
+ apiKeyEnvVar: "AIHUBMIX_API_KEY",
72
71
  apiKeyHeader: "Authorization",
73
- name: "Z.AI Coding Plan",
74
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
75
- docUrl: "https://docs.z.ai/devpack/overview",
72
+ name: "AIHubMix",
73
+ models: [
74
+ "DeepSeek-V3.2-Exp",
75
+ "DeepSeek-V3.2-Exp-Think",
76
+ "Kimi-K2-0905",
77
+ "claude-haiku-4-5",
78
+ "claude-opus-4-1",
79
+ "claude-sonnet-4-5",
80
+ "gemini-2.5-flash",
81
+ "gemini-2.5-pro",
82
+ "glm-4.6",
83
+ "gpt-4.1",
84
+ "gpt-4.1-mini",
85
+ "gpt-4.1-nano",
86
+ "gpt-4o",
87
+ "gpt-4o-2024-11-20",
88
+ "gpt-5",
89
+ "gpt-5-codex",
90
+ "gpt-5-mini",
91
+ "gpt-5-nano",
92
+ "gpt-5-pro",
93
+ "o4-mini",
94
+ "qwen3-235b-a22b-instruct-2507",
95
+ "qwen3-235b-a22b-thinking-2507",
96
+ "qwen3-coder-480b-a35b-instruct"
97
+ ],
98
+ docUrl: "https://aihubmix.com/docs/models",
76
99
  gateway: "models.dev"
77
100
  },
78
- alibaba: {
79
- url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
80
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
101
+ lucidquery: {
102
+ url: "https://lucidquery.com/api/v1",
103
+ apiKeyEnvVar: "LUCIDQUERY_API_KEY",
81
104
  apiKeyHeader: "Authorization",
82
- name: "Alibaba",
83
- models: [
84
- "qvq-max",
85
- "qwen-flash",
86
- "qwen-max",
87
- "qwen-mt-plus",
88
- "qwen-mt-turbo",
89
- "qwen-omni-turbo",
90
- "qwen-omni-turbo-realtime",
91
- "qwen-plus",
92
- "qwen-plus-character-ja",
93
- "qwen-turbo",
94
- "qwen-vl-max",
95
- "qwen-vl-ocr",
96
- "qwen-vl-plus",
97
- "qwen2-5-14b-instruct",
98
- "qwen2-5-32b-instruct",
99
- "qwen2-5-72b-instruct",
100
- "qwen2-5-7b-instruct",
101
- "qwen2-5-omni-7b",
102
- "qwen2-5-vl-72b-instruct",
103
- "qwen2-5-vl-7b-instruct",
104
- "qwen3-14b",
105
- "qwen3-235b-a22b",
106
- "qwen3-32b",
107
- "qwen3-8b",
108
- "qwen3-asr-flash",
109
- "qwen3-coder-30b-a3b-instruct",
110
- "qwen3-coder-480b-a35b-instruct",
111
- "qwen3-coder-flash",
112
- "qwen3-coder-plus",
113
- "qwen3-livetranslate-flash-realtime",
114
- "qwen3-max",
115
- "qwen3-next-80b-a3b-instruct",
116
- "qwen3-next-80b-a3b-thinking",
117
- "qwen3-omni-flash",
118
- "qwen3-omni-flash-realtime",
119
- "qwen3-vl-235b-a22b",
120
- "qwen3-vl-30b-a3b",
121
- "qwen3-vl-plus",
122
- "qwq-plus"
123
- ],
124
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
105
+ name: "LucidQuery AI",
106
+ models: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
107
+ docUrl: "https://lucidquery.com/api/docs",
125
108
  gateway: "models.dev"
126
109
  },
127
110
  xai: {
@@ -152,537 +135,450 @@ var provider_registry_default = {
152
135
  docUrl: "https://docs.x.ai/docs/models",
153
136
  gateway: "models.dev"
154
137
  },
155
- nvidia: {
156
- url: "https://integrate.api.nvidia.com/v1",
157
- apiKeyEnvVar: "NVIDIA_API_KEY",
138
+ deepseek: {
139
+ url: "https://api.deepseek.com",
140
+ apiKeyEnvVar: "DEEPSEEK_API_KEY",
158
141
  apiKeyHeader: "Authorization",
159
- name: "Nvidia",
160
- models: [
161
- "black-forest-labs/flux.1-dev",
162
- "deepseek-ai/deepseek-v3.1",
163
- "google/gemma-3-27b-it",
164
- "microsoft/phi-4-mini-instruct",
165
- "moonshotai/kimi-k2-instruct",
166
- "moonshotai/kimi-k2-instruct-0905",
167
- "nvidia/cosmos-nemotron-34b",
168
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
169
- "nvidia/nemoretriever-ocr-v1",
170
- "nvidia/parakeet-tdt-0.6b-v2",
171
- "openai/gpt-oss-120b",
172
- "openai/whisper-large-v3",
173
- "qwen/qwen3-235b-a22b",
174
- "qwen/qwen3-coder-480b-a35b-instruct"
175
- ],
176
- docUrl: "https://docs.api.nvidia.com/nim/",
142
+ name: "DeepSeek",
143
+ models: ["deepseek-chat", "deepseek-reasoner"],
144
+ docUrl: "https://platform.deepseek.com/api-docs/pricing",
177
145
  gateway: "models.dev"
178
146
  },
179
- upstage: {
180
- url: "https://api.upstage.ai",
181
- apiKeyEnvVar: "UPSTAGE_API_KEY",
147
+ requesty: {
148
+ url: "https://router.requesty.ai/v1",
149
+ apiKeyEnvVar: "REQUESTY_API_KEY",
182
150
  apiKeyHeader: "Authorization",
183
- name: "Upstage",
184
- models: ["solar-mini", "solar-pro2"],
185
- docUrl: "https://developers.upstage.ai/docs/apis/chat",
151
+ name: "Requesty",
152
+ models: [
153
+ "anthropic/claude-3-7-sonnet",
154
+ "anthropic/claude-4-sonnet-20250522",
155
+ "anthropic/claude-opus-4",
156
+ "anthropic/claude-opus-4-1-20250805",
157
+ "google/gemini-2.5-flash",
158
+ "google/gemini-2.5-pro",
159
+ "openai/gpt-4.1",
160
+ "openai/gpt-4.1-mini",
161
+ "openai/gpt-4o-mini",
162
+ "openai/gpt-5",
163
+ "openai/gpt-5-mini",
164
+ "openai/gpt-5-nano",
165
+ "openai/o4-mini"
166
+ ],
167
+ docUrl: "https://requesty.ai/solution/llm-routing/models",
186
168
  gateway: "models.dev"
187
169
  },
188
- groq: {
189
- url: "https://api.groq.com/openai/v1",
190
- apiKeyEnvVar: "GROQ_API_KEY",
170
+ nebius: {
171
+ url: "https://api.studio.nebius.com/v1/",
172
+ apiKeyEnvVar: "NEBIUS_API_KEY",
191
173
  apiKeyHeader: "Authorization",
192
- name: "Groq",
174
+ name: "Nebius AI Studio",
193
175
  models: [
194
- "deepseek-r1-distill-llama-70b",
195
- "gemma2-9b-it",
196
- "llama-3.1-8b-instant",
197
- "llama-3.3-70b-versatile",
198
- "llama-guard-3-8b",
199
- "llama3-70b-8192",
200
- "llama3-8b-8192",
201
- "meta-llama/llama-4-maverick-17b-128e-instruct",
202
- "meta-llama/llama-4-scout-17b-16e-instruct",
203
- "meta-llama/llama-guard-4-12b",
204
- "mistral-saba-24b",
176
+ "NousResearch/hermes-4-405b",
177
+ "NousResearch/hermes-4-70b",
178
+ "deepseek-ai/deepseek-v3",
179
+ "meta-llama/llama-3.3-70b-instruct-base",
180
+ "meta-llama/llama-3.3-70b-instruct-fast",
181
+ "meta-llama/llama-3_1-405b-instruct",
205
182
  "moonshotai/kimi-k2-instruct",
206
- "moonshotai/kimi-k2-instruct-0905",
183
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
207
184
  "openai/gpt-oss-120b",
208
185
  "openai/gpt-oss-20b",
209
- "qwen-qwq-32b",
210
- "qwen/qwen3-32b"
186
+ "qwen/qwen3-235b-a22b-instruct-2507",
187
+ "qwen/qwen3-235b-a22b-thinking-2507",
188
+ "qwen/qwen3-coder-480b-a35b-instruct",
189
+ "zai-org/glm-4.5",
190
+ "zai-org/glm-4.5-air"
211
191
  ],
212
- docUrl: "https://console.groq.com/docs/models",
192
+ docUrl: "https://docs.studio.nebius.com/quickstart",
213
193
  gateway: "models.dev"
214
194
  },
215
- mistral: {
216
- url: "https://api.mistral.ai/v1",
217
- apiKeyEnvVar: "MISTRAL_API_KEY",
195
+ fastrouter: {
196
+ url: "https://go.fastrouter.ai/api/v1",
197
+ apiKeyEnvVar: "FASTROUTER_API_KEY",
218
198
  apiKeyHeader: "Authorization",
219
- name: "Mistral",
199
+ name: "FastRouter",
220
200
  models: [
221
- "codestral-latest",
222
- "devstral-medium-2507",
223
- "devstral-small-2505",
224
- "devstral-small-2507",
225
- "magistral-medium-latest",
226
- "magistral-small",
227
- "ministral-3b-latest",
228
- "ministral-8b-latest",
229
- "mistral-large-latest",
230
- "mistral-medium-2505",
231
- "mistral-medium-2508",
232
- "mistral-medium-latest",
233
- "mistral-nemo",
234
- "mistral-small-latest",
235
- "open-mistral-7b",
236
- "open-mixtral-8x22b",
237
- "open-mixtral-8x7b",
238
- "pixtral-12b",
239
- "pixtral-large-latest"
201
+ "anthropic/claude-opus-4.1",
202
+ "anthropic/claude-sonnet-4",
203
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
204
+ "google/gemini-2.5-flash",
205
+ "google/gemini-2.5-pro",
206
+ "moonshotai/kimi-k2",
207
+ "openai/gpt-4.1",
208
+ "openai/gpt-5",
209
+ "openai/gpt-5-mini",
210
+ "openai/gpt-5-nano",
211
+ "openai/gpt-oss-120b",
212
+ "openai/gpt-oss-20b",
213
+ "qwen/qwen3-coder",
214
+ "x-ai/grok-4"
240
215
  ],
241
- docUrl: "https://docs.mistral.ai/getting-started/models/",
216
+ docUrl: "https://fastrouter.ai/models",
242
217
  gateway: "models.dev"
243
218
  },
244
- vercel: {
245
- url: "https://ai-gateway.vercel.sh/v1",
246
- apiKeyEnvVar: "AI_GATEWAY_API_KEY",
219
+ perplexity: {
220
+ url: "https://api.perplexity.ai",
221
+ apiKeyEnvVar: "PERPLEXITY_API_KEY",
247
222
  apiKeyHeader: "Authorization",
248
- name: "Vercel AI Gateway",
223
+ name: "Perplexity",
224
+ models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
225
+ docUrl: "https://docs.perplexity.ai",
226
+ gateway: "models.dev"
227
+ },
228
+ morph: {
229
+ url: "https://api.morphllm.com/v1",
230
+ apiKeyEnvVar: "MORPH_API_KEY",
231
+ apiKeyHeader: "Authorization",
232
+ name: "Morph",
233
+ models: ["auto", "morph-v3-fast", "morph-v3-large"],
234
+ docUrl: "https://docs.morphllm.com/api-reference/introduction",
235
+ gateway: "models.dev"
236
+ },
237
+ "zai-coding-plan": {
238
+ url: "https://api.z.ai/api/coding/paas/v4",
239
+ apiKeyEnvVar: "ZHIPU_API_KEY",
240
+ apiKeyHeader: "Authorization",
241
+ name: "Z.AI Coding Plan",
242
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
243
+ docUrl: "https://docs.z.ai/devpack/overview",
244
+ gateway: "models.dev"
245
+ },
246
+ huggingface: {
247
+ url: "https://router.huggingface.co/v1",
248
+ apiKeyEnvVar: "HF_TOKEN",
249
+ apiKeyHeader: "Authorization",
250
+ name: "Hugging Face",
249
251
  models: [
250
- "alibaba/qwen3-coder-plus",
251
- "alibaba/qwen3-max",
252
- "alibaba/qwen3-next-80b-a3b-instruct",
253
- "alibaba/qwen3-next-80b-a3b-thinking",
254
- "alibaba/qwen3-vl-instruct",
255
- "alibaba/qwen3-vl-thinking",
256
- "amazon/nova-lite",
257
- "amazon/nova-micro",
258
- "amazon/nova-pro",
259
- "anthropic/claude-3-5-haiku",
260
- "anthropic/claude-3-haiku",
261
- "anthropic/claude-3-opus",
262
- "anthropic/claude-3.5-sonnet",
252
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
253
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
254
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
255
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
256
+ "deepseek-ai/DeepSeek-R1-0528",
257
+ "deepseek-ai/Deepseek-V3-0324",
258
+ "moonshotai/Kimi-K2-Instruct",
259
+ "moonshotai/Kimi-K2-Instruct-0905",
260
+ "zai-org/GLM-4.5",
261
+ "zai-org/GLM-4.5-Air",
262
+ "zai-org/GLM-4.6"
263
+ ],
264
+ docUrl: "https://huggingface.co/docs/inference-providers",
265
+ gateway: "models.dev"
266
+ },
267
+ openrouter: {
268
+ url: "https://openrouter.ai/api/v1",
269
+ apiKeyEnvVar: "OPENROUTER_API_KEY",
270
+ name: "OpenRouter",
271
+ models: [
272
+ "anthropic/claude-3.5-haiku",
263
273
  "anthropic/claude-3.7-sonnet",
264
- "anthropic/claude-4-1-opus",
265
- "anthropic/claude-4-opus",
266
- "anthropic/claude-4-sonnet",
267
- "anthropic/claude-4.5-sonnet",
268
274
  "anthropic/claude-haiku-4.5",
269
- "cerebras/qwen3-coder",
270
- "deepseek/deepseek-r1",
275
+ "anthropic/claude-opus-4",
276
+ "anthropic/claude-opus-4.1",
277
+ "anthropic/claude-sonnet-4",
278
+ "anthropic/claude-sonnet-4.5",
279
+ "cognitivecomputations/dolphin3.0-mistral-24b",
280
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
281
+ "deepseek/deepseek-chat-v3-0324",
282
+ "deepseek/deepseek-chat-v3.1",
283
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
284
+ "deepseek/deepseek-r1-0528:free",
271
285
  "deepseek/deepseek-r1-distill-llama-70b",
286
+ "deepseek/deepseek-r1-distill-qwen-14b",
287
+ "deepseek/deepseek-r1:free",
288
+ "deepseek/deepseek-v3-base:free",
272
289
  "deepseek/deepseek-v3.1-terminus",
273
- "deepseek/deepseek-v3.2-exp",
274
- "deepseek/deepseek-v3.2-exp-thinking",
275
- "google/gemini-2.0-flash",
276
- "google/gemini-2.0-flash-lite",
290
+ "featherless/qwerky-72b",
291
+ "google/gemini-2.0-flash-001",
292
+ "google/gemini-2.0-flash-exp:free",
277
293
  "google/gemini-2.5-flash",
278
294
  "google/gemini-2.5-flash-lite",
279
295
  "google/gemini-2.5-flash-lite-preview-09-2025",
280
296
  "google/gemini-2.5-flash-preview-09-2025",
281
297
  "google/gemini-2.5-pro",
282
- "meta/llama-3.3-70b",
283
- "meta/llama-4-maverick",
284
- "meta/llama-4-scout",
285
- "mistral/codestral",
286
- "mistral/magistral-medium",
287
- "mistral/magistral-small",
288
- "mistral/ministral-3b",
289
- "mistral/ministral-8b",
290
- "mistral/mistral-large",
291
- "mistral/mistral-small",
292
- "mistral/mixtral-8x22b-instruct",
293
- "mistral/pixtral-12b",
294
- "mistral/pixtral-large",
298
+ "google/gemini-2.5-pro-preview-05-06",
299
+ "google/gemini-2.5-pro-preview-06-05",
300
+ "google/gemma-2-9b-it:free",
301
+ "google/gemma-3-12b-it",
302
+ "google/gemma-3-27b-it",
303
+ "google/gemma-3n-e4b-it",
304
+ "google/gemma-3n-e4b-it:free",
305
+ "meta-llama/llama-3.2-11b-vision-instruct",
306
+ "meta-llama/llama-3.3-70b-instruct:free",
307
+ "meta-llama/llama-4-scout:free",
308
+ "microsoft/mai-ds-r1:free",
309
+ "mistralai/codestral-2508",
310
+ "mistralai/devstral-medium-2507",
311
+ "mistralai/devstral-small-2505",
312
+ "mistralai/devstral-small-2505:free",
313
+ "mistralai/devstral-small-2507",
314
+ "mistralai/mistral-7b-instruct:free",
315
+ "mistralai/mistral-medium-3",
316
+ "mistralai/mistral-medium-3.1",
317
+ "mistralai/mistral-nemo:free",
318
+ "mistralai/mistral-small-3.1-24b-instruct",
319
+ "mistralai/mistral-small-3.2-24b-instruct",
320
+ "mistralai/mistral-small-3.2-24b-instruct:free",
321
+ "moonshotai/kimi-dev-72b:free",
295
322
  "moonshotai/kimi-k2",
296
- "morph/morph-v3-fast",
297
- "morph/morph-v3-large",
298
- "openai/gpt-4-turbo",
323
+ "moonshotai/kimi-k2-0905",
324
+ "moonshotai/kimi-k2:free",
325
+ "nousresearch/deephermes-3-llama-3-8b-preview",
326
+ "nousresearch/hermes-4-405b",
327
+ "nousresearch/hermes-4-70b",
299
328
  "openai/gpt-4.1",
300
329
  "openai/gpt-4.1-mini",
301
- "openai/gpt-4.1-nano",
302
- "openai/gpt-4o",
303
330
  "openai/gpt-4o-mini",
304
331
  "openai/gpt-5",
332
+ "openai/gpt-5-chat",
305
333
  "openai/gpt-5-codex",
334
+ "openai/gpt-5-image",
306
335
  "openai/gpt-5-mini",
307
336
  "openai/gpt-5-nano",
308
337
  "openai/gpt-oss-120b",
309
338
  "openai/gpt-oss-20b",
310
- "openai/o1",
311
- "openai/o3",
312
- "openai/o3-mini",
313
339
  "openai/o4-mini",
314
- "perplexity/sonar",
315
- "perplexity/sonar-pro",
316
- "perplexity/sonar-reasoning",
317
- "perplexity/sonar-reasoning-pro",
318
- "vercel/v0-1.0-md",
319
- "vercel/v0-1.5-md",
320
- "xai/grok-2",
321
- "xai/grok-2-vision",
322
- "xai/grok-3",
323
- "xai/grok-3-fast",
324
- "xai/grok-3-mini",
325
- "xai/grok-3-mini-fast",
326
- "xai/grok-4",
327
- "xai/grok-4-fast",
328
- "xai/grok-4-fast-non-reasoning",
329
- "xai/grok-code-fast-1",
330
- "zai/glm-4.5",
331
- "zai/glm-4.5-air",
332
- "zai/glm-4.5v",
333
- "zai/glm-4.6"
340
+ "openrouter/cypher-alpha:free",
341
+ "openrouter/horizon-alpha",
342
+ "openrouter/horizon-beta",
343
+ "openrouter/sonoma-dusk-alpha",
344
+ "openrouter/sonoma-sky-alpha",
345
+ "qwen/qwen-2.5-coder-32b-instruct",
346
+ "qwen/qwen2.5-vl-32b-instruct:free",
347
+ "qwen/qwen2.5-vl-72b-instruct",
348
+ "qwen/qwen2.5-vl-72b-instruct:free",
349
+ "qwen/qwen3-14b:free",
350
+ "qwen/qwen3-235b-a22b-07-25",
351
+ "qwen/qwen3-235b-a22b-07-25:free",
352
+ "qwen/qwen3-235b-a22b-thinking-2507",
353
+ "qwen/qwen3-235b-a22b:free",
354
+ "qwen/qwen3-30b-a3b-instruct-2507",
355
+ "qwen/qwen3-30b-a3b-thinking-2507",
356
+ "qwen/qwen3-30b-a3b:free",
357
+ "qwen/qwen3-32b:free",
358
+ "qwen/qwen3-8b:free",
359
+ "qwen/qwen3-coder",
360
+ "qwen/qwen3-coder:free",
361
+ "qwen/qwen3-max",
362
+ "qwen/qwen3-next-80b-a3b-instruct",
363
+ "qwen/qwen3-next-80b-a3b-thinking",
364
+ "qwen/qwq-32b:free",
365
+ "rekaai/reka-flash-3",
366
+ "sarvamai/sarvam-m:free",
367
+ "thudm/glm-z1-32b:free",
368
+ "tngtech/deepseek-r1t2-chimera:free",
369
+ "x-ai/grok-3",
370
+ "x-ai/grok-3-beta",
371
+ "x-ai/grok-3-mini",
372
+ "x-ai/grok-3-mini-beta",
373
+ "x-ai/grok-4",
374
+ "x-ai/grok-4-fast",
375
+ "x-ai/grok-4-fast:free",
376
+ "x-ai/grok-code-fast-1",
377
+ "z-ai/glm-4.5",
378
+ "z-ai/glm-4.5-air",
379
+ "z-ai/glm-4.5-air:free",
380
+ "z-ai/glm-4.5v",
381
+ "z-ai/glm-4.6"
334
382
  ],
335
- docUrl: "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
383
+ docUrl: "https://openrouter.ai/models",
336
384
  gateway: "models.dev"
337
385
  },
338
- nebius: {
339
- url: "https://api.studio.nebius.com/v1/",
340
- apiKeyEnvVar: "NEBIUS_API_KEY",
386
+ cerebras: {
387
+ url: "https://api.cerebras.ai/v1",
388
+ apiKeyEnvVar: "CEREBRAS_API_KEY",
341
389
  apiKeyHeader: "Authorization",
342
- name: "Nebius AI Studio",
343
- models: [
344
- "NousResearch/hermes-4-405b",
345
- "NousResearch/hermes-4-70b",
346
- "deepseek-ai/deepseek-v3",
347
- "meta-llama/llama-3.3-70b-instruct-base",
348
- "meta-llama/llama-3.3-70b-instruct-fast",
349
- "meta-llama/llama-3_1-405b-instruct",
350
- "moonshotai/kimi-k2-instruct",
351
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
352
- "openai/gpt-oss-120b",
353
- "openai/gpt-oss-20b",
354
- "qwen/qwen3-235b-a22b-instruct-2507",
355
- "qwen/qwen3-235b-a22b-thinking-2507",
356
- "qwen/qwen3-coder-480b-a35b-instruct",
357
- "zai-org/glm-4.5",
358
- "zai-org/glm-4.5-air"
359
- ],
360
- docUrl: "https://docs.studio.nebius.com/quickstart",
390
+ name: "Cerebras",
391
+ models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
392
+ docUrl: "https://inference-docs.cerebras.ai/models/overview",
361
393
  gateway: "models.dev"
362
394
  },
363
- deepseek: {
364
- url: "https://api.deepseek.com",
365
- apiKeyEnvVar: "DEEPSEEK_API_KEY",
395
+ zhipuai: {
396
+ url: "https://open.bigmodel.cn/api/paas/v4",
397
+ apiKeyEnvVar: "ZHIPU_API_KEY",
366
398
  apiKeyHeader: "Authorization",
367
- name: "DeepSeek",
368
- models: ["deepseek-chat", "deepseek-reasoner"],
369
- docUrl: "https://platform.deepseek.com/api-docs/pricing",
399
+ name: "Zhipu AI",
400
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
401
+ docUrl: "https://docs.z.ai/guides/overview/pricing",
370
402
  gateway: "models.dev"
371
403
  },
372
- "alibaba-cn": {
373
- url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
374
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
404
+ togetherai: {
405
+ url: "https://api.together.xyz/v1",
406
+ apiKeyEnvVar: "TOGETHER_API_KEY",
375
407
  apiKeyHeader: "Authorization",
376
- name: "Alibaba (China)",
408
+ name: "Together AI",
377
409
  models: [
378
- "deepseek-r1",
379
- "deepseek-r1-0528",
380
- "deepseek-r1-distill-llama-70b",
381
- "deepseek-r1-distill-llama-8b",
382
- "deepseek-r1-distill-qwen-1-5b",
383
- "deepseek-r1-distill-qwen-14b",
384
- "deepseek-r1-distill-qwen-32b",
385
- "deepseek-r1-distill-qwen-7b",
386
- "deepseek-v3",
387
- "deepseek-v3-1",
388
- "deepseek-v3-2-exp",
389
- "moonshot-kimi-k2-instruct",
390
- "qvq-max",
391
- "qwen-deep-research",
392
- "qwen-doc-turbo",
393
- "qwen-flash",
394
- "qwen-long",
395
- "qwen-math-plus",
396
- "qwen-math-turbo",
397
- "qwen-max",
398
- "qwen-mt-plus",
399
- "qwen-mt-turbo",
400
- "qwen-omni-turbo",
401
- "qwen-omni-turbo-realtime",
402
- "qwen-plus",
403
- "qwen-plus-character",
404
- "qwen-turbo",
405
- "qwen-vl-max",
406
- "qwen-vl-ocr",
407
- "qwen-vl-plus",
408
- "qwen2-5-14b-instruct",
409
- "qwen2-5-32b-instruct",
410
- "qwen2-5-72b-instruct",
411
- "qwen2-5-7b-instruct",
412
- "qwen2-5-coder-32b-instruct",
413
- "qwen2-5-coder-7b-instruct",
414
- "qwen2-5-math-72b-instruct",
415
- "qwen2-5-math-7b-instruct",
416
- "qwen2-5-omni-7b",
417
- "qwen2-5-vl-72b-instruct",
418
- "qwen2-5-vl-7b-instruct",
419
- "qwen3-14b",
420
- "qwen3-235b-a22b",
421
- "qwen3-32b",
422
- "qwen3-8b",
423
- "qwen3-asr-flash",
424
- "qwen3-coder-30b-a3b-instruct",
425
- "qwen3-coder-480b-a35b-instruct",
426
- "qwen3-coder-flash",
427
- "qwen3-coder-plus",
428
- "qwen3-max",
429
- "qwen3-next-80b-a3b-instruct",
430
- "qwen3-next-80b-a3b-thinking",
431
- "qwen3-omni-flash",
432
- "qwen3-omni-flash-realtime",
433
- "qwen3-vl-235b-a22b",
434
- "qwen3-vl-30b-a3b",
435
- "qwen3-vl-plus",
436
- "qwq-32b",
437
- "qwq-plus",
438
- "tongyi-intent-detect-v3"
410
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
411
+ "deepseek-ai/DeepSeek-R1",
412
+ "deepseek-ai/DeepSeek-V3",
413
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
414
+ "moonshotai/Kimi-K2-Instruct",
415
+ "openai/gpt-oss-120b"
439
416
  ],
440
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
417
+ docUrl: "https://docs.together.ai/docs/serverless-models",
441
418
  gateway: "models.dev"
442
419
  },
443
- venice: {
444
- url: "https://api.venice.ai/api/v1",
445
- apiKeyEnvVar: "VENICE_API_KEY",
420
+ wandb: {
421
+ url: "https://api.inference.wandb.ai/v1",
422
+ apiKeyEnvVar: "WANDB_API_KEY",
446
423
  apiKeyHeader: "Authorization",
447
- name: "Venice AI",
424
+ name: "Weights & Biases",
448
425
  models: [
449
- "deepseek-coder-v2-lite",
450
- "deepseek-r1-671b",
451
- "dolphin-2.9.2-qwen2-72b",
452
- "llama-3.1-405b",
453
- "llama-3.2-3b",
454
- "llama-3.3-70b",
455
- "mistral-31-24b",
456
- "qwen-2.5-coder-32b",
457
- "qwen-2.5-qwq-32b",
458
- "qwen-2.5-vl",
459
- "qwen3-235b",
460
- "qwen3-4b",
461
- "venice-uncensored"
426
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
427
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
428
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
429
+ "deepseek-ai/DeepSeek-R1-0528",
430
+ "deepseek-ai/DeepSeek-V3-0324",
431
+ "meta-llama/Llama-3.1-8B-Instruct",
432
+ "meta-llama/Llama-3.3-70B-Instruct",
433
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
434
+ "microsoft/Phi-4-mini-instruct",
435
+ "moonshotai/Kimi-K2-Instruct"
462
436
  ],
463
- docUrl: "https://docs.venice.ai",
437
+ docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
464
438
  gateway: "models.dev"
465
439
  },
466
- chutes: {
467
- url: "https://llm.chutes.ai/v1",
468
- apiKeyEnvVar: "CHUTES_API_KEY",
440
+ submodel: {
441
+ url: "https://llm.submodel.ai/v1",
442
+ apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
469
443
  apiKeyHeader: "Authorization",
470
- name: "Chutes",
444
+ name: "submodel",
471
445
  models: [
472
446
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
473
447
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
474
- "Qwen/Qwen3-30B-A3B",
475
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
476
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
477
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
478
448
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
479
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
480
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
481
- "chutesai/Devstral-Small-2505",
482
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
483
449
  "deepseek-ai/DeepSeek-R1-0528",
484
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
485
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
486
450
  "deepseek-ai/DeepSeek-V3-0324",
487
451
  "deepseek-ai/DeepSeek-V3.1",
488
- "deepseek-ai/DeepSeek-V3.1-Terminus",
489
- "deepseek-ai/DeepSeek-V3.1-turbo",
490
- "deepseek-ai/DeepSeek-V3.1:THINKING",
491
- "deepseek-ai/DeepSeek-V3.2-Exp",
492
- "meituan-longcat/LongCat-Flash-Chat-FP8",
493
- "moonshotai/Kimi-Dev-72B",
494
- "moonshotai/Kimi-K2-Instruct-0905",
495
- "moonshotai/Kimi-K2-Instruct-75k",
496
- "moonshotai/Kimi-VL-A3B-Thinking",
497
452
  "openai/gpt-oss-120b",
498
- "tngtech/DeepSeek-R1T-Chimera",
499
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
500
453
  "zai-org/GLM-4.5-Air",
501
- "zai-org/GLM-4.5-FP8",
502
- "zai-org/GLM-4.5-turbo",
503
- "zai-org/GLM-4.6-FP8",
504
- "zai-org/GLM-4.6-turbo"
505
- ],
506
- docUrl: "https://llm.chutes.ai/v1/models",
507
- gateway: "models.dev"
508
- },
509
- cortecs: {
510
- url: "https://api.cortecs.ai/v1",
511
- apiKeyEnvVar: "CORTECS_API_KEY",
512
- apiKeyHeader: "Authorization",
513
- name: "Cortecs",
514
- models: [
515
- "claude-4-5-sonnet",
516
- "claude-sonnet-4",
517
- "deepseek-v3-0324",
518
- "gemini-2.5-pro",
519
- "gpt-4.1",
520
- "gpt-oss-120b",
521
- "kimi-k2-instruct",
522
- "llama-3.1-405b-instruct",
523
- "nova-pro-v1",
524
- "qwen3-32b",
525
- "qwen3-coder-480b-a35b-instruct"
454
+ "zai-org/GLM-4.5-FP8"
526
455
  ],
527
- docUrl: "https://api.cortecs.ai/v1/models",
456
+ docUrl: "https://submodel.gitbook.io",
528
457
  gateway: "models.dev"
529
458
  },
530
- "github-models": {
531
- url: "https://models.github.ai/inference",
532
- apiKeyEnvVar: "GITHUB_TOKEN",
459
+ vercel: {
460
+ url: "https://ai-gateway.vercel.sh/v1",
461
+ apiKeyEnvVar: "AI_GATEWAY_API_KEY",
533
462
  apiKeyHeader: "Authorization",
534
- name: "GitHub Models",
463
+ name: "Vercel AI Gateway",
535
464
  models: [
536
- "ai21-labs/ai21-jamba-1.5-large",
537
- "ai21-labs/ai21-jamba-1.5-mini",
538
- "cohere/cohere-command-a",
539
- "cohere/cohere-command-r",
540
- "cohere/cohere-command-r-08-2024",
541
- "cohere/cohere-command-r-plus",
542
- "cohere/cohere-command-r-plus-08-2024",
543
- "core42/jais-30b-chat",
465
+ "alibaba/qwen3-coder-plus",
466
+ "alibaba/qwen3-max",
467
+ "alibaba/qwen3-next-80b-a3b-instruct",
468
+ "alibaba/qwen3-next-80b-a3b-thinking",
469
+ "alibaba/qwen3-vl-instruct",
470
+ "alibaba/qwen3-vl-thinking",
471
+ "amazon/nova-lite",
472
+ "amazon/nova-micro",
473
+ "amazon/nova-pro",
474
+ "anthropic/claude-3-5-haiku",
475
+ "anthropic/claude-3-haiku",
476
+ "anthropic/claude-3-opus",
477
+ "anthropic/claude-3.5-sonnet",
478
+ "anthropic/claude-3.7-sonnet",
479
+ "anthropic/claude-4-1-opus",
480
+ "anthropic/claude-4-opus",
481
+ "anthropic/claude-4-sonnet",
482
+ "anthropic/claude-4.5-sonnet",
483
+ "anthropic/claude-haiku-4.5",
484
+ "cerebras/qwen3-coder",
544
485
  "deepseek/deepseek-r1",
545
- "deepseek/deepseek-r1-0528",
546
- "deepseek/deepseek-v3-0324",
547
- "meta/llama-3.2-11b-vision-instruct",
548
- "meta/llama-3.2-90b-vision-instruct",
549
- "meta/llama-3.3-70b-instruct",
550
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
551
- "meta/llama-4-scout-17b-16e-instruct",
552
- "meta/meta-llama-3-70b-instruct",
553
- "meta/meta-llama-3-8b-instruct",
554
- "meta/meta-llama-3.1-405b-instruct",
555
- "meta/meta-llama-3.1-70b-instruct",
556
- "meta/meta-llama-3.1-8b-instruct",
557
- "microsoft/mai-ds-r1",
558
- "microsoft/phi-3-medium-128k-instruct",
559
- "microsoft/phi-3-medium-4k-instruct",
560
- "microsoft/phi-3-mini-128k-instruct",
561
- "microsoft/phi-3-mini-4k-instruct",
562
- "microsoft/phi-3-small-128k-instruct",
563
- "microsoft/phi-3-small-8k-instruct",
564
- "microsoft/phi-3.5-mini-instruct",
565
- "microsoft/phi-3.5-moe-instruct",
566
- "microsoft/phi-3.5-vision-instruct",
567
- "microsoft/phi-4",
568
- "microsoft/phi-4-mini-instruct",
569
- "microsoft/phi-4-mini-reasoning",
570
- "microsoft/phi-4-multimodal-instruct",
571
- "microsoft/phi-4-reasoning",
572
- "mistral-ai/codestral-2501",
573
- "mistral-ai/ministral-3b",
574
- "mistral-ai/mistral-large-2411",
575
- "mistral-ai/mistral-medium-2505",
576
- "mistral-ai/mistral-nemo",
577
- "mistral-ai/mistral-small-2503",
486
+ "deepseek/deepseek-r1-distill-llama-70b",
487
+ "deepseek/deepseek-v3.1-terminus",
488
+ "deepseek/deepseek-v3.2-exp",
489
+ "deepseek/deepseek-v3.2-exp-thinking",
490
+ "google/gemini-2.0-flash",
491
+ "google/gemini-2.0-flash-lite",
492
+ "google/gemini-2.5-flash",
493
+ "google/gemini-2.5-flash-lite",
494
+ "google/gemini-2.5-flash-lite-preview-09-2025",
495
+ "google/gemini-2.5-flash-preview-09-2025",
496
+ "google/gemini-2.5-pro",
497
+ "meta/llama-3.3-70b",
498
+ "meta/llama-4-maverick",
499
+ "meta/llama-4-scout",
500
+ "mistral/codestral",
501
+ "mistral/magistral-medium",
502
+ "mistral/magistral-small",
503
+ "mistral/ministral-3b",
504
+ "mistral/ministral-8b",
505
+ "mistral/mistral-large",
506
+ "mistral/mistral-small",
507
+ "mistral/mixtral-8x22b-instruct",
508
+ "mistral/pixtral-12b",
509
+ "mistral/pixtral-large",
510
+ "moonshotai/kimi-k2",
511
+ "morph/morph-v3-fast",
512
+ "morph/morph-v3-large",
513
+ "openai/gpt-4-turbo",
578
514
  "openai/gpt-4.1",
579
515
  "openai/gpt-4.1-mini",
580
516
  "openai/gpt-4.1-nano",
581
517
  "openai/gpt-4o",
582
518
  "openai/gpt-4o-mini",
519
+ "openai/gpt-5",
520
+ "openai/gpt-5-codex",
521
+ "openai/gpt-5-mini",
522
+ "openai/gpt-5-nano",
523
+ "openai/gpt-oss-120b",
524
+ "openai/gpt-oss-20b",
583
525
  "openai/o1",
584
- "openai/o1-mini",
585
- "openai/o1-preview",
586
526
  "openai/o3",
587
527
  "openai/o3-mini",
588
528
  "openai/o4-mini",
529
+ "perplexity/sonar",
530
+ "perplexity/sonar-pro",
531
+ "perplexity/sonar-reasoning",
532
+ "perplexity/sonar-reasoning-pro",
533
+ "vercel/v0-1.0-md",
534
+ "vercel/v0-1.5-md",
535
+ "xai/grok-2",
536
+ "xai/grok-2-vision",
589
537
  "xai/grok-3",
590
- "xai/grok-3-mini"
591
- ],
592
- docUrl: "https://docs.github.com/en/github-models",
593
- gateway: "models.dev"
594
- },
595
- togetherai: {
596
- url: "https://api.together.xyz/v1",
597
- apiKeyEnvVar: "TOGETHER_API_KEY",
598
- apiKeyHeader: "Authorization",
599
- name: "Together AI",
600
- models: [
601
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
602
- "deepseek-ai/DeepSeek-R1",
603
- "deepseek-ai/DeepSeek-V3",
604
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
605
- "moonshotai/Kimi-K2-Instruct",
606
- "openai/gpt-oss-120b"
607
- ],
608
- docUrl: "https://docs.together.ai/docs/serverless-models",
609
- gateway: "models.dev"
610
- },
611
- baseten: {
612
- url: "https://inference.baseten.co/v1",
613
- apiKeyEnvVar: "BASETEN_API_KEY",
614
- apiKeyHeader: "Authorization",
615
- name: "Baseten",
616
- models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905"],
617
- docUrl: "https://docs.baseten.co/development/model-apis/overview",
618
- gateway: "models.dev"
619
- },
620
- huggingface: {
621
- url: "https://router.huggingface.co/v1",
622
- apiKeyEnvVar: "HF_TOKEN",
623
- apiKeyHeader: "Authorization",
624
- name: "Hugging Face",
625
- models: [
626
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
627
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
628
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
629
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
630
- "deepseek-ai/DeepSeek-R1-0528",
631
- "deepseek-ai/Deepseek-V3-0324",
632
- "moonshotai/Kimi-K2-Instruct",
633
- "moonshotai/Kimi-K2-Instruct-0905",
634
- "zai-org/GLM-4.5",
635
- "zai-org/GLM-4.5-Air",
636
- "zai-org/GLM-4.6"
637
- ],
638
- docUrl: "https://huggingface.co/docs/inference-providers",
639
- gateway: "models.dev"
640
- },
641
- opencode: {
642
- url: "https://opencode.ai/zen/v1",
643
- apiKeyEnvVar: "OPENCODE_API_KEY",
644
- apiKeyHeader: "Authorization",
645
- name: "OpenCode Zen",
646
- models: [
647
- "an-g8x",
648
- "claude-3-5-haiku",
649
- "claude-haiku-4-5",
650
- "claude-opus-4-1",
651
- "claude-sonnet-4",
652
- "claude-sonnet-4-5",
653
- "code-supernova",
654
- "glm-4.6",
655
- "gpt-5",
656
- "gpt-5-codex",
657
- "grok-code",
658
- "kimi-k2",
659
- "qwen3-coder"
538
+ "xai/grok-3-fast",
539
+ "xai/grok-3-mini",
540
+ "xai/grok-3-mini-fast",
541
+ "xai/grok-4",
542
+ "xai/grok-4-fast",
543
+ "xai/grok-4-fast-non-reasoning",
544
+ "xai/grok-code-fast-1",
545
+ "zai/glm-4.5",
546
+ "zai/glm-4.5-air",
547
+ "zai/glm-4.5v",
548
+ "zai/glm-4.6"
660
549
  ],
661
- docUrl: "https://opencode.ai/docs/zen",
550
+ docUrl: "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
662
551
  gateway: "models.dev"
663
552
  },
664
- fastrouter: {
665
- url: "https://go.fastrouter.ai/api/v1",
666
- apiKeyEnvVar: "FASTROUTER_API_KEY",
553
+ synthetic: {
554
+ url: "https://api.synthetic.new/v1",
555
+ apiKeyEnvVar: "SYNTHETIC_API_KEY",
667
556
  apiKeyHeader: "Authorization",
668
- name: "FastRouter",
557
+ name: "Synthetic",
669
558
  models: [
670
- "anthropic/claude-opus-4.1",
671
- "anthropic/claude-sonnet-4",
672
- "deepseek-ai/deepseek-r1-distill-llama-70b",
673
- "google/gemini-2.5-flash",
674
- "google/gemini-2.5-pro",
675
- "moonshotai/kimi-k2",
676
- "openai/gpt-4.1",
677
- "openai/gpt-5",
678
- "openai/gpt-5-mini",
679
- "openai/gpt-5-nano",
680
- "openai/gpt-oss-120b",
681
- "openai/gpt-oss-20b",
682
- "qwen/qwen3-coder",
683
- "x-ai/grok-4"
559
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
560
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
561
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
562
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
563
+ "hf:deepseek-ai/DeepSeek-R1",
564
+ "hf:deepseek-ai/DeepSeek-R1-0528",
565
+ "hf:deepseek-ai/DeepSeek-V3",
566
+ "hf:deepseek-ai/DeepSeek-V3-0324",
567
+ "hf:deepseek-ai/DeepSeek-V3.1",
568
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
569
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
570
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
571
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
572
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
573
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
574
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
575
+ "hf:moonshotai/Kimi-K2-Instruct",
576
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
577
+ "hf:openai/gpt-oss-120b",
578
+ "hf:zai-org/GLM-4.5",
579
+ "hf:zai-org/GLM-4.6"
684
580
  ],
685
- docUrl: "https://fastrouter.ai/models",
581
+ docUrl: "https://synthetic.new/pricing",
686
582
  gateway: "models.dev"
687
583
  },
688
584
  google: {
@@ -716,236 +612,105 @@ var provider_registry_default = {
716
612
  docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
717
613
  gateway: "models.dev"
718
614
  },
719
- inception: {
720
- url: "https://api.inceptionlabs.ai/v1/",
721
- apiKeyEnvVar: "INCEPTION_API_KEY",
615
+ groq: {
616
+ url: "https://api.groq.com/openai/v1",
617
+ apiKeyEnvVar: "GROQ_API_KEY",
722
618
  apiKeyHeader: "Authorization",
723
- name: "Inception",
724
- models: ["mercury", "mercury-coder"],
725
- docUrl: "https://platform.inceptionlabs.ai/docs",
619
+ name: "Groq",
620
+ models: [
621
+ "deepseek-r1-distill-llama-70b",
622
+ "gemma2-9b-it",
623
+ "llama-3.1-8b-instant",
624
+ "llama-3.3-70b-versatile",
625
+ "llama-guard-3-8b",
626
+ "llama3-70b-8192",
627
+ "llama3-8b-8192",
628
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
629
+ "meta-llama/llama-4-scout-17b-16e-instruct",
630
+ "meta-llama/llama-guard-4-12b",
631
+ "mistral-saba-24b",
632
+ "moonshotai/kimi-k2-instruct",
633
+ "moonshotai/kimi-k2-instruct-0905",
634
+ "openai/gpt-oss-120b",
635
+ "openai/gpt-oss-20b",
636
+ "qwen-qwq-32b",
637
+ "qwen/qwen3-32b"
638
+ ],
639
+ docUrl: "https://console.groq.com/docs/models",
726
640
  gateway: "models.dev"
727
641
  },
728
- wandb: {
729
- url: "https://api.inference.wandb.ai/v1",
730
- apiKeyEnvVar: "WANDB_API_KEY",
642
+ "moonshotai-cn": {
643
+ url: "https://api.moonshot.cn/v1",
644
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
731
645
  apiKeyHeader: "Authorization",
732
- name: "Weights & Biases",
733
- models: [
734
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
735
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
736
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
737
- "deepseek-ai/DeepSeek-R1-0528",
738
- "deepseek-ai/DeepSeek-V3-0324",
739
- "meta-llama/Llama-3.1-8B-Instruct",
740
- "meta-llama/Llama-3.3-70B-Instruct",
741
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
742
- "microsoft/Phi-4-mini-instruct",
743
- "moonshotai/Kimi-K2-Instruct"
744
- ],
745
- docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
646
+ name: "Moonshot AI (China)",
647
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
648
+ docUrl: "https://platform.moonshot.cn/docs/api/chat",
746
649
  gateway: "models.dev"
747
650
  },
748
- openai: {
749
- apiKeyEnvVar: "OPENAI_API_KEY",
750
- name: "OpenAI",
651
+ "github-models": {
652
+ url: "https://models.github.ai/inference",
653
+ apiKeyEnvVar: "GITHUB_TOKEN",
654
+ apiKeyHeader: "Authorization",
655
+ name: "GitHub Models",
751
656
  models: [
752
- "codex-mini-latest",
753
- "gpt-3.5-turbo",
754
- "gpt-4",
755
- "gpt-4-turbo",
756
- "gpt-4.1",
757
- "gpt-4.1-mini",
758
- "gpt-4.1-nano",
759
- "gpt-4o",
760
- "gpt-4o-2024-05-13",
761
- "gpt-4o-2024-08-06",
762
- "gpt-4o-2024-11-20",
763
- "gpt-4o-mini",
764
- "gpt-5",
765
- "gpt-5-chat-latest",
766
- "gpt-5-codex",
767
- "gpt-5-mini",
768
- "gpt-5-nano",
769
- "o1",
770
- "o1-mini",
771
- "o1-preview",
772
- "o1-pro",
773
- "o3",
774
- "o3-deep-research",
775
- "o3-mini",
776
- "o3-pro",
777
- "o4-mini",
778
- "o4-mini-deep-research"
779
- ],
780
- docUrl: "https://platform.openai.com/docs/models",
781
- gateway: "models.dev"
782
- },
783
- "zhipuai-coding-plan": {
784
- url: "https://open.bigmodel.cn/api/coding/paas/v4",
785
- apiKeyEnvVar: "ZHIPU_API_KEY",
786
- apiKeyHeader: "Authorization",
787
- name: "Zhipu AI Coding Plan",
788
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
789
- docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
790
- gateway: "models.dev"
791
- },
792
- perplexity: {
793
- url: "https://api.perplexity.ai",
794
- apiKeyEnvVar: "PERPLEXITY_API_KEY",
795
- apiKeyHeader: "Authorization",
796
- name: "Perplexity",
797
- models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
798
- docUrl: "https://docs.perplexity.ai",
799
- gateway: "models.dev"
800
- },
801
- openrouter: {
802
- url: "https://openrouter.ai/api/v1",
803
- apiKeyEnvVar: "OPENROUTER_API_KEY",
804
- name: "OpenRouter",
805
- models: [
806
- "anthropic/claude-3.5-haiku",
807
- "anthropic/claude-3.7-sonnet",
808
- "anthropic/claude-4.5-haiku",
809
- "anthropic/claude-opus-4",
810
- "anthropic/claude-opus-4.1",
811
- "anthropic/claude-sonnet-4",
812
- "anthropic/claude-sonnet-4.5",
813
- "cognitivecomputations/dolphin3.0-mistral-24b",
814
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
815
- "deepseek/deepseek-chat-v3-0324",
816
- "deepseek/deepseek-chat-v3.1",
817
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
818
- "deepseek/deepseek-r1-0528:free",
819
- "deepseek/deepseek-r1-distill-llama-70b",
820
- "deepseek/deepseek-r1-distill-qwen-14b",
821
- "deepseek/deepseek-r1:free",
822
- "deepseek/deepseek-v3-base:free",
823
- "deepseek/deepseek-v3.1-terminus",
824
- "featherless/qwerky-72b",
825
- "google/gemini-2.0-flash-001",
826
- "google/gemini-2.0-flash-exp:free",
827
- "google/gemini-2.5-flash",
828
- "google/gemini-2.5-flash-lite",
829
- "google/gemini-2.5-flash-lite-preview-09-2025",
830
- "google/gemini-2.5-flash-preview-09-2025",
831
- "google/gemini-2.5-pro",
832
- "google/gemini-2.5-pro-preview-05-06",
833
- "google/gemini-2.5-pro-preview-06-05",
834
- "google/gemma-2-9b-it:free",
835
- "google/gemma-3-12b-it",
836
- "google/gemma-3-27b-it",
837
- "google/gemma-3n-e4b-it",
838
- "google/gemma-3n-e4b-it:free",
839
- "meta-llama/llama-3.2-11b-vision-instruct",
840
- "meta-llama/llama-3.3-70b-instruct:free",
841
- "meta-llama/llama-4-scout:free",
842
- "microsoft/mai-ds-r1:free",
843
- "mistralai/codestral-2508",
844
- "mistralai/devstral-medium-2507",
845
- "mistralai/devstral-small-2505",
846
- "mistralai/devstral-small-2505:free",
847
- "mistralai/devstral-small-2507",
848
- "mistralai/mistral-7b-instruct:free",
849
- "mistralai/mistral-medium-3",
850
- "mistralai/mistral-medium-3.1",
851
- "mistralai/mistral-nemo:free",
852
- "mistralai/mistral-small-3.1-24b-instruct",
853
- "mistralai/mistral-small-3.2-24b-instruct",
854
- "mistralai/mistral-small-3.2-24b-instruct:free",
855
- "moonshotai/kimi-dev-72b:free",
856
- "moonshotai/kimi-k2",
857
- "moonshotai/kimi-k2-0905",
858
- "moonshotai/kimi-k2:free",
859
- "nousresearch/deephermes-3-llama-3-8b-preview",
860
- "nousresearch/hermes-4-405b",
861
- "nousresearch/hermes-4-70b",
657
+ "ai21-labs/ai21-jamba-1.5-large",
658
+ "ai21-labs/ai21-jamba-1.5-mini",
659
+ "cohere/cohere-command-a",
660
+ "cohere/cohere-command-r",
661
+ "cohere/cohere-command-r-08-2024",
662
+ "cohere/cohere-command-r-plus",
663
+ "cohere/cohere-command-r-plus-08-2024",
664
+ "core42/jais-30b-chat",
665
+ "deepseek/deepseek-r1",
666
+ "deepseek/deepseek-r1-0528",
667
+ "deepseek/deepseek-v3-0324",
668
+ "meta/llama-3.2-11b-vision-instruct",
669
+ "meta/llama-3.2-90b-vision-instruct",
670
+ "meta/llama-3.3-70b-instruct",
671
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
672
+ "meta/llama-4-scout-17b-16e-instruct",
673
+ "meta/meta-llama-3-70b-instruct",
674
+ "meta/meta-llama-3-8b-instruct",
675
+ "meta/meta-llama-3.1-405b-instruct",
676
+ "meta/meta-llama-3.1-70b-instruct",
677
+ "meta/meta-llama-3.1-8b-instruct",
678
+ "microsoft/mai-ds-r1",
679
+ "microsoft/phi-3-medium-128k-instruct",
680
+ "microsoft/phi-3-medium-4k-instruct",
681
+ "microsoft/phi-3-mini-128k-instruct",
682
+ "microsoft/phi-3-mini-4k-instruct",
683
+ "microsoft/phi-3-small-128k-instruct",
684
+ "microsoft/phi-3-small-8k-instruct",
685
+ "microsoft/phi-3.5-mini-instruct",
686
+ "microsoft/phi-3.5-moe-instruct",
687
+ "microsoft/phi-3.5-vision-instruct",
688
+ "microsoft/phi-4",
689
+ "microsoft/phi-4-mini-instruct",
690
+ "microsoft/phi-4-mini-reasoning",
691
+ "microsoft/phi-4-multimodal-instruct",
692
+ "microsoft/phi-4-reasoning",
693
+ "mistral-ai/codestral-2501",
694
+ "mistral-ai/ministral-3b",
695
+ "mistral-ai/mistral-large-2411",
696
+ "mistral-ai/mistral-medium-2505",
697
+ "mistral-ai/mistral-nemo",
698
+ "mistral-ai/mistral-small-2503",
862
699
  "openai/gpt-4.1",
863
700
  "openai/gpt-4.1-mini",
701
+ "openai/gpt-4.1-nano",
702
+ "openai/gpt-4o",
864
703
  "openai/gpt-4o-mini",
865
- "openai/gpt-5",
866
- "openai/gpt-5-chat",
867
- "openai/gpt-5-codex",
868
- "openai/gpt-5-image",
869
- "openai/gpt-5-mini",
870
- "openai/gpt-5-nano",
871
- "openai/gpt-oss-120b",
872
- "openai/gpt-oss-20b",
704
+ "openai/o1",
705
+ "openai/o1-mini",
706
+ "openai/o1-preview",
707
+ "openai/o3",
708
+ "openai/o3-mini",
873
709
  "openai/o4-mini",
874
- "openrouter/cypher-alpha:free",
875
- "openrouter/horizon-alpha",
876
- "openrouter/horizon-beta",
877
- "openrouter/sonoma-dusk-alpha",
878
- "openrouter/sonoma-sky-alpha",
879
- "qwen/qwen-2.5-coder-32b-instruct",
880
- "qwen/qwen2.5-vl-32b-instruct:free",
881
- "qwen/qwen2.5-vl-72b-instruct",
882
- "qwen/qwen2.5-vl-72b-instruct:free",
883
- "qwen/qwen3-14b:free",
884
- "qwen/qwen3-235b-a22b-07-25",
885
- "qwen/qwen3-235b-a22b-07-25:free",
886
- "qwen/qwen3-235b-a22b-thinking-2507",
887
- "qwen/qwen3-235b-a22b:free",
888
- "qwen/qwen3-30b-a3b-instruct-2507",
889
- "qwen/qwen3-30b-a3b-thinking-2507",
890
- "qwen/qwen3-30b-a3b:free",
891
- "qwen/qwen3-32b:free",
892
- "qwen/qwen3-8b:free",
893
- "qwen/qwen3-coder",
894
- "qwen/qwen3-coder:free",
895
- "qwen/qwen3-max",
896
- "qwen/qwen3-next-80b-a3b-instruct",
897
- "qwen/qwen3-next-80b-a3b-thinking",
898
- "qwen/qwq-32b:free",
899
- "rekaai/reka-flash-3",
900
- "sarvamai/sarvam-m:free",
901
- "thudm/glm-z1-32b:free",
902
- "tngtech/deepseek-r1t2-chimera:free",
903
- "x-ai/grok-3",
904
- "x-ai/grok-3-beta",
905
- "x-ai/grok-3-mini",
906
- "x-ai/grok-3-mini-beta",
907
- "x-ai/grok-4",
908
- "x-ai/grok-4-fast",
909
- "x-ai/grok-4-fast:free",
910
- "x-ai/grok-code-fast-1",
911
- "z-ai/glm-4.5",
912
- "z-ai/glm-4.5-air",
913
- "z-ai/glm-4.5-air:free",
914
- "z-ai/glm-4.5v",
915
- "z-ai/glm-4.6"
916
- ],
917
- docUrl: "https://openrouter.ai/models",
918
- gateway: "models.dev"
919
- },
920
- synthetic: {
921
- url: "https://api.synthetic.new/v1",
922
- apiKeyEnvVar: "SYNTHETIC_API_KEY",
923
- apiKeyHeader: "Authorization",
924
- name: "Synthetic",
925
- models: [
926
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
927
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
928
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
929
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
930
- "hf:deepseek-ai/DeepSeek-R1",
931
- "hf:deepseek-ai/DeepSeek-R1-0528",
932
- "hf:deepseek-ai/DeepSeek-V3",
933
- "hf:deepseek-ai/DeepSeek-V3-0324",
934
- "hf:deepseek-ai/DeepSeek-V3.1",
935
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
936
- "hf:meta-llama/Llama-3.1-405B-Instruct",
937
- "hf:meta-llama/Llama-3.1-70B-Instruct",
938
- "hf:meta-llama/Llama-3.1-8B-Instruct",
939
- "hf:meta-llama/Llama-3.3-70B-Instruct",
940
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
941
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
942
- "hf:moonshotai/Kimi-K2-Instruct",
943
- "hf:moonshotai/Kimi-K2-Instruct-0905",
944
- "hf:openai/gpt-oss-120b",
945
- "hf:zai-org/GLM-4.5",
946
- "hf:zai-org/GLM-4.6"
710
+ "xai/grok-3",
711
+ "xai/grok-3-mini"
947
712
  ],
948
- docUrl: "https://synthetic.new/pricing",
713
+ docUrl: "https://docs.github.com/en/github-models",
949
714
  gateway: "models.dev"
950
715
  },
951
716
  deepinfra: {
@@ -962,92 +727,92 @@ var provider_registry_default = {
962
727
  docUrl: "https://deepinfra.com/models",
963
728
  gateway: "models.dev"
964
729
  },
965
- zhipuai: {
966
- url: "https://open.bigmodel.cn/api/paas/v4",
730
+ "fireworks-ai": {
731
+ url: "https://api.fireworks.ai/inference/v1/",
732
+ apiKeyEnvVar: "FIREWORKS_API_KEY",
733
+ apiKeyHeader: "Authorization",
734
+ name: "Fireworks AI",
735
+ models: [
736
+ "accounts/fireworks/models/deepseek-r1-0528",
737
+ "accounts/fireworks/models/deepseek-v3-0324",
738
+ "accounts/fireworks/models/deepseek-v3p1",
739
+ "accounts/fireworks/models/glm-4p5",
740
+ "accounts/fireworks/models/glm-4p5-air",
741
+ "accounts/fireworks/models/gpt-oss-120b",
742
+ "accounts/fireworks/models/gpt-oss-20b",
743
+ "accounts/fireworks/models/kimi-k2-instruct",
744
+ "accounts/fireworks/models/qwen3-235b-a22b",
745
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
746
+ ],
747
+ docUrl: "https://fireworks.ai/docs/",
748
+ gateway: "models.dev"
749
+ },
750
+ zai: {
751
+ url: "https://api.z.ai/api/paas/v4",
967
752
  apiKeyEnvVar: "ZHIPU_API_KEY",
968
753
  apiKeyHeader: "Authorization",
969
- name: "Zhipu AI",
754
+ name: "Z.AI",
970
755
  models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
971
756
  docUrl: "https://docs.z.ai/guides/overview/pricing",
972
757
  gateway: "models.dev"
973
758
  },
974
- submodel: {
975
- url: "https://llm.submodel.ai/v1",
976
- apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
759
+ opencode: {
760
+ url: "https://opencode.ai/zen/v1",
761
+ apiKeyEnvVar: "OPENCODE_API_KEY",
977
762
  apiKeyHeader: "Authorization",
978
- name: "submodel",
763
+ name: "OpenCode Zen",
979
764
  models: [
980
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
981
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
982
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
983
- "deepseek-ai/DeepSeek-R1-0528",
984
- "deepseek-ai/DeepSeek-V3-0324",
985
- "deepseek-ai/DeepSeek-V3.1",
986
- "openai/gpt-oss-120b",
987
- "zai-org/GLM-4.5-Air",
988
- "zai-org/GLM-4.5-FP8"
765
+ "an-gbt",
766
+ "big-pickle",
767
+ "claude-3-5-haiku",
768
+ "claude-haiku-4-5",
769
+ "claude-opus-4-1",
770
+ "claude-sonnet-4",
771
+ "claude-sonnet-4-5",
772
+ "code-supernova",
773
+ "glm-4.6",
774
+ "gpt-5",
775
+ "gpt-5-codex",
776
+ "grok-code",
777
+ "kimi-k2",
778
+ "qwen3-coder"
989
779
  ],
990
- docUrl: "https://submodel.gitbook.io",
780
+ docUrl: "https://opencode.ai/docs/zen",
991
781
  gateway: "models.dev"
992
782
  },
993
- zai: {
994
- url: "https://api.z.ai/api/paas/v4",
783
+ "zhipuai-coding-plan": {
784
+ url: "https://open.bigmodel.cn/api/coding/paas/v4",
995
785
  apiKeyEnvVar: "ZHIPU_API_KEY",
996
786
  apiKeyHeader: "Authorization",
997
- name: "Z.AI",
787
+ name: "Zhipu AI Coding Plan",
998
788
  models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
999
- docUrl: "https://docs.z.ai/guides/overview/pricing",
789
+ docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
1000
790
  gateway: "models.dev"
1001
791
  },
1002
- inference: {
1003
- url: "https://inference.net/v1",
1004
- apiKeyEnvVar: "INFERENCE_API_KEY",
792
+ inception: {
793
+ url: "https://api.inceptionlabs.ai/v1/",
794
+ apiKeyEnvVar: "INCEPTION_API_KEY",
1005
795
  apiKeyHeader: "Authorization",
1006
- name: "Inference",
1007
- models: [
1008
- "google/gemma-3",
1009
- "meta/llama-3.1-8b-instruct",
1010
- "meta/llama-3.2-11b-vision-instruct",
1011
- "meta/llama-3.2-1b-instruct",
1012
- "meta/llama-3.2-3b-instruct",
1013
- "mistral/mistral-nemo-12b-instruct",
1014
- "osmosis/osmosis-structure-0.6b",
1015
- "qwen/qwen-2.5-7b-vision-instruct",
1016
- "qwen/qwen3-embedding-4b"
1017
- ],
1018
- docUrl: "https://inference.net/models",
796
+ name: "Inception",
797
+ models: ["mercury", "mercury-coder"],
798
+ docUrl: "https://platform.inceptionlabs.ai/docs",
1019
799
  gateway: "models.dev"
1020
800
  },
1021
- requesty: {
1022
- url: "https://router.requesty.ai/v1",
1023
- apiKeyEnvVar: "REQUESTY_API_KEY",
801
+ llama: {
802
+ url: "https://api.llama.com/compat/v1/",
803
+ apiKeyEnvVar: "LLAMA_API_KEY",
1024
804
  apiKeyHeader: "Authorization",
1025
- name: "Requesty",
805
+ name: "Llama",
1026
806
  models: [
1027
- "anthropic/claude-3-7-sonnet",
1028
- "anthropic/claude-4-sonnet-20250522",
1029
- "anthropic/claude-opus-4",
1030
- "anthropic/claude-opus-4-1-20250805",
1031
- "google/gemini-2.5-flash",
1032
- "google/gemini-2.5-pro",
1033
- "openai/gpt-4.1",
1034
- "openai/gpt-4.1-mini",
1035
- "openai/gpt-4o-mini",
1036
- "openai/gpt-5",
1037
- "openai/gpt-5-mini",
1038
- "openai/gpt-5-nano",
1039
- "openai/o4-mini"
807
+ "cerebras-llama-4-maverick-17b-128e-instruct",
808
+ "cerebras-llama-4-scout-17b-16e-instruct",
809
+ "groq-llama-4-maverick-17b-128e-instruct",
810
+ "llama-3.3-70b-instruct",
811
+ "llama-3.3-8b-instruct",
812
+ "llama-4-maverick-17b-128e-instruct-fp8",
813
+ "llama-4-scout-17b-16e-instruct-fp8"
1040
814
  ],
1041
- docUrl: "https://requesty.ai/solution/llm-routing/models",
1042
- gateway: "models.dev"
1043
- },
1044
- morph: {
1045
- url: "https://api.morphllm.com/v1",
1046
- apiKeyEnvVar: "MORPH_API_KEY",
1047
- apiKeyHeader: "Authorization",
1048
- name: "Morph",
1049
- models: ["auto", "morph-v3-fast", "morph-v3-large"],
1050
- docUrl: "https://docs.morphllm.com/api-reference/introduction",
815
+ docUrl: "https://llama.developer.meta.com/docs/models",
1051
816
  gateway: "models.dev"
1052
817
  },
1053
818
  lmstudio: {
@@ -1059,97 +824,359 @@ var provider_registry_default = {
1059
824
  docUrl: "https://lmstudio.ai/models",
1060
825
  gateway: "models.dev"
1061
826
  },
827
+ openai: {
828
+ apiKeyEnvVar: "OPENAI_API_KEY",
829
+ name: "OpenAI",
830
+ models: [
831
+ "codex-mini-latest",
832
+ "gpt-3.5-turbo",
833
+ "gpt-4",
834
+ "gpt-4-turbo",
835
+ "gpt-4.1",
836
+ "gpt-4.1-mini",
837
+ "gpt-4.1-nano",
838
+ "gpt-4o",
839
+ "gpt-4o-2024-05-13",
840
+ "gpt-4o-2024-08-06",
841
+ "gpt-4o-2024-11-20",
842
+ "gpt-4o-mini",
843
+ "gpt-5",
844
+ "gpt-5-chat-latest",
845
+ "gpt-5-codex",
846
+ "gpt-5-mini",
847
+ "gpt-5-nano",
848
+ "o1",
849
+ "o1-mini",
850
+ "o1-preview",
851
+ "o1-pro",
852
+ "o3",
853
+ "o3-deep-research",
854
+ "o3-mini",
855
+ "o3-pro",
856
+ "o4-mini",
857
+ "o4-mini-deep-research"
858
+ ],
859
+ docUrl: "https://platform.openai.com/docs/models",
860
+ gateway: "models.dev"
861
+ },
1062
862
  anthropic: {
1063
863
  apiKeyEnvVar: "ANTHROPIC_API_KEY",
1064
864
  name: "Anthropic",
1065
865
  models: [
1066
866
  "claude-3-5-haiku-20241022",
867
+ "claude-3-5-haiku-latest",
1067
868
  "claude-3-5-sonnet-20240620",
1068
869
  "claude-3-5-sonnet-20241022",
1069
870
  "claude-3-7-sonnet-20250219",
871
+ "claude-3-7-sonnet-latest",
1070
872
  "claude-3-haiku-20240307",
1071
873
  "claude-3-opus-20240229",
1072
874
  "claude-3-sonnet-20240229",
875
+ "claude-haiku-4-5",
1073
876
  "claude-haiku-4-5-20251001",
877
+ "claude-opus-4-0",
878
+ "claude-opus-4-1",
1074
879
  "claude-opus-4-1-20250805",
1075
880
  "claude-opus-4-20250514",
881
+ "claude-sonnet-4-0",
1076
882
  "claude-sonnet-4-20250514",
883
+ "claude-sonnet-4-5",
1077
884
  "claude-sonnet-4-5-20250929"
1078
885
  ],
1079
886
  docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
1080
887
  gateway: "models.dev"
1081
888
  },
1082
- "fireworks-ai": {
1083
- url: "https://api.fireworks.ai/inference/v1/",
1084
- apiKeyEnvVar: "FIREWORKS_API_KEY",
889
+ moonshotai: {
890
+ url: "https://api.moonshot.ai/v1",
891
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
1085
892
  apiKeyHeader: "Authorization",
1086
- name: "Fireworks AI",
1087
- models: [
1088
- "accounts/fireworks/models/deepseek-r1-0528",
1089
- "accounts/fireworks/models/deepseek-v3-0324",
1090
- "accounts/fireworks/models/deepseek-v3p1",
1091
- "accounts/fireworks/models/glm-4p5",
1092
- "accounts/fireworks/models/glm-4p5-air",
1093
- "accounts/fireworks/models/gpt-oss-120b",
1094
- "accounts/fireworks/models/gpt-oss-20b",
1095
- "accounts/fireworks/models/kimi-k2-instruct",
1096
- "accounts/fireworks/models/qwen3-235b-a22b",
1097
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1098
- ],
1099
- docUrl: "https://fireworks.ai/docs/",
893
+ name: "Moonshot AI",
894
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
895
+ docUrl: "https://platform.moonshot.ai/docs/api/chat",
1100
896
  gateway: "models.dev"
1101
897
  },
1102
- modelscope: {
1103
- url: "https://api-inference.modelscope.cn/v1",
1104
- apiKeyEnvVar: "MODELSCOPE_API_KEY",
898
+ inference: {
899
+ url: "https://inference.net/v1",
900
+ apiKeyEnvVar: "INFERENCE_API_KEY",
1105
901
  apiKeyHeader: "Authorization",
1106
- name: "ModelScope",
902
+ name: "Inference",
1107
903
  models: [
1108
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1109
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1110
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1111
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1112
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1113
- "ZhipuAI/GLM-4.5"
904
+ "google/gemma-3",
905
+ "meta/llama-3.1-8b-instruct",
906
+ "meta/llama-3.2-11b-vision-instruct",
907
+ "meta/llama-3.2-1b-instruct",
908
+ "meta/llama-3.2-3b-instruct",
909
+ "mistral/mistral-nemo-12b-instruct",
910
+ "osmosis/osmosis-structure-0.6b",
911
+ "qwen/qwen-2.5-7b-vision-instruct",
912
+ "qwen/qwen3-embedding-4b"
1114
913
  ],
1115
- docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
914
+ docUrl: "https://inference.net/models",
1116
915
  gateway: "models.dev"
1117
916
  },
1118
- llama: {
1119
- url: "https://api.llama.com/compat/v1/",
1120
- apiKeyEnvVar: "LLAMA_API_KEY",
917
+ baseten: {
918
+ url: "https://inference.baseten.co/v1",
919
+ apiKeyEnvVar: "BASETEN_API_KEY",
1121
920
  apiKeyHeader: "Authorization",
1122
- name: "Llama",
921
+ name: "Baseten",
922
+ models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
923
+ docUrl: "https://docs.baseten.co/development/model-apis/overview",
924
+ gateway: "models.dev"
925
+ },
926
+ cortecs: {
927
+ url: "https://api.cortecs.ai/v1",
928
+ apiKeyEnvVar: "CORTECS_API_KEY",
929
+ apiKeyHeader: "Authorization",
930
+ name: "Cortecs",
1123
931
  models: [
1124
- "cerebras-llama-4-maverick-17b-128e-instruct",
1125
- "cerebras-llama-4-scout-17b-16e-instruct",
1126
- "groq-llama-4-maverick-17b-128e-instruct",
1127
- "llama-3.3-70b-instruct",
1128
- "llama-3.3-8b-instruct",
1129
- "llama-4-maverick-17b-128e-instruct-fp8",
1130
- "llama-4-scout-17b-16e-instruct-fp8"
932
+ "claude-4-5-sonnet",
933
+ "claude-sonnet-4",
934
+ "deepseek-v3-0324",
935
+ "gemini-2.5-pro",
936
+ "gpt-4.1",
937
+ "gpt-oss-120b",
938
+ "kimi-k2-instruct",
939
+ "llama-3.1-405b-instruct",
940
+ "nova-pro-v1",
941
+ "qwen3-32b",
942
+ "qwen3-coder-480b-a35b-instruct"
1131
943
  ],
1132
- docUrl: "https://llama.developer.meta.com/docs/models",
944
+ docUrl: "https://api.cortecs.ai/v1/models",
1133
945
  gateway: "models.dev"
1134
946
  },
1135
- cerebras: {
1136
- url: "https://api.cerebras.ai/v1",
1137
- apiKeyEnvVar: "CEREBRAS_API_KEY",
947
+ mistral: {
948
+ url: "https://api.mistral.ai/v1",
949
+ apiKeyEnvVar: "MISTRAL_API_KEY",
1138
950
  apiKeyHeader: "Authorization",
1139
- name: "Cerebras",
1140
- models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1141
- docUrl: "https://inference-docs.cerebras.ai/models/overview",
951
+ name: "Mistral",
952
+ models: [
953
+ "codestral-latest",
954
+ "devstral-medium-2507",
955
+ "devstral-small-2505",
956
+ "devstral-small-2507",
957
+ "magistral-medium-latest",
958
+ "magistral-small",
959
+ "ministral-3b-latest",
960
+ "ministral-8b-latest",
961
+ "mistral-large-latest",
962
+ "mistral-medium-2505",
963
+ "mistral-medium-2508",
964
+ "mistral-medium-latest",
965
+ "mistral-nemo",
966
+ "mistral-small-latest",
967
+ "open-mistral-7b",
968
+ "open-mixtral-8x22b",
969
+ "open-mixtral-8x7b",
970
+ "pixtral-12b",
971
+ "pixtral-large-latest"
972
+ ],
973
+ docUrl: "https://docs.mistral.ai/getting-started/models/",
1142
974
  gateway: "models.dev"
1143
975
  },
1144
- netlify: {
1145
- apiKeyEnvVar: ["NETLIFY_TOKEN", "NETLIFY_SITE_ID"],
976
+ venice: {
977
+ url: "https://api.venice.ai/api/v1",
978
+ apiKeyEnvVar: "VENICE_API_KEY",
1146
979
  apiKeyHeader: "Authorization",
1147
- name: "Netlify",
1148
- gateway: "netlify",
980
+ name: "Venice AI",
1149
981
  models: [
1150
- "anthropic/claude-3-5-haiku-20241022",
1151
- "anthropic/claude-3-5-haiku-latest",
1152
- "anthropic/claude-3-7-sonnet-20250219",
982
+ "deepseek-coder-v2-lite",
983
+ "deepseek-r1-671b",
984
+ "dolphin-2.9.2-qwen2-72b",
985
+ "llama-3.1-405b",
986
+ "llama-3.2-3b",
987
+ "llama-3.3-70b",
988
+ "mistral-31-24b",
989
+ "qwen-2.5-coder-32b",
990
+ "qwen-2.5-qwq-32b",
991
+ "qwen-2.5-vl",
992
+ "qwen3-235b",
993
+ "qwen3-4b",
994
+ "venice-uncensored"
995
+ ],
996
+ docUrl: "https://docs.venice.ai",
997
+ gateway: "models.dev"
998
+ },
999
+ alibaba: {
1000
+ url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
1001
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
1002
+ apiKeyHeader: "Authorization",
1003
+ name: "Alibaba",
1004
+ models: [
1005
+ "qvq-max",
1006
+ "qwen-flash",
1007
+ "qwen-max",
1008
+ "qwen-mt-plus",
1009
+ "qwen-mt-turbo",
1010
+ "qwen-omni-turbo",
1011
+ "qwen-omni-turbo-realtime",
1012
+ "qwen-plus",
1013
+ "qwen-plus-character-ja",
1014
+ "qwen-turbo",
1015
+ "qwen-vl-max",
1016
+ "qwen-vl-ocr",
1017
+ "qwen-vl-plus",
1018
+ "qwen2-5-14b-instruct",
1019
+ "qwen2-5-32b-instruct",
1020
+ "qwen2-5-72b-instruct",
1021
+ "qwen2-5-7b-instruct",
1022
+ "qwen2-5-omni-7b",
1023
+ "qwen2-5-vl-72b-instruct",
1024
+ "qwen2-5-vl-7b-instruct",
1025
+ "qwen3-14b",
1026
+ "qwen3-235b-a22b",
1027
+ "qwen3-32b",
1028
+ "qwen3-8b",
1029
+ "qwen3-asr-flash",
1030
+ "qwen3-coder-30b-a3b-instruct",
1031
+ "qwen3-coder-480b-a35b-instruct",
1032
+ "qwen3-coder-flash",
1033
+ "qwen3-coder-plus",
1034
+ "qwen3-livetranslate-flash-realtime",
1035
+ "qwen3-max",
1036
+ "qwen3-next-80b-a3b-instruct",
1037
+ "qwen3-next-80b-a3b-thinking",
1038
+ "qwen3-omni-flash",
1039
+ "qwen3-omni-flash-realtime",
1040
+ "qwen3-vl-235b-a22b",
1041
+ "qwen3-vl-30b-a3b",
1042
+ "qwen3-vl-plus",
1043
+ "qwq-plus"
1044
+ ],
1045
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
1046
+ gateway: "models.dev"
1047
+ },
1048
+ "alibaba-cn": {
1049
+ url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
1050
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
1051
+ apiKeyHeader: "Authorization",
1052
+ name: "Alibaba (China)",
1053
+ models: [
1054
+ "deepseek-r1",
1055
+ "deepseek-r1-0528",
1056
+ "deepseek-r1-distill-llama-70b",
1057
+ "deepseek-r1-distill-llama-8b",
1058
+ "deepseek-r1-distill-qwen-1-5b",
1059
+ "deepseek-r1-distill-qwen-14b",
1060
+ "deepseek-r1-distill-qwen-32b",
1061
+ "deepseek-r1-distill-qwen-7b",
1062
+ "deepseek-v3",
1063
+ "deepseek-v3-1",
1064
+ "deepseek-v3-2-exp",
1065
+ "moonshot-kimi-k2-instruct",
1066
+ "qvq-max",
1067
+ "qwen-deep-research",
1068
+ "qwen-doc-turbo",
1069
+ "qwen-flash",
1070
+ "qwen-long",
1071
+ "qwen-math-plus",
1072
+ "qwen-math-turbo",
1073
+ "qwen-max",
1074
+ "qwen-mt-plus",
1075
+ "qwen-mt-turbo",
1076
+ "qwen-omni-turbo",
1077
+ "qwen-omni-turbo-realtime",
1078
+ "qwen-plus",
1079
+ "qwen-plus-character",
1080
+ "qwen-turbo",
1081
+ "qwen-vl-max",
1082
+ "qwen-vl-ocr",
1083
+ "qwen-vl-plus",
1084
+ "qwen2-5-14b-instruct",
1085
+ "qwen2-5-32b-instruct",
1086
+ "qwen2-5-72b-instruct",
1087
+ "qwen2-5-7b-instruct",
1088
+ "qwen2-5-coder-32b-instruct",
1089
+ "qwen2-5-coder-7b-instruct",
1090
+ "qwen2-5-math-72b-instruct",
1091
+ "qwen2-5-math-7b-instruct",
1092
+ "qwen2-5-omni-7b",
1093
+ "qwen2-5-vl-72b-instruct",
1094
+ "qwen2-5-vl-7b-instruct",
1095
+ "qwen3-14b",
1096
+ "qwen3-235b-a22b",
1097
+ "qwen3-32b",
1098
+ "qwen3-8b",
1099
+ "qwen3-asr-flash",
1100
+ "qwen3-coder-30b-a3b-instruct",
1101
+ "qwen3-coder-480b-a35b-instruct",
1102
+ "qwen3-coder-flash",
1103
+ "qwen3-coder-plus",
1104
+ "qwen3-max",
1105
+ "qwen3-next-80b-a3b-instruct",
1106
+ "qwen3-next-80b-a3b-thinking",
1107
+ "qwen3-omni-flash",
1108
+ "qwen3-omni-flash-realtime",
1109
+ "qwen3-vl-235b-a22b",
1110
+ "qwen3-vl-30b-a3b",
1111
+ "qwen3-vl-plus",
1112
+ "qwq-32b",
1113
+ "qwq-plus",
1114
+ "tongyi-intent-detect-v3"
1115
+ ],
1116
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
1117
+ gateway: "models.dev"
1118
+ },
1119
+ chutes: {
1120
+ url: "https://llm.chutes.ai/v1",
1121
+ apiKeyEnvVar: "CHUTES_API_KEY",
1122
+ apiKeyHeader: "Authorization",
1123
+ name: "Chutes",
1124
+ models: [
1125
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1126
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1127
+ "Qwen/Qwen3-30B-A3B",
1128
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1129
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1130
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1131
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1132
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1133
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1134
+ "chutesai/Devstral-Small-2505",
1135
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1136
+ "deepseek-ai/DeepSeek-R1-0528",
1137
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1138
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1139
+ "deepseek-ai/DeepSeek-V3-0324",
1140
+ "deepseek-ai/DeepSeek-V3.1",
1141
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1142
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1143
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1144
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1145
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1146
+ "moonshotai/Kimi-Dev-72B",
1147
+ "moonshotai/Kimi-K2-Instruct-0905",
1148
+ "moonshotai/Kimi-K2-Instruct-75k",
1149
+ "moonshotai/Kimi-VL-A3B-Thinking",
1150
+ "openai/gpt-oss-120b",
1151
+ "tngtech/DeepSeek-R1T-Chimera",
1152
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1153
+ "zai-org/GLM-4.5-Air",
1154
+ "zai-org/GLM-4.5-FP8",
1155
+ "zai-org/GLM-4.5-turbo",
1156
+ "zai-org/GLM-4.6-FP8",
1157
+ "zai-org/GLM-4.6-turbo"
1158
+ ],
1159
+ docUrl: "https://llm.chutes.ai/v1/models",
1160
+ gateway: "models.dev"
1161
+ },
1162
+ upstage: {
1163
+ url: "https://api.upstage.ai",
1164
+ apiKeyEnvVar: "UPSTAGE_API_KEY",
1165
+ apiKeyHeader: "Authorization",
1166
+ name: "Upstage",
1167
+ models: ["solar-mini", "solar-pro2"],
1168
+ docUrl: "https://developers.upstage.ai/docs/apis/chat",
1169
+ gateway: "models.dev"
1170
+ },
1171
+ netlify: {
1172
+ apiKeyEnvVar: ["NETLIFY_TOKEN", "NETLIFY_SITE_ID"],
1173
+ apiKeyHeader: "Authorization",
1174
+ name: "Netlify",
1175
+ gateway: "netlify",
1176
+ models: [
1177
+ "anthropic/claude-3-5-haiku-20241022",
1178
+ "anthropic/claude-3-5-haiku-latest",
1179
+ "anthropic/claude-3-7-sonnet-20250219",
1153
1180
  "anthropic/claude-3-7-sonnet-latest",
1154
1181
  "anthropic/claude-3-haiku-20240307",
1155
1182
  "anthropic/claude-haiku-4-5-20251001",
@@ -1186,51 +1213,58 @@ var provider_registry_default = {
1186
1213
  }
1187
1214
  },
1188
1215
  models: {
1189
- "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1216
+ nvidia: [
1217
+ "black-forest-labs/flux.1-dev",
1218
+ "deepseek-ai/deepseek-v3.1",
1219
+ "deepseek-ai/deepseek-v3.1-terminus",
1220
+ "google/gemma-3-27b-it",
1221
+ "microsoft/phi-4-mini-instruct",
1222
+ "moonshotai/kimi-k2-instruct",
1223
+ "moonshotai/kimi-k2-instruct-0905",
1224
+ "nvidia/cosmos-nemotron-34b",
1225
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
1226
+ "nvidia/nemoretriever-ocr-v1",
1227
+ "nvidia/parakeet-tdt-0.6b-v2",
1228
+ "openai/gpt-oss-120b",
1229
+ "openai/whisper-large-v3",
1230
+ "qwen/qwen3-235b-a22b",
1231
+ "qwen/qwen3-coder-480b-a35b-instruct"
1232
+ ],
1233
+ modelscope: [
1234
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1235
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1236
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1237
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1238
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1239
+ "ZhipuAI/GLM-4.5",
1240
+ "ZhipuAI/GLM-4.6"
1241
+ ],
1242
+ aihubmix: [
1243
+ "DeepSeek-V3.2-Exp",
1244
+ "DeepSeek-V3.2-Exp-Think",
1245
+ "Kimi-K2-0905",
1246
+ "claude-haiku-4-5",
1247
+ "claude-opus-4-1",
1248
+ "claude-sonnet-4-5",
1249
+ "gemini-2.5-flash",
1250
+ "gemini-2.5-pro",
1251
+ "glm-4.6",
1252
+ "gpt-4.1",
1253
+ "gpt-4.1-mini",
1254
+ "gpt-4.1-nano",
1255
+ "gpt-4o",
1256
+ "gpt-4o-2024-11-20",
1257
+ "gpt-5",
1258
+ "gpt-5-codex",
1259
+ "gpt-5-mini",
1260
+ "gpt-5-nano",
1261
+ "gpt-5-pro",
1262
+ "o4-mini",
1263
+ "qwen3-235b-a22b-instruct-2507",
1264
+ "qwen3-235b-a22b-thinking-2507",
1265
+ "qwen3-coder-480b-a35b-instruct"
1266
+ ],
1190
1267
  lucidquery: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1191
- moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1192
- "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1193
- alibaba: [
1194
- "qvq-max",
1195
- "qwen-flash",
1196
- "qwen-max",
1197
- "qwen-mt-plus",
1198
- "qwen-mt-turbo",
1199
- "qwen-omni-turbo",
1200
- "qwen-omni-turbo-realtime",
1201
- "qwen-plus",
1202
- "qwen-plus-character-ja",
1203
- "qwen-turbo",
1204
- "qwen-vl-max",
1205
- "qwen-vl-ocr",
1206
- "qwen-vl-plus",
1207
- "qwen2-5-14b-instruct",
1208
- "qwen2-5-32b-instruct",
1209
- "qwen2-5-72b-instruct",
1210
- "qwen2-5-7b-instruct",
1211
- "qwen2-5-omni-7b",
1212
- "qwen2-5-vl-72b-instruct",
1213
- "qwen2-5-vl-7b-instruct",
1214
- "qwen3-14b",
1215
- "qwen3-235b-a22b",
1216
- "qwen3-32b",
1217
- "qwen3-8b",
1218
- "qwen3-asr-flash",
1219
- "qwen3-coder-30b-a3b-instruct",
1220
- "qwen3-coder-480b-a35b-instruct",
1221
- "qwen3-coder-flash",
1222
- "qwen3-coder-plus",
1223
- "qwen3-livetranslate-flash-realtime",
1224
- "qwen3-max",
1225
- "qwen3-next-80b-a3b-instruct",
1226
- "qwen3-next-80b-a3b-thinking",
1227
- "qwen3-omni-flash",
1228
- "qwen3-omni-flash-realtime",
1229
- "qwen3-vl-235b-a22b",
1230
- "qwen3-vl-30b-a3b",
1231
- "qwen3-vl-plus",
1232
- "qwq-plus"
1233
- ],
1234
1268
  xai: [
1235
1269
  "grok-2",
1236
1270
  "grok-2-1212",
@@ -1253,293 +1287,370 @@ var provider_registry_default = {
1253
1287
  "grok-code-fast-1",
1254
1288
  "grok-vision-beta"
1255
1289
  ],
1256
- nvidia: [
1257
- "black-forest-labs/flux.1-dev",
1258
- "deepseek-ai/deepseek-v3.1",
1259
- "google/gemma-3-27b-it",
1260
- "microsoft/phi-4-mini-instruct",
1290
+ deepseek: ["deepseek-chat", "deepseek-reasoner"],
1291
+ requesty: [
1292
+ "anthropic/claude-3-7-sonnet",
1293
+ "anthropic/claude-4-sonnet-20250522",
1294
+ "anthropic/claude-opus-4",
1295
+ "anthropic/claude-opus-4-1-20250805",
1296
+ "google/gemini-2.5-flash",
1297
+ "google/gemini-2.5-pro",
1298
+ "openai/gpt-4.1",
1299
+ "openai/gpt-4.1-mini",
1300
+ "openai/gpt-4o-mini",
1301
+ "openai/gpt-5",
1302
+ "openai/gpt-5-mini",
1303
+ "openai/gpt-5-nano",
1304
+ "openai/o4-mini"
1305
+ ],
1306
+ nebius: [
1307
+ "NousResearch/hermes-4-405b",
1308
+ "NousResearch/hermes-4-70b",
1309
+ "deepseek-ai/deepseek-v3",
1310
+ "meta-llama/llama-3.3-70b-instruct-base",
1311
+ "meta-llama/llama-3.3-70b-instruct-fast",
1312
+ "meta-llama/llama-3_1-405b-instruct",
1261
1313
  "moonshotai/kimi-k2-instruct",
1262
- "moonshotai/kimi-k2-instruct-0905",
1263
- "nvidia/cosmos-nemotron-34b",
1264
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
1265
- "nvidia/nemoretriever-ocr-v1",
1266
- "nvidia/parakeet-tdt-0.6b-v2",
1314
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1267
1315
  "openai/gpt-oss-120b",
1268
- "openai/whisper-large-v3",
1269
- "qwen/qwen3-235b-a22b",
1270
- "qwen/qwen3-coder-480b-a35b-instruct"
1316
+ "openai/gpt-oss-20b",
1317
+ "qwen/qwen3-235b-a22b-instruct-2507",
1318
+ "qwen/qwen3-235b-a22b-thinking-2507",
1319
+ "qwen/qwen3-coder-480b-a35b-instruct",
1320
+ "zai-org/glm-4.5",
1321
+ "zai-org/glm-4.5-air"
1271
1322
  ],
1272
- upstage: ["solar-mini", "solar-pro2"],
1273
- groq: [
1274
- "deepseek-r1-distill-llama-70b",
1275
- "gemma2-9b-it",
1276
- "llama-3.1-8b-instant",
1277
- "llama-3.3-70b-versatile",
1278
- "llama-guard-3-8b",
1279
- "llama3-70b-8192",
1280
- "llama3-8b-8192",
1281
- "meta-llama/llama-4-maverick-17b-128e-instruct",
1282
- "meta-llama/llama-4-scout-17b-16e-instruct",
1283
- "meta-llama/llama-guard-4-12b",
1284
- "mistral-saba-24b",
1285
- "moonshotai/kimi-k2-instruct",
1286
- "moonshotai/kimi-k2-instruct-0905",
1323
+ fastrouter: [
1324
+ "anthropic/claude-opus-4.1",
1325
+ "anthropic/claude-sonnet-4",
1326
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
1327
+ "google/gemini-2.5-flash",
1328
+ "google/gemini-2.5-pro",
1329
+ "moonshotai/kimi-k2",
1330
+ "openai/gpt-4.1",
1331
+ "openai/gpt-5",
1332
+ "openai/gpt-5-mini",
1333
+ "openai/gpt-5-nano",
1287
1334
  "openai/gpt-oss-120b",
1288
1335
  "openai/gpt-oss-20b",
1289
- "qwen-qwq-32b",
1290
- "qwen/qwen3-32b"
1336
+ "qwen/qwen3-coder",
1337
+ "x-ai/grok-4"
1291
1338
  ],
1292
- mistral: [
1293
- "codestral-latest",
1294
- "devstral-medium-2507",
1295
- "devstral-small-2505",
1296
- "devstral-small-2507",
1297
- "magistral-medium-latest",
1298
- "magistral-small",
1299
- "ministral-3b-latest",
1300
- "ministral-8b-latest",
1301
- "mistral-large-latest",
1302
- "mistral-medium-2505",
1303
- "mistral-medium-2508",
1304
- "mistral-medium-latest",
1305
- "mistral-nemo",
1306
- "mistral-small-latest",
1307
- "open-mistral-7b",
1308
- "open-mixtral-8x22b",
1309
- "open-mixtral-8x7b",
1310
- "pixtral-12b",
1311
- "pixtral-large-latest"
1339
+ perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1340
+ morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1341
+ "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1342
+ huggingface: [
1343
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1344
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1345
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1346
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1347
+ "deepseek-ai/DeepSeek-R1-0528",
1348
+ "deepseek-ai/Deepseek-V3-0324",
1349
+ "moonshotai/Kimi-K2-Instruct",
1350
+ "moonshotai/Kimi-K2-Instruct-0905",
1351
+ "zai-org/GLM-4.5",
1352
+ "zai-org/GLM-4.5-Air",
1353
+ "zai-org/GLM-4.6"
1312
1354
  ],
1313
- vercel: [
1314
- "alibaba/qwen3-coder-plus",
1315
- "alibaba/qwen3-max",
1316
- "alibaba/qwen3-next-80b-a3b-instruct",
1317
- "alibaba/qwen3-next-80b-a3b-thinking",
1318
- "alibaba/qwen3-vl-instruct",
1319
- "alibaba/qwen3-vl-thinking",
1320
- "amazon/nova-lite",
1321
- "amazon/nova-micro",
1322
- "amazon/nova-pro",
1323
- "anthropic/claude-3-5-haiku",
1324
- "anthropic/claude-3-haiku",
1325
- "anthropic/claude-3-opus",
1326
- "anthropic/claude-3.5-sonnet",
1355
+ openrouter: [
1356
+ "anthropic/claude-3.5-haiku",
1327
1357
  "anthropic/claude-3.7-sonnet",
1328
- "anthropic/claude-4-1-opus",
1329
- "anthropic/claude-4-opus",
1330
- "anthropic/claude-4-sonnet",
1331
- "anthropic/claude-4.5-sonnet",
1332
1358
  "anthropic/claude-haiku-4.5",
1333
- "cerebras/qwen3-coder",
1334
- "deepseek/deepseek-r1",
1359
+ "anthropic/claude-opus-4",
1360
+ "anthropic/claude-opus-4.1",
1361
+ "anthropic/claude-sonnet-4",
1362
+ "anthropic/claude-sonnet-4.5",
1363
+ "cognitivecomputations/dolphin3.0-mistral-24b",
1364
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
1365
+ "deepseek/deepseek-chat-v3-0324",
1366
+ "deepseek/deepseek-chat-v3.1",
1367
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
1368
+ "deepseek/deepseek-r1-0528:free",
1335
1369
  "deepseek/deepseek-r1-distill-llama-70b",
1370
+ "deepseek/deepseek-r1-distill-qwen-14b",
1371
+ "deepseek/deepseek-r1:free",
1372
+ "deepseek/deepseek-v3-base:free",
1336
1373
  "deepseek/deepseek-v3.1-terminus",
1337
- "deepseek/deepseek-v3.2-exp",
1338
- "deepseek/deepseek-v3.2-exp-thinking",
1339
- "google/gemini-2.0-flash",
1340
- "google/gemini-2.0-flash-lite",
1374
+ "featherless/qwerky-72b",
1375
+ "google/gemini-2.0-flash-001",
1376
+ "google/gemini-2.0-flash-exp:free",
1341
1377
  "google/gemini-2.5-flash",
1342
1378
  "google/gemini-2.5-flash-lite",
1343
1379
  "google/gemini-2.5-flash-lite-preview-09-2025",
1344
1380
  "google/gemini-2.5-flash-preview-09-2025",
1345
1381
  "google/gemini-2.5-pro",
1346
- "meta/llama-3.3-70b",
1347
- "meta/llama-4-maverick",
1348
- "meta/llama-4-scout",
1349
- "mistral/codestral",
1350
- "mistral/magistral-medium",
1351
- "mistral/magistral-small",
1352
- "mistral/ministral-3b",
1353
- "mistral/ministral-8b",
1354
- "mistral/mistral-large",
1355
- "mistral/mistral-small",
1356
- "mistral/mixtral-8x22b-instruct",
1357
- "mistral/pixtral-12b",
1358
- "mistral/pixtral-large",
1382
+ "google/gemini-2.5-pro-preview-05-06",
1383
+ "google/gemini-2.5-pro-preview-06-05",
1384
+ "google/gemma-2-9b-it:free",
1385
+ "google/gemma-3-12b-it",
1386
+ "google/gemma-3-27b-it",
1387
+ "google/gemma-3n-e4b-it",
1388
+ "google/gemma-3n-e4b-it:free",
1389
+ "meta-llama/llama-3.2-11b-vision-instruct",
1390
+ "meta-llama/llama-3.3-70b-instruct:free",
1391
+ "meta-llama/llama-4-scout:free",
1392
+ "microsoft/mai-ds-r1:free",
1393
+ "mistralai/codestral-2508",
1394
+ "mistralai/devstral-medium-2507",
1395
+ "mistralai/devstral-small-2505",
1396
+ "mistralai/devstral-small-2505:free",
1397
+ "mistralai/devstral-small-2507",
1398
+ "mistralai/mistral-7b-instruct:free",
1399
+ "mistralai/mistral-medium-3",
1400
+ "mistralai/mistral-medium-3.1",
1401
+ "mistralai/mistral-nemo:free",
1402
+ "mistralai/mistral-small-3.1-24b-instruct",
1403
+ "mistralai/mistral-small-3.2-24b-instruct",
1404
+ "mistralai/mistral-small-3.2-24b-instruct:free",
1405
+ "moonshotai/kimi-dev-72b:free",
1359
1406
  "moonshotai/kimi-k2",
1360
- "morph/morph-v3-fast",
1361
- "morph/morph-v3-large",
1362
- "openai/gpt-4-turbo",
1407
+ "moonshotai/kimi-k2-0905",
1408
+ "moonshotai/kimi-k2:free",
1409
+ "nousresearch/deephermes-3-llama-3-8b-preview",
1410
+ "nousresearch/hermes-4-405b",
1411
+ "nousresearch/hermes-4-70b",
1363
1412
  "openai/gpt-4.1",
1364
1413
  "openai/gpt-4.1-mini",
1365
- "openai/gpt-4.1-nano",
1366
- "openai/gpt-4o",
1367
1414
  "openai/gpt-4o-mini",
1368
1415
  "openai/gpt-5",
1416
+ "openai/gpt-5-chat",
1369
1417
  "openai/gpt-5-codex",
1418
+ "openai/gpt-5-image",
1370
1419
  "openai/gpt-5-mini",
1371
1420
  "openai/gpt-5-nano",
1372
1421
  "openai/gpt-oss-120b",
1373
1422
  "openai/gpt-oss-20b",
1374
- "openai/o1",
1375
- "openai/o3",
1376
- "openai/o3-mini",
1377
1423
  "openai/o4-mini",
1378
- "perplexity/sonar",
1379
- "perplexity/sonar-pro",
1380
- "perplexity/sonar-reasoning",
1381
- "perplexity/sonar-reasoning-pro",
1382
- "vercel/v0-1.0-md",
1383
- "vercel/v0-1.5-md",
1384
- "xai/grok-2",
1385
- "xai/grok-2-vision",
1386
- "xai/grok-3",
1387
- "xai/grok-3-fast",
1388
- "xai/grok-3-mini",
1389
- "xai/grok-3-mini-fast",
1390
- "xai/grok-4",
1391
- "xai/grok-4-fast",
1392
- "xai/grok-4-fast-non-reasoning",
1393
- "xai/grok-code-fast-1",
1394
- "zai/glm-4.5",
1395
- "zai/glm-4.5-air",
1396
- "zai/glm-4.5v",
1397
- "zai/glm-4.6"
1398
- ],
1399
- nebius: [
1400
- "NousResearch/hermes-4-405b",
1401
- "NousResearch/hermes-4-70b",
1402
- "deepseek-ai/deepseek-v3",
1403
- "meta-llama/llama-3.3-70b-instruct-base",
1404
- "meta-llama/llama-3.3-70b-instruct-fast",
1405
- "meta-llama/llama-3_1-405b-instruct",
1406
- "moonshotai/kimi-k2-instruct",
1407
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1408
- "openai/gpt-oss-120b",
1409
- "openai/gpt-oss-20b",
1410
- "qwen/qwen3-235b-a22b-instruct-2507",
1424
+ "openrouter/cypher-alpha:free",
1425
+ "openrouter/horizon-alpha",
1426
+ "openrouter/horizon-beta",
1427
+ "openrouter/sonoma-dusk-alpha",
1428
+ "openrouter/sonoma-sky-alpha",
1429
+ "qwen/qwen-2.5-coder-32b-instruct",
1430
+ "qwen/qwen2.5-vl-32b-instruct:free",
1431
+ "qwen/qwen2.5-vl-72b-instruct",
1432
+ "qwen/qwen2.5-vl-72b-instruct:free",
1433
+ "qwen/qwen3-14b:free",
1434
+ "qwen/qwen3-235b-a22b-07-25",
1435
+ "qwen/qwen3-235b-a22b-07-25:free",
1411
1436
  "qwen/qwen3-235b-a22b-thinking-2507",
1412
- "qwen/qwen3-coder-480b-a35b-instruct",
1413
- "zai-org/glm-4.5",
1414
- "zai-org/glm-4.5-air"
1415
- ],
1416
- deepseek: ["deepseek-chat", "deepseek-reasoner"],
1417
- "alibaba-cn": [
1418
- "deepseek-r1",
1419
- "deepseek-r1-0528",
1420
- "deepseek-r1-distill-llama-70b",
1421
- "deepseek-r1-distill-llama-8b",
1422
- "deepseek-r1-distill-qwen-1-5b",
1423
- "deepseek-r1-distill-qwen-14b",
1424
- "deepseek-r1-distill-qwen-32b",
1425
- "deepseek-r1-distill-qwen-7b",
1426
- "deepseek-v3",
1427
- "deepseek-v3-1",
1428
- "deepseek-v3-2-exp",
1429
- "moonshot-kimi-k2-instruct",
1430
- "qvq-max",
1431
- "qwen-deep-research",
1432
- "qwen-doc-turbo",
1433
- "qwen-flash",
1434
- "qwen-long",
1435
- "qwen-math-plus",
1436
- "qwen-math-turbo",
1437
- "qwen-max",
1438
- "qwen-mt-plus",
1439
- "qwen-mt-turbo",
1440
- "qwen-omni-turbo",
1441
- "qwen-omni-turbo-realtime",
1442
- "qwen-plus",
1443
- "qwen-plus-character",
1444
- "qwen-turbo",
1445
- "qwen-vl-max",
1446
- "qwen-vl-ocr",
1447
- "qwen-vl-plus",
1448
- "qwen2-5-14b-instruct",
1449
- "qwen2-5-32b-instruct",
1450
- "qwen2-5-72b-instruct",
1451
- "qwen2-5-7b-instruct",
1452
- "qwen2-5-coder-32b-instruct",
1453
- "qwen2-5-coder-7b-instruct",
1454
- "qwen2-5-math-72b-instruct",
1455
- "qwen2-5-math-7b-instruct",
1456
- "qwen2-5-omni-7b",
1457
- "qwen2-5-vl-72b-instruct",
1458
- "qwen2-5-vl-7b-instruct",
1459
- "qwen3-14b",
1460
- "qwen3-235b-a22b",
1461
- "qwen3-32b",
1462
- "qwen3-8b",
1463
- "qwen3-asr-flash",
1464
- "qwen3-coder-30b-a3b-instruct",
1465
- "qwen3-coder-480b-a35b-instruct",
1466
- "qwen3-coder-flash",
1467
- "qwen3-coder-plus",
1468
- "qwen3-max",
1469
- "qwen3-next-80b-a3b-instruct",
1470
- "qwen3-next-80b-a3b-thinking",
1471
- "qwen3-omni-flash",
1472
- "qwen3-omni-flash-realtime",
1473
- "qwen3-vl-235b-a22b",
1474
- "qwen3-vl-30b-a3b",
1475
- "qwen3-vl-plus",
1476
- "qwq-32b",
1477
- "qwq-plus",
1478
- "tongyi-intent-detect-v3"
1437
+ "qwen/qwen3-235b-a22b:free",
1438
+ "qwen/qwen3-30b-a3b-instruct-2507",
1439
+ "qwen/qwen3-30b-a3b-thinking-2507",
1440
+ "qwen/qwen3-30b-a3b:free",
1441
+ "qwen/qwen3-32b:free",
1442
+ "qwen/qwen3-8b:free",
1443
+ "qwen/qwen3-coder",
1444
+ "qwen/qwen3-coder:free",
1445
+ "qwen/qwen3-max",
1446
+ "qwen/qwen3-next-80b-a3b-instruct",
1447
+ "qwen/qwen3-next-80b-a3b-thinking",
1448
+ "qwen/qwq-32b:free",
1449
+ "rekaai/reka-flash-3",
1450
+ "sarvamai/sarvam-m:free",
1451
+ "thudm/glm-z1-32b:free",
1452
+ "tngtech/deepseek-r1t2-chimera:free",
1453
+ "x-ai/grok-3",
1454
+ "x-ai/grok-3-beta",
1455
+ "x-ai/grok-3-mini",
1456
+ "x-ai/grok-3-mini-beta",
1457
+ "x-ai/grok-4",
1458
+ "x-ai/grok-4-fast",
1459
+ "x-ai/grok-4-fast:free",
1460
+ "x-ai/grok-code-fast-1",
1461
+ "z-ai/glm-4.5",
1462
+ "z-ai/glm-4.5-air",
1463
+ "z-ai/glm-4.5-air:free",
1464
+ "z-ai/glm-4.5v",
1465
+ "z-ai/glm-4.6"
1479
1466
  ],
1480
- venice: [
1481
- "deepseek-coder-v2-lite",
1482
- "deepseek-r1-671b",
1483
- "dolphin-2.9.2-qwen2-72b",
1484
- "llama-3.1-405b",
1485
- "llama-3.2-3b",
1486
- "llama-3.3-70b",
1487
- "mistral-31-24b",
1488
- "qwen-2.5-coder-32b",
1489
- "qwen-2.5-qwq-32b",
1490
- "qwen-2.5-vl",
1491
- "qwen3-235b",
1492
- "qwen3-4b",
1493
- "venice-uncensored"
1467
+ cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1468
+ zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1469
+ togetherai: [
1470
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1471
+ "deepseek-ai/DeepSeek-R1",
1472
+ "deepseek-ai/DeepSeek-V3",
1473
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1474
+ "moonshotai/Kimi-K2-Instruct",
1475
+ "openai/gpt-oss-120b"
1494
1476
  ],
1495
- chutes: [
1477
+ wandb: [
1496
1478
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1497
1479
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1498
- "Qwen/Qwen3-30B-A3B",
1499
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1500
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1501
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1502
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1503
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1504
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1505
- "chutesai/Devstral-Small-2505",
1506
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1480
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1507
1481
  "deepseek-ai/DeepSeek-R1-0528",
1508
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1509
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1510
1482
  "deepseek-ai/DeepSeek-V3-0324",
1511
- "deepseek-ai/DeepSeek-V3.1",
1512
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1513
- "deepseek-ai/DeepSeek-V3.1-turbo",
1514
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1515
- "deepseek-ai/DeepSeek-V3.2-Exp",
1516
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1517
- "moonshotai/Kimi-Dev-72B",
1518
- "moonshotai/Kimi-K2-Instruct-0905",
1519
- "moonshotai/Kimi-K2-Instruct-75k",
1520
- "moonshotai/Kimi-VL-A3B-Thinking",
1483
+ "meta-llama/Llama-3.1-8B-Instruct",
1484
+ "meta-llama/Llama-3.3-70B-Instruct",
1485
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1486
+ "microsoft/Phi-4-mini-instruct",
1487
+ "moonshotai/Kimi-K2-Instruct"
1488
+ ],
1489
+ submodel: [
1490
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1491
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1492
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1493
+ "deepseek-ai/DeepSeek-R1-0528",
1494
+ "deepseek-ai/DeepSeek-V3-0324",
1495
+ "deepseek-ai/DeepSeek-V3.1",
1521
1496
  "openai/gpt-oss-120b",
1522
- "tngtech/DeepSeek-R1T-Chimera",
1523
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1524
1497
  "zai-org/GLM-4.5-Air",
1525
- "zai-org/GLM-4.5-FP8",
1526
- "zai-org/GLM-4.5-turbo",
1527
- "zai-org/GLM-4.6-FP8",
1528
- "zai-org/GLM-4.6-turbo"
1498
+ "zai-org/GLM-4.5-FP8"
1529
1499
  ],
1530
- cortecs: [
1531
- "claude-4-5-sonnet",
1532
- "claude-sonnet-4",
1533
- "deepseek-v3-0324",
1500
+ vercel: [
1501
+ "alibaba/qwen3-coder-plus",
1502
+ "alibaba/qwen3-max",
1503
+ "alibaba/qwen3-next-80b-a3b-instruct",
1504
+ "alibaba/qwen3-next-80b-a3b-thinking",
1505
+ "alibaba/qwen3-vl-instruct",
1506
+ "alibaba/qwen3-vl-thinking",
1507
+ "amazon/nova-lite",
1508
+ "amazon/nova-micro",
1509
+ "amazon/nova-pro",
1510
+ "anthropic/claude-3-5-haiku",
1511
+ "anthropic/claude-3-haiku",
1512
+ "anthropic/claude-3-opus",
1513
+ "anthropic/claude-3.5-sonnet",
1514
+ "anthropic/claude-3.7-sonnet",
1515
+ "anthropic/claude-4-1-opus",
1516
+ "anthropic/claude-4-opus",
1517
+ "anthropic/claude-4-sonnet",
1518
+ "anthropic/claude-4.5-sonnet",
1519
+ "anthropic/claude-haiku-4.5",
1520
+ "cerebras/qwen3-coder",
1521
+ "deepseek/deepseek-r1",
1522
+ "deepseek/deepseek-r1-distill-llama-70b",
1523
+ "deepseek/deepseek-v3.1-terminus",
1524
+ "deepseek/deepseek-v3.2-exp",
1525
+ "deepseek/deepseek-v3.2-exp-thinking",
1526
+ "google/gemini-2.0-flash",
1527
+ "google/gemini-2.0-flash-lite",
1528
+ "google/gemini-2.5-flash",
1529
+ "google/gemini-2.5-flash-lite",
1530
+ "google/gemini-2.5-flash-lite-preview-09-2025",
1531
+ "google/gemini-2.5-flash-preview-09-2025",
1532
+ "google/gemini-2.5-pro",
1533
+ "meta/llama-3.3-70b",
1534
+ "meta/llama-4-maverick",
1535
+ "meta/llama-4-scout",
1536
+ "mistral/codestral",
1537
+ "mistral/magistral-medium",
1538
+ "mistral/magistral-small",
1539
+ "mistral/ministral-3b",
1540
+ "mistral/ministral-8b",
1541
+ "mistral/mistral-large",
1542
+ "mistral/mistral-small",
1543
+ "mistral/mixtral-8x22b-instruct",
1544
+ "mistral/pixtral-12b",
1545
+ "mistral/pixtral-large",
1546
+ "moonshotai/kimi-k2",
1547
+ "morph/morph-v3-fast",
1548
+ "morph/morph-v3-large",
1549
+ "openai/gpt-4-turbo",
1550
+ "openai/gpt-4.1",
1551
+ "openai/gpt-4.1-mini",
1552
+ "openai/gpt-4.1-nano",
1553
+ "openai/gpt-4o",
1554
+ "openai/gpt-4o-mini",
1555
+ "openai/gpt-5",
1556
+ "openai/gpt-5-codex",
1557
+ "openai/gpt-5-mini",
1558
+ "openai/gpt-5-nano",
1559
+ "openai/gpt-oss-120b",
1560
+ "openai/gpt-oss-20b",
1561
+ "openai/o1",
1562
+ "openai/o3",
1563
+ "openai/o3-mini",
1564
+ "openai/o4-mini",
1565
+ "perplexity/sonar",
1566
+ "perplexity/sonar-pro",
1567
+ "perplexity/sonar-reasoning",
1568
+ "perplexity/sonar-reasoning-pro",
1569
+ "vercel/v0-1.0-md",
1570
+ "vercel/v0-1.5-md",
1571
+ "xai/grok-2",
1572
+ "xai/grok-2-vision",
1573
+ "xai/grok-3",
1574
+ "xai/grok-3-fast",
1575
+ "xai/grok-3-mini",
1576
+ "xai/grok-3-mini-fast",
1577
+ "xai/grok-4",
1578
+ "xai/grok-4-fast",
1579
+ "xai/grok-4-fast-non-reasoning",
1580
+ "xai/grok-code-fast-1",
1581
+ "zai/glm-4.5",
1582
+ "zai/glm-4.5-air",
1583
+ "zai/glm-4.5v",
1584
+ "zai/glm-4.6"
1585
+ ],
1586
+ synthetic: [
1587
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
1588
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
1589
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
1590
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
1591
+ "hf:deepseek-ai/DeepSeek-R1",
1592
+ "hf:deepseek-ai/DeepSeek-R1-0528",
1593
+ "hf:deepseek-ai/DeepSeek-V3",
1594
+ "hf:deepseek-ai/DeepSeek-V3-0324",
1595
+ "hf:deepseek-ai/DeepSeek-V3.1",
1596
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
1597
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
1598
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
1599
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
1600
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
1601
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
1602
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
1603
+ "hf:moonshotai/Kimi-K2-Instruct",
1604
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
1605
+ "hf:openai/gpt-oss-120b",
1606
+ "hf:zai-org/GLM-4.5",
1607
+ "hf:zai-org/GLM-4.6"
1608
+ ],
1609
+ google: [
1610
+ "gemini-1.5-flash",
1611
+ "gemini-1.5-flash-8b",
1612
+ "gemini-1.5-pro",
1613
+ "gemini-2.0-flash",
1614
+ "gemini-2.0-flash-lite",
1615
+ "gemini-2.5-flash",
1616
+ "gemini-2.5-flash-image",
1617
+ "gemini-2.5-flash-image-preview",
1618
+ "gemini-2.5-flash-lite",
1619
+ "gemini-2.5-flash-lite-preview-06-17",
1620
+ "gemini-2.5-flash-lite-preview-09-2025",
1621
+ "gemini-2.5-flash-preview-04-17",
1622
+ "gemini-2.5-flash-preview-05-20",
1623
+ "gemini-2.5-flash-preview-09-2025",
1624
+ "gemini-2.5-flash-preview-tts",
1534
1625
  "gemini-2.5-pro",
1535
- "gpt-4.1",
1536
- "gpt-oss-120b",
1537
- "kimi-k2-instruct",
1538
- "llama-3.1-405b-instruct",
1539
- "nova-pro-v1",
1540
- "qwen3-32b",
1541
- "qwen3-coder-480b-a35b-instruct"
1626
+ "gemini-2.5-pro-preview-05-06",
1627
+ "gemini-2.5-pro-preview-06-05",
1628
+ "gemini-2.5-pro-preview-tts",
1629
+ "gemini-flash-latest",
1630
+ "gemini-flash-lite-latest",
1631
+ "gemini-live-2.5-flash",
1632
+ "gemini-live-2.5-flash-preview-native-audio"
1633
+ ],
1634
+ groq: [
1635
+ "deepseek-r1-distill-llama-70b",
1636
+ "gemma2-9b-it",
1637
+ "llama-3.1-8b-instant",
1638
+ "llama-3.3-70b-versatile",
1639
+ "llama-guard-3-8b",
1640
+ "llama3-70b-8192",
1641
+ "llama3-8b-8192",
1642
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
1643
+ "meta-llama/llama-4-scout-17b-16e-instruct",
1644
+ "meta-llama/llama-guard-4-12b",
1645
+ "mistral-saba-24b",
1646
+ "moonshotai/kimi-k2-instruct",
1647
+ "moonshotai/kimi-k2-instruct-0905",
1648
+ "openai/gpt-oss-120b",
1649
+ "openai/gpt-oss-20b",
1650
+ "qwen-qwq-32b",
1651
+ "qwen/qwen3-32b"
1542
1652
  ],
1653
+ "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1543
1654
  "github-models": [
1544
1655
  "ai21-labs/ai21-jamba-1.5-large",
1545
1656
  "ai21-labs/ai21-jamba-1.5-mini",
@@ -1597,97 +1708,53 @@ var provider_registry_default = {
1597
1708
  "xai/grok-3",
1598
1709
  "xai/grok-3-mini"
1599
1710
  ],
1600
- togetherai: [
1601
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1602
- "deepseek-ai/DeepSeek-R1",
1603
- "deepseek-ai/DeepSeek-V3",
1604
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1605
- "moonshotai/Kimi-K2-Instruct",
1606
- "openai/gpt-oss-120b"
1607
- ],
1608
- baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905"],
1609
- huggingface: [
1610
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1711
+ deepinfra: [
1611
1712
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1612
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1613
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1614
- "deepseek-ai/DeepSeek-R1-0528",
1615
- "deepseek-ai/Deepseek-V3-0324",
1713
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1616
1714
  "moonshotai/Kimi-K2-Instruct",
1617
- "moonshotai/Kimi-K2-Instruct-0905",
1618
- "zai-org/GLM-4.5",
1619
- "zai-org/GLM-4.5-Air",
1620
- "zai-org/GLM-4.6"
1621
- ],
1622
- opencode: [
1623
- "an-g8x",
1624
- "claude-3-5-haiku",
1625
- "claude-haiku-4-5",
1626
- "claude-opus-4-1",
1627
- "claude-sonnet-4",
1628
- "claude-sonnet-4-5",
1629
- "code-supernova",
1630
- "glm-4.6",
1631
- "gpt-5",
1632
- "gpt-5-codex",
1633
- "grok-code",
1634
- "kimi-k2",
1635
- "qwen3-coder"
1636
- ],
1637
- fastrouter: [
1638
- "anthropic/claude-opus-4.1",
1639
- "anthropic/claude-sonnet-4",
1640
- "deepseek-ai/deepseek-r1-distill-llama-70b",
1641
- "google/gemini-2.5-flash",
1642
- "google/gemini-2.5-pro",
1643
- "moonshotai/kimi-k2",
1644
- "openai/gpt-4.1",
1645
- "openai/gpt-5",
1646
- "openai/gpt-5-mini",
1647
- "openai/gpt-5-nano",
1648
- "openai/gpt-oss-120b",
1649
- "openai/gpt-oss-20b",
1650
- "qwen/qwen3-coder",
1651
- "x-ai/grok-4"
1715
+ "zai-org/GLM-4.5"
1652
1716
  ],
1653
- google: [
1654
- "gemini-1.5-flash",
1655
- "gemini-1.5-flash-8b",
1656
- "gemini-1.5-pro",
1657
- "gemini-2.0-flash",
1658
- "gemini-2.0-flash-lite",
1659
- "gemini-2.5-flash",
1660
- "gemini-2.5-flash-image",
1661
- "gemini-2.5-flash-image-preview",
1662
- "gemini-2.5-flash-lite",
1663
- "gemini-2.5-flash-lite-preview-06-17",
1664
- "gemini-2.5-flash-lite-preview-09-2025",
1665
- "gemini-2.5-flash-preview-04-17",
1666
- "gemini-2.5-flash-preview-05-20",
1667
- "gemini-2.5-flash-preview-09-2025",
1668
- "gemini-2.5-flash-preview-tts",
1669
- "gemini-2.5-pro",
1670
- "gemini-2.5-pro-preview-05-06",
1671
- "gemini-2.5-pro-preview-06-05",
1672
- "gemini-2.5-pro-preview-tts",
1673
- "gemini-flash-latest",
1674
- "gemini-flash-lite-latest",
1675
- "gemini-live-2.5-flash",
1676
- "gemini-live-2.5-flash-preview-native-audio"
1717
+ "fireworks-ai": [
1718
+ "accounts/fireworks/models/deepseek-r1-0528",
1719
+ "accounts/fireworks/models/deepseek-v3-0324",
1720
+ "accounts/fireworks/models/deepseek-v3p1",
1721
+ "accounts/fireworks/models/glm-4p5",
1722
+ "accounts/fireworks/models/glm-4p5-air",
1723
+ "accounts/fireworks/models/gpt-oss-120b",
1724
+ "accounts/fireworks/models/gpt-oss-20b",
1725
+ "accounts/fireworks/models/kimi-k2-instruct",
1726
+ "accounts/fireworks/models/qwen3-235b-a22b",
1727
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1728
+ ],
1729
+ zai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1730
+ opencode: [
1731
+ "an-gbt",
1732
+ "big-pickle",
1733
+ "claude-3-5-haiku",
1734
+ "claude-haiku-4-5",
1735
+ "claude-opus-4-1",
1736
+ "claude-sonnet-4",
1737
+ "claude-sonnet-4-5",
1738
+ "code-supernova",
1739
+ "glm-4.6",
1740
+ "gpt-5",
1741
+ "gpt-5-codex",
1742
+ "grok-code",
1743
+ "kimi-k2",
1744
+ "qwen3-coder"
1677
1745
  ],
1746
+ "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1678
1747
  inception: ["mercury", "mercury-coder"],
1679
- wandb: [
1680
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1681
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1682
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1683
- "deepseek-ai/DeepSeek-R1-0528",
1684
- "deepseek-ai/DeepSeek-V3-0324",
1685
- "meta-llama/Llama-3.1-8B-Instruct",
1686
- "meta-llama/Llama-3.3-70B-Instruct",
1687
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1688
- "microsoft/Phi-4-mini-instruct",
1689
- "moonshotai/Kimi-K2-Instruct"
1748
+ llama: [
1749
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1750
+ "cerebras-llama-4-scout-17b-16e-instruct",
1751
+ "groq-llama-4-maverick-17b-128e-instruct",
1752
+ "llama-3.3-70b-instruct",
1753
+ "llama-3.3-8b-instruct",
1754
+ "llama-4-maverick-17b-128e-instruct-fp8",
1755
+ "llama-4-scout-17b-16e-instruct-fp8"
1690
1756
  ],
1757
+ lmstudio: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1691
1758
  openai: [
1692
1759
  "codex-mini-latest",
1693
1760
  "gpt-3.5-turbo",
@@ -1717,234 +1784,229 @@ var provider_registry_default = {
1717
1784
  "o4-mini",
1718
1785
  "o4-mini-deep-research"
1719
1786
  ],
1720
- "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1721
- perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1722
- openrouter: [
1723
- "anthropic/claude-3.5-haiku",
1724
- "anthropic/claude-3.7-sonnet",
1725
- "anthropic/claude-4.5-haiku",
1726
- "anthropic/claude-opus-4",
1727
- "anthropic/claude-opus-4.1",
1728
- "anthropic/claude-sonnet-4",
1729
- "anthropic/claude-sonnet-4.5",
1730
- "cognitivecomputations/dolphin3.0-mistral-24b",
1731
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
1732
- "deepseek/deepseek-chat-v3-0324",
1733
- "deepseek/deepseek-chat-v3.1",
1734
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
1735
- "deepseek/deepseek-r1-0528:free",
1736
- "deepseek/deepseek-r1-distill-llama-70b",
1737
- "deepseek/deepseek-r1-distill-qwen-14b",
1738
- "deepseek/deepseek-r1:free",
1739
- "deepseek/deepseek-v3-base:free",
1740
- "deepseek/deepseek-v3.1-terminus",
1741
- "featherless/qwerky-72b",
1742
- "google/gemini-2.0-flash-001",
1743
- "google/gemini-2.0-flash-exp:free",
1744
- "google/gemini-2.5-flash",
1745
- "google/gemini-2.5-flash-lite",
1746
- "google/gemini-2.5-flash-lite-preview-09-2025",
1747
- "google/gemini-2.5-flash-preview-09-2025",
1748
- "google/gemini-2.5-pro",
1749
- "google/gemini-2.5-pro-preview-05-06",
1750
- "google/gemini-2.5-pro-preview-06-05",
1751
- "google/gemma-2-9b-it:free",
1752
- "google/gemma-3-12b-it",
1753
- "google/gemma-3-27b-it",
1754
- "google/gemma-3n-e4b-it",
1755
- "google/gemma-3n-e4b-it:free",
1756
- "meta-llama/llama-3.2-11b-vision-instruct",
1757
- "meta-llama/llama-3.3-70b-instruct:free",
1758
- "meta-llama/llama-4-scout:free",
1759
- "microsoft/mai-ds-r1:free",
1760
- "mistralai/codestral-2508",
1761
- "mistralai/devstral-medium-2507",
1762
- "mistralai/devstral-small-2505",
1763
- "mistralai/devstral-small-2505:free",
1764
- "mistralai/devstral-small-2507",
1765
- "mistralai/mistral-7b-instruct:free",
1766
- "mistralai/mistral-medium-3",
1767
- "mistralai/mistral-medium-3.1",
1768
- "mistralai/mistral-nemo:free",
1769
- "mistralai/mistral-small-3.1-24b-instruct",
1770
- "mistralai/mistral-small-3.2-24b-instruct",
1771
- "mistralai/mistral-small-3.2-24b-instruct:free",
1772
- "moonshotai/kimi-dev-72b:free",
1773
- "moonshotai/kimi-k2",
1774
- "moonshotai/kimi-k2-0905",
1775
- "moonshotai/kimi-k2:free",
1776
- "nousresearch/deephermes-3-llama-3-8b-preview",
1777
- "nousresearch/hermes-4-405b",
1778
- "nousresearch/hermes-4-70b",
1779
- "openai/gpt-4.1",
1780
- "openai/gpt-4.1-mini",
1781
- "openai/gpt-4o-mini",
1782
- "openai/gpt-5",
1783
- "openai/gpt-5-chat",
1784
- "openai/gpt-5-codex",
1785
- "openai/gpt-5-image",
1786
- "openai/gpt-5-mini",
1787
- "openai/gpt-5-nano",
1788
- "openai/gpt-oss-120b",
1789
- "openai/gpt-oss-20b",
1790
- "openai/o4-mini",
1791
- "openrouter/cypher-alpha:free",
1792
- "openrouter/horizon-alpha",
1793
- "openrouter/horizon-beta",
1794
- "openrouter/sonoma-dusk-alpha",
1795
- "openrouter/sonoma-sky-alpha",
1796
- "qwen/qwen-2.5-coder-32b-instruct",
1797
- "qwen/qwen2.5-vl-32b-instruct:free",
1798
- "qwen/qwen2.5-vl-72b-instruct",
1799
- "qwen/qwen2.5-vl-72b-instruct:free",
1800
- "qwen/qwen3-14b:free",
1801
- "qwen/qwen3-235b-a22b-07-25",
1802
- "qwen/qwen3-235b-a22b-07-25:free",
1803
- "qwen/qwen3-235b-a22b-thinking-2507",
1804
- "qwen/qwen3-235b-a22b:free",
1805
- "qwen/qwen3-30b-a3b-instruct-2507",
1806
- "qwen/qwen3-30b-a3b-thinking-2507",
1807
- "qwen/qwen3-30b-a3b:free",
1808
- "qwen/qwen3-32b:free",
1809
- "qwen/qwen3-8b:free",
1810
- "qwen/qwen3-coder",
1811
- "qwen/qwen3-coder:free",
1812
- "qwen/qwen3-max",
1813
- "qwen/qwen3-next-80b-a3b-instruct",
1814
- "qwen/qwen3-next-80b-a3b-thinking",
1815
- "qwen/qwq-32b:free",
1816
- "rekaai/reka-flash-3",
1817
- "sarvamai/sarvam-m:free",
1818
- "thudm/glm-z1-32b:free",
1819
- "tngtech/deepseek-r1t2-chimera:free",
1820
- "x-ai/grok-3",
1821
- "x-ai/grok-3-beta",
1822
- "x-ai/grok-3-mini",
1823
- "x-ai/grok-3-mini-beta",
1824
- "x-ai/grok-4",
1825
- "x-ai/grok-4-fast",
1826
- "x-ai/grok-4-fast:free",
1827
- "x-ai/grok-code-fast-1",
1828
- "z-ai/glm-4.5",
1829
- "z-ai/glm-4.5-air",
1830
- "z-ai/glm-4.5-air:free",
1831
- "z-ai/glm-4.5v",
1832
- "z-ai/glm-4.6"
1787
+ anthropic: [
1788
+ "claude-3-5-haiku-20241022",
1789
+ "claude-3-5-haiku-latest",
1790
+ "claude-3-5-sonnet-20240620",
1791
+ "claude-3-5-sonnet-20241022",
1792
+ "claude-3-7-sonnet-20250219",
1793
+ "claude-3-7-sonnet-latest",
1794
+ "claude-3-haiku-20240307",
1795
+ "claude-3-opus-20240229",
1796
+ "claude-3-sonnet-20240229",
1797
+ "claude-haiku-4-5",
1798
+ "claude-haiku-4-5-20251001",
1799
+ "claude-opus-4-0",
1800
+ "claude-opus-4-1",
1801
+ "claude-opus-4-1-20250805",
1802
+ "claude-opus-4-20250514",
1803
+ "claude-sonnet-4-0",
1804
+ "claude-sonnet-4-20250514",
1805
+ "claude-sonnet-4-5",
1806
+ "claude-sonnet-4-5-20250929"
1833
1807
  ],
1834
- synthetic: [
1835
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
1836
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
1837
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
1838
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
1839
- "hf:deepseek-ai/DeepSeek-R1",
1840
- "hf:deepseek-ai/DeepSeek-R1-0528",
1841
- "hf:deepseek-ai/DeepSeek-V3",
1842
- "hf:deepseek-ai/DeepSeek-V3-0324",
1843
- "hf:deepseek-ai/DeepSeek-V3.1",
1844
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
1845
- "hf:meta-llama/Llama-3.1-405B-Instruct",
1846
- "hf:meta-llama/Llama-3.1-70B-Instruct",
1847
- "hf:meta-llama/Llama-3.1-8B-Instruct",
1848
- "hf:meta-llama/Llama-3.3-70B-Instruct",
1849
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
1850
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
1851
- "hf:moonshotai/Kimi-K2-Instruct",
1852
- "hf:moonshotai/Kimi-K2-Instruct-0905",
1853
- "hf:openai/gpt-oss-120b",
1854
- "hf:zai-org/GLM-4.5",
1855
- "hf:zai-org/GLM-4.6"
1808
+ moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1809
+ inference: [
1810
+ "google/gemma-3",
1811
+ "meta/llama-3.1-8b-instruct",
1812
+ "meta/llama-3.2-11b-vision-instruct",
1813
+ "meta/llama-3.2-1b-instruct",
1814
+ "meta/llama-3.2-3b-instruct",
1815
+ "mistral/mistral-nemo-12b-instruct",
1816
+ "osmosis/osmosis-structure-0.6b",
1817
+ "qwen/qwen-2.5-7b-vision-instruct",
1818
+ "qwen/qwen3-embedding-4b"
1819
+ ],
1820
+ baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1821
+ cortecs: [
1822
+ "claude-4-5-sonnet",
1823
+ "claude-sonnet-4",
1824
+ "deepseek-v3-0324",
1825
+ "gemini-2.5-pro",
1826
+ "gpt-4.1",
1827
+ "gpt-oss-120b",
1828
+ "kimi-k2-instruct",
1829
+ "llama-3.1-405b-instruct",
1830
+ "nova-pro-v1",
1831
+ "qwen3-32b",
1832
+ "qwen3-coder-480b-a35b-instruct"
1833
+ ],
1834
+ mistral: [
1835
+ "codestral-latest",
1836
+ "devstral-medium-2507",
1837
+ "devstral-small-2505",
1838
+ "devstral-small-2507",
1839
+ "magistral-medium-latest",
1840
+ "magistral-small",
1841
+ "ministral-3b-latest",
1842
+ "ministral-8b-latest",
1843
+ "mistral-large-latest",
1844
+ "mistral-medium-2505",
1845
+ "mistral-medium-2508",
1846
+ "mistral-medium-latest",
1847
+ "mistral-nemo",
1848
+ "mistral-small-latest",
1849
+ "open-mistral-7b",
1850
+ "open-mixtral-8x22b",
1851
+ "open-mixtral-8x7b",
1852
+ "pixtral-12b",
1853
+ "pixtral-large-latest"
1854
+ ],
1855
+ venice: [
1856
+ "deepseek-coder-v2-lite",
1857
+ "deepseek-r1-671b",
1858
+ "dolphin-2.9.2-qwen2-72b",
1859
+ "llama-3.1-405b",
1860
+ "llama-3.2-3b",
1861
+ "llama-3.3-70b",
1862
+ "mistral-31-24b",
1863
+ "qwen-2.5-coder-32b",
1864
+ "qwen-2.5-qwq-32b",
1865
+ "qwen-2.5-vl",
1866
+ "qwen3-235b",
1867
+ "qwen3-4b",
1868
+ "venice-uncensored"
1869
+ ],
1870
+ alibaba: [
1871
+ "qvq-max",
1872
+ "qwen-flash",
1873
+ "qwen-max",
1874
+ "qwen-mt-plus",
1875
+ "qwen-mt-turbo",
1876
+ "qwen-omni-turbo",
1877
+ "qwen-omni-turbo-realtime",
1878
+ "qwen-plus",
1879
+ "qwen-plus-character-ja",
1880
+ "qwen-turbo",
1881
+ "qwen-vl-max",
1882
+ "qwen-vl-ocr",
1883
+ "qwen-vl-plus",
1884
+ "qwen2-5-14b-instruct",
1885
+ "qwen2-5-32b-instruct",
1886
+ "qwen2-5-72b-instruct",
1887
+ "qwen2-5-7b-instruct",
1888
+ "qwen2-5-omni-7b",
1889
+ "qwen2-5-vl-72b-instruct",
1890
+ "qwen2-5-vl-7b-instruct",
1891
+ "qwen3-14b",
1892
+ "qwen3-235b-a22b",
1893
+ "qwen3-32b",
1894
+ "qwen3-8b",
1895
+ "qwen3-asr-flash",
1896
+ "qwen3-coder-30b-a3b-instruct",
1897
+ "qwen3-coder-480b-a35b-instruct",
1898
+ "qwen3-coder-flash",
1899
+ "qwen3-coder-plus",
1900
+ "qwen3-livetranslate-flash-realtime",
1901
+ "qwen3-max",
1902
+ "qwen3-next-80b-a3b-instruct",
1903
+ "qwen3-next-80b-a3b-thinking",
1904
+ "qwen3-omni-flash",
1905
+ "qwen3-omni-flash-realtime",
1906
+ "qwen3-vl-235b-a22b",
1907
+ "qwen3-vl-30b-a3b",
1908
+ "qwen3-vl-plus",
1909
+ "qwq-plus"
1856
1910
  ],
1857
- deepinfra: [
1858
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1859
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1860
- "moonshotai/Kimi-K2-Instruct",
1861
- "zai-org/GLM-4.5"
1911
+ "alibaba-cn": [
1912
+ "deepseek-r1",
1913
+ "deepseek-r1-0528",
1914
+ "deepseek-r1-distill-llama-70b",
1915
+ "deepseek-r1-distill-llama-8b",
1916
+ "deepseek-r1-distill-qwen-1-5b",
1917
+ "deepseek-r1-distill-qwen-14b",
1918
+ "deepseek-r1-distill-qwen-32b",
1919
+ "deepseek-r1-distill-qwen-7b",
1920
+ "deepseek-v3",
1921
+ "deepseek-v3-1",
1922
+ "deepseek-v3-2-exp",
1923
+ "moonshot-kimi-k2-instruct",
1924
+ "qvq-max",
1925
+ "qwen-deep-research",
1926
+ "qwen-doc-turbo",
1927
+ "qwen-flash",
1928
+ "qwen-long",
1929
+ "qwen-math-plus",
1930
+ "qwen-math-turbo",
1931
+ "qwen-max",
1932
+ "qwen-mt-plus",
1933
+ "qwen-mt-turbo",
1934
+ "qwen-omni-turbo",
1935
+ "qwen-omni-turbo-realtime",
1936
+ "qwen-plus",
1937
+ "qwen-plus-character",
1938
+ "qwen-turbo",
1939
+ "qwen-vl-max",
1940
+ "qwen-vl-ocr",
1941
+ "qwen-vl-plus",
1942
+ "qwen2-5-14b-instruct",
1943
+ "qwen2-5-32b-instruct",
1944
+ "qwen2-5-72b-instruct",
1945
+ "qwen2-5-7b-instruct",
1946
+ "qwen2-5-coder-32b-instruct",
1947
+ "qwen2-5-coder-7b-instruct",
1948
+ "qwen2-5-math-72b-instruct",
1949
+ "qwen2-5-math-7b-instruct",
1950
+ "qwen2-5-omni-7b",
1951
+ "qwen2-5-vl-72b-instruct",
1952
+ "qwen2-5-vl-7b-instruct",
1953
+ "qwen3-14b",
1954
+ "qwen3-235b-a22b",
1955
+ "qwen3-32b",
1956
+ "qwen3-8b",
1957
+ "qwen3-asr-flash",
1958
+ "qwen3-coder-30b-a3b-instruct",
1959
+ "qwen3-coder-480b-a35b-instruct",
1960
+ "qwen3-coder-flash",
1961
+ "qwen3-coder-plus",
1962
+ "qwen3-max",
1963
+ "qwen3-next-80b-a3b-instruct",
1964
+ "qwen3-next-80b-a3b-thinking",
1965
+ "qwen3-omni-flash",
1966
+ "qwen3-omni-flash-realtime",
1967
+ "qwen3-vl-235b-a22b",
1968
+ "qwen3-vl-30b-a3b",
1969
+ "qwen3-vl-plus",
1970
+ "qwq-32b",
1971
+ "qwq-plus",
1972
+ "tongyi-intent-detect-v3"
1862
1973
  ],
1863
- zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1864
- submodel: [
1974
+ chutes: [
1865
1975
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1866
1976
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1977
+ "Qwen/Qwen3-30B-A3B",
1978
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1979
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1980
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1867
1981
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1982
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1983
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1984
+ "chutesai/Devstral-Small-2505",
1985
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1868
1986
  "deepseek-ai/DeepSeek-R1-0528",
1987
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1988
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1869
1989
  "deepseek-ai/DeepSeek-V3-0324",
1870
1990
  "deepseek-ai/DeepSeek-V3.1",
1991
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1992
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1993
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1994
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1995
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1996
+ "moonshotai/Kimi-Dev-72B",
1997
+ "moonshotai/Kimi-K2-Instruct-0905",
1998
+ "moonshotai/Kimi-K2-Instruct-75k",
1999
+ "moonshotai/Kimi-VL-A3B-Thinking",
1871
2000
  "openai/gpt-oss-120b",
2001
+ "tngtech/DeepSeek-R1T-Chimera",
2002
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1872
2003
  "zai-org/GLM-4.5-Air",
1873
- "zai-org/GLM-4.5-FP8"
1874
- ],
1875
- zai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1876
- inference: [
1877
- "google/gemma-3",
1878
- "meta/llama-3.1-8b-instruct",
1879
- "meta/llama-3.2-11b-vision-instruct",
1880
- "meta/llama-3.2-1b-instruct",
1881
- "meta/llama-3.2-3b-instruct",
1882
- "mistral/mistral-nemo-12b-instruct",
1883
- "osmosis/osmosis-structure-0.6b",
1884
- "qwen/qwen-2.5-7b-vision-instruct",
1885
- "qwen/qwen3-embedding-4b"
1886
- ],
1887
- requesty: [
1888
- "anthropic/claude-3-7-sonnet",
1889
- "anthropic/claude-4-sonnet-20250522",
1890
- "anthropic/claude-opus-4",
1891
- "anthropic/claude-opus-4-1-20250805",
1892
- "google/gemini-2.5-flash",
1893
- "google/gemini-2.5-pro",
1894
- "openai/gpt-4.1",
1895
- "openai/gpt-4.1-mini",
1896
- "openai/gpt-4o-mini",
1897
- "openai/gpt-5",
1898
- "openai/gpt-5-mini",
1899
- "openai/gpt-5-nano",
1900
- "openai/o4-mini"
1901
- ],
1902
- morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1903
- lmstudio: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1904
- anthropic: [
1905
- "claude-3-5-haiku-20241022",
1906
- "claude-3-5-sonnet-20240620",
1907
- "claude-3-5-sonnet-20241022",
1908
- "claude-3-7-sonnet-20250219",
1909
- "claude-3-haiku-20240307",
1910
- "claude-3-opus-20240229",
1911
- "claude-3-sonnet-20240229",
1912
- "claude-haiku-4-5-20251001",
1913
- "claude-opus-4-1-20250805",
1914
- "claude-opus-4-20250514",
1915
- "claude-sonnet-4-20250514",
1916
- "claude-sonnet-4-5-20250929"
1917
- ],
1918
- "fireworks-ai": [
1919
- "accounts/fireworks/models/deepseek-r1-0528",
1920
- "accounts/fireworks/models/deepseek-v3-0324",
1921
- "accounts/fireworks/models/deepseek-v3p1",
1922
- "accounts/fireworks/models/glm-4p5",
1923
- "accounts/fireworks/models/glm-4p5-air",
1924
- "accounts/fireworks/models/gpt-oss-120b",
1925
- "accounts/fireworks/models/gpt-oss-20b",
1926
- "accounts/fireworks/models/kimi-k2-instruct",
1927
- "accounts/fireworks/models/qwen3-235b-a22b",
1928
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1929
- ],
1930
- modelscope: [
1931
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1932
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1933
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1934
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1935
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1936
- "ZhipuAI/GLM-4.5"
1937
- ],
1938
- llama: [
1939
- "cerebras-llama-4-maverick-17b-128e-instruct",
1940
- "cerebras-llama-4-scout-17b-16e-instruct",
1941
- "groq-llama-4-maverick-17b-128e-instruct",
1942
- "llama-3.3-70b-instruct",
1943
- "llama-3.3-8b-instruct",
1944
- "llama-4-maverick-17b-128e-instruct-fp8",
1945
- "llama-4-scout-17b-16e-instruct-fp8"
2004
+ "zai-org/GLM-4.5-FP8",
2005
+ "zai-org/GLM-4.5-turbo",
2006
+ "zai-org/GLM-4.6-FP8",
2007
+ "zai-org/GLM-4.6-turbo"
1946
2008
  ],
1947
- cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
2009
+ upstage: ["solar-mini", "solar-pro2"],
1948
2010
  netlify: [
1949
2011
  "anthropic/claude-3-5-haiku-20241022",
1950
2012
  "anthropic/claude-3-5-haiku-latest",
@@ -2016,7 +2078,7 @@ function saveLastRefreshTimeToDisk(date) {
2016
2078
  }
2017
2079
  function getPackageRoot() {
2018
2080
  try {
2019
- const require2 = module$1.createRequire((typeof document === 'undefined' ? require('u' + 'rl').pathToFileURL(__filename).href : (_documentCurrentScript && _documentCurrentScript.tagName.toUpperCase() === 'SCRIPT' && _documentCurrentScript.src || new URL('chunk-DGQW5VRR.cjs', document.baseURI).href)) || "file://");
2081
+ const require2 = module$1.createRequire((typeof document === 'undefined' ? require('u' + 'rl').pathToFileURL(__filename).href : (_documentCurrentScript && _documentCurrentScript.tagName.toUpperCase() === 'SCRIPT' && _documentCurrentScript.src || new URL('chunk-ZMPSVDDO.cjs', document.baseURI).href)) || "file://");
2020
2082
  const packageJsonPath = require2.resolve("@mastra/core/package.json");
2021
2083
  return path__default.default.dirname(packageJsonPath);
2022
2084
  } catch {
@@ -2169,8 +2231,8 @@ var GatewayRegistry = class _GatewayRegistry {
2169
2231
  }
2170
2232
  this.isRefreshing = true;
2171
2233
  try {
2172
- const { ModelsDevGateway: ModelsDevGateway2 } = await import('./models-dev-L42ORGVT.cjs');
2173
- const { NetlifyGateway: NetlifyGateway2 } = await import('./netlify-3B6HDHRP.cjs');
2234
+ const { ModelsDevGateway: ModelsDevGateway2 } = await import('./models-dev-AXZASLL2.cjs');
2235
+ const { NetlifyGateway: NetlifyGateway2 } = await import('./netlify-F3MVGV4Y.cjs');
2174
2236
  const { fetchProvidersFromGateways, writeRegistryFiles } = await import('./registry-generator-6WVOHM2L.cjs');
2175
2237
  const gateways2 = [new ModelsDevGateway2({}), new NetlifyGateway2()];
2176
2238
  const { providers, models } = await fetchProvidersFromGateways(gateways2);
@@ -2279,11 +2341,29 @@ if (autoRefreshEnabled) {
2279
2341
  GatewayRegistry.getInstance({ useDynamicLoading: isDev }).startAutoRefresh();
2280
2342
  }
2281
2343
 
2344
+ // src/llm/model/gateways/index.ts
2345
+ function findGatewayForModel(gatewayId, gateways2) {
2346
+ const prefixedGateway = gateways2.find((g) => g.prefix && gatewayId.startsWith(`${g.prefix}/`));
2347
+ if (prefixedGateway) {
2348
+ return prefixedGateway;
2349
+ }
2350
+ const unprefixedGateways = gateways2.filter((g) => !g.prefix);
2351
+ for (const gateway of unprefixedGateways) {
2352
+ return gateway;
2353
+ }
2354
+ throw new chunkWM4VQWOZ_cjs.MastraError({
2355
+ id: "MODEL_ROUTER_NO_GATEWAY_FOUND",
2356
+ category: "USER",
2357
+ domain: "MODEL_ROUTER",
2358
+ text: `No Mastra model router gateway found for model id ${gatewayId}`
2359
+ });
2360
+ }
2361
+
2282
2362
  // src/llm/model/router.ts
2283
2363
  function getStaticProvidersByGateway(name) {
2284
2364
  return Object.fromEntries(Object.entries(PROVIDER_REGISTRY).filter(([_provider, config]) => config.gateway === name));
2285
2365
  }
2286
- var gateways = [new chunkOY6UJ3QL_cjs.NetlifyGateway(), new chunk3ORA5EFD_cjs.ModelsDevGateway(getStaticProvidersByGateway(`models.dev`))];
2366
+ var gateways = [new chunkYGL6E6PD_cjs.NetlifyGateway(), new chunkLZUSZT7R_cjs.ModelsDevGateway(getStaticProvidersByGateway(`models.dev`))];
2287
2367
  var ModelRouterLanguageModel = class _ModelRouterLanguageModel {
2288
2368
  specificationVersion = "v2";
2289
2369
  defaultObjectGenerationMode = "json";
@@ -2318,7 +2398,7 @@ var ModelRouterLanguageModel = class _ModelRouterLanguageModel {
2318
2398
  routerId: normalizedConfig.id
2319
2399
  };
2320
2400
  this.gateway = findGatewayForModel(normalizedConfig.id, gateways);
2321
- const parsed = chunk3ORA5EFD_cjs.parseModelRouterId(normalizedConfig.id, this.gateway.prefix);
2401
+ const parsed = chunkLZUSZT7R_cjs.parseModelRouterId(normalizedConfig.id, this.gateway.prefix);
2322
2402
  this.provider = parsed.providerId || "openai-compatible";
2323
2403
  if (parsed.providerId && parsed.modelId !== normalizedConfig.id) {
2324
2404
  parsedConfig.id = parsed.modelId;
@@ -2334,7 +2414,11 @@ var ModelRouterLanguageModel = class _ModelRouterLanguageModel {
2334
2414
  async doStream(options) {
2335
2415
  let apiKey;
2336
2416
  try {
2337
- apiKey = this.config.apiKey || await this.gateway.getApiKey(this.config.routerId);
2417
+ if (this.config.url) {
2418
+ apiKey = this.config.apiKey || "";
2419
+ } else {
2420
+ apiKey = this.config.apiKey || await this.gateway.getApiKey(this.config.routerId);
2421
+ }
2338
2422
  } catch (error) {
2339
2423
  return {
2340
2424
  stream: new ReadableStream({
@@ -2349,7 +2433,7 @@ var ModelRouterLanguageModel = class _ModelRouterLanguageModel {
2349
2433
  }
2350
2434
  const model = await this.resolveLanguageModel({
2351
2435
  apiKey,
2352
- ...chunk3ORA5EFD_cjs.parseModelRouterId(this.config.routerId, this.gateway.prefix)
2436
+ ...chunkLZUSZT7R_cjs.parseModelRouterId(this.config.routerId, this.gateway.prefix)
2353
2437
  });
2354
2438
  return model.doStream(options);
2355
2439
  }
@@ -2365,7 +2449,8 @@ var ModelRouterLanguageModel = class _ModelRouterLanguageModel {
2365
2449
  name: providerId,
2366
2450
  apiKey,
2367
2451
  baseURL: this.config.url,
2368
- headers: this.config.headers
2452
+ headers: this.config.headers,
2453
+ supportsStructuredOutputs: true
2369
2454
  }).chatModel(modelId);
2370
2455
  _ModelRouterLanguageModel.modelInstances.set(key, modelInstance2);
2371
2456
  return modelInstance2;
@@ -2402,11 +2487,112 @@ async function resolveModelConfig(modelConfig, runtimeContext = new chunkGPWMM74
2402
2487
  }
2403
2488
  throw new Error("Invalid model configuration provided");
2404
2489
  }
2490
+ var ModelRouterEmbeddingModel = class {
2491
+ specificationVersion = "v2";
2492
+ modelId;
2493
+ provider;
2494
+ maxEmbeddingsPerCall = 2048;
2495
+ supportsParallelCalls = true;
2496
+ providerModel;
2497
+ constructor(config) {
2498
+ let normalizedConfig;
2499
+ if (typeof config === "string") {
2500
+ const parts = config.split("/");
2501
+ if (parts.length !== 2) {
2502
+ throw new Error(`Invalid model string format: "${config}". Expected format: "provider/model"`);
2503
+ }
2504
+ const [providerId, modelId] = parts;
2505
+ normalizedConfig = { providerId, modelId };
2506
+ } else if ("providerId" in config && "modelId" in config) {
2507
+ normalizedConfig = {
2508
+ providerId: config.providerId,
2509
+ modelId: config.modelId,
2510
+ url: config.url,
2511
+ apiKey: config.apiKey,
2512
+ headers: config.headers
2513
+ };
2514
+ } else {
2515
+ const parts = config.id.split("/");
2516
+ if (parts.length !== 2) {
2517
+ throw new Error(`Invalid model string format: "${config.id}". Expected format: "provider/model"`);
2518
+ }
2519
+ const [providerId, modelId] = parts;
2520
+ normalizedConfig = {
2521
+ providerId,
2522
+ modelId,
2523
+ url: config.url,
2524
+ apiKey: config.apiKey,
2525
+ headers: config.headers
2526
+ };
2527
+ }
2528
+ this.provider = normalizedConfig.providerId;
2529
+ this.modelId = normalizedConfig.modelId;
2530
+ if (normalizedConfig.url) {
2531
+ const apiKey = normalizedConfig.apiKey || "";
2532
+ this.providerModel = openaiCompatibleV5.createOpenAICompatible({
2533
+ name: normalizedConfig.providerId,
2534
+ apiKey,
2535
+ baseURL: normalizedConfig.url,
2536
+ headers: normalizedConfig.headers
2537
+ }).textEmbeddingModel(normalizedConfig.modelId);
2538
+ } else {
2539
+ const registry = GatewayRegistry.getInstance();
2540
+ const providerConfig = registry.getProviderConfig(normalizedConfig.providerId);
2541
+ if (!providerConfig) {
2542
+ throw new Error(`Unknown provider: ${normalizedConfig.providerId}`);
2543
+ }
2544
+ let apiKey = normalizedConfig.apiKey;
2545
+ if (!apiKey) {
2546
+ const apiKeyEnvVar = providerConfig.apiKeyEnvVar;
2547
+ if (Array.isArray(apiKeyEnvVar)) {
2548
+ for (const envVar of apiKeyEnvVar) {
2549
+ apiKey = process.env[envVar];
2550
+ if (apiKey) break;
2551
+ }
2552
+ } else {
2553
+ apiKey = process.env[apiKeyEnvVar];
2554
+ }
2555
+ }
2556
+ if (!apiKey) {
2557
+ const envVarDisplay = Array.isArray(providerConfig.apiKeyEnvVar) ? providerConfig.apiKeyEnvVar.join(" or ") : providerConfig.apiKeyEnvVar;
2558
+ throw new Error(`API key not found for provider ${normalizedConfig.providerId}. Set ${envVarDisplay}`);
2559
+ }
2560
+ if (normalizedConfig.providerId === "openai") {
2561
+ this.providerModel = openaiV5.createOpenAI({ apiKey }).textEmbeddingModel(
2562
+ normalizedConfig.modelId
2563
+ );
2564
+ } else if (normalizedConfig.providerId === "google") {
2565
+ this.providerModel = googleV5.createGoogleGenerativeAI({ apiKey }).textEmbedding(
2566
+ normalizedConfig.modelId
2567
+ );
2568
+ } else {
2569
+ if (!providerConfig.url) {
2570
+ throw new Error(`Provider ${normalizedConfig.providerId} does not have a URL configured`);
2571
+ }
2572
+ this.providerModel = openaiCompatibleV5.createOpenAICompatible({
2573
+ name: normalizedConfig.providerId,
2574
+ apiKey,
2575
+ baseURL: providerConfig.url
2576
+ }).textEmbeddingModel(normalizedConfig.modelId);
2577
+ }
2578
+ }
2579
+ if (this.providerModel.maxEmbeddingsPerCall !== void 0) {
2580
+ this.maxEmbeddingsPerCall = this.providerModel.maxEmbeddingsPerCall;
2581
+ }
2582
+ if (this.providerModel.supportsParallelCalls !== void 0) {
2583
+ this.supportsParallelCalls = this.providerModel.supportsParallelCalls;
2584
+ }
2585
+ }
2586
+ async doEmbed(args) {
2587
+ return this.providerModel.doEmbed(args);
2588
+ }
2589
+ };
2405
2590
 
2591
+ exports.ModelRouterEmbeddingModel = ModelRouterEmbeddingModel;
2406
2592
  exports.ModelRouterLanguageModel = ModelRouterLanguageModel;
2407
2593
  exports.PROVIDER_REGISTRY = PROVIDER_REGISTRY;
2408
2594
  exports.getProviderConfig = getProviderConfig;
2409
2595
  exports.parseModelString = parseModelString;
2410
2596
  exports.resolveModelConfig = resolveModelConfig;
2411
- //# sourceMappingURL=chunk-DGQW5VRR.cjs.map
2412
- //# sourceMappingURL=chunk-DGQW5VRR.cjs.map
2597
+ //# sourceMappingURL=chunk-ZMPSVDDO.cjs.map
2598
+ //# sourceMappingURL=chunk-ZMPSVDDO.cjs.map