@mastra/core 0.21.2-alpha.0 → 0.22.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (181) hide show
  1. package/CHANGELOG.md +194 -0
  2. package/dist/agent/agent.d.ts +1 -0
  3. package/dist/agent/agent.d.ts.map +1 -1
  4. package/dist/agent/index.cjs +13 -13
  5. package/dist/agent/index.js +2 -2
  6. package/dist/agent/input-processor/index.cjs +6 -6
  7. package/dist/agent/input-processor/index.js +1 -1
  8. package/dist/agent/message-list/index.d.ts +14 -1
  9. package/dist/agent/message-list/index.d.ts.map +1 -1
  10. package/dist/agent/test-utils.d.ts +1 -0
  11. package/dist/agent/test-utils.d.ts.map +1 -1
  12. package/dist/agent/types.d.ts +6 -1
  13. package/dist/agent/types.d.ts.map +1 -1
  14. package/dist/agent/utils.d.ts +1 -1
  15. package/dist/agent/utils.d.ts.map +1 -1
  16. package/dist/ai-tracing/chunk-tracing.d.ts +76 -0
  17. package/dist/ai-tracing/chunk-tracing.d.ts.map +1 -0
  18. package/dist/ai-tracing/exporters/base.d.ts +111 -0
  19. package/dist/ai-tracing/exporters/base.d.ts.map +1 -0
  20. package/dist/ai-tracing/exporters/cloud.d.ts +6 -8
  21. package/dist/ai-tracing/exporters/cloud.d.ts.map +1 -1
  22. package/dist/ai-tracing/exporters/console.d.ts +6 -6
  23. package/dist/ai-tracing/exporters/console.d.ts.map +1 -1
  24. package/dist/ai-tracing/exporters/index.d.ts +1 -0
  25. package/dist/ai-tracing/exporters/index.d.ts.map +1 -1
  26. package/dist/ai-tracing/index.cjs +48 -32
  27. package/dist/ai-tracing/index.d.ts +1 -0
  28. package/dist/ai-tracing/index.d.ts.map +1 -1
  29. package/dist/ai-tracing/index.js +1 -1
  30. package/dist/ai-tracing/spans/base.d.ts +4 -1
  31. package/dist/ai-tracing/spans/base.d.ts.map +1 -1
  32. package/dist/ai-tracing/spans/default.d.ts.map +1 -1
  33. package/dist/ai-tracing/tracers/base.d.ts +15 -1
  34. package/dist/ai-tracing/tracers/base.d.ts.map +1 -1
  35. package/dist/ai-tracing/types.d.ts +85 -11
  36. package/dist/ai-tracing/types.d.ts.map +1 -1
  37. package/dist/ai-tracing/utils.d.ts +14 -0
  38. package/dist/ai-tracing/utils.d.ts.map +1 -1
  39. package/dist/{chunk-D3IOLHNB.cjs → chunk-34L2Z6PH.cjs} +12 -12
  40. package/dist/{chunk-D3IOLHNB.cjs.map → chunk-34L2Z6PH.cjs.map} +1 -1
  41. package/dist/{chunk-BLVB2IJK.js → chunk-3CVE7NQC.js} +728 -267
  42. package/dist/chunk-3CVE7NQC.js.map +1 -0
  43. package/dist/{chunk-URQI7RJ3.cjs → chunk-5GIAZ3CH.cjs} +734 -269
  44. package/dist/chunk-5GIAZ3CH.cjs.map +1 -0
  45. package/dist/{chunk-XYNSPEJO.js → chunk-5NYWRAJN.js} +3 -3
  46. package/dist/{chunk-XYNSPEJO.js.map → chunk-5NYWRAJN.js.map} +1 -1
  47. package/dist/{chunk-URVM3Y4T.cjs → chunk-634YFL42.cjs} +44 -7
  48. package/dist/chunk-634YFL42.cjs.map +1 -0
  49. package/dist/{chunk-NIESGYOH.js → chunk-A3TQYIIR.js} +1392 -1416
  50. package/dist/chunk-A3TQYIIR.js.map +1 -0
  51. package/dist/{chunk-EGNHIPGJ.cjs → chunk-A4B6IAKN.cjs} +4 -4
  52. package/dist/{chunk-EGNHIPGJ.cjs.map → chunk-A4B6IAKN.cjs.map} +1 -1
  53. package/dist/{chunk-LMP5KMU3.js → chunk-AGD5B3FB.js} +43 -6
  54. package/dist/chunk-AGD5B3FB.js.map +1 -0
  55. package/dist/{chunk-V5WDWSQ5.cjs → chunk-CAZTWPDK.cjs} +11 -11
  56. package/dist/{chunk-V5WDWSQ5.cjs.map → chunk-CAZTWPDK.cjs.map} +1 -1
  57. package/dist/{chunk-N3ZSX5OS.js → chunk-F7OMDF5K.js} +72 -36
  58. package/dist/chunk-F7OMDF5K.js.map +1 -0
  59. package/dist/{chunk-ZMPSVDDO.cjs → chunk-FMNZ3BPT.cjs} +1393 -1417
  60. package/dist/chunk-FMNZ3BPT.cjs.map +1 -0
  61. package/dist/{chunk-4ZFVJA3A.js → chunk-HZIF7HQC.js} +3 -3
  62. package/dist/{chunk-4ZFVJA3A.js.map → chunk-HZIF7HQC.js.map} +1 -1
  63. package/dist/{chunk-KLWDUSBX.js → chunk-ITFEGBP2.js} +4 -4
  64. package/dist/{chunk-KLWDUSBX.js.map → chunk-ITFEGBP2.js.map} +1 -1
  65. package/dist/{chunk-GKTRUHKB.js → chunk-KQBF5ZEN.js} +5 -5
  66. package/dist/{chunk-GKTRUHKB.js.map → chunk-KQBF5ZEN.js.map} +1 -1
  67. package/dist/{chunk-R35PINKN.js → chunk-MHICZASQ.js} +5 -5
  68. package/dist/{chunk-R35PINKN.js.map → chunk-MHICZASQ.js.map} +1 -1
  69. package/dist/{chunk-H4KO46HZ.js → chunk-MKCC5K77.js} +3 -3
  70. package/dist/{chunk-H4KO46HZ.js.map → chunk-MKCC5K77.js.map} +1 -1
  71. package/dist/{chunk-UN653TND.cjs → chunk-O4KVF3MI.cjs} +4 -4
  72. package/dist/{chunk-UN653TND.cjs.map → chunk-O4KVF3MI.cjs.map} +1 -1
  73. package/dist/{chunk-WI2YMBNG.cjs → chunk-QBPTDMR7.cjs} +102 -64
  74. package/dist/chunk-QBPTDMR7.cjs.map +1 -0
  75. package/dist/{chunk-7P5FMQQK.cjs → chunk-RWWOJXMF.cjs} +6 -6
  76. package/dist/{chunk-7P5FMQQK.cjs.map → chunk-RWWOJXMF.cjs.map} +1 -1
  77. package/dist/{chunk-XBJP7THY.js → chunk-RXBG6UV2.js} +4 -4
  78. package/dist/chunk-RXBG6UV2.js.map +1 -0
  79. package/dist/{chunk-NL3P7IFI.js → chunk-SF75RENF.js} +3 -3
  80. package/dist/{chunk-NL3P7IFI.js.map → chunk-SF75RENF.js.map} +1 -1
  81. package/dist/{chunk-SE4PA467.cjs → chunk-VF676YCO.cjs} +2 -2
  82. package/dist/chunk-VF676YCO.cjs.map +1 -0
  83. package/dist/{chunk-6OLRLZJ3.js → chunk-WM4RO23J.js} +2 -2
  84. package/dist/chunk-WM4RO23J.js.map +1 -0
  85. package/dist/{chunk-MVVMHOAC.cjs → chunk-YOVX3R5U.cjs} +14 -14
  86. package/dist/chunk-YOVX3R5U.cjs.map +1 -0
  87. package/dist/{chunk-L5A4MRCK.cjs → chunk-ZABG3SZ2.cjs} +4 -4
  88. package/dist/{chunk-L5A4MRCK.cjs.map → chunk-ZABG3SZ2.cjs.map} +1 -1
  89. package/dist/{chunk-YKVVW65D.cjs → chunk-ZDW322JC.cjs} +8 -8
  90. package/dist/{chunk-YKVVW65D.cjs.map → chunk-ZDW322JC.cjs.map} +1 -1
  91. package/dist/index.cjs +53 -53
  92. package/dist/index.js +11 -11
  93. package/dist/integration/index.cjs +3 -3
  94. package/dist/integration/index.js +1 -1
  95. package/dist/llm/index.cjs +7 -7
  96. package/dist/llm/index.js +1 -1
  97. package/dist/llm/model/model.loop.d.ts.map +1 -1
  98. package/dist/llm/model/provider-types.generated.d.ts +585 -597
  99. package/dist/loop/index.cjs +2 -2
  100. package/dist/loop/index.js +1 -1
  101. package/dist/loop/loop.d.ts.map +1 -1
  102. package/dist/loop/test-utils/mock-server-response.d.ts +7 -2
  103. package/dist/loop/test-utils/mock-server-response.d.ts.map +1 -1
  104. package/dist/loop/test-utils/options.d.ts.map +1 -1
  105. package/dist/loop/types.d.ts +2 -1
  106. package/dist/loop/types.d.ts.map +1 -1
  107. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts.map +1 -1
  108. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts +1 -1
  109. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts.map +1 -1
  110. package/dist/mastra/index.cjs +2 -2
  111. package/dist/mastra/index.js +1 -1
  112. package/dist/memory/index.cjs +4 -4
  113. package/dist/memory/index.js +1 -1
  114. package/dist/memory/memory.d.ts +3 -2
  115. package/dist/memory/memory.d.ts.map +1 -1
  116. package/dist/processors/index.cjs +11 -11
  117. package/dist/processors/index.js +1 -1
  118. package/dist/provider-registry.json +1390 -1414
  119. package/dist/relevance/index.cjs +4 -4
  120. package/dist/relevance/index.js +1 -1
  121. package/dist/scores/index.cjs +9 -9
  122. package/dist/scores/index.js +2 -2
  123. package/dist/scores/scoreTraces/index.cjs +8 -8
  124. package/dist/scores/scoreTraces/index.js +3 -3
  125. package/dist/storage/index.cjs +3 -3
  126. package/dist/storage/index.js +1 -1
  127. package/dist/stream/RunOutput.d.ts +72 -0
  128. package/dist/stream/RunOutput.d.ts.map +1 -0
  129. package/dist/stream/aisdk/v5/output.d.ts +2 -2
  130. package/dist/stream/aisdk/v5/output.d.ts.map +1 -1
  131. package/dist/stream/base/base.d.ts +7 -0
  132. package/dist/stream/base/base.d.ts.map +1 -0
  133. package/dist/stream/base/consume-stream.d.ts +5 -0
  134. package/dist/stream/base/consume-stream.d.ts.map +1 -0
  135. package/dist/stream/base/output.d.ts.map +1 -1
  136. package/dist/stream/index.cjs +14 -10
  137. package/dist/stream/index.d.ts +2 -1
  138. package/dist/stream/index.d.ts.map +1 -1
  139. package/dist/stream/index.js +2 -2
  140. package/dist/stream/types.d.ts +1 -1
  141. package/dist/stream/types.d.ts.map +1 -1
  142. package/dist/test-utils/llm-mock.cjs +2 -2
  143. package/dist/test-utils/llm-mock.js +1 -1
  144. package/dist/tools/index.cjs +4 -4
  145. package/dist/tools/index.js +1 -1
  146. package/dist/tools/is-vercel-tool.cjs +2 -2
  147. package/dist/tools/is-vercel-tool.js +1 -1
  148. package/dist/tools/tool-builder/builder.d.ts +75 -2
  149. package/dist/tools/tool-builder/builder.d.ts.map +1 -1
  150. package/dist/tools/tool.d.ts +2 -2
  151. package/dist/tools/tool.d.ts.map +1 -1
  152. package/dist/tools/types.d.ts +17 -12
  153. package/dist/tools/types.d.ts.map +1 -1
  154. package/dist/utils.cjs +17 -17
  155. package/dist/utils.d.ts +1 -0
  156. package/dist/utils.d.ts.map +1 -1
  157. package/dist/utils.js +1 -1
  158. package/dist/workflows/evented/index.cjs +10 -10
  159. package/dist/workflows/evented/index.js +1 -1
  160. package/dist/workflows/evented/workflow.d.ts +5 -3
  161. package/dist/workflows/evented/workflow.d.ts.map +1 -1
  162. package/dist/workflows/index.cjs +12 -12
  163. package/dist/workflows/index.js +1 -1
  164. package/dist/workflows/legacy/index.cjs +22 -22
  165. package/dist/workflows/legacy/index.js +1 -1
  166. package/dist/workflows/workflow.d.ts +30 -23
  167. package/dist/workflows/workflow.d.ts.map +1 -1
  168. package/package.json +12 -10
  169. package/src/llm/model/provider-types.generated.d.ts +585 -597
  170. package/dist/chunk-6OLRLZJ3.js.map +0 -1
  171. package/dist/chunk-BLVB2IJK.js.map +0 -1
  172. package/dist/chunk-LMP5KMU3.js.map +0 -1
  173. package/dist/chunk-MVVMHOAC.cjs.map +0 -1
  174. package/dist/chunk-N3ZSX5OS.js.map +0 -1
  175. package/dist/chunk-NIESGYOH.js.map +0 -1
  176. package/dist/chunk-SE4PA467.cjs.map +0 -1
  177. package/dist/chunk-URQI7RJ3.cjs.map +0 -1
  178. package/dist/chunk-URVM3Y4T.cjs.map +0 -1
  179. package/dist/chunk-WI2YMBNG.cjs.map +0 -1
  180. package/dist/chunk-XBJP7THY.js.map +0 -1
  181. package/dist/chunk-ZMPSVDDO.cjs.map +0 -1
@@ -23,79 +23,13 @@ var path__default = /*#__PURE__*/_interopDefault(path);
23
23
  // src/llm/model/provider-registry.json
24
24
  var provider_registry_default = {
25
25
  providers: {
26
- nvidia: {
27
- url: "https://integrate.api.nvidia.com/v1",
28
- apiKeyEnvVar: "NVIDIA_API_KEY",
29
- apiKeyHeader: "Authorization",
30
- name: "Nvidia",
31
- models: [
32
- "black-forest-labs/flux.1-dev",
33
- "deepseek-ai/deepseek-v3.1",
34
- "deepseek-ai/deepseek-v3.1-terminus",
35
- "google/gemma-3-27b-it",
36
- "microsoft/phi-4-mini-instruct",
37
- "moonshotai/kimi-k2-instruct",
38
- "moonshotai/kimi-k2-instruct-0905",
39
- "nvidia/cosmos-nemotron-34b",
40
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
41
- "nvidia/nemoretriever-ocr-v1",
42
- "nvidia/parakeet-tdt-0.6b-v2",
43
- "openai/gpt-oss-120b",
44
- "openai/whisper-large-v3",
45
- "qwen/qwen3-235b-a22b",
46
- "qwen/qwen3-coder-480b-a35b-instruct"
47
- ],
48
- docUrl: "https://docs.api.nvidia.com/nim/",
49
- gateway: "models.dev"
50
- },
51
- modelscope: {
52
- url: "https://api-inference.modelscope.cn/v1",
53
- apiKeyEnvVar: "MODELSCOPE_API_KEY",
54
- apiKeyHeader: "Authorization",
55
- name: "ModelScope",
56
- models: [
57
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
58
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
59
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
60
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
61
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
62
- "ZhipuAI/GLM-4.5",
63
- "ZhipuAI/GLM-4.6"
64
- ],
65
- docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
66
- gateway: "models.dev"
67
- },
68
- aihubmix: {
69
- url: "https://api.aihubmix.com/v1",
70
- apiKeyEnvVar: "AIHUBMIX_API_KEY",
26
+ "moonshotai-cn": {
27
+ url: "https://api.moonshot.cn/v1",
28
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
71
29
  apiKeyHeader: "Authorization",
72
- name: "AIHubMix",
73
- models: [
74
- "DeepSeek-V3.2-Exp",
75
- "DeepSeek-V3.2-Exp-Think",
76
- "Kimi-K2-0905",
77
- "claude-haiku-4-5",
78
- "claude-opus-4-1",
79
- "claude-sonnet-4-5",
80
- "gemini-2.5-flash",
81
- "gemini-2.5-pro",
82
- "glm-4.6",
83
- "gpt-4.1",
84
- "gpt-4.1-mini",
85
- "gpt-4.1-nano",
86
- "gpt-4o",
87
- "gpt-4o-2024-11-20",
88
- "gpt-5",
89
- "gpt-5-codex",
90
- "gpt-5-mini",
91
- "gpt-5-nano",
92
- "gpt-5-pro",
93
- "o4-mini",
94
- "qwen3-235b-a22b-instruct-2507",
95
- "qwen3-235b-a22b-thinking-2507",
96
- "qwen3-coder-480b-a35b-instruct"
97
- ],
98
- docUrl: "https://aihubmix.com/docs/models",
30
+ name: "Moonshot AI (China)",
31
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
32
+ docUrl: "https://platform.moonshot.cn/docs/api/chat",
99
33
  gateway: "models.dev"
100
34
  },
101
35
  lucidquery: {
@@ -107,6 +41,73 @@ var provider_registry_default = {
107
41
  docUrl: "https://lucidquery.com/api/docs",
108
42
  gateway: "models.dev"
109
43
  },
44
+ moonshotai: {
45
+ url: "https://api.moonshot.ai/v1",
46
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
47
+ apiKeyHeader: "Authorization",
48
+ name: "Moonshot AI",
49
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
50
+ docUrl: "https://platform.moonshot.ai/docs/api/chat",
51
+ gateway: "models.dev"
52
+ },
53
+ "zai-coding-plan": {
54
+ url: "https://api.z.ai/api/coding/paas/v4",
55
+ apiKeyEnvVar: "ZHIPU_API_KEY",
56
+ apiKeyHeader: "Authorization",
57
+ name: "Z.AI Coding Plan",
58
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
59
+ docUrl: "https://docs.z.ai/devpack/overview",
60
+ gateway: "models.dev"
61
+ },
62
+ alibaba: {
63
+ url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
64
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
65
+ apiKeyHeader: "Authorization",
66
+ name: "Alibaba",
67
+ models: [
68
+ "qvq-max",
69
+ "qwen-flash",
70
+ "qwen-max",
71
+ "qwen-mt-plus",
72
+ "qwen-mt-turbo",
73
+ "qwen-omni-turbo",
74
+ "qwen-omni-turbo-realtime",
75
+ "qwen-plus",
76
+ "qwen-plus-character-ja",
77
+ "qwen-turbo",
78
+ "qwen-vl-max",
79
+ "qwen-vl-ocr",
80
+ "qwen-vl-plus",
81
+ "qwen2-5-14b-instruct",
82
+ "qwen2-5-32b-instruct",
83
+ "qwen2-5-72b-instruct",
84
+ "qwen2-5-7b-instruct",
85
+ "qwen2-5-omni-7b",
86
+ "qwen2-5-vl-72b-instruct",
87
+ "qwen2-5-vl-7b-instruct",
88
+ "qwen3-14b",
89
+ "qwen3-235b-a22b",
90
+ "qwen3-32b",
91
+ "qwen3-8b",
92
+ "qwen3-asr-flash",
93
+ "qwen3-coder-30b-a3b-instruct",
94
+ "qwen3-coder-480b-a35b-instruct",
95
+ "qwen3-coder-flash",
96
+ "qwen3-coder-plus",
97
+ "qwen3-livetranslate-flash-realtime",
98
+ "qwen3-max",
99
+ "qwen3-next-80b-a3b-instruct",
100
+ "qwen3-next-80b-a3b-thinking",
101
+ "qwen3-omni-flash",
102
+ "qwen3-omni-flash-realtime",
103
+ "qwen3-vl-235b-a22b",
104
+ "qwen3-vl-30b-a3b",
105
+ "qwen3-vl-plus",
106
+ "qwq-plus"
107
+ ],
108
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
109
+ gateway: "models.dev"
110
+ },
110
111
  xai: {
111
112
  apiKeyEnvVar: "XAI_API_KEY",
112
113
  name: "xAI",
@@ -135,325 +136,94 @@ var provider_registry_default = {
135
136
  docUrl: "https://docs.x.ai/docs/models",
136
137
  gateway: "models.dev"
137
138
  },
138
- deepseek: {
139
- url: "https://api.deepseek.com",
140
- apiKeyEnvVar: "DEEPSEEK_API_KEY",
141
- apiKeyHeader: "Authorization",
142
- name: "DeepSeek",
143
- models: ["deepseek-chat", "deepseek-reasoner"],
144
- docUrl: "https://platform.deepseek.com/api-docs/pricing",
145
- gateway: "models.dev"
146
- },
147
- requesty: {
148
- url: "https://router.requesty.ai/v1",
149
- apiKeyEnvVar: "REQUESTY_API_KEY",
139
+ nvidia: {
140
+ url: "https://integrate.api.nvidia.com/v1",
141
+ apiKeyEnvVar: "NVIDIA_API_KEY",
150
142
  apiKeyHeader: "Authorization",
151
- name: "Requesty",
143
+ name: "Nvidia",
152
144
  models: [
153
- "anthropic/claude-3-7-sonnet",
154
- "anthropic/claude-4-sonnet-20250522",
155
- "anthropic/claude-opus-4",
156
- "anthropic/claude-opus-4-1-20250805",
157
- "google/gemini-2.5-flash",
158
- "google/gemini-2.5-pro",
159
- "openai/gpt-4.1",
160
- "openai/gpt-4.1-mini",
161
- "openai/gpt-4o-mini",
162
- "openai/gpt-5",
163
- "openai/gpt-5-mini",
164
- "openai/gpt-5-nano",
165
- "openai/o4-mini"
145
+ "black-forest-labs/flux.1-dev",
146
+ "deepseek-ai/deepseek-v3.1",
147
+ "deepseek-ai/deepseek-v3.1-terminus",
148
+ "google/gemma-3-27b-it",
149
+ "microsoft/phi-4-mini-instruct",
150
+ "moonshotai/kimi-k2-instruct",
151
+ "moonshotai/kimi-k2-instruct-0905",
152
+ "nvidia/cosmos-nemotron-34b",
153
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
154
+ "nvidia/nemoretriever-ocr-v1",
155
+ "nvidia/parakeet-tdt-0.6b-v2",
156
+ "openai/gpt-oss-120b",
157
+ "openai/whisper-large-v3",
158
+ "qwen/qwen3-235b-a22b",
159
+ "qwen/qwen3-coder-480b-a35b-instruct"
166
160
  ],
167
- docUrl: "https://requesty.ai/solution/llm-routing/models",
161
+ docUrl: "https://docs.api.nvidia.com/nim/",
168
162
  gateway: "models.dev"
169
163
  },
170
- nebius: {
171
- url: "https://api.studio.nebius.com/v1/",
172
- apiKeyEnvVar: "NEBIUS_API_KEY",
164
+ upstage: {
165
+ url: "https://api.upstage.ai",
166
+ apiKeyEnvVar: "UPSTAGE_API_KEY",
173
167
  apiKeyHeader: "Authorization",
174
- name: "Nebius AI Studio",
175
- models: [
176
- "NousResearch/hermes-4-405b",
177
- "NousResearch/hermes-4-70b",
178
- "deepseek-ai/deepseek-v3",
179
- "meta-llama/llama-3.3-70b-instruct-base",
180
- "meta-llama/llama-3.3-70b-instruct-fast",
181
- "meta-llama/llama-3_1-405b-instruct",
182
- "moonshotai/kimi-k2-instruct",
183
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
184
- "openai/gpt-oss-120b",
185
- "openai/gpt-oss-20b",
186
- "qwen/qwen3-235b-a22b-instruct-2507",
187
- "qwen/qwen3-235b-a22b-thinking-2507",
188
- "qwen/qwen3-coder-480b-a35b-instruct",
189
- "zai-org/glm-4.5",
190
- "zai-org/glm-4.5-air"
191
- ],
192
- docUrl: "https://docs.studio.nebius.com/quickstart",
168
+ name: "Upstage",
169
+ models: ["solar-mini", "solar-pro2"],
170
+ docUrl: "https://developers.upstage.ai/docs/apis/chat",
193
171
  gateway: "models.dev"
194
172
  },
195
- fastrouter: {
196
- url: "https://go.fastrouter.ai/api/v1",
197
- apiKeyEnvVar: "FASTROUTER_API_KEY",
173
+ groq: {
174
+ url: "https://api.groq.com/openai/v1",
175
+ apiKeyEnvVar: "GROQ_API_KEY",
198
176
  apiKeyHeader: "Authorization",
199
- name: "FastRouter",
177
+ name: "Groq",
200
178
  models: [
201
- "anthropic/claude-opus-4.1",
202
- "anthropic/claude-sonnet-4",
203
- "deepseek-ai/deepseek-r1-distill-llama-70b",
204
- "google/gemini-2.5-flash",
205
- "google/gemini-2.5-pro",
206
- "moonshotai/kimi-k2",
207
- "openai/gpt-4.1",
208
- "openai/gpt-5",
209
- "openai/gpt-5-mini",
210
- "openai/gpt-5-nano",
179
+ "deepseek-r1-distill-llama-70b",
180
+ "gemma2-9b-it",
181
+ "llama-3.1-8b-instant",
182
+ "llama-3.3-70b-versatile",
183
+ "llama-guard-3-8b",
184
+ "llama3-70b-8192",
185
+ "llama3-8b-8192",
186
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
187
+ "meta-llama/llama-4-scout-17b-16e-instruct",
188
+ "meta-llama/llama-guard-4-12b",
189
+ "mistral-saba-24b",
190
+ "moonshotai/kimi-k2-instruct",
191
+ "moonshotai/kimi-k2-instruct-0905",
211
192
  "openai/gpt-oss-120b",
212
193
  "openai/gpt-oss-20b",
213
- "qwen/qwen3-coder",
214
- "x-ai/grok-4"
194
+ "qwen-qwq-32b",
195
+ "qwen/qwen3-32b"
215
196
  ],
216
- docUrl: "https://fastrouter.ai/models",
197
+ docUrl: "https://console.groq.com/docs/models",
217
198
  gateway: "models.dev"
218
199
  },
219
- perplexity: {
220
- url: "https://api.perplexity.ai",
221
- apiKeyEnvVar: "PERPLEXITY_API_KEY",
200
+ mistral: {
201
+ url: "https://api.mistral.ai/v1",
202
+ apiKeyEnvVar: "MISTRAL_API_KEY",
222
203
  apiKeyHeader: "Authorization",
223
- name: "Perplexity",
224
- models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
225
- docUrl: "https://docs.perplexity.ai",
226
- gateway: "models.dev"
227
- },
228
- morph: {
229
- url: "https://api.morphllm.com/v1",
230
- apiKeyEnvVar: "MORPH_API_KEY",
231
- apiKeyHeader: "Authorization",
232
- name: "Morph",
233
- models: ["auto", "morph-v3-fast", "morph-v3-large"],
234
- docUrl: "https://docs.morphllm.com/api-reference/introduction",
235
- gateway: "models.dev"
236
- },
237
- "zai-coding-plan": {
238
- url: "https://api.z.ai/api/coding/paas/v4",
239
- apiKeyEnvVar: "ZHIPU_API_KEY",
240
- apiKeyHeader: "Authorization",
241
- name: "Z.AI Coding Plan",
242
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
243
- docUrl: "https://docs.z.ai/devpack/overview",
244
- gateway: "models.dev"
245
- },
246
- huggingface: {
247
- url: "https://router.huggingface.co/v1",
248
- apiKeyEnvVar: "HF_TOKEN",
249
- apiKeyHeader: "Authorization",
250
- name: "Hugging Face",
251
- models: [
252
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
253
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
254
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
255
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
256
- "deepseek-ai/DeepSeek-R1-0528",
257
- "deepseek-ai/Deepseek-V3-0324",
258
- "moonshotai/Kimi-K2-Instruct",
259
- "moonshotai/Kimi-K2-Instruct-0905",
260
- "zai-org/GLM-4.5",
261
- "zai-org/GLM-4.5-Air",
262
- "zai-org/GLM-4.6"
263
- ],
264
- docUrl: "https://huggingface.co/docs/inference-providers",
265
- gateway: "models.dev"
266
- },
267
- openrouter: {
268
- url: "https://openrouter.ai/api/v1",
269
- apiKeyEnvVar: "OPENROUTER_API_KEY",
270
- name: "OpenRouter",
271
- models: [
272
- "anthropic/claude-3.5-haiku",
273
- "anthropic/claude-3.7-sonnet",
274
- "anthropic/claude-haiku-4.5",
275
- "anthropic/claude-opus-4",
276
- "anthropic/claude-opus-4.1",
277
- "anthropic/claude-sonnet-4",
278
- "anthropic/claude-sonnet-4.5",
279
- "cognitivecomputations/dolphin3.0-mistral-24b",
280
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
281
- "deepseek/deepseek-chat-v3-0324",
282
- "deepseek/deepseek-chat-v3.1",
283
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
284
- "deepseek/deepseek-r1-0528:free",
285
- "deepseek/deepseek-r1-distill-llama-70b",
286
- "deepseek/deepseek-r1-distill-qwen-14b",
287
- "deepseek/deepseek-r1:free",
288
- "deepseek/deepseek-v3-base:free",
289
- "deepseek/deepseek-v3.1-terminus",
290
- "featherless/qwerky-72b",
291
- "google/gemini-2.0-flash-001",
292
- "google/gemini-2.0-flash-exp:free",
293
- "google/gemini-2.5-flash",
294
- "google/gemini-2.5-flash-lite",
295
- "google/gemini-2.5-flash-lite-preview-09-2025",
296
- "google/gemini-2.5-flash-preview-09-2025",
297
- "google/gemini-2.5-pro",
298
- "google/gemini-2.5-pro-preview-05-06",
299
- "google/gemini-2.5-pro-preview-06-05",
300
- "google/gemma-2-9b-it:free",
301
- "google/gemma-3-12b-it",
302
- "google/gemma-3-27b-it",
303
- "google/gemma-3n-e4b-it",
304
- "google/gemma-3n-e4b-it:free",
305
- "meta-llama/llama-3.2-11b-vision-instruct",
306
- "meta-llama/llama-3.3-70b-instruct:free",
307
- "meta-llama/llama-4-scout:free",
308
- "microsoft/mai-ds-r1:free",
309
- "mistralai/codestral-2508",
310
- "mistralai/devstral-medium-2507",
311
- "mistralai/devstral-small-2505",
312
- "mistralai/devstral-small-2505:free",
313
- "mistralai/devstral-small-2507",
314
- "mistralai/mistral-7b-instruct:free",
315
- "mistralai/mistral-medium-3",
316
- "mistralai/mistral-medium-3.1",
317
- "mistralai/mistral-nemo:free",
318
- "mistralai/mistral-small-3.1-24b-instruct",
319
- "mistralai/mistral-small-3.2-24b-instruct",
320
- "mistralai/mistral-small-3.2-24b-instruct:free",
321
- "moonshotai/kimi-dev-72b:free",
322
- "moonshotai/kimi-k2",
323
- "moonshotai/kimi-k2-0905",
324
- "moonshotai/kimi-k2:free",
325
- "nousresearch/deephermes-3-llama-3-8b-preview",
326
- "nousresearch/hermes-4-405b",
327
- "nousresearch/hermes-4-70b",
328
- "openai/gpt-4.1",
329
- "openai/gpt-4.1-mini",
330
- "openai/gpt-4o-mini",
331
- "openai/gpt-5",
332
- "openai/gpt-5-chat",
333
- "openai/gpt-5-codex",
334
- "openai/gpt-5-image",
335
- "openai/gpt-5-mini",
336
- "openai/gpt-5-nano",
337
- "openai/gpt-oss-120b",
338
- "openai/gpt-oss-20b",
339
- "openai/o4-mini",
340
- "openrouter/cypher-alpha:free",
341
- "openrouter/horizon-alpha",
342
- "openrouter/horizon-beta",
343
- "openrouter/sonoma-dusk-alpha",
344
- "openrouter/sonoma-sky-alpha",
345
- "qwen/qwen-2.5-coder-32b-instruct",
346
- "qwen/qwen2.5-vl-32b-instruct:free",
347
- "qwen/qwen2.5-vl-72b-instruct",
348
- "qwen/qwen2.5-vl-72b-instruct:free",
349
- "qwen/qwen3-14b:free",
350
- "qwen/qwen3-235b-a22b-07-25",
351
- "qwen/qwen3-235b-a22b-07-25:free",
352
- "qwen/qwen3-235b-a22b-thinking-2507",
353
- "qwen/qwen3-235b-a22b:free",
354
- "qwen/qwen3-30b-a3b-instruct-2507",
355
- "qwen/qwen3-30b-a3b-thinking-2507",
356
- "qwen/qwen3-30b-a3b:free",
357
- "qwen/qwen3-32b:free",
358
- "qwen/qwen3-8b:free",
359
- "qwen/qwen3-coder",
360
- "qwen/qwen3-coder:free",
361
- "qwen/qwen3-max",
362
- "qwen/qwen3-next-80b-a3b-instruct",
363
- "qwen/qwen3-next-80b-a3b-thinking",
364
- "qwen/qwq-32b:free",
365
- "rekaai/reka-flash-3",
366
- "sarvamai/sarvam-m:free",
367
- "thudm/glm-z1-32b:free",
368
- "tngtech/deepseek-r1t2-chimera:free",
369
- "x-ai/grok-3",
370
- "x-ai/grok-3-beta",
371
- "x-ai/grok-3-mini",
372
- "x-ai/grok-3-mini-beta",
373
- "x-ai/grok-4",
374
- "x-ai/grok-4-fast",
375
- "x-ai/grok-4-fast:free",
376
- "x-ai/grok-code-fast-1",
377
- "z-ai/glm-4.5",
378
- "z-ai/glm-4.5-air",
379
- "z-ai/glm-4.5-air:free",
380
- "z-ai/glm-4.5v",
381
- "z-ai/glm-4.6"
382
- ],
383
- docUrl: "https://openrouter.ai/models",
384
- gateway: "models.dev"
385
- },
386
- cerebras: {
387
- url: "https://api.cerebras.ai/v1",
388
- apiKeyEnvVar: "CEREBRAS_API_KEY",
389
- apiKeyHeader: "Authorization",
390
- name: "Cerebras",
391
- models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
392
- docUrl: "https://inference-docs.cerebras.ai/models/overview",
393
- gateway: "models.dev"
394
- },
395
- zhipuai: {
396
- url: "https://open.bigmodel.cn/api/paas/v4",
397
- apiKeyEnvVar: "ZHIPU_API_KEY",
398
- apiKeyHeader: "Authorization",
399
- name: "Zhipu AI",
400
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
401
- docUrl: "https://docs.z.ai/guides/overview/pricing",
402
- gateway: "models.dev"
403
- },
404
- togetherai: {
405
- url: "https://api.together.xyz/v1",
406
- apiKeyEnvVar: "TOGETHER_API_KEY",
407
- apiKeyHeader: "Authorization",
408
- name: "Together AI",
409
- models: [
410
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
411
- "deepseek-ai/DeepSeek-R1",
412
- "deepseek-ai/DeepSeek-V3",
413
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
414
- "moonshotai/Kimi-K2-Instruct",
415
- "openai/gpt-oss-120b"
416
- ],
417
- docUrl: "https://docs.together.ai/docs/serverless-models",
418
- gateway: "models.dev"
419
- },
420
- wandb: {
421
- url: "https://api.inference.wandb.ai/v1",
422
- apiKeyEnvVar: "WANDB_API_KEY",
423
- apiKeyHeader: "Authorization",
424
- name: "Weights & Biases",
425
- models: [
426
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
427
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
428
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
429
- "deepseek-ai/DeepSeek-R1-0528",
430
- "deepseek-ai/DeepSeek-V3-0324",
431
- "meta-llama/Llama-3.1-8B-Instruct",
432
- "meta-llama/Llama-3.3-70B-Instruct",
433
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
434
- "microsoft/Phi-4-mini-instruct",
435
- "moonshotai/Kimi-K2-Instruct"
436
- ],
437
- docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
438
- gateway: "models.dev"
439
- },
440
- submodel: {
441
- url: "https://llm.submodel.ai/v1",
442
- apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
443
- apiKeyHeader: "Authorization",
444
- name: "submodel",
204
+ name: "Mistral",
445
205
  models: [
446
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
447
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
448
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
449
- "deepseek-ai/DeepSeek-R1-0528",
450
- "deepseek-ai/DeepSeek-V3-0324",
451
- "deepseek-ai/DeepSeek-V3.1",
452
- "openai/gpt-oss-120b",
453
- "zai-org/GLM-4.5-Air",
454
- "zai-org/GLM-4.5-FP8"
206
+ "codestral-latest",
207
+ "devstral-medium-2507",
208
+ "devstral-small-2505",
209
+ "devstral-small-2507",
210
+ "magistral-medium-latest",
211
+ "magistral-small",
212
+ "ministral-3b-latest",
213
+ "ministral-8b-latest",
214
+ "mistral-large-latest",
215
+ "mistral-medium-2505",
216
+ "mistral-medium-2508",
217
+ "mistral-medium-latest",
218
+ "mistral-nemo",
219
+ "mistral-small-latest",
220
+ "open-mistral-7b",
221
+ "open-mixtral-8x22b",
222
+ "open-mixtral-8x7b",
223
+ "pixtral-12b",
224
+ "pixtral-large-latest"
455
225
  ],
456
- docUrl: "https://submodel.gitbook.io",
226
+ docUrl: "https://docs.mistral.ai/getting-started/models/",
457
227
  gateway: "models.dev"
458
228
  },
459
229
  vercel: {
@@ -550,102 +320,196 @@ var provider_registry_default = {
550
320
  docUrl: "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
551
321
  gateway: "models.dev"
552
322
  },
553
- synthetic: {
554
- url: "https://api.synthetic.new/v1",
555
- apiKeyEnvVar: "SYNTHETIC_API_KEY",
323
+ nebius: {
324
+ url: "https://api.studio.nebius.com/v1/",
325
+ apiKeyEnvVar: "NEBIUS_API_KEY",
556
326
  apiKeyHeader: "Authorization",
557
- name: "Synthetic",
327
+ name: "Nebius AI Studio",
558
328
  models: [
559
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
560
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
561
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
562
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
563
- "hf:deepseek-ai/DeepSeek-R1",
564
- "hf:deepseek-ai/DeepSeek-R1-0528",
565
- "hf:deepseek-ai/DeepSeek-V3",
566
- "hf:deepseek-ai/DeepSeek-V3-0324",
567
- "hf:deepseek-ai/DeepSeek-V3.1",
568
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
569
- "hf:meta-llama/Llama-3.1-405B-Instruct",
570
- "hf:meta-llama/Llama-3.1-70B-Instruct",
571
- "hf:meta-llama/Llama-3.1-8B-Instruct",
572
- "hf:meta-llama/Llama-3.3-70B-Instruct",
573
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
574
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
575
- "hf:moonshotai/Kimi-K2-Instruct",
576
- "hf:moonshotai/Kimi-K2-Instruct-0905",
577
- "hf:openai/gpt-oss-120b",
578
- "hf:zai-org/GLM-4.5",
579
- "hf:zai-org/GLM-4.6"
329
+ "NousResearch/hermes-4-405b",
330
+ "NousResearch/hermes-4-70b",
331
+ "deepseek-ai/deepseek-v3",
332
+ "meta-llama/llama-3.3-70b-instruct-base",
333
+ "meta-llama/llama-3.3-70b-instruct-fast",
334
+ "meta-llama/llama-3_1-405b-instruct",
335
+ "moonshotai/kimi-k2-instruct",
336
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
337
+ "openai/gpt-oss-120b",
338
+ "openai/gpt-oss-20b",
339
+ "qwen/qwen3-235b-a22b-instruct-2507",
340
+ "qwen/qwen3-235b-a22b-thinking-2507",
341
+ "qwen/qwen3-coder-480b-a35b-instruct",
342
+ "zai-org/glm-4.5",
343
+ "zai-org/glm-4.5-air"
580
344
  ],
581
- docUrl: "https://synthetic.new/pricing",
345
+ docUrl: "https://docs.studio.nebius.com/quickstart",
582
346
  gateway: "models.dev"
583
347
  },
584
- google: {
585
- apiKeyEnvVar: "GOOGLE_GENERATIVE_AI_API_KEY",
586
- name: "Google",
348
+ deepseek: {
349
+ url: "https://api.deepseek.com",
350
+ apiKeyEnvVar: "DEEPSEEK_API_KEY",
351
+ apiKeyHeader: "Authorization",
352
+ name: "DeepSeek",
353
+ models: ["deepseek-chat", "deepseek-reasoner"],
354
+ docUrl: "https://platform.deepseek.com/api-docs/pricing",
355
+ gateway: "models.dev"
356
+ },
357
+ "alibaba-cn": {
358
+ url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
359
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
360
+ apiKeyHeader: "Authorization",
361
+ name: "Alibaba (China)",
587
362
  models: [
588
- "gemini-1.5-flash",
589
- "gemini-1.5-flash-8b",
590
- "gemini-1.5-pro",
591
- "gemini-2.0-flash",
592
- "gemini-2.0-flash-lite",
593
- "gemini-2.5-flash",
594
- "gemini-2.5-flash-image",
595
- "gemini-2.5-flash-image-preview",
596
- "gemini-2.5-flash-lite",
597
- "gemini-2.5-flash-lite-preview-06-17",
598
- "gemini-2.5-flash-lite-preview-09-2025",
599
- "gemini-2.5-flash-preview-04-17",
600
- "gemini-2.5-flash-preview-05-20",
601
- "gemini-2.5-flash-preview-09-2025",
602
- "gemini-2.5-flash-preview-tts",
603
- "gemini-2.5-pro",
604
- "gemini-2.5-pro-preview-05-06",
605
- "gemini-2.5-pro-preview-06-05",
606
- "gemini-2.5-pro-preview-tts",
607
- "gemini-flash-latest",
608
- "gemini-flash-lite-latest",
609
- "gemini-live-2.5-flash",
610
- "gemini-live-2.5-flash-preview-native-audio"
363
+ "deepseek-r1",
364
+ "deepseek-r1-0528",
365
+ "deepseek-r1-distill-llama-70b",
366
+ "deepseek-r1-distill-llama-8b",
367
+ "deepseek-r1-distill-qwen-1-5b",
368
+ "deepseek-r1-distill-qwen-14b",
369
+ "deepseek-r1-distill-qwen-32b",
370
+ "deepseek-r1-distill-qwen-7b",
371
+ "deepseek-v3",
372
+ "deepseek-v3-1",
373
+ "deepseek-v3-2-exp",
374
+ "moonshot-kimi-k2-instruct",
375
+ "qvq-max",
376
+ "qwen-deep-research",
377
+ "qwen-doc-turbo",
378
+ "qwen-flash",
379
+ "qwen-long",
380
+ "qwen-math-plus",
381
+ "qwen-math-turbo",
382
+ "qwen-max",
383
+ "qwen-mt-plus",
384
+ "qwen-mt-turbo",
385
+ "qwen-omni-turbo",
386
+ "qwen-omni-turbo-realtime",
387
+ "qwen-plus",
388
+ "qwen-plus-character",
389
+ "qwen-turbo",
390
+ "qwen-vl-max",
391
+ "qwen-vl-ocr",
392
+ "qwen-vl-plus",
393
+ "qwen2-5-14b-instruct",
394
+ "qwen2-5-32b-instruct",
395
+ "qwen2-5-72b-instruct",
396
+ "qwen2-5-7b-instruct",
397
+ "qwen2-5-coder-32b-instruct",
398
+ "qwen2-5-coder-7b-instruct",
399
+ "qwen2-5-math-72b-instruct",
400
+ "qwen2-5-math-7b-instruct",
401
+ "qwen2-5-omni-7b",
402
+ "qwen2-5-vl-72b-instruct",
403
+ "qwen2-5-vl-7b-instruct",
404
+ "qwen3-14b",
405
+ "qwen3-235b-a22b",
406
+ "qwen3-32b",
407
+ "qwen3-8b",
408
+ "qwen3-asr-flash",
409
+ "qwen3-coder-30b-a3b-instruct",
410
+ "qwen3-coder-480b-a35b-instruct",
411
+ "qwen3-coder-flash",
412
+ "qwen3-coder-plus",
413
+ "qwen3-max",
414
+ "qwen3-next-80b-a3b-instruct",
415
+ "qwen3-next-80b-a3b-thinking",
416
+ "qwen3-omni-flash",
417
+ "qwen3-omni-flash-realtime",
418
+ "qwen3-vl-235b-a22b",
419
+ "qwen3-vl-30b-a3b",
420
+ "qwen3-vl-plus",
421
+ "qwq-32b",
422
+ "qwq-plus",
423
+ "tongyi-intent-detect-v3"
611
424
  ],
612
- docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
425
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
613
426
  gateway: "models.dev"
614
427
  },
615
- groq: {
616
- url: "https://api.groq.com/openai/v1",
617
- apiKeyEnvVar: "GROQ_API_KEY",
428
+ venice: {
429
+ url: "https://api.venice.ai/api/v1",
430
+ apiKeyEnvVar: "VENICE_API_KEY",
618
431
  apiKeyHeader: "Authorization",
619
- name: "Groq",
432
+ name: "Venice AI",
620
433
  models: [
621
- "deepseek-r1-distill-llama-70b",
622
- "gemma2-9b-it",
623
- "llama-3.1-8b-instant",
624
- "llama-3.3-70b-versatile",
625
- "llama-guard-3-8b",
626
- "llama3-70b-8192",
627
- "llama3-8b-8192",
628
- "meta-llama/llama-4-maverick-17b-128e-instruct",
629
- "meta-llama/llama-4-scout-17b-16e-instruct",
630
- "meta-llama/llama-guard-4-12b",
631
- "mistral-saba-24b",
632
- "moonshotai/kimi-k2-instruct",
633
- "moonshotai/kimi-k2-instruct-0905",
434
+ "deepseek-coder-v2-lite",
435
+ "deepseek-r1-671b",
436
+ "dolphin-2.9.2-qwen2-72b",
437
+ "llama-3.1-405b",
438
+ "llama-3.2-3b",
439
+ "llama-3.3-70b",
440
+ "mistral-31-24b",
441
+ "qwen-2.5-coder-32b",
442
+ "qwen-2.5-qwq-32b",
443
+ "qwen-2.5-vl",
444
+ "qwen3-235b",
445
+ "qwen3-4b",
446
+ "venice-uncensored"
447
+ ],
448
+ docUrl: "https://docs.venice.ai",
449
+ gateway: "models.dev"
450
+ },
451
+ chutes: {
452
+ url: "https://llm.chutes.ai/v1",
453
+ apiKeyEnvVar: "CHUTES_API_KEY",
454
+ apiKeyHeader: "Authorization",
455
+ name: "Chutes",
456
+ models: [
457
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
458
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
459
+ "Qwen/Qwen3-30B-A3B",
460
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
461
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
462
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
463
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
464
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
465
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
466
+ "chutesai/Devstral-Small-2505",
467
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
468
+ "deepseek-ai/DeepSeek-R1-0528",
469
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
470
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
471
+ "deepseek-ai/DeepSeek-V3-0324",
472
+ "deepseek-ai/DeepSeek-V3.1",
473
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
474
+ "deepseek-ai/DeepSeek-V3.1-turbo",
475
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
476
+ "deepseek-ai/DeepSeek-V3.2-Exp",
477
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
478
+ "moonshotai/Kimi-Dev-72B",
479
+ "moonshotai/Kimi-K2-Instruct-0905",
480
+ "moonshotai/Kimi-K2-Instruct-75k",
481
+ "moonshotai/Kimi-VL-A3B-Thinking",
634
482
  "openai/gpt-oss-120b",
635
- "openai/gpt-oss-20b",
636
- "qwen-qwq-32b",
637
- "qwen/qwen3-32b"
483
+ "tngtech/DeepSeek-R1T-Chimera",
484
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
485
+ "zai-org/GLM-4.5-Air",
486
+ "zai-org/GLM-4.5-FP8",
487
+ "zai-org/GLM-4.5-turbo",
488
+ "zai-org/GLM-4.6-FP8",
489
+ "zai-org/GLM-4.6-turbo"
638
490
  ],
639
- docUrl: "https://console.groq.com/docs/models",
491
+ docUrl: "https://llm.chutes.ai/v1/models",
640
492
  gateway: "models.dev"
641
493
  },
642
- "moonshotai-cn": {
643
- url: "https://api.moonshot.cn/v1",
644
- apiKeyEnvVar: "MOONSHOT_API_KEY",
494
+ cortecs: {
495
+ url: "https://api.cortecs.ai/v1",
496
+ apiKeyEnvVar: "CORTECS_API_KEY",
645
497
  apiKeyHeader: "Authorization",
646
- name: "Moonshot AI (China)",
647
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
648
- docUrl: "https://platform.moonshot.cn/docs/api/chat",
498
+ name: "Cortecs",
499
+ models: [
500
+ "claude-4-5-sonnet",
501
+ "claude-sonnet-4",
502
+ "deepseek-v3-0324",
503
+ "gemini-2.5-pro",
504
+ "gpt-4.1",
505
+ "gpt-oss-120b",
506
+ "kimi-k2-instruct",
507
+ "llama-3.1-405b-instruct",
508
+ "nova-pro-v1",
509
+ "qwen3-32b",
510
+ "qwen3-coder-480b-a35b-instruct"
511
+ ],
512
+ docUrl: "https://api.cortecs.ai/v1/models",
649
513
  gateway: "models.dev"
650
514
  },
651
515
  "github-models": {
@@ -713,47 +577,50 @@ var provider_registry_default = {
713
577
  docUrl: "https://docs.github.com/en/github-models",
714
578
  gateway: "models.dev"
715
579
  },
716
- deepinfra: {
717
- url: "https://api.deepinfra.com/v1/openai",
718
- apiKeyEnvVar: "DEEPINFRA_API_KEY",
580
+ togetherai: {
581
+ url: "https://api.together.xyz/v1",
582
+ apiKeyEnvVar: "TOGETHER_API_KEY",
719
583
  apiKeyHeader: "Authorization",
720
- name: "Deep Infra",
584
+ name: "Together AI",
721
585
  models: [
722
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
723
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
586
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
587
+ "deepseek-ai/DeepSeek-R1",
588
+ "deepseek-ai/DeepSeek-V3",
589
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
724
590
  "moonshotai/Kimi-K2-Instruct",
725
- "zai-org/GLM-4.5"
591
+ "openai/gpt-oss-120b"
726
592
  ],
727
- docUrl: "https://deepinfra.com/models",
593
+ docUrl: "https://docs.together.ai/docs/serverless-models",
728
594
  gateway: "models.dev"
729
595
  },
730
- "fireworks-ai": {
731
- url: "https://api.fireworks.ai/inference/v1/",
732
- apiKeyEnvVar: "FIREWORKS_API_KEY",
596
+ baseten: {
597
+ url: "https://inference.baseten.co/v1",
598
+ apiKeyEnvVar: "BASETEN_API_KEY",
733
599
  apiKeyHeader: "Authorization",
734
- name: "Fireworks AI",
735
- models: [
736
- "accounts/fireworks/models/deepseek-r1-0528",
737
- "accounts/fireworks/models/deepseek-v3-0324",
738
- "accounts/fireworks/models/deepseek-v3p1",
739
- "accounts/fireworks/models/glm-4p5",
740
- "accounts/fireworks/models/glm-4p5-air",
741
- "accounts/fireworks/models/gpt-oss-120b",
742
- "accounts/fireworks/models/gpt-oss-20b",
743
- "accounts/fireworks/models/kimi-k2-instruct",
744
- "accounts/fireworks/models/qwen3-235b-a22b",
745
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
746
- ],
747
- docUrl: "https://fireworks.ai/docs/",
600
+ name: "Baseten",
601
+ models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
602
+ docUrl: "https://docs.baseten.co/development/model-apis/overview",
748
603
  gateway: "models.dev"
749
604
  },
750
- zai: {
751
- url: "https://api.z.ai/api/paas/v4",
752
- apiKeyEnvVar: "ZHIPU_API_KEY",
605
+ huggingface: {
606
+ url: "https://router.huggingface.co/v1",
607
+ apiKeyEnvVar: "HF_TOKEN",
753
608
  apiKeyHeader: "Authorization",
754
- name: "Z.AI",
755
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
756
- docUrl: "https://docs.z.ai/guides/overview/pricing",
609
+ name: "Hugging Face",
610
+ models: [
611
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
612
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
613
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
614
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
615
+ "deepseek-ai/DeepSeek-R1-0528",
616
+ "deepseek-ai/Deepseek-V3-0324",
617
+ "moonshotai/Kimi-K2-Instruct",
618
+ "moonshotai/Kimi-K2-Instruct-0905",
619
+ "zai-org/GLM-4.5",
620
+ "zai-org/GLM-4.5-Air",
621
+ "zai-org/GLM-4.6"
622
+ ],
623
+ docUrl: "https://huggingface.co/docs/inference-providers",
757
624
  gateway: "models.dev"
758
625
  },
759
626
  opencode: {
@@ -780,13 +647,59 @@ var provider_registry_default = {
780
647
  docUrl: "https://opencode.ai/docs/zen",
781
648
  gateway: "models.dev"
782
649
  },
783
- "zhipuai-coding-plan": {
784
- url: "https://open.bigmodel.cn/api/coding/paas/v4",
785
- apiKeyEnvVar: "ZHIPU_API_KEY",
650
+ fastrouter: {
651
+ url: "https://go.fastrouter.ai/api/v1",
652
+ apiKeyEnvVar: "FASTROUTER_API_KEY",
786
653
  apiKeyHeader: "Authorization",
787
- name: "Zhipu AI Coding Plan",
788
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
789
- docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
654
+ name: "FastRouter",
655
+ models: [
656
+ "anthropic/claude-opus-4.1",
657
+ "anthropic/claude-sonnet-4",
658
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
659
+ "google/gemini-2.5-flash",
660
+ "google/gemini-2.5-pro",
661
+ "moonshotai/kimi-k2",
662
+ "openai/gpt-4.1",
663
+ "openai/gpt-5",
664
+ "openai/gpt-5-mini",
665
+ "openai/gpt-5-nano",
666
+ "openai/gpt-oss-120b",
667
+ "openai/gpt-oss-20b",
668
+ "qwen/qwen3-coder",
669
+ "x-ai/grok-4"
670
+ ],
671
+ docUrl: "https://fastrouter.ai/models",
672
+ gateway: "models.dev"
673
+ },
674
+ google: {
675
+ apiKeyEnvVar: "GOOGLE_GENERATIVE_AI_API_KEY",
676
+ name: "Google",
677
+ models: [
678
+ "gemini-1.5-flash",
679
+ "gemini-1.5-flash-8b",
680
+ "gemini-1.5-pro",
681
+ "gemini-2.0-flash",
682
+ "gemini-2.0-flash-lite",
683
+ "gemini-2.5-flash",
684
+ "gemini-2.5-flash-image",
685
+ "gemini-2.5-flash-image-preview",
686
+ "gemini-2.5-flash-lite",
687
+ "gemini-2.5-flash-lite-preview-06-17",
688
+ "gemini-2.5-flash-lite-preview-09-2025",
689
+ "gemini-2.5-flash-preview-04-17",
690
+ "gemini-2.5-flash-preview-05-20",
691
+ "gemini-2.5-flash-preview-09-2025",
692
+ "gemini-2.5-flash-preview-tts",
693
+ "gemini-2.5-pro",
694
+ "gemini-2.5-pro-preview-05-06",
695
+ "gemini-2.5-pro-preview-06-05",
696
+ "gemini-2.5-pro-preview-tts",
697
+ "gemini-flash-latest",
698
+ "gemini-flash-lite-latest",
699
+ "gemini-live-2.5-flash",
700
+ "gemini-live-2.5-flash-preview-native-audio"
701
+ ],
702
+ docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
790
703
  gateway: "models.dev"
791
704
  },
792
705
  inception: {
@@ -798,30 +711,24 @@ var provider_registry_default = {
798
711
  docUrl: "https://platform.inceptionlabs.ai/docs",
799
712
  gateway: "models.dev"
800
713
  },
801
- llama: {
802
- url: "https://api.llama.com/compat/v1/",
803
- apiKeyEnvVar: "LLAMA_API_KEY",
714
+ wandb: {
715
+ url: "https://api.inference.wandb.ai/v1",
716
+ apiKeyEnvVar: "WANDB_API_KEY",
804
717
  apiKeyHeader: "Authorization",
805
- name: "Llama",
718
+ name: "Weights & Biases",
806
719
  models: [
807
- "cerebras-llama-4-maverick-17b-128e-instruct",
808
- "cerebras-llama-4-scout-17b-16e-instruct",
809
- "groq-llama-4-maverick-17b-128e-instruct",
810
- "llama-3.3-70b-instruct",
811
- "llama-3.3-8b-instruct",
812
- "llama-4-maverick-17b-128e-instruct-fp8",
813
- "llama-4-scout-17b-16e-instruct-fp8"
720
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
721
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
722
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
723
+ "deepseek-ai/DeepSeek-R1-0528",
724
+ "deepseek-ai/DeepSeek-V3-0324",
725
+ "meta-llama/Llama-3.1-8B-Instruct",
726
+ "meta-llama/Llama-3.3-70B-Instruct",
727
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
728
+ "microsoft/Phi-4-mini-instruct",
729
+ "moonshotai/Kimi-K2-Instruct"
814
730
  ],
815
- docUrl: "https://llama.developer.meta.com/docs/models",
816
- gateway: "models.dev"
817
- },
818
- lmstudio: {
819
- url: "http://127.0.0.1:1234/v1",
820
- apiKeyEnvVar: "LMSTUDIO_API_KEY",
821
- apiKeyHeader: "Authorization",
822
- name: "LMStudio",
823
- models: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
824
- docUrl: "https://lmstudio.ai/models",
731
+ docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
825
732
  gateway: "models.dev"
826
733
  },
827
734
  openai: {
@@ -859,313 +766,394 @@ var provider_registry_default = {
859
766
  docUrl: "https://platform.openai.com/docs/models",
860
767
  gateway: "models.dev"
861
768
  },
862
- anthropic: {
863
- apiKeyEnvVar: "ANTHROPIC_API_KEY",
864
- name: "Anthropic",
865
- models: [
866
- "claude-3-5-haiku-20241022",
867
- "claude-3-5-haiku-latest",
868
- "claude-3-5-sonnet-20240620",
869
- "claude-3-5-sonnet-20241022",
870
- "claude-3-7-sonnet-20250219",
871
- "claude-3-7-sonnet-latest",
872
- "claude-3-haiku-20240307",
873
- "claude-3-opus-20240229",
874
- "claude-3-sonnet-20240229",
875
- "claude-haiku-4-5",
876
- "claude-haiku-4-5-20251001",
877
- "claude-opus-4-0",
878
- "claude-opus-4-1",
879
- "claude-opus-4-1-20250805",
880
- "claude-opus-4-20250514",
881
- "claude-sonnet-4-0",
882
- "claude-sonnet-4-20250514",
883
- "claude-sonnet-4-5",
884
- "claude-sonnet-4-5-20250929"
885
- ],
886
- docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
887
- gateway: "models.dev"
888
- },
889
- moonshotai: {
890
- url: "https://api.moonshot.ai/v1",
891
- apiKeyEnvVar: "MOONSHOT_API_KEY",
892
- apiKeyHeader: "Authorization",
893
- name: "Moonshot AI",
894
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
895
- docUrl: "https://platform.moonshot.ai/docs/api/chat",
896
- gateway: "models.dev"
897
- },
898
- inference: {
899
- url: "https://inference.net/v1",
900
- apiKeyEnvVar: "INFERENCE_API_KEY",
901
- apiKeyHeader: "Authorization",
902
- name: "Inference",
903
- models: [
904
- "google/gemma-3",
905
- "meta/llama-3.1-8b-instruct",
906
- "meta/llama-3.2-11b-vision-instruct",
907
- "meta/llama-3.2-1b-instruct",
908
- "meta/llama-3.2-3b-instruct",
909
- "mistral/mistral-nemo-12b-instruct",
910
- "osmosis/osmosis-structure-0.6b",
911
- "qwen/qwen-2.5-7b-vision-instruct",
912
- "qwen/qwen3-embedding-4b"
913
- ],
914
- docUrl: "https://inference.net/models",
915
- gateway: "models.dev"
916
- },
917
- baseten: {
918
- url: "https://inference.baseten.co/v1",
919
- apiKeyEnvVar: "BASETEN_API_KEY",
769
+ "zhipuai-coding-plan": {
770
+ url: "https://open.bigmodel.cn/api/coding/paas/v4",
771
+ apiKeyEnvVar: "ZHIPU_API_KEY",
920
772
  apiKeyHeader: "Authorization",
921
- name: "Baseten",
922
- models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
923
- docUrl: "https://docs.baseten.co/development/model-apis/overview",
773
+ name: "Zhipu AI Coding Plan",
774
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
775
+ docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
924
776
  gateway: "models.dev"
925
777
  },
926
- cortecs: {
927
- url: "https://api.cortecs.ai/v1",
928
- apiKeyEnvVar: "CORTECS_API_KEY",
778
+ perplexity: {
779
+ url: "https://api.perplexity.ai",
780
+ apiKeyEnvVar: "PERPLEXITY_API_KEY",
929
781
  apiKeyHeader: "Authorization",
930
- name: "Cortecs",
931
- models: [
932
- "claude-4-5-sonnet",
933
- "claude-sonnet-4",
934
- "deepseek-v3-0324",
935
- "gemini-2.5-pro",
936
- "gpt-4.1",
937
- "gpt-oss-120b",
938
- "kimi-k2-instruct",
939
- "llama-3.1-405b-instruct",
940
- "nova-pro-v1",
941
- "qwen3-32b",
942
- "qwen3-coder-480b-a35b-instruct"
943
- ],
944
- docUrl: "https://api.cortecs.ai/v1/models",
782
+ name: "Perplexity",
783
+ models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
784
+ docUrl: "https://docs.perplexity.ai",
945
785
  gateway: "models.dev"
946
786
  },
947
- mistral: {
948
- url: "https://api.mistral.ai/v1",
949
- apiKeyEnvVar: "MISTRAL_API_KEY",
950
- apiKeyHeader: "Authorization",
951
- name: "Mistral",
787
+ openrouter: {
788
+ url: "https://openrouter.ai/api/v1",
789
+ apiKeyEnvVar: "OPENROUTER_API_KEY",
790
+ name: "OpenRouter",
952
791
  models: [
953
- "codestral-latest",
954
- "devstral-medium-2507",
955
- "devstral-small-2505",
956
- "devstral-small-2507",
957
- "magistral-medium-latest",
958
- "magistral-small",
959
- "ministral-3b-latest",
960
- "ministral-8b-latest",
961
- "mistral-large-latest",
962
- "mistral-medium-2505",
963
- "mistral-medium-2508",
964
- "mistral-medium-latest",
965
- "mistral-nemo",
966
- "mistral-small-latest",
967
- "open-mistral-7b",
968
- "open-mixtral-8x22b",
969
- "open-mixtral-8x7b",
970
- "pixtral-12b",
971
- "pixtral-large-latest"
792
+ "anthropic/claude-3.5-haiku",
793
+ "anthropic/claude-3.7-sonnet",
794
+ "anthropic/claude-haiku-4.5",
795
+ "anthropic/claude-opus-4",
796
+ "anthropic/claude-opus-4.1",
797
+ "anthropic/claude-sonnet-4",
798
+ "anthropic/claude-sonnet-4.5",
799
+ "cognitivecomputations/dolphin3.0-mistral-24b",
800
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
801
+ "deepseek/deepseek-chat-v3-0324",
802
+ "deepseek/deepseek-chat-v3.1",
803
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
804
+ "deepseek/deepseek-r1-0528:free",
805
+ "deepseek/deepseek-r1-distill-llama-70b",
806
+ "deepseek/deepseek-r1-distill-qwen-14b",
807
+ "deepseek/deepseek-r1:free",
808
+ "deepseek/deepseek-v3-base:free",
809
+ "deepseek/deepseek-v3.1-terminus",
810
+ "featherless/qwerky-72b",
811
+ "google/gemini-2.0-flash-001",
812
+ "google/gemini-2.0-flash-exp:free",
813
+ "google/gemini-2.5-flash",
814
+ "google/gemini-2.5-flash-lite",
815
+ "google/gemini-2.5-flash-lite-preview-09-2025",
816
+ "google/gemini-2.5-flash-preview-09-2025",
817
+ "google/gemini-2.5-pro",
818
+ "google/gemini-2.5-pro-preview-05-06",
819
+ "google/gemini-2.5-pro-preview-06-05",
820
+ "google/gemma-2-9b-it:free",
821
+ "google/gemma-3-12b-it",
822
+ "google/gemma-3-27b-it",
823
+ "google/gemma-3n-e4b-it",
824
+ "google/gemma-3n-e4b-it:free",
825
+ "meta-llama/llama-3.2-11b-vision-instruct",
826
+ "meta-llama/llama-3.3-70b-instruct:free",
827
+ "meta-llama/llama-4-scout:free",
828
+ "microsoft/mai-ds-r1:free",
829
+ "mistralai/codestral-2508",
830
+ "mistralai/devstral-medium-2507",
831
+ "mistralai/devstral-small-2505",
832
+ "mistralai/devstral-small-2505:free",
833
+ "mistralai/devstral-small-2507",
834
+ "mistralai/mistral-7b-instruct:free",
835
+ "mistralai/mistral-medium-3",
836
+ "mistralai/mistral-medium-3.1",
837
+ "mistralai/mistral-nemo:free",
838
+ "mistralai/mistral-small-3.1-24b-instruct",
839
+ "mistralai/mistral-small-3.2-24b-instruct",
840
+ "mistralai/mistral-small-3.2-24b-instruct:free",
841
+ "moonshotai/kimi-dev-72b:free",
842
+ "moonshotai/kimi-k2",
843
+ "moonshotai/kimi-k2-0905",
844
+ "moonshotai/kimi-k2:free",
845
+ "nousresearch/deephermes-3-llama-3-8b-preview",
846
+ "nousresearch/hermes-4-405b",
847
+ "nousresearch/hermes-4-70b",
848
+ "openai/gpt-4.1",
849
+ "openai/gpt-4.1-mini",
850
+ "openai/gpt-4o-mini",
851
+ "openai/gpt-5",
852
+ "openai/gpt-5-chat",
853
+ "openai/gpt-5-codex",
854
+ "openai/gpt-5-image",
855
+ "openai/gpt-5-mini",
856
+ "openai/gpt-5-nano",
857
+ "openai/gpt-oss-120b",
858
+ "openai/gpt-oss-20b",
859
+ "openai/o4-mini",
860
+ "openrouter/cypher-alpha:free",
861
+ "openrouter/horizon-alpha",
862
+ "openrouter/horizon-beta",
863
+ "openrouter/sonoma-dusk-alpha",
864
+ "openrouter/sonoma-sky-alpha",
865
+ "qwen/qwen-2.5-coder-32b-instruct",
866
+ "qwen/qwen2.5-vl-32b-instruct:free",
867
+ "qwen/qwen2.5-vl-72b-instruct",
868
+ "qwen/qwen2.5-vl-72b-instruct:free",
869
+ "qwen/qwen3-14b:free",
870
+ "qwen/qwen3-235b-a22b-07-25",
871
+ "qwen/qwen3-235b-a22b-07-25:free",
872
+ "qwen/qwen3-235b-a22b-thinking-2507",
873
+ "qwen/qwen3-235b-a22b:free",
874
+ "qwen/qwen3-30b-a3b-instruct-2507",
875
+ "qwen/qwen3-30b-a3b-thinking-2507",
876
+ "qwen/qwen3-30b-a3b:free",
877
+ "qwen/qwen3-32b:free",
878
+ "qwen/qwen3-8b:free",
879
+ "qwen/qwen3-coder",
880
+ "qwen/qwen3-coder:free",
881
+ "qwen/qwen3-max",
882
+ "qwen/qwen3-next-80b-a3b-instruct",
883
+ "qwen/qwen3-next-80b-a3b-thinking",
884
+ "qwen/qwq-32b:free",
885
+ "rekaai/reka-flash-3",
886
+ "sarvamai/sarvam-m:free",
887
+ "thudm/glm-z1-32b:free",
888
+ "tngtech/deepseek-r1t2-chimera:free",
889
+ "x-ai/grok-3",
890
+ "x-ai/grok-3-beta",
891
+ "x-ai/grok-3-mini",
892
+ "x-ai/grok-3-mini-beta",
893
+ "x-ai/grok-4",
894
+ "x-ai/grok-4-fast",
895
+ "x-ai/grok-4-fast:free",
896
+ "x-ai/grok-code-fast-1",
897
+ "z-ai/glm-4.5",
898
+ "z-ai/glm-4.5-air",
899
+ "z-ai/glm-4.5-air:free",
900
+ "z-ai/glm-4.5v",
901
+ "z-ai/glm-4.6"
972
902
  ],
973
- docUrl: "https://docs.mistral.ai/getting-started/models/",
903
+ docUrl: "https://openrouter.ai/models",
974
904
  gateway: "models.dev"
975
905
  },
976
- venice: {
977
- url: "https://api.venice.ai/api/v1",
978
- apiKeyEnvVar: "VENICE_API_KEY",
906
+ synthetic: {
907
+ url: "https://api.synthetic.new/v1",
908
+ apiKeyEnvVar: "SYNTHETIC_API_KEY",
979
909
  apiKeyHeader: "Authorization",
980
- name: "Venice AI",
910
+ name: "Synthetic",
981
911
  models: [
982
- "deepseek-coder-v2-lite",
983
- "deepseek-r1-671b",
984
- "dolphin-2.9.2-qwen2-72b",
985
- "llama-3.1-405b",
986
- "llama-3.2-3b",
987
- "llama-3.3-70b",
988
- "mistral-31-24b",
989
- "qwen-2.5-coder-32b",
990
- "qwen-2.5-qwq-32b",
991
- "qwen-2.5-vl",
992
- "qwen3-235b",
993
- "qwen3-4b",
994
- "venice-uncensored"
912
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
913
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
914
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
915
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
916
+ "hf:deepseek-ai/DeepSeek-R1",
917
+ "hf:deepseek-ai/DeepSeek-R1-0528",
918
+ "hf:deepseek-ai/DeepSeek-V3",
919
+ "hf:deepseek-ai/DeepSeek-V3-0324",
920
+ "hf:deepseek-ai/DeepSeek-V3.1",
921
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
922
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
923
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
924
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
925
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
926
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
927
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
928
+ "hf:moonshotai/Kimi-K2-Instruct",
929
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
930
+ "hf:openai/gpt-oss-120b",
931
+ "hf:zai-org/GLM-4.5",
932
+ "hf:zai-org/GLM-4.6"
995
933
  ],
996
- docUrl: "https://docs.venice.ai",
934
+ docUrl: "https://synthetic.new/pricing",
997
935
  gateway: "models.dev"
998
936
  },
999
- alibaba: {
1000
- url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
1001
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
937
+ deepinfra: {
938
+ url: "https://api.deepinfra.com/v1/openai",
939
+ apiKeyEnvVar: "DEEPINFRA_API_KEY",
1002
940
  apiKeyHeader: "Authorization",
1003
- name: "Alibaba",
941
+ name: "Deep Infra",
1004
942
  models: [
1005
- "qvq-max",
1006
- "qwen-flash",
1007
- "qwen-max",
1008
- "qwen-mt-plus",
1009
- "qwen-mt-turbo",
1010
- "qwen-omni-turbo",
1011
- "qwen-omni-turbo-realtime",
1012
- "qwen-plus",
1013
- "qwen-plus-character-ja",
1014
- "qwen-turbo",
1015
- "qwen-vl-max",
1016
- "qwen-vl-ocr",
1017
- "qwen-vl-plus",
1018
- "qwen2-5-14b-instruct",
1019
- "qwen2-5-32b-instruct",
1020
- "qwen2-5-72b-instruct",
1021
- "qwen2-5-7b-instruct",
1022
- "qwen2-5-omni-7b",
1023
- "qwen2-5-vl-72b-instruct",
1024
- "qwen2-5-vl-7b-instruct",
1025
- "qwen3-14b",
1026
- "qwen3-235b-a22b",
1027
- "qwen3-32b",
1028
- "qwen3-8b",
1029
- "qwen3-asr-flash",
1030
- "qwen3-coder-30b-a3b-instruct",
1031
- "qwen3-coder-480b-a35b-instruct",
1032
- "qwen3-coder-flash",
1033
- "qwen3-coder-plus",
1034
- "qwen3-livetranslate-flash-realtime",
1035
- "qwen3-max",
1036
- "qwen3-next-80b-a3b-instruct",
1037
- "qwen3-next-80b-a3b-thinking",
1038
- "qwen3-omni-flash",
1039
- "qwen3-omni-flash-realtime",
1040
- "qwen3-vl-235b-a22b",
1041
- "qwen3-vl-30b-a3b",
1042
- "qwen3-vl-plus",
1043
- "qwq-plus"
943
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
944
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
945
+ "moonshotai/Kimi-K2-Instruct",
946
+ "zai-org/GLM-4.5"
1044
947
  ],
1045
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
948
+ docUrl: "https://deepinfra.com/models",
1046
949
  gateway: "models.dev"
1047
950
  },
1048
- "alibaba-cn": {
1049
- url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
1050
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
951
+ zhipuai: {
952
+ url: "https://open.bigmodel.cn/api/paas/v4",
953
+ apiKeyEnvVar: "ZHIPU_API_KEY",
1051
954
  apiKeyHeader: "Authorization",
1052
- name: "Alibaba (China)",
955
+ name: "Zhipu AI",
956
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
957
+ docUrl: "https://docs.z.ai/guides/overview/pricing",
958
+ gateway: "models.dev"
959
+ },
960
+ submodel: {
961
+ url: "https://llm.submodel.ai/v1",
962
+ apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
963
+ apiKeyHeader: "Authorization",
964
+ name: "submodel",
1053
965
  models: [
1054
- "deepseek-r1",
1055
- "deepseek-r1-0528",
1056
- "deepseek-r1-distill-llama-70b",
1057
- "deepseek-r1-distill-llama-8b",
1058
- "deepseek-r1-distill-qwen-1-5b",
1059
- "deepseek-r1-distill-qwen-14b",
1060
- "deepseek-r1-distill-qwen-32b",
1061
- "deepseek-r1-distill-qwen-7b",
1062
- "deepseek-v3",
1063
- "deepseek-v3-1",
1064
- "deepseek-v3-2-exp",
1065
- "moonshot-kimi-k2-instruct",
1066
- "qvq-max",
1067
- "qwen-deep-research",
1068
- "qwen-doc-turbo",
1069
- "qwen-flash",
1070
- "qwen-long",
1071
- "qwen-math-plus",
1072
- "qwen-math-turbo",
1073
- "qwen-max",
1074
- "qwen-mt-plus",
1075
- "qwen-mt-turbo",
1076
- "qwen-omni-turbo",
1077
- "qwen-omni-turbo-realtime",
1078
- "qwen-plus",
1079
- "qwen-plus-character",
1080
- "qwen-turbo",
1081
- "qwen-vl-max",
1082
- "qwen-vl-ocr",
1083
- "qwen-vl-plus",
1084
- "qwen2-5-14b-instruct",
1085
- "qwen2-5-32b-instruct",
1086
- "qwen2-5-72b-instruct",
1087
- "qwen2-5-7b-instruct",
1088
- "qwen2-5-coder-32b-instruct",
1089
- "qwen2-5-coder-7b-instruct",
1090
- "qwen2-5-math-72b-instruct",
1091
- "qwen2-5-math-7b-instruct",
1092
- "qwen2-5-omni-7b",
1093
- "qwen2-5-vl-72b-instruct",
1094
- "qwen2-5-vl-7b-instruct",
1095
- "qwen3-14b",
1096
- "qwen3-235b-a22b",
1097
- "qwen3-32b",
1098
- "qwen3-8b",
1099
- "qwen3-asr-flash",
1100
- "qwen3-coder-30b-a3b-instruct",
1101
- "qwen3-coder-480b-a35b-instruct",
1102
- "qwen3-coder-flash",
1103
- "qwen3-coder-plus",
1104
- "qwen3-max",
1105
- "qwen3-next-80b-a3b-instruct",
1106
- "qwen3-next-80b-a3b-thinking",
1107
- "qwen3-omni-flash",
1108
- "qwen3-omni-flash-realtime",
1109
- "qwen3-vl-235b-a22b",
1110
- "qwen3-vl-30b-a3b",
1111
- "qwen3-vl-plus",
1112
- "qwq-32b",
1113
- "qwq-plus",
1114
- "tongyi-intent-detect-v3"
966
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
967
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
968
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
969
+ "deepseek-ai/DeepSeek-R1-0528",
970
+ "deepseek-ai/DeepSeek-V3-0324",
971
+ "deepseek-ai/DeepSeek-V3.1",
972
+ "openai/gpt-oss-120b",
973
+ "zai-org/GLM-4.5-Air",
974
+ "zai-org/GLM-4.5-FP8"
1115
975
  ],
1116
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
976
+ docUrl: "https://submodel.gitbook.io",
1117
977
  gateway: "models.dev"
1118
978
  },
1119
- chutes: {
1120
- url: "https://llm.chutes.ai/v1",
1121
- apiKeyEnvVar: "CHUTES_API_KEY",
979
+ zai: {
980
+ url: "https://api.z.ai/api/paas/v4",
981
+ apiKeyEnvVar: "ZHIPU_API_KEY",
1122
982
  apiKeyHeader: "Authorization",
1123
- name: "Chutes",
983
+ name: "Z.AI",
984
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
985
+ docUrl: "https://docs.z.ai/guides/overview/pricing",
986
+ gateway: "models.dev"
987
+ },
988
+ inference: {
989
+ url: "https://inference.net/v1",
990
+ apiKeyEnvVar: "INFERENCE_API_KEY",
991
+ apiKeyHeader: "Authorization",
992
+ name: "Inference",
993
+ models: [
994
+ "google/gemma-3",
995
+ "meta/llama-3.1-8b-instruct",
996
+ "meta/llama-3.2-11b-vision-instruct",
997
+ "meta/llama-3.2-1b-instruct",
998
+ "meta/llama-3.2-3b-instruct",
999
+ "mistral/mistral-nemo-12b-instruct",
1000
+ "osmosis/osmosis-structure-0.6b",
1001
+ "qwen/qwen-2.5-7b-vision-instruct",
1002
+ "qwen/qwen3-embedding-4b"
1003
+ ],
1004
+ docUrl: "https://inference.net/models",
1005
+ gateway: "models.dev"
1006
+ },
1007
+ requesty: {
1008
+ url: "https://router.requesty.ai/v1",
1009
+ apiKeyEnvVar: "REQUESTY_API_KEY",
1010
+ apiKeyHeader: "Authorization",
1011
+ name: "Requesty",
1012
+ models: [
1013
+ "anthropic/claude-3-7-sonnet",
1014
+ "anthropic/claude-4-sonnet-20250522",
1015
+ "anthropic/claude-opus-4",
1016
+ "anthropic/claude-opus-4-1-20250805",
1017
+ "google/gemini-2.5-flash",
1018
+ "google/gemini-2.5-pro",
1019
+ "openai/gpt-4.1",
1020
+ "openai/gpt-4.1-mini",
1021
+ "openai/gpt-4o-mini",
1022
+ "openai/gpt-5",
1023
+ "openai/gpt-5-mini",
1024
+ "openai/gpt-5-nano",
1025
+ "openai/o4-mini"
1026
+ ],
1027
+ docUrl: "https://requesty.ai/solution/llm-routing/models",
1028
+ gateway: "models.dev"
1029
+ },
1030
+ morph: {
1031
+ url: "https://api.morphllm.com/v1",
1032
+ apiKeyEnvVar: "MORPH_API_KEY",
1033
+ apiKeyHeader: "Authorization",
1034
+ name: "Morph",
1035
+ models: ["auto", "morph-v3-fast", "morph-v3-large"],
1036
+ docUrl: "https://docs.morphllm.com/api-reference/introduction",
1037
+ gateway: "models.dev"
1038
+ },
1039
+ lmstudio: {
1040
+ url: "http://127.0.0.1:1234/v1",
1041
+ apiKeyEnvVar: "LMSTUDIO_API_KEY",
1042
+ apiKeyHeader: "Authorization",
1043
+ name: "LMStudio",
1044
+ models: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1045
+ docUrl: "https://lmstudio.ai/models",
1046
+ gateway: "models.dev"
1047
+ },
1048
+ anthropic: {
1049
+ apiKeyEnvVar: "ANTHROPIC_API_KEY",
1050
+ name: "Anthropic",
1051
+ models: [
1052
+ "claude-3-5-haiku-20241022",
1053
+ "claude-3-5-haiku-latest",
1054
+ "claude-3-5-sonnet-20240620",
1055
+ "claude-3-5-sonnet-20241022",
1056
+ "claude-3-7-sonnet-20250219",
1057
+ "claude-3-7-sonnet-latest",
1058
+ "claude-3-haiku-20240307",
1059
+ "claude-3-opus-20240229",
1060
+ "claude-3-sonnet-20240229",
1061
+ "claude-haiku-4-5",
1062
+ "claude-haiku-4-5-20251001",
1063
+ "claude-opus-4-0",
1064
+ "claude-opus-4-1",
1065
+ "claude-opus-4-1-20250805",
1066
+ "claude-opus-4-20250514",
1067
+ "claude-sonnet-4-0",
1068
+ "claude-sonnet-4-20250514",
1069
+ "claude-sonnet-4-5",
1070
+ "claude-sonnet-4-5-20250929"
1071
+ ],
1072
+ docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
1073
+ gateway: "models.dev"
1074
+ },
1075
+ "fireworks-ai": {
1076
+ url: "https://api.fireworks.ai/inference/v1/",
1077
+ apiKeyEnvVar: "FIREWORKS_API_KEY",
1078
+ apiKeyHeader: "Authorization",
1079
+ name: "Fireworks AI",
1080
+ models: [
1081
+ "accounts/fireworks/models/deepseek-r1-0528",
1082
+ "accounts/fireworks/models/deepseek-v3-0324",
1083
+ "accounts/fireworks/models/deepseek-v3p1",
1084
+ "accounts/fireworks/models/glm-4p5",
1085
+ "accounts/fireworks/models/glm-4p5-air",
1086
+ "accounts/fireworks/models/gpt-oss-120b",
1087
+ "accounts/fireworks/models/gpt-oss-20b",
1088
+ "accounts/fireworks/models/kimi-k2-instruct",
1089
+ "accounts/fireworks/models/qwen3-235b-a22b",
1090
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1091
+ ],
1092
+ docUrl: "https://fireworks.ai/docs/",
1093
+ gateway: "models.dev"
1094
+ },
1095
+ modelscope: {
1096
+ url: "https://api-inference.modelscope.cn/v1",
1097
+ apiKeyEnvVar: "MODELSCOPE_API_KEY",
1098
+ apiKeyHeader: "Authorization",
1099
+ name: "ModelScope",
1100
+ models: [
1101
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1102
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1103
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1104
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1105
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1106
+ "ZhipuAI/GLM-4.5",
1107
+ "ZhipuAI/GLM-4.6"
1108
+ ],
1109
+ docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
1110
+ gateway: "models.dev"
1111
+ },
1112
+ llama: {
1113
+ url: "https://api.llama.com/compat/v1/",
1114
+ apiKeyEnvVar: "LLAMA_API_KEY",
1115
+ apiKeyHeader: "Authorization",
1116
+ name: "Llama",
1117
+ models: [
1118
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1119
+ "cerebras-llama-4-scout-17b-16e-instruct",
1120
+ "groq-llama-4-maverick-17b-128e-instruct",
1121
+ "llama-3.3-70b-instruct",
1122
+ "llama-3.3-8b-instruct",
1123
+ "llama-4-maverick-17b-128e-instruct-fp8",
1124
+ "llama-4-scout-17b-16e-instruct-fp8"
1125
+ ],
1126
+ docUrl: "https://llama.developer.meta.com/docs/models",
1127
+ gateway: "models.dev"
1128
+ },
1129
+ scaleway: {
1130
+ url: "https://api.scaleway.ai/v1",
1131
+ apiKeyEnvVar: "SCALEWAY_API_KEY",
1132
+ apiKeyHeader: "Authorization",
1133
+ name: "Scaleway",
1124
1134
  models: [
1125
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1126
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1127
- "Qwen/Qwen3-30B-A3B",
1128
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1129
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1130
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1131
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1132
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1133
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1134
- "chutesai/Devstral-Small-2505",
1135
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1136
- "deepseek-ai/DeepSeek-R1-0528",
1137
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1138
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1139
- "deepseek-ai/DeepSeek-V3-0324",
1140
- "deepseek-ai/DeepSeek-V3.1",
1141
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1142
- "deepseek-ai/DeepSeek-V3.1-turbo",
1143
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1144
- "deepseek-ai/DeepSeek-V3.2-Exp",
1145
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1146
- "moonshotai/Kimi-Dev-72B",
1147
- "moonshotai/Kimi-K2-Instruct-0905",
1148
- "moonshotai/Kimi-K2-Instruct-75k",
1149
- "moonshotai/Kimi-VL-A3B-Thinking",
1150
- "openai/gpt-oss-120b",
1151
- "tngtech/DeepSeek-R1T-Chimera",
1152
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1153
- "zai-org/GLM-4.5-Air",
1154
- "zai-org/GLM-4.5-FP8",
1155
- "zai-org/GLM-4.5-turbo",
1156
- "zai-org/GLM-4.6-FP8",
1157
- "zai-org/GLM-4.6-turbo"
1135
+ "deepseek-r1-distill-llama-70b",
1136
+ "gemma-3-27b-it",
1137
+ "gpt-oss-120b",
1138
+ "llama-3.1-8b-instruct",
1139
+ "llama-3.3-70b-instruct",
1140
+ "mistral-nemo-instruct-2407",
1141
+ "mistral-small-3.2-24b-instruct-2506",
1142
+ "pixtral-12b-2409",
1143
+ "qwen3-235b-a22b-instruct-2507",
1144
+ "qwen3-coder-30b-a3b-instruct",
1145
+ "voxtral-small-24b-2507"
1158
1146
  ],
1159
- docUrl: "https://llm.chutes.ai/v1/models",
1147
+ docUrl: "https://www.scaleway.com/en/docs/generative-apis/",
1160
1148
  gateway: "models.dev"
1161
1149
  },
1162
- upstage: {
1163
- url: "https://api.upstage.ai",
1164
- apiKeyEnvVar: "UPSTAGE_API_KEY",
1150
+ cerebras: {
1151
+ url: "https://api.cerebras.ai/v1",
1152
+ apiKeyEnvVar: "CEREBRAS_API_KEY",
1165
1153
  apiKeyHeader: "Authorization",
1166
- name: "Upstage",
1167
- models: ["solar-mini", "solar-pro2"],
1168
- docUrl: "https://developers.upstage.ai/docs/apis/chat",
1154
+ name: "Cerebras",
1155
+ models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1156
+ docUrl: "https://inference-docs.cerebras.ai/models/overview",
1169
1157
  gateway: "models.dev"
1170
1158
  },
1171
1159
  netlify: {
@@ -1213,6 +1201,73 @@ var provider_registry_default = {
1213
1201
  }
1214
1202
  },
1215
1203
  models: {
1204
+ "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1205
+ lucidquery: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1206
+ moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1207
+ "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1208
+ alibaba: [
1209
+ "qvq-max",
1210
+ "qwen-flash",
1211
+ "qwen-max",
1212
+ "qwen-mt-plus",
1213
+ "qwen-mt-turbo",
1214
+ "qwen-omni-turbo",
1215
+ "qwen-omni-turbo-realtime",
1216
+ "qwen-plus",
1217
+ "qwen-plus-character-ja",
1218
+ "qwen-turbo",
1219
+ "qwen-vl-max",
1220
+ "qwen-vl-ocr",
1221
+ "qwen-vl-plus",
1222
+ "qwen2-5-14b-instruct",
1223
+ "qwen2-5-32b-instruct",
1224
+ "qwen2-5-72b-instruct",
1225
+ "qwen2-5-7b-instruct",
1226
+ "qwen2-5-omni-7b",
1227
+ "qwen2-5-vl-72b-instruct",
1228
+ "qwen2-5-vl-7b-instruct",
1229
+ "qwen3-14b",
1230
+ "qwen3-235b-a22b",
1231
+ "qwen3-32b",
1232
+ "qwen3-8b",
1233
+ "qwen3-asr-flash",
1234
+ "qwen3-coder-30b-a3b-instruct",
1235
+ "qwen3-coder-480b-a35b-instruct",
1236
+ "qwen3-coder-flash",
1237
+ "qwen3-coder-plus",
1238
+ "qwen3-livetranslate-flash-realtime",
1239
+ "qwen3-max",
1240
+ "qwen3-next-80b-a3b-instruct",
1241
+ "qwen3-next-80b-a3b-thinking",
1242
+ "qwen3-omni-flash",
1243
+ "qwen3-omni-flash-realtime",
1244
+ "qwen3-vl-235b-a22b",
1245
+ "qwen3-vl-30b-a3b",
1246
+ "qwen3-vl-plus",
1247
+ "qwq-plus"
1248
+ ],
1249
+ xai: [
1250
+ "grok-2",
1251
+ "grok-2-1212",
1252
+ "grok-2-latest",
1253
+ "grok-2-vision",
1254
+ "grok-2-vision-1212",
1255
+ "grok-2-vision-latest",
1256
+ "grok-3",
1257
+ "grok-3-fast",
1258
+ "grok-3-fast-latest",
1259
+ "grok-3-latest",
1260
+ "grok-3-mini",
1261
+ "grok-3-mini-fast",
1262
+ "grok-3-mini-fast-latest",
1263
+ "grok-3-mini-latest",
1264
+ "grok-4",
1265
+ "grok-4-fast",
1266
+ "grok-4-fast-non-reasoning",
1267
+ "grok-beta",
1268
+ "grok-code-fast-1",
1269
+ "grok-vision-beta"
1270
+ ],
1216
1271
  nvidia: [
1217
1272
  "black-forest-labs/flux.1-dev",
1218
1273
  "deepseek-ai/deepseek-v3.1",
@@ -1226,99 +1281,375 @@ var provider_registry_default = {
1226
1281
  "nvidia/nemoretriever-ocr-v1",
1227
1282
  "nvidia/parakeet-tdt-0.6b-v2",
1228
1283
  "openai/gpt-oss-120b",
1229
- "openai/whisper-large-v3",
1230
- "qwen/qwen3-235b-a22b",
1231
- "qwen/qwen3-coder-480b-a35b-instruct"
1284
+ "openai/whisper-large-v3",
1285
+ "qwen/qwen3-235b-a22b",
1286
+ "qwen/qwen3-coder-480b-a35b-instruct"
1287
+ ],
1288
+ upstage: ["solar-mini", "solar-pro2"],
1289
+ groq: [
1290
+ "deepseek-r1-distill-llama-70b",
1291
+ "gemma2-9b-it",
1292
+ "llama-3.1-8b-instant",
1293
+ "llama-3.3-70b-versatile",
1294
+ "llama-guard-3-8b",
1295
+ "llama3-70b-8192",
1296
+ "llama3-8b-8192",
1297
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
1298
+ "meta-llama/llama-4-scout-17b-16e-instruct",
1299
+ "meta-llama/llama-guard-4-12b",
1300
+ "mistral-saba-24b",
1301
+ "moonshotai/kimi-k2-instruct",
1302
+ "moonshotai/kimi-k2-instruct-0905",
1303
+ "openai/gpt-oss-120b",
1304
+ "openai/gpt-oss-20b",
1305
+ "qwen-qwq-32b",
1306
+ "qwen/qwen3-32b"
1307
+ ],
1308
+ mistral: [
1309
+ "codestral-latest",
1310
+ "devstral-medium-2507",
1311
+ "devstral-small-2505",
1312
+ "devstral-small-2507",
1313
+ "magistral-medium-latest",
1314
+ "magistral-small",
1315
+ "ministral-3b-latest",
1316
+ "ministral-8b-latest",
1317
+ "mistral-large-latest",
1318
+ "mistral-medium-2505",
1319
+ "mistral-medium-2508",
1320
+ "mistral-medium-latest",
1321
+ "mistral-nemo",
1322
+ "mistral-small-latest",
1323
+ "open-mistral-7b",
1324
+ "open-mixtral-8x22b",
1325
+ "open-mixtral-8x7b",
1326
+ "pixtral-12b",
1327
+ "pixtral-large-latest"
1328
+ ],
1329
+ vercel: [
1330
+ "alibaba/qwen3-coder-plus",
1331
+ "alibaba/qwen3-max",
1332
+ "alibaba/qwen3-next-80b-a3b-instruct",
1333
+ "alibaba/qwen3-next-80b-a3b-thinking",
1334
+ "alibaba/qwen3-vl-instruct",
1335
+ "alibaba/qwen3-vl-thinking",
1336
+ "amazon/nova-lite",
1337
+ "amazon/nova-micro",
1338
+ "amazon/nova-pro",
1339
+ "anthropic/claude-3-5-haiku",
1340
+ "anthropic/claude-3-haiku",
1341
+ "anthropic/claude-3-opus",
1342
+ "anthropic/claude-3.5-sonnet",
1343
+ "anthropic/claude-3.7-sonnet",
1344
+ "anthropic/claude-4-1-opus",
1345
+ "anthropic/claude-4-opus",
1346
+ "anthropic/claude-4-sonnet",
1347
+ "anthropic/claude-4.5-sonnet",
1348
+ "anthropic/claude-haiku-4.5",
1349
+ "cerebras/qwen3-coder",
1350
+ "deepseek/deepseek-r1",
1351
+ "deepseek/deepseek-r1-distill-llama-70b",
1352
+ "deepseek/deepseek-v3.1-terminus",
1353
+ "deepseek/deepseek-v3.2-exp",
1354
+ "deepseek/deepseek-v3.2-exp-thinking",
1355
+ "google/gemini-2.0-flash",
1356
+ "google/gemini-2.0-flash-lite",
1357
+ "google/gemini-2.5-flash",
1358
+ "google/gemini-2.5-flash-lite",
1359
+ "google/gemini-2.5-flash-lite-preview-09-2025",
1360
+ "google/gemini-2.5-flash-preview-09-2025",
1361
+ "google/gemini-2.5-pro",
1362
+ "meta/llama-3.3-70b",
1363
+ "meta/llama-4-maverick",
1364
+ "meta/llama-4-scout",
1365
+ "mistral/codestral",
1366
+ "mistral/magistral-medium",
1367
+ "mistral/magistral-small",
1368
+ "mistral/ministral-3b",
1369
+ "mistral/ministral-8b",
1370
+ "mistral/mistral-large",
1371
+ "mistral/mistral-small",
1372
+ "mistral/mixtral-8x22b-instruct",
1373
+ "mistral/pixtral-12b",
1374
+ "mistral/pixtral-large",
1375
+ "moonshotai/kimi-k2",
1376
+ "morph/morph-v3-fast",
1377
+ "morph/morph-v3-large",
1378
+ "openai/gpt-4-turbo",
1379
+ "openai/gpt-4.1",
1380
+ "openai/gpt-4.1-mini",
1381
+ "openai/gpt-4.1-nano",
1382
+ "openai/gpt-4o",
1383
+ "openai/gpt-4o-mini",
1384
+ "openai/gpt-5",
1385
+ "openai/gpt-5-codex",
1386
+ "openai/gpt-5-mini",
1387
+ "openai/gpt-5-nano",
1388
+ "openai/gpt-oss-120b",
1389
+ "openai/gpt-oss-20b",
1390
+ "openai/o1",
1391
+ "openai/o3",
1392
+ "openai/o3-mini",
1393
+ "openai/o4-mini",
1394
+ "perplexity/sonar",
1395
+ "perplexity/sonar-pro",
1396
+ "perplexity/sonar-reasoning",
1397
+ "perplexity/sonar-reasoning-pro",
1398
+ "vercel/v0-1.0-md",
1399
+ "vercel/v0-1.5-md",
1400
+ "xai/grok-2",
1401
+ "xai/grok-2-vision",
1402
+ "xai/grok-3",
1403
+ "xai/grok-3-fast",
1404
+ "xai/grok-3-mini",
1405
+ "xai/grok-3-mini-fast",
1406
+ "xai/grok-4",
1407
+ "xai/grok-4-fast",
1408
+ "xai/grok-4-fast-non-reasoning",
1409
+ "xai/grok-code-fast-1",
1410
+ "zai/glm-4.5",
1411
+ "zai/glm-4.5-air",
1412
+ "zai/glm-4.5v",
1413
+ "zai/glm-4.6"
1414
+ ],
1415
+ nebius: [
1416
+ "NousResearch/hermes-4-405b",
1417
+ "NousResearch/hermes-4-70b",
1418
+ "deepseek-ai/deepseek-v3",
1419
+ "meta-llama/llama-3.3-70b-instruct-base",
1420
+ "meta-llama/llama-3.3-70b-instruct-fast",
1421
+ "meta-llama/llama-3_1-405b-instruct",
1422
+ "moonshotai/kimi-k2-instruct",
1423
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1424
+ "openai/gpt-oss-120b",
1425
+ "openai/gpt-oss-20b",
1426
+ "qwen/qwen3-235b-a22b-instruct-2507",
1427
+ "qwen/qwen3-235b-a22b-thinking-2507",
1428
+ "qwen/qwen3-coder-480b-a35b-instruct",
1429
+ "zai-org/glm-4.5",
1430
+ "zai-org/glm-4.5-air"
1232
1431
  ],
1233
- modelscope: [
1432
+ deepseek: ["deepseek-chat", "deepseek-reasoner"],
1433
+ "alibaba-cn": [
1434
+ "deepseek-r1",
1435
+ "deepseek-r1-0528",
1436
+ "deepseek-r1-distill-llama-70b",
1437
+ "deepseek-r1-distill-llama-8b",
1438
+ "deepseek-r1-distill-qwen-1-5b",
1439
+ "deepseek-r1-distill-qwen-14b",
1440
+ "deepseek-r1-distill-qwen-32b",
1441
+ "deepseek-r1-distill-qwen-7b",
1442
+ "deepseek-v3",
1443
+ "deepseek-v3-1",
1444
+ "deepseek-v3-2-exp",
1445
+ "moonshot-kimi-k2-instruct",
1446
+ "qvq-max",
1447
+ "qwen-deep-research",
1448
+ "qwen-doc-turbo",
1449
+ "qwen-flash",
1450
+ "qwen-long",
1451
+ "qwen-math-plus",
1452
+ "qwen-math-turbo",
1453
+ "qwen-max",
1454
+ "qwen-mt-plus",
1455
+ "qwen-mt-turbo",
1456
+ "qwen-omni-turbo",
1457
+ "qwen-omni-turbo-realtime",
1458
+ "qwen-plus",
1459
+ "qwen-plus-character",
1460
+ "qwen-turbo",
1461
+ "qwen-vl-max",
1462
+ "qwen-vl-ocr",
1463
+ "qwen-vl-plus",
1464
+ "qwen2-5-14b-instruct",
1465
+ "qwen2-5-32b-instruct",
1466
+ "qwen2-5-72b-instruct",
1467
+ "qwen2-5-7b-instruct",
1468
+ "qwen2-5-coder-32b-instruct",
1469
+ "qwen2-5-coder-7b-instruct",
1470
+ "qwen2-5-math-72b-instruct",
1471
+ "qwen2-5-math-7b-instruct",
1472
+ "qwen2-5-omni-7b",
1473
+ "qwen2-5-vl-72b-instruct",
1474
+ "qwen2-5-vl-7b-instruct",
1475
+ "qwen3-14b",
1476
+ "qwen3-235b-a22b",
1477
+ "qwen3-32b",
1478
+ "qwen3-8b",
1479
+ "qwen3-asr-flash",
1480
+ "qwen3-coder-30b-a3b-instruct",
1481
+ "qwen3-coder-480b-a35b-instruct",
1482
+ "qwen3-coder-flash",
1483
+ "qwen3-coder-plus",
1484
+ "qwen3-max",
1485
+ "qwen3-next-80b-a3b-instruct",
1486
+ "qwen3-next-80b-a3b-thinking",
1487
+ "qwen3-omni-flash",
1488
+ "qwen3-omni-flash-realtime",
1489
+ "qwen3-vl-235b-a22b",
1490
+ "qwen3-vl-30b-a3b",
1491
+ "qwen3-vl-plus",
1492
+ "qwq-32b",
1493
+ "qwq-plus",
1494
+ "tongyi-intent-detect-v3"
1495
+ ],
1496
+ venice: [
1497
+ "deepseek-coder-v2-lite",
1498
+ "deepseek-r1-671b",
1499
+ "dolphin-2.9.2-qwen2-72b",
1500
+ "llama-3.1-405b",
1501
+ "llama-3.2-3b",
1502
+ "llama-3.3-70b",
1503
+ "mistral-31-24b",
1504
+ "qwen-2.5-coder-32b",
1505
+ "qwen-2.5-qwq-32b",
1506
+ "qwen-2.5-vl",
1507
+ "qwen3-235b",
1508
+ "qwen3-4b",
1509
+ "venice-uncensored"
1510
+ ],
1511
+ chutes: [
1234
1512
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1235
1513
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1514
+ "Qwen/Qwen3-30B-A3B",
1236
1515
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1237
1516
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1238
1517
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1239
- "ZhipuAI/GLM-4.5",
1240
- "ZhipuAI/GLM-4.6"
1518
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1519
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1520
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1521
+ "chutesai/Devstral-Small-2505",
1522
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1523
+ "deepseek-ai/DeepSeek-R1-0528",
1524
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1525
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1526
+ "deepseek-ai/DeepSeek-V3-0324",
1527
+ "deepseek-ai/DeepSeek-V3.1",
1528
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1529
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1530
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1531
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1532
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1533
+ "moonshotai/Kimi-Dev-72B",
1534
+ "moonshotai/Kimi-K2-Instruct-0905",
1535
+ "moonshotai/Kimi-K2-Instruct-75k",
1536
+ "moonshotai/Kimi-VL-A3B-Thinking",
1537
+ "openai/gpt-oss-120b",
1538
+ "tngtech/DeepSeek-R1T-Chimera",
1539
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1540
+ "zai-org/GLM-4.5-Air",
1541
+ "zai-org/GLM-4.5-FP8",
1542
+ "zai-org/GLM-4.5-turbo",
1543
+ "zai-org/GLM-4.6-FP8",
1544
+ "zai-org/GLM-4.6-turbo"
1241
1545
  ],
1242
- aihubmix: [
1243
- "DeepSeek-V3.2-Exp",
1244
- "DeepSeek-V3.2-Exp-Think",
1245
- "Kimi-K2-0905",
1246
- "claude-haiku-4-5",
1247
- "claude-opus-4-1",
1248
- "claude-sonnet-4-5",
1249
- "gemini-2.5-flash",
1546
+ cortecs: [
1547
+ "claude-4-5-sonnet",
1548
+ "claude-sonnet-4",
1549
+ "deepseek-v3-0324",
1250
1550
  "gemini-2.5-pro",
1251
- "glm-4.6",
1252
1551
  "gpt-4.1",
1253
- "gpt-4.1-mini",
1254
- "gpt-4.1-nano",
1255
- "gpt-4o",
1256
- "gpt-4o-2024-11-20",
1257
- "gpt-5",
1258
- "gpt-5-codex",
1259
- "gpt-5-mini",
1260
- "gpt-5-nano",
1261
- "gpt-5-pro",
1262
- "o4-mini",
1263
- "qwen3-235b-a22b-instruct-2507",
1264
- "qwen3-235b-a22b-thinking-2507",
1552
+ "gpt-oss-120b",
1553
+ "kimi-k2-instruct",
1554
+ "llama-3.1-405b-instruct",
1555
+ "nova-pro-v1",
1556
+ "qwen3-32b",
1265
1557
  "qwen3-coder-480b-a35b-instruct"
1266
1558
  ],
1267
- lucidquery: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1268
- xai: [
1269
- "grok-2",
1270
- "grok-2-1212",
1271
- "grok-2-latest",
1272
- "grok-2-vision",
1273
- "grok-2-vision-1212",
1274
- "grok-2-vision-latest",
1275
- "grok-3",
1276
- "grok-3-fast",
1277
- "grok-3-fast-latest",
1278
- "grok-3-latest",
1279
- "grok-3-mini",
1280
- "grok-3-mini-fast",
1281
- "grok-3-mini-fast-latest",
1282
- "grok-3-mini-latest",
1283
- "grok-4",
1284
- "grok-4-fast",
1285
- "grok-4-fast-non-reasoning",
1286
- "grok-beta",
1287
- "grok-code-fast-1",
1288
- "grok-vision-beta"
1289
- ],
1290
- deepseek: ["deepseek-chat", "deepseek-reasoner"],
1291
- requesty: [
1292
- "anthropic/claude-3-7-sonnet",
1293
- "anthropic/claude-4-sonnet-20250522",
1294
- "anthropic/claude-opus-4",
1295
- "anthropic/claude-opus-4-1-20250805",
1296
- "google/gemini-2.5-flash",
1297
- "google/gemini-2.5-pro",
1559
+ "github-models": [
1560
+ "ai21-labs/ai21-jamba-1.5-large",
1561
+ "ai21-labs/ai21-jamba-1.5-mini",
1562
+ "cohere/cohere-command-a",
1563
+ "cohere/cohere-command-r",
1564
+ "cohere/cohere-command-r-08-2024",
1565
+ "cohere/cohere-command-r-plus",
1566
+ "cohere/cohere-command-r-plus-08-2024",
1567
+ "core42/jais-30b-chat",
1568
+ "deepseek/deepseek-r1",
1569
+ "deepseek/deepseek-r1-0528",
1570
+ "deepseek/deepseek-v3-0324",
1571
+ "meta/llama-3.2-11b-vision-instruct",
1572
+ "meta/llama-3.2-90b-vision-instruct",
1573
+ "meta/llama-3.3-70b-instruct",
1574
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
1575
+ "meta/llama-4-scout-17b-16e-instruct",
1576
+ "meta/meta-llama-3-70b-instruct",
1577
+ "meta/meta-llama-3-8b-instruct",
1578
+ "meta/meta-llama-3.1-405b-instruct",
1579
+ "meta/meta-llama-3.1-70b-instruct",
1580
+ "meta/meta-llama-3.1-8b-instruct",
1581
+ "microsoft/mai-ds-r1",
1582
+ "microsoft/phi-3-medium-128k-instruct",
1583
+ "microsoft/phi-3-medium-4k-instruct",
1584
+ "microsoft/phi-3-mini-128k-instruct",
1585
+ "microsoft/phi-3-mini-4k-instruct",
1586
+ "microsoft/phi-3-small-128k-instruct",
1587
+ "microsoft/phi-3-small-8k-instruct",
1588
+ "microsoft/phi-3.5-mini-instruct",
1589
+ "microsoft/phi-3.5-moe-instruct",
1590
+ "microsoft/phi-3.5-vision-instruct",
1591
+ "microsoft/phi-4",
1592
+ "microsoft/phi-4-mini-instruct",
1593
+ "microsoft/phi-4-mini-reasoning",
1594
+ "microsoft/phi-4-multimodal-instruct",
1595
+ "microsoft/phi-4-reasoning",
1596
+ "mistral-ai/codestral-2501",
1597
+ "mistral-ai/ministral-3b",
1598
+ "mistral-ai/mistral-large-2411",
1599
+ "mistral-ai/mistral-medium-2505",
1600
+ "mistral-ai/mistral-nemo",
1601
+ "mistral-ai/mistral-small-2503",
1298
1602
  "openai/gpt-4.1",
1299
1603
  "openai/gpt-4.1-mini",
1604
+ "openai/gpt-4.1-nano",
1605
+ "openai/gpt-4o",
1300
1606
  "openai/gpt-4o-mini",
1301
- "openai/gpt-5",
1302
- "openai/gpt-5-mini",
1303
- "openai/gpt-5-nano",
1304
- "openai/o4-mini"
1607
+ "openai/o1",
1608
+ "openai/o1-mini",
1609
+ "openai/o1-preview",
1610
+ "openai/o3",
1611
+ "openai/o3-mini",
1612
+ "openai/o4-mini",
1613
+ "xai/grok-3",
1614
+ "xai/grok-3-mini"
1615
+ ],
1616
+ togetherai: [
1617
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1618
+ "deepseek-ai/DeepSeek-R1",
1619
+ "deepseek-ai/DeepSeek-V3",
1620
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1621
+ "moonshotai/Kimi-K2-Instruct",
1622
+ "openai/gpt-oss-120b"
1623
+ ],
1624
+ baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1625
+ huggingface: [
1626
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1627
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1628
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1629
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1630
+ "deepseek-ai/DeepSeek-R1-0528",
1631
+ "deepseek-ai/Deepseek-V3-0324",
1632
+ "moonshotai/Kimi-K2-Instruct",
1633
+ "moonshotai/Kimi-K2-Instruct-0905",
1634
+ "zai-org/GLM-4.5",
1635
+ "zai-org/GLM-4.5-Air",
1636
+ "zai-org/GLM-4.6"
1305
1637
  ],
1306
- nebius: [
1307
- "NousResearch/hermes-4-405b",
1308
- "NousResearch/hermes-4-70b",
1309
- "deepseek-ai/deepseek-v3",
1310
- "meta-llama/llama-3.3-70b-instruct-base",
1311
- "meta-llama/llama-3.3-70b-instruct-fast",
1312
- "meta-llama/llama-3_1-405b-instruct",
1313
- "moonshotai/kimi-k2-instruct",
1314
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1315
- "openai/gpt-oss-120b",
1316
- "openai/gpt-oss-20b",
1317
- "qwen/qwen3-235b-a22b-instruct-2507",
1318
- "qwen/qwen3-235b-a22b-thinking-2507",
1319
- "qwen/qwen3-coder-480b-a35b-instruct",
1320
- "zai-org/glm-4.5",
1321
- "zai-org/glm-4.5-air"
1638
+ opencode: [
1639
+ "an-gbt",
1640
+ "big-pickle",
1641
+ "claude-3-5-haiku",
1642
+ "claude-haiku-4-5",
1643
+ "claude-opus-4-1",
1644
+ "claude-sonnet-4",
1645
+ "claude-sonnet-4-5",
1646
+ "code-supernova",
1647
+ "glm-4.6",
1648
+ "gpt-5",
1649
+ "gpt-5-codex",
1650
+ "grok-code",
1651
+ "kimi-k2",
1652
+ "qwen3-coder"
1322
1653
  ],
1323
1654
  fastrouter: [
1324
1655
  "anthropic/claude-opus-4.1",
@@ -1336,22 +1667,75 @@ var provider_registry_default = {
1336
1667
  "qwen/qwen3-coder",
1337
1668
  "x-ai/grok-4"
1338
1669
  ],
1339
- perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1340
- morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1341
- "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1342
- huggingface: [
1670
+ google: [
1671
+ "gemini-1.5-flash",
1672
+ "gemini-1.5-flash-8b",
1673
+ "gemini-1.5-pro",
1674
+ "gemini-2.0-flash",
1675
+ "gemini-2.0-flash-lite",
1676
+ "gemini-2.5-flash",
1677
+ "gemini-2.5-flash-image",
1678
+ "gemini-2.5-flash-image-preview",
1679
+ "gemini-2.5-flash-lite",
1680
+ "gemini-2.5-flash-lite-preview-06-17",
1681
+ "gemini-2.5-flash-lite-preview-09-2025",
1682
+ "gemini-2.5-flash-preview-04-17",
1683
+ "gemini-2.5-flash-preview-05-20",
1684
+ "gemini-2.5-flash-preview-09-2025",
1685
+ "gemini-2.5-flash-preview-tts",
1686
+ "gemini-2.5-pro",
1687
+ "gemini-2.5-pro-preview-05-06",
1688
+ "gemini-2.5-pro-preview-06-05",
1689
+ "gemini-2.5-pro-preview-tts",
1690
+ "gemini-flash-latest",
1691
+ "gemini-flash-lite-latest",
1692
+ "gemini-live-2.5-flash",
1693
+ "gemini-live-2.5-flash-preview-native-audio"
1694
+ ],
1695
+ inception: ["mercury", "mercury-coder"],
1696
+ wandb: [
1697
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1343
1698
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1344
1699
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1345
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1346
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1347
1700
  "deepseek-ai/DeepSeek-R1-0528",
1348
- "deepseek-ai/Deepseek-V3-0324",
1349
- "moonshotai/Kimi-K2-Instruct",
1350
- "moonshotai/Kimi-K2-Instruct-0905",
1351
- "zai-org/GLM-4.5",
1352
- "zai-org/GLM-4.5-Air",
1353
- "zai-org/GLM-4.6"
1701
+ "deepseek-ai/DeepSeek-V3-0324",
1702
+ "meta-llama/Llama-3.1-8B-Instruct",
1703
+ "meta-llama/Llama-3.3-70B-Instruct",
1704
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1705
+ "microsoft/Phi-4-mini-instruct",
1706
+ "moonshotai/Kimi-K2-Instruct"
1707
+ ],
1708
+ openai: [
1709
+ "codex-mini-latest",
1710
+ "gpt-3.5-turbo",
1711
+ "gpt-4",
1712
+ "gpt-4-turbo",
1713
+ "gpt-4.1",
1714
+ "gpt-4.1-mini",
1715
+ "gpt-4.1-nano",
1716
+ "gpt-4o",
1717
+ "gpt-4o-2024-05-13",
1718
+ "gpt-4o-2024-08-06",
1719
+ "gpt-4o-2024-11-20",
1720
+ "gpt-4o-mini",
1721
+ "gpt-5",
1722
+ "gpt-5-chat-latest",
1723
+ "gpt-5-codex",
1724
+ "gpt-5-mini",
1725
+ "gpt-5-nano",
1726
+ "o1",
1727
+ "o1-mini",
1728
+ "o1-preview",
1729
+ "o1-pro",
1730
+ "o3",
1731
+ "o3-deep-research",
1732
+ "o3-mini",
1733
+ "o3-pro",
1734
+ "o4-mini",
1735
+ "o4-mini-deep-research"
1354
1736
  ],
1737
+ "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1738
+ perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1355
1739
  openrouter: [
1356
1740
  "anthropic/claude-3.5-haiku",
1357
1741
  "anthropic/claude-3.7-sonnet",
@@ -1396,192 +1780,73 @@ var provider_registry_default = {
1396
1780
  "mistralai/devstral-small-2505:free",
1397
1781
  "mistralai/devstral-small-2507",
1398
1782
  "mistralai/mistral-7b-instruct:free",
1399
- "mistralai/mistral-medium-3",
1400
- "mistralai/mistral-medium-3.1",
1401
- "mistralai/mistral-nemo:free",
1402
- "mistralai/mistral-small-3.1-24b-instruct",
1403
- "mistralai/mistral-small-3.2-24b-instruct",
1404
- "mistralai/mistral-small-3.2-24b-instruct:free",
1405
- "moonshotai/kimi-dev-72b:free",
1406
- "moonshotai/kimi-k2",
1407
- "moonshotai/kimi-k2-0905",
1408
- "moonshotai/kimi-k2:free",
1409
- "nousresearch/deephermes-3-llama-3-8b-preview",
1410
- "nousresearch/hermes-4-405b",
1411
- "nousresearch/hermes-4-70b",
1412
- "openai/gpt-4.1",
1413
- "openai/gpt-4.1-mini",
1414
- "openai/gpt-4o-mini",
1415
- "openai/gpt-5",
1416
- "openai/gpt-5-chat",
1417
- "openai/gpt-5-codex",
1418
- "openai/gpt-5-image",
1419
- "openai/gpt-5-mini",
1420
- "openai/gpt-5-nano",
1421
- "openai/gpt-oss-120b",
1422
- "openai/gpt-oss-20b",
1423
- "openai/o4-mini",
1424
- "openrouter/cypher-alpha:free",
1425
- "openrouter/horizon-alpha",
1426
- "openrouter/horizon-beta",
1427
- "openrouter/sonoma-dusk-alpha",
1428
- "openrouter/sonoma-sky-alpha",
1429
- "qwen/qwen-2.5-coder-32b-instruct",
1430
- "qwen/qwen2.5-vl-32b-instruct:free",
1431
- "qwen/qwen2.5-vl-72b-instruct",
1432
- "qwen/qwen2.5-vl-72b-instruct:free",
1433
- "qwen/qwen3-14b:free",
1434
- "qwen/qwen3-235b-a22b-07-25",
1435
- "qwen/qwen3-235b-a22b-07-25:free",
1436
- "qwen/qwen3-235b-a22b-thinking-2507",
1437
- "qwen/qwen3-235b-a22b:free",
1438
- "qwen/qwen3-30b-a3b-instruct-2507",
1439
- "qwen/qwen3-30b-a3b-thinking-2507",
1440
- "qwen/qwen3-30b-a3b:free",
1441
- "qwen/qwen3-32b:free",
1442
- "qwen/qwen3-8b:free",
1443
- "qwen/qwen3-coder",
1444
- "qwen/qwen3-coder:free",
1445
- "qwen/qwen3-max",
1446
- "qwen/qwen3-next-80b-a3b-instruct",
1447
- "qwen/qwen3-next-80b-a3b-thinking",
1448
- "qwen/qwq-32b:free",
1449
- "rekaai/reka-flash-3",
1450
- "sarvamai/sarvam-m:free",
1451
- "thudm/glm-z1-32b:free",
1452
- "tngtech/deepseek-r1t2-chimera:free",
1453
- "x-ai/grok-3",
1454
- "x-ai/grok-3-beta",
1455
- "x-ai/grok-3-mini",
1456
- "x-ai/grok-3-mini-beta",
1457
- "x-ai/grok-4",
1458
- "x-ai/grok-4-fast",
1459
- "x-ai/grok-4-fast:free",
1460
- "x-ai/grok-code-fast-1",
1461
- "z-ai/glm-4.5",
1462
- "z-ai/glm-4.5-air",
1463
- "z-ai/glm-4.5-air:free",
1464
- "z-ai/glm-4.5v",
1465
- "z-ai/glm-4.6"
1466
- ],
1467
- cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1468
- zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1469
- togetherai: [
1470
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1471
- "deepseek-ai/DeepSeek-R1",
1472
- "deepseek-ai/DeepSeek-V3",
1473
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1474
- "moonshotai/Kimi-K2-Instruct",
1475
- "openai/gpt-oss-120b"
1476
- ],
1477
- wandb: [
1478
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1479
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1480
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1481
- "deepseek-ai/DeepSeek-R1-0528",
1482
- "deepseek-ai/DeepSeek-V3-0324",
1483
- "meta-llama/Llama-3.1-8B-Instruct",
1484
- "meta-llama/Llama-3.3-70B-Instruct",
1485
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1486
- "microsoft/Phi-4-mini-instruct",
1487
- "moonshotai/Kimi-K2-Instruct"
1488
- ],
1489
- submodel: [
1490
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1491
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1492
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1493
- "deepseek-ai/DeepSeek-R1-0528",
1494
- "deepseek-ai/DeepSeek-V3-0324",
1495
- "deepseek-ai/DeepSeek-V3.1",
1496
- "openai/gpt-oss-120b",
1497
- "zai-org/GLM-4.5-Air",
1498
- "zai-org/GLM-4.5-FP8"
1499
- ],
1500
- vercel: [
1501
- "alibaba/qwen3-coder-plus",
1502
- "alibaba/qwen3-max",
1503
- "alibaba/qwen3-next-80b-a3b-instruct",
1504
- "alibaba/qwen3-next-80b-a3b-thinking",
1505
- "alibaba/qwen3-vl-instruct",
1506
- "alibaba/qwen3-vl-thinking",
1507
- "amazon/nova-lite",
1508
- "amazon/nova-micro",
1509
- "amazon/nova-pro",
1510
- "anthropic/claude-3-5-haiku",
1511
- "anthropic/claude-3-haiku",
1512
- "anthropic/claude-3-opus",
1513
- "anthropic/claude-3.5-sonnet",
1514
- "anthropic/claude-3.7-sonnet",
1515
- "anthropic/claude-4-1-opus",
1516
- "anthropic/claude-4-opus",
1517
- "anthropic/claude-4-sonnet",
1518
- "anthropic/claude-4.5-sonnet",
1519
- "anthropic/claude-haiku-4.5",
1520
- "cerebras/qwen3-coder",
1521
- "deepseek/deepseek-r1",
1522
- "deepseek/deepseek-r1-distill-llama-70b",
1523
- "deepseek/deepseek-v3.1-terminus",
1524
- "deepseek/deepseek-v3.2-exp",
1525
- "deepseek/deepseek-v3.2-exp-thinking",
1526
- "google/gemini-2.0-flash",
1527
- "google/gemini-2.0-flash-lite",
1528
- "google/gemini-2.5-flash",
1529
- "google/gemini-2.5-flash-lite",
1530
- "google/gemini-2.5-flash-lite-preview-09-2025",
1531
- "google/gemini-2.5-flash-preview-09-2025",
1532
- "google/gemini-2.5-pro",
1533
- "meta/llama-3.3-70b",
1534
- "meta/llama-4-maverick",
1535
- "meta/llama-4-scout",
1536
- "mistral/codestral",
1537
- "mistral/magistral-medium",
1538
- "mistral/magistral-small",
1539
- "mistral/ministral-3b",
1540
- "mistral/ministral-8b",
1541
- "mistral/mistral-large",
1542
- "mistral/mistral-small",
1543
- "mistral/mixtral-8x22b-instruct",
1544
- "mistral/pixtral-12b",
1545
- "mistral/pixtral-large",
1783
+ "mistralai/mistral-medium-3",
1784
+ "mistralai/mistral-medium-3.1",
1785
+ "mistralai/mistral-nemo:free",
1786
+ "mistralai/mistral-small-3.1-24b-instruct",
1787
+ "mistralai/mistral-small-3.2-24b-instruct",
1788
+ "mistralai/mistral-small-3.2-24b-instruct:free",
1789
+ "moonshotai/kimi-dev-72b:free",
1546
1790
  "moonshotai/kimi-k2",
1547
- "morph/morph-v3-fast",
1548
- "morph/morph-v3-large",
1549
- "openai/gpt-4-turbo",
1791
+ "moonshotai/kimi-k2-0905",
1792
+ "moonshotai/kimi-k2:free",
1793
+ "nousresearch/deephermes-3-llama-3-8b-preview",
1794
+ "nousresearch/hermes-4-405b",
1795
+ "nousresearch/hermes-4-70b",
1550
1796
  "openai/gpt-4.1",
1551
1797
  "openai/gpt-4.1-mini",
1552
- "openai/gpt-4.1-nano",
1553
- "openai/gpt-4o",
1554
1798
  "openai/gpt-4o-mini",
1555
1799
  "openai/gpt-5",
1800
+ "openai/gpt-5-chat",
1556
1801
  "openai/gpt-5-codex",
1802
+ "openai/gpt-5-image",
1557
1803
  "openai/gpt-5-mini",
1558
1804
  "openai/gpt-5-nano",
1559
1805
  "openai/gpt-oss-120b",
1560
1806
  "openai/gpt-oss-20b",
1561
- "openai/o1",
1562
- "openai/o3",
1563
- "openai/o3-mini",
1564
1807
  "openai/o4-mini",
1565
- "perplexity/sonar",
1566
- "perplexity/sonar-pro",
1567
- "perplexity/sonar-reasoning",
1568
- "perplexity/sonar-reasoning-pro",
1569
- "vercel/v0-1.0-md",
1570
- "vercel/v0-1.5-md",
1571
- "xai/grok-2",
1572
- "xai/grok-2-vision",
1573
- "xai/grok-3",
1574
- "xai/grok-3-fast",
1575
- "xai/grok-3-mini",
1576
- "xai/grok-3-mini-fast",
1577
- "xai/grok-4",
1578
- "xai/grok-4-fast",
1579
- "xai/grok-4-fast-non-reasoning",
1580
- "xai/grok-code-fast-1",
1581
- "zai/glm-4.5",
1582
- "zai/glm-4.5-air",
1583
- "zai/glm-4.5v",
1584
- "zai/glm-4.6"
1808
+ "openrouter/cypher-alpha:free",
1809
+ "openrouter/horizon-alpha",
1810
+ "openrouter/horizon-beta",
1811
+ "openrouter/sonoma-dusk-alpha",
1812
+ "openrouter/sonoma-sky-alpha",
1813
+ "qwen/qwen-2.5-coder-32b-instruct",
1814
+ "qwen/qwen2.5-vl-32b-instruct:free",
1815
+ "qwen/qwen2.5-vl-72b-instruct",
1816
+ "qwen/qwen2.5-vl-72b-instruct:free",
1817
+ "qwen/qwen3-14b:free",
1818
+ "qwen/qwen3-235b-a22b-07-25",
1819
+ "qwen/qwen3-235b-a22b-07-25:free",
1820
+ "qwen/qwen3-235b-a22b-thinking-2507",
1821
+ "qwen/qwen3-235b-a22b:free",
1822
+ "qwen/qwen3-30b-a3b-instruct-2507",
1823
+ "qwen/qwen3-30b-a3b-thinking-2507",
1824
+ "qwen/qwen3-30b-a3b:free",
1825
+ "qwen/qwen3-32b:free",
1826
+ "qwen/qwen3-8b:free",
1827
+ "qwen/qwen3-coder",
1828
+ "qwen/qwen3-coder:free",
1829
+ "qwen/qwen3-max",
1830
+ "qwen/qwen3-next-80b-a3b-instruct",
1831
+ "qwen/qwen3-next-80b-a3b-thinking",
1832
+ "qwen/qwq-32b:free",
1833
+ "rekaai/reka-flash-3",
1834
+ "sarvamai/sarvam-m:free",
1835
+ "thudm/glm-z1-32b:free",
1836
+ "tngtech/deepseek-r1t2-chimera:free",
1837
+ "x-ai/grok-3",
1838
+ "x-ai/grok-3-beta",
1839
+ "x-ai/grok-3-mini",
1840
+ "x-ai/grok-3-mini-beta",
1841
+ "x-ai/grok-4",
1842
+ "x-ai/grok-4-fast",
1843
+ "x-ai/grok-4-fast:free",
1844
+ "x-ai/grok-code-fast-1",
1845
+ "z-ai/glm-4.5",
1846
+ "z-ai/glm-4.5-air",
1847
+ "z-ai/glm-4.5-air:free",
1848
+ "z-ai/glm-4.5v",
1849
+ "z-ai/glm-4.6"
1585
1850
  ],
1586
1851
  synthetic: [
1587
1852
  "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
@@ -1606,184 +1871,53 @@ var provider_registry_default = {
1606
1871
  "hf:zai-org/GLM-4.5",
1607
1872
  "hf:zai-org/GLM-4.6"
1608
1873
  ],
1609
- google: [
1610
- "gemini-1.5-flash",
1611
- "gemini-1.5-flash-8b",
1612
- "gemini-1.5-pro",
1613
- "gemini-2.0-flash",
1614
- "gemini-2.0-flash-lite",
1615
- "gemini-2.5-flash",
1616
- "gemini-2.5-flash-image",
1617
- "gemini-2.5-flash-image-preview",
1618
- "gemini-2.5-flash-lite",
1619
- "gemini-2.5-flash-lite-preview-06-17",
1620
- "gemini-2.5-flash-lite-preview-09-2025",
1621
- "gemini-2.5-flash-preview-04-17",
1622
- "gemini-2.5-flash-preview-05-20",
1623
- "gemini-2.5-flash-preview-09-2025",
1624
- "gemini-2.5-flash-preview-tts",
1625
- "gemini-2.5-pro",
1626
- "gemini-2.5-pro-preview-05-06",
1627
- "gemini-2.5-pro-preview-06-05",
1628
- "gemini-2.5-pro-preview-tts",
1629
- "gemini-flash-latest",
1630
- "gemini-flash-lite-latest",
1631
- "gemini-live-2.5-flash",
1632
- "gemini-live-2.5-flash-preview-native-audio"
1633
- ],
1634
- groq: [
1635
- "deepseek-r1-distill-llama-70b",
1636
- "gemma2-9b-it",
1637
- "llama-3.1-8b-instant",
1638
- "llama-3.3-70b-versatile",
1639
- "llama-guard-3-8b",
1640
- "llama3-70b-8192",
1641
- "llama3-8b-8192",
1642
- "meta-llama/llama-4-maverick-17b-128e-instruct",
1643
- "meta-llama/llama-4-scout-17b-16e-instruct",
1644
- "meta-llama/llama-guard-4-12b",
1645
- "mistral-saba-24b",
1646
- "moonshotai/kimi-k2-instruct",
1647
- "moonshotai/kimi-k2-instruct-0905",
1648
- "openai/gpt-oss-120b",
1649
- "openai/gpt-oss-20b",
1650
- "qwen-qwq-32b",
1651
- "qwen/qwen3-32b"
1652
- ],
1653
- "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1654
- "github-models": [
1655
- "ai21-labs/ai21-jamba-1.5-large",
1656
- "ai21-labs/ai21-jamba-1.5-mini",
1657
- "cohere/cohere-command-a",
1658
- "cohere/cohere-command-r",
1659
- "cohere/cohere-command-r-08-2024",
1660
- "cohere/cohere-command-r-plus",
1661
- "cohere/cohere-command-r-plus-08-2024",
1662
- "core42/jais-30b-chat",
1663
- "deepseek/deepseek-r1",
1664
- "deepseek/deepseek-r1-0528",
1665
- "deepseek/deepseek-v3-0324",
1666
- "meta/llama-3.2-11b-vision-instruct",
1667
- "meta/llama-3.2-90b-vision-instruct",
1668
- "meta/llama-3.3-70b-instruct",
1669
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
1670
- "meta/llama-4-scout-17b-16e-instruct",
1671
- "meta/meta-llama-3-70b-instruct",
1672
- "meta/meta-llama-3-8b-instruct",
1673
- "meta/meta-llama-3.1-405b-instruct",
1674
- "meta/meta-llama-3.1-70b-instruct",
1675
- "meta/meta-llama-3.1-8b-instruct",
1676
- "microsoft/mai-ds-r1",
1677
- "microsoft/phi-3-medium-128k-instruct",
1678
- "microsoft/phi-3-medium-4k-instruct",
1679
- "microsoft/phi-3-mini-128k-instruct",
1680
- "microsoft/phi-3-mini-4k-instruct",
1681
- "microsoft/phi-3-small-128k-instruct",
1682
- "microsoft/phi-3-small-8k-instruct",
1683
- "microsoft/phi-3.5-mini-instruct",
1684
- "microsoft/phi-3.5-moe-instruct",
1685
- "microsoft/phi-3.5-vision-instruct",
1686
- "microsoft/phi-4",
1687
- "microsoft/phi-4-mini-instruct",
1688
- "microsoft/phi-4-mini-reasoning",
1689
- "microsoft/phi-4-multimodal-instruct",
1690
- "microsoft/phi-4-reasoning",
1691
- "mistral-ai/codestral-2501",
1692
- "mistral-ai/ministral-3b",
1693
- "mistral-ai/mistral-large-2411",
1694
- "mistral-ai/mistral-medium-2505",
1695
- "mistral-ai/mistral-nemo",
1696
- "mistral-ai/mistral-small-2503",
1697
- "openai/gpt-4.1",
1698
- "openai/gpt-4.1-mini",
1699
- "openai/gpt-4.1-nano",
1700
- "openai/gpt-4o",
1701
- "openai/gpt-4o-mini",
1702
- "openai/o1",
1703
- "openai/o1-mini",
1704
- "openai/o1-preview",
1705
- "openai/o3",
1706
- "openai/o3-mini",
1707
- "openai/o4-mini",
1708
- "xai/grok-3",
1709
- "xai/grok-3-mini"
1710
- ],
1711
1874
  deepinfra: [
1712
1875
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1713
1876
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1714
1877
  "moonshotai/Kimi-K2-Instruct",
1715
1878
  "zai-org/GLM-4.5"
1716
1879
  ],
1717
- "fireworks-ai": [
1718
- "accounts/fireworks/models/deepseek-r1-0528",
1719
- "accounts/fireworks/models/deepseek-v3-0324",
1720
- "accounts/fireworks/models/deepseek-v3p1",
1721
- "accounts/fireworks/models/glm-4p5",
1722
- "accounts/fireworks/models/glm-4p5-air",
1723
- "accounts/fireworks/models/gpt-oss-120b",
1724
- "accounts/fireworks/models/gpt-oss-20b",
1725
- "accounts/fireworks/models/kimi-k2-instruct",
1726
- "accounts/fireworks/models/qwen3-235b-a22b",
1727
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1880
+ zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1881
+ submodel: [
1882
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1883
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1884
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1885
+ "deepseek-ai/DeepSeek-R1-0528",
1886
+ "deepseek-ai/DeepSeek-V3-0324",
1887
+ "deepseek-ai/DeepSeek-V3.1",
1888
+ "openai/gpt-oss-120b",
1889
+ "zai-org/GLM-4.5-Air",
1890
+ "zai-org/GLM-4.5-FP8"
1728
1891
  ],
1729
1892
  zai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1730
- opencode: [
1731
- "an-gbt",
1732
- "big-pickle",
1733
- "claude-3-5-haiku",
1734
- "claude-haiku-4-5",
1735
- "claude-opus-4-1",
1736
- "claude-sonnet-4",
1737
- "claude-sonnet-4-5",
1738
- "code-supernova",
1739
- "glm-4.6",
1740
- "gpt-5",
1741
- "gpt-5-codex",
1742
- "grok-code",
1743
- "kimi-k2",
1744
- "qwen3-coder"
1893
+ inference: [
1894
+ "google/gemma-3",
1895
+ "meta/llama-3.1-8b-instruct",
1896
+ "meta/llama-3.2-11b-vision-instruct",
1897
+ "meta/llama-3.2-1b-instruct",
1898
+ "meta/llama-3.2-3b-instruct",
1899
+ "mistral/mistral-nemo-12b-instruct",
1900
+ "osmosis/osmosis-structure-0.6b",
1901
+ "qwen/qwen-2.5-7b-vision-instruct",
1902
+ "qwen/qwen3-embedding-4b"
1745
1903
  ],
1746
- "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1747
- inception: ["mercury", "mercury-coder"],
1748
- llama: [
1749
- "cerebras-llama-4-maverick-17b-128e-instruct",
1750
- "cerebras-llama-4-scout-17b-16e-instruct",
1751
- "groq-llama-4-maverick-17b-128e-instruct",
1752
- "llama-3.3-70b-instruct",
1753
- "llama-3.3-8b-instruct",
1754
- "llama-4-maverick-17b-128e-instruct-fp8",
1755
- "llama-4-scout-17b-16e-instruct-fp8"
1904
+ requesty: [
1905
+ "anthropic/claude-3-7-sonnet",
1906
+ "anthropic/claude-4-sonnet-20250522",
1907
+ "anthropic/claude-opus-4",
1908
+ "anthropic/claude-opus-4-1-20250805",
1909
+ "google/gemini-2.5-flash",
1910
+ "google/gemini-2.5-pro",
1911
+ "openai/gpt-4.1",
1912
+ "openai/gpt-4.1-mini",
1913
+ "openai/gpt-4o-mini",
1914
+ "openai/gpt-5",
1915
+ "openai/gpt-5-mini",
1916
+ "openai/gpt-5-nano",
1917
+ "openai/o4-mini"
1756
1918
  ],
1919
+ morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1757
1920
  lmstudio: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1758
- openai: [
1759
- "codex-mini-latest",
1760
- "gpt-3.5-turbo",
1761
- "gpt-4",
1762
- "gpt-4-turbo",
1763
- "gpt-4.1",
1764
- "gpt-4.1-mini",
1765
- "gpt-4.1-nano",
1766
- "gpt-4o",
1767
- "gpt-4o-2024-05-13",
1768
- "gpt-4o-2024-08-06",
1769
- "gpt-4o-2024-11-20",
1770
- "gpt-4o-mini",
1771
- "gpt-5",
1772
- "gpt-5-chat-latest",
1773
- "gpt-5-codex",
1774
- "gpt-5-mini",
1775
- "gpt-5-nano",
1776
- "o1",
1777
- "o1-mini",
1778
- "o1-preview",
1779
- "o1-pro",
1780
- "o3",
1781
- "o3-deep-research",
1782
- "o3-mini",
1783
- "o3-pro",
1784
- "o4-mini",
1785
- "o4-mini-deep-research"
1786
- ],
1787
1921
  anthropic: [
1788
1922
  "claude-3-5-haiku-20241022",
1789
1923
  "claude-3-5-haiku-latest",
@@ -1805,208 +1939,50 @@ var provider_registry_default = {
1805
1939
  "claude-sonnet-4-5",
1806
1940
  "claude-sonnet-4-5-20250929"
1807
1941
  ],
1808
- moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1809
- inference: [
1810
- "google/gemma-3",
1811
- "meta/llama-3.1-8b-instruct",
1812
- "meta/llama-3.2-11b-vision-instruct",
1813
- "meta/llama-3.2-1b-instruct",
1814
- "meta/llama-3.2-3b-instruct",
1815
- "mistral/mistral-nemo-12b-instruct",
1816
- "osmosis/osmosis-structure-0.6b",
1817
- "qwen/qwen-2.5-7b-vision-instruct",
1818
- "qwen/qwen3-embedding-4b"
1819
- ],
1820
- baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1821
- cortecs: [
1822
- "claude-4-5-sonnet",
1823
- "claude-sonnet-4",
1824
- "deepseek-v3-0324",
1825
- "gemini-2.5-pro",
1826
- "gpt-4.1",
1827
- "gpt-oss-120b",
1828
- "kimi-k2-instruct",
1829
- "llama-3.1-405b-instruct",
1830
- "nova-pro-v1",
1831
- "qwen3-32b",
1832
- "qwen3-coder-480b-a35b-instruct"
1833
- ],
1834
- mistral: [
1835
- "codestral-latest",
1836
- "devstral-medium-2507",
1837
- "devstral-small-2505",
1838
- "devstral-small-2507",
1839
- "magistral-medium-latest",
1840
- "magistral-small",
1841
- "ministral-3b-latest",
1842
- "ministral-8b-latest",
1843
- "mistral-large-latest",
1844
- "mistral-medium-2505",
1845
- "mistral-medium-2508",
1846
- "mistral-medium-latest",
1847
- "mistral-nemo",
1848
- "mistral-small-latest",
1849
- "open-mistral-7b",
1850
- "open-mixtral-8x22b",
1851
- "open-mixtral-8x7b",
1852
- "pixtral-12b",
1853
- "pixtral-large-latest"
1854
- ],
1855
- venice: [
1856
- "deepseek-coder-v2-lite",
1857
- "deepseek-r1-671b",
1858
- "dolphin-2.9.2-qwen2-72b",
1859
- "llama-3.1-405b",
1860
- "llama-3.2-3b",
1861
- "llama-3.3-70b",
1862
- "mistral-31-24b",
1863
- "qwen-2.5-coder-32b",
1864
- "qwen-2.5-qwq-32b",
1865
- "qwen-2.5-vl",
1866
- "qwen3-235b",
1867
- "qwen3-4b",
1868
- "venice-uncensored"
1869
- ],
1870
- alibaba: [
1871
- "qvq-max",
1872
- "qwen-flash",
1873
- "qwen-max",
1874
- "qwen-mt-plus",
1875
- "qwen-mt-turbo",
1876
- "qwen-omni-turbo",
1877
- "qwen-omni-turbo-realtime",
1878
- "qwen-plus",
1879
- "qwen-plus-character-ja",
1880
- "qwen-turbo",
1881
- "qwen-vl-max",
1882
- "qwen-vl-ocr",
1883
- "qwen-vl-plus",
1884
- "qwen2-5-14b-instruct",
1885
- "qwen2-5-32b-instruct",
1886
- "qwen2-5-72b-instruct",
1887
- "qwen2-5-7b-instruct",
1888
- "qwen2-5-omni-7b",
1889
- "qwen2-5-vl-72b-instruct",
1890
- "qwen2-5-vl-7b-instruct",
1891
- "qwen3-14b",
1892
- "qwen3-235b-a22b",
1893
- "qwen3-32b",
1894
- "qwen3-8b",
1895
- "qwen3-asr-flash",
1896
- "qwen3-coder-30b-a3b-instruct",
1897
- "qwen3-coder-480b-a35b-instruct",
1898
- "qwen3-coder-flash",
1899
- "qwen3-coder-plus",
1900
- "qwen3-livetranslate-flash-realtime",
1901
- "qwen3-max",
1902
- "qwen3-next-80b-a3b-instruct",
1903
- "qwen3-next-80b-a3b-thinking",
1904
- "qwen3-omni-flash",
1905
- "qwen3-omni-flash-realtime",
1906
- "qwen3-vl-235b-a22b",
1907
- "qwen3-vl-30b-a3b",
1908
- "qwen3-vl-plus",
1909
- "qwq-plus"
1910
- ],
1911
- "alibaba-cn": [
1912
- "deepseek-r1",
1913
- "deepseek-r1-0528",
1914
- "deepseek-r1-distill-llama-70b",
1915
- "deepseek-r1-distill-llama-8b",
1916
- "deepseek-r1-distill-qwen-1-5b",
1917
- "deepseek-r1-distill-qwen-14b",
1918
- "deepseek-r1-distill-qwen-32b",
1919
- "deepseek-r1-distill-qwen-7b",
1920
- "deepseek-v3",
1921
- "deepseek-v3-1",
1922
- "deepseek-v3-2-exp",
1923
- "moonshot-kimi-k2-instruct",
1924
- "qvq-max",
1925
- "qwen-deep-research",
1926
- "qwen-doc-turbo",
1927
- "qwen-flash",
1928
- "qwen-long",
1929
- "qwen-math-plus",
1930
- "qwen-math-turbo",
1931
- "qwen-max",
1932
- "qwen-mt-plus",
1933
- "qwen-mt-turbo",
1934
- "qwen-omni-turbo",
1935
- "qwen-omni-turbo-realtime",
1936
- "qwen-plus",
1937
- "qwen-plus-character",
1938
- "qwen-turbo",
1939
- "qwen-vl-max",
1940
- "qwen-vl-ocr",
1941
- "qwen-vl-plus",
1942
- "qwen2-5-14b-instruct",
1943
- "qwen2-5-32b-instruct",
1944
- "qwen2-5-72b-instruct",
1945
- "qwen2-5-7b-instruct",
1946
- "qwen2-5-coder-32b-instruct",
1947
- "qwen2-5-coder-7b-instruct",
1948
- "qwen2-5-math-72b-instruct",
1949
- "qwen2-5-math-7b-instruct",
1950
- "qwen2-5-omni-7b",
1951
- "qwen2-5-vl-72b-instruct",
1952
- "qwen2-5-vl-7b-instruct",
1953
- "qwen3-14b",
1954
- "qwen3-235b-a22b",
1955
- "qwen3-32b",
1956
- "qwen3-8b",
1957
- "qwen3-asr-flash",
1958
- "qwen3-coder-30b-a3b-instruct",
1959
- "qwen3-coder-480b-a35b-instruct",
1960
- "qwen3-coder-flash",
1961
- "qwen3-coder-plus",
1962
- "qwen3-max",
1963
- "qwen3-next-80b-a3b-instruct",
1964
- "qwen3-next-80b-a3b-thinking",
1965
- "qwen3-omni-flash",
1966
- "qwen3-omni-flash-realtime",
1967
- "qwen3-vl-235b-a22b",
1968
- "qwen3-vl-30b-a3b",
1969
- "qwen3-vl-plus",
1970
- "qwq-32b",
1971
- "qwq-plus",
1972
- "tongyi-intent-detect-v3"
1942
+ "fireworks-ai": [
1943
+ "accounts/fireworks/models/deepseek-r1-0528",
1944
+ "accounts/fireworks/models/deepseek-v3-0324",
1945
+ "accounts/fireworks/models/deepseek-v3p1",
1946
+ "accounts/fireworks/models/glm-4p5",
1947
+ "accounts/fireworks/models/glm-4p5-air",
1948
+ "accounts/fireworks/models/gpt-oss-120b",
1949
+ "accounts/fireworks/models/gpt-oss-20b",
1950
+ "accounts/fireworks/models/kimi-k2-instruct",
1951
+ "accounts/fireworks/models/qwen3-235b-a22b",
1952
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1973
1953
  ],
1974
- chutes: [
1954
+ modelscope: [
1975
1955
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1976
1956
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1977
- "Qwen/Qwen3-30B-A3B",
1978
1957
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1979
1958
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1980
1959
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1981
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1982
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1983
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1984
- "chutesai/Devstral-Small-2505",
1985
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1986
- "deepseek-ai/DeepSeek-R1-0528",
1987
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1988
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1989
- "deepseek-ai/DeepSeek-V3-0324",
1990
- "deepseek-ai/DeepSeek-V3.1",
1991
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1992
- "deepseek-ai/DeepSeek-V3.1-turbo",
1993
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1994
- "deepseek-ai/DeepSeek-V3.2-Exp",
1995
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1996
- "moonshotai/Kimi-Dev-72B",
1997
- "moonshotai/Kimi-K2-Instruct-0905",
1998
- "moonshotai/Kimi-K2-Instruct-75k",
1999
- "moonshotai/Kimi-VL-A3B-Thinking",
2000
- "openai/gpt-oss-120b",
2001
- "tngtech/DeepSeek-R1T-Chimera",
2002
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
2003
- "zai-org/GLM-4.5-Air",
2004
- "zai-org/GLM-4.5-FP8",
2005
- "zai-org/GLM-4.5-turbo",
2006
- "zai-org/GLM-4.6-FP8",
2007
- "zai-org/GLM-4.6-turbo"
1960
+ "ZhipuAI/GLM-4.5",
1961
+ "ZhipuAI/GLM-4.6"
2008
1962
  ],
2009
- upstage: ["solar-mini", "solar-pro2"],
1963
+ llama: [
1964
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1965
+ "cerebras-llama-4-scout-17b-16e-instruct",
1966
+ "groq-llama-4-maverick-17b-128e-instruct",
1967
+ "llama-3.3-70b-instruct",
1968
+ "llama-3.3-8b-instruct",
1969
+ "llama-4-maverick-17b-128e-instruct-fp8",
1970
+ "llama-4-scout-17b-16e-instruct-fp8"
1971
+ ],
1972
+ scaleway: [
1973
+ "deepseek-r1-distill-llama-70b",
1974
+ "gemma-3-27b-it",
1975
+ "gpt-oss-120b",
1976
+ "llama-3.1-8b-instruct",
1977
+ "llama-3.3-70b-instruct",
1978
+ "mistral-nemo-instruct-2407",
1979
+ "mistral-small-3.2-24b-instruct-2506",
1980
+ "pixtral-12b-2409",
1981
+ "qwen3-235b-a22b-instruct-2507",
1982
+ "qwen3-coder-30b-a3b-instruct",
1983
+ "voxtral-small-24b-2507"
1984
+ ],
1985
+ cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
2010
1986
  netlify: [
2011
1987
  "anthropic/claude-3-5-haiku-20241022",
2012
1988
  "anthropic/claude-3-5-haiku-latest",
@@ -2078,7 +2054,7 @@ function saveLastRefreshTimeToDisk(date) {
2078
2054
  }
2079
2055
  function getPackageRoot() {
2080
2056
  try {
2081
- const require2 = module$1.createRequire((typeof document === 'undefined' ? require('u' + 'rl').pathToFileURL(__filename).href : (_documentCurrentScript && _documentCurrentScript.tagName.toUpperCase() === 'SCRIPT' && _documentCurrentScript.src || new URL('chunk-ZMPSVDDO.cjs', document.baseURI).href)) || "file://");
2057
+ const require2 = module$1.createRequire((typeof document === 'undefined' ? require('u' + 'rl').pathToFileURL(__filename).href : (_documentCurrentScript && _documentCurrentScript.tagName.toUpperCase() === 'SCRIPT' && _documentCurrentScript.src || new URL('chunk-FMNZ3BPT.cjs', document.baseURI).href)) || "file://");
2082
2058
  const packageJsonPath = require2.resolve("@mastra/core/package.json");
2083
2059
  return path__default.default.dirname(packageJsonPath);
2084
2060
  } catch {
@@ -2594,5 +2570,5 @@ exports.PROVIDER_REGISTRY = PROVIDER_REGISTRY;
2594
2570
  exports.getProviderConfig = getProviderConfig;
2595
2571
  exports.parseModelString = parseModelString;
2596
2572
  exports.resolveModelConfig = resolveModelConfig;
2597
- //# sourceMappingURL=chunk-ZMPSVDDO.cjs.map
2598
- //# sourceMappingURL=chunk-ZMPSVDDO.cjs.map
2573
+ //# sourceMappingURL=chunk-FMNZ3BPT.cjs.map
2574
+ //# sourceMappingURL=chunk-FMNZ3BPT.cjs.map