@mastra/core 0.21.2-alpha.0 → 0.22.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (181) hide show
  1. package/CHANGELOG.md +194 -0
  2. package/dist/agent/agent.d.ts +1 -0
  3. package/dist/agent/agent.d.ts.map +1 -1
  4. package/dist/agent/index.cjs +13 -13
  5. package/dist/agent/index.js +2 -2
  6. package/dist/agent/input-processor/index.cjs +6 -6
  7. package/dist/agent/input-processor/index.js +1 -1
  8. package/dist/agent/message-list/index.d.ts +14 -1
  9. package/dist/agent/message-list/index.d.ts.map +1 -1
  10. package/dist/agent/test-utils.d.ts +1 -0
  11. package/dist/agent/test-utils.d.ts.map +1 -1
  12. package/dist/agent/types.d.ts +6 -1
  13. package/dist/agent/types.d.ts.map +1 -1
  14. package/dist/agent/utils.d.ts +1 -1
  15. package/dist/agent/utils.d.ts.map +1 -1
  16. package/dist/ai-tracing/chunk-tracing.d.ts +76 -0
  17. package/dist/ai-tracing/chunk-tracing.d.ts.map +1 -0
  18. package/dist/ai-tracing/exporters/base.d.ts +111 -0
  19. package/dist/ai-tracing/exporters/base.d.ts.map +1 -0
  20. package/dist/ai-tracing/exporters/cloud.d.ts +6 -8
  21. package/dist/ai-tracing/exporters/cloud.d.ts.map +1 -1
  22. package/dist/ai-tracing/exporters/console.d.ts +6 -6
  23. package/dist/ai-tracing/exporters/console.d.ts.map +1 -1
  24. package/dist/ai-tracing/exporters/index.d.ts +1 -0
  25. package/dist/ai-tracing/exporters/index.d.ts.map +1 -1
  26. package/dist/ai-tracing/index.cjs +48 -32
  27. package/dist/ai-tracing/index.d.ts +1 -0
  28. package/dist/ai-tracing/index.d.ts.map +1 -1
  29. package/dist/ai-tracing/index.js +1 -1
  30. package/dist/ai-tracing/spans/base.d.ts +4 -1
  31. package/dist/ai-tracing/spans/base.d.ts.map +1 -1
  32. package/dist/ai-tracing/spans/default.d.ts.map +1 -1
  33. package/dist/ai-tracing/tracers/base.d.ts +15 -1
  34. package/dist/ai-tracing/tracers/base.d.ts.map +1 -1
  35. package/dist/ai-tracing/types.d.ts +85 -11
  36. package/dist/ai-tracing/types.d.ts.map +1 -1
  37. package/dist/ai-tracing/utils.d.ts +14 -0
  38. package/dist/ai-tracing/utils.d.ts.map +1 -1
  39. package/dist/{chunk-D3IOLHNB.cjs → chunk-34L2Z6PH.cjs} +12 -12
  40. package/dist/{chunk-D3IOLHNB.cjs.map → chunk-34L2Z6PH.cjs.map} +1 -1
  41. package/dist/{chunk-BLVB2IJK.js → chunk-3CVE7NQC.js} +728 -267
  42. package/dist/chunk-3CVE7NQC.js.map +1 -0
  43. package/dist/{chunk-URQI7RJ3.cjs → chunk-5GIAZ3CH.cjs} +734 -269
  44. package/dist/chunk-5GIAZ3CH.cjs.map +1 -0
  45. package/dist/{chunk-XYNSPEJO.js → chunk-5NYWRAJN.js} +3 -3
  46. package/dist/{chunk-XYNSPEJO.js.map → chunk-5NYWRAJN.js.map} +1 -1
  47. package/dist/{chunk-URVM3Y4T.cjs → chunk-634YFL42.cjs} +44 -7
  48. package/dist/chunk-634YFL42.cjs.map +1 -0
  49. package/dist/{chunk-NIESGYOH.js → chunk-A3TQYIIR.js} +1392 -1416
  50. package/dist/chunk-A3TQYIIR.js.map +1 -0
  51. package/dist/{chunk-EGNHIPGJ.cjs → chunk-A4B6IAKN.cjs} +4 -4
  52. package/dist/{chunk-EGNHIPGJ.cjs.map → chunk-A4B6IAKN.cjs.map} +1 -1
  53. package/dist/{chunk-LMP5KMU3.js → chunk-AGD5B3FB.js} +43 -6
  54. package/dist/chunk-AGD5B3FB.js.map +1 -0
  55. package/dist/{chunk-V5WDWSQ5.cjs → chunk-CAZTWPDK.cjs} +11 -11
  56. package/dist/{chunk-V5WDWSQ5.cjs.map → chunk-CAZTWPDK.cjs.map} +1 -1
  57. package/dist/{chunk-N3ZSX5OS.js → chunk-F7OMDF5K.js} +72 -36
  58. package/dist/chunk-F7OMDF5K.js.map +1 -0
  59. package/dist/{chunk-ZMPSVDDO.cjs → chunk-FMNZ3BPT.cjs} +1393 -1417
  60. package/dist/chunk-FMNZ3BPT.cjs.map +1 -0
  61. package/dist/{chunk-4ZFVJA3A.js → chunk-HZIF7HQC.js} +3 -3
  62. package/dist/{chunk-4ZFVJA3A.js.map → chunk-HZIF7HQC.js.map} +1 -1
  63. package/dist/{chunk-KLWDUSBX.js → chunk-ITFEGBP2.js} +4 -4
  64. package/dist/{chunk-KLWDUSBX.js.map → chunk-ITFEGBP2.js.map} +1 -1
  65. package/dist/{chunk-GKTRUHKB.js → chunk-KQBF5ZEN.js} +5 -5
  66. package/dist/{chunk-GKTRUHKB.js.map → chunk-KQBF5ZEN.js.map} +1 -1
  67. package/dist/{chunk-R35PINKN.js → chunk-MHICZASQ.js} +5 -5
  68. package/dist/{chunk-R35PINKN.js.map → chunk-MHICZASQ.js.map} +1 -1
  69. package/dist/{chunk-H4KO46HZ.js → chunk-MKCC5K77.js} +3 -3
  70. package/dist/{chunk-H4KO46HZ.js.map → chunk-MKCC5K77.js.map} +1 -1
  71. package/dist/{chunk-UN653TND.cjs → chunk-O4KVF3MI.cjs} +4 -4
  72. package/dist/{chunk-UN653TND.cjs.map → chunk-O4KVF3MI.cjs.map} +1 -1
  73. package/dist/{chunk-WI2YMBNG.cjs → chunk-QBPTDMR7.cjs} +102 -64
  74. package/dist/chunk-QBPTDMR7.cjs.map +1 -0
  75. package/dist/{chunk-7P5FMQQK.cjs → chunk-RWWOJXMF.cjs} +6 -6
  76. package/dist/{chunk-7P5FMQQK.cjs.map → chunk-RWWOJXMF.cjs.map} +1 -1
  77. package/dist/{chunk-XBJP7THY.js → chunk-RXBG6UV2.js} +4 -4
  78. package/dist/chunk-RXBG6UV2.js.map +1 -0
  79. package/dist/{chunk-NL3P7IFI.js → chunk-SF75RENF.js} +3 -3
  80. package/dist/{chunk-NL3P7IFI.js.map → chunk-SF75RENF.js.map} +1 -1
  81. package/dist/{chunk-SE4PA467.cjs → chunk-VF676YCO.cjs} +2 -2
  82. package/dist/chunk-VF676YCO.cjs.map +1 -0
  83. package/dist/{chunk-6OLRLZJ3.js → chunk-WM4RO23J.js} +2 -2
  84. package/dist/chunk-WM4RO23J.js.map +1 -0
  85. package/dist/{chunk-MVVMHOAC.cjs → chunk-YOVX3R5U.cjs} +14 -14
  86. package/dist/chunk-YOVX3R5U.cjs.map +1 -0
  87. package/dist/{chunk-L5A4MRCK.cjs → chunk-ZABG3SZ2.cjs} +4 -4
  88. package/dist/{chunk-L5A4MRCK.cjs.map → chunk-ZABG3SZ2.cjs.map} +1 -1
  89. package/dist/{chunk-YKVVW65D.cjs → chunk-ZDW322JC.cjs} +8 -8
  90. package/dist/{chunk-YKVVW65D.cjs.map → chunk-ZDW322JC.cjs.map} +1 -1
  91. package/dist/index.cjs +53 -53
  92. package/dist/index.js +11 -11
  93. package/dist/integration/index.cjs +3 -3
  94. package/dist/integration/index.js +1 -1
  95. package/dist/llm/index.cjs +7 -7
  96. package/dist/llm/index.js +1 -1
  97. package/dist/llm/model/model.loop.d.ts.map +1 -1
  98. package/dist/llm/model/provider-types.generated.d.ts +585 -597
  99. package/dist/loop/index.cjs +2 -2
  100. package/dist/loop/index.js +1 -1
  101. package/dist/loop/loop.d.ts.map +1 -1
  102. package/dist/loop/test-utils/mock-server-response.d.ts +7 -2
  103. package/dist/loop/test-utils/mock-server-response.d.ts.map +1 -1
  104. package/dist/loop/test-utils/options.d.ts.map +1 -1
  105. package/dist/loop/types.d.ts +2 -1
  106. package/dist/loop/types.d.ts.map +1 -1
  107. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts.map +1 -1
  108. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts +1 -1
  109. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts.map +1 -1
  110. package/dist/mastra/index.cjs +2 -2
  111. package/dist/mastra/index.js +1 -1
  112. package/dist/memory/index.cjs +4 -4
  113. package/dist/memory/index.js +1 -1
  114. package/dist/memory/memory.d.ts +3 -2
  115. package/dist/memory/memory.d.ts.map +1 -1
  116. package/dist/processors/index.cjs +11 -11
  117. package/dist/processors/index.js +1 -1
  118. package/dist/provider-registry.json +1390 -1414
  119. package/dist/relevance/index.cjs +4 -4
  120. package/dist/relevance/index.js +1 -1
  121. package/dist/scores/index.cjs +9 -9
  122. package/dist/scores/index.js +2 -2
  123. package/dist/scores/scoreTraces/index.cjs +8 -8
  124. package/dist/scores/scoreTraces/index.js +3 -3
  125. package/dist/storage/index.cjs +3 -3
  126. package/dist/storage/index.js +1 -1
  127. package/dist/stream/RunOutput.d.ts +72 -0
  128. package/dist/stream/RunOutput.d.ts.map +1 -0
  129. package/dist/stream/aisdk/v5/output.d.ts +2 -2
  130. package/dist/stream/aisdk/v5/output.d.ts.map +1 -1
  131. package/dist/stream/base/base.d.ts +7 -0
  132. package/dist/stream/base/base.d.ts.map +1 -0
  133. package/dist/stream/base/consume-stream.d.ts +5 -0
  134. package/dist/stream/base/consume-stream.d.ts.map +1 -0
  135. package/dist/stream/base/output.d.ts.map +1 -1
  136. package/dist/stream/index.cjs +14 -10
  137. package/dist/stream/index.d.ts +2 -1
  138. package/dist/stream/index.d.ts.map +1 -1
  139. package/dist/stream/index.js +2 -2
  140. package/dist/stream/types.d.ts +1 -1
  141. package/dist/stream/types.d.ts.map +1 -1
  142. package/dist/test-utils/llm-mock.cjs +2 -2
  143. package/dist/test-utils/llm-mock.js +1 -1
  144. package/dist/tools/index.cjs +4 -4
  145. package/dist/tools/index.js +1 -1
  146. package/dist/tools/is-vercel-tool.cjs +2 -2
  147. package/dist/tools/is-vercel-tool.js +1 -1
  148. package/dist/tools/tool-builder/builder.d.ts +75 -2
  149. package/dist/tools/tool-builder/builder.d.ts.map +1 -1
  150. package/dist/tools/tool.d.ts +2 -2
  151. package/dist/tools/tool.d.ts.map +1 -1
  152. package/dist/tools/types.d.ts +17 -12
  153. package/dist/tools/types.d.ts.map +1 -1
  154. package/dist/utils.cjs +17 -17
  155. package/dist/utils.d.ts +1 -0
  156. package/dist/utils.d.ts.map +1 -1
  157. package/dist/utils.js +1 -1
  158. package/dist/workflows/evented/index.cjs +10 -10
  159. package/dist/workflows/evented/index.js +1 -1
  160. package/dist/workflows/evented/workflow.d.ts +5 -3
  161. package/dist/workflows/evented/workflow.d.ts.map +1 -1
  162. package/dist/workflows/index.cjs +12 -12
  163. package/dist/workflows/index.js +1 -1
  164. package/dist/workflows/legacy/index.cjs +22 -22
  165. package/dist/workflows/legacy/index.js +1 -1
  166. package/dist/workflows/workflow.d.ts +30 -23
  167. package/dist/workflows/workflow.d.ts.map +1 -1
  168. package/package.json +12 -10
  169. package/src/llm/model/provider-types.generated.d.ts +585 -597
  170. package/dist/chunk-6OLRLZJ3.js.map +0 -1
  171. package/dist/chunk-BLVB2IJK.js.map +0 -1
  172. package/dist/chunk-LMP5KMU3.js.map +0 -1
  173. package/dist/chunk-MVVMHOAC.cjs.map +0 -1
  174. package/dist/chunk-N3ZSX5OS.js.map +0 -1
  175. package/dist/chunk-NIESGYOH.js.map +0 -1
  176. package/dist/chunk-SE4PA467.cjs.map +0 -1
  177. package/dist/chunk-URQI7RJ3.cjs.map +0 -1
  178. package/dist/chunk-URVM3Y4T.cjs.map +0 -1
  179. package/dist/chunk-WI2YMBNG.cjs.map +0 -1
  180. package/dist/chunk-XBJP7THY.js.map +0 -1
  181. package/dist/chunk-ZMPSVDDO.cjs.map +0 -1
@@ -14,79 +14,13 @@ import { createOpenAI } from '@ai-sdk/openai-v5';
14
14
  // src/llm/model/provider-registry.json
15
15
  var provider_registry_default = {
16
16
  providers: {
17
- nvidia: {
18
- url: "https://integrate.api.nvidia.com/v1",
19
- apiKeyEnvVar: "NVIDIA_API_KEY",
20
- apiKeyHeader: "Authorization",
21
- name: "Nvidia",
22
- models: [
23
- "black-forest-labs/flux.1-dev",
24
- "deepseek-ai/deepseek-v3.1",
25
- "deepseek-ai/deepseek-v3.1-terminus",
26
- "google/gemma-3-27b-it",
27
- "microsoft/phi-4-mini-instruct",
28
- "moonshotai/kimi-k2-instruct",
29
- "moonshotai/kimi-k2-instruct-0905",
30
- "nvidia/cosmos-nemotron-34b",
31
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
32
- "nvidia/nemoretriever-ocr-v1",
33
- "nvidia/parakeet-tdt-0.6b-v2",
34
- "openai/gpt-oss-120b",
35
- "openai/whisper-large-v3",
36
- "qwen/qwen3-235b-a22b",
37
- "qwen/qwen3-coder-480b-a35b-instruct"
38
- ],
39
- docUrl: "https://docs.api.nvidia.com/nim/",
40
- gateway: "models.dev"
41
- },
42
- modelscope: {
43
- url: "https://api-inference.modelscope.cn/v1",
44
- apiKeyEnvVar: "MODELSCOPE_API_KEY",
45
- apiKeyHeader: "Authorization",
46
- name: "ModelScope",
47
- models: [
48
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
49
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
50
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
51
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
52
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
53
- "ZhipuAI/GLM-4.5",
54
- "ZhipuAI/GLM-4.6"
55
- ],
56
- docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
57
- gateway: "models.dev"
58
- },
59
- aihubmix: {
60
- url: "https://api.aihubmix.com/v1",
61
- apiKeyEnvVar: "AIHUBMIX_API_KEY",
17
+ "moonshotai-cn": {
18
+ url: "https://api.moonshot.cn/v1",
19
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
62
20
  apiKeyHeader: "Authorization",
63
- name: "AIHubMix",
64
- models: [
65
- "DeepSeek-V3.2-Exp",
66
- "DeepSeek-V3.2-Exp-Think",
67
- "Kimi-K2-0905",
68
- "claude-haiku-4-5",
69
- "claude-opus-4-1",
70
- "claude-sonnet-4-5",
71
- "gemini-2.5-flash",
72
- "gemini-2.5-pro",
73
- "glm-4.6",
74
- "gpt-4.1",
75
- "gpt-4.1-mini",
76
- "gpt-4.1-nano",
77
- "gpt-4o",
78
- "gpt-4o-2024-11-20",
79
- "gpt-5",
80
- "gpt-5-codex",
81
- "gpt-5-mini",
82
- "gpt-5-nano",
83
- "gpt-5-pro",
84
- "o4-mini",
85
- "qwen3-235b-a22b-instruct-2507",
86
- "qwen3-235b-a22b-thinking-2507",
87
- "qwen3-coder-480b-a35b-instruct"
88
- ],
89
- docUrl: "https://aihubmix.com/docs/models",
21
+ name: "Moonshot AI (China)",
22
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
23
+ docUrl: "https://platform.moonshot.cn/docs/api/chat",
90
24
  gateway: "models.dev"
91
25
  },
92
26
  lucidquery: {
@@ -98,6 +32,73 @@ var provider_registry_default = {
98
32
  docUrl: "https://lucidquery.com/api/docs",
99
33
  gateway: "models.dev"
100
34
  },
35
+ moonshotai: {
36
+ url: "https://api.moonshot.ai/v1",
37
+ apiKeyEnvVar: "MOONSHOT_API_KEY",
38
+ apiKeyHeader: "Authorization",
39
+ name: "Moonshot AI",
40
+ models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
41
+ docUrl: "https://platform.moonshot.ai/docs/api/chat",
42
+ gateway: "models.dev"
43
+ },
44
+ "zai-coding-plan": {
45
+ url: "https://api.z.ai/api/coding/paas/v4",
46
+ apiKeyEnvVar: "ZHIPU_API_KEY",
47
+ apiKeyHeader: "Authorization",
48
+ name: "Z.AI Coding Plan",
49
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
50
+ docUrl: "https://docs.z.ai/devpack/overview",
51
+ gateway: "models.dev"
52
+ },
53
+ alibaba: {
54
+ url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
55
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
56
+ apiKeyHeader: "Authorization",
57
+ name: "Alibaba",
58
+ models: [
59
+ "qvq-max",
60
+ "qwen-flash",
61
+ "qwen-max",
62
+ "qwen-mt-plus",
63
+ "qwen-mt-turbo",
64
+ "qwen-omni-turbo",
65
+ "qwen-omni-turbo-realtime",
66
+ "qwen-plus",
67
+ "qwen-plus-character-ja",
68
+ "qwen-turbo",
69
+ "qwen-vl-max",
70
+ "qwen-vl-ocr",
71
+ "qwen-vl-plus",
72
+ "qwen2-5-14b-instruct",
73
+ "qwen2-5-32b-instruct",
74
+ "qwen2-5-72b-instruct",
75
+ "qwen2-5-7b-instruct",
76
+ "qwen2-5-omni-7b",
77
+ "qwen2-5-vl-72b-instruct",
78
+ "qwen2-5-vl-7b-instruct",
79
+ "qwen3-14b",
80
+ "qwen3-235b-a22b",
81
+ "qwen3-32b",
82
+ "qwen3-8b",
83
+ "qwen3-asr-flash",
84
+ "qwen3-coder-30b-a3b-instruct",
85
+ "qwen3-coder-480b-a35b-instruct",
86
+ "qwen3-coder-flash",
87
+ "qwen3-coder-plus",
88
+ "qwen3-livetranslate-flash-realtime",
89
+ "qwen3-max",
90
+ "qwen3-next-80b-a3b-instruct",
91
+ "qwen3-next-80b-a3b-thinking",
92
+ "qwen3-omni-flash",
93
+ "qwen3-omni-flash-realtime",
94
+ "qwen3-vl-235b-a22b",
95
+ "qwen3-vl-30b-a3b",
96
+ "qwen3-vl-plus",
97
+ "qwq-plus"
98
+ ],
99
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
100
+ gateway: "models.dev"
101
+ },
101
102
  xai: {
102
103
  apiKeyEnvVar: "XAI_API_KEY",
103
104
  name: "xAI",
@@ -126,325 +127,94 @@ var provider_registry_default = {
126
127
  docUrl: "https://docs.x.ai/docs/models",
127
128
  gateway: "models.dev"
128
129
  },
129
- deepseek: {
130
- url: "https://api.deepseek.com",
131
- apiKeyEnvVar: "DEEPSEEK_API_KEY",
132
- apiKeyHeader: "Authorization",
133
- name: "DeepSeek",
134
- models: ["deepseek-chat", "deepseek-reasoner"],
135
- docUrl: "https://platform.deepseek.com/api-docs/pricing",
136
- gateway: "models.dev"
137
- },
138
- requesty: {
139
- url: "https://router.requesty.ai/v1",
140
- apiKeyEnvVar: "REQUESTY_API_KEY",
130
+ nvidia: {
131
+ url: "https://integrate.api.nvidia.com/v1",
132
+ apiKeyEnvVar: "NVIDIA_API_KEY",
141
133
  apiKeyHeader: "Authorization",
142
- name: "Requesty",
134
+ name: "Nvidia",
143
135
  models: [
144
- "anthropic/claude-3-7-sonnet",
145
- "anthropic/claude-4-sonnet-20250522",
146
- "anthropic/claude-opus-4",
147
- "anthropic/claude-opus-4-1-20250805",
148
- "google/gemini-2.5-flash",
149
- "google/gemini-2.5-pro",
150
- "openai/gpt-4.1",
151
- "openai/gpt-4.1-mini",
152
- "openai/gpt-4o-mini",
153
- "openai/gpt-5",
154
- "openai/gpt-5-mini",
155
- "openai/gpt-5-nano",
156
- "openai/o4-mini"
136
+ "black-forest-labs/flux.1-dev",
137
+ "deepseek-ai/deepseek-v3.1",
138
+ "deepseek-ai/deepseek-v3.1-terminus",
139
+ "google/gemma-3-27b-it",
140
+ "microsoft/phi-4-mini-instruct",
141
+ "moonshotai/kimi-k2-instruct",
142
+ "moonshotai/kimi-k2-instruct-0905",
143
+ "nvidia/cosmos-nemotron-34b",
144
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
145
+ "nvidia/nemoretriever-ocr-v1",
146
+ "nvidia/parakeet-tdt-0.6b-v2",
147
+ "openai/gpt-oss-120b",
148
+ "openai/whisper-large-v3",
149
+ "qwen/qwen3-235b-a22b",
150
+ "qwen/qwen3-coder-480b-a35b-instruct"
157
151
  ],
158
- docUrl: "https://requesty.ai/solution/llm-routing/models",
152
+ docUrl: "https://docs.api.nvidia.com/nim/",
159
153
  gateway: "models.dev"
160
154
  },
161
- nebius: {
162
- url: "https://api.studio.nebius.com/v1/",
163
- apiKeyEnvVar: "NEBIUS_API_KEY",
155
+ upstage: {
156
+ url: "https://api.upstage.ai",
157
+ apiKeyEnvVar: "UPSTAGE_API_KEY",
164
158
  apiKeyHeader: "Authorization",
165
- name: "Nebius AI Studio",
166
- models: [
167
- "NousResearch/hermes-4-405b",
168
- "NousResearch/hermes-4-70b",
169
- "deepseek-ai/deepseek-v3",
170
- "meta-llama/llama-3.3-70b-instruct-base",
171
- "meta-llama/llama-3.3-70b-instruct-fast",
172
- "meta-llama/llama-3_1-405b-instruct",
173
- "moonshotai/kimi-k2-instruct",
174
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
175
- "openai/gpt-oss-120b",
176
- "openai/gpt-oss-20b",
177
- "qwen/qwen3-235b-a22b-instruct-2507",
178
- "qwen/qwen3-235b-a22b-thinking-2507",
179
- "qwen/qwen3-coder-480b-a35b-instruct",
180
- "zai-org/glm-4.5",
181
- "zai-org/glm-4.5-air"
182
- ],
183
- docUrl: "https://docs.studio.nebius.com/quickstart",
159
+ name: "Upstage",
160
+ models: ["solar-mini", "solar-pro2"],
161
+ docUrl: "https://developers.upstage.ai/docs/apis/chat",
184
162
  gateway: "models.dev"
185
163
  },
186
- fastrouter: {
187
- url: "https://go.fastrouter.ai/api/v1",
188
- apiKeyEnvVar: "FASTROUTER_API_KEY",
164
+ groq: {
165
+ url: "https://api.groq.com/openai/v1",
166
+ apiKeyEnvVar: "GROQ_API_KEY",
189
167
  apiKeyHeader: "Authorization",
190
- name: "FastRouter",
168
+ name: "Groq",
191
169
  models: [
192
- "anthropic/claude-opus-4.1",
193
- "anthropic/claude-sonnet-4",
194
- "deepseek-ai/deepseek-r1-distill-llama-70b",
195
- "google/gemini-2.5-flash",
196
- "google/gemini-2.5-pro",
197
- "moonshotai/kimi-k2",
198
- "openai/gpt-4.1",
199
- "openai/gpt-5",
200
- "openai/gpt-5-mini",
201
- "openai/gpt-5-nano",
170
+ "deepseek-r1-distill-llama-70b",
171
+ "gemma2-9b-it",
172
+ "llama-3.1-8b-instant",
173
+ "llama-3.3-70b-versatile",
174
+ "llama-guard-3-8b",
175
+ "llama3-70b-8192",
176
+ "llama3-8b-8192",
177
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
178
+ "meta-llama/llama-4-scout-17b-16e-instruct",
179
+ "meta-llama/llama-guard-4-12b",
180
+ "mistral-saba-24b",
181
+ "moonshotai/kimi-k2-instruct",
182
+ "moonshotai/kimi-k2-instruct-0905",
202
183
  "openai/gpt-oss-120b",
203
184
  "openai/gpt-oss-20b",
204
- "qwen/qwen3-coder",
205
- "x-ai/grok-4"
185
+ "qwen-qwq-32b",
186
+ "qwen/qwen3-32b"
206
187
  ],
207
- docUrl: "https://fastrouter.ai/models",
188
+ docUrl: "https://console.groq.com/docs/models",
208
189
  gateway: "models.dev"
209
190
  },
210
- perplexity: {
211
- url: "https://api.perplexity.ai",
212
- apiKeyEnvVar: "PERPLEXITY_API_KEY",
191
+ mistral: {
192
+ url: "https://api.mistral.ai/v1",
193
+ apiKeyEnvVar: "MISTRAL_API_KEY",
213
194
  apiKeyHeader: "Authorization",
214
- name: "Perplexity",
215
- models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
216
- docUrl: "https://docs.perplexity.ai",
217
- gateway: "models.dev"
218
- },
219
- morph: {
220
- url: "https://api.morphllm.com/v1",
221
- apiKeyEnvVar: "MORPH_API_KEY",
222
- apiKeyHeader: "Authorization",
223
- name: "Morph",
224
- models: ["auto", "morph-v3-fast", "morph-v3-large"],
225
- docUrl: "https://docs.morphllm.com/api-reference/introduction",
226
- gateway: "models.dev"
227
- },
228
- "zai-coding-plan": {
229
- url: "https://api.z.ai/api/coding/paas/v4",
230
- apiKeyEnvVar: "ZHIPU_API_KEY",
231
- apiKeyHeader: "Authorization",
232
- name: "Z.AI Coding Plan",
233
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
234
- docUrl: "https://docs.z.ai/devpack/overview",
235
- gateway: "models.dev"
236
- },
237
- huggingface: {
238
- url: "https://router.huggingface.co/v1",
239
- apiKeyEnvVar: "HF_TOKEN",
240
- apiKeyHeader: "Authorization",
241
- name: "Hugging Face",
242
- models: [
243
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
244
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
245
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
246
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
247
- "deepseek-ai/DeepSeek-R1-0528",
248
- "deepseek-ai/Deepseek-V3-0324",
249
- "moonshotai/Kimi-K2-Instruct",
250
- "moonshotai/Kimi-K2-Instruct-0905",
251
- "zai-org/GLM-4.5",
252
- "zai-org/GLM-4.5-Air",
253
- "zai-org/GLM-4.6"
254
- ],
255
- docUrl: "https://huggingface.co/docs/inference-providers",
256
- gateway: "models.dev"
257
- },
258
- openrouter: {
259
- url: "https://openrouter.ai/api/v1",
260
- apiKeyEnvVar: "OPENROUTER_API_KEY",
261
- name: "OpenRouter",
262
- models: [
263
- "anthropic/claude-3.5-haiku",
264
- "anthropic/claude-3.7-sonnet",
265
- "anthropic/claude-haiku-4.5",
266
- "anthropic/claude-opus-4",
267
- "anthropic/claude-opus-4.1",
268
- "anthropic/claude-sonnet-4",
269
- "anthropic/claude-sonnet-4.5",
270
- "cognitivecomputations/dolphin3.0-mistral-24b",
271
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
272
- "deepseek/deepseek-chat-v3-0324",
273
- "deepseek/deepseek-chat-v3.1",
274
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
275
- "deepseek/deepseek-r1-0528:free",
276
- "deepseek/deepseek-r1-distill-llama-70b",
277
- "deepseek/deepseek-r1-distill-qwen-14b",
278
- "deepseek/deepseek-r1:free",
279
- "deepseek/deepseek-v3-base:free",
280
- "deepseek/deepseek-v3.1-terminus",
281
- "featherless/qwerky-72b",
282
- "google/gemini-2.0-flash-001",
283
- "google/gemini-2.0-flash-exp:free",
284
- "google/gemini-2.5-flash",
285
- "google/gemini-2.5-flash-lite",
286
- "google/gemini-2.5-flash-lite-preview-09-2025",
287
- "google/gemini-2.5-flash-preview-09-2025",
288
- "google/gemini-2.5-pro",
289
- "google/gemini-2.5-pro-preview-05-06",
290
- "google/gemini-2.5-pro-preview-06-05",
291
- "google/gemma-2-9b-it:free",
292
- "google/gemma-3-12b-it",
293
- "google/gemma-3-27b-it",
294
- "google/gemma-3n-e4b-it",
295
- "google/gemma-3n-e4b-it:free",
296
- "meta-llama/llama-3.2-11b-vision-instruct",
297
- "meta-llama/llama-3.3-70b-instruct:free",
298
- "meta-llama/llama-4-scout:free",
299
- "microsoft/mai-ds-r1:free",
300
- "mistralai/codestral-2508",
301
- "mistralai/devstral-medium-2507",
302
- "mistralai/devstral-small-2505",
303
- "mistralai/devstral-small-2505:free",
304
- "mistralai/devstral-small-2507",
305
- "mistralai/mistral-7b-instruct:free",
306
- "mistralai/mistral-medium-3",
307
- "mistralai/mistral-medium-3.1",
308
- "mistralai/mistral-nemo:free",
309
- "mistralai/mistral-small-3.1-24b-instruct",
310
- "mistralai/mistral-small-3.2-24b-instruct",
311
- "mistralai/mistral-small-3.2-24b-instruct:free",
312
- "moonshotai/kimi-dev-72b:free",
313
- "moonshotai/kimi-k2",
314
- "moonshotai/kimi-k2-0905",
315
- "moonshotai/kimi-k2:free",
316
- "nousresearch/deephermes-3-llama-3-8b-preview",
317
- "nousresearch/hermes-4-405b",
318
- "nousresearch/hermes-4-70b",
319
- "openai/gpt-4.1",
320
- "openai/gpt-4.1-mini",
321
- "openai/gpt-4o-mini",
322
- "openai/gpt-5",
323
- "openai/gpt-5-chat",
324
- "openai/gpt-5-codex",
325
- "openai/gpt-5-image",
326
- "openai/gpt-5-mini",
327
- "openai/gpt-5-nano",
328
- "openai/gpt-oss-120b",
329
- "openai/gpt-oss-20b",
330
- "openai/o4-mini",
331
- "openrouter/cypher-alpha:free",
332
- "openrouter/horizon-alpha",
333
- "openrouter/horizon-beta",
334
- "openrouter/sonoma-dusk-alpha",
335
- "openrouter/sonoma-sky-alpha",
336
- "qwen/qwen-2.5-coder-32b-instruct",
337
- "qwen/qwen2.5-vl-32b-instruct:free",
338
- "qwen/qwen2.5-vl-72b-instruct",
339
- "qwen/qwen2.5-vl-72b-instruct:free",
340
- "qwen/qwen3-14b:free",
341
- "qwen/qwen3-235b-a22b-07-25",
342
- "qwen/qwen3-235b-a22b-07-25:free",
343
- "qwen/qwen3-235b-a22b-thinking-2507",
344
- "qwen/qwen3-235b-a22b:free",
345
- "qwen/qwen3-30b-a3b-instruct-2507",
346
- "qwen/qwen3-30b-a3b-thinking-2507",
347
- "qwen/qwen3-30b-a3b:free",
348
- "qwen/qwen3-32b:free",
349
- "qwen/qwen3-8b:free",
350
- "qwen/qwen3-coder",
351
- "qwen/qwen3-coder:free",
352
- "qwen/qwen3-max",
353
- "qwen/qwen3-next-80b-a3b-instruct",
354
- "qwen/qwen3-next-80b-a3b-thinking",
355
- "qwen/qwq-32b:free",
356
- "rekaai/reka-flash-3",
357
- "sarvamai/sarvam-m:free",
358
- "thudm/glm-z1-32b:free",
359
- "tngtech/deepseek-r1t2-chimera:free",
360
- "x-ai/grok-3",
361
- "x-ai/grok-3-beta",
362
- "x-ai/grok-3-mini",
363
- "x-ai/grok-3-mini-beta",
364
- "x-ai/grok-4",
365
- "x-ai/grok-4-fast",
366
- "x-ai/grok-4-fast:free",
367
- "x-ai/grok-code-fast-1",
368
- "z-ai/glm-4.5",
369
- "z-ai/glm-4.5-air",
370
- "z-ai/glm-4.5-air:free",
371
- "z-ai/glm-4.5v",
372
- "z-ai/glm-4.6"
373
- ],
374
- docUrl: "https://openrouter.ai/models",
375
- gateway: "models.dev"
376
- },
377
- cerebras: {
378
- url: "https://api.cerebras.ai/v1",
379
- apiKeyEnvVar: "CEREBRAS_API_KEY",
380
- apiKeyHeader: "Authorization",
381
- name: "Cerebras",
382
- models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
383
- docUrl: "https://inference-docs.cerebras.ai/models/overview",
384
- gateway: "models.dev"
385
- },
386
- zhipuai: {
387
- url: "https://open.bigmodel.cn/api/paas/v4",
388
- apiKeyEnvVar: "ZHIPU_API_KEY",
389
- apiKeyHeader: "Authorization",
390
- name: "Zhipu AI",
391
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
392
- docUrl: "https://docs.z.ai/guides/overview/pricing",
393
- gateway: "models.dev"
394
- },
395
- togetherai: {
396
- url: "https://api.together.xyz/v1",
397
- apiKeyEnvVar: "TOGETHER_API_KEY",
398
- apiKeyHeader: "Authorization",
399
- name: "Together AI",
400
- models: [
401
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
402
- "deepseek-ai/DeepSeek-R1",
403
- "deepseek-ai/DeepSeek-V3",
404
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
405
- "moonshotai/Kimi-K2-Instruct",
406
- "openai/gpt-oss-120b"
407
- ],
408
- docUrl: "https://docs.together.ai/docs/serverless-models",
409
- gateway: "models.dev"
410
- },
411
- wandb: {
412
- url: "https://api.inference.wandb.ai/v1",
413
- apiKeyEnvVar: "WANDB_API_KEY",
414
- apiKeyHeader: "Authorization",
415
- name: "Weights & Biases",
416
- models: [
417
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
418
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
419
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
420
- "deepseek-ai/DeepSeek-R1-0528",
421
- "deepseek-ai/DeepSeek-V3-0324",
422
- "meta-llama/Llama-3.1-8B-Instruct",
423
- "meta-llama/Llama-3.3-70B-Instruct",
424
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
425
- "microsoft/Phi-4-mini-instruct",
426
- "moonshotai/Kimi-K2-Instruct"
427
- ],
428
- docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
429
- gateway: "models.dev"
430
- },
431
- submodel: {
432
- url: "https://llm.submodel.ai/v1",
433
- apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
434
- apiKeyHeader: "Authorization",
435
- name: "submodel",
195
+ name: "Mistral",
436
196
  models: [
437
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
438
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
439
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
440
- "deepseek-ai/DeepSeek-R1-0528",
441
- "deepseek-ai/DeepSeek-V3-0324",
442
- "deepseek-ai/DeepSeek-V3.1",
443
- "openai/gpt-oss-120b",
444
- "zai-org/GLM-4.5-Air",
445
- "zai-org/GLM-4.5-FP8"
197
+ "codestral-latest",
198
+ "devstral-medium-2507",
199
+ "devstral-small-2505",
200
+ "devstral-small-2507",
201
+ "magistral-medium-latest",
202
+ "magistral-small",
203
+ "ministral-3b-latest",
204
+ "ministral-8b-latest",
205
+ "mistral-large-latest",
206
+ "mistral-medium-2505",
207
+ "mistral-medium-2508",
208
+ "mistral-medium-latest",
209
+ "mistral-nemo",
210
+ "mistral-small-latest",
211
+ "open-mistral-7b",
212
+ "open-mixtral-8x22b",
213
+ "open-mixtral-8x7b",
214
+ "pixtral-12b",
215
+ "pixtral-large-latest"
446
216
  ],
447
- docUrl: "https://submodel.gitbook.io",
217
+ docUrl: "https://docs.mistral.ai/getting-started/models/",
448
218
  gateway: "models.dev"
449
219
  },
450
220
  vercel: {
@@ -541,102 +311,196 @@ var provider_registry_default = {
541
311
  docUrl: "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
542
312
  gateway: "models.dev"
543
313
  },
544
- synthetic: {
545
- url: "https://api.synthetic.new/v1",
546
- apiKeyEnvVar: "SYNTHETIC_API_KEY",
314
+ nebius: {
315
+ url: "https://api.studio.nebius.com/v1/",
316
+ apiKeyEnvVar: "NEBIUS_API_KEY",
547
317
  apiKeyHeader: "Authorization",
548
- name: "Synthetic",
318
+ name: "Nebius AI Studio",
549
319
  models: [
550
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
551
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
552
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
553
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
554
- "hf:deepseek-ai/DeepSeek-R1",
555
- "hf:deepseek-ai/DeepSeek-R1-0528",
556
- "hf:deepseek-ai/DeepSeek-V3",
557
- "hf:deepseek-ai/DeepSeek-V3-0324",
558
- "hf:deepseek-ai/DeepSeek-V3.1",
559
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
560
- "hf:meta-llama/Llama-3.1-405B-Instruct",
561
- "hf:meta-llama/Llama-3.1-70B-Instruct",
562
- "hf:meta-llama/Llama-3.1-8B-Instruct",
563
- "hf:meta-llama/Llama-3.3-70B-Instruct",
564
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
565
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
566
- "hf:moonshotai/Kimi-K2-Instruct",
567
- "hf:moonshotai/Kimi-K2-Instruct-0905",
568
- "hf:openai/gpt-oss-120b",
569
- "hf:zai-org/GLM-4.5",
570
- "hf:zai-org/GLM-4.6"
320
+ "NousResearch/hermes-4-405b",
321
+ "NousResearch/hermes-4-70b",
322
+ "deepseek-ai/deepseek-v3",
323
+ "meta-llama/llama-3.3-70b-instruct-base",
324
+ "meta-llama/llama-3.3-70b-instruct-fast",
325
+ "meta-llama/llama-3_1-405b-instruct",
326
+ "moonshotai/kimi-k2-instruct",
327
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
328
+ "openai/gpt-oss-120b",
329
+ "openai/gpt-oss-20b",
330
+ "qwen/qwen3-235b-a22b-instruct-2507",
331
+ "qwen/qwen3-235b-a22b-thinking-2507",
332
+ "qwen/qwen3-coder-480b-a35b-instruct",
333
+ "zai-org/glm-4.5",
334
+ "zai-org/glm-4.5-air"
571
335
  ],
572
- docUrl: "https://synthetic.new/pricing",
336
+ docUrl: "https://docs.studio.nebius.com/quickstart",
573
337
  gateway: "models.dev"
574
338
  },
575
- google: {
576
- apiKeyEnvVar: "GOOGLE_GENERATIVE_AI_API_KEY",
577
- name: "Google",
339
+ deepseek: {
340
+ url: "https://api.deepseek.com",
341
+ apiKeyEnvVar: "DEEPSEEK_API_KEY",
342
+ apiKeyHeader: "Authorization",
343
+ name: "DeepSeek",
344
+ models: ["deepseek-chat", "deepseek-reasoner"],
345
+ docUrl: "https://platform.deepseek.com/api-docs/pricing",
346
+ gateway: "models.dev"
347
+ },
348
+ "alibaba-cn": {
349
+ url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
350
+ apiKeyEnvVar: "DASHSCOPE_API_KEY",
351
+ apiKeyHeader: "Authorization",
352
+ name: "Alibaba (China)",
578
353
  models: [
579
- "gemini-1.5-flash",
580
- "gemini-1.5-flash-8b",
581
- "gemini-1.5-pro",
582
- "gemini-2.0-flash",
583
- "gemini-2.0-flash-lite",
584
- "gemini-2.5-flash",
585
- "gemini-2.5-flash-image",
586
- "gemini-2.5-flash-image-preview",
587
- "gemini-2.5-flash-lite",
588
- "gemini-2.5-flash-lite-preview-06-17",
589
- "gemini-2.5-flash-lite-preview-09-2025",
590
- "gemini-2.5-flash-preview-04-17",
591
- "gemini-2.5-flash-preview-05-20",
592
- "gemini-2.5-flash-preview-09-2025",
593
- "gemini-2.5-flash-preview-tts",
594
- "gemini-2.5-pro",
595
- "gemini-2.5-pro-preview-05-06",
596
- "gemini-2.5-pro-preview-06-05",
597
- "gemini-2.5-pro-preview-tts",
598
- "gemini-flash-latest",
599
- "gemini-flash-lite-latest",
600
- "gemini-live-2.5-flash",
601
- "gemini-live-2.5-flash-preview-native-audio"
354
+ "deepseek-r1",
355
+ "deepseek-r1-0528",
356
+ "deepseek-r1-distill-llama-70b",
357
+ "deepseek-r1-distill-llama-8b",
358
+ "deepseek-r1-distill-qwen-1-5b",
359
+ "deepseek-r1-distill-qwen-14b",
360
+ "deepseek-r1-distill-qwen-32b",
361
+ "deepseek-r1-distill-qwen-7b",
362
+ "deepseek-v3",
363
+ "deepseek-v3-1",
364
+ "deepseek-v3-2-exp",
365
+ "moonshot-kimi-k2-instruct",
366
+ "qvq-max",
367
+ "qwen-deep-research",
368
+ "qwen-doc-turbo",
369
+ "qwen-flash",
370
+ "qwen-long",
371
+ "qwen-math-plus",
372
+ "qwen-math-turbo",
373
+ "qwen-max",
374
+ "qwen-mt-plus",
375
+ "qwen-mt-turbo",
376
+ "qwen-omni-turbo",
377
+ "qwen-omni-turbo-realtime",
378
+ "qwen-plus",
379
+ "qwen-plus-character",
380
+ "qwen-turbo",
381
+ "qwen-vl-max",
382
+ "qwen-vl-ocr",
383
+ "qwen-vl-plus",
384
+ "qwen2-5-14b-instruct",
385
+ "qwen2-5-32b-instruct",
386
+ "qwen2-5-72b-instruct",
387
+ "qwen2-5-7b-instruct",
388
+ "qwen2-5-coder-32b-instruct",
389
+ "qwen2-5-coder-7b-instruct",
390
+ "qwen2-5-math-72b-instruct",
391
+ "qwen2-5-math-7b-instruct",
392
+ "qwen2-5-omni-7b",
393
+ "qwen2-5-vl-72b-instruct",
394
+ "qwen2-5-vl-7b-instruct",
395
+ "qwen3-14b",
396
+ "qwen3-235b-a22b",
397
+ "qwen3-32b",
398
+ "qwen3-8b",
399
+ "qwen3-asr-flash",
400
+ "qwen3-coder-30b-a3b-instruct",
401
+ "qwen3-coder-480b-a35b-instruct",
402
+ "qwen3-coder-flash",
403
+ "qwen3-coder-plus",
404
+ "qwen3-max",
405
+ "qwen3-next-80b-a3b-instruct",
406
+ "qwen3-next-80b-a3b-thinking",
407
+ "qwen3-omni-flash",
408
+ "qwen3-omni-flash-realtime",
409
+ "qwen3-vl-235b-a22b",
410
+ "qwen3-vl-30b-a3b",
411
+ "qwen3-vl-plus",
412
+ "qwq-32b",
413
+ "qwq-plus",
414
+ "tongyi-intent-detect-v3"
602
415
  ],
603
- docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
416
+ docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
604
417
  gateway: "models.dev"
605
418
  },
606
- groq: {
607
- url: "https://api.groq.com/openai/v1",
608
- apiKeyEnvVar: "GROQ_API_KEY",
419
+ venice: {
420
+ url: "https://api.venice.ai/api/v1",
421
+ apiKeyEnvVar: "VENICE_API_KEY",
609
422
  apiKeyHeader: "Authorization",
610
- name: "Groq",
423
+ name: "Venice AI",
611
424
  models: [
612
- "deepseek-r1-distill-llama-70b",
613
- "gemma2-9b-it",
614
- "llama-3.1-8b-instant",
615
- "llama-3.3-70b-versatile",
616
- "llama-guard-3-8b",
617
- "llama3-70b-8192",
618
- "llama3-8b-8192",
619
- "meta-llama/llama-4-maverick-17b-128e-instruct",
620
- "meta-llama/llama-4-scout-17b-16e-instruct",
621
- "meta-llama/llama-guard-4-12b",
622
- "mistral-saba-24b",
623
- "moonshotai/kimi-k2-instruct",
624
- "moonshotai/kimi-k2-instruct-0905",
425
+ "deepseek-coder-v2-lite",
426
+ "deepseek-r1-671b",
427
+ "dolphin-2.9.2-qwen2-72b",
428
+ "llama-3.1-405b",
429
+ "llama-3.2-3b",
430
+ "llama-3.3-70b",
431
+ "mistral-31-24b",
432
+ "qwen-2.5-coder-32b",
433
+ "qwen-2.5-qwq-32b",
434
+ "qwen-2.5-vl",
435
+ "qwen3-235b",
436
+ "qwen3-4b",
437
+ "venice-uncensored"
438
+ ],
439
+ docUrl: "https://docs.venice.ai",
440
+ gateway: "models.dev"
441
+ },
442
+ chutes: {
443
+ url: "https://llm.chutes.ai/v1",
444
+ apiKeyEnvVar: "CHUTES_API_KEY",
445
+ apiKeyHeader: "Authorization",
446
+ name: "Chutes",
447
+ models: [
448
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
449
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
450
+ "Qwen/Qwen3-30B-A3B",
451
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
452
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
453
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
454
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
455
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
456
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
457
+ "chutesai/Devstral-Small-2505",
458
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
459
+ "deepseek-ai/DeepSeek-R1-0528",
460
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
461
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
462
+ "deepseek-ai/DeepSeek-V3-0324",
463
+ "deepseek-ai/DeepSeek-V3.1",
464
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
465
+ "deepseek-ai/DeepSeek-V3.1-turbo",
466
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
467
+ "deepseek-ai/DeepSeek-V3.2-Exp",
468
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
469
+ "moonshotai/Kimi-Dev-72B",
470
+ "moonshotai/Kimi-K2-Instruct-0905",
471
+ "moonshotai/Kimi-K2-Instruct-75k",
472
+ "moonshotai/Kimi-VL-A3B-Thinking",
625
473
  "openai/gpt-oss-120b",
626
- "openai/gpt-oss-20b",
627
- "qwen-qwq-32b",
628
- "qwen/qwen3-32b"
474
+ "tngtech/DeepSeek-R1T-Chimera",
475
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
476
+ "zai-org/GLM-4.5-Air",
477
+ "zai-org/GLM-4.5-FP8",
478
+ "zai-org/GLM-4.5-turbo",
479
+ "zai-org/GLM-4.6-FP8",
480
+ "zai-org/GLM-4.6-turbo"
629
481
  ],
630
- docUrl: "https://console.groq.com/docs/models",
482
+ docUrl: "https://llm.chutes.ai/v1/models",
631
483
  gateway: "models.dev"
632
484
  },
633
- "moonshotai-cn": {
634
- url: "https://api.moonshot.cn/v1",
635
- apiKeyEnvVar: "MOONSHOT_API_KEY",
485
+ cortecs: {
486
+ url: "https://api.cortecs.ai/v1",
487
+ apiKeyEnvVar: "CORTECS_API_KEY",
636
488
  apiKeyHeader: "Authorization",
637
- name: "Moonshot AI (China)",
638
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
639
- docUrl: "https://platform.moonshot.cn/docs/api/chat",
489
+ name: "Cortecs",
490
+ models: [
491
+ "claude-4-5-sonnet",
492
+ "claude-sonnet-4",
493
+ "deepseek-v3-0324",
494
+ "gemini-2.5-pro",
495
+ "gpt-4.1",
496
+ "gpt-oss-120b",
497
+ "kimi-k2-instruct",
498
+ "llama-3.1-405b-instruct",
499
+ "nova-pro-v1",
500
+ "qwen3-32b",
501
+ "qwen3-coder-480b-a35b-instruct"
502
+ ],
503
+ docUrl: "https://api.cortecs.ai/v1/models",
640
504
  gateway: "models.dev"
641
505
  },
642
506
  "github-models": {
@@ -704,47 +568,50 @@ var provider_registry_default = {
704
568
  docUrl: "https://docs.github.com/en/github-models",
705
569
  gateway: "models.dev"
706
570
  },
707
- deepinfra: {
708
- url: "https://api.deepinfra.com/v1/openai",
709
- apiKeyEnvVar: "DEEPINFRA_API_KEY",
571
+ togetherai: {
572
+ url: "https://api.together.xyz/v1",
573
+ apiKeyEnvVar: "TOGETHER_API_KEY",
710
574
  apiKeyHeader: "Authorization",
711
- name: "Deep Infra",
575
+ name: "Together AI",
712
576
  models: [
713
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
714
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
577
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
578
+ "deepseek-ai/DeepSeek-R1",
579
+ "deepseek-ai/DeepSeek-V3",
580
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
715
581
  "moonshotai/Kimi-K2-Instruct",
716
- "zai-org/GLM-4.5"
582
+ "openai/gpt-oss-120b"
717
583
  ],
718
- docUrl: "https://deepinfra.com/models",
584
+ docUrl: "https://docs.together.ai/docs/serverless-models",
719
585
  gateway: "models.dev"
720
586
  },
721
- "fireworks-ai": {
722
- url: "https://api.fireworks.ai/inference/v1/",
723
- apiKeyEnvVar: "FIREWORKS_API_KEY",
587
+ baseten: {
588
+ url: "https://inference.baseten.co/v1",
589
+ apiKeyEnvVar: "BASETEN_API_KEY",
724
590
  apiKeyHeader: "Authorization",
725
- name: "Fireworks AI",
726
- models: [
727
- "accounts/fireworks/models/deepseek-r1-0528",
728
- "accounts/fireworks/models/deepseek-v3-0324",
729
- "accounts/fireworks/models/deepseek-v3p1",
730
- "accounts/fireworks/models/glm-4p5",
731
- "accounts/fireworks/models/glm-4p5-air",
732
- "accounts/fireworks/models/gpt-oss-120b",
733
- "accounts/fireworks/models/gpt-oss-20b",
734
- "accounts/fireworks/models/kimi-k2-instruct",
735
- "accounts/fireworks/models/qwen3-235b-a22b",
736
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
737
- ],
738
- docUrl: "https://fireworks.ai/docs/",
591
+ name: "Baseten",
592
+ models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
593
+ docUrl: "https://docs.baseten.co/development/model-apis/overview",
739
594
  gateway: "models.dev"
740
595
  },
741
- zai: {
742
- url: "https://api.z.ai/api/paas/v4",
743
- apiKeyEnvVar: "ZHIPU_API_KEY",
596
+ huggingface: {
597
+ url: "https://router.huggingface.co/v1",
598
+ apiKeyEnvVar: "HF_TOKEN",
744
599
  apiKeyHeader: "Authorization",
745
- name: "Z.AI",
746
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
747
- docUrl: "https://docs.z.ai/guides/overview/pricing",
600
+ name: "Hugging Face",
601
+ models: [
602
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
603
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
604
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
605
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
606
+ "deepseek-ai/DeepSeek-R1-0528",
607
+ "deepseek-ai/Deepseek-V3-0324",
608
+ "moonshotai/Kimi-K2-Instruct",
609
+ "moonshotai/Kimi-K2-Instruct-0905",
610
+ "zai-org/GLM-4.5",
611
+ "zai-org/GLM-4.5-Air",
612
+ "zai-org/GLM-4.6"
613
+ ],
614
+ docUrl: "https://huggingface.co/docs/inference-providers",
748
615
  gateway: "models.dev"
749
616
  },
750
617
  opencode: {
@@ -771,13 +638,59 @@ var provider_registry_default = {
771
638
  docUrl: "https://opencode.ai/docs/zen",
772
639
  gateway: "models.dev"
773
640
  },
774
- "zhipuai-coding-plan": {
775
- url: "https://open.bigmodel.cn/api/coding/paas/v4",
776
- apiKeyEnvVar: "ZHIPU_API_KEY",
641
+ fastrouter: {
642
+ url: "https://go.fastrouter.ai/api/v1",
643
+ apiKeyEnvVar: "FASTROUTER_API_KEY",
777
644
  apiKeyHeader: "Authorization",
778
- name: "Zhipu AI Coding Plan",
779
- models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
780
- docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
645
+ name: "FastRouter",
646
+ models: [
647
+ "anthropic/claude-opus-4.1",
648
+ "anthropic/claude-sonnet-4",
649
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
650
+ "google/gemini-2.5-flash",
651
+ "google/gemini-2.5-pro",
652
+ "moonshotai/kimi-k2",
653
+ "openai/gpt-4.1",
654
+ "openai/gpt-5",
655
+ "openai/gpt-5-mini",
656
+ "openai/gpt-5-nano",
657
+ "openai/gpt-oss-120b",
658
+ "openai/gpt-oss-20b",
659
+ "qwen/qwen3-coder",
660
+ "x-ai/grok-4"
661
+ ],
662
+ docUrl: "https://fastrouter.ai/models",
663
+ gateway: "models.dev"
664
+ },
665
+ google: {
666
+ apiKeyEnvVar: "GOOGLE_GENERATIVE_AI_API_KEY",
667
+ name: "Google",
668
+ models: [
669
+ "gemini-1.5-flash",
670
+ "gemini-1.5-flash-8b",
671
+ "gemini-1.5-pro",
672
+ "gemini-2.0-flash",
673
+ "gemini-2.0-flash-lite",
674
+ "gemini-2.5-flash",
675
+ "gemini-2.5-flash-image",
676
+ "gemini-2.5-flash-image-preview",
677
+ "gemini-2.5-flash-lite",
678
+ "gemini-2.5-flash-lite-preview-06-17",
679
+ "gemini-2.5-flash-lite-preview-09-2025",
680
+ "gemini-2.5-flash-preview-04-17",
681
+ "gemini-2.5-flash-preview-05-20",
682
+ "gemini-2.5-flash-preview-09-2025",
683
+ "gemini-2.5-flash-preview-tts",
684
+ "gemini-2.5-pro",
685
+ "gemini-2.5-pro-preview-05-06",
686
+ "gemini-2.5-pro-preview-06-05",
687
+ "gemini-2.5-pro-preview-tts",
688
+ "gemini-flash-latest",
689
+ "gemini-flash-lite-latest",
690
+ "gemini-live-2.5-flash",
691
+ "gemini-live-2.5-flash-preview-native-audio"
692
+ ],
693
+ docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
781
694
  gateway: "models.dev"
782
695
  },
783
696
  inception: {
@@ -789,30 +702,24 @@ var provider_registry_default = {
789
702
  docUrl: "https://platform.inceptionlabs.ai/docs",
790
703
  gateway: "models.dev"
791
704
  },
792
- llama: {
793
- url: "https://api.llama.com/compat/v1/",
794
- apiKeyEnvVar: "LLAMA_API_KEY",
705
+ wandb: {
706
+ url: "https://api.inference.wandb.ai/v1",
707
+ apiKeyEnvVar: "WANDB_API_KEY",
795
708
  apiKeyHeader: "Authorization",
796
- name: "Llama",
709
+ name: "Weights & Biases",
797
710
  models: [
798
- "cerebras-llama-4-maverick-17b-128e-instruct",
799
- "cerebras-llama-4-scout-17b-16e-instruct",
800
- "groq-llama-4-maverick-17b-128e-instruct",
801
- "llama-3.3-70b-instruct",
802
- "llama-3.3-8b-instruct",
803
- "llama-4-maverick-17b-128e-instruct-fp8",
804
- "llama-4-scout-17b-16e-instruct-fp8"
711
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
712
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
713
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
714
+ "deepseek-ai/DeepSeek-R1-0528",
715
+ "deepseek-ai/DeepSeek-V3-0324",
716
+ "meta-llama/Llama-3.1-8B-Instruct",
717
+ "meta-llama/Llama-3.3-70B-Instruct",
718
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
719
+ "microsoft/Phi-4-mini-instruct",
720
+ "moonshotai/Kimi-K2-Instruct"
805
721
  ],
806
- docUrl: "https://llama.developer.meta.com/docs/models",
807
- gateway: "models.dev"
808
- },
809
- lmstudio: {
810
- url: "http://127.0.0.1:1234/v1",
811
- apiKeyEnvVar: "LMSTUDIO_API_KEY",
812
- apiKeyHeader: "Authorization",
813
- name: "LMStudio",
814
- models: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
815
- docUrl: "https://lmstudio.ai/models",
722
+ docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
816
723
  gateway: "models.dev"
817
724
  },
818
725
  openai: {
@@ -850,313 +757,394 @@ var provider_registry_default = {
850
757
  docUrl: "https://platform.openai.com/docs/models",
851
758
  gateway: "models.dev"
852
759
  },
853
- anthropic: {
854
- apiKeyEnvVar: "ANTHROPIC_API_KEY",
855
- name: "Anthropic",
856
- models: [
857
- "claude-3-5-haiku-20241022",
858
- "claude-3-5-haiku-latest",
859
- "claude-3-5-sonnet-20240620",
860
- "claude-3-5-sonnet-20241022",
861
- "claude-3-7-sonnet-20250219",
862
- "claude-3-7-sonnet-latest",
863
- "claude-3-haiku-20240307",
864
- "claude-3-opus-20240229",
865
- "claude-3-sonnet-20240229",
866
- "claude-haiku-4-5",
867
- "claude-haiku-4-5-20251001",
868
- "claude-opus-4-0",
869
- "claude-opus-4-1",
870
- "claude-opus-4-1-20250805",
871
- "claude-opus-4-20250514",
872
- "claude-sonnet-4-0",
873
- "claude-sonnet-4-20250514",
874
- "claude-sonnet-4-5",
875
- "claude-sonnet-4-5-20250929"
876
- ],
877
- docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
878
- gateway: "models.dev"
879
- },
880
- moonshotai: {
881
- url: "https://api.moonshot.ai/v1",
882
- apiKeyEnvVar: "MOONSHOT_API_KEY",
883
- apiKeyHeader: "Authorization",
884
- name: "Moonshot AI",
885
- models: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
886
- docUrl: "https://platform.moonshot.ai/docs/api/chat",
887
- gateway: "models.dev"
888
- },
889
- inference: {
890
- url: "https://inference.net/v1",
891
- apiKeyEnvVar: "INFERENCE_API_KEY",
892
- apiKeyHeader: "Authorization",
893
- name: "Inference",
894
- models: [
895
- "google/gemma-3",
896
- "meta/llama-3.1-8b-instruct",
897
- "meta/llama-3.2-11b-vision-instruct",
898
- "meta/llama-3.2-1b-instruct",
899
- "meta/llama-3.2-3b-instruct",
900
- "mistral/mistral-nemo-12b-instruct",
901
- "osmosis/osmosis-structure-0.6b",
902
- "qwen/qwen-2.5-7b-vision-instruct",
903
- "qwen/qwen3-embedding-4b"
904
- ],
905
- docUrl: "https://inference.net/models",
906
- gateway: "models.dev"
907
- },
908
- baseten: {
909
- url: "https://inference.baseten.co/v1",
910
- apiKeyEnvVar: "BASETEN_API_KEY",
760
+ "zhipuai-coding-plan": {
761
+ url: "https://open.bigmodel.cn/api/coding/paas/v4",
762
+ apiKeyEnvVar: "ZHIPU_API_KEY",
911
763
  apiKeyHeader: "Authorization",
912
- name: "Baseten",
913
- models: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
914
- docUrl: "https://docs.baseten.co/development/model-apis/overview",
764
+ name: "Zhipu AI Coding Plan",
765
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
766
+ docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
915
767
  gateway: "models.dev"
916
768
  },
917
- cortecs: {
918
- url: "https://api.cortecs.ai/v1",
919
- apiKeyEnvVar: "CORTECS_API_KEY",
769
+ perplexity: {
770
+ url: "https://api.perplexity.ai",
771
+ apiKeyEnvVar: "PERPLEXITY_API_KEY",
920
772
  apiKeyHeader: "Authorization",
921
- name: "Cortecs",
922
- models: [
923
- "claude-4-5-sonnet",
924
- "claude-sonnet-4",
925
- "deepseek-v3-0324",
926
- "gemini-2.5-pro",
927
- "gpt-4.1",
928
- "gpt-oss-120b",
929
- "kimi-k2-instruct",
930
- "llama-3.1-405b-instruct",
931
- "nova-pro-v1",
932
- "qwen3-32b",
933
- "qwen3-coder-480b-a35b-instruct"
934
- ],
935
- docUrl: "https://api.cortecs.ai/v1/models",
773
+ name: "Perplexity",
774
+ models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
775
+ docUrl: "https://docs.perplexity.ai",
936
776
  gateway: "models.dev"
937
777
  },
938
- mistral: {
939
- url: "https://api.mistral.ai/v1",
940
- apiKeyEnvVar: "MISTRAL_API_KEY",
941
- apiKeyHeader: "Authorization",
942
- name: "Mistral",
778
+ openrouter: {
779
+ url: "https://openrouter.ai/api/v1",
780
+ apiKeyEnvVar: "OPENROUTER_API_KEY",
781
+ name: "OpenRouter",
943
782
  models: [
944
- "codestral-latest",
945
- "devstral-medium-2507",
946
- "devstral-small-2505",
947
- "devstral-small-2507",
948
- "magistral-medium-latest",
949
- "magistral-small",
950
- "ministral-3b-latest",
951
- "ministral-8b-latest",
952
- "mistral-large-latest",
953
- "mistral-medium-2505",
954
- "mistral-medium-2508",
955
- "mistral-medium-latest",
956
- "mistral-nemo",
957
- "mistral-small-latest",
958
- "open-mistral-7b",
959
- "open-mixtral-8x22b",
960
- "open-mixtral-8x7b",
961
- "pixtral-12b",
962
- "pixtral-large-latest"
783
+ "anthropic/claude-3.5-haiku",
784
+ "anthropic/claude-3.7-sonnet",
785
+ "anthropic/claude-haiku-4.5",
786
+ "anthropic/claude-opus-4",
787
+ "anthropic/claude-opus-4.1",
788
+ "anthropic/claude-sonnet-4",
789
+ "anthropic/claude-sonnet-4.5",
790
+ "cognitivecomputations/dolphin3.0-mistral-24b",
791
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
792
+ "deepseek/deepseek-chat-v3-0324",
793
+ "deepseek/deepseek-chat-v3.1",
794
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
795
+ "deepseek/deepseek-r1-0528:free",
796
+ "deepseek/deepseek-r1-distill-llama-70b",
797
+ "deepseek/deepseek-r1-distill-qwen-14b",
798
+ "deepseek/deepseek-r1:free",
799
+ "deepseek/deepseek-v3-base:free",
800
+ "deepseek/deepseek-v3.1-terminus",
801
+ "featherless/qwerky-72b",
802
+ "google/gemini-2.0-flash-001",
803
+ "google/gemini-2.0-flash-exp:free",
804
+ "google/gemini-2.5-flash",
805
+ "google/gemini-2.5-flash-lite",
806
+ "google/gemini-2.5-flash-lite-preview-09-2025",
807
+ "google/gemini-2.5-flash-preview-09-2025",
808
+ "google/gemini-2.5-pro",
809
+ "google/gemini-2.5-pro-preview-05-06",
810
+ "google/gemini-2.5-pro-preview-06-05",
811
+ "google/gemma-2-9b-it:free",
812
+ "google/gemma-3-12b-it",
813
+ "google/gemma-3-27b-it",
814
+ "google/gemma-3n-e4b-it",
815
+ "google/gemma-3n-e4b-it:free",
816
+ "meta-llama/llama-3.2-11b-vision-instruct",
817
+ "meta-llama/llama-3.3-70b-instruct:free",
818
+ "meta-llama/llama-4-scout:free",
819
+ "microsoft/mai-ds-r1:free",
820
+ "mistralai/codestral-2508",
821
+ "mistralai/devstral-medium-2507",
822
+ "mistralai/devstral-small-2505",
823
+ "mistralai/devstral-small-2505:free",
824
+ "mistralai/devstral-small-2507",
825
+ "mistralai/mistral-7b-instruct:free",
826
+ "mistralai/mistral-medium-3",
827
+ "mistralai/mistral-medium-3.1",
828
+ "mistralai/mistral-nemo:free",
829
+ "mistralai/mistral-small-3.1-24b-instruct",
830
+ "mistralai/mistral-small-3.2-24b-instruct",
831
+ "mistralai/mistral-small-3.2-24b-instruct:free",
832
+ "moonshotai/kimi-dev-72b:free",
833
+ "moonshotai/kimi-k2",
834
+ "moonshotai/kimi-k2-0905",
835
+ "moonshotai/kimi-k2:free",
836
+ "nousresearch/deephermes-3-llama-3-8b-preview",
837
+ "nousresearch/hermes-4-405b",
838
+ "nousresearch/hermes-4-70b",
839
+ "openai/gpt-4.1",
840
+ "openai/gpt-4.1-mini",
841
+ "openai/gpt-4o-mini",
842
+ "openai/gpt-5",
843
+ "openai/gpt-5-chat",
844
+ "openai/gpt-5-codex",
845
+ "openai/gpt-5-image",
846
+ "openai/gpt-5-mini",
847
+ "openai/gpt-5-nano",
848
+ "openai/gpt-oss-120b",
849
+ "openai/gpt-oss-20b",
850
+ "openai/o4-mini",
851
+ "openrouter/cypher-alpha:free",
852
+ "openrouter/horizon-alpha",
853
+ "openrouter/horizon-beta",
854
+ "openrouter/sonoma-dusk-alpha",
855
+ "openrouter/sonoma-sky-alpha",
856
+ "qwen/qwen-2.5-coder-32b-instruct",
857
+ "qwen/qwen2.5-vl-32b-instruct:free",
858
+ "qwen/qwen2.5-vl-72b-instruct",
859
+ "qwen/qwen2.5-vl-72b-instruct:free",
860
+ "qwen/qwen3-14b:free",
861
+ "qwen/qwen3-235b-a22b-07-25",
862
+ "qwen/qwen3-235b-a22b-07-25:free",
863
+ "qwen/qwen3-235b-a22b-thinking-2507",
864
+ "qwen/qwen3-235b-a22b:free",
865
+ "qwen/qwen3-30b-a3b-instruct-2507",
866
+ "qwen/qwen3-30b-a3b-thinking-2507",
867
+ "qwen/qwen3-30b-a3b:free",
868
+ "qwen/qwen3-32b:free",
869
+ "qwen/qwen3-8b:free",
870
+ "qwen/qwen3-coder",
871
+ "qwen/qwen3-coder:free",
872
+ "qwen/qwen3-max",
873
+ "qwen/qwen3-next-80b-a3b-instruct",
874
+ "qwen/qwen3-next-80b-a3b-thinking",
875
+ "qwen/qwq-32b:free",
876
+ "rekaai/reka-flash-3",
877
+ "sarvamai/sarvam-m:free",
878
+ "thudm/glm-z1-32b:free",
879
+ "tngtech/deepseek-r1t2-chimera:free",
880
+ "x-ai/grok-3",
881
+ "x-ai/grok-3-beta",
882
+ "x-ai/grok-3-mini",
883
+ "x-ai/grok-3-mini-beta",
884
+ "x-ai/grok-4",
885
+ "x-ai/grok-4-fast",
886
+ "x-ai/grok-4-fast:free",
887
+ "x-ai/grok-code-fast-1",
888
+ "z-ai/glm-4.5",
889
+ "z-ai/glm-4.5-air",
890
+ "z-ai/glm-4.5-air:free",
891
+ "z-ai/glm-4.5v",
892
+ "z-ai/glm-4.6"
963
893
  ],
964
- docUrl: "https://docs.mistral.ai/getting-started/models/",
894
+ docUrl: "https://openrouter.ai/models",
965
895
  gateway: "models.dev"
966
896
  },
967
- venice: {
968
- url: "https://api.venice.ai/api/v1",
969
- apiKeyEnvVar: "VENICE_API_KEY",
897
+ synthetic: {
898
+ url: "https://api.synthetic.new/v1",
899
+ apiKeyEnvVar: "SYNTHETIC_API_KEY",
970
900
  apiKeyHeader: "Authorization",
971
- name: "Venice AI",
901
+ name: "Synthetic",
972
902
  models: [
973
- "deepseek-coder-v2-lite",
974
- "deepseek-r1-671b",
975
- "dolphin-2.9.2-qwen2-72b",
976
- "llama-3.1-405b",
977
- "llama-3.2-3b",
978
- "llama-3.3-70b",
979
- "mistral-31-24b",
980
- "qwen-2.5-coder-32b",
981
- "qwen-2.5-qwq-32b",
982
- "qwen-2.5-vl",
983
- "qwen3-235b",
984
- "qwen3-4b",
985
- "venice-uncensored"
903
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
904
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
905
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
906
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
907
+ "hf:deepseek-ai/DeepSeek-R1",
908
+ "hf:deepseek-ai/DeepSeek-R1-0528",
909
+ "hf:deepseek-ai/DeepSeek-V3",
910
+ "hf:deepseek-ai/DeepSeek-V3-0324",
911
+ "hf:deepseek-ai/DeepSeek-V3.1",
912
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
913
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
914
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
915
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
916
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
917
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
918
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
919
+ "hf:moonshotai/Kimi-K2-Instruct",
920
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
921
+ "hf:openai/gpt-oss-120b",
922
+ "hf:zai-org/GLM-4.5",
923
+ "hf:zai-org/GLM-4.6"
986
924
  ],
987
- docUrl: "https://docs.venice.ai",
925
+ docUrl: "https://synthetic.new/pricing",
988
926
  gateway: "models.dev"
989
927
  },
990
- alibaba: {
991
- url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
992
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
928
+ deepinfra: {
929
+ url: "https://api.deepinfra.com/v1/openai",
930
+ apiKeyEnvVar: "DEEPINFRA_API_KEY",
993
931
  apiKeyHeader: "Authorization",
994
- name: "Alibaba",
932
+ name: "Deep Infra",
995
933
  models: [
996
- "qvq-max",
997
- "qwen-flash",
998
- "qwen-max",
999
- "qwen-mt-plus",
1000
- "qwen-mt-turbo",
1001
- "qwen-omni-turbo",
1002
- "qwen-omni-turbo-realtime",
1003
- "qwen-plus",
1004
- "qwen-plus-character-ja",
1005
- "qwen-turbo",
1006
- "qwen-vl-max",
1007
- "qwen-vl-ocr",
1008
- "qwen-vl-plus",
1009
- "qwen2-5-14b-instruct",
1010
- "qwen2-5-32b-instruct",
1011
- "qwen2-5-72b-instruct",
1012
- "qwen2-5-7b-instruct",
1013
- "qwen2-5-omni-7b",
1014
- "qwen2-5-vl-72b-instruct",
1015
- "qwen2-5-vl-7b-instruct",
1016
- "qwen3-14b",
1017
- "qwen3-235b-a22b",
1018
- "qwen3-32b",
1019
- "qwen3-8b",
1020
- "qwen3-asr-flash",
1021
- "qwen3-coder-30b-a3b-instruct",
1022
- "qwen3-coder-480b-a35b-instruct",
1023
- "qwen3-coder-flash",
1024
- "qwen3-coder-plus",
1025
- "qwen3-livetranslate-flash-realtime",
1026
- "qwen3-max",
1027
- "qwen3-next-80b-a3b-instruct",
1028
- "qwen3-next-80b-a3b-thinking",
1029
- "qwen3-omni-flash",
1030
- "qwen3-omni-flash-realtime",
1031
- "qwen3-vl-235b-a22b",
1032
- "qwen3-vl-30b-a3b",
1033
- "qwen3-vl-plus",
1034
- "qwq-plus"
934
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
935
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
936
+ "moonshotai/Kimi-K2-Instruct",
937
+ "zai-org/GLM-4.5"
1035
938
  ],
1036
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
939
+ docUrl: "https://deepinfra.com/models",
1037
940
  gateway: "models.dev"
1038
941
  },
1039
- "alibaba-cn": {
1040
- url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
1041
- apiKeyEnvVar: "DASHSCOPE_API_KEY",
942
+ zhipuai: {
943
+ url: "https://open.bigmodel.cn/api/paas/v4",
944
+ apiKeyEnvVar: "ZHIPU_API_KEY",
1042
945
  apiKeyHeader: "Authorization",
1043
- name: "Alibaba (China)",
946
+ name: "Zhipu AI",
947
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
948
+ docUrl: "https://docs.z.ai/guides/overview/pricing",
949
+ gateway: "models.dev"
950
+ },
951
+ submodel: {
952
+ url: "https://llm.submodel.ai/v1",
953
+ apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
954
+ apiKeyHeader: "Authorization",
955
+ name: "submodel",
1044
956
  models: [
1045
- "deepseek-r1",
1046
- "deepseek-r1-0528",
1047
- "deepseek-r1-distill-llama-70b",
1048
- "deepseek-r1-distill-llama-8b",
1049
- "deepseek-r1-distill-qwen-1-5b",
1050
- "deepseek-r1-distill-qwen-14b",
1051
- "deepseek-r1-distill-qwen-32b",
1052
- "deepseek-r1-distill-qwen-7b",
1053
- "deepseek-v3",
1054
- "deepseek-v3-1",
1055
- "deepseek-v3-2-exp",
1056
- "moonshot-kimi-k2-instruct",
1057
- "qvq-max",
1058
- "qwen-deep-research",
1059
- "qwen-doc-turbo",
1060
- "qwen-flash",
1061
- "qwen-long",
1062
- "qwen-math-plus",
1063
- "qwen-math-turbo",
1064
- "qwen-max",
1065
- "qwen-mt-plus",
1066
- "qwen-mt-turbo",
1067
- "qwen-omni-turbo",
1068
- "qwen-omni-turbo-realtime",
1069
- "qwen-plus",
1070
- "qwen-plus-character",
1071
- "qwen-turbo",
1072
- "qwen-vl-max",
1073
- "qwen-vl-ocr",
1074
- "qwen-vl-plus",
1075
- "qwen2-5-14b-instruct",
1076
- "qwen2-5-32b-instruct",
1077
- "qwen2-5-72b-instruct",
1078
- "qwen2-5-7b-instruct",
1079
- "qwen2-5-coder-32b-instruct",
1080
- "qwen2-5-coder-7b-instruct",
1081
- "qwen2-5-math-72b-instruct",
1082
- "qwen2-5-math-7b-instruct",
1083
- "qwen2-5-omni-7b",
1084
- "qwen2-5-vl-72b-instruct",
1085
- "qwen2-5-vl-7b-instruct",
1086
- "qwen3-14b",
1087
- "qwen3-235b-a22b",
1088
- "qwen3-32b",
1089
- "qwen3-8b",
1090
- "qwen3-asr-flash",
1091
- "qwen3-coder-30b-a3b-instruct",
1092
- "qwen3-coder-480b-a35b-instruct",
1093
- "qwen3-coder-flash",
1094
- "qwen3-coder-plus",
1095
- "qwen3-max",
1096
- "qwen3-next-80b-a3b-instruct",
1097
- "qwen3-next-80b-a3b-thinking",
1098
- "qwen3-omni-flash",
1099
- "qwen3-omni-flash-realtime",
1100
- "qwen3-vl-235b-a22b",
1101
- "qwen3-vl-30b-a3b",
1102
- "qwen3-vl-plus",
1103
- "qwq-32b",
1104
- "qwq-plus",
1105
- "tongyi-intent-detect-v3"
957
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
958
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
959
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
960
+ "deepseek-ai/DeepSeek-R1-0528",
961
+ "deepseek-ai/DeepSeek-V3-0324",
962
+ "deepseek-ai/DeepSeek-V3.1",
963
+ "openai/gpt-oss-120b",
964
+ "zai-org/GLM-4.5-Air",
965
+ "zai-org/GLM-4.5-FP8"
1106
966
  ],
1107
- docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
967
+ docUrl: "https://submodel.gitbook.io",
1108
968
  gateway: "models.dev"
1109
969
  },
1110
- chutes: {
1111
- url: "https://llm.chutes.ai/v1",
1112
- apiKeyEnvVar: "CHUTES_API_KEY",
970
+ zai: {
971
+ url: "https://api.z.ai/api/paas/v4",
972
+ apiKeyEnvVar: "ZHIPU_API_KEY",
1113
973
  apiKeyHeader: "Authorization",
1114
- name: "Chutes",
974
+ name: "Z.AI",
975
+ models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
976
+ docUrl: "https://docs.z.ai/guides/overview/pricing",
977
+ gateway: "models.dev"
978
+ },
979
+ inference: {
980
+ url: "https://inference.net/v1",
981
+ apiKeyEnvVar: "INFERENCE_API_KEY",
982
+ apiKeyHeader: "Authorization",
983
+ name: "Inference",
984
+ models: [
985
+ "google/gemma-3",
986
+ "meta/llama-3.1-8b-instruct",
987
+ "meta/llama-3.2-11b-vision-instruct",
988
+ "meta/llama-3.2-1b-instruct",
989
+ "meta/llama-3.2-3b-instruct",
990
+ "mistral/mistral-nemo-12b-instruct",
991
+ "osmosis/osmosis-structure-0.6b",
992
+ "qwen/qwen-2.5-7b-vision-instruct",
993
+ "qwen/qwen3-embedding-4b"
994
+ ],
995
+ docUrl: "https://inference.net/models",
996
+ gateway: "models.dev"
997
+ },
998
+ requesty: {
999
+ url: "https://router.requesty.ai/v1",
1000
+ apiKeyEnvVar: "REQUESTY_API_KEY",
1001
+ apiKeyHeader: "Authorization",
1002
+ name: "Requesty",
1003
+ models: [
1004
+ "anthropic/claude-3-7-sonnet",
1005
+ "anthropic/claude-4-sonnet-20250522",
1006
+ "anthropic/claude-opus-4",
1007
+ "anthropic/claude-opus-4-1-20250805",
1008
+ "google/gemini-2.5-flash",
1009
+ "google/gemini-2.5-pro",
1010
+ "openai/gpt-4.1",
1011
+ "openai/gpt-4.1-mini",
1012
+ "openai/gpt-4o-mini",
1013
+ "openai/gpt-5",
1014
+ "openai/gpt-5-mini",
1015
+ "openai/gpt-5-nano",
1016
+ "openai/o4-mini"
1017
+ ],
1018
+ docUrl: "https://requesty.ai/solution/llm-routing/models",
1019
+ gateway: "models.dev"
1020
+ },
1021
+ morph: {
1022
+ url: "https://api.morphllm.com/v1",
1023
+ apiKeyEnvVar: "MORPH_API_KEY",
1024
+ apiKeyHeader: "Authorization",
1025
+ name: "Morph",
1026
+ models: ["auto", "morph-v3-fast", "morph-v3-large"],
1027
+ docUrl: "https://docs.morphllm.com/api-reference/introduction",
1028
+ gateway: "models.dev"
1029
+ },
1030
+ lmstudio: {
1031
+ url: "http://127.0.0.1:1234/v1",
1032
+ apiKeyEnvVar: "LMSTUDIO_API_KEY",
1033
+ apiKeyHeader: "Authorization",
1034
+ name: "LMStudio",
1035
+ models: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1036
+ docUrl: "https://lmstudio.ai/models",
1037
+ gateway: "models.dev"
1038
+ },
1039
+ anthropic: {
1040
+ apiKeyEnvVar: "ANTHROPIC_API_KEY",
1041
+ name: "Anthropic",
1042
+ models: [
1043
+ "claude-3-5-haiku-20241022",
1044
+ "claude-3-5-haiku-latest",
1045
+ "claude-3-5-sonnet-20240620",
1046
+ "claude-3-5-sonnet-20241022",
1047
+ "claude-3-7-sonnet-20250219",
1048
+ "claude-3-7-sonnet-latest",
1049
+ "claude-3-haiku-20240307",
1050
+ "claude-3-opus-20240229",
1051
+ "claude-3-sonnet-20240229",
1052
+ "claude-haiku-4-5",
1053
+ "claude-haiku-4-5-20251001",
1054
+ "claude-opus-4-0",
1055
+ "claude-opus-4-1",
1056
+ "claude-opus-4-1-20250805",
1057
+ "claude-opus-4-20250514",
1058
+ "claude-sonnet-4-0",
1059
+ "claude-sonnet-4-20250514",
1060
+ "claude-sonnet-4-5",
1061
+ "claude-sonnet-4-5-20250929"
1062
+ ],
1063
+ docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
1064
+ gateway: "models.dev"
1065
+ },
1066
+ "fireworks-ai": {
1067
+ url: "https://api.fireworks.ai/inference/v1/",
1068
+ apiKeyEnvVar: "FIREWORKS_API_KEY",
1069
+ apiKeyHeader: "Authorization",
1070
+ name: "Fireworks AI",
1071
+ models: [
1072
+ "accounts/fireworks/models/deepseek-r1-0528",
1073
+ "accounts/fireworks/models/deepseek-v3-0324",
1074
+ "accounts/fireworks/models/deepseek-v3p1",
1075
+ "accounts/fireworks/models/glm-4p5",
1076
+ "accounts/fireworks/models/glm-4p5-air",
1077
+ "accounts/fireworks/models/gpt-oss-120b",
1078
+ "accounts/fireworks/models/gpt-oss-20b",
1079
+ "accounts/fireworks/models/kimi-k2-instruct",
1080
+ "accounts/fireworks/models/qwen3-235b-a22b",
1081
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1082
+ ],
1083
+ docUrl: "https://fireworks.ai/docs/",
1084
+ gateway: "models.dev"
1085
+ },
1086
+ modelscope: {
1087
+ url: "https://api-inference.modelscope.cn/v1",
1088
+ apiKeyEnvVar: "MODELSCOPE_API_KEY",
1089
+ apiKeyHeader: "Authorization",
1090
+ name: "ModelScope",
1091
+ models: [
1092
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1093
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1094
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1095
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1096
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1097
+ "ZhipuAI/GLM-4.5",
1098
+ "ZhipuAI/GLM-4.6"
1099
+ ],
1100
+ docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
1101
+ gateway: "models.dev"
1102
+ },
1103
+ llama: {
1104
+ url: "https://api.llama.com/compat/v1/",
1105
+ apiKeyEnvVar: "LLAMA_API_KEY",
1106
+ apiKeyHeader: "Authorization",
1107
+ name: "Llama",
1108
+ models: [
1109
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1110
+ "cerebras-llama-4-scout-17b-16e-instruct",
1111
+ "groq-llama-4-maverick-17b-128e-instruct",
1112
+ "llama-3.3-70b-instruct",
1113
+ "llama-3.3-8b-instruct",
1114
+ "llama-4-maverick-17b-128e-instruct-fp8",
1115
+ "llama-4-scout-17b-16e-instruct-fp8"
1116
+ ],
1117
+ docUrl: "https://llama.developer.meta.com/docs/models",
1118
+ gateway: "models.dev"
1119
+ },
1120
+ scaleway: {
1121
+ url: "https://api.scaleway.ai/v1",
1122
+ apiKeyEnvVar: "SCALEWAY_API_KEY",
1123
+ apiKeyHeader: "Authorization",
1124
+ name: "Scaleway",
1115
1125
  models: [
1116
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1117
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1118
- "Qwen/Qwen3-30B-A3B",
1119
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1120
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1121
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1122
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1123
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1124
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1125
- "chutesai/Devstral-Small-2505",
1126
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1127
- "deepseek-ai/DeepSeek-R1-0528",
1128
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1129
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1130
- "deepseek-ai/DeepSeek-V3-0324",
1131
- "deepseek-ai/DeepSeek-V3.1",
1132
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1133
- "deepseek-ai/DeepSeek-V3.1-turbo",
1134
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1135
- "deepseek-ai/DeepSeek-V3.2-Exp",
1136
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1137
- "moonshotai/Kimi-Dev-72B",
1138
- "moonshotai/Kimi-K2-Instruct-0905",
1139
- "moonshotai/Kimi-K2-Instruct-75k",
1140
- "moonshotai/Kimi-VL-A3B-Thinking",
1141
- "openai/gpt-oss-120b",
1142
- "tngtech/DeepSeek-R1T-Chimera",
1143
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1144
- "zai-org/GLM-4.5-Air",
1145
- "zai-org/GLM-4.5-FP8",
1146
- "zai-org/GLM-4.5-turbo",
1147
- "zai-org/GLM-4.6-FP8",
1148
- "zai-org/GLM-4.6-turbo"
1126
+ "deepseek-r1-distill-llama-70b",
1127
+ "gemma-3-27b-it",
1128
+ "gpt-oss-120b",
1129
+ "llama-3.1-8b-instruct",
1130
+ "llama-3.3-70b-instruct",
1131
+ "mistral-nemo-instruct-2407",
1132
+ "mistral-small-3.2-24b-instruct-2506",
1133
+ "pixtral-12b-2409",
1134
+ "qwen3-235b-a22b-instruct-2507",
1135
+ "qwen3-coder-30b-a3b-instruct",
1136
+ "voxtral-small-24b-2507"
1149
1137
  ],
1150
- docUrl: "https://llm.chutes.ai/v1/models",
1138
+ docUrl: "https://www.scaleway.com/en/docs/generative-apis/",
1151
1139
  gateway: "models.dev"
1152
1140
  },
1153
- upstage: {
1154
- url: "https://api.upstage.ai",
1155
- apiKeyEnvVar: "UPSTAGE_API_KEY",
1141
+ cerebras: {
1142
+ url: "https://api.cerebras.ai/v1",
1143
+ apiKeyEnvVar: "CEREBRAS_API_KEY",
1156
1144
  apiKeyHeader: "Authorization",
1157
- name: "Upstage",
1158
- models: ["solar-mini", "solar-pro2"],
1159
- docUrl: "https://developers.upstage.ai/docs/apis/chat",
1145
+ name: "Cerebras",
1146
+ models: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1147
+ docUrl: "https://inference-docs.cerebras.ai/models/overview",
1160
1148
  gateway: "models.dev"
1161
1149
  },
1162
1150
  netlify: {
@@ -1204,6 +1192,73 @@ var provider_registry_default = {
1204
1192
  }
1205
1193
  },
1206
1194
  models: {
1195
+ "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1196
+ lucidquery: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1197
+ moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1198
+ "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1199
+ alibaba: [
1200
+ "qvq-max",
1201
+ "qwen-flash",
1202
+ "qwen-max",
1203
+ "qwen-mt-plus",
1204
+ "qwen-mt-turbo",
1205
+ "qwen-omni-turbo",
1206
+ "qwen-omni-turbo-realtime",
1207
+ "qwen-plus",
1208
+ "qwen-plus-character-ja",
1209
+ "qwen-turbo",
1210
+ "qwen-vl-max",
1211
+ "qwen-vl-ocr",
1212
+ "qwen-vl-plus",
1213
+ "qwen2-5-14b-instruct",
1214
+ "qwen2-5-32b-instruct",
1215
+ "qwen2-5-72b-instruct",
1216
+ "qwen2-5-7b-instruct",
1217
+ "qwen2-5-omni-7b",
1218
+ "qwen2-5-vl-72b-instruct",
1219
+ "qwen2-5-vl-7b-instruct",
1220
+ "qwen3-14b",
1221
+ "qwen3-235b-a22b",
1222
+ "qwen3-32b",
1223
+ "qwen3-8b",
1224
+ "qwen3-asr-flash",
1225
+ "qwen3-coder-30b-a3b-instruct",
1226
+ "qwen3-coder-480b-a35b-instruct",
1227
+ "qwen3-coder-flash",
1228
+ "qwen3-coder-plus",
1229
+ "qwen3-livetranslate-flash-realtime",
1230
+ "qwen3-max",
1231
+ "qwen3-next-80b-a3b-instruct",
1232
+ "qwen3-next-80b-a3b-thinking",
1233
+ "qwen3-omni-flash",
1234
+ "qwen3-omni-flash-realtime",
1235
+ "qwen3-vl-235b-a22b",
1236
+ "qwen3-vl-30b-a3b",
1237
+ "qwen3-vl-plus",
1238
+ "qwq-plus"
1239
+ ],
1240
+ xai: [
1241
+ "grok-2",
1242
+ "grok-2-1212",
1243
+ "grok-2-latest",
1244
+ "grok-2-vision",
1245
+ "grok-2-vision-1212",
1246
+ "grok-2-vision-latest",
1247
+ "grok-3",
1248
+ "grok-3-fast",
1249
+ "grok-3-fast-latest",
1250
+ "grok-3-latest",
1251
+ "grok-3-mini",
1252
+ "grok-3-mini-fast",
1253
+ "grok-3-mini-fast-latest",
1254
+ "grok-3-mini-latest",
1255
+ "grok-4",
1256
+ "grok-4-fast",
1257
+ "grok-4-fast-non-reasoning",
1258
+ "grok-beta",
1259
+ "grok-code-fast-1",
1260
+ "grok-vision-beta"
1261
+ ],
1207
1262
  nvidia: [
1208
1263
  "black-forest-labs/flux.1-dev",
1209
1264
  "deepseek-ai/deepseek-v3.1",
@@ -1217,99 +1272,375 @@ var provider_registry_default = {
1217
1272
  "nvidia/nemoretriever-ocr-v1",
1218
1273
  "nvidia/parakeet-tdt-0.6b-v2",
1219
1274
  "openai/gpt-oss-120b",
1220
- "openai/whisper-large-v3",
1221
- "qwen/qwen3-235b-a22b",
1222
- "qwen/qwen3-coder-480b-a35b-instruct"
1275
+ "openai/whisper-large-v3",
1276
+ "qwen/qwen3-235b-a22b",
1277
+ "qwen/qwen3-coder-480b-a35b-instruct"
1278
+ ],
1279
+ upstage: ["solar-mini", "solar-pro2"],
1280
+ groq: [
1281
+ "deepseek-r1-distill-llama-70b",
1282
+ "gemma2-9b-it",
1283
+ "llama-3.1-8b-instant",
1284
+ "llama-3.3-70b-versatile",
1285
+ "llama-guard-3-8b",
1286
+ "llama3-70b-8192",
1287
+ "llama3-8b-8192",
1288
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
1289
+ "meta-llama/llama-4-scout-17b-16e-instruct",
1290
+ "meta-llama/llama-guard-4-12b",
1291
+ "mistral-saba-24b",
1292
+ "moonshotai/kimi-k2-instruct",
1293
+ "moonshotai/kimi-k2-instruct-0905",
1294
+ "openai/gpt-oss-120b",
1295
+ "openai/gpt-oss-20b",
1296
+ "qwen-qwq-32b",
1297
+ "qwen/qwen3-32b"
1298
+ ],
1299
+ mistral: [
1300
+ "codestral-latest",
1301
+ "devstral-medium-2507",
1302
+ "devstral-small-2505",
1303
+ "devstral-small-2507",
1304
+ "magistral-medium-latest",
1305
+ "magistral-small",
1306
+ "ministral-3b-latest",
1307
+ "ministral-8b-latest",
1308
+ "mistral-large-latest",
1309
+ "mistral-medium-2505",
1310
+ "mistral-medium-2508",
1311
+ "mistral-medium-latest",
1312
+ "mistral-nemo",
1313
+ "mistral-small-latest",
1314
+ "open-mistral-7b",
1315
+ "open-mixtral-8x22b",
1316
+ "open-mixtral-8x7b",
1317
+ "pixtral-12b",
1318
+ "pixtral-large-latest"
1319
+ ],
1320
+ vercel: [
1321
+ "alibaba/qwen3-coder-plus",
1322
+ "alibaba/qwen3-max",
1323
+ "alibaba/qwen3-next-80b-a3b-instruct",
1324
+ "alibaba/qwen3-next-80b-a3b-thinking",
1325
+ "alibaba/qwen3-vl-instruct",
1326
+ "alibaba/qwen3-vl-thinking",
1327
+ "amazon/nova-lite",
1328
+ "amazon/nova-micro",
1329
+ "amazon/nova-pro",
1330
+ "anthropic/claude-3-5-haiku",
1331
+ "anthropic/claude-3-haiku",
1332
+ "anthropic/claude-3-opus",
1333
+ "anthropic/claude-3.5-sonnet",
1334
+ "anthropic/claude-3.7-sonnet",
1335
+ "anthropic/claude-4-1-opus",
1336
+ "anthropic/claude-4-opus",
1337
+ "anthropic/claude-4-sonnet",
1338
+ "anthropic/claude-4.5-sonnet",
1339
+ "anthropic/claude-haiku-4.5",
1340
+ "cerebras/qwen3-coder",
1341
+ "deepseek/deepseek-r1",
1342
+ "deepseek/deepseek-r1-distill-llama-70b",
1343
+ "deepseek/deepseek-v3.1-terminus",
1344
+ "deepseek/deepseek-v3.2-exp",
1345
+ "deepseek/deepseek-v3.2-exp-thinking",
1346
+ "google/gemini-2.0-flash",
1347
+ "google/gemini-2.0-flash-lite",
1348
+ "google/gemini-2.5-flash",
1349
+ "google/gemini-2.5-flash-lite",
1350
+ "google/gemini-2.5-flash-lite-preview-09-2025",
1351
+ "google/gemini-2.5-flash-preview-09-2025",
1352
+ "google/gemini-2.5-pro",
1353
+ "meta/llama-3.3-70b",
1354
+ "meta/llama-4-maverick",
1355
+ "meta/llama-4-scout",
1356
+ "mistral/codestral",
1357
+ "mistral/magistral-medium",
1358
+ "mistral/magistral-small",
1359
+ "mistral/ministral-3b",
1360
+ "mistral/ministral-8b",
1361
+ "mistral/mistral-large",
1362
+ "mistral/mistral-small",
1363
+ "mistral/mixtral-8x22b-instruct",
1364
+ "mistral/pixtral-12b",
1365
+ "mistral/pixtral-large",
1366
+ "moonshotai/kimi-k2",
1367
+ "morph/morph-v3-fast",
1368
+ "morph/morph-v3-large",
1369
+ "openai/gpt-4-turbo",
1370
+ "openai/gpt-4.1",
1371
+ "openai/gpt-4.1-mini",
1372
+ "openai/gpt-4.1-nano",
1373
+ "openai/gpt-4o",
1374
+ "openai/gpt-4o-mini",
1375
+ "openai/gpt-5",
1376
+ "openai/gpt-5-codex",
1377
+ "openai/gpt-5-mini",
1378
+ "openai/gpt-5-nano",
1379
+ "openai/gpt-oss-120b",
1380
+ "openai/gpt-oss-20b",
1381
+ "openai/o1",
1382
+ "openai/o3",
1383
+ "openai/o3-mini",
1384
+ "openai/o4-mini",
1385
+ "perplexity/sonar",
1386
+ "perplexity/sonar-pro",
1387
+ "perplexity/sonar-reasoning",
1388
+ "perplexity/sonar-reasoning-pro",
1389
+ "vercel/v0-1.0-md",
1390
+ "vercel/v0-1.5-md",
1391
+ "xai/grok-2",
1392
+ "xai/grok-2-vision",
1393
+ "xai/grok-3",
1394
+ "xai/grok-3-fast",
1395
+ "xai/grok-3-mini",
1396
+ "xai/grok-3-mini-fast",
1397
+ "xai/grok-4",
1398
+ "xai/grok-4-fast",
1399
+ "xai/grok-4-fast-non-reasoning",
1400
+ "xai/grok-code-fast-1",
1401
+ "zai/glm-4.5",
1402
+ "zai/glm-4.5-air",
1403
+ "zai/glm-4.5v",
1404
+ "zai/glm-4.6"
1405
+ ],
1406
+ nebius: [
1407
+ "NousResearch/hermes-4-405b",
1408
+ "NousResearch/hermes-4-70b",
1409
+ "deepseek-ai/deepseek-v3",
1410
+ "meta-llama/llama-3.3-70b-instruct-base",
1411
+ "meta-llama/llama-3.3-70b-instruct-fast",
1412
+ "meta-llama/llama-3_1-405b-instruct",
1413
+ "moonshotai/kimi-k2-instruct",
1414
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1415
+ "openai/gpt-oss-120b",
1416
+ "openai/gpt-oss-20b",
1417
+ "qwen/qwen3-235b-a22b-instruct-2507",
1418
+ "qwen/qwen3-235b-a22b-thinking-2507",
1419
+ "qwen/qwen3-coder-480b-a35b-instruct",
1420
+ "zai-org/glm-4.5",
1421
+ "zai-org/glm-4.5-air"
1223
1422
  ],
1224
- modelscope: [
1423
+ deepseek: ["deepseek-chat", "deepseek-reasoner"],
1424
+ "alibaba-cn": [
1425
+ "deepseek-r1",
1426
+ "deepseek-r1-0528",
1427
+ "deepseek-r1-distill-llama-70b",
1428
+ "deepseek-r1-distill-llama-8b",
1429
+ "deepseek-r1-distill-qwen-1-5b",
1430
+ "deepseek-r1-distill-qwen-14b",
1431
+ "deepseek-r1-distill-qwen-32b",
1432
+ "deepseek-r1-distill-qwen-7b",
1433
+ "deepseek-v3",
1434
+ "deepseek-v3-1",
1435
+ "deepseek-v3-2-exp",
1436
+ "moonshot-kimi-k2-instruct",
1437
+ "qvq-max",
1438
+ "qwen-deep-research",
1439
+ "qwen-doc-turbo",
1440
+ "qwen-flash",
1441
+ "qwen-long",
1442
+ "qwen-math-plus",
1443
+ "qwen-math-turbo",
1444
+ "qwen-max",
1445
+ "qwen-mt-plus",
1446
+ "qwen-mt-turbo",
1447
+ "qwen-omni-turbo",
1448
+ "qwen-omni-turbo-realtime",
1449
+ "qwen-plus",
1450
+ "qwen-plus-character",
1451
+ "qwen-turbo",
1452
+ "qwen-vl-max",
1453
+ "qwen-vl-ocr",
1454
+ "qwen-vl-plus",
1455
+ "qwen2-5-14b-instruct",
1456
+ "qwen2-5-32b-instruct",
1457
+ "qwen2-5-72b-instruct",
1458
+ "qwen2-5-7b-instruct",
1459
+ "qwen2-5-coder-32b-instruct",
1460
+ "qwen2-5-coder-7b-instruct",
1461
+ "qwen2-5-math-72b-instruct",
1462
+ "qwen2-5-math-7b-instruct",
1463
+ "qwen2-5-omni-7b",
1464
+ "qwen2-5-vl-72b-instruct",
1465
+ "qwen2-5-vl-7b-instruct",
1466
+ "qwen3-14b",
1467
+ "qwen3-235b-a22b",
1468
+ "qwen3-32b",
1469
+ "qwen3-8b",
1470
+ "qwen3-asr-flash",
1471
+ "qwen3-coder-30b-a3b-instruct",
1472
+ "qwen3-coder-480b-a35b-instruct",
1473
+ "qwen3-coder-flash",
1474
+ "qwen3-coder-plus",
1475
+ "qwen3-max",
1476
+ "qwen3-next-80b-a3b-instruct",
1477
+ "qwen3-next-80b-a3b-thinking",
1478
+ "qwen3-omni-flash",
1479
+ "qwen3-omni-flash-realtime",
1480
+ "qwen3-vl-235b-a22b",
1481
+ "qwen3-vl-30b-a3b",
1482
+ "qwen3-vl-plus",
1483
+ "qwq-32b",
1484
+ "qwq-plus",
1485
+ "tongyi-intent-detect-v3"
1486
+ ],
1487
+ venice: [
1488
+ "deepseek-coder-v2-lite",
1489
+ "deepseek-r1-671b",
1490
+ "dolphin-2.9.2-qwen2-72b",
1491
+ "llama-3.1-405b",
1492
+ "llama-3.2-3b",
1493
+ "llama-3.3-70b",
1494
+ "mistral-31-24b",
1495
+ "qwen-2.5-coder-32b",
1496
+ "qwen-2.5-qwq-32b",
1497
+ "qwen-2.5-vl",
1498
+ "qwen3-235b",
1499
+ "qwen3-4b",
1500
+ "venice-uncensored"
1501
+ ],
1502
+ chutes: [
1225
1503
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1226
1504
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1505
+ "Qwen/Qwen3-30B-A3B",
1227
1506
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1228
1507
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1229
1508
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1230
- "ZhipuAI/GLM-4.5",
1231
- "ZhipuAI/GLM-4.6"
1509
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1510
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1511
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1512
+ "chutesai/Devstral-Small-2505",
1513
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1514
+ "deepseek-ai/DeepSeek-R1-0528",
1515
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1516
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1517
+ "deepseek-ai/DeepSeek-V3-0324",
1518
+ "deepseek-ai/DeepSeek-V3.1",
1519
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1520
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1521
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1522
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1523
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1524
+ "moonshotai/Kimi-Dev-72B",
1525
+ "moonshotai/Kimi-K2-Instruct-0905",
1526
+ "moonshotai/Kimi-K2-Instruct-75k",
1527
+ "moonshotai/Kimi-VL-A3B-Thinking",
1528
+ "openai/gpt-oss-120b",
1529
+ "tngtech/DeepSeek-R1T-Chimera",
1530
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1531
+ "zai-org/GLM-4.5-Air",
1532
+ "zai-org/GLM-4.5-FP8",
1533
+ "zai-org/GLM-4.5-turbo",
1534
+ "zai-org/GLM-4.6-FP8",
1535
+ "zai-org/GLM-4.6-turbo"
1232
1536
  ],
1233
- aihubmix: [
1234
- "DeepSeek-V3.2-Exp",
1235
- "DeepSeek-V3.2-Exp-Think",
1236
- "Kimi-K2-0905",
1237
- "claude-haiku-4-5",
1238
- "claude-opus-4-1",
1239
- "claude-sonnet-4-5",
1240
- "gemini-2.5-flash",
1537
+ cortecs: [
1538
+ "claude-4-5-sonnet",
1539
+ "claude-sonnet-4",
1540
+ "deepseek-v3-0324",
1241
1541
  "gemini-2.5-pro",
1242
- "glm-4.6",
1243
1542
  "gpt-4.1",
1244
- "gpt-4.1-mini",
1245
- "gpt-4.1-nano",
1246
- "gpt-4o",
1247
- "gpt-4o-2024-11-20",
1248
- "gpt-5",
1249
- "gpt-5-codex",
1250
- "gpt-5-mini",
1251
- "gpt-5-nano",
1252
- "gpt-5-pro",
1253
- "o4-mini",
1254
- "qwen3-235b-a22b-instruct-2507",
1255
- "qwen3-235b-a22b-thinking-2507",
1543
+ "gpt-oss-120b",
1544
+ "kimi-k2-instruct",
1545
+ "llama-3.1-405b-instruct",
1546
+ "nova-pro-v1",
1547
+ "qwen3-32b",
1256
1548
  "qwen3-coder-480b-a35b-instruct"
1257
1549
  ],
1258
- lucidquery: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1259
- xai: [
1260
- "grok-2",
1261
- "grok-2-1212",
1262
- "grok-2-latest",
1263
- "grok-2-vision",
1264
- "grok-2-vision-1212",
1265
- "grok-2-vision-latest",
1266
- "grok-3",
1267
- "grok-3-fast",
1268
- "grok-3-fast-latest",
1269
- "grok-3-latest",
1270
- "grok-3-mini",
1271
- "grok-3-mini-fast",
1272
- "grok-3-mini-fast-latest",
1273
- "grok-3-mini-latest",
1274
- "grok-4",
1275
- "grok-4-fast",
1276
- "grok-4-fast-non-reasoning",
1277
- "grok-beta",
1278
- "grok-code-fast-1",
1279
- "grok-vision-beta"
1280
- ],
1281
- deepseek: ["deepseek-chat", "deepseek-reasoner"],
1282
- requesty: [
1283
- "anthropic/claude-3-7-sonnet",
1284
- "anthropic/claude-4-sonnet-20250522",
1285
- "anthropic/claude-opus-4",
1286
- "anthropic/claude-opus-4-1-20250805",
1287
- "google/gemini-2.5-flash",
1288
- "google/gemini-2.5-pro",
1550
+ "github-models": [
1551
+ "ai21-labs/ai21-jamba-1.5-large",
1552
+ "ai21-labs/ai21-jamba-1.5-mini",
1553
+ "cohere/cohere-command-a",
1554
+ "cohere/cohere-command-r",
1555
+ "cohere/cohere-command-r-08-2024",
1556
+ "cohere/cohere-command-r-plus",
1557
+ "cohere/cohere-command-r-plus-08-2024",
1558
+ "core42/jais-30b-chat",
1559
+ "deepseek/deepseek-r1",
1560
+ "deepseek/deepseek-r1-0528",
1561
+ "deepseek/deepseek-v3-0324",
1562
+ "meta/llama-3.2-11b-vision-instruct",
1563
+ "meta/llama-3.2-90b-vision-instruct",
1564
+ "meta/llama-3.3-70b-instruct",
1565
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
1566
+ "meta/llama-4-scout-17b-16e-instruct",
1567
+ "meta/meta-llama-3-70b-instruct",
1568
+ "meta/meta-llama-3-8b-instruct",
1569
+ "meta/meta-llama-3.1-405b-instruct",
1570
+ "meta/meta-llama-3.1-70b-instruct",
1571
+ "meta/meta-llama-3.1-8b-instruct",
1572
+ "microsoft/mai-ds-r1",
1573
+ "microsoft/phi-3-medium-128k-instruct",
1574
+ "microsoft/phi-3-medium-4k-instruct",
1575
+ "microsoft/phi-3-mini-128k-instruct",
1576
+ "microsoft/phi-3-mini-4k-instruct",
1577
+ "microsoft/phi-3-small-128k-instruct",
1578
+ "microsoft/phi-3-small-8k-instruct",
1579
+ "microsoft/phi-3.5-mini-instruct",
1580
+ "microsoft/phi-3.5-moe-instruct",
1581
+ "microsoft/phi-3.5-vision-instruct",
1582
+ "microsoft/phi-4",
1583
+ "microsoft/phi-4-mini-instruct",
1584
+ "microsoft/phi-4-mini-reasoning",
1585
+ "microsoft/phi-4-multimodal-instruct",
1586
+ "microsoft/phi-4-reasoning",
1587
+ "mistral-ai/codestral-2501",
1588
+ "mistral-ai/ministral-3b",
1589
+ "mistral-ai/mistral-large-2411",
1590
+ "mistral-ai/mistral-medium-2505",
1591
+ "mistral-ai/mistral-nemo",
1592
+ "mistral-ai/mistral-small-2503",
1289
1593
  "openai/gpt-4.1",
1290
1594
  "openai/gpt-4.1-mini",
1595
+ "openai/gpt-4.1-nano",
1596
+ "openai/gpt-4o",
1291
1597
  "openai/gpt-4o-mini",
1292
- "openai/gpt-5",
1293
- "openai/gpt-5-mini",
1294
- "openai/gpt-5-nano",
1295
- "openai/o4-mini"
1598
+ "openai/o1",
1599
+ "openai/o1-mini",
1600
+ "openai/o1-preview",
1601
+ "openai/o3",
1602
+ "openai/o3-mini",
1603
+ "openai/o4-mini",
1604
+ "xai/grok-3",
1605
+ "xai/grok-3-mini"
1606
+ ],
1607
+ togetherai: [
1608
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1609
+ "deepseek-ai/DeepSeek-R1",
1610
+ "deepseek-ai/DeepSeek-V3",
1611
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1612
+ "moonshotai/Kimi-K2-Instruct",
1613
+ "openai/gpt-oss-120b"
1614
+ ],
1615
+ baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1616
+ huggingface: [
1617
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1618
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1619
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1620
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1621
+ "deepseek-ai/DeepSeek-R1-0528",
1622
+ "deepseek-ai/Deepseek-V3-0324",
1623
+ "moonshotai/Kimi-K2-Instruct",
1624
+ "moonshotai/Kimi-K2-Instruct-0905",
1625
+ "zai-org/GLM-4.5",
1626
+ "zai-org/GLM-4.5-Air",
1627
+ "zai-org/GLM-4.6"
1296
1628
  ],
1297
- nebius: [
1298
- "NousResearch/hermes-4-405b",
1299
- "NousResearch/hermes-4-70b",
1300
- "deepseek-ai/deepseek-v3",
1301
- "meta-llama/llama-3.3-70b-instruct-base",
1302
- "meta-llama/llama-3.3-70b-instruct-fast",
1303
- "meta-llama/llama-3_1-405b-instruct",
1304
- "moonshotai/kimi-k2-instruct",
1305
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1306
- "openai/gpt-oss-120b",
1307
- "openai/gpt-oss-20b",
1308
- "qwen/qwen3-235b-a22b-instruct-2507",
1309
- "qwen/qwen3-235b-a22b-thinking-2507",
1310
- "qwen/qwen3-coder-480b-a35b-instruct",
1311
- "zai-org/glm-4.5",
1312
- "zai-org/glm-4.5-air"
1629
+ opencode: [
1630
+ "an-gbt",
1631
+ "big-pickle",
1632
+ "claude-3-5-haiku",
1633
+ "claude-haiku-4-5",
1634
+ "claude-opus-4-1",
1635
+ "claude-sonnet-4",
1636
+ "claude-sonnet-4-5",
1637
+ "code-supernova",
1638
+ "glm-4.6",
1639
+ "gpt-5",
1640
+ "gpt-5-codex",
1641
+ "grok-code",
1642
+ "kimi-k2",
1643
+ "qwen3-coder"
1313
1644
  ],
1314
1645
  fastrouter: [
1315
1646
  "anthropic/claude-opus-4.1",
@@ -1327,22 +1658,75 @@ var provider_registry_default = {
1327
1658
  "qwen/qwen3-coder",
1328
1659
  "x-ai/grok-4"
1329
1660
  ],
1330
- perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1331
- morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1332
- "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1333
- huggingface: [
1661
+ google: [
1662
+ "gemini-1.5-flash",
1663
+ "gemini-1.5-flash-8b",
1664
+ "gemini-1.5-pro",
1665
+ "gemini-2.0-flash",
1666
+ "gemini-2.0-flash-lite",
1667
+ "gemini-2.5-flash",
1668
+ "gemini-2.5-flash-image",
1669
+ "gemini-2.5-flash-image-preview",
1670
+ "gemini-2.5-flash-lite",
1671
+ "gemini-2.5-flash-lite-preview-06-17",
1672
+ "gemini-2.5-flash-lite-preview-09-2025",
1673
+ "gemini-2.5-flash-preview-04-17",
1674
+ "gemini-2.5-flash-preview-05-20",
1675
+ "gemini-2.5-flash-preview-09-2025",
1676
+ "gemini-2.5-flash-preview-tts",
1677
+ "gemini-2.5-pro",
1678
+ "gemini-2.5-pro-preview-05-06",
1679
+ "gemini-2.5-pro-preview-06-05",
1680
+ "gemini-2.5-pro-preview-tts",
1681
+ "gemini-flash-latest",
1682
+ "gemini-flash-lite-latest",
1683
+ "gemini-live-2.5-flash",
1684
+ "gemini-live-2.5-flash-preview-native-audio"
1685
+ ],
1686
+ inception: ["mercury", "mercury-coder"],
1687
+ wandb: [
1688
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1334
1689
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1335
1690
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1336
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1337
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1338
1691
  "deepseek-ai/DeepSeek-R1-0528",
1339
- "deepseek-ai/Deepseek-V3-0324",
1340
- "moonshotai/Kimi-K2-Instruct",
1341
- "moonshotai/Kimi-K2-Instruct-0905",
1342
- "zai-org/GLM-4.5",
1343
- "zai-org/GLM-4.5-Air",
1344
- "zai-org/GLM-4.6"
1692
+ "deepseek-ai/DeepSeek-V3-0324",
1693
+ "meta-llama/Llama-3.1-8B-Instruct",
1694
+ "meta-llama/Llama-3.3-70B-Instruct",
1695
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1696
+ "microsoft/Phi-4-mini-instruct",
1697
+ "moonshotai/Kimi-K2-Instruct"
1698
+ ],
1699
+ openai: [
1700
+ "codex-mini-latest",
1701
+ "gpt-3.5-turbo",
1702
+ "gpt-4",
1703
+ "gpt-4-turbo",
1704
+ "gpt-4.1",
1705
+ "gpt-4.1-mini",
1706
+ "gpt-4.1-nano",
1707
+ "gpt-4o",
1708
+ "gpt-4o-2024-05-13",
1709
+ "gpt-4o-2024-08-06",
1710
+ "gpt-4o-2024-11-20",
1711
+ "gpt-4o-mini",
1712
+ "gpt-5",
1713
+ "gpt-5-chat-latest",
1714
+ "gpt-5-codex",
1715
+ "gpt-5-mini",
1716
+ "gpt-5-nano",
1717
+ "o1",
1718
+ "o1-mini",
1719
+ "o1-preview",
1720
+ "o1-pro",
1721
+ "o3",
1722
+ "o3-deep-research",
1723
+ "o3-mini",
1724
+ "o3-pro",
1725
+ "o4-mini",
1726
+ "o4-mini-deep-research"
1345
1727
  ],
1728
+ "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1729
+ perplexity: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1346
1730
  openrouter: [
1347
1731
  "anthropic/claude-3.5-haiku",
1348
1732
  "anthropic/claude-3.7-sonnet",
@@ -1387,192 +1771,73 @@ var provider_registry_default = {
1387
1771
  "mistralai/devstral-small-2505:free",
1388
1772
  "mistralai/devstral-small-2507",
1389
1773
  "mistralai/mistral-7b-instruct:free",
1390
- "mistralai/mistral-medium-3",
1391
- "mistralai/mistral-medium-3.1",
1392
- "mistralai/mistral-nemo:free",
1393
- "mistralai/mistral-small-3.1-24b-instruct",
1394
- "mistralai/mistral-small-3.2-24b-instruct",
1395
- "mistralai/mistral-small-3.2-24b-instruct:free",
1396
- "moonshotai/kimi-dev-72b:free",
1397
- "moonshotai/kimi-k2",
1398
- "moonshotai/kimi-k2-0905",
1399
- "moonshotai/kimi-k2:free",
1400
- "nousresearch/deephermes-3-llama-3-8b-preview",
1401
- "nousresearch/hermes-4-405b",
1402
- "nousresearch/hermes-4-70b",
1403
- "openai/gpt-4.1",
1404
- "openai/gpt-4.1-mini",
1405
- "openai/gpt-4o-mini",
1406
- "openai/gpt-5",
1407
- "openai/gpt-5-chat",
1408
- "openai/gpt-5-codex",
1409
- "openai/gpt-5-image",
1410
- "openai/gpt-5-mini",
1411
- "openai/gpt-5-nano",
1412
- "openai/gpt-oss-120b",
1413
- "openai/gpt-oss-20b",
1414
- "openai/o4-mini",
1415
- "openrouter/cypher-alpha:free",
1416
- "openrouter/horizon-alpha",
1417
- "openrouter/horizon-beta",
1418
- "openrouter/sonoma-dusk-alpha",
1419
- "openrouter/sonoma-sky-alpha",
1420
- "qwen/qwen-2.5-coder-32b-instruct",
1421
- "qwen/qwen2.5-vl-32b-instruct:free",
1422
- "qwen/qwen2.5-vl-72b-instruct",
1423
- "qwen/qwen2.5-vl-72b-instruct:free",
1424
- "qwen/qwen3-14b:free",
1425
- "qwen/qwen3-235b-a22b-07-25",
1426
- "qwen/qwen3-235b-a22b-07-25:free",
1427
- "qwen/qwen3-235b-a22b-thinking-2507",
1428
- "qwen/qwen3-235b-a22b:free",
1429
- "qwen/qwen3-30b-a3b-instruct-2507",
1430
- "qwen/qwen3-30b-a3b-thinking-2507",
1431
- "qwen/qwen3-30b-a3b:free",
1432
- "qwen/qwen3-32b:free",
1433
- "qwen/qwen3-8b:free",
1434
- "qwen/qwen3-coder",
1435
- "qwen/qwen3-coder:free",
1436
- "qwen/qwen3-max",
1437
- "qwen/qwen3-next-80b-a3b-instruct",
1438
- "qwen/qwen3-next-80b-a3b-thinking",
1439
- "qwen/qwq-32b:free",
1440
- "rekaai/reka-flash-3",
1441
- "sarvamai/sarvam-m:free",
1442
- "thudm/glm-z1-32b:free",
1443
- "tngtech/deepseek-r1t2-chimera:free",
1444
- "x-ai/grok-3",
1445
- "x-ai/grok-3-beta",
1446
- "x-ai/grok-3-mini",
1447
- "x-ai/grok-3-mini-beta",
1448
- "x-ai/grok-4",
1449
- "x-ai/grok-4-fast",
1450
- "x-ai/grok-4-fast:free",
1451
- "x-ai/grok-code-fast-1",
1452
- "z-ai/glm-4.5",
1453
- "z-ai/glm-4.5-air",
1454
- "z-ai/glm-4.5-air:free",
1455
- "z-ai/glm-4.5v",
1456
- "z-ai/glm-4.6"
1457
- ],
1458
- cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1459
- zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1460
- togetherai: [
1461
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1462
- "deepseek-ai/DeepSeek-R1",
1463
- "deepseek-ai/DeepSeek-V3",
1464
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1465
- "moonshotai/Kimi-K2-Instruct",
1466
- "openai/gpt-oss-120b"
1467
- ],
1468
- wandb: [
1469
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1470
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1471
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1472
- "deepseek-ai/DeepSeek-R1-0528",
1473
- "deepseek-ai/DeepSeek-V3-0324",
1474
- "meta-llama/Llama-3.1-8B-Instruct",
1475
- "meta-llama/Llama-3.3-70B-Instruct",
1476
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1477
- "microsoft/Phi-4-mini-instruct",
1478
- "moonshotai/Kimi-K2-Instruct"
1479
- ],
1480
- submodel: [
1481
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1482
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1483
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1484
- "deepseek-ai/DeepSeek-R1-0528",
1485
- "deepseek-ai/DeepSeek-V3-0324",
1486
- "deepseek-ai/DeepSeek-V3.1",
1487
- "openai/gpt-oss-120b",
1488
- "zai-org/GLM-4.5-Air",
1489
- "zai-org/GLM-4.5-FP8"
1490
- ],
1491
- vercel: [
1492
- "alibaba/qwen3-coder-plus",
1493
- "alibaba/qwen3-max",
1494
- "alibaba/qwen3-next-80b-a3b-instruct",
1495
- "alibaba/qwen3-next-80b-a3b-thinking",
1496
- "alibaba/qwen3-vl-instruct",
1497
- "alibaba/qwen3-vl-thinking",
1498
- "amazon/nova-lite",
1499
- "amazon/nova-micro",
1500
- "amazon/nova-pro",
1501
- "anthropic/claude-3-5-haiku",
1502
- "anthropic/claude-3-haiku",
1503
- "anthropic/claude-3-opus",
1504
- "anthropic/claude-3.5-sonnet",
1505
- "anthropic/claude-3.7-sonnet",
1506
- "anthropic/claude-4-1-opus",
1507
- "anthropic/claude-4-opus",
1508
- "anthropic/claude-4-sonnet",
1509
- "anthropic/claude-4.5-sonnet",
1510
- "anthropic/claude-haiku-4.5",
1511
- "cerebras/qwen3-coder",
1512
- "deepseek/deepseek-r1",
1513
- "deepseek/deepseek-r1-distill-llama-70b",
1514
- "deepseek/deepseek-v3.1-terminus",
1515
- "deepseek/deepseek-v3.2-exp",
1516
- "deepseek/deepseek-v3.2-exp-thinking",
1517
- "google/gemini-2.0-flash",
1518
- "google/gemini-2.0-flash-lite",
1519
- "google/gemini-2.5-flash",
1520
- "google/gemini-2.5-flash-lite",
1521
- "google/gemini-2.5-flash-lite-preview-09-2025",
1522
- "google/gemini-2.5-flash-preview-09-2025",
1523
- "google/gemini-2.5-pro",
1524
- "meta/llama-3.3-70b",
1525
- "meta/llama-4-maverick",
1526
- "meta/llama-4-scout",
1527
- "mistral/codestral",
1528
- "mistral/magistral-medium",
1529
- "mistral/magistral-small",
1530
- "mistral/ministral-3b",
1531
- "mistral/ministral-8b",
1532
- "mistral/mistral-large",
1533
- "mistral/mistral-small",
1534
- "mistral/mixtral-8x22b-instruct",
1535
- "mistral/pixtral-12b",
1536
- "mistral/pixtral-large",
1774
+ "mistralai/mistral-medium-3",
1775
+ "mistralai/mistral-medium-3.1",
1776
+ "mistralai/mistral-nemo:free",
1777
+ "mistralai/mistral-small-3.1-24b-instruct",
1778
+ "mistralai/mistral-small-3.2-24b-instruct",
1779
+ "mistralai/mistral-small-3.2-24b-instruct:free",
1780
+ "moonshotai/kimi-dev-72b:free",
1537
1781
  "moonshotai/kimi-k2",
1538
- "morph/morph-v3-fast",
1539
- "morph/morph-v3-large",
1540
- "openai/gpt-4-turbo",
1782
+ "moonshotai/kimi-k2-0905",
1783
+ "moonshotai/kimi-k2:free",
1784
+ "nousresearch/deephermes-3-llama-3-8b-preview",
1785
+ "nousresearch/hermes-4-405b",
1786
+ "nousresearch/hermes-4-70b",
1541
1787
  "openai/gpt-4.1",
1542
1788
  "openai/gpt-4.1-mini",
1543
- "openai/gpt-4.1-nano",
1544
- "openai/gpt-4o",
1545
1789
  "openai/gpt-4o-mini",
1546
1790
  "openai/gpt-5",
1791
+ "openai/gpt-5-chat",
1547
1792
  "openai/gpt-5-codex",
1793
+ "openai/gpt-5-image",
1548
1794
  "openai/gpt-5-mini",
1549
1795
  "openai/gpt-5-nano",
1550
1796
  "openai/gpt-oss-120b",
1551
1797
  "openai/gpt-oss-20b",
1552
- "openai/o1",
1553
- "openai/o3",
1554
- "openai/o3-mini",
1555
1798
  "openai/o4-mini",
1556
- "perplexity/sonar",
1557
- "perplexity/sonar-pro",
1558
- "perplexity/sonar-reasoning",
1559
- "perplexity/sonar-reasoning-pro",
1560
- "vercel/v0-1.0-md",
1561
- "vercel/v0-1.5-md",
1562
- "xai/grok-2",
1563
- "xai/grok-2-vision",
1564
- "xai/grok-3",
1565
- "xai/grok-3-fast",
1566
- "xai/grok-3-mini",
1567
- "xai/grok-3-mini-fast",
1568
- "xai/grok-4",
1569
- "xai/grok-4-fast",
1570
- "xai/grok-4-fast-non-reasoning",
1571
- "xai/grok-code-fast-1",
1572
- "zai/glm-4.5",
1573
- "zai/glm-4.5-air",
1574
- "zai/glm-4.5v",
1575
- "zai/glm-4.6"
1799
+ "openrouter/cypher-alpha:free",
1800
+ "openrouter/horizon-alpha",
1801
+ "openrouter/horizon-beta",
1802
+ "openrouter/sonoma-dusk-alpha",
1803
+ "openrouter/sonoma-sky-alpha",
1804
+ "qwen/qwen-2.5-coder-32b-instruct",
1805
+ "qwen/qwen2.5-vl-32b-instruct:free",
1806
+ "qwen/qwen2.5-vl-72b-instruct",
1807
+ "qwen/qwen2.5-vl-72b-instruct:free",
1808
+ "qwen/qwen3-14b:free",
1809
+ "qwen/qwen3-235b-a22b-07-25",
1810
+ "qwen/qwen3-235b-a22b-07-25:free",
1811
+ "qwen/qwen3-235b-a22b-thinking-2507",
1812
+ "qwen/qwen3-235b-a22b:free",
1813
+ "qwen/qwen3-30b-a3b-instruct-2507",
1814
+ "qwen/qwen3-30b-a3b-thinking-2507",
1815
+ "qwen/qwen3-30b-a3b:free",
1816
+ "qwen/qwen3-32b:free",
1817
+ "qwen/qwen3-8b:free",
1818
+ "qwen/qwen3-coder",
1819
+ "qwen/qwen3-coder:free",
1820
+ "qwen/qwen3-max",
1821
+ "qwen/qwen3-next-80b-a3b-instruct",
1822
+ "qwen/qwen3-next-80b-a3b-thinking",
1823
+ "qwen/qwq-32b:free",
1824
+ "rekaai/reka-flash-3",
1825
+ "sarvamai/sarvam-m:free",
1826
+ "thudm/glm-z1-32b:free",
1827
+ "tngtech/deepseek-r1t2-chimera:free",
1828
+ "x-ai/grok-3",
1829
+ "x-ai/grok-3-beta",
1830
+ "x-ai/grok-3-mini",
1831
+ "x-ai/grok-3-mini-beta",
1832
+ "x-ai/grok-4",
1833
+ "x-ai/grok-4-fast",
1834
+ "x-ai/grok-4-fast:free",
1835
+ "x-ai/grok-code-fast-1",
1836
+ "z-ai/glm-4.5",
1837
+ "z-ai/glm-4.5-air",
1838
+ "z-ai/glm-4.5-air:free",
1839
+ "z-ai/glm-4.5v",
1840
+ "z-ai/glm-4.6"
1576
1841
  ],
1577
1842
  synthetic: [
1578
1843
  "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
@@ -1597,184 +1862,53 @@ var provider_registry_default = {
1597
1862
  "hf:zai-org/GLM-4.5",
1598
1863
  "hf:zai-org/GLM-4.6"
1599
1864
  ],
1600
- google: [
1601
- "gemini-1.5-flash",
1602
- "gemini-1.5-flash-8b",
1603
- "gemini-1.5-pro",
1604
- "gemini-2.0-flash",
1605
- "gemini-2.0-flash-lite",
1606
- "gemini-2.5-flash",
1607
- "gemini-2.5-flash-image",
1608
- "gemini-2.5-flash-image-preview",
1609
- "gemini-2.5-flash-lite",
1610
- "gemini-2.5-flash-lite-preview-06-17",
1611
- "gemini-2.5-flash-lite-preview-09-2025",
1612
- "gemini-2.5-flash-preview-04-17",
1613
- "gemini-2.5-flash-preview-05-20",
1614
- "gemini-2.5-flash-preview-09-2025",
1615
- "gemini-2.5-flash-preview-tts",
1616
- "gemini-2.5-pro",
1617
- "gemini-2.5-pro-preview-05-06",
1618
- "gemini-2.5-pro-preview-06-05",
1619
- "gemini-2.5-pro-preview-tts",
1620
- "gemini-flash-latest",
1621
- "gemini-flash-lite-latest",
1622
- "gemini-live-2.5-flash",
1623
- "gemini-live-2.5-flash-preview-native-audio"
1624
- ],
1625
- groq: [
1626
- "deepseek-r1-distill-llama-70b",
1627
- "gemma2-9b-it",
1628
- "llama-3.1-8b-instant",
1629
- "llama-3.3-70b-versatile",
1630
- "llama-guard-3-8b",
1631
- "llama3-70b-8192",
1632
- "llama3-8b-8192",
1633
- "meta-llama/llama-4-maverick-17b-128e-instruct",
1634
- "meta-llama/llama-4-scout-17b-16e-instruct",
1635
- "meta-llama/llama-guard-4-12b",
1636
- "mistral-saba-24b",
1637
- "moonshotai/kimi-k2-instruct",
1638
- "moonshotai/kimi-k2-instruct-0905",
1639
- "openai/gpt-oss-120b",
1640
- "openai/gpt-oss-20b",
1641
- "qwen-qwq-32b",
1642
- "qwen/qwen3-32b"
1643
- ],
1644
- "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1645
- "github-models": [
1646
- "ai21-labs/ai21-jamba-1.5-large",
1647
- "ai21-labs/ai21-jamba-1.5-mini",
1648
- "cohere/cohere-command-a",
1649
- "cohere/cohere-command-r",
1650
- "cohere/cohere-command-r-08-2024",
1651
- "cohere/cohere-command-r-plus",
1652
- "cohere/cohere-command-r-plus-08-2024",
1653
- "core42/jais-30b-chat",
1654
- "deepseek/deepseek-r1",
1655
- "deepseek/deepseek-r1-0528",
1656
- "deepseek/deepseek-v3-0324",
1657
- "meta/llama-3.2-11b-vision-instruct",
1658
- "meta/llama-3.2-90b-vision-instruct",
1659
- "meta/llama-3.3-70b-instruct",
1660
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
1661
- "meta/llama-4-scout-17b-16e-instruct",
1662
- "meta/meta-llama-3-70b-instruct",
1663
- "meta/meta-llama-3-8b-instruct",
1664
- "meta/meta-llama-3.1-405b-instruct",
1665
- "meta/meta-llama-3.1-70b-instruct",
1666
- "meta/meta-llama-3.1-8b-instruct",
1667
- "microsoft/mai-ds-r1",
1668
- "microsoft/phi-3-medium-128k-instruct",
1669
- "microsoft/phi-3-medium-4k-instruct",
1670
- "microsoft/phi-3-mini-128k-instruct",
1671
- "microsoft/phi-3-mini-4k-instruct",
1672
- "microsoft/phi-3-small-128k-instruct",
1673
- "microsoft/phi-3-small-8k-instruct",
1674
- "microsoft/phi-3.5-mini-instruct",
1675
- "microsoft/phi-3.5-moe-instruct",
1676
- "microsoft/phi-3.5-vision-instruct",
1677
- "microsoft/phi-4",
1678
- "microsoft/phi-4-mini-instruct",
1679
- "microsoft/phi-4-mini-reasoning",
1680
- "microsoft/phi-4-multimodal-instruct",
1681
- "microsoft/phi-4-reasoning",
1682
- "mistral-ai/codestral-2501",
1683
- "mistral-ai/ministral-3b",
1684
- "mistral-ai/mistral-large-2411",
1685
- "mistral-ai/mistral-medium-2505",
1686
- "mistral-ai/mistral-nemo",
1687
- "mistral-ai/mistral-small-2503",
1688
- "openai/gpt-4.1",
1689
- "openai/gpt-4.1-mini",
1690
- "openai/gpt-4.1-nano",
1691
- "openai/gpt-4o",
1692
- "openai/gpt-4o-mini",
1693
- "openai/o1",
1694
- "openai/o1-mini",
1695
- "openai/o1-preview",
1696
- "openai/o3",
1697
- "openai/o3-mini",
1698
- "openai/o4-mini",
1699
- "xai/grok-3",
1700
- "xai/grok-3-mini"
1701
- ],
1702
1865
  deepinfra: [
1703
1866
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1704
1867
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1705
1868
  "moonshotai/Kimi-K2-Instruct",
1706
1869
  "zai-org/GLM-4.5"
1707
1870
  ],
1708
- "fireworks-ai": [
1709
- "accounts/fireworks/models/deepseek-r1-0528",
1710
- "accounts/fireworks/models/deepseek-v3-0324",
1711
- "accounts/fireworks/models/deepseek-v3p1",
1712
- "accounts/fireworks/models/glm-4p5",
1713
- "accounts/fireworks/models/glm-4p5-air",
1714
- "accounts/fireworks/models/gpt-oss-120b",
1715
- "accounts/fireworks/models/gpt-oss-20b",
1716
- "accounts/fireworks/models/kimi-k2-instruct",
1717
- "accounts/fireworks/models/qwen3-235b-a22b",
1718
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1871
+ zhipuai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1872
+ submodel: [
1873
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1874
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1875
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1876
+ "deepseek-ai/DeepSeek-R1-0528",
1877
+ "deepseek-ai/DeepSeek-V3-0324",
1878
+ "deepseek-ai/DeepSeek-V3.1",
1879
+ "openai/gpt-oss-120b",
1880
+ "zai-org/GLM-4.5-Air",
1881
+ "zai-org/GLM-4.5-FP8"
1719
1882
  ],
1720
1883
  zai: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1721
- opencode: [
1722
- "an-gbt",
1723
- "big-pickle",
1724
- "claude-3-5-haiku",
1725
- "claude-haiku-4-5",
1726
- "claude-opus-4-1",
1727
- "claude-sonnet-4",
1728
- "claude-sonnet-4-5",
1729
- "code-supernova",
1730
- "glm-4.6",
1731
- "gpt-5",
1732
- "gpt-5-codex",
1733
- "grok-code",
1734
- "kimi-k2",
1735
- "qwen3-coder"
1884
+ inference: [
1885
+ "google/gemma-3",
1886
+ "meta/llama-3.1-8b-instruct",
1887
+ "meta/llama-3.2-11b-vision-instruct",
1888
+ "meta/llama-3.2-1b-instruct",
1889
+ "meta/llama-3.2-3b-instruct",
1890
+ "mistral/mistral-nemo-12b-instruct",
1891
+ "osmosis/osmosis-structure-0.6b",
1892
+ "qwen/qwen-2.5-7b-vision-instruct",
1893
+ "qwen/qwen3-embedding-4b"
1736
1894
  ],
1737
- "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1738
- inception: ["mercury", "mercury-coder"],
1739
- llama: [
1740
- "cerebras-llama-4-maverick-17b-128e-instruct",
1741
- "cerebras-llama-4-scout-17b-16e-instruct",
1742
- "groq-llama-4-maverick-17b-128e-instruct",
1743
- "llama-3.3-70b-instruct",
1744
- "llama-3.3-8b-instruct",
1745
- "llama-4-maverick-17b-128e-instruct-fp8",
1746
- "llama-4-scout-17b-16e-instruct-fp8"
1895
+ requesty: [
1896
+ "anthropic/claude-3-7-sonnet",
1897
+ "anthropic/claude-4-sonnet-20250522",
1898
+ "anthropic/claude-opus-4",
1899
+ "anthropic/claude-opus-4-1-20250805",
1900
+ "google/gemini-2.5-flash",
1901
+ "google/gemini-2.5-pro",
1902
+ "openai/gpt-4.1",
1903
+ "openai/gpt-4.1-mini",
1904
+ "openai/gpt-4o-mini",
1905
+ "openai/gpt-5",
1906
+ "openai/gpt-5-mini",
1907
+ "openai/gpt-5-nano",
1908
+ "openai/o4-mini"
1747
1909
  ],
1910
+ morph: ["auto", "morph-v3-fast", "morph-v3-large"],
1748
1911
  lmstudio: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1749
- openai: [
1750
- "codex-mini-latest",
1751
- "gpt-3.5-turbo",
1752
- "gpt-4",
1753
- "gpt-4-turbo",
1754
- "gpt-4.1",
1755
- "gpt-4.1-mini",
1756
- "gpt-4.1-nano",
1757
- "gpt-4o",
1758
- "gpt-4o-2024-05-13",
1759
- "gpt-4o-2024-08-06",
1760
- "gpt-4o-2024-11-20",
1761
- "gpt-4o-mini",
1762
- "gpt-5",
1763
- "gpt-5-chat-latest",
1764
- "gpt-5-codex",
1765
- "gpt-5-mini",
1766
- "gpt-5-nano",
1767
- "o1",
1768
- "o1-mini",
1769
- "o1-preview",
1770
- "o1-pro",
1771
- "o3",
1772
- "o3-deep-research",
1773
- "o3-mini",
1774
- "o3-pro",
1775
- "o4-mini",
1776
- "o4-mini-deep-research"
1777
- ],
1778
1912
  anthropic: [
1779
1913
  "claude-3-5-haiku-20241022",
1780
1914
  "claude-3-5-haiku-latest",
@@ -1796,208 +1930,50 @@ var provider_registry_default = {
1796
1930
  "claude-sonnet-4-5",
1797
1931
  "claude-sonnet-4-5-20250929"
1798
1932
  ],
1799
- moonshotai: ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1800
- inference: [
1801
- "google/gemma-3",
1802
- "meta/llama-3.1-8b-instruct",
1803
- "meta/llama-3.2-11b-vision-instruct",
1804
- "meta/llama-3.2-1b-instruct",
1805
- "meta/llama-3.2-3b-instruct",
1806
- "mistral/mistral-nemo-12b-instruct",
1807
- "osmosis/osmosis-structure-0.6b",
1808
- "qwen/qwen-2.5-7b-vision-instruct",
1809
- "qwen/qwen3-embedding-4b"
1810
- ],
1811
- baseten: ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1812
- cortecs: [
1813
- "claude-4-5-sonnet",
1814
- "claude-sonnet-4",
1815
- "deepseek-v3-0324",
1816
- "gemini-2.5-pro",
1817
- "gpt-4.1",
1818
- "gpt-oss-120b",
1819
- "kimi-k2-instruct",
1820
- "llama-3.1-405b-instruct",
1821
- "nova-pro-v1",
1822
- "qwen3-32b",
1823
- "qwen3-coder-480b-a35b-instruct"
1824
- ],
1825
- mistral: [
1826
- "codestral-latest",
1827
- "devstral-medium-2507",
1828
- "devstral-small-2505",
1829
- "devstral-small-2507",
1830
- "magistral-medium-latest",
1831
- "magistral-small",
1832
- "ministral-3b-latest",
1833
- "ministral-8b-latest",
1834
- "mistral-large-latest",
1835
- "mistral-medium-2505",
1836
- "mistral-medium-2508",
1837
- "mistral-medium-latest",
1838
- "mistral-nemo",
1839
- "mistral-small-latest",
1840
- "open-mistral-7b",
1841
- "open-mixtral-8x22b",
1842
- "open-mixtral-8x7b",
1843
- "pixtral-12b",
1844
- "pixtral-large-latest"
1845
- ],
1846
- venice: [
1847
- "deepseek-coder-v2-lite",
1848
- "deepseek-r1-671b",
1849
- "dolphin-2.9.2-qwen2-72b",
1850
- "llama-3.1-405b",
1851
- "llama-3.2-3b",
1852
- "llama-3.3-70b",
1853
- "mistral-31-24b",
1854
- "qwen-2.5-coder-32b",
1855
- "qwen-2.5-qwq-32b",
1856
- "qwen-2.5-vl",
1857
- "qwen3-235b",
1858
- "qwen3-4b",
1859
- "venice-uncensored"
1860
- ],
1861
- alibaba: [
1862
- "qvq-max",
1863
- "qwen-flash",
1864
- "qwen-max",
1865
- "qwen-mt-plus",
1866
- "qwen-mt-turbo",
1867
- "qwen-omni-turbo",
1868
- "qwen-omni-turbo-realtime",
1869
- "qwen-plus",
1870
- "qwen-plus-character-ja",
1871
- "qwen-turbo",
1872
- "qwen-vl-max",
1873
- "qwen-vl-ocr",
1874
- "qwen-vl-plus",
1875
- "qwen2-5-14b-instruct",
1876
- "qwen2-5-32b-instruct",
1877
- "qwen2-5-72b-instruct",
1878
- "qwen2-5-7b-instruct",
1879
- "qwen2-5-omni-7b",
1880
- "qwen2-5-vl-72b-instruct",
1881
- "qwen2-5-vl-7b-instruct",
1882
- "qwen3-14b",
1883
- "qwen3-235b-a22b",
1884
- "qwen3-32b",
1885
- "qwen3-8b",
1886
- "qwen3-asr-flash",
1887
- "qwen3-coder-30b-a3b-instruct",
1888
- "qwen3-coder-480b-a35b-instruct",
1889
- "qwen3-coder-flash",
1890
- "qwen3-coder-plus",
1891
- "qwen3-livetranslate-flash-realtime",
1892
- "qwen3-max",
1893
- "qwen3-next-80b-a3b-instruct",
1894
- "qwen3-next-80b-a3b-thinking",
1895
- "qwen3-omni-flash",
1896
- "qwen3-omni-flash-realtime",
1897
- "qwen3-vl-235b-a22b",
1898
- "qwen3-vl-30b-a3b",
1899
- "qwen3-vl-plus",
1900
- "qwq-plus"
1901
- ],
1902
- "alibaba-cn": [
1903
- "deepseek-r1",
1904
- "deepseek-r1-0528",
1905
- "deepseek-r1-distill-llama-70b",
1906
- "deepseek-r1-distill-llama-8b",
1907
- "deepseek-r1-distill-qwen-1-5b",
1908
- "deepseek-r1-distill-qwen-14b",
1909
- "deepseek-r1-distill-qwen-32b",
1910
- "deepseek-r1-distill-qwen-7b",
1911
- "deepseek-v3",
1912
- "deepseek-v3-1",
1913
- "deepseek-v3-2-exp",
1914
- "moonshot-kimi-k2-instruct",
1915
- "qvq-max",
1916
- "qwen-deep-research",
1917
- "qwen-doc-turbo",
1918
- "qwen-flash",
1919
- "qwen-long",
1920
- "qwen-math-plus",
1921
- "qwen-math-turbo",
1922
- "qwen-max",
1923
- "qwen-mt-plus",
1924
- "qwen-mt-turbo",
1925
- "qwen-omni-turbo",
1926
- "qwen-omni-turbo-realtime",
1927
- "qwen-plus",
1928
- "qwen-plus-character",
1929
- "qwen-turbo",
1930
- "qwen-vl-max",
1931
- "qwen-vl-ocr",
1932
- "qwen-vl-plus",
1933
- "qwen2-5-14b-instruct",
1934
- "qwen2-5-32b-instruct",
1935
- "qwen2-5-72b-instruct",
1936
- "qwen2-5-7b-instruct",
1937
- "qwen2-5-coder-32b-instruct",
1938
- "qwen2-5-coder-7b-instruct",
1939
- "qwen2-5-math-72b-instruct",
1940
- "qwen2-5-math-7b-instruct",
1941
- "qwen2-5-omni-7b",
1942
- "qwen2-5-vl-72b-instruct",
1943
- "qwen2-5-vl-7b-instruct",
1944
- "qwen3-14b",
1945
- "qwen3-235b-a22b",
1946
- "qwen3-32b",
1947
- "qwen3-8b",
1948
- "qwen3-asr-flash",
1949
- "qwen3-coder-30b-a3b-instruct",
1950
- "qwen3-coder-480b-a35b-instruct",
1951
- "qwen3-coder-flash",
1952
- "qwen3-coder-plus",
1953
- "qwen3-max",
1954
- "qwen3-next-80b-a3b-instruct",
1955
- "qwen3-next-80b-a3b-thinking",
1956
- "qwen3-omni-flash",
1957
- "qwen3-omni-flash-realtime",
1958
- "qwen3-vl-235b-a22b",
1959
- "qwen3-vl-30b-a3b",
1960
- "qwen3-vl-plus",
1961
- "qwq-32b",
1962
- "qwq-plus",
1963
- "tongyi-intent-detect-v3"
1933
+ "fireworks-ai": [
1934
+ "accounts/fireworks/models/deepseek-r1-0528",
1935
+ "accounts/fireworks/models/deepseek-v3-0324",
1936
+ "accounts/fireworks/models/deepseek-v3p1",
1937
+ "accounts/fireworks/models/glm-4p5",
1938
+ "accounts/fireworks/models/glm-4p5-air",
1939
+ "accounts/fireworks/models/gpt-oss-120b",
1940
+ "accounts/fireworks/models/gpt-oss-20b",
1941
+ "accounts/fireworks/models/kimi-k2-instruct",
1942
+ "accounts/fireworks/models/qwen3-235b-a22b",
1943
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1964
1944
  ],
1965
- chutes: [
1945
+ modelscope: [
1966
1946
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1967
1947
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1968
- "Qwen/Qwen3-30B-A3B",
1969
1948
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1970
1949
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1971
1950
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1972
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1973
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1974
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1975
- "chutesai/Devstral-Small-2505",
1976
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1977
- "deepseek-ai/DeepSeek-R1-0528",
1978
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1979
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1980
- "deepseek-ai/DeepSeek-V3-0324",
1981
- "deepseek-ai/DeepSeek-V3.1",
1982
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1983
- "deepseek-ai/DeepSeek-V3.1-turbo",
1984
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1985
- "deepseek-ai/DeepSeek-V3.2-Exp",
1986
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1987
- "moonshotai/Kimi-Dev-72B",
1988
- "moonshotai/Kimi-K2-Instruct-0905",
1989
- "moonshotai/Kimi-K2-Instruct-75k",
1990
- "moonshotai/Kimi-VL-A3B-Thinking",
1991
- "openai/gpt-oss-120b",
1992
- "tngtech/DeepSeek-R1T-Chimera",
1993
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1994
- "zai-org/GLM-4.5-Air",
1995
- "zai-org/GLM-4.5-FP8",
1996
- "zai-org/GLM-4.5-turbo",
1997
- "zai-org/GLM-4.6-FP8",
1998
- "zai-org/GLM-4.6-turbo"
1951
+ "ZhipuAI/GLM-4.5",
1952
+ "ZhipuAI/GLM-4.6"
1999
1953
  ],
2000
- upstage: ["solar-mini", "solar-pro2"],
1954
+ llama: [
1955
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1956
+ "cerebras-llama-4-scout-17b-16e-instruct",
1957
+ "groq-llama-4-maverick-17b-128e-instruct",
1958
+ "llama-3.3-70b-instruct",
1959
+ "llama-3.3-8b-instruct",
1960
+ "llama-4-maverick-17b-128e-instruct-fp8",
1961
+ "llama-4-scout-17b-16e-instruct-fp8"
1962
+ ],
1963
+ scaleway: [
1964
+ "deepseek-r1-distill-llama-70b",
1965
+ "gemma-3-27b-it",
1966
+ "gpt-oss-120b",
1967
+ "llama-3.1-8b-instruct",
1968
+ "llama-3.3-70b-instruct",
1969
+ "mistral-nemo-instruct-2407",
1970
+ "mistral-small-3.2-24b-instruct-2506",
1971
+ "pixtral-12b-2409",
1972
+ "qwen3-235b-a22b-instruct-2507",
1973
+ "qwen3-coder-30b-a3b-instruct",
1974
+ "voxtral-small-24b-2507"
1975
+ ],
1976
+ cerebras: ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
2001
1977
  netlify: [
2002
1978
  "anthropic/claude-3-5-haiku-20241022",
2003
1979
  "anthropic/claude-3-5-haiku-latest",
@@ -2580,5 +2556,5 @@ var ModelRouterEmbeddingModel = class {
2580
2556
  };
2581
2557
 
2582
2558
  export { ModelRouterEmbeddingModel, ModelRouterLanguageModel, PROVIDER_REGISTRY, getProviderConfig, parseModelString, resolveModelConfig };
2583
- //# sourceMappingURL=chunk-NIESGYOH.js.map
2584
- //# sourceMappingURL=chunk-NIESGYOH.js.map
2559
+ //# sourceMappingURL=chunk-A3TQYIIR.js.map
2560
+ //# sourceMappingURL=chunk-A3TQYIIR.js.map