@mastra/core 0.21.2-alpha.0 → 0.22.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (181) hide show
  1. package/CHANGELOG.md +194 -0
  2. package/dist/agent/agent.d.ts +1 -0
  3. package/dist/agent/agent.d.ts.map +1 -1
  4. package/dist/agent/index.cjs +13 -13
  5. package/dist/agent/index.js +2 -2
  6. package/dist/agent/input-processor/index.cjs +6 -6
  7. package/dist/agent/input-processor/index.js +1 -1
  8. package/dist/agent/message-list/index.d.ts +14 -1
  9. package/dist/agent/message-list/index.d.ts.map +1 -1
  10. package/dist/agent/test-utils.d.ts +1 -0
  11. package/dist/agent/test-utils.d.ts.map +1 -1
  12. package/dist/agent/types.d.ts +6 -1
  13. package/dist/agent/types.d.ts.map +1 -1
  14. package/dist/agent/utils.d.ts +1 -1
  15. package/dist/agent/utils.d.ts.map +1 -1
  16. package/dist/ai-tracing/chunk-tracing.d.ts +76 -0
  17. package/dist/ai-tracing/chunk-tracing.d.ts.map +1 -0
  18. package/dist/ai-tracing/exporters/base.d.ts +111 -0
  19. package/dist/ai-tracing/exporters/base.d.ts.map +1 -0
  20. package/dist/ai-tracing/exporters/cloud.d.ts +6 -8
  21. package/dist/ai-tracing/exporters/cloud.d.ts.map +1 -1
  22. package/dist/ai-tracing/exporters/console.d.ts +6 -6
  23. package/dist/ai-tracing/exporters/console.d.ts.map +1 -1
  24. package/dist/ai-tracing/exporters/index.d.ts +1 -0
  25. package/dist/ai-tracing/exporters/index.d.ts.map +1 -1
  26. package/dist/ai-tracing/index.cjs +48 -32
  27. package/dist/ai-tracing/index.d.ts +1 -0
  28. package/dist/ai-tracing/index.d.ts.map +1 -1
  29. package/dist/ai-tracing/index.js +1 -1
  30. package/dist/ai-tracing/spans/base.d.ts +4 -1
  31. package/dist/ai-tracing/spans/base.d.ts.map +1 -1
  32. package/dist/ai-tracing/spans/default.d.ts.map +1 -1
  33. package/dist/ai-tracing/tracers/base.d.ts +15 -1
  34. package/dist/ai-tracing/tracers/base.d.ts.map +1 -1
  35. package/dist/ai-tracing/types.d.ts +85 -11
  36. package/dist/ai-tracing/types.d.ts.map +1 -1
  37. package/dist/ai-tracing/utils.d.ts +14 -0
  38. package/dist/ai-tracing/utils.d.ts.map +1 -1
  39. package/dist/{chunk-D3IOLHNB.cjs → chunk-34L2Z6PH.cjs} +12 -12
  40. package/dist/{chunk-D3IOLHNB.cjs.map → chunk-34L2Z6PH.cjs.map} +1 -1
  41. package/dist/{chunk-BLVB2IJK.js → chunk-3CVE7NQC.js} +728 -267
  42. package/dist/chunk-3CVE7NQC.js.map +1 -0
  43. package/dist/{chunk-URQI7RJ3.cjs → chunk-5GIAZ3CH.cjs} +734 -269
  44. package/dist/chunk-5GIAZ3CH.cjs.map +1 -0
  45. package/dist/{chunk-XYNSPEJO.js → chunk-5NYWRAJN.js} +3 -3
  46. package/dist/{chunk-XYNSPEJO.js.map → chunk-5NYWRAJN.js.map} +1 -1
  47. package/dist/{chunk-URVM3Y4T.cjs → chunk-634YFL42.cjs} +44 -7
  48. package/dist/chunk-634YFL42.cjs.map +1 -0
  49. package/dist/{chunk-NIESGYOH.js → chunk-A3TQYIIR.js} +1392 -1416
  50. package/dist/chunk-A3TQYIIR.js.map +1 -0
  51. package/dist/{chunk-EGNHIPGJ.cjs → chunk-A4B6IAKN.cjs} +4 -4
  52. package/dist/{chunk-EGNHIPGJ.cjs.map → chunk-A4B6IAKN.cjs.map} +1 -1
  53. package/dist/{chunk-LMP5KMU3.js → chunk-AGD5B3FB.js} +43 -6
  54. package/dist/chunk-AGD5B3FB.js.map +1 -0
  55. package/dist/{chunk-V5WDWSQ5.cjs → chunk-CAZTWPDK.cjs} +11 -11
  56. package/dist/{chunk-V5WDWSQ5.cjs.map → chunk-CAZTWPDK.cjs.map} +1 -1
  57. package/dist/{chunk-N3ZSX5OS.js → chunk-F7OMDF5K.js} +72 -36
  58. package/dist/chunk-F7OMDF5K.js.map +1 -0
  59. package/dist/{chunk-ZMPSVDDO.cjs → chunk-FMNZ3BPT.cjs} +1393 -1417
  60. package/dist/chunk-FMNZ3BPT.cjs.map +1 -0
  61. package/dist/{chunk-4ZFVJA3A.js → chunk-HZIF7HQC.js} +3 -3
  62. package/dist/{chunk-4ZFVJA3A.js.map → chunk-HZIF7HQC.js.map} +1 -1
  63. package/dist/{chunk-KLWDUSBX.js → chunk-ITFEGBP2.js} +4 -4
  64. package/dist/{chunk-KLWDUSBX.js.map → chunk-ITFEGBP2.js.map} +1 -1
  65. package/dist/{chunk-GKTRUHKB.js → chunk-KQBF5ZEN.js} +5 -5
  66. package/dist/{chunk-GKTRUHKB.js.map → chunk-KQBF5ZEN.js.map} +1 -1
  67. package/dist/{chunk-R35PINKN.js → chunk-MHICZASQ.js} +5 -5
  68. package/dist/{chunk-R35PINKN.js.map → chunk-MHICZASQ.js.map} +1 -1
  69. package/dist/{chunk-H4KO46HZ.js → chunk-MKCC5K77.js} +3 -3
  70. package/dist/{chunk-H4KO46HZ.js.map → chunk-MKCC5K77.js.map} +1 -1
  71. package/dist/{chunk-UN653TND.cjs → chunk-O4KVF3MI.cjs} +4 -4
  72. package/dist/{chunk-UN653TND.cjs.map → chunk-O4KVF3MI.cjs.map} +1 -1
  73. package/dist/{chunk-WI2YMBNG.cjs → chunk-QBPTDMR7.cjs} +102 -64
  74. package/dist/chunk-QBPTDMR7.cjs.map +1 -0
  75. package/dist/{chunk-7P5FMQQK.cjs → chunk-RWWOJXMF.cjs} +6 -6
  76. package/dist/{chunk-7P5FMQQK.cjs.map → chunk-RWWOJXMF.cjs.map} +1 -1
  77. package/dist/{chunk-XBJP7THY.js → chunk-RXBG6UV2.js} +4 -4
  78. package/dist/chunk-RXBG6UV2.js.map +1 -0
  79. package/dist/{chunk-NL3P7IFI.js → chunk-SF75RENF.js} +3 -3
  80. package/dist/{chunk-NL3P7IFI.js.map → chunk-SF75RENF.js.map} +1 -1
  81. package/dist/{chunk-SE4PA467.cjs → chunk-VF676YCO.cjs} +2 -2
  82. package/dist/chunk-VF676YCO.cjs.map +1 -0
  83. package/dist/{chunk-6OLRLZJ3.js → chunk-WM4RO23J.js} +2 -2
  84. package/dist/chunk-WM4RO23J.js.map +1 -0
  85. package/dist/{chunk-MVVMHOAC.cjs → chunk-YOVX3R5U.cjs} +14 -14
  86. package/dist/chunk-YOVX3R5U.cjs.map +1 -0
  87. package/dist/{chunk-L5A4MRCK.cjs → chunk-ZABG3SZ2.cjs} +4 -4
  88. package/dist/{chunk-L5A4MRCK.cjs.map → chunk-ZABG3SZ2.cjs.map} +1 -1
  89. package/dist/{chunk-YKVVW65D.cjs → chunk-ZDW322JC.cjs} +8 -8
  90. package/dist/{chunk-YKVVW65D.cjs.map → chunk-ZDW322JC.cjs.map} +1 -1
  91. package/dist/index.cjs +53 -53
  92. package/dist/index.js +11 -11
  93. package/dist/integration/index.cjs +3 -3
  94. package/dist/integration/index.js +1 -1
  95. package/dist/llm/index.cjs +7 -7
  96. package/dist/llm/index.js +1 -1
  97. package/dist/llm/model/model.loop.d.ts.map +1 -1
  98. package/dist/llm/model/provider-types.generated.d.ts +585 -597
  99. package/dist/loop/index.cjs +2 -2
  100. package/dist/loop/index.js +1 -1
  101. package/dist/loop/loop.d.ts.map +1 -1
  102. package/dist/loop/test-utils/mock-server-response.d.ts +7 -2
  103. package/dist/loop/test-utils/mock-server-response.d.ts.map +1 -1
  104. package/dist/loop/test-utils/options.d.ts.map +1 -1
  105. package/dist/loop/types.d.ts +2 -1
  106. package/dist/loop/types.d.ts.map +1 -1
  107. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts.map +1 -1
  108. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts +1 -1
  109. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts.map +1 -1
  110. package/dist/mastra/index.cjs +2 -2
  111. package/dist/mastra/index.js +1 -1
  112. package/dist/memory/index.cjs +4 -4
  113. package/dist/memory/index.js +1 -1
  114. package/dist/memory/memory.d.ts +3 -2
  115. package/dist/memory/memory.d.ts.map +1 -1
  116. package/dist/processors/index.cjs +11 -11
  117. package/dist/processors/index.js +1 -1
  118. package/dist/provider-registry.json +1390 -1414
  119. package/dist/relevance/index.cjs +4 -4
  120. package/dist/relevance/index.js +1 -1
  121. package/dist/scores/index.cjs +9 -9
  122. package/dist/scores/index.js +2 -2
  123. package/dist/scores/scoreTraces/index.cjs +8 -8
  124. package/dist/scores/scoreTraces/index.js +3 -3
  125. package/dist/storage/index.cjs +3 -3
  126. package/dist/storage/index.js +1 -1
  127. package/dist/stream/RunOutput.d.ts +72 -0
  128. package/dist/stream/RunOutput.d.ts.map +1 -0
  129. package/dist/stream/aisdk/v5/output.d.ts +2 -2
  130. package/dist/stream/aisdk/v5/output.d.ts.map +1 -1
  131. package/dist/stream/base/base.d.ts +7 -0
  132. package/dist/stream/base/base.d.ts.map +1 -0
  133. package/dist/stream/base/consume-stream.d.ts +5 -0
  134. package/dist/stream/base/consume-stream.d.ts.map +1 -0
  135. package/dist/stream/base/output.d.ts.map +1 -1
  136. package/dist/stream/index.cjs +14 -10
  137. package/dist/stream/index.d.ts +2 -1
  138. package/dist/stream/index.d.ts.map +1 -1
  139. package/dist/stream/index.js +2 -2
  140. package/dist/stream/types.d.ts +1 -1
  141. package/dist/stream/types.d.ts.map +1 -1
  142. package/dist/test-utils/llm-mock.cjs +2 -2
  143. package/dist/test-utils/llm-mock.js +1 -1
  144. package/dist/tools/index.cjs +4 -4
  145. package/dist/tools/index.js +1 -1
  146. package/dist/tools/is-vercel-tool.cjs +2 -2
  147. package/dist/tools/is-vercel-tool.js +1 -1
  148. package/dist/tools/tool-builder/builder.d.ts +75 -2
  149. package/dist/tools/tool-builder/builder.d.ts.map +1 -1
  150. package/dist/tools/tool.d.ts +2 -2
  151. package/dist/tools/tool.d.ts.map +1 -1
  152. package/dist/tools/types.d.ts +17 -12
  153. package/dist/tools/types.d.ts.map +1 -1
  154. package/dist/utils.cjs +17 -17
  155. package/dist/utils.d.ts +1 -0
  156. package/dist/utils.d.ts.map +1 -1
  157. package/dist/utils.js +1 -1
  158. package/dist/workflows/evented/index.cjs +10 -10
  159. package/dist/workflows/evented/index.js +1 -1
  160. package/dist/workflows/evented/workflow.d.ts +5 -3
  161. package/dist/workflows/evented/workflow.d.ts.map +1 -1
  162. package/dist/workflows/index.cjs +12 -12
  163. package/dist/workflows/index.js +1 -1
  164. package/dist/workflows/legacy/index.cjs +22 -22
  165. package/dist/workflows/legacy/index.js +1 -1
  166. package/dist/workflows/workflow.d.ts +30 -23
  167. package/dist/workflows/workflow.d.ts.map +1 -1
  168. package/package.json +12 -10
  169. package/src/llm/model/provider-types.generated.d.ts +585 -597
  170. package/dist/chunk-6OLRLZJ3.js.map +0 -1
  171. package/dist/chunk-BLVB2IJK.js.map +0 -1
  172. package/dist/chunk-LMP5KMU3.js.map +0 -1
  173. package/dist/chunk-MVVMHOAC.cjs.map +0 -1
  174. package/dist/chunk-N3ZSX5OS.js.map +0 -1
  175. package/dist/chunk-NIESGYOH.js.map +0 -1
  176. package/dist/chunk-SE4PA467.cjs.map +0 -1
  177. package/dist/chunk-URQI7RJ3.cjs.map +0 -1
  178. package/dist/chunk-URVM3Y4T.cjs.map +0 -1
  179. package/dist/chunk-WI2YMBNG.cjs.map +0 -1
  180. package/dist/chunk-XBJP7THY.js.map +0 -1
  181. package/dist/chunk-ZMPSVDDO.cjs.map +0 -1
@@ -1,78 +1,12 @@
1
1
  {
2
2
  "providers": {
3
- "nvidia": {
4
- "url": "https://integrate.api.nvidia.com/v1",
5
- "apiKeyEnvVar": "NVIDIA_API_KEY",
6
- "apiKeyHeader": "Authorization",
7
- "name": "Nvidia",
8
- "models": [
9
- "black-forest-labs/flux.1-dev",
10
- "deepseek-ai/deepseek-v3.1",
11
- "deepseek-ai/deepseek-v3.1-terminus",
12
- "google/gemma-3-27b-it",
13
- "microsoft/phi-4-mini-instruct",
14
- "moonshotai/kimi-k2-instruct",
15
- "moonshotai/kimi-k2-instruct-0905",
16
- "nvidia/cosmos-nemotron-34b",
17
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
18
- "nvidia/nemoretriever-ocr-v1",
19
- "nvidia/parakeet-tdt-0.6b-v2",
20
- "openai/gpt-oss-120b",
21
- "openai/whisper-large-v3",
22
- "qwen/qwen3-235b-a22b",
23
- "qwen/qwen3-coder-480b-a35b-instruct"
24
- ],
25
- "docUrl": "https://docs.api.nvidia.com/nim/",
26
- "gateway": "models.dev"
27
- },
28
- "modelscope": {
29
- "url": "https://api-inference.modelscope.cn/v1",
30
- "apiKeyEnvVar": "MODELSCOPE_API_KEY",
31
- "apiKeyHeader": "Authorization",
32
- "name": "ModelScope",
33
- "models": [
34
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
35
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
36
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
37
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
38
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
39
- "ZhipuAI/GLM-4.5",
40
- "ZhipuAI/GLM-4.6"
41
- ],
42
- "docUrl": "https://modelscope.cn/docs/model-service/API-Inference/intro",
43
- "gateway": "models.dev"
44
- },
45
- "aihubmix": {
46
- "url": "https://api.aihubmix.com/v1",
47
- "apiKeyEnvVar": "AIHUBMIX_API_KEY",
3
+ "moonshotai-cn": {
4
+ "url": "https://api.moonshot.cn/v1",
5
+ "apiKeyEnvVar": "MOONSHOT_API_KEY",
48
6
  "apiKeyHeader": "Authorization",
49
- "name": "AIHubMix",
50
- "models": [
51
- "DeepSeek-V3.2-Exp",
52
- "DeepSeek-V3.2-Exp-Think",
53
- "Kimi-K2-0905",
54
- "claude-haiku-4-5",
55
- "claude-opus-4-1",
56
- "claude-sonnet-4-5",
57
- "gemini-2.5-flash",
58
- "gemini-2.5-pro",
59
- "glm-4.6",
60
- "gpt-4.1",
61
- "gpt-4.1-mini",
62
- "gpt-4.1-nano",
63
- "gpt-4o",
64
- "gpt-4o-2024-11-20",
65
- "gpt-5",
66
- "gpt-5-codex",
67
- "gpt-5-mini",
68
- "gpt-5-nano",
69
- "gpt-5-pro",
70
- "o4-mini",
71
- "qwen3-235b-a22b-instruct-2507",
72
- "qwen3-235b-a22b-thinking-2507",
73
- "qwen3-coder-480b-a35b-instruct"
74
- ],
75
- "docUrl": "https://aihubmix.com/docs/models",
7
+ "name": "Moonshot AI (China)",
8
+ "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
9
+ "docUrl": "https://platform.moonshot.cn/docs/api/chat",
76
10
  "gateway": "models.dev"
77
11
  },
78
12
  "lucidquery": {
@@ -84,6 +18,73 @@
84
18
  "docUrl": "https://lucidquery.com/api/docs",
85
19
  "gateway": "models.dev"
86
20
  },
21
+ "moonshotai": {
22
+ "url": "https://api.moonshot.ai/v1",
23
+ "apiKeyEnvVar": "MOONSHOT_API_KEY",
24
+ "apiKeyHeader": "Authorization",
25
+ "name": "Moonshot AI",
26
+ "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
27
+ "docUrl": "https://platform.moonshot.ai/docs/api/chat",
28
+ "gateway": "models.dev"
29
+ },
30
+ "zai-coding-plan": {
31
+ "url": "https://api.z.ai/api/coding/paas/v4",
32
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
33
+ "apiKeyHeader": "Authorization",
34
+ "name": "Z.AI Coding Plan",
35
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
36
+ "docUrl": "https://docs.z.ai/devpack/overview",
37
+ "gateway": "models.dev"
38
+ },
39
+ "alibaba": {
40
+ "url": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
41
+ "apiKeyEnvVar": "DASHSCOPE_API_KEY",
42
+ "apiKeyHeader": "Authorization",
43
+ "name": "Alibaba",
44
+ "models": [
45
+ "qvq-max",
46
+ "qwen-flash",
47
+ "qwen-max",
48
+ "qwen-mt-plus",
49
+ "qwen-mt-turbo",
50
+ "qwen-omni-turbo",
51
+ "qwen-omni-turbo-realtime",
52
+ "qwen-plus",
53
+ "qwen-plus-character-ja",
54
+ "qwen-turbo",
55
+ "qwen-vl-max",
56
+ "qwen-vl-ocr",
57
+ "qwen-vl-plus",
58
+ "qwen2-5-14b-instruct",
59
+ "qwen2-5-32b-instruct",
60
+ "qwen2-5-72b-instruct",
61
+ "qwen2-5-7b-instruct",
62
+ "qwen2-5-omni-7b",
63
+ "qwen2-5-vl-72b-instruct",
64
+ "qwen2-5-vl-7b-instruct",
65
+ "qwen3-14b",
66
+ "qwen3-235b-a22b",
67
+ "qwen3-32b",
68
+ "qwen3-8b",
69
+ "qwen3-asr-flash",
70
+ "qwen3-coder-30b-a3b-instruct",
71
+ "qwen3-coder-480b-a35b-instruct",
72
+ "qwen3-coder-flash",
73
+ "qwen3-coder-plus",
74
+ "qwen3-livetranslate-flash-realtime",
75
+ "qwen3-max",
76
+ "qwen3-next-80b-a3b-instruct",
77
+ "qwen3-next-80b-a3b-thinking",
78
+ "qwen3-omni-flash",
79
+ "qwen3-omni-flash-realtime",
80
+ "qwen3-vl-235b-a22b",
81
+ "qwen3-vl-30b-a3b",
82
+ "qwen3-vl-plus",
83
+ "qwq-plus"
84
+ ],
85
+ "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
86
+ "gateway": "models.dev"
87
+ },
87
88
  "xai": {
88
89
  "apiKeyEnvVar": "XAI_API_KEY",
89
90
  "name": "xAI",
@@ -112,325 +113,94 @@
112
113
  "docUrl": "https://docs.x.ai/docs/models",
113
114
  "gateway": "models.dev"
114
115
  },
115
- "deepseek": {
116
- "url": "https://api.deepseek.com",
117
- "apiKeyEnvVar": "DEEPSEEK_API_KEY",
118
- "apiKeyHeader": "Authorization",
119
- "name": "DeepSeek",
120
- "models": ["deepseek-chat", "deepseek-reasoner"],
121
- "docUrl": "https://platform.deepseek.com/api-docs/pricing",
122
- "gateway": "models.dev"
123
- },
124
- "requesty": {
125
- "url": "https://router.requesty.ai/v1",
126
- "apiKeyEnvVar": "REQUESTY_API_KEY",
116
+ "nvidia": {
117
+ "url": "https://integrate.api.nvidia.com/v1",
118
+ "apiKeyEnvVar": "NVIDIA_API_KEY",
127
119
  "apiKeyHeader": "Authorization",
128
- "name": "Requesty",
120
+ "name": "Nvidia",
129
121
  "models": [
130
- "anthropic/claude-3-7-sonnet",
131
- "anthropic/claude-4-sonnet-20250522",
132
- "anthropic/claude-opus-4",
133
- "anthropic/claude-opus-4-1-20250805",
134
- "google/gemini-2.5-flash",
135
- "google/gemini-2.5-pro",
136
- "openai/gpt-4.1",
137
- "openai/gpt-4.1-mini",
138
- "openai/gpt-4o-mini",
139
- "openai/gpt-5",
140
- "openai/gpt-5-mini",
141
- "openai/gpt-5-nano",
142
- "openai/o4-mini"
122
+ "black-forest-labs/flux.1-dev",
123
+ "deepseek-ai/deepseek-v3.1",
124
+ "deepseek-ai/deepseek-v3.1-terminus",
125
+ "google/gemma-3-27b-it",
126
+ "microsoft/phi-4-mini-instruct",
127
+ "moonshotai/kimi-k2-instruct",
128
+ "moonshotai/kimi-k2-instruct-0905",
129
+ "nvidia/cosmos-nemotron-34b",
130
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
131
+ "nvidia/nemoretriever-ocr-v1",
132
+ "nvidia/parakeet-tdt-0.6b-v2",
133
+ "openai/gpt-oss-120b",
134
+ "openai/whisper-large-v3",
135
+ "qwen/qwen3-235b-a22b",
136
+ "qwen/qwen3-coder-480b-a35b-instruct"
143
137
  ],
144
- "docUrl": "https://requesty.ai/solution/llm-routing/models",
138
+ "docUrl": "https://docs.api.nvidia.com/nim/",
145
139
  "gateway": "models.dev"
146
140
  },
147
- "nebius": {
148
- "url": "https://api.studio.nebius.com/v1/",
149
- "apiKeyEnvVar": "NEBIUS_API_KEY",
141
+ "upstage": {
142
+ "url": "https://api.upstage.ai",
143
+ "apiKeyEnvVar": "UPSTAGE_API_KEY",
150
144
  "apiKeyHeader": "Authorization",
151
- "name": "Nebius AI Studio",
152
- "models": [
153
- "NousResearch/hermes-4-405b",
154
- "NousResearch/hermes-4-70b",
155
- "deepseek-ai/deepseek-v3",
156
- "meta-llama/llama-3.3-70b-instruct-base",
157
- "meta-llama/llama-3.3-70b-instruct-fast",
158
- "meta-llama/llama-3_1-405b-instruct",
159
- "moonshotai/kimi-k2-instruct",
160
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
161
- "openai/gpt-oss-120b",
162
- "openai/gpt-oss-20b",
163
- "qwen/qwen3-235b-a22b-instruct-2507",
164
- "qwen/qwen3-235b-a22b-thinking-2507",
165
- "qwen/qwen3-coder-480b-a35b-instruct",
166
- "zai-org/glm-4.5",
167
- "zai-org/glm-4.5-air"
168
- ],
169
- "docUrl": "https://docs.studio.nebius.com/quickstart",
145
+ "name": "Upstage",
146
+ "models": ["solar-mini", "solar-pro2"],
147
+ "docUrl": "https://developers.upstage.ai/docs/apis/chat",
170
148
  "gateway": "models.dev"
171
149
  },
172
- "fastrouter": {
173
- "url": "https://go.fastrouter.ai/api/v1",
174
- "apiKeyEnvVar": "FASTROUTER_API_KEY",
150
+ "groq": {
151
+ "url": "https://api.groq.com/openai/v1",
152
+ "apiKeyEnvVar": "GROQ_API_KEY",
175
153
  "apiKeyHeader": "Authorization",
176
- "name": "FastRouter",
154
+ "name": "Groq",
177
155
  "models": [
178
- "anthropic/claude-opus-4.1",
179
- "anthropic/claude-sonnet-4",
180
- "deepseek-ai/deepseek-r1-distill-llama-70b",
181
- "google/gemini-2.5-flash",
182
- "google/gemini-2.5-pro",
183
- "moonshotai/kimi-k2",
184
- "openai/gpt-4.1",
185
- "openai/gpt-5",
186
- "openai/gpt-5-mini",
187
- "openai/gpt-5-nano",
156
+ "deepseek-r1-distill-llama-70b",
157
+ "gemma2-9b-it",
158
+ "llama-3.1-8b-instant",
159
+ "llama-3.3-70b-versatile",
160
+ "llama-guard-3-8b",
161
+ "llama3-70b-8192",
162
+ "llama3-8b-8192",
163
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
164
+ "meta-llama/llama-4-scout-17b-16e-instruct",
165
+ "meta-llama/llama-guard-4-12b",
166
+ "mistral-saba-24b",
167
+ "moonshotai/kimi-k2-instruct",
168
+ "moonshotai/kimi-k2-instruct-0905",
188
169
  "openai/gpt-oss-120b",
189
170
  "openai/gpt-oss-20b",
190
- "qwen/qwen3-coder",
191
- "x-ai/grok-4"
171
+ "qwen-qwq-32b",
172
+ "qwen/qwen3-32b"
192
173
  ],
193
- "docUrl": "https://fastrouter.ai/models",
174
+ "docUrl": "https://console.groq.com/docs/models",
194
175
  "gateway": "models.dev"
195
176
  },
196
- "perplexity": {
197
- "url": "https://api.perplexity.ai",
198
- "apiKeyEnvVar": "PERPLEXITY_API_KEY",
177
+ "mistral": {
178
+ "url": "https://api.mistral.ai/v1",
179
+ "apiKeyEnvVar": "MISTRAL_API_KEY",
199
180
  "apiKeyHeader": "Authorization",
200
- "name": "Perplexity",
201
- "models": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
202
- "docUrl": "https://docs.perplexity.ai",
203
- "gateway": "models.dev"
204
- },
205
- "morph": {
206
- "url": "https://api.morphllm.com/v1",
207
- "apiKeyEnvVar": "MORPH_API_KEY",
208
- "apiKeyHeader": "Authorization",
209
- "name": "Morph",
210
- "models": ["auto", "morph-v3-fast", "morph-v3-large"],
211
- "docUrl": "https://docs.morphllm.com/api-reference/introduction",
212
- "gateway": "models.dev"
213
- },
214
- "zai-coding-plan": {
215
- "url": "https://api.z.ai/api/coding/paas/v4",
216
- "apiKeyEnvVar": "ZHIPU_API_KEY",
217
- "apiKeyHeader": "Authorization",
218
- "name": "Z.AI Coding Plan",
219
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
220
- "docUrl": "https://docs.z.ai/devpack/overview",
221
- "gateway": "models.dev"
222
- },
223
- "huggingface": {
224
- "url": "https://router.huggingface.co/v1",
225
- "apiKeyEnvVar": "HF_TOKEN",
226
- "apiKeyHeader": "Authorization",
227
- "name": "Hugging Face",
228
- "models": [
229
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
230
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
231
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
232
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
233
- "deepseek-ai/DeepSeek-R1-0528",
234
- "deepseek-ai/Deepseek-V3-0324",
235
- "moonshotai/Kimi-K2-Instruct",
236
- "moonshotai/Kimi-K2-Instruct-0905",
237
- "zai-org/GLM-4.5",
238
- "zai-org/GLM-4.5-Air",
239
- "zai-org/GLM-4.6"
240
- ],
241
- "docUrl": "https://huggingface.co/docs/inference-providers",
242
- "gateway": "models.dev"
243
- },
244
- "openrouter": {
245
- "url": "https://openrouter.ai/api/v1",
246
- "apiKeyEnvVar": "OPENROUTER_API_KEY",
247
- "name": "OpenRouter",
248
- "models": [
249
- "anthropic/claude-3.5-haiku",
250
- "anthropic/claude-3.7-sonnet",
251
- "anthropic/claude-haiku-4.5",
252
- "anthropic/claude-opus-4",
253
- "anthropic/claude-opus-4.1",
254
- "anthropic/claude-sonnet-4",
255
- "anthropic/claude-sonnet-4.5",
256
- "cognitivecomputations/dolphin3.0-mistral-24b",
257
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
258
- "deepseek/deepseek-chat-v3-0324",
259
- "deepseek/deepseek-chat-v3.1",
260
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
261
- "deepseek/deepseek-r1-0528:free",
262
- "deepseek/deepseek-r1-distill-llama-70b",
263
- "deepseek/deepseek-r1-distill-qwen-14b",
264
- "deepseek/deepseek-r1:free",
265
- "deepseek/deepseek-v3-base:free",
266
- "deepseek/deepseek-v3.1-terminus",
267
- "featherless/qwerky-72b",
268
- "google/gemini-2.0-flash-001",
269
- "google/gemini-2.0-flash-exp:free",
270
- "google/gemini-2.5-flash",
271
- "google/gemini-2.5-flash-lite",
272
- "google/gemini-2.5-flash-lite-preview-09-2025",
273
- "google/gemini-2.5-flash-preview-09-2025",
274
- "google/gemini-2.5-pro",
275
- "google/gemini-2.5-pro-preview-05-06",
276
- "google/gemini-2.5-pro-preview-06-05",
277
- "google/gemma-2-9b-it:free",
278
- "google/gemma-3-12b-it",
279
- "google/gemma-3-27b-it",
280
- "google/gemma-3n-e4b-it",
281
- "google/gemma-3n-e4b-it:free",
282
- "meta-llama/llama-3.2-11b-vision-instruct",
283
- "meta-llama/llama-3.3-70b-instruct:free",
284
- "meta-llama/llama-4-scout:free",
285
- "microsoft/mai-ds-r1:free",
286
- "mistralai/codestral-2508",
287
- "mistralai/devstral-medium-2507",
288
- "mistralai/devstral-small-2505",
289
- "mistralai/devstral-small-2505:free",
290
- "mistralai/devstral-small-2507",
291
- "mistralai/mistral-7b-instruct:free",
292
- "mistralai/mistral-medium-3",
293
- "mistralai/mistral-medium-3.1",
294
- "mistralai/mistral-nemo:free",
295
- "mistralai/mistral-small-3.1-24b-instruct",
296
- "mistralai/mistral-small-3.2-24b-instruct",
297
- "mistralai/mistral-small-3.2-24b-instruct:free",
298
- "moonshotai/kimi-dev-72b:free",
299
- "moonshotai/kimi-k2",
300
- "moonshotai/kimi-k2-0905",
301
- "moonshotai/kimi-k2:free",
302
- "nousresearch/deephermes-3-llama-3-8b-preview",
303
- "nousresearch/hermes-4-405b",
304
- "nousresearch/hermes-4-70b",
305
- "openai/gpt-4.1",
306
- "openai/gpt-4.1-mini",
307
- "openai/gpt-4o-mini",
308
- "openai/gpt-5",
309
- "openai/gpt-5-chat",
310
- "openai/gpt-5-codex",
311
- "openai/gpt-5-image",
312
- "openai/gpt-5-mini",
313
- "openai/gpt-5-nano",
314
- "openai/gpt-oss-120b",
315
- "openai/gpt-oss-20b",
316
- "openai/o4-mini",
317
- "openrouter/cypher-alpha:free",
318
- "openrouter/horizon-alpha",
319
- "openrouter/horizon-beta",
320
- "openrouter/sonoma-dusk-alpha",
321
- "openrouter/sonoma-sky-alpha",
322
- "qwen/qwen-2.5-coder-32b-instruct",
323
- "qwen/qwen2.5-vl-32b-instruct:free",
324
- "qwen/qwen2.5-vl-72b-instruct",
325
- "qwen/qwen2.5-vl-72b-instruct:free",
326
- "qwen/qwen3-14b:free",
327
- "qwen/qwen3-235b-a22b-07-25",
328
- "qwen/qwen3-235b-a22b-07-25:free",
329
- "qwen/qwen3-235b-a22b-thinking-2507",
330
- "qwen/qwen3-235b-a22b:free",
331
- "qwen/qwen3-30b-a3b-instruct-2507",
332
- "qwen/qwen3-30b-a3b-thinking-2507",
333
- "qwen/qwen3-30b-a3b:free",
334
- "qwen/qwen3-32b:free",
335
- "qwen/qwen3-8b:free",
336
- "qwen/qwen3-coder",
337
- "qwen/qwen3-coder:free",
338
- "qwen/qwen3-max",
339
- "qwen/qwen3-next-80b-a3b-instruct",
340
- "qwen/qwen3-next-80b-a3b-thinking",
341
- "qwen/qwq-32b:free",
342
- "rekaai/reka-flash-3",
343
- "sarvamai/sarvam-m:free",
344
- "thudm/glm-z1-32b:free",
345
- "tngtech/deepseek-r1t2-chimera:free",
346
- "x-ai/grok-3",
347
- "x-ai/grok-3-beta",
348
- "x-ai/grok-3-mini",
349
- "x-ai/grok-3-mini-beta",
350
- "x-ai/grok-4",
351
- "x-ai/grok-4-fast",
352
- "x-ai/grok-4-fast:free",
353
- "x-ai/grok-code-fast-1",
354
- "z-ai/glm-4.5",
355
- "z-ai/glm-4.5-air",
356
- "z-ai/glm-4.5-air:free",
357
- "z-ai/glm-4.5v",
358
- "z-ai/glm-4.6"
359
- ],
360
- "docUrl": "https://openrouter.ai/models",
361
- "gateway": "models.dev"
362
- },
363
- "cerebras": {
364
- "url": "https://api.cerebras.ai/v1",
365
- "apiKeyEnvVar": "CEREBRAS_API_KEY",
366
- "apiKeyHeader": "Authorization",
367
- "name": "Cerebras",
368
- "models": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
369
- "docUrl": "https://inference-docs.cerebras.ai/models/overview",
370
- "gateway": "models.dev"
371
- },
372
- "zhipuai": {
373
- "url": "https://open.bigmodel.cn/api/paas/v4",
374
- "apiKeyEnvVar": "ZHIPU_API_KEY",
375
- "apiKeyHeader": "Authorization",
376
- "name": "Zhipu AI",
377
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
378
- "docUrl": "https://docs.z.ai/guides/overview/pricing",
379
- "gateway": "models.dev"
380
- },
381
- "togetherai": {
382
- "url": "https://api.together.xyz/v1",
383
- "apiKeyEnvVar": "TOGETHER_API_KEY",
384
- "apiKeyHeader": "Authorization",
385
- "name": "Together AI",
386
- "models": [
387
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
388
- "deepseek-ai/DeepSeek-R1",
389
- "deepseek-ai/DeepSeek-V3",
390
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
391
- "moonshotai/Kimi-K2-Instruct",
392
- "openai/gpt-oss-120b"
393
- ],
394
- "docUrl": "https://docs.together.ai/docs/serverless-models",
395
- "gateway": "models.dev"
396
- },
397
- "wandb": {
398
- "url": "https://api.inference.wandb.ai/v1",
399
- "apiKeyEnvVar": "WANDB_API_KEY",
400
- "apiKeyHeader": "Authorization",
401
- "name": "Weights & Biases",
402
- "models": [
403
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
404
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
405
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
406
- "deepseek-ai/DeepSeek-R1-0528",
407
- "deepseek-ai/DeepSeek-V3-0324",
408
- "meta-llama/Llama-3.1-8B-Instruct",
409
- "meta-llama/Llama-3.3-70B-Instruct",
410
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
411
- "microsoft/Phi-4-mini-instruct",
412
- "moonshotai/Kimi-K2-Instruct"
413
- ],
414
- "docUrl": "https://weave-docs.wandb.ai/guides/integrations/inference/",
415
- "gateway": "models.dev"
416
- },
417
- "submodel": {
418
- "url": "https://llm.submodel.ai/v1",
419
- "apiKeyEnvVar": "SUBMODEL_INSTAGEN_ACCESS_KEY",
420
- "apiKeyHeader": "Authorization",
421
- "name": "submodel",
181
+ "name": "Mistral",
422
182
  "models": [
423
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
424
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
425
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
426
- "deepseek-ai/DeepSeek-R1-0528",
427
- "deepseek-ai/DeepSeek-V3-0324",
428
- "deepseek-ai/DeepSeek-V3.1",
429
- "openai/gpt-oss-120b",
430
- "zai-org/GLM-4.5-Air",
431
- "zai-org/GLM-4.5-FP8"
183
+ "codestral-latest",
184
+ "devstral-medium-2507",
185
+ "devstral-small-2505",
186
+ "devstral-small-2507",
187
+ "magistral-medium-latest",
188
+ "magistral-small",
189
+ "ministral-3b-latest",
190
+ "ministral-8b-latest",
191
+ "mistral-large-latest",
192
+ "mistral-medium-2505",
193
+ "mistral-medium-2508",
194
+ "mistral-medium-latest",
195
+ "mistral-nemo",
196
+ "mistral-small-latest",
197
+ "open-mistral-7b",
198
+ "open-mixtral-8x22b",
199
+ "open-mixtral-8x7b",
200
+ "pixtral-12b",
201
+ "pixtral-large-latest"
432
202
  ],
433
- "docUrl": "https://submodel.gitbook.io",
203
+ "docUrl": "https://docs.mistral.ai/getting-started/models/",
434
204
  "gateway": "models.dev"
435
205
  },
436
206
  "vercel": {
@@ -527,102 +297,196 @@
527
297
  "docUrl": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
528
298
  "gateway": "models.dev"
529
299
  },
530
- "synthetic": {
531
- "url": "https://api.synthetic.new/v1",
532
- "apiKeyEnvVar": "SYNTHETIC_API_KEY",
300
+ "nebius": {
301
+ "url": "https://api.studio.nebius.com/v1/",
302
+ "apiKeyEnvVar": "NEBIUS_API_KEY",
533
303
  "apiKeyHeader": "Authorization",
534
- "name": "Synthetic",
304
+ "name": "Nebius AI Studio",
535
305
  "models": [
536
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
537
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
538
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
539
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
540
- "hf:deepseek-ai/DeepSeek-R1",
541
- "hf:deepseek-ai/DeepSeek-R1-0528",
542
- "hf:deepseek-ai/DeepSeek-V3",
543
- "hf:deepseek-ai/DeepSeek-V3-0324",
544
- "hf:deepseek-ai/DeepSeek-V3.1",
545
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
546
- "hf:meta-llama/Llama-3.1-405B-Instruct",
547
- "hf:meta-llama/Llama-3.1-70B-Instruct",
548
- "hf:meta-llama/Llama-3.1-8B-Instruct",
549
- "hf:meta-llama/Llama-3.3-70B-Instruct",
550
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
551
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
552
- "hf:moonshotai/Kimi-K2-Instruct",
553
- "hf:moonshotai/Kimi-K2-Instruct-0905",
554
- "hf:openai/gpt-oss-120b",
555
- "hf:zai-org/GLM-4.5",
556
- "hf:zai-org/GLM-4.6"
306
+ "NousResearch/hermes-4-405b",
307
+ "NousResearch/hermes-4-70b",
308
+ "deepseek-ai/deepseek-v3",
309
+ "meta-llama/llama-3.3-70b-instruct-base",
310
+ "meta-llama/llama-3.3-70b-instruct-fast",
311
+ "meta-llama/llama-3_1-405b-instruct",
312
+ "moonshotai/kimi-k2-instruct",
313
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
314
+ "openai/gpt-oss-120b",
315
+ "openai/gpt-oss-20b",
316
+ "qwen/qwen3-235b-a22b-instruct-2507",
317
+ "qwen/qwen3-235b-a22b-thinking-2507",
318
+ "qwen/qwen3-coder-480b-a35b-instruct",
319
+ "zai-org/glm-4.5",
320
+ "zai-org/glm-4.5-air"
557
321
  ],
558
- "docUrl": "https://synthetic.new/pricing",
322
+ "docUrl": "https://docs.studio.nebius.com/quickstart",
559
323
  "gateway": "models.dev"
560
324
  },
561
- "google": {
562
- "apiKeyEnvVar": "GOOGLE_GENERATIVE_AI_API_KEY",
563
- "name": "Google",
325
+ "deepseek": {
326
+ "url": "https://api.deepseek.com",
327
+ "apiKeyEnvVar": "DEEPSEEK_API_KEY",
328
+ "apiKeyHeader": "Authorization",
329
+ "name": "DeepSeek",
330
+ "models": ["deepseek-chat", "deepseek-reasoner"],
331
+ "docUrl": "https://platform.deepseek.com/api-docs/pricing",
332
+ "gateway": "models.dev"
333
+ },
334
+ "alibaba-cn": {
335
+ "url": "https://dashscope.aliyuncs.com/compatible-mode/v1",
336
+ "apiKeyEnvVar": "DASHSCOPE_API_KEY",
337
+ "apiKeyHeader": "Authorization",
338
+ "name": "Alibaba (China)",
564
339
  "models": [
565
- "gemini-1.5-flash",
566
- "gemini-1.5-flash-8b",
567
- "gemini-1.5-pro",
568
- "gemini-2.0-flash",
569
- "gemini-2.0-flash-lite",
570
- "gemini-2.5-flash",
571
- "gemini-2.5-flash-image",
572
- "gemini-2.5-flash-image-preview",
573
- "gemini-2.5-flash-lite",
574
- "gemini-2.5-flash-lite-preview-06-17",
575
- "gemini-2.5-flash-lite-preview-09-2025",
576
- "gemini-2.5-flash-preview-04-17",
577
- "gemini-2.5-flash-preview-05-20",
578
- "gemini-2.5-flash-preview-09-2025",
579
- "gemini-2.5-flash-preview-tts",
580
- "gemini-2.5-pro",
581
- "gemini-2.5-pro-preview-05-06",
582
- "gemini-2.5-pro-preview-06-05",
583
- "gemini-2.5-pro-preview-tts",
584
- "gemini-flash-latest",
585
- "gemini-flash-lite-latest",
586
- "gemini-live-2.5-flash",
587
- "gemini-live-2.5-flash-preview-native-audio"
340
+ "deepseek-r1",
341
+ "deepseek-r1-0528",
342
+ "deepseek-r1-distill-llama-70b",
343
+ "deepseek-r1-distill-llama-8b",
344
+ "deepseek-r1-distill-qwen-1-5b",
345
+ "deepseek-r1-distill-qwen-14b",
346
+ "deepseek-r1-distill-qwen-32b",
347
+ "deepseek-r1-distill-qwen-7b",
348
+ "deepseek-v3",
349
+ "deepseek-v3-1",
350
+ "deepseek-v3-2-exp",
351
+ "moonshot-kimi-k2-instruct",
352
+ "qvq-max",
353
+ "qwen-deep-research",
354
+ "qwen-doc-turbo",
355
+ "qwen-flash",
356
+ "qwen-long",
357
+ "qwen-math-plus",
358
+ "qwen-math-turbo",
359
+ "qwen-max",
360
+ "qwen-mt-plus",
361
+ "qwen-mt-turbo",
362
+ "qwen-omni-turbo",
363
+ "qwen-omni-turbo-realtime",
364
+ "qwen-plus",
365
+ "qwen-plus-character",
366
+ "qwen-turbo",
367
+ "qwen-vl-max",
368
+ "qwen-vl-ocr",
369
+ "qwen-vl-plus",
370
+ "qwen2-5-14b-instruct",
371
+ "qwen2-5-32b-instruct",
372
+ "qwen2-5-72b-instruct",
373
+ "qwen2-5-7b-instruct",
374
+ "qwen2-5-coder-32b-instruct",
375
+ "qwen2-5-coder-7b-instruct",
376
+ "qwen2-5-math-72b-instruct",
377
+ "qwen2-5-math-7b-instruct",
378
+ "qwen2-5-omni-7b",
379
+ "qwen2-5-vl-72b-instruct",
380
+ "qwen2-5-vl-7b-instruct",
381
+ "qwen3-14b",
382
+ "qwen3-235b-a22b",
383
+ "qwen3-32b",
384
+ "qwen3-8b",
385
+ "qwen3-asr-flash",
386
+ "qwen3-coder-30b-a3b-instruct",
387
+ "qwen3-coder-480b-a35b-instruct",
388
+ "qwen3-coder-flash",
389
+ "qwen3-coder-plus",
390
+ "qwen3-max",
391
+ "qwen3-next-80b-a3b-instruct",
392
+ "qwen3-next-80b-a3b-thinking",
393
+ "qwen3-omni-flash",
394
+ "qwen3-omni-flash-realtime",
395
+ "qwen3-vl-235b-a22b",
396
+ "qwen3-vl-30b-a3b",
397
+ "qwen3-vl-plus",
398
+ "qwq-32b",
399
+ "qwq-plus",
400
+ "tongyi-intent-detect-v3"
588
401
  ],
589
- "docUrl": "https://ai.google.dev/gemini-api/docs/pricing",
402
+ "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
590
403
  "gateway": "models.dev"
591
404
  },
592
- "groq": {
593
- "url": "https://api.groq.com/openai/v1",
594
- "apiKeyEnvVar": "GROQ_API_KEY",
405
+ "venice": {
406
+ "url": "https://api.venice.ai/api/v1",
407
+ "apiKeyEnvVar": "VENICE_API_KEY",
595
408
  "apiKeyHeader": "Authorization",
596
- "name": "Groq",
409
+ "name": "Venice AI",
597
410
  "models": [
598
- "deepseek-r1-distill-llama-70b",
599
- "gemma2-9b-it",
600
- "llama-3.1-8b-instant",
601
- "llama-3.3-70b-versatile",
602
- "llama-guard-3-8b",
603
- "llama3-70b-8192",
604
- "llama3-8b-8192",
605
- "meta-llama/llama-4-maverick-17b-128e-instruct",
606
- "meta-llama/llama-4-scout-17b-16e-instruct",
607
- "meta-llama/llama-guard-4-12b",
608
- "mistral-saba-24b",
609
- "moonshotai/kimi-k2-instruct",
610
- "moonshotai/kimi-k2-instruct-0905",
411
+ "deepseek-coder-v2-lite",
412
+ "deepseek-r1-671b",
413
+ "dolphin-2.9.2-qwen2-72b",
414
+ "llama-3.1-405b",
415
+ "llama-3.2-3b",
416
+ "llama-3.3-70b",
417
+ "mistral-31-24b",
418
+ "qwen-2.5-coder-32b",
419
+ "qwen-2.5-qwq-32b",
420
+ "qwen-2.5-vl",
421
+ "qwen3-235b",
422
+ "qwen3-4b",
423
+ "venice-uncensored"
424
+ ],
425
+ "docUrl": "https://docs.venice.ai",
426
+ "gateway": "models.dev"
427
+ },
428
+ "chutes": {
429
+ "url": "https://llm.chutes.ai/v1",
430
+ "apiKeyEnvVar": "CHUTES_API_KEY",
431
+ "apiKeyHeader": "Authorization",
432
+ "name": "Chutes",
433
+ "models": [
434
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
435
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
436
+ "Qwen/Qwen3-30B-A3B",
437
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
438
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
439
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
440
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
441
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
442
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
443
+ "chutesai/Devstral-Small-2505",
444
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
445
+ "deepseek-ai/DeepSeek-R1-0528",
446
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
447
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
448
+ "deepseek-ai/DeepSeek-V3-0324",
449
+ "deepseek-ai/DeepSeek-V3.1",
450
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
451
+ "deepseek-ai/DeepSeek-V3.1-turbo",
452
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
453
+ "deepseek-ai/DeepSeek-V3.2-Exp",
454
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
455
+ "moonshotai/Kimi-Dev-72B",
456
+ "moonshotai/Kimi-K2-Instruct-0905",
457
+ "moonshotai/Kimi-K2-Instruct-75k",
458
+ "moonshotai/Kimi-VL-A3B-Thinking",
611
459
  "openai/gpt-oss-120b",
612
- "openai/gpt-oss-20b",
613
- "qwen-qwq-32b",
614
- "qwen/qwen3-32b"
460
+ "tngtech/DeepSeek-R1T-Chimera",
461
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
462
+ "zai-org/GLM-4.5-Air",
463
+ "zai-org/GLM-4.5-FP8",
464
+ "zai-org/GLM-4.5-turbo",
465
+ "zai-org/GLM-4.6-FP8",
466
+ "zai-org/GLM-4.6-turbo"
615
467
  ],
616
- "docUrl": "https://console.groq.com/docs/models",
468
+ "docUrl": "https://llm.chutes.ai/v1/models",
617
469
  "gateway": "models.dev"
618
470
  },
619
- "moonshotai-cn": {
620
- "url": "https://api.moonshot.cn/v1",
621
- "apiKeyEnvVar": "MOONSHOT_API_KEY",
471
+ "cortecs": {
472
+ "url": "https://api.cortecs.ai/v1",
473
+ "apiKeyEnvVar": "CORTECS_API_KEY",
622
474
  "apiKeyHeader": "Authorization",
623
- "name": "Moonshot AI (China)",
624
- "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
625
- "docUrl": "https://platform.moonshot.cn/docs/api/chat",
475
+ "name": "Cortecs",
476
+ "models": [
477
+ "claude-4-5-sonnet",
478
+ "claude-sonnet-4",
479
+ "deepseek-v3-0324",
480
+ "gemini-2.5-pro",
481
+ "gpt-4.1",
482
+ "gpt-oss-120b",
483
+ "kimi-k2-instruct",
484
+ "llama-3.1-405b-instruct",
485
+ "nova-pro-v1",
486
+ "qwen3-32b",
487
+ "qwen3-coder-480b-a35b-instruct"
488
+ ],
489
+ "docUrl": "https://api.cortecs.ai/v1/models",
626
490
  "gateway": "models.dev"
627
491
  },
628
492
  "github-models": {
@@ -690,47 +554,50 @@
690
554
  "docUrl": "https://docs.github.com/en/github-models",
691
555
  "gateway": "models.dev"
692
556
  },
693
- "deepinfra": {
694
- "url": "https://api.deepinfra.com/v1/openai",
695
- "apiKeyEnvVar": "DEEPINFRA_API_KEY",
557
+ "togetherai": {
558
+ "url": "https://api.together.xyz/v1",
559
+ "apiKeyEnvVar": "TOGETHER_API_KEY",
696
560
  "apiKeyHeader": "Authorization",
697
- "name": "Deep Infra",
561
+ "name": "Together AI",
698
562
  "models": [
699
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
700
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
563
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
564
+ "deepseek-ai/DeepSeek-R1",
565
+ "deepseek-ai/DeepSeek-V3",
566
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
701
567
  "moonshotai/Kimi-K2-Instruct",
702
- "zai-org/GLM-4.5"
568
+ "openai/gpt-oss-120b"
703
569
  ],
704
- "docUrl": "https://deepinfra.com/models",
570
+ "docUrl": "https://docs.together.ai/docs/serverless-models",
705
571
  "gateway": "models.dev"
706
572
  },
707
- "fireworks-ai": {
708
- "url": "https://api.fireworks.ai/inference/v1/",
709
- "apiKeyEnvVar": "FIREWORKS_API_KEY",
573
+ "baseten": {
574
+ "url": "https://inference.baseten.co/v1",
575
+ "apiKeyEnvVar": "BASETEN_API_KEY",
710
576
  "apiKeyHeader": "Authorization",
711
- "name": "Fireworks AI",
712
- "models": [
713
- "accounts/fireworks/models/deepseek-r1-0528",
714
- "accounts/fireworks/models/deepseek-v3-0324",
715
- "accounts/fireworks/models/deepseek-v3p1",
716
- "accounts/fireworks/models/glm-4p5",
717
- "accounts/fireworks/models/glm-4p5-air",
718
- "accounts/fireworks/models/gpt-oss-120b",
719
- "accounts/fireworks/models/gpt-oss-20b",
720
- "accounts/fireworks/models/kimi-k2-instruct",
721
- "accounts/fireworks/models/qwen3-235b-a22b",
722
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
723
- ],
724
- "docUrl": "https://fireworks.ai/docs/",
577
+ "name": "Baseten",
578
+ "models": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
579
+ "docUrl": "https://docs.baseten.co/development/model-apis/overview",
725
580
  "gateway": "models.dev"
726
581
  },
727
- "zai": {
728
- "url": "https://api.z.ai/api/paas/v4",
729
- "apiKeyEnvVar": "ZHIPU_API_KEY",
582
+ "huggingface": {
583
+ "url": "https://router.huggingface.co/v1",
584
+ "apiKeyEnvVar": "HF_TOKEN",
730
585
  "apiKeyHeader": "Authorization",
731
- "name": "Z.AI",
732
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
733
- "docUrl": "https://docs.z.ai/guides/overview/pricing",
586
+ "name": "Hugging Face",
587
+ "models": [
588
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
589
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
590
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
591
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
592
+ "deepseek-ai/DeepSeek-R1-0528",
593
+ "deepseek-ai/Deepseek-V3-0324",
594
+ "moonshotai/Kimi-K2-Instruct",
595
+ "moonshotai/Kimi-K2-Instruct-0905",
596
+ "zai-org/GLM-4.5",
597
+ "zai-org/GLM-4.5-Air",
598
+ "zai-org/GLM-4.6"
599
+ ],
600
+ "docUrl": "https://huggingface.co/docs/inference-providers",
734
601
  "gateway": "models.dev"
735
602
  },
736
603
  "opencode": {
@@ -757,13 +624,59 @@
757
624
  "docUrl": "https://opencode.ai/docs/zen",
758
625
  "gateway": "models.dev"
759
626
  },
760
- "zhipuai-coding-plan": {
761
- "url": "https://open.bigmodel.cn/api/coding/paas/v4",
762
- "apiKeyEnvVar": "ZHIPU_API_KEY",
627
+ "fastrouter": {
628
+ "url": "https://go.fastrouter.ai/api/v1",
629
+ "apiKeyEnvVar": "FASTROUTER_API_KEY",
763
630
  "apiKeyHeader": "Authorization",
764
- "name": "Zhipu AI Coding Plan",
765
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
766
- "docUrl": "https://docs.bigmodel.cn/cn/coding-plan/overview",
631
+ "name": "FastRouter",
632
+ "models": [
633
+ "anthropic/claude-opus-4.1",
634
+ "anthropic/claude-sonnet-4",
635
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
636
+ "google/gemini-2.5-flash",
637
+ "google/gemini-2.5-pro",
638
+ "moonshotai/kimi-k2",
639
+ "openai/gpt-4.1",
640
+ "openai/gpt-5",
641
+ "openai/gpt-5-mini",
642
+ "openai/gpt-5-nano",
643
+ "openai/gpt-oss-120b",
644
+ "openai/gpt-oss-20b",
645
+ "qwen/qwen3-coder",
646
+ "x-ai/grok-4"
647
+ ],
648
+ "docUrl": "https://fastrouter.ai/models",
649
+ "gateway": "models.dev"
650
+ },
651
+ "google": {
652
+ "apiKeyEnvVar": "GOOGLE_GENERATIVE_AI_API_KEY",
653
+ "name": "Google",
654
+ "models": [
655
+ "gemini-1.5-flash",
656
+ "gemini-1.5-flash-8b",
657
+ "gemini-1.5-pro",
658
+ "gemini-2.0-flash",
659
+ "gemini-2.0-flash-lite",
660
+ "gemini-2.5-flash",
661
+ "gemini-2.5-flash-image",
662
+ "gemini-2.5-flash-image-preview",
663
+ "gemini-2.5-flash-lite",
664
+ "gemini-2.5-flash-lite-preview-06-17",
665
+ "gemini-2.5-flash-lite-preview-09-2025",
666
+ "gemini-2.5-flash-preview-04-17",
667
+ "gemini-2.5-flash-preview-05-20",
668
+ "gemini-2.5-flash-preview-09-2025",
669
+ "gemini-2.5-flash-preview-tts",
670
+ "gemini-2.5-pro",
671
+ "gemini-2.5-pro-preview-05-06",
672
+ "gemini-2.5-pro-preview-06-05",
673
+ "gemini-2.5-pro-preview-tts",
674
+ "gemini-flash-latest",
675
+ "gemini-flash-lite-latest",
676
+ "gemini-live-2.5-flash",
677
+ "gemini-live-2.5-flash-preview-native-audio"
678
+ ],
679
+ "docUrl": "https://ai.google.dev/gemini-api/docs/pricing",
767
680
  "gateway": "models.dev"
768
681
  },
769
682
  "inception": {
@@ -775,30 +688,24 @@
775
688
  "docUrl": "https://platform.inceptionlabs.ai/docs",
776
689
  "gateway": "models.dev"
777
690
  },
778
- "llama": {
779
- "url": "https://api.llama.com/compat/v1/",
780
- "apiKeyEnvVar": "LLAMA_API_KEY",
691
+ "wandb": {
692
+ "url": "https://api.inference.wandb.ai/v1",
693
+ "apiKeyEnvVar": "WANDB_API_KEY",
781
694
  "apiKeyHeader": "Authorization",
782
- "name": "Llama",
695
+ "name": "Weights & Biases",
783
696
  "models": [
784
- "cerebras-llama-4-maverick-17b-128e-instruct",
785
- "cerebras-llama-4-scout-17b-16e-instruct",
786
- "groq-llama-4-maverick-17b-128e-instruct",
787
- "llama-3.3-70b-instruct",
788
- "llama-3.3-8b-instruct",
789
- "llama-4-maverick-17b-128e-instruct-fp8",
790
- "llama-4-scout-17b-16e-instruct-fp8"
697
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
698
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
699
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
700
+ "deepseek-ai/DeepSeek-R1-0528",
701
+ "deepseek-ai/DeepSeek-V3-0324",
702
+ "meta-llama/Llama-3.1-8B-Instruct",
703
+ "meta-llama/Llama-3.3-70B-Instruct",
704
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
705
+ "microsoft/Phi-4-mini-instruct",
706
+ "moonshotai/Kimi-K2-Instruct"
791
707
  ],
792
- "docUrl": "https://llama.developer.meta.com/docs/models",
793
- "gateway": "models.dev"
794
- },
795
- "lmstudio": {
796
- "url": "http://127.0.0.1:1234/v1",
797
- "apiKeyEnvVar": "LMSTUDIO_API_KEY",
798
- "apiKeyHeader": "Authorization",
799
- "name": "LMStudio",
800
- "models": ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
801
- "docUrl": "https://lmstudio.ai/models",
708
+ "docUrl": "https://weave-docs.wandb.ai/guides/integrations/inference/",
802
709
  "gateway": "models.dev"
803
710
  },
804
711
  "openai": {
@@ -836,313 +743,394 @@
836
743
  "docUrl": "https://platform.openai.com/docs/models",
837
744
  "gateway": "models.dev"
838
745
  },
839
- "anthropic": {
840
- "apiKeyEnvVar": "ANTHROPIC_API_KEY",
841
- "name": "Anthropic",
842
- "models": [
843
- "claude-3-5-haiku-20241022",
844
- "claude-3-5-haiku-latest",
845
- "claude-3-5-sonnet-20240620",
846
- "claude-3-5-sonnet-20241022",
847
- "claude-3-7-sonnet-20250219",
848
- "claude-3-7-sonnet-latest",
849
- "claude-3-haiku-20240307",
850
- "claude-3-opus-20240229",
851
- "claude-3-sonnet-20240229",
852
- "claude-haiku-4-5",
853
- "claude-haiku-4-5-20251001",
854
- "claude-opus-4-0",
855
- "claude-opus-4-1",
856
- "claude-opus-4-1-20250805",
857
- "claude-opus-4-20250514",
858
- "claude-sonnet-4-0",
859
- "claude-sonnet-4-20250514",
860
- "claude-sonnet-4-5",
861
- "claude-sonnet-4-5-20250929"
862
- ],
863
- "docUrl": "https://docs.anthropic.com/en/docs/about-claude/models",
864
- "gateway": "models.dev"
865
- },
866
- "moonshotai": {
867
- "url": "https://api.moonshot.ai/v1",
868
- "apiKeyEnvVar": "MOONSHOT_API_KEY",
869
- "apiKeyHeader": "Authorization",
870
- "name": "Moonshot AI",
871
- "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
872
- "docUrl": "https://platform.moonshot.ai/docs/api/chat",
873
- "gateway": "models.dev"
874
- },
875
- "inference": {
876
- "url": "https://inference.net/v1",
877
- "apiKeyEnvVar": "INFERENCE_API_KEY",
878
- "apiKeyHeader": "Authorization",
879
- "name": "Inference",
880
- "models": [
881
- "google/gemma-3",
882
- "meta/llama-3.1-8b-instruct",
883
- "meta/llama-3.2-11b-vision-instruct",
884
- "meta/llama-3.2-1b-instruct",
885
- "meta/llama-3.2-3b-instruct",
886
- "mistral/mistral-nemo-12b-instruct",
887
- "osmosis/osmosis-structure-0.6b",
888
- "qwen/qwen-2.5-7b-vision-instruct",
889
- "qwen/qwen3-embedding-4b"
890
- ],
891
- "docUrl": "https://inference.net/models",
892
- "gateway": "models.dev"
893
- },
894
- "baseten": {
895
- "url": "https://inference.baseten.co/v1",
896
- "apiKeyEnvVar": "BASETEN_API_KEY",
746
+ "zhipuai-coding-plan": {
747
+ "url": "https://open.bigmodel.cn/api/coding/paas/v4",
748
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
897
749
  "apiKeyHeader": "Authorization",
898
- "name": "Baseten",
899
- "models": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
900
- "docUrl": "https://docs.baseten.co/development/model-apis/overview",
750
+ "name": "Zhipu AI Coding Plan",
751
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
752
+ "docUrl": "https://docs.bigmodel.cn/cn/coding-plan/overview",
901
753
  "gateway": "models.dev"
902
754
  },
903
- "cortecs": {
904
- "url": "https://api.cortecs.ai/v1",
905
- "apiKeyEnvVar": "CORTECS_API_KEY",
755
+ "perplexity": {
756
+ "url": "https://api.perplexity.ai",
757
+ "apiKeyEnvVar": "PERPLEXITY_API_KEY",
906
758
  "apiKeyHeader": "Authorization",
907
- "name": "Cortecs",
908
- "models": [
909
- "claude-4-5-sonnet",
910
- "claude-sonnet-4",
911
- "deepseek-v3-0324",
912
- "gemini-2.5-pro",
913
- "gpt-4.1",
914
- "gpt-oss-120b",
915
- "kimi-k2-instruct",
916
- "llama-3.1-405b-instruct",
917
- "nova-pro-v1",
918
- "qwen3-32b",
919
- "qwen3-coder-480b-a35b-instruct"
920
- ],
921
- "docUrl": "https://api.cortecs.ai/v1/models",
759
+ "name": "Perplexity",
760
+ "models": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
761
+ "docUrl": "https://docs.perplexity.ai",
922
762
  "gateway": "models.dev"
923
763
  },
924
- "mistral": {
925
- "url": "https://api.mistral.ai/v1",
926
- "apiKeyEnvVar": "MISTRAL_API_KEY",
927
- "apiKeyHeader": "Authorization",
928
- "name": "Mistral",
764
+ "openrouter": {
765
+ "url": "https://openrouter.ai/api/v1",
766
+ "apiKeyEnvVar": "OPENROUTER_API_KEY",
767
+ "name": "OpenRouter",
929
768
  "models": [
930
- "codestral-latest",
931
- "devstral-medium-2507",
932
- "devstral-small-2505",
933
- "devstral-small-2507",
934
- "magistral-medium-latest",
935
- "magistral-small",
936
- "ministral-3b-latest",
937
- "ministral-8b-latest",
938
- "mistral-large-latest",
939
- "mistral-medium-2505",
940
- "mistral-medium-2508",
941
- "mistral-medium-latest",
942
- "mistral-nemo",
943
- "mistral-small-latest",
944
- "open-mistral-7b",
945
- "open-mixtral-8x22b",
946
- "open-mixtral-8x7b",
947
- "pixtral-12b",
948
- "pixtral-large-latest"
769
+ "anthropic/claude-3.5-haiku",
770
+ "anthropic/claude-3.7-sonnet",
771
+ "anthropic/claude-haiku-4.5",
772
+ "anthropic/claude-opus-4",
773
+ "anthropic/claude-opus-4.1",
774
+ "anthropic/claude-sonnet-4",
775
+ "anthropic/claude-sonnet-4.5",
776
+ "cognitivecomputations/dolphin3.0-mistral-24b",
777
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
778
+ "deepseek/deepseek-chat-v3-0324",
779
+ "deepseek/deepseek-chat-v3.1",
780
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
781
+ "deepseek/deepseek-r1-0528:free",
782
+ "deepseek/deepseek-r1-distill-llama-70b",
783
+ "deepseek/deepseek-r1-distill-qwen-14b",
784
+ "deepseek/deepseek-r1:free",
785
+ "deepseek/deepseek-v3-base:free",
786
+ "deepseek/deepseek-v3.1-terminus",
787
+ "featherless/qwerky-72b",
788
+ "google/gemini-2.0-flash-001",
789
+ "google/gemini-2.0-flash-exp:free",
790
+ "google/gemini-2.5-flash",
791
+ "google/gemini-2.5-flash-lite",
792
+ "google/gemini-2.5-flash-lite-preview-09-2025",
793
+ "google/gemini-2.5-flash-preview-09-2025",
794
+ "google/gemini-2.5-pro",
795
+ "google/gemini-2.5-pro-preview-05-06",
796
+ "google/gemini-2.5-pro-preview-06-05",
797
+ "google/gemma-2-9b-it:free",
798
+ "google/gemma-3-12b-it",
799
+ "google/gemma-3-27b-it",
800
+ "google/gemma-3n-e4b-it",
801
+ "google/gemma-3n-e4b-it:free",
802
+ "meta-llama/llama-3.2-11b-vision-instruct",
803
+ "meta-llama/llama-3.3-70b-instruct:free",
804
+ "meta-llama/llama-4-scout:free",
805
+ "microsoft/mai-ds-r1:free",
806
+ "mistralai/codestral-2508",
807
+ "mistralai/devstral-medium-2507",
808
+ "mistralai/devstral-small-2505",
809
+ "mistralai/devstral-small-2505:free",
810
+ "mistralai/devstral-small-2507",
811
+ "mistralai/mistral-7b-instruct:free",
812
+ "mistralai/mistral-medium-3",
813
+ "mistralai/mistral-medium-3.1",
814
+ "mistralai/mistral-nemo:free",
815
+ "mistralai/mistral-small-3.1-24b-instruct",
816
+ "mistralai/mistral-small-3.2-24b-instruct",
817
+ "mistralai/mistral-small-3.2-24b-instruct:free",
818
+ "moonshotai/kimi-dev-72b:free",
819
+ "moonshotai/kimi-k2",
820
+ "moonshotai/kimi-k2-0905",
821
+ "moonshotai/kimi-k2:free",
822
+ "nousresearch/deephermes-3-llama-3-8b-preview",
823
+ "nousresearch/hermes-4-405b",
824
+ "nousresearch/hermes-4-70b",
825
+ "openai/gpt-4.1",
826
+ "openai/gpt-4.1-mini",
827
+ "openai/gpt-4o-mini",
828
+ "openai/gpt-5",
829
+ "openai/gpt-5-chat",
830
+ "openai/gpt-5-codex",
831
+ "openai/gpt-5-image",
832
+ "openai/gpt-5-mini",
833
+ "openai/gpt-5-nano",
834
+ "openai/gpt-oss-120b",
835
+ "openai/gpt-oss-20b",
836
+ "openai/o4-mini",
837
+ "openrouter/cypher-alpha:free",
838
+ "openrouter/horizon-alpha",
839
+ "openrouter/horizon-beta",
840
+ "openrouter/sonoma-dusk-alpha",
841
+ "openrouter/sonoma-sky-alpha",
842
+ "qwen/qwen-2.5-coder-32b-instruct",
843
+ "qwen/qwen2.5-vl-32b-instruct:free",
844
+ "qwen/qwen2.5-vl-72b-instruct",
845
+ "qwen/qwen2.5-vl-72b-instruct:free",
846
+ "qwen/qwen3-14b:free",
847
+ "qwen/qwen3-235b-a22b-07-25",
848
+ "qwen/qwen3-235b-a22b-07-25:free",
849
+ "qwen/qwen3-235b-a22b-thinking-2507",
850
+ "qwen/qwen3-235b-a22b:free",
851
+ "qwen/qwen3-30b-a3b-instruct-2507",
852
+ "qwen/qwen3-30b-a3b-thinking-2507",
853
+ "qwen/qwen3-30b-a3b:free",
854
+ "qwen/qwen3-32b:free",
855
+ "qwen/qwen3-8b:free",
856
+ "qwen/qwen3-coder",
857
+ "qwen/qwen3-coder:free",
858
+ "qwen/qwen3-max",
859
+ "qwen/qwen3-next-80b-a3b-instruct",
860
+ "qwen/qwen3-next-80b-a3b-thinking",
861
+ "qwen/qwq-32b:free",
862
+ "rekaai/reka-flash-3",
863
+ "sarvamai/sarvam-m:free",
864
+ "thudm/glm-z1-32b:free",
865
+ "tngtech/deepseek-r1t2-chimera:free",
866
+ "x-ai/grok-3",
867
+ "x-ai/grok-3-beta",
868
+ "x-ai/grok-3-mini",
869
+ "x-ai/grok-3-mini-beta",
870
+ "x-ai/grok-4",
871
+ "x-ai/grok-4-fast",
872
+ "x-ai/grok-4-fast:free",
873
+ "x-ai/grok-code-fast-1",
874
+ "z-ai/glm-4.5",
875
+ "z-ai/glm-4.5-air",
876
+ "z-ai/glm-4.5-air:free",
877
+ "z-ai/glm-4.5v",
878
+ "z-ai/glm-4.6"
949
879
  ],
950
- "docUrl": "https://docs.mistral.ai/getting-started/models/",
880
+ "docUrl": "https://openrouter.ai/models",
951
881
  "gateway": "models.dev"
952
882
  },
953
- "venice": {
954
- "url": "https://api.venice.ai/api/v1",
955
- "apiKeyEnvVar": "VENICE_API_KEY",
883
+ "synthetic": {
884
+ "url": "https://api.synthetic.new/v1",
885
+ "apiKeyEnvVar": "SYNTHETIC_API_KEY",
956
886
  "apiKeyHeader": "Authorization",
957
- "name": "Venice AI",
887
+ "name": "Synthetic",
958
888
  "models": [
959
- "deepseek-coder-v2-lite",
960
- "deepseek-r1-671b",
961
- "dolphin-2.9.2-qwen2-72b",
962
- "llama-3.1-405b",
963
- "llama-3.2-3b",
964
- "llama-3.3-70b",
965
- "mistral-31-24b",
966
- "qwen-2.5-coder-32b",
967
- "qwen-2.5-qwq-32b",
968
- "qwen-2.5-vl",
969
- "qwen3-235b",
970
- "qwen3-4b",
971
- "venice-uncensored"
889
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
890
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
891
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
892
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
893
+ "hf:deepseek-ai/DeepSeek-R1",
894
+ "hf:deepseek-ai/DeepSeek-R1-0528",
895
+ "hf:deepseek-ai/DeepSeek-V3",
896
+ "hf:deepseek-ai/DeepSeek-V3-0324",
897
+ "hf:deepseek-ai/DeepSeek-V3.1",
898
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
899
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
900
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
901
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
902
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
903
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
904
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
905
+ "hf:moonshotai/Kimi-K2-Instruct",
906
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
907
+ "hf:openai/gpt-oss-120b",
908
+ "hf:zai-org/GLM-4.5",
909
+ "hf:zai-org/GLM-4.6"
972
910
  ],
973
- "docUrl": "https://docs.venice.ai",
911
+ "docUrl": "https://synthetic.new/pricing",
974
912
  "gateway": "models.dev"
975
913
  },
976
- "alibaba": {
977
- "url": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
978
- "apiKeyEnvVar": "DASHSCOPE_API_KEY",
914
+ "deepinfra": {
915
+ "url": "https://api.deepinfra.com/v1/openai",
916
+ "apiKeyEnvVar": "DEEPINFRA_API_KEY",
979
917
  "apiKeyHeader": "Authorization",
980
- "name": "Alibaba",
918
+ "name": "Deep Infra",
981
919
  "models": [
982
- "qvq-max",
983
- "qwen-flash",
984
- "qwen-max",
985
- "qwen-mt-plus",
986
- "qwen-mt-turbo",
987
- "qwen-omni-turbo",
988
- "qwen-omni-turbo-realtime",
989
- "qwen-plus",
990
- "qwen-plus-character-ja",
991
- "qwen-turbo",
992
- "qwen-vl-max",
993
- "qwen-vl-ocr",
994
- "qwen-vl-plus",
995
- "qwen2-5-14b-instruct",
996
- "qwen2-5-32b-instruct",
997
- "qwen2-5-72b-instruct",
998
- "qwen2-5-7b-instruct",
999
- "qwen2-5-omni-7b",
1000
- "qwen2-5-vl-72b-instruct",
1001
- "qwen2-5-vl-7b-instruct",
1002
- "qwen3-14b",
1003
- "qwen3-235b-a22b",
1004
- "qwen3-32b",
1005
- "qwen3-8b",
1006
- "qwen3-asr-flash",
1007
- "qwen3-coder-30b-a3b-instruct",
1008
- "qwen3-coder-480b-a35b-instruct",
1009
- "qwen3-coder-flash",
1010
- "qwen3-coder-plus",
1011
- "qwen3-livetranslate-flash-realtime",
1012
- "qwen3-max",
1013
- "qwen3-next-80b-a3b-instruct",
1014
- "qwen3-next-80b-a3b-thinking",
1015
- "qwen3-omni-flash",
1016
- "qwen3-omni-flash-realtime",
1017
- "qwen3-vl-235b-a22b",
1018
- "qwen3-vl-30b-a3b",
1019
- "qwen3-vl-plus",
1020
- "qwq-plus"
920
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
921
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
922
+ "moonshotai/Kimi-K2-Instruct",
923
+ "zai-org/GLM-4.5"
1021
924
  ],
1022
- "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
925
+ "docUrl": "https://deepinfra.com/models",
1023
926
  "gateway": "models.dev"
1024
927
  },
1025
- "alibaba-cn": {
1026
- "url": "https://dashscope.aliyuncs.com/compatible-mode/v1",
1027
- "apiKeyEnvVar": "DASHSCOPE_API_KEY",
928
+ "zhipuai": {
929
+ "url": "https://open.bigmodel.cn/api/paas/v4",
930
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
1028
931
  "apiKeyHeader": "Authorization",
1029
- "name": "Alibaba (China)",
932
+ "name": "Zhipu AI",
933
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
934
+ "docUrl": "https://docs.z.ai/guides/overview/pricing",
935
+ "gateway": "models.dev"
936
+ },
937
+ "submodel": {
938
+ "url": "https://llm.submodel.ai/v1",
939
+ "apiKeyEnvVar": "SUBMODEL_INSTAGEN_ACCESS_KEY",
940
+ "apiKeyHeader": "Authorization",
941
+ "name": "submodel",
1030
942
  "models": [
1031
- "deepseek-r1",
1032
- "deepseek-r1-0528",
1033
- "deepseek-r1-distill-llama-70b",
1034
- "deepseek-r1-distill-llama-8b",
1035
- "deepseek-r1-distill-qwen-1-5b",
1036
- "deepseek-r1-distill-qwen-14b",
1037
- "deepseek-r1-distill-qwen-32b",
1038
- "deepseek-r1-distill-qwen-7b",
1039
- "deepseek-v3",
1040
- "deepseek-v3-1",
1041
- "deepseek-v3-2-exp",
1042
- "moonshot-kimi-k2-instruct",
1043
- "qvq-max",
1044
- "qwen-deep-research",
1045
- "qwen-doc-turbo",
1046
- "qwen-flash",
1047
- "qwen-long",
1048
- "qwen-math-plus",
1049
- "qwen-math-turbo",
1050
- "qwen-max",
1051
- "qwen-mt-plus",
1052
- "qwen-mt-turbo",
1053
- "qwen-omni-turbo",
1054
- "qwen-omni-turbo-realtime",
1055
- "qwen-plus",
1056
- "qwen-plus-character",
1057
- "qwen-turbo",
1058
- "qwen-vl-max",
1059
- "qwen-vl-ocr",
1060
- "qwen-vl-plus",
1061
- "qwen2-5-14b-instruct",
1062
- "qwen2-5-32b-instruct",
1063
- "qwen2-5-72b-instruct",
1064
- "qwen2-5-7b-instruct",
1065
- "qwen2-5-coder-32b-instruct",
1066
- "qwen2-5-coder-7b-instruct",
1067
- "qwen2-5-math-72b-instruct",
1068
- "qwen2-5-math-7b-instruct",
1069
- "qwen2-5-omni-7b",
1070
- "qwen2-5-vl-72b-instruct",
1071
- "qwen2-5-vl-7b-instruct",
1072
- "qwen3-14b",
1073
- "qwen3-235b-a22b",
1074
- "qwen3-32b",
1075
- "qwen3-8b",
1076
- "qwen3-asr-flash",
1077
- "qwen3-coder-30b-a3b-instruct",
1078
- "qwen3-coder-480b-a35b-instruct",
1079
- "qwen3-coder-flash",
1080
- "qwen3-coder-plus",
1081
- "qwen3-max",
1082
- "qwen3-next-80b-a3b-instruct",
1083
- "qwen3-next-80b-a3b-thinking",
1084
- "qwen3-omni-flash",
1085
- "qwen3-omni-flash-realtime",
1086
- "qwen3-vl-235b-a22b",
1087
- "qwen3-vl-30b-a3b",
1088
- "qwen3-vl-plus",
1089
- "qwq-32b",
1090
- "qwq-plus",
1091
- "tongyi-intent-detect-v3"
943
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
944
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
945
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
946
+ "deepseek-ai/DeepSeek-R1-0528",
947
+ "deepseek-ai/DeepSeek-V3-0324",
948
+ "deepseek-ai/DeepSeek-V3.1",
949
+ "openai/gpt-oss-120b",
950
+ "zai-org/GLM-4.5-Air",
951
+ "zai-org/GLM-4.5-FP8"
1092
952
  ],
1093
- "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
953
+ "docUrl": "https://submodel.gitbook.io",
1094
954
  "gateway": "models.dev"
1095
955
  },
1096
- "chutes": {
1097
- "url": "https://llm.chutes.ai/v1",
1098
- "apiKeyEnvVar": "CHUTES_API_KEY",
956
+ "zai": {
957
+ "url": "https://api.z.ai/api/paas/v4",
958
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
1099
959
  "apiKeyHeader": "Authorization",
1100
- "name": "Chutes",
960
+ "name": "Z.AI",
961
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
962
+ "docUrl": "https://docs.z.ai/guides/overview/pricing",
963
+ "gateway": "models.dev"
964
+ },
965
+ "inference": {
966
+ "url": "https://inference.net/v1",
967
+ "apiKeyEnvVar": "INFERENCE_API_KEY",
968
+ "apiKeyHeader": "Authorization",
969
+ "name": "Inference",
970
+ "models": [
971
+ "google/gemma-3",
972
+ "meta/llama-3.1-8b-instruct",
973
+ "meta/llama-3.2-11b-vision-instruct",
974
+ "meta/llama-3.2-1b-instruct",
975
+ "meta/llama-3.2-3b-instruct",
976
+ "mistral/mistral-nemo-12b-instruct",
977
+ "osmosis/osmosis-structure-0.6b",
978
+ "qwen/qwen-2.5-7b-vision-instruct",
979
+ "qwen/qwen3-embedding-4b"
980
+ ],
981
+ "docUrl": "https://inference.net/models",
982
+ "gateway": "models.dev"
983
+ },
984
+ "requesty": {
985
+ "url": "https://router.requesty.ai/v1",
986
+ "apiKeyEnvVar": "REQUESTY_API_KEY",
987
+ "apiKeyHeader": "Authorization",
988
+ "name": "Requesty",
989
+ "models": [
990
+ "anthropic/claude-3-7-sonnet",
991
+ "anthropic/claude-4-sonnet-20250522",
992
+ "anthropic/claude-opus-4",
993
+ "anthropic/claude-opus-4-1-20250805",
994
+ "google/gemini-2.5-flash",
995
+ "google/gemini-2.5-pro",
996
+ "openai/gpt-4.1",
997
+ "openai/gpt-4.1-mini",
998
+ "openai/gpt-4o-mini",
999
+ "openai/gpt-5",
1000
+ "openai/gpt-5-mini",
1001
+ "openai/gpt-5-nano",
1002
+ "openai/o4-mini"
1003
+ ],
1004
+ "docUrl": "https://requesty.ai/solution/llm-routing/models",
1005
+ "gateway": "models.dev"
1006
+ },
1007
+ "morph": {
1008
+ "url": "https://api.morphllm.com/v1",
1009
+ "apiKeyEnvVar": "MORPH_API_KEY",
1010
+ "apiKeyHeader": "Authorization",
1011
+ "name": "Morph",
1012
+ "models": ["auto", "morph-v3-fast", "morph-v3-large"],
1013
+ "docUrl": "https://docs.morphllm.com/api-reference/introduction",
1014
+ "gateway": "models.dev"
1015
+ },
1016
+ "lmstudio": {
1017
+ "url": "http://127.0.0.1:1234/v1",
1018
+ "apiKeyEnvVar": "LMSTUDIO_API_KEY",
1019
+ "apiKeyHeader": "Authorization",
1020
+ "name": "LMStudio",
1021
+ "models": ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1022
+ "docUrl": "https://lmstudio.ai/models",
1023
+ "gateway": "models.dev"
1024
+ },
1025
+ "anthropic": {
1026
+ "apiKeyEnvVar": "ANTHROPIC_API_KEY",
1027
+ "name": "Anthropic",
1028
+ "models": [
1029
+ "claude-3-5-haiku-20241022",
1030
+ "claude-3-5-haiku-latest",
1031
+ "claude-3-5-sonnet-20240620",
1032
+ "claude-3-5-sonnet-20241022",
1033
+ "claude-3-7-sonnet-20250219",
1034
+ "claude-3-7-sonnet-latest",
1035
+ "claude-3-haiku-20240307",
1036
+ "claude-3-opus-20240229",
1037
+ "claude-3-sonnet-20240229",
1038
+ "claude-haiku-4-5",
1039
+ "claude-haiku-4-5-20251001",
1040
+ "claude-opus-4-0",
1041
+ "claude-opus-4-1",
1042
+ "claude-opus-4-1-20250805",
1043
+ "claude-opus-4-20250514",
1044
+ "claude-sonnet-4-0",
1045
+ "claude-sonnet-4-20250514",
1046
+ "claude-sonnet-4-5",
1047
+ "claude-sonnet-4-5-20250929"
1048
+ ],
1049
+ "docUrl": "https://docs.anthropic.com/en/docs/about-claude/models",
1050
+ "gateway": "models.dev"
1051
+ },
1052
+ "fireworks-ai": {
1053
+ "url": "https://api.fireworks.ai/inference/v1/",
1054
+ "apiKeyEnvVar": "FIREWORKS_API_KEY",
1055
+ "apiKeyHeader": "Authorization",
1056
+ "name": "Fireworks AI",
1057
+ "models": [
1058
+ "accounts/fireworks/models/deepseek-r1-0528",
1059
+ "accounts/fireworks/models/deepseek-v3-0324",
1060
+ "accounts/fireworks/models/deepseek-v3p1",
1061
+ "accounts/fireworks/models/glm-4p5",
1062
+ "accounts/fireworks/models/glm-4p5-air",
1063
+ "accounts/fireworks/models/gpt-oss-120b",
1064
+ "accounts/fireworks/models/gpt-oss-20b",
1065
+ "accounts/fireworks/models/kimi-k2-instruct",
1066
+ "accounts/fireworks/models/qwen3-235b-a22b",
1067
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1068
+ ],
1069
+ "docUrl": "https://fireworks.ai/docs/",
1070
+ "gateway": "models.dev"
1071
+ },
1072
+ "modelscope": {
1073
+ "url": "https://api-inference.modelscope.cn/v1",
1074
+ "apiKeyEnvVar": "MODELSCOPE_API_KEY",
1075
+ "apiKeyHeader": "Authorization",
1076
+ "name": "ModelScope",
1077
+ "models": [
1078
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1079
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1080
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1081
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1082
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1083
+ "ZhipuAI/GLM-4.5",
1084
+ "ZhipuAI/GLM-4.6"
1085
+ ],
1086
+ "docUrl": "https://modelscope.cn/docs/model-service/API-Inference/intro",
1087
+ "gateway": "models.dev"
1088
+ },
1089
+ "llama": {
1090
+ "url": "https://api.llama.com/compat/v1/",
1091
+ "apiKeyEnvVar": "LLAMA_API_KEY",
1092
+ "apiKeyHeader": "Authorization",
1093
+ "name": "Llama",
1094
+ "models": [
1095
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1096
+ "cerebras-llama-4-scout-17b-16e-instruct",
1097
+ "groq-llama-4-maverick-17b-128e-instruct",
1098
+ "llama-3.3-70b-instruct",
1099
+ "llama-3.3-8b-instruct",
1100
+ "llama-4-maverick-17b-128e-instruct-fp8",
1101
+ "llama-4-scout-17b-16e-instruct-fp8"
1102
+ ],
1103
+ "docUrl": "https://llama.developer.meta.com/docs/models",
1104
+ "gateway": "models.dev"
1105
+ },
1106
+ "scaleway": {
1107
+ "url": "https://api.scaleway.ai/v1",
1108
+ "apiKeyEnvVar": "SCALEWAY_API_KEY",
1109
+ "apiKeyHeader": "Authorization",
1110
+ "name": "Scaleway",
1101
1111
  "models": [
1102
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1103
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1104
- "Qwen/Qwen3-30B-A3B",
1105
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1106
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1107
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1108
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1109
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1110
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1111
- "chutesai/Devstral-Small-2505",
1112
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1113
- "deepseek-ai/DeepSeek-R1-0528",
1114
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1115
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1116
- "deepseek-ai/DeepSeek-V3-0324",
1117
- "deepseek-ai/DeepSeek-V3.1",
1118
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1119
- "deepseek-ai/DeepSeek-V3.1-turbo",
1120
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1121
- "deepseek-ai/DeepSeek-V3.2-Exp",
1122
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1123
- "moonshotai/Kimi-Dev-72B",
1124
- "moonshotai/Kimi-K2-Instruct-0905",
1125
- "moonshotai/Kimi-K2-Instruct-75k",
1126
- "moonshotai/Kimi-VL-A3B-Thinking",
1127
- "openai/gpt-oss-120b",
1128
- "tngtech/DeepSeek-R1T-Chimera",
1129
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1130
- "zai-org/GLM-4.5-Air",
1131
- "zai-org/GLM-4.5-FP8",
1132
- "zai-org/GLM-4.5-turbo",
1133
- "zai-org/GLM-4.6-FP8",
1134
- "zai-org/GLM-4.6-turbo"
1112
+ "deepseek-r1-distill-llama-70b",
1113
+ "gemma-3-27b-it",
1114
+ "gpt-oss-120b",
1115
+ "llama-3.1-8b-instruct",
1116
+ "llama-3.3-70b-instruct",
1117
+ "mistral-nemo-instruct-2407",
1118
+ "mistral-small-3.2-24b-instruct-2506",
1119
+ "pixtral-12b-2409",
1120
+ "qwen3-235b-a22b-instruct-2507",
1121
+ "qwen3-coder-30b-a3b-instruct",
1122
+ "voxtral-small-24b-2507"
1135
1123
  ],
1136
- "docUrl": "https://llm.chutes.ai/v1/models",
1124
+ "docUrl": "https://www.scaleway.com/en/docs/generative-apis/",
1137
1125
  "gateway": "models.dev"
1138
1126
  },
1139
- "upstage": {
1140
- "url": "https://api.upstage.ai",
1141
- "apiKeyEnvVar": "UPSTAGE_API_KEY",
1127
+ "cerebras": {
1128
+ "url": "https://api.cerebras.ai/v1",
1129
+ "apiKeyEnvVar": "CEREBRAS_API_KEY",
1142
1130
  "apiKeyHeader": "Authorization",
1143
- "name": "Upstage",
1144
- "models": ["solar-mini", "solar-pro2"],
1145
- "docUrl": "https://developers.upstage.ai/docs/apis/chat",
1131
+ "name": "Cerebras",
1132
+ "models": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1133
+ "docUrl": "https://inference-docs.cerebras.ai/models/overview",
1146
1134
  "gateway": "models.dev"
1147
1135
  },
1148
1136
  "netlify": {
@@ -1190,6 +1178,73 @@
1190
1178
  }
1191
1179
  },
1192
1180
  "models": {
1181
+ "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1182
+ "lucidquery": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1183
+ "moonshotai": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1184
+ "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1185
+ "alibaba": [
1186
+ "qvq-max",
1187
+ "qwen-flash",
1188
+ "qwen-max",
1189
+ "qwen-mt-plus",
1190
+ "qwen-mt-turbo",
1191
+ "qwen-omni-turbo",
1192
+ "qwen-omni-turbo-realtime",
1193
+ "qwen-plus",
1194
+ "qwen-plus-character-ja",
1195
+ "qwen-turbo",
1196
+ "qwen-vl-max",
1197
+ "qwen-vl-ocr",
1198
+ "qwen-vl-plus",
1199
+ "qwen2-5-14b-instruct",
1200
+ "qwen2-5-32b-instruct",
1201
+ "qwen2-5-72b-instruct",
1202
+ "qwen2-5-7b-instruct",
1203
+ "qwen2-5-omni-7b",
1204
+ "qwen2-5-vl-72b-instruct",
1205
+ "qwen2-5-vl-7b-instruct",
1206
+ "qwen3-14b",
1207
+ "qwen3-235b-a22b",
1208
+ "qwen3-32b",
1209
+ "qwen3-8b",
1210
+ "qwen3-asr-flash",
1211
+ "qwen3-coder-30b-a3b-instruct",
1212
+ "qwen3-coder-480b-a35b-instruct",
1213
+ "qwen3-coder-flash",
1214
+ "qwen3-coder-plus",
1215
+ "qwen3-livetranslate-flash-realtime",
1216
+ "qwen3-max",
1217
+ "qwen3-next-80b-a3b-instruct",
1218
+ "qwen3-next-80b-a3b-thinking",
1219
+ "qwen3-omni-flash",
1220
+ "qwen3-omni-flash-realtime",
1221
+ "qwen3-vl-235b-a22b",
1222
+ "qwen3-vl-30b-a3b",
1223
+ "qwen3-vl-plus",
1224
+ "qwq-plus"
1225
+ ],
1226
+ "xai": [
1227
+ "grok-2",
1228
+ "grok-2-1212",
1229
+ "grok-2-latest",
1230
+ "grok-2-vision",
1231
+ "grok-2-vision-1212",
1232
+ "grok-2-vision-latest",
1233
+ "grok-3",
1234
+ "grok-3-fast",
1235
+ "grok-3-fast-latest",
1236
+ "grok-3-latest",
1237
+ "grok-3-mini",
1238
+ "grok-3-mini-fast",
1239
+ "grok-3-mini-fast-latest",
1240
+ "grok-3-mini-latest",
1241
+ "grok-4",
1242
+ "grok-4-fast",
1243
+ "grok-4-fast-non-reasoning",
1244
+ "grok-beta",
1245
+ "grok-code-fast-1",
1246
+ "grok-vision-beta"
1247
+ ],
1193
1248
  "nvidia": [
1194
1249
  "black-forest-labs/flux.1-dev",
1195
1250
  "deepseek-ai/deepseek-v3.1",
@@ -1203,99 +1258,375 @@
1203
1258
  "nvidia/nemoretriever-ocr-v1",
1204
1259
  "nvidia/parakeet-tdt-0.6b-v2",
1205
1260
  "openai/gpt-oss-120b",
1206
- "openai/whisper-large-v3",
1207
- "qwen/qwen3-235b-a22b",
1208
- "qwen/qwen3-coder-480b-a35b-instruct"
1261
+ "openai/whisper-large-v3",
1262
+ "qwen/qwen3-235b-a22b",
1263
+ "qwen/qwen3-coder-480b-a35b-instruct"
1264
+ ],
1265
+ "upstage": ["solar-mini", "solar-pro2"],
1266
+ "groq": [
1267
+ "deepseek-r1-distill-llama-70b",
1268
+ "gemma2-9b-it",
1269
+ "llama-3.1-8b-instant",
1270
+ "llama-3.3-70b-versatile",
1271
+ "llama-guard-3-8b",
1272
+ "llama3-70b-8192",
1273
+ "llama3-8b-8192",
1274
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
1275
+ "meta-llama/llama-4-scout-17b-16e-instruct",
1276
+ "meta-llama/llama-guard-4-12b",
1277
+ "mistral-saba-24b",
1278
+ "moonshotai/kimi-k2-instruct",
1279
+ "moonshotai/kimi-k2-instruct-0905",
1280
+ "openai/gpt-oss-120b",
1281
+ "openai/gpt-oss-20b",
1282
+ "qwen-qwq-32b",
1283
+ "qwen/qwen3-32b"
1284
+ ],
1285
+ "mistral": [
1286
+ "codestral-latest",
1287
+ "devstral-medium-2507",
1288
+ "devstral-small-2505",
1289
+ "devstral-small-2507",
1290
+ "magistral-medium-latest",
1291
+ "magistral-small",
1292
+ "ministral-3b-latest",
1293
+ "ministral-8b-latest",
1294
+ "mistral-large-latest",
1295
+ "mistral-medium-2505",
1296
+ "mistral-medium-2508",
1297
+ "mistral-medium-latest",
1298
+ "mistral-nemo",
1299
+ "mistral-small-latest",
1300
+ "open-mistral-7b",
1301
+ "open-mixtral-8x22b",
1302
+ "open-mixtral-8x7b",
1303
+ "pixtral-12b",
1304
+ "pixtral-large-latest"
1305
+ ],
1306
+ "vercel": [
1307
+ "alibaba/qwen3-coder-plus",
1308
+ "alibaba/qwen3-max",
1309
+ "alibaba/qwen3-next-80b-a3b-instruct",
1310
+ "alibaba/qwen3-next-80b-a3b-thinking",
1311
+ "alibaba/qwen3-vl-instruct",
1312
+ "alibaba/qwen3-vl-thinking",
1313
+ "amazon/nova-lite",
1314
+ "amazon/nova-micro",
1315
+ "amazon/nova-pro",
1316
+ "anthropic/claude-3-5-haiku",
1317
+ "anthropic/claude-3-haiku",
1318
+ "anthropic/claude-3-opus",
1319
+ "anthropic/claude-3.5-sonnet",
1320
+ "anthropic/claude-3.7-sonnet",
1321
+ "anthropic/claude-4-1-opus",
1322
+ "anthropic/claude-4-opus",
1323
+ "anthropic/claude-4-sonnet",
1324
+ "anthropic/claude-4.5-sonnet",
1325
+ "anthropic/claude-haiku-4.5",
1326
+ "cerebras/qwen3-coder",
1327
+ "deepseek/deepseek-r1",
1328
+ "deepseek/deepseek-r1-distill-llama-70b",
1329
+ "deepseek/deepseek-v3.1-terminus",
1330
+ "deepseek/deepseek-v3.2-exp",
1331
+ "deepseek/deepseek-v3.2-exp-thinking",
1332
+ "google/gemini-2.0-flash",
1333
+ "google/gemini-2.0-flash-lite",
1334
+ "google/gemini-2.5-flash",
1335
+ "google/gemini-2.5-flash-lite",
1336
+ "google/gemini-2.5-flash-lite-preview-09-2025",
1337
+ "google/gemini-2.5-flash-preview-09-2025",
1338
+ "google/gemini-2.5-pro",
1339
+ "meta/llama-3.3-70b",
1340
+ "meta/llama-4-maverick",
1341
+ "meta/llama-4-scout",
1342
+ "mistral/codestral",
1343
+ "mistral/magistral-medium",
1344
+ "mistral/magistral-small",
1345
+ "mistral/ministral-3b",
1346
+ "mistral/ministral-8b",
1347
+ "mistral/mistral-large",
1348
+ "mistral/mistral-small",
1349
+ "mistral/mixtral-8x22b-instruct",
1350
+ "mistral/pixtral-12b",
1351
+ "mistral/pixtral-large",
1352
+ "moonshotai/kimi-k2",
1353
+ "morph/morph-v3-fast",
1354
+ "morph/morph-v3-large",
1355
+ "openai/gpt-4-turbo",
1356
+ "openai/gpt-4.1",
1357
+ "openai/gpt-4.1-mini",
1358
+ "openai/gpt-4.1-nano",
1359
+ "openai/gpt-4o",
1360
+ "openai/gpt-4o-mini",
1361
+ "openai/gpt-5",
1362
+ "openai/gpt-5-codex",
1363
+ "openai/gpt-5-mini",
1364
+ "openai/gpt-5-nano",
1365
+ "openai/gpt-oss-120b",
1366
+ "openai/gpt-oss-20b",
1367
+ "openai/o1",
1368
+ "openai/o3",
1369
+ "openai/o3-mini",
1370
+ "openai/o4-mini",
1371
+ "perplexity/sonar",
1372
+ "perplexity/sonar-pro",
1373
+ "perplexity/sonar-reasoning",
1374
+ "perplexity/sonar-reasoning-pro",
1375
+ "vercel/v0-1.0-md",
1376
+ "vercel/v0-1.5-md",
1377
+ "xai/grok-2",
1378
+ "xai/grok-2-vision",
1379
+ "xai/grok-3",
1380
+ "xai/grok-3-fast",
1381
+ "xai/grok-3-mini",
1382
+ "xai/grok-3-mini-fast",
1383
+ "xai/grok-4",
1384
+ "xai/grok-4-fast",
1385
+ "xai/grok-4-fast-non-reasoning",
1386
+ "xai/grok-code-fast-1",
1387
+ "zai/glm-4.5",
1388
+ "zai/glm-4.5-air",
1389
+ "zai/glm-4.5v",
1390
+ "zai/glm-4.6"
1391
+ ],
1392
+ "nebius": [
1393
+ "NousResearch/hermes-4-405b",
1394
+ "NousResearch/hermes-4-70b",
1395
+ "deepseek-ai/deepseek-v3",
1396
+ "meta-llama/llama-3.3-70b-instruct-base",
1397
+ "meta-llama/llama-3.3-70b-instruct-fast",
1398
+ "meta-llama/llama-3_1-405b-instruct",
1399
+ "moonshotai/kimi-k2-instruct",
1400
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1401
+ "openai/gpt-oss-120b",
1402
+ "openai/gpt-oss-20b",
1403
+ "qwen/qwen3-235b-a22b-instruct-2507",
1404
+ "qwen/qwen3-235b-a22b-thinking-2507",
1405
+ "qwen/qwen3-coder-480b-a35b-instruct",
1406
+ "zai-org/glm-4.5",
1407
+ "zai-org/glm-4.5-air"
1209
1408
  ],
1210
- "modelscope": [
1409
+ "deepseek": ["deepseek-chat", "deepseek-reasoner"],
1410
+ "alibaba-cn": [
1411
+ "deepseek-r1",
1412
+ "deepseek-r1-0528",
1413
+ "deepseek-r1-distill-llama-70b",
1414
+ "deepseek-r1-distill-llama-8b",
1415
+ "deepseek-r1-distill-qwen-1-5b",
1416
+ "deepseek-r1-distill-qwen-14b",
1417
+ "deepseek-r1-distill-qwen-32b",
1418
+ "deepseek-r1-distill-qwen-7b",
1419
+ "deepseek-v3",
1420
+ "deepseek-v3-1",
1421
+ "deepseek-v3-2-exp",
1422
+ "moonshot-kimi-k2-instruct",
1423
+ "qvq-max",
1424
+ "qwen-deep-research",
1425
+ "qwen-doc-turbo",
1426
+ "qwen-flash",
1427
+ "qwen-long",
1428
+ "qwen-math-plus",
1429
+ "qwen-math-turbo",
1430
+ "qwen-max",
1431
+ "qwen-mt-plus",
1432
+ "qwen-mt-turbo",
1433
+ "qwen-omni-turbo",
1434
+ "qwen-omni-turbo-realtime",
1435
+ "qwen-plus",
1436
+ "qwen-plus-character",
1437
+ "qwen-turbo",
1438
+ "qwen-vl-max",
1439
+ "qwen-vl-ocr",
1440
+ "qwen-vl-plus",
1441
+ "qwen2-5-14b-instruct",
1442
+ "qwen2-5-32b-instruct",
1443
+ "qwen2-5-72b-instruct",
1444
+ "qwen2-5-7b-instruct",
1445
+ "qwen2-5-coder-32b-instruct",
1446
+ "qwen2-5-coder-7b-instruct",
1447
+ "qwen2-5-math-72b-instruct",
1448
+ "qwen2-5-math-7b-instruct",
1449
+ "qwen2-5-omni-7b",
1450
+ "qwen2-5-vl-72b-instruct",
1451
+ "qwen2-5-vl-7b-instruct",
1452
+ "qwen3-14b",
1453
+ "qwen3-235b-a22b",
1454
+ "qwen3-32b",
1455
+ "qwen3-8b",
1456
+ "qwen3-asr-flash",
1457
+ "qwen3-coder-30b-a3b-instruct",
1458
+ "qwen3-coder-480b-a35b-instruct",
1459
+ "qwen3-coder-flash",
1460
+ "qwen3-coder-plus",
1461
+ "qwen3-max",
1462
+ "qwen3-next-80b-a3b-instruct",
1463
+ "qwen3-next-80b-a3b-thinking",
1464
+ "qwen3-omni-flash",
1465
+ "qwen3-omni-flash-realtime",
1466
+ "qwen3-vl-235b-a22b",
1467
+ "qwen3-vl-30b-a3b",
1468
+ "qwen3-vl-plus",
1469
+ "qwq-32b",
1470
+ "qwq-plus",
1471
+ "tongyi-intent-detect-v3"
1472
+ ],
1473
+ "venice": [
1474
+ "deepseek-coder-v2-lite",
1475
+ "deepseek-r1-671b",
1476
+ "dolphin-2.9.2-qwen2-72b",
1477
+ "llama-3.1-405b",
1478
+ "llama-3.2-3b",
1479
+ "llama-3.3-70b",
1480
+ "mistral-31-24b",
1481
+ "qwen-2.5-coder-32b",
1482
+ "qwen-2.5-qwq-32b",
1483
+ "qwen-2.5-vl",
1484
+ "qwen3-235b",
1485
+ "qwen3-4b",
1486
+ "venice-uncensored"
1487
+ ],
1488
+ "chutes": [
1211
1489
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1212
1490
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1491
+ "Qwen/Qwen3-30B-A3B",
1213
1492
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1214
1493
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1215
1494
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1216
- "ZhipuAI/GLM-4.5",
1217
- "ZhipuAI/GLM-4.6"
1495
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1496
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1497
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1498
+ "chutesai/Devstral-Small-2505",
1499
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1500
+ "deepseek-ai/DeepSeek-R1-0528",
1501
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1502
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1503
+ "deepseek-ai/DeepSeek-V3-0324",
1504
+ "deepseek-ai/DeepSeek-V3.1",
1505
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1506
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1507
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1508
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1509
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1510
+ "moonshotai/Kimi-Dev-72B",
1511
+ "moonshotai/Kimi-K2-Instruct-0905",
1512
+ "moonshotai/Kimi-K2-Instruct-75k",
1513
+ "moonshotai/Kimi-VL-A3B-Thinking",
1514
+ "openai/gpt-oss-120b",
1515
+ "tngtech/DeepSeek-R1T-Chimera",
1516
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1517
+ "zai-org/GLM-4.5-Air",
1518
+ "zai-org/GLM-4.5-FP8",
1519
+ "zai-org/GLM-4.5-turbo",
1520
+ "zai-org/GLM-4.6-FP8",
1521
+ "zai-org/GLM-4.6-turbo"
1218
1522
  ],
1219
- "aihubmix": [
1220
- "DeepSeek-V3.2-Exp",
1221
- "DeepSeek-V3.2-Exp-Think",
1222
- "Kimi-K2-0905",
1223
- "claude-haiku-4-5",
1224
- "claude-opus-4-1",
1225
- "claude-sonnet-4-5",
1226
- "gemini-2.5-flash",
1523
+ "cortecs": [
1524
+ "claude-4-5-sonnet",
1525
+ "claude-sonnet-4",
1526
+ "deepseek-v3-0324",
1227
1527
  "gemini-2.5-pro",
1228
- "glm-4.6",
1229
1528
  "gpt-4.1",
1230
- "gpt-4.1-mini",
1231
- "gpt-4.1-nano",
1232
- "gpt-4o",
1233
- "gpt-4o-2024-11-20",
1234
- "gpt-5",
1235
- "gpt-5-codex",
1236
- "gpt-5-mini",
1237
- "gpt-5-nano",
1238
- "gpt-5-pro",
1239
- "o4-mini",
1240
- "qwen3-235b-a22b-instruct-2507",
1241
- "qwen3-235b-a22b-thinking-2507",
1529
+ "gpt-oss-120b",
1530
+ "kimi-k2-instruct",
1531
+ "llama-3.1-405b-instruct",
1532
+ "nova-pro-v1",
1533
+ "qwen3-32b",
1242
1534
  "qwen3-coder-480b-a35b-instruct"
1243
1535
  ],
1244
- "lucidquery": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1245
- "xai": [
1246
- "grok-2",
1247
- "grok-2-1212",
1248
- "grok-2-latest",
1249
- "grok-2-vision",
1250
- "grok-2-vision-1212",
1251
- "grok-2-vision-latest",
1252
- "grok-3",
1253
- "grok-3-fast",
1254
- "grok-3-fast-latest",
1255
- "grok-3-latest",
1256
- "grok-3-mini",
1257
- "grok-3-mini-fast",
1258
- "grok-3-mini-fast-latest",
1259
- "grok-3-mini-latest",
1260
- "grok-4",
1261
- "grok-4-fast",
1262
- "grok-4-fast-non-reasoning",
1263
- "grok-beta",
1264
- "grok-code-fast-1",
1265
- "grok-vision-beta"
1266
- ],
1267
- "deepseek": ["deepseek-chat", "deepseek-reasoner"],
1268
- "requesty": [
1269
- "anthropic/claude-3-7-sonnet",
1270
- "anthropic/claude-4-sonnet-20250522",
1271
- "anthropic/claude-opus-4",
1272
- "anthropic/claude-opus-4-1-20250805",
1273
- "google/gemini-2.5-flash",
1274
- "google/gemini-2.5-pro",
1536
+ "github-models": [
1537
+ "ai21-labs/ai21-jamba-1.5-large",
1538
+ "ai21-labs/ai21-jamba-1.5-mini",
1539
+ "cohere/cohere-command-a",
1540
+ "cohere/cohere-command-r",
1541
+ "cohere/cohere-command-r-08-2024",
1542
+ "cohere/cohere-command-r-plus",
1543
+ "cohere/cohere-command-r-plus-08-2024",
1544
+ "core42/jais-30b-chat",
1545
+ "deepseek/deepseek-r1",
1546
+ "deepseek/deepseek-r1-0528",
1547
+ "deepseek/deepseek-v3-0324",
1548
+ "meta/llama-3.2-11b-vision-instruct",
1549
+ "meta/llama-3.2-90b-vision-instruct",
1550
+ "meta/llama-3.3-70b-instruct",
1551
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
1552
+ "meta/llama-4-scout-17b-16e-instruct",
1553
+ "meta/meta-llama-3-70b-instruct",
1554
+ "meta/meta-llama-3-8b-instruct",
1555
+ "meta/meta-llama-3.1-405b-instruct",
1556
+ "meta/meta-llama-3.1-70b-instruct",
1557
+ "meta/meta-llama-3.1-8b-instruct",
1558
+ "microsoft/mai-ds-r1",
1559
+ "microsoft/phi-3-medium-128k-instruct",
1560
+ "microsoft/phi-3-medium-4k-instruct",
1561
+ "microsoft/phi-3-mini-128k-instruct",
1562
+ "microsoft/phi-3-mini-4k-instruct",
1563
+ "microsoft/phi-3-small-128k-instruct",
1564
+ "microsoft/phi-3-small-8k-instruct",
1565
+ "microsoft/phi-3.5-mini-instruct",
1566
+ "microsoft/phi-3.5-moe-instruct",
1567
+ "microsoft/phi-3.5-vision-instruct",
1568
+ "microsoft/phi-4",
1569
+ "microsoft/phi-4-mini-instruct",
1570
+ "microsoft/phi-4-mini-reasoning",
1571
+ "microsoft/phi-4-multimodal-instruct",
1572
+ "microsoft/phi-4-reasoning",
1573
+ "mistral-ai/codestral-2501",
1574
+ "mistral-ai/ministral-3b",
1575
+ "mistral-ai/mistral-large-2411",
1576
+ "mistral-ai/mistral-medium-2505",
1577
+ "mistral-ai/mistral-nemo",
1578
+ "mistral-ai/mistral-small-2503",
1275
1579
  "openai/gpt-4.1",
1276
1580
  "openai/gpt-4.1-mini",
1581
+ "openai/gpt-4.1-nano",
1582
+ "openai/gpt-4o",
1277
1583
  "openai/gpt-4o-mini",
1278
- "openai/gpt-5",
1279
- "openai/gpt-5-mini",
1280
- "openai/gpt-5-nano",
1281
- "openai/o4-mini"
1584
+ "openai/o1",
1585
+ "openai/o1-mini",
1586
+ "openai/o1-preview",
1587
+ "openai/o3",
1588
+ "openai/o3-mini",
1589
+ "openai/o4-mini",
1590
+ "xai/grok-3",
1591
+ "xai/grok-3-mini"
1592
+ ],
1593
+ "togetherai": [
1594
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1595
+ "deepseek-ai/DeepSeek-R1",
1596
+ "deepseek-ai/DeepSeek-V3",
1597
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1598
+ "moonshotai/Kimi-K2-Instruct",
1599
+ "openai/gpt-oss-120b"
1600
+ ],
1601
+ "baseten": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1602
+ "huggingface": [
1603
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1604
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1605
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1606
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1607
+ "deepseek-ai/DeepSeek-R1-0528",
1608
+ "deepseek-ai/Deepseek-V3-0324",
1609
+ "moonshotai/Kimi-K2-Instruct",
1610
+ "moonshotai/Kimi-K2-Instruct-0905",
1611
+ "zai-org/GLM-4.5",
1612
+ "zai-org/GLM-4.5-Air",
1613
+ "zai-org/GLM-4.6"
1282
1614
  ],
1283
- "nebius": [
1284
- "NousResearch/hermes-4-405b",
1285
- "NousResearch/hermes-4-70b",
1286
- "deepseek-ai/deepseek-v3",
1287
- "meta-llama/llama-3.3-70b-instruct-base",
1288
- "meta-llama/llama-3.3-70b-instruct-fast",
1289
- "meta-llama/llama-3_1-405b-instruct",
1290
- "moonshotai/kimi-k2-instruct",
1291
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1292
- "openai/gpt-oss-120b",
1293
- "openai/gpt-oss-20b",
1294
- "qwen/qwen3-235b-a22b-instruct-2507",
1295
- "qwen/qwen3-235b-a22b-thinking-2507",
1296
- "qwen/qwen3-coder-480b-a35b-instruct",
1297
- "zai-org/glm-4.5",
1298
- "zai-org/glm-4.5-air"
1615
+ "opencode": [
1616
+ "an-gbt",
1617
+ "big-pickle",
1618
+ "claude-3-5-haiku",
1619
+ "claude-haiku-4-5",
1620
+ "claude-opus-4-1",
1621
+ "claude-sonnet-4",
1622
+ "claude-sonnet-4-5",
1623
+ "code-supernova",
1624
+ "glm-4.6",
1625
+ "gpt-5",
1626
+ "gpt-5-codex",
1627
+ "grok-code",
1628
+ "kimi-k2",
1629
+ "qwen3-coder"
1299
1630
  ],
1300
1631
  "fastrouter": [
1301
1632
  "anthropic/claude-opus-4.1",
@@ -1313,22 +1644,75 @@
1313
1644
  "qwen/qwen3-coder",
1314
1645
  "x-ai/grok-4"
1315
1646
  ],
1316
- "perplexity": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1317
- "morph": ["auto", "morph-v3-fast", "morph-v3-large"],
1318
- "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1319
- "huggingface": [
1647
+ "google": [
1648
+ "gemini-1.5-flash",
1649
+ "gemini-1.5-flash-8b",
1650
+ "gemini-1.5-pro",
1651
+ "gemini-2.0-flash",
1652
+ "gemini-2.0-flash-lite",
1653
+ "gemini-2.5-flash",
1654
+ "gemini-2.5-flash-image",
1655
+ "gemini-2.5-flash-image-preview",
1656
+ "gemini-2.5-flash-lite",
1657
+ "gemini-2.5-flash-lite-preview-06-17",
1658
+ "gemini-2.5-flash-lite-preview-09-2025",
1659
+ "gemini-2.5-flash-preview-04-17",
1660
+ "gemini-2.5-flash-preview-05-20",
1661
+ "gemini-2.5-flash-preview-09-2025",
1662
+ "gemini-2.5-flash-preview-tts",
1663
+ "gemini-2.5-pro",
1664
+ "gemini-2.5-pro-preview-05-06",
1665
+ "gemini-2.5-pro-preview-06-05",
1666
+ "gemini-2.5-pro-preview-tts",
1667
+ "gemini-flash-latest",
1668
+ "gemini-flash-lite-latest",
1669
+ "gemini-live-2.5-flash",
1670
+ "gemini-live-2.5-flash-preview-native-audio"
1671
+ ],
1672
+ "inception": ["mercury", "mercury-coder"],
1673
+ "wandb": [
1674
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1320
1675
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1321
1676
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1322
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1323
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1324
1677
  "deepseek-ai/DeepSeek-R1-0528",
1325
- "deepseek-ai/Deepseek-V3-0324",
1326
- "moonshotai/Kimi-K2-Instruct",
1327
- "moonshotai/Kimi-K2-Instruct-0905",
1328
- "zai-org/GLM-4.5",
1329
- "zai-org/GLM-4.5-Air",
1330
- "zai-org/GLM-4.6"
1678
+ "deepseek-ai/DeepSeek-V3-0324",
1679
+ "meta-llama/Llama-3.1-8B-Instruct",
1680
+ "meta-llama/Llama-3.3-70B-Instruct",
1681
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1682
+ "microsoft/Phi-4-mini-instruct",
1683
+ "moonshotai/Kimi-K2-Instruct"
1684
+ ],
1685
+ "openai": [
1686
+ "codex-mini-latest",
1687
+ "gpt-3.5-turbo",
1688
+ "gpt-4",
1689
+ "gpt-4-turbo",
1690
+ "gpt-4.1",
1691
+ "gpt-4.1-mini",
1692
+ "gpt-4.1-nano",
1693
+ "gpt-4o",
1694
+ "gpt-4o-2024-05-13",
1695
+ "gpt-4o-2024-08-06",
1696
+ "gpt-4o-2024-11-20",
1697
+ "gpt-4o-mini",
1698
+ "gpt-5",
1699
+ "gpt-5-chat-latest",
1700
+ "gpt-5-codex",
1701
+ "gpt-5-mini",
1702
+ "gpt-5-nano",
1703
+ "o1",
1704
+ "o1-mini",
1705
+ "o1-preview",
1706
+ "o1-pro",
1707
+ "o3",
1708
+ "o3-deep-research",
1709
+ "o3-mini",
1710
+ "o3-pro",
1711
+ "o4-mini",
1712
+ "o4-mini-deep-research"
1331
1713
  ],
1714
+ "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1715
+ "perplexity": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1332
1716
  "openrouter": [
1333
1717
  "anthropic/claude-3.5-haiku",
1334
1718
  "anthropic/claude-3.7-sonnet",
@@ -1373,192 +1757,73 @@
1373
1757
  "mistralai/devstral-small-2505:free",
1374
1758
  "mistralai/devstral-small-2507",
1375
1759
  "mistralai/mistral-7b-instruct:free",
1376
- "mistralai/mistral-medium-3",
1377
- "mistralai/mistral-medium-3.1",
1378
- "mistralai/mistral-nemo:free",
1379
- "mistralai/mistral-small-3.1-24b-instruct",
1380
- "mistralai/mistral-small-3.2-24b-instruct",
1381
- "mistralai/mistral-small-3.2-24b-instruct:free",
1382
- "moonshotai/kimi-dev-72b:free",
1383
- "moonshotai/kimi-k2",
1384
- "moonshotai/kimi-k2-0905",
1385
- "moonshotai/kimi-k2:free",
1386
- "nousresearch/deephermes-3-llama-3-8b-preview",
1387
- "nousresearch/hermes-4-405b",
1388
- "nousresearch/hermes-4-70b",
1389
- "openai/gpt-4.1",
1390
- "openai/gpt-4.1-mini",
1391
- "openai/gpt-4o-mini",
1392
- "openai/gpt-5",
1393
- "openai/gpt-5-chat",
1394
- "openai/gpt-5-codex",
1395
- "openai/gpt-5-image",
1396
- "openai/gpt-5-mini",
1397
- "openai/gpt-5-nano",
1398
- "openai/gpt-oss-120b",
1399
- "openai/gpt-oss-20b",
1400
- "openai/o4-mini",
1401
- "openrouter/cypher-alpha:free",
1402
- "openrouter/horizon-alpha",
1403
- "openrouter/horizon-beta",
1404
- "openrouter/sonoma-dusk-alpha",
1405
- "openrouter/sonoma-sky-alpha",
1406
- "qwen/qwen-2.5-coder-32b-instruct",
1407
- "qwen/qwen2.5-vl-32b-instruct:free",
1408
- "qwen/qwen2.5-vl-72b-instruct",
1409
- "qwen/qwen2.5-vl-72b-instruct:free",
1410
- "qwen/qwen3-14b:free",
1411
- "qwen/qwen3-235b-a22b-07-25",
1412
- "qwen/qwen3-235b-a22b-07-25:free",
1413
- "qwen/qwen3-235b-a22b-thinking-2507",
1414
- "qwen/qwen3-235b-a22b:free",
1415
- "qwen/qwen3-30b-a3b-instruct-2507",
1416
- "qwen/qwen3-30b-a3b-thinking-2507",
1417
- "qwen/qwen3-30b-a3b:free",
1418
- "qwen/qwen3-32b:free",
1419
- "qwen/qwen3-8b:free",
1420
- "qwen/qwen3-coder",
1421
- "qwen/qwen3-coder:free",
1422
- "qwen/qwen3-max",
1423
- "qwen/qwen3-next-80b-a3b-instruct",
1424
- "qwen/qwen3-next-80b-a3b-thinking",
1425
- "qwen/qwq-32b:free",
1426
- "rekaai/reka-flash-3",
1427
- "sarvamai/sarvam-m:free",
1428
- "thudm/glm-z1-32b:free",
1429
- "tngtech/deepseek-r1t2-chimera:free",
1430
- "x-ai/grok-3",
1431
- "x-ai/grok-3-beta",
1432
- "x-ai/grok-3-mini",
1433
- "x-ai/grok-3-mini-beta",
1434
- "x-ai/grok-4",
1435
- "x-ai/grok-4-fast",
1436
- "x-ai/grok-4-fast:free",
1437
- "x-ai/grok-code-fast-1",
1438
- "z-ai/glm-4.5",
1439
- "z-ai/glm-4.5-air",
1440
- "z-ai/glm-4.5-air:free",
1441
- "z-ai/glm-4.5v",
1442
- "z-ai/glm-4.6"
1443
- ],
1444
- "cerebras": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1445
- "zhipuai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1446
- "togetherai": [
1447
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1448
- "deepseek-ai/DeepSeek-R1",
1449
- "deepseek-ai/DeepSeek-V3",
1450
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1451
- "moonshotai/Kimi-K2-Instruct",
1452
- "openai/gpt-oss-120b"
1453
- ],
1454
- "wandb": [
1455
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1456
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1457
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1458
- "deepseek-ai/DeepSeek-R1-0528",
1459
- "deepseek-ai/DeepSeek-V3-0324",
1460
- "meta-llama/Llama-3.1-8B-Instruct",
1461
- "meta-llama/Llama-3.3-70B-Instruct",
1462
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1463
- "microsoft/Phi-4-mini-instruct",
1464
- "moonshotai/Kimi-K2-Instruct"
1465
- ],
1466
- "submodel": [
1467
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1468
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1469
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1470
- "deepseek-ai/DeepSeek-R1-0528",
1471
- "deepseek-ai/DeepSeek-V3-0324",
1472
- "deepseek-ai/DeepSeek-V3.1",
1473
- "openai/gpt-oss-120b",
1474
- "zai-org/GLM-4.5-Air",
1475
- "zai-org/GLM-4.5-FP8"
1476
- ],
1477
- "vercel": [
1478
- "alibaba/qwen3-coder-plus",
1479
- "alibaba/qwen3-max",
1480
- "alibaba/qwen3-next-80b-a3b-instruct",
1481
- "alibaba/qwen3-next-80b-a3b-thinking",
1482
- "alibaba/qwen3-vl-instruct",
1483
- "alibaba/qwen3-vl-thinking",
1484
- "amazon/nova-lite",
1485
- "amazon/nova-micro",
1486
- "amazon/nova-pro",
1487
- "anthropic/claude-3-5-haiku",
1488
- "anthropic/claude-3-haiku",
1489
- "anthropic/claude-3-opus",
1490
- "anthropic/claude-3.5-sonnet",
1491
- "anthropic/claude-3.7-sonnet",
1492
- "anthropic/claude-4-1-opus",
1493
- "anthropic/claude-4-opus",
1494
- "anthropic/claude-4-sonnet",
1495
- "anthropic/claude-4.5-sonnet",
1496
- "anthropic/claude-haiku-4.5",
1497
- "cerebras/qwen3-coder",
1498
- "deepseek/deepseek-r1",
1499
- "deepseek/deepseek-r1-distill-llama-70b",
1500
- "deepseek/deepseek-v3.1-terminus",
1501
- "deepseek/deepseek-v3.2-exp",
1502
- "deepseek/deepseek-v3.2-exp-thinking",
1503
- "google/gemini-2.0-flash",
1504
- "google/gemini-2.0-flash-lite",
1505
- "google/gemini-2.5-flash",
1506
- "google/gemini-2.5-flash-lite",
1507
- "google/gemini-2.5-flash-lite-preview-09-2025",
1508
- "google/gemini-2.5-flash-preview-09-2025",
1509
- "google/gemini-2.5-pro",
1510
- "meta/llama-3.3-70b",
1511
- "meta/llama-4-maverick",
1512
- "meta/llama-4-scout",
1513
- "mistral/codestral",
1514
- "mistral/magistral-medium",
1515
- "mistral/magistral-small",
1516
- "mistral/ministral-3b",
1517
- "mistral/ministral-8b",
1518
- "mistral/mistral-large",
1519
- "mistral/mistral-small",
1520
- "mistral/mixtral-8x22b-instruct",
1521
- "mistral/pixtral-12b",
1522
- "mistral/pixtral-large",
1760
+ "mistralai/mistral-medium-3",
1761
+ "mistralai/mistral-medium-3.1",
1762
+ "mistralai/mistral-nemo:free",
1763
+ "mistralai/mistral-small-3.1-24b-instruct",
1764
+ "mistralai/mistral-small-3.2-24b-instruct",
1765
+ "mistralai/mistral-small-3.2-24b-instruct:free",
1766
+ "moonshotai/kimi-dev-72b:free",
1523
1767
  "moonshotai/kimi-k2",
1524
- "morph/morph-v3-fast",
1525
- "morph/morph-v3-large",
1526
- "openai/gpt-4-turbo",
1768
+ "moonshotai/kimi-k2-0905",
1769
+ "moonshotai/kimi-k2:free",
1770
+ "nousresearch/deephermes-3-llama-3-8b-preview",
1771
+ "nousresearch/hermes-4-405b",
1772
+ "nousresearch/hermes-4-70b",
1527
1773
  "openai/gpt-4.1",
1528
1774
  "openai/gpt-4.1-mini",
1529
- "openai/gpt-4.1-nano",
1530
- "openai/gpt-4o",
1531
1775
  "openai/gpt-4o-mini",
1532
1776
  "openai/gpt-5",
1777
+ "openai/gpt-5-chat",
1533
1778
  "openai/gpt-5-codex",
1779
+ "openai/gpt-5-image",
1534
1780
  "openai/gpt-5-mini",
1535
1781
  "openai/gpt-5-nano",
1536
1782
  "openai/gpt-oss-120b",
1537
1783
  "openai/gpt-oss-20b",
1538
- "openai/o1",
1539
- "openai/o3",
1540
- "openai/o3-mini",
1541
1784
  "openai/o4-mini",
1542
- "perplexity/sonar",
1543
- "perplexity/sonar-pro",
1544
- "perplexity/sonar-reasoning",
1545
- "perplexity/sonar-reasoning-pro",
1546
- "vercel/v0-1.0-md",
1547
- "vercel/v0-1.5-md",
1548
- "xai/grok-2",
1549
- "xai/grok-2-vision",
1550
- "xai/grok-3",
1551
- "xai/grok-3-fast",
1552
- "xai/grok-3-mini",
1553
- "xai/grok-3-mini-fast",
1554
- "xai/grok-4",
1555
- "xai/grok-4-fast",
1556
- "xai/grok-4-fast-non-reasoning",
1557
- "xai/grok-code-fast-1",
1558
- "zai/glm-4.5",
1559
- "zai/glm-4.5-air",
1560
- "zai/glm-4.5v",
1561
- "zai/glm-4.6"
1785
+ "openrouter/cypher-alpha:free",
1786
+ "openrouter/horizon-alpha",
1787
+ "openrouter/horizon-beta",
1788
+ "openrouter/sonoma-dusk-alpha",
1789
+ "openrouter/sonoma-sky-alpha",
1790
+ "qwen/qwen-2.5-coder-32b-instruct",
1791
+ "qwen/qwen2.5-vl-32b-instruct:free",
1792
+ "qwen/qwen2.5-vl-72b-instruct",
1793
+ "qwen/qwen2.5-vl-72b-instruct:free",
1794
+ "qwen/qwen3-14b:free",
1795
+ "qwen/qwen3-235b-a22b-07-25",
1796
+ "qwen/qwen3-235b-a22b-07-25:free",
1797
+ "qwen/qwen3-235b-a22b-thinking-2507",
1798
+ "qwen/qwen3-235b-a22b:free",
1799
+ "qwen/qwen3-30b-a3b-instruct-2507",
1800
+ "qwen/qwen3-30b-a3b-thinking-2507",
1801
+ "qwen/qwen3-30b-a3b:free",
1802
+ "qwen/qwen3-32b:free",
1803
+ "qwen/qwen3-8b:free",
1804
+ "qwen/qwen3-coder",
1805
+ "qwen/qwen3-coder:free",
1806
+ "qwen/qwen3-max",
1807
+ "qwen/qwen3-next-80b-a3b-instruct",
1808
+ "qwen/qwen3-next-80b-a3b-thinking",
1809
+ "qwen/qwq-32b:free",
1810
+ "rekaai/reka-flash-3",
1811
+ "sarvamai/sarvam-m:free",
1812
+ "thudm/glm-z1-32b:free",
1813
+ "tngtech/deepseek-r1t2-chimera:free",
1814
+ "x-ai/grok-3",
1815
+ "x-ai/grok-3-beta",
1816
+ "x-ai/grok-3-mini",
1817
+ "x-ai/grok-3-mini-beta",
1818
+ "x-ai/grok-4",
1819
+ "x-ai/grok-4-fast",
1820
+ "x-ai/grok-4-fast:free",
1821
+ "x-ai/grok-code-fast-1",
1822
+ "z-ai/glm-4.5",
1823
+ "z-ai/glm-4.5-air",
1824
+ "z-ai/glm-4.5-air:free",
1825
+ "z-ai/glm-4.5v",
1826
+ "z-ai/glm-4.6"
1562
1827
  ],
1563
1828
  "synthetic": [
1564
1829
  "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
@@ -1583,184 +1848,53 @@
1583
1848
  "hf:zai-org/GLM-4.5",
1584
1849
  "hf:zai-org/GLM-4.6"
1585
1850
  ],
1586
- "google": [
1587
- "gemini-1.5-flash",
1588
- "gemini-1.5-flash-8b",
1589
- "gemini-1.5-pro",
1590
- "gemini-2.0-flash",
1591
- "gemini-2.0-flash-lite",
1592
- "gemini-2.5-flash",
1593
- "gemini-2.5-flash-image",
1594
- "gemini-2.5-flash-image-preview",
1595
- "gemini-2.5-flash-lite",
1596
- "gemini-2.5-flash-lite-preview-06-17",
1597
- "gemini-2.5-flash-lite-preview-09-2025",
1598
- "gemini-2.5-flash-preview-04-17",
1599
- "gemini-2.5-flash-preview-05-20",
1600
- "gemini-2.5-flash-preview-09-2025",
1601
- "gemini-2.5-flash-preview-tts",
1602
- "gemini-2.5-pro",
1603
- "gemini-2.5-pro-preview-05-06",
1604
- "gemini-2.5-pro-preview-06-05",
1605
- "gemini-2.5-pro-preview-tts",
1606
- "gemini-flash-latest",
1607
- "gemini-flash-lite-latest",
1608
- "gemini-live-2.5-flash",
1609
- "gemini-live-2.5-flash-preview-native-audio"
1610
- ],
1611
- "groq": [
1612
- "deepseek-r1-distill-llama-70b",
1613
- "gemma2-9b-it",
1614
- "llama-3.1-8b-instant",
1615
- "llama-3.3-70b-versatile",
1616
- "llama-guard-3-8b",
1617
- "llama3-70b-8192",
1618
- "llama3-8b-8192",
1619
- "meta-llama/llama-4-maverick-17b-128e-instruct",
1620
- "meta-llama/llama-4-scout-17b-16e-instruct",
1621
- "meta-llama/llama-guard-4-12b",
1622
- "mistral-saba-24b",
1623
- "moonshotai/kimi-k2-instruct",
1624
- "moonshotai/kimi-k2-instruct-0905",
1625
- "openai/gpt-oss-120b",
1626
- "openai/gpt-oss-20b",
1627
- "qwen-qwq-32b",
1628
- "qwen/qwen3-32b"
1629
- ],
1630
- "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1631
- "github-models": [
1632
- "ai21-labs/ai21-jamba-1.5-large",
1633
- "ai21-labs/ai21-jamba-1.5-mini",
1634
- "cohere/cohere-command-a",
1635
- "cohere/cohere-command-r",
1636
- "cohere/cohere-command-r-08-2024",
1637
- "cohere/cohere-command-r-plus",
1638
- "cohere/cohere-command-r-plus-08-2024",
1639
- "core42/jais-30b-chat",
1640
- "deepseek/deepseek-r1",
1641
- "deepseek/deepseek-r1-0528",
1642
- "deepseek/deepseek-v3-0324",
1643
- "meta/llama-3.2-11b-vision-instruct",
1644
- "meta/llama-3.2-90b-vision-instruct",
1645
- "meta/llama-3.3-70b-instruct",
1646
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
1647
- "meta/llama-4-scout-17b-16e-instruct",
1648
- "meta/meta-llama-3-70b-instruct",
1649
- "meta/meta-llama-3-8b-instruct",
1650
- "meta/meta-llama-3.1-405b-instruct",
1651
- "meta/meta-llama-3.1-70b-instruct",
1652
- "meta/meta-llama-3.1-8b-instruct",
1653
- "microsoft/mai-ds-r1",
1654
- "microsoft/phi-3-medium-128k-instruct",
1655
- "microsoft/phi-3-medium-4k-instruct",
1656
- "microsoft/phi-3-mini-128k-instruct",
1657
- "microsoft/phi-3-mini-4k-instruct",
1658
- "microsoft/phi-3-small-128k-instruct",
1659
- "microsoft/phi-3-small-8k-instruct",
1660
- "microsoft/phi-3.5-mini-instruct",
1661
- "microsoft/phi-3.5-moe-instruct",
1662
- "microsoft/phi-3.5-vision-instruct",
1663
- "microsoft/phi-4",
1664
- "microsoft/phi-4-mini-instruct",
1665
- "microsoft/phi-4-mini-reasoning",
1666
- "microsoft/phi-4-multimodal-instruct",
1667
- "microsoft/phi-4-reasoning",
1668
- "mistral-ai/codestral-2501",
1669
- "mistral-ai/ministral-3b",
1670
- "mistral-ai/mistral-large-2411",
1671
- "mistral-ai/mistral-medium-2505",
1672
- "mistral-ai/mistral-nemo",
1673
- "mistral-ai/mistral-small-2503",
1674
- "openai/gpt-4.1",
1675
- "openai/gpt-4.1-mini",
1676
- "openai/gpt-4.1-nano",
1677
- "openai/gpt-4o",
1678
- "openai/gpt-4o-mini",
1679
- "openai/o1",
1680
- "openai/o1-mini",
1681
- "openai/o1-preview",
1682
- "openai/o3",
1683
- "openai/o3-mini",
1684
- "openai/o4-mini",
1685
- "xai/grok-3",
1686
- "xai/grok-3-mini"
1687
- ],
1688
1851
  "deepinfra": [
1689
1852
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1690
1853
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1691
1854
  "moonshotai/Kimi-K2-Instruct",
1692
1855
  "zai-org/GLM-4.5"
1693
1856
  ],
1694
- "fireworks-ai": [
1695
- "accounts/fireworks/models/deepseek-r1-0528",
1696
- "accounts/fireworks/models/deepseek-v3-0324",
1697
- "accounts/fireworks/models/deepseek-v3p1",
1698
- "accounts/fireworks/models/glm-4p5",
1699
- "accounts/fireworks/models/glm-4p5-air",
1700
- "accounts/fireworks/models/gpt-oss-120b",
1701
- "accounts/fireworks/models/gpt-oss-20b",
1702
- "accounts/fireworks/models/kimi-k2-instruct",
1703
- "accounts/fireworks/models/qwen3-235b-a22b",
1704
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1857
+ "zhipuai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1858
+ "submodel": [
1859
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1860
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1861
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1862
+ "deepseek-ai/DeepSeek-R1-0528",
1863
+ "deepseek-ai/DeepSeek-V3-0324",
1864
+ "deepseek-ai/DeepSeek-V3.1",
1865
+ "openai/gpt-oss-120b",
1866
+ "zai-org/GLM-4.5-Air",
1867
+ "zai-org/GLM-4.5-FP8"
1705
1868
  ],
1706
1869
  "zai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1707
- "opencode": [
1708
- "an-gbt",
1709
- "big-pickle",
1710
- "claude-3-5-haiku",
1711
- "claude-haiku-4-5",
1712
- "claude-opus-4-1",
1713
- "claude-sonnet-4",
1714
- "claude-sonnet-4-5",
1715
- "code-supernova",
1716
- "glm-4.6",
1717
- "gpt-5",
1718
- "gpt-5-codex",
1719
- "grok-code",
1720
- "kimi-k2",
1721
- "qwen3-coder"
1870
+ "inference": [
1871
+ "google/gemma-3",
1872
+ "meta/llama-3.1-8b-instruct",
1873
+ "meta/llama-3.2-11b-vision-instruct",
1874
+ "meta/llama-3.2-1b-instruct",
1875
+ "meta/llama-3.2-3b-instruct",
1876
+ "mistral/mistral-nemo-12b-instruct",
1877
+ "osmosis/osmosis-structure-0.6b",
1878
+ "qwen/qwen-2.5-7b-vision-instruct",
1879
+ "qwen/qwen3-embedding-4b"
1722
1880
  ],
1723
- "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1724
- "inception": ["mercury", "mercury-coder"],
1725
- "llama": [
1726
- "cerebras-llama-4-maverick-17b-128e-instruct",
1727
- "cerebras-llama-4-scout-17b-16e-instruct",
1728
- "groq-llama-4-maverick-17b-128e-instruct",
1729
- "llama-3.3-70b-instruct",
1730
- "llama-3.3-8b-instruct",
1731
- "llama-4-maverick-17b-128e-instruct-fp8",
1732
- "llama-4-scout-17b-16e-instruct-fp8"
1881
+ "requesty": [
1882
+ "anthropic/claude-3-7-sonnet",
1883
+ "anthropic/claude-4-sonnet-20250522",
1884
+ "anthropic/claude-opus-4",
1885
+ "anthropic/claude-opus-4-1-20250805",
1886
+ "google/gemini-2.5-flash",
1887
+ "google/gemini-2.5-pro",
1888
+ "openai/gpt-4.1",
1889
+ "openai/gpt-4.1-mini",
1890
+ "openai/gpt-4o-mini",
1891
+ "openai/gpt-5",
1892
+ "openai/gpt-5-mini",
1893
+ "openai/gpt-5-nano",
1894
+ "openai/o4-mini"
1733
1895
  ],
1896
+ "morph": ["auto", "morph-v3-fast", "morph-v3-large"],
1734
1897
  "lmstudio": ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1735
- "openai": [
1736
- "codex-mini-latest",
1737
- "gpt-3.5-turbo",
1738
- "gpt-4",
1739
- "gpt-4-turbo",
1740
- "gpt-4.1",
1741
- "gpt-4.1-mini",
1742
- "gpt-4.1-nano",
1743
- "gpt-4o",
1744
- "gpt-4o-2024-05-13",
1745
- "gpt-4o-2024-08-06",
1746
- "gpt-4o-2024-11-20",
1747
- "gpt-4o-mini",
1748
- "gpt-5",
1749
- "gpt-5-chat-latest",
1750
- "gpt-5-codex",
1751
- "gpt-5-mini",
1752
- "gpt-5-nano",
1753
- "o1",
1754
- "o1-mini",
1755
- "o1-preview",
1756
- "o1-pro",
1757
- "o3",
1758
- "o3-deep-research",
1759
- "o3-mini",
1760
- "o3-pro",
1761
- "o4-mini",
1762
- "o4-mini-deep-research"
1763
- ],
1764
1898
  "anthropic": [
1765
1899
  "claude-3-5-haiku-20241022",
1766
1900
  "claude-3-5-haiku-latest",
@@ -1782,208 +1916,50 @@
1782
1916
  "claude-sonnet-4-5",
1783
1917
  "claude-sonnet-4-5-20250929"
1784
1918
  ],
1785
- "moonshotai": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1786
- "inference": [
1787
- "google/gemma-3",
1788
- "meta/llama-3.1-8b-instruct",
1789
- "meta/llama-3.2-11b-vision-instruct",
1790
- "meta/llama-3.2-1b-instruct",
1791
- "meta/llama-3.2-3b-instruct",
1792
- "mistral/mistral-nemo-12b-instruct",
1793
- "osmosis/osmosis-structure-0.6b",
1794
- "qwen/qwen-2.5-7b-vision-instruct",
1795
- "qwen/qwen3-embedding-4b"
1796
- ],
1797
- "baseten": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1798
- "cortecs": [
1799
- "claude-4-5-sonnet",
1800
- "claude-sonnet-4",
1801
- "deepseek-v3-0324",
1802
- "gemini-2.5-pro",
1803
- "gpt-4.1",
1804
- "gpt-oss-120b",
1805
- "kimi-k2-instruct",
1806
- "llama-3.1-405b-instruct",
1807
- "nova-pro-v1",
1808
- "qwen3-32b",
1809
- "qwen3-coder-480b-a35b-instruct"
1810
- ],
1811
- "mistral": [
1812
- "codestral-latest",
1813
- "devstral-medium-2507",
1814
- "devstral-small-2505",
1815
- "devstral-small-2507",
1816
- "magistral-medium-latest",
1817
- "magistral-small",
1818
- "ministral-3b-latest",
1819
- "ministral-8b-latest",
1820
- "mistral-large-latest",
1821
- "mistral-medium-2505",
1822
- "mistral-medium-2508",
1823
- "mistral-medium-latest",
1824
- "mistral-nemo",
1825
- "mistral-small-latest",
1826
- "open-mistral-7b",
1827
- "open-mixtral-8x22b",
1828
- "open-mixtral-8x7b",
1829
- "pixtral-12b",
1830
- "pixtral-large-latest"
1831
- ],
1832
- "venice": [
1833
- "deepseek-coder-v2-lite",
1834
- "deepseek-r1-671b",
1835
- "dolphin-2.9.2-qwen2-72b",
1836
- "llama-3.1-405b",
1837
- "llama-3.2-3b",
1838
- "llama-3.3-70b",
1839
- "mistral-31-24b",
1840
- "qwen-2.5-coder-32b",
1841
- "qwen-2.5-qwq-32b",
1842
- "qwen-2.5-vl",
1843
- "qwen3-235b",
1844
- "qwen3-4b",
1845
- "venice-uncensored"
1846
- ],
1847
- "alibaba": [
1848
- "qvq-max",
1849
- "qwen-flash",
1850
- "qwen-max",
1851
- "qwen-mt-plus",
1852
- "qwen-mt-turbo",
1853
- "qwen-omni-turbo",
1854
- "qwen-omni-turbo-realtime",
1855
- "qwen-plus",
1856
- "qwen-plus-character-ja",
1857
- "qwen-turbo",
1858
- "qwen-vl-max",
1859
- "qwen-vl-ocr",
1860
- "qwen-vl-plus",
1861
- "qwen2-5-14b-instruct",
1862
- "qwen2-5-32b-instruct",
1863
- "qwen2-5-72b-instruct",
1864
- "qwen2-5-7b-instruct",
1865
- "qwen2-5-omni-7b",
1866
- "qwen2-5-vl-72b-instruct",
1867
- "qwen2-5-vl-7b-instruct",
1868
- "qwen3-14b",
1869
- "qwen3-235b-a22b",
1870
- "qwen3-32b",
1871
- "qwen3-8b",
1872
- "qwen3-asr-flash",
1873
- "qwen3-coder-30b-a3b-instruct",
1874
- "qwen3-coder-480b-a35b-instruct",
1875
- "qwen3-coder-flash",
1876
- "qwen3-coder-plus",
1877
- "qwen3-livetranslate-flash-realtime",
1878
- "qwen3-max",
1879
- "qwen3-next-80b-a3b-instruct",
1880
- "qwen3-next-80b-a3b-thinking",
1881
- "qwen3-omni-flash",
1882
- "qwen3-omni-flash-realtime",
1883
- "qwen3-vl-235b-a22b",
1884
- "qwen3-vl-30b-a3b",
1885
- "qwen3-vl-plus",
1886
- "qwq-plus"
1887
- ],
1888
- "alibaba-cn": [
1889
- "deepseek-r1",
1890
- "deepseek-r1-0528",
1891
- "deepseek-r1-distill-llama-70b",
1892
- "deepseek-r1-distill-llama-8b",
1893
- "deepseek-r1-distill-qwen-1-5b",
1894
- "deepseek-r1-distill-qwen-14b",
1895
- "deepseek-r1-distill-qwen-32b",
1896
- "deepseek-r1-distill-qwen-7b",
1897
- "deepseek-v3",
1898
- "deepseek-v3-1",
1899
- "deepseek-v3-2-exp",
1900
- "moonshot-kimi-k2-instruct",
1901
- "qvq-max",
1902
- "qwen-deep-research",
1903
- "qwen-doc-turbo",
1904
- "qwen-flash",
1905
- "qwen-long",
1906
- "qwen-math-plus",
1907
- "qwen-math-turbo",
1908
- "qwen-max",
1909
- "qwen-mt-plus",
1910
- "qwen-mt-turbo",
1911
- "qwen-omni-turbo",
1912
- "qwen-omni-turbo-realtime",
1913
- "qwen-plus",
1914
- "qwen-plus-character",
1915
- "qwen-turbo",
1916
- "qwen-vl-max",
1917
- "qwen-vl-ocr",
1918
- "qwen-vl-plus",
1919
- "qwen2-5-14b-instruct",
1920
- "qwen2-5-32b-instruct",
1921
- "qwen2-5-72b-instruct",
1922
- "qwen2-5-7b-instruct",
1923
- "qwen2-5-coder-32b-instruct",
1924
- "qwen2-5-coder-7b-instruct",
1925
- "qwen2-5-math-72b-instruct",
1926
- "qwen2-5-math-7b-instruct",
1927
- "qwen2-5-omni-7b",
1928
- "qwen2-5-vl-72b-instruct",
1929
- "qwen2-5-vl-7b-instruct",
1930
- "qwen3-14b",
1931
- "qwen3-235b-a22b",
1932
- "qwen3-32b",
1933
- "qwen3-8b",
1934
- "qwen3-asr-flash",
1935
- "qwen3-coder-30b-a3b-instruct",
1936
- "qwen3-coder-480b-a35b-instruct",
1937
- "qwen3-coder-flash",
1938
- "qwen3-coder-plus",
1939
- "qwen3-max",
1940
- "qwen3-next-80b-a3b-instruct",
1941
- "qwen3-next-80b-a3b-thinking",
1942
- "qwen3-omni-flash",
1943
- "qwen3-omni-flash-realtime",
1944
- "qwen3-vl-235b-a22b",
1945
- "qwen3-vl-30b-a3b",
1946
- "qwen3-vl-plus",
1947
- "qwq-32b",
1948
- "qwq-plus",
1949
- "tongyi-intent-detect-v3"
1919
+ "fireworks-ai": [
1920
+ "accounts/fireworks/models/deepseek-r1-0528",
1921
+ "accounts/fireworks/models/deepseek-v3-0324",
1922
+ "accounts/fireworks/models/deepseek-v3p1",
1923
+ "accounts/fireworks/models/glm-4p5",
1924
+ "accounts/fireworks/models/glm-4p5-air",
1925
+ "accounts/fireworks/models/gpt-oss-120b",
1926
+ "accounts/fireworks/models/gpt-oss-20b",
1927
+ "accounts/fireworks/models/kimi-k2-instruct",
1928
+ "accounts/fireworks/models/qwen3-235b-a22b",
1929
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1950
1930
  ],
1951
- "chutes": [
1931
+ "modelscope": [
1952
1932
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1953
1933
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1954
- "Qwen/Qwen3-30B-A3B",
1955
1934
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1956
1935
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1957
1936
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1958
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1959
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1960
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1961
- "chutesai/Devstral-Small-2505",
1962
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1963
- "deepseek-ai/DeepSeek-R1-0528",
1964
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1965
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1966
- "deepseek-ai/DeepSeek-V3-0324",
1967
- "deepseek-ai/DeepSeek-V3.1",
1968
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1969
- "deepseek-ai/DeepSeek-V3.1-turbo",
1970
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1971
- "deepseek-ai/DeepSeek-V3.2-Exp",
1972
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1973
- "moonshotai/Kimi-Dev-72B",
1974
- "moonshotai/Kimi-K2-Instruct-0905",
1975
- "moonshotai/Kimi-K2-Instruct-75k",
1976
- "moonshotai/Kimi-VL-A3B-Thinking",
1977
- "openai/gpt-oss-120b",
1978
- "tngtech/DeepSeek-R1T-Chimera",
1979
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1980
- "zai-org/GLM-4.5-Air",
1981
- "zai-org/GLM-4.5-FP8",
1982
- "zai-org/GLM-4.5-turbo",
1983
- "zai-org/GLM-4.6-FP8",
1984
- "zai-org/GLM-4.6-turbo"
1937
+ "ZhipuAI/GLM-4.5",
1938
+ "ZhipuAI/GLM-4.6"
1985
1939
  ],
1986
- "upstage": ["solar-mini", "solar-pro2"],
1940
+ "llama": [
1941
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1942
+ "cerebras-llama-4-scout-17b-16e-instruct",
1943
+ "groq-llama-4-maverick-17b-128e-instruct",
1944
+ "llama-3.3-70b-instruct",
1945
+ "llama-3.3-8b-instruct",
1946
+ "llama-4-maverick-17b-128e-instruct-fp8",
1947
+ "llama-4-scout-17b-16e-instruct-fp8"
1948
+ ],
1949
+ "scaleway": [
1950
+ "deepseek-r1-distill-llama-70b",
1951
+ "gemma-3-27b-it",
1952
+ "gpt-oss-120b",
1953
+ "llama-3.1-8b-instruct",
1954
+ "llama-3.3-70b-instruct",
1955
+ "mistral-nemo-instruct-2407",
1956
+ "mistral-small-3.2-24b-instruct-2506",
1957
+ "pixtral-12b-2409",
1958
+ "qwen3-235b-a22b-instruct-2507",
1959
+ "qwen3-coder-30b-a3b-instruct",
1960
+ "voxtral-small-24b-2507"
1961
+ ],
1962
+ "cerebras": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1987
1963
  "netlify": [
1988
1964
  "anthropic/claude-3-5-haiku-20241022",
1989
1965
  "anthropic/claude-3-5-haiku-latest",