@mastra/core 0.21.1 → 0.21.2-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (212) hide show
  1. package/CHANGELOG.md +44 -0
  2. package/dist/agent/__tests__/mock-model.d.ts +6 -0
  3. package/dist/agent/__tests__/mock-model.d.ts.map +1 -0
  4. package/dist/agent/agent.d.ts +9 -4
  5. package/dist/agent/agent.d.ts.map +1 -1
  6. package/dist/agent/agent.types.d.ts +4 -3
  7. package/dist/agent/agent.types.d.ts.map +1 -1
  8. package/dist/agent/index.cjs +13 -13
  9. package/dist/agent/index.js +2 -2
  10. package/dist/agent/input-processor/index.cjs +6 -6
  11. package/dist/agent/input-processor/index.js +1 -1
  12. package/dist/agent/message-list/index.d.ts.map +1 -1
  13. package/dist/agent/message-list/utils/ai-v5/gemini-compatibility.d.ts +22 -0
  14. package/dist/agent/message-list/utils/ai-v5/gemini-compatibility.d.ts.map +1 -0
  15. package/dist/agent/types.d.ts +5 -0
  16. package/dist/agent/types.d.ts.map +1 -1
  17. package/dist/agent/utils.d.ts.map +1 -1
  18. package/dist/agent/workflows/prepare-stream/index.d.ts +7 -4
  19. package/dist/agent/workflows/prepare-stream/index.d.ts.map +1 -1
  20. package/dist/agent/workflows/prepare-stream/prepare-memory-step.d.ts +7 -4
  21. package/dist/agent/workflows/prepare-stream/prepare-memory-step.d.ts.map +1 -1
  22. package/dist/agent/workflows/prepare-stream/schema.d.ts +4 -4
  23. package/dist/agent/workflows/prepare-stream/stream-step.d.ts +3 -0
  24. package/dist/agent/workflows/prepare-stream/stream-step.d.ts.map +1 -1
  25. package/dist/ai-tracing/index.cjs +32 -32
  26. package/dist/ai-tracing/index.js +1 -1
  27. package/dist/{chunk-NHKXTGR6.js → chunk-4ZFVJA3A.js} +3 -3
  28. package/dist/{chunk-NHKXTGR6.js.map → chunk-4ZFVJA3A.js.map} +1 -1
  29. package/dist/{chunk-XVREJCOW.cjs → chunk-7P5FMQQK.cjs} +6 -6
  30. package/dist/{chunk-XVREJCOW.cjs.map → chunk-7P5FMQQK.cjs.map} +1 -1
  31. package/dist/{chunk-3V4O35FO.js → chunk-BLVB2IJK.js} +3 -3
  32. package/dist/{chunk-3V4O35FO.js.map → chunk-BLVB2IJK.js.map} +1 -1
  33. package/dist/{chunk-FESSBG5D.cjs → chunk-D3IOLHNB.cjs} +12 -12
  34. package/dist/{chunk-FESSBG5D.cjs.map → chunk-D3IOLHNB.cjs.map} +1 -1
  35. package/dist/{chunk-KAV4EP3T.cjs → chunk-EGNHIPGJ.cjs} +4 -4
  36. package/dist/{chunk-KAV4EP3T.cjs.map → chunk-EGNHIPGJ.cjs.map} +1 -1
  37. package/dist/{chunk-5NR2GY4U.js → chunk-GB5BIA4V.js} +5 -3
  38. package/dist/chunk-GB5BIA4V.js.map +1 -0
  39. package/dist/{chunk-J2OKI2L3.js → chunk-GKTRUHKB.js} +10 -5
  40. package/dist/chunk-GKTRUHKB.js.map +1 -0
  41. package/dist/{chunk-A3QHQYMC.js → chunk-HGNRQ3OG.js} +12 -2
  42. package/dist/chunk-HGNRQ3OG.js.map +1 -0
  43. package/dist/{chunk-MUAFIPD7.js → chunk-KLWDUSBX.js} +4 -4
  44. package/dist/{chunk-MUAFIPD7.js.map → chunk-KLWDUSBX.js.map} +1 -1
  45. package/dist/chunk-LJFJTTZQ.cjs +4 -0
  46. package/dist/chunk-LJFJTTZQ.cjs.map +1 -0
  47. package/dist/{chunk-T3PBU7JK.js → chunk-LMP5KMU3.js} +34 -45
  48. package/dist/chunk-LMP5KMU3.js.map +1 -0
  49. package/dist/{chunk-OXAN5SM7.cjs → chunk-LRSB62Z6.cjs} +12 -2
  50. package/dist/chunk-LRSB62Z6.cjs.map +1 -0
  51. package/dist/{chunk-3ORA5EFD.cjs → chunk-LZUSZT7R.cjs} +5 -3
  52. package/dist/chunk-LZUSZT7R.cjs.map +1 -0
  53. package/dist/{chunk-XHPBKALR.cjs → chunk-MVVMHOAC.cjs} +15 -12
  54. package/dist/chunk-MVVMHOAC.cjs.map +1 -0
  55. package/dist/{chunk-HBJVAMCS.js → chunk-N3ZSX5OS.js} +31 -32
  56. package/dist/chunk-N3ZSX5OS.js.map +1 -0
  57. package/dist/{chunk-HP7B2TQQ.js → chunk-NIESGYOH.js} +1654 -1469
  58. package/dist/chunk-NIESGYOH.js.map +1 -0
  59. package/dist/{chunk-F6BMIPYW.js → chunk-NL3P7IFI.js} +3 -3
  60. package/dist/{chunk-F6BMIPYW.js.map → chunk-NL3P7IFI.js.map} +1 -1
  61. package/dist/{chunk-U6CUPKV2.js → chunk-R35PINKN.js} +5 -5
  62. package/dist/{chunk-U6CUPKV2.js.map → chunk-R35PINKN.js.map} +1 -1
  63. package/dist/{chunk-W3DS6F6G.cjs → chunk-UN653TND.cjs} +4 -4
  64. package/dist/{chunk-W3DS6F6G.cjs.map → chunk-UN653TND.cjs.map} +1 -1
  65. package/dist/{chunk-44ODA6L3.cjs → chunk-URQI7RJ3.cjs} +4 -4
  66. package/dist/{chunk-44ODA6L3.cjs.map → chunk-URQI7RJ3.cjs.map} +1 -1
  67. package/dist/{chunk-APY2BE4K.cjs → chunk-URVM3Y4T.cjs} +35 -46
  68. package/dist/chunk-URVM3Y4T.cjs.map +1 -0
  69. package/dist/{chunk-AJK7QPSD.cjs → chunk-V5WDWSQ5.cjs} +11 -11
  70. package/dist/{chunk-AJK7QPSD.cjs.map → chunk-V5WDWSQ5.cjs.map} +1 -1
  71. package/dist/{chunk-FLXB6WXO.js → chunk-VQLW7LPO.js} +5 -3
  72. package/dist/chunk-VQLW7LPO.js.map +1 -0
  73. package/dist/{chunk-462DRETM.cjs → chunk-WI2YMBNG.cjs} +64 -66
  74. package/dist/chunk-WI2YMBNG.cjs.map +1 -0
  75. package/dist/{chunk-NUURZ3AY.js → chunk-XBJP7THY.js} +6 -3
  76. package/dist/chunk-XBJP7THY.js.map +1 -0
  77. package/dist/{chunk-5DZ4RYWL.js → chunk-XYNSPEJO.js} +3 -3
  78. package/dist/{chunk-5DZ4RYWL.js.map → chunk-XYNSPEJO.js.map} +1 -1
  79. package/dist/{chunk-OY6UJ3QL.cjs → chunk-YGL6E6PD.cjs} +5 -3
  80. package/dist/chunk-YGL6E6PD.cjs.map +1 -0
  81. package/dist/{chunk-BV6CD4IZ.cjs → chunk-YKVVW65D.cjs} +12 -7
  82. package/dist/chunk-YKVVW65D.cjs.map +1 -0
  83. package/dist/{chunk-DGQW5VRR.cjs → chunk-ZMPSVDDO.cjs} +1658 -1472
  84. package/dist/chunk-ZMPSVDDO.cjs.map +1 -0
  85. package/dist/chunk-ZV5CC35D.js +3 -0
  86. package/dist/chunk-ZV5CC35D.js.map +1 -0
  87. package/dist/index.cjs +50 -46
  88. package/dist/index.js +8 -8
  89. package/dist/llm/index.cjs +10 -6
  90. package/dist/llm/index.d.ts +1 -0
  91. package/dist/llm/index.d.ts.map +1 -1
  92. package/dist/llm/index.js +1 -1
  93. package/dist/llm/model/embedding-router.d.ts +50 -0
  94. package/dist/llm/model/embedding-router.d.ts.map +1 -0
  95. package/dist/llm/model/gateways/models-dev.d.ts.map +1 -1
  96. package/dist/llm/model/gateways/netlify.d.ts.map +1 -1
  97. package/dist/llm/model/index.d.ts +1 -0
  98. package/dist/llm/model/index.d.ts.map +1 -1
  99. package/dist/llm/model/model.loop.d.ts +1 -1
  100. package/dist/llm/model/model.loop.d.ts.map +1 -1
  101. package/dist/llm/model/provider-options.d.ts +42 -0
  102. package/dist/llm/model/provider-options.d.ts.map +1 -0
  103. package/dist/llm/model/provider-types.generated.d.ts +629 -590
  104. package/dist/llm/model/router.d.ts.map +1 -1
  105. package/dist/loop/index.cjs +2 -2
  106. package/dist/loop/index.js +1 -1
  107. package/dist/loop/network/index.d.ts +4 -1
  108. package/dist/loop/network/index.d.ts.map +1 -1
  109. package/dist/loop/test-utils/fullStream.d.ts.map +1 -1
  110. package/dist/loop/test-utils/generateText.d.ts.map +1 -1
  111. package/dist/loop/test-utils/options.d.ts.map +1 -1
  112. package/dist/loop/test-utils/resultObject.d.ts.map +1 -1
  113. package/dist/loop/test-utils/streamObject.d.ts.map +1 -1
  114. package/dist/loop/test-utils/telemetry.d.ts.map +1 -1
  115. package/dist/loop/test-utils/textStream.d.ts.map +1 -1
  116. package/dist/loop/test-utils/toUIMessageStream.d.ts.map +1 -1
  117. package/dist/loop/test-utils/tools.d.ts.map +1 -1
  118. package/dist/loop/test-utils/utils.d.ts +2 -0
  119. package/dist/loop/test-utils/utils.d.ts.map +1 -1
  120. package/dist/loop/workflows/agentic-execution/index.d.ts +42 -42
  121. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts +28 -28
  122. package/dist/loop/workflows/agentic-execution/llm-mapping-step.d.ts +14 -14
  123. package/dist/loop/workflows/agentic-loop/index.d.ts +42 -42
  124. package/dist/loop/workflows/schema.d.ts +14 -14
  125. package/dist/mastra/index.cjs +2 -2
  126. package/dist/mastra/index.js +1 -1
  127. package/dist/memory/index.cjs +4 -4
  128. package/dist/memory/index.js +1 -1
  129. package/dist/memory/memory.d.ts.map +1 -1
  130. package/dist/memory/types.d.ts +10 -1
  131. package/dist/memory/types.d.ts.map +1 -1
  132. package/dist/models-dev-4VGIWYS3.js +3 -0
  133. package/dist/{models-dev-3VEABUH4.js.map → models-dev-4VGIWYS3.js.map} +1 -1
  134. package/dist/models-dev-AXZASLL2.cjs +12 -0
  135. package/dist/{models-dev-L42ORGVT.cjs.map → models-dev-AXZASLL2.cjs.map} +1 -1
  136. package/dist/netlify-26MMY5X4.js +3 -0
  137. package/dist/{netlify-NYFKA6UB.js.map → netlify-26MMY5X4.js.map} +1 -1
  138. package/dist/netlify-F3MVGV4Y.cjs +12 -0
  139. package/dist/{netlify-3B6HDHRP.cjs.map → netlify-F3MVGV4Y.cjs.map} +1 -1
  140. package/dist/processors/index.cjs +11 -11
  141. package/dist/processors/index.js +1 -1
  142. package/dist/provider-registry.json +1542 -1464
  143. package/dist/relevance/index.cjs +4 -4
  144. package/dist/relevance/index.js +1 -1
  145. package/dist/scores/index.cjs +9 -9
  146. package/dist/scores/index.js +2 -2
  147. package/dist/scores/scoreTraces/index.cjs +8 -8
  148. package/dist/scores/scoreTraces/index.js +3 -3
  149. package/dist/storage/domains/workflows/inmemory.d.ts.map +1 -1
  150. package/dist/storage/index.cjs +5 -3
  151. package/dist/storage/index.cjs.map +1 -1
  152. package/dist/storage/index.js +3 -1
  153. package/dist/storage/index.js.map +1 -1
  154. package/dist/stream/aisdk/v5/execute.d.ts.map +1 -1
  155. package/dist/stream/aisdk/v5/output.d.ts +9 -10
  156. package/dist/stream/aisdk/v5/output.d.ts.map +1 -1
  157. package/dist/stream/base/output-format-handlers.d.ts +1 -2
  158. package/dist/stream/base/output-format-handlers.d.ts.map +1 -1
  159. package/dist/stream/base/output.d.ts.map +1 -1
  160. package/dist/stream/index.cjs +10 -10
  161. package/dist/stream/index.d.ts +1 -1
  162. package/dist/stream/index.d.ts.map +1 -1
  163. package/dist/stream/index.js +2 -2
  164. package/dist/stream/types.d.ts +17 -1
  165. package/dist/stream/types.d.ts.map +1 -1
  166. package/dist/test-utils/llm-mock.cjs +2 -2
  167. package/dist/test-utils/llm-mock.js +1 -1
  168. package/dist/tools/index.cjs +2 -2
  169. package/dist/tools/index.js +1 -1
  170. package/dist/tools/stream.d.ts +7 -0
  171. package/dist/tools/stream.d.ts.map +1 -1
  172. package/dist/utils.cjs +17 -17
  173. package/dist/utils.js +1 -1
  174. package/dist/workflows/default.d.ts +1 -0
  175. package/dist/workflows/default.d.ts.map +1 -1
  176. package/dist/workflows/evented/index.cjs +10 -10
  177. package/dist/workflows/evented/index.js +1 -1
  178. package/dist/workflows/evented/workflow-event-processor/index.d.ts.map +1 -1
  179. package/dist/workflows/evented/workflow.d.ts.map +1 -1
  180. package/dist/workflows/index.cjs +12 -12
  181. package/dist/workflows/index.js +1 -1
  182. package/dist/workflows/legacy/index.cjs +22 -22
  183. package/dist/workflows/legacy/index.js +1 -1
  184. package/dist/workflows/legacy/machine.d.ts +1 -1
  185. package/dist/workflows/step.d.ts +4 -1
  186. package/dist/workflows/step.d.ts.map +1 -1
  187. package/dist/workflows/types.d.ts +1 -0
  188. package/dist/workflows/types.d.ts.map +1 -1
  189. package/dist/workflows/workflow.d.ts +3 -1
  190. package/dist/workflows/workflow.d.ts.map +1 -1
  191. package/package.json +11 -10
  192. package/src/llm/model/provider-types.generated.d.ts +629 -590
  193. package/dist/chunk-3ORA5EFD.cjs.map +0 -1
  194. package/dist/chunk-462DRETM.cjs.map +0 -1
  195. package/dist/chunk-5NR2GY4U.js.map +0 -1
  196. package/dist/chunk-A3QHQYMC.js.map +0 -1
  197. package/dist/chunk-APY2BE4K.cjs.map +0 -1
  198. package/dist/chunk-BV6CD4IZ.cjs.map +0 -1
  199. package/dist/chunk-DGQW5VRR.cjs.map +0 -1
  200. package/dist/chunk-FLXB6WXO.js.map +0 -1
  201. package/dist/chunk-HBJVAMCS.js.map +0 -1
  202. package/dist/chunk-HP7B2TQQ.js.map +0 -1
  203. package/dist/chunk-J2OKI2L3.js.map +0 -1
  204. package/dist/chunk-NUURZ3AY.js.map +0 -1
  205. package/dist/chunk-OXAN5SM7.cjs.map +0 -1
  206. package/dist/chunk-OY6UJ3QL.cjs.map +0 -1
  207. package/dist/chunk-T3PBU7JK.js.map +0 -1
  208. package/dist/chunk-XHPBKALR.cjs.map +0 -1
  209. package/dist/models-dev-3VEABUH4.js +0 -3
  210. package/dist/models-dev-L42ORGVT.cjs +0 -12
  211. package/dist/netlify-3B6HDHRP.cjs +0 -12
  212. package/dist/netlify-NYFKA6UB.js +0 -3
@@ -1,88 +1,87 @@
1
1
  {
2
2
  "providers": {
3
- "moonshotai-cn": {
4
- "url": "https://api.moonshot.cn/v1",
5
- "apiKeyEnvVar": "MOONSHOT_API_KEY",
6
- "apiKeyHeader": "Authorization",
7
- "name": "Moonshot AI (China)",
8
- "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
9
- "docUrl": "https://platform.moonshot.cn/docs/api/chat",
10
- "gateway": "models.dev"
11
- },
12
- "lucidquery": {
13
- "url": "https://lucidquery.com/api/v1",
14
- "apiKeyEnvVar": "LUCIDQUERY_API_KEY",
3
+ "nvidia": {
4
+ "url": "https://integrate.api.nvidia.com/v1",
5
+ "apiKeyEnvVar": "NVIDIA_API_KEY",
15
6
  "apiKeyHeader": "Authorization",
16
- "name": "LucidQuery AI",
17
- "models": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
18
- "docUrl": "https://lucidquery.com/api/docs",
7
+ "name": "Nvidia",
8
+ "models": [
9
+ "black-forest-labs/flux.1-dev",
10
+ "deepseek-ai/deepseek-v3.1",
11
+ "deepseek-ai/deepseek-v3.1-terminus",
12
+ "google/gemma-3-27b-it",
13
+ "microsoft/phi-4-mini-instruct",
14
+ "moonshotai/kimi-k2-instruct",
15
+ "moonshotai/kimi-k2-instruct-0905",
16
+ "nvidia/cosmos-nemotron-34b",
17
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
18
+ "nvidia/nemoretriever-ocr-v1",
19
+ "nvidia/parakeet-tdt-0.6b-v2",
20
+ "openai/gpt-oss-120b",
21
+ "openai/whisper-large-v3",
22
+ "qwen/qwen3-235b-a22b",
23
+ "qwen/qwen3-coder-480b-a35b-instruct"
24
+ ],
25
+ "docUrl": "https://docs.api.nvidia.com/nim/",
19
26
  "gateway": "models.dev"
20
27
  },
21
- "moonshotai": {
22
- "url": "https://api.moonshot.ai/v1",
23
- "apiKeyEnvVar": "MOONSHOT_API_KEY",
28
+ "modelscope": {
29
+ "url": "https://api-inference.modelscope.cn/v1",
30
+ "apiKeyEnvVar": "MODELSCOPE_API_KEY",
24
31
  "apiKeyHeader": "Authorization",
25
- "name": "Moonshot AI",
26
- "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
27
- "docUrl": "https://platform.moonshot.ai/docs/api/chat",
32
+ "name": "ModelScope",
33
+ "models": [
34
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
35
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
36
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
37
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
38
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
39
+ "ZhipuAI/GLM-4.5",
40
+ "ZhipuAI/GLM-4.6"
41
+ ],
42
+ "docUrl": "https://modelscope.cn/docs/model-service/API-Inference/intro",
28
43
  "gateway": "models.dev"
29
44
  },
30
- "zai-coding-plan": {
31
- "url": "https://api.z.ai/api/coding/paas/v4",
32
- "apiKeyEnvVar": "ZHIPU_API_KEY",
45
+ "aihubmix": {
46
+ "url": "https://api.aihubmix.com/v1",
47
+ "apiKeyEnvVar": "AIHUBMIX_API_KEY",
33
48
  "apiKeyHeader": "Authorization",
34
- "name": "Z.AI Coding Plan",
35
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
36
- "docUrl": "https://docs.z.ai/devpack/overview",
49
+ "name": "AIHubMix",
50
+ "models": [
51
+ "DeepSeek-V3.2-Exp",
52
+ "DeepSeek-V3.2-Exp-Think",
53
+ "Kimi-K2-0905",
54
+ "claude-haiku-4-5",
55
+ "claude-opus-4-1",
56
+ "claude-sonnet-4-5",
57
+ "gemini-2.5-flash",
58
+ "gemini-2.5-pro",
59
+ "glm-4.6",
60
+ "gpt-4.1",
61
+ "gpt-4.1-mini",
62
+ "gpt-4.1-nano",
63
+ "gpt-4o",
64
+ "gpt-4o-2024-11-20",
65
+ "gpt-5",
66
+ "gpt-5-codex",
67
+ "gpt-5-mini",
68
+ "gpt-5-nano",
69
+ "gpt-5-pro",
70
+ "o4-mini",
71
+ "qwen3-235b-a22b-instruct-2507",
72
+ "qwen3-235b-a22b-thinking-2507",
73
+ "qwen3-coder-480b-a35b-instruct"
74
+ ],
75
+ "docUrl": "https://aihubmix.com/docs/models",
37
76
  "gateway": "models.dev"
38
77
  },
39
- "alibaba": {
40
- "url": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
41
- "apiKeyEnvVar": "DASHSCOPE_API_KEY",
78
+ "lucidquery": {
79
+ "url": "https://lucidquery.com/api/v1",
80
+ "apiKeyEnvVar": "LUCIDQUERY_API_KEY",
42
81
  "apiKeyHeader": "Authorization",
43
- "name": "Alibaba",
44
- "models": [
45
- "qvq-max",
46
- "qwen-flash",
47
- "qwen-max",
48
- "qwen-mt-plus",
49
- "qwen-mt-turbo",
50
- "qwen-omni-turbo",
51
- "qwen-omni-turbo-realtime",
52
- "qwen-plus",
53
- "qwen-plus-character-ja",
54
- "qwen-turbo",
55
- "qwen-vl-max",
56
- "qwen-vl-ocr",
57
- "qwen-vl-plus",
58
- "qwen2-5-14b-instruct",
59
- "qwen2-5-32b-instruct",
60
- "qwen2-5-72b-instruct",
61
- "qwen2-5-7b-instruct",
62
- "qwen2-5-omni-7b",
63
- "qwen2-5-vl-72b-instruct",
64
- "qwen2-5-vl-7b-instruct",
65
- "qwen3-14b",
66
- "qwen3-235b-a22b",
67
- "qwen3-32b",
68
- "qwen3-8b",
69
- "qwen3-asr-flash",
70
- "qwen3-coder-30b-a3b-instruct",
71
- "qwen3-coder-480b-a35b-instruct",
72
- "qwen3-coder-flash",
73
- "qwen3-coder-plus",
74
- "qwen3-livetranslate-flash-realtime",
75
- "qwen3-max",
76
- "qwen3-next-80b-a3b-instruct",
77
- "qwen3-next-80b-a3b-thinking",
78
- "qwen3-omni-flash",
79
- "qwen3-omni-flash-realtime",
80
- "qwen3-vl-235b-a22b",
81
- "qwen3-vl-30b-a3b",
82
- "qwen3-vl-plus",
83
- "qwq-plus"
84
- ],
85
- "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
82
+ "name": "LucidQuery AI",
83
+ "models": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
84
+ "docUrl": "https://lucidquery.com/api/docs",
86
85
  "gateway": "models.dev"
87
86
  },
88
87
  "xai": {
@@ -113,444 +112,270 @@
113
112
  "docUrl": "https://docs.x.ai/docs/models",
114
113
  "gateway": "models.dev"
115
114
  },
116
- "nvidia": {
117
- "url": "https://integrate.api.nvidia.com/v1",
118
- "apiKeyEnvVar": "NVIDIA_API_KEY",
115
+ "deepseek": {
116
+ "url": "https://api.deepseek.com",
117
+ "apiKeyEnvVar": "DEEPSEEK_API_KEY",
119
118
  "apiKeyHeader": "Authorization",
120
- "name": "Nvidia",
121
- "models": [
122
- "black-forest-labs/flux.1-dev",
123
- "deepseek-ai/deepseek-v3.1",
124
- "google/gemma-3-27b-it",
125
- "microsoft/phi-4-mini-instruct",
126
- "moonshotai/kimi-k2-instruct",
127
- "moonshotai/kimi-k2-instruct-0905",
128
- "nvidia/cosmos-nemotron-34b",
129
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
130
- "nvidia/nemoretriever-ocr-v1",
131
- "nvidia/parakeet-tdt-0.6b-v2",
132
- "openai/gpt-oss-120b",
133
- "openai/whisper-large-v3",
134
- "qwen/qwen3-235b-a22b",
135
- "qwen/qwen3-coder-480b-a35b-instruct"
136
- ],
137
- "docUrl": "https://docs.api.nvidia.com/nim/",
119
+ "name": "DeepSeek",
120
+ "models": ["deepseek-chat", "deepseek-reasoner"],
121
+ "docUrl": "https://platform.deepseek.com/api-docs/pricing",
138
122
  "gateway": "models.dev"
139
123
  },
140
- "upstage": {
141
- "url": "https://api.upstage.ai",
142
- "apiKeyEnvVar": "UPSTAGE_API_KEY",
124
+ "requesty": {
125
+ "url": "https://router.requesty.ai/v1",
126
+ "apiKeyEnvVar": "REQUESTY_API_KEY",
143
127
  "apiKeyHeader": "Authorization",
144
- "name": "Upstage",
145
- "models": ["solar-mini", "solar-pro2"],
146
- "docUrl": "https://developers.upstage.ai/docs/apis/chat",
128
+ "name": "Requesty",
129
+ "models": [
130
+ "anthropic/claude-3-7-sonnet",
131
+ "anthropic/claude-4-sonnet-20250522",
132
+ "anthropic/claude-opus-4",
133
+ "anthropic/claude-opus-4-1-20250805",
134
+ "google/gemini-2.5-flash",
135
+ "google/gemini-2.5-pro",
136
+ "openai/gpt-4.1",
137
+ "openai/gpt-4.1-mini",
138
+ "openai/gpt-4o-mini",
139
+ "openai/gpt-5",
140
+ "openai/gpt-5-mini",
141
+ "openai/gpt-5-nano",
142
+ "openai/o4-mini"
143
+ ],
144
+ "docUrl": "https://requesty.ai/solution/llm-routing/models",
147
145
  "gateway": "models.dev"
148
146
  },
149
- "groq": {
150
- "url": "https://api.groq.com/openai/v1",
151
- "apiKeyEnvVar": "GROQ_API_KEY",
147
+ "nebius": {
148
+ "url": "https://api.studio.nebius.com/v1/",
149
+ "apiKeyEnvVar": "NEBIUS_API_KEY",
152
150
  "apiKeyHeader": "Authorization",
153
- "name": "Groq",
151
+ "name": "Nebius AI Studio",
154
152
  "models": [
155
- "deepseek-r1-distill-llama-70b",
156
- "gemma2-9b-it",
157
- "llama-3.1-8b-instant",
158
- "llama-3.3-70b-versatile",
159
- "llama-guard-3-8b",
160
- "llama3-70b-8192",
161
- "llama3-8b-8192",
162
- "meta-llama/llama-4-maverick-17b-128e-instruct",
163
- "meta-llama/llama-4-scout-17b-16e-instruct",
164
- "meta-llama/llama-guard-4-12b",
165
- "mistral-saba-24b",
153
+ "NousResearch/hermes-4-405b",
154
+ "NousResearch/hermes-4-70b",
155
+ "deepseek-ai/deepseek-v3",
156
+ "meta-llama/llama-3.3-70b-instruct-base",
157
+ "meta-llama/llama-3.3-70b-instruct-fast",
158
+ "meta-llama/llama-3_1-405b-instruct",
166
159
  "moonshotai/kimi-k2-instruct",
167
- "moonshotai/kimi-k2-instruct-0905",
160
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
168
161
  "openai/gpt-oss-120b",
169
162
  "openai/gpt-oss-20b",
170
- "qwen-qwq-32b",
171
- "qwen/qwen3-32b"
163
+ "qwen/qwen3-235b-a22b-instruct-2507",
164
+ "qwen/qwen3-235b-a22b-thinking-2507",
165
+ "qwen/qwen3-coder-480b-a35b-instruct",
166
+ "zai-org/glm-4.5",
167
+ "zai-org/glm-4.5-air"
172
168
  ],
173
- "docUrl": "https://console.groq.com/docs/models",
169
+ "docUrl": "https://docs.studio.nebius.com/quickstart",
174
170
  "gateway": "models.dev"
175
171
  },
176
- "mistral": {
177
- "url": "https://api.mistral.ai/v1",
178
- "apiKeyEnvVar": "MISTRAL_API_KEY",
172
+ "fastrouter": {
173
+ "url": "https://go.fastrouter.ai/api/v1",
174
+ "apiKeyEnvVar": "FASTROUTER_API_KEY",
179
175
  "apiKeyHeader": "Authorization",
180
- "name": "Mistral",
176
+ "name": "FastRouter",
181
177
  "models": [
182
- "codestral-latest",
183
- "devstral-medium-2507",
184
- "devstral-small-2505",
185
- "devstral-small-2507",
186
- "magistral-medium-latest",
187
- "magistral-small",
188
- "ministral-3b-latest",
189
- "ministral-8b-latest",
190
- "mistral-large-latest",
191
- "mistral-medium-2505",
192
- "mistral-medium-2508",
193
- "mistral-medium-latest",
194
- "mistral-nemo",
195
- "mistral-small-latest",
196
- "open-mistral-7b",
197
- "open-mixtral-8x22b",
198
- "open-mixtral-8x7b",
199
- "pixtral-12b",
200
- "pixtral-large-latest"
201
- ],
202
- "docUrl": "https://docs.mistral.ai/getting-started/models/",
203
- "gateway": "models.dev"
204
- },
205
- "vercel": {
206
- "url": "https://ai-gateway.vercel.sh/v1",
207
- "apiKeyEnvVar": "AI_GATEWAY_API_KEY",
208
- "apiKeyHeader": "Authorization",
209
- "name": "Vercel AI Gateway",
210
- "models": [
211
- "alibaba/qwen3-coder-plus",
212
- "alibaba/qwen3-max",
213
- "alibaba/qwen3-next-80b-a3b-instruct",
214
- "alibaba/qwen3-next-80b-a3b-thinking",
215
- "alibaba/qwen3-vl-instruct",
216
- "alibaba/qwen3-vl-thinking",
217
- "amazon/nova-lite",
218
- "amazon/nova-micro",
219
- "amazon/nova-pro",
220
- "anthropic/claude-3-5-haiku",
221
- "anthropic/claude-3-haiku",
222
- "anthropic/claude-3-opus",
223
- "anthropic/claude-3.5-sonnet",
224
- "anthropic/claude-3.7-sonnet",
225
- "anthropic/claude-4-1-opus",
226
- "anthropic/claude-4-opus",
227
- "anthropic/claude-4-sonnet",
228
- "anthropic/claude-4.5-sonnet",
229
- "anthropic/claude-haiku-4.5",
230
- "cerebras/qwen3-coder",
231
- "deepseek/deepseek-r1",
232
- "deepseek/deepseek-r1-distill-llama-70b",
233
- "deepseek/deepseek-v3.1-terminus",
234
- "deepseek/deepseek-v3.2-exp",
235
- "deepseek/deepseek-v3.2-exp-thinking",
236
- "google/gemini-2.0-flash",
237
- "google/gemini-2.0-flash-lite",
178
+ "anthropic/claude-opus-4.1",
179
+ "anthropic/claude-sonnet-4",
180
+ "deepseek-ai/deepseek-r1-distill-llama-70b",
238
181
  "google/gemini-2.5-flash",
239
- "google/gemini-2.5-flash-lite",
240
- "google/gemini-2.5-flash-lite-preview-09-2025",
241
- "google/gemini-2.5-flash-preview-09-2025",
242
182
  "google/gemini-2.5-pro",
243
- "meta/llama-3.3-70b",
244
- "meta/llama-4-maverick",
245
- "meta/llama-4-scout",
246
- "mistral/codestral",
247
- "mistral/magistral-medium",
248
- "mistral/magistral-small",
249
- "mistral/ministral-3b",
250
- "mistral/ministral-8b",
251
- "mistral/mistral-large",
252
- "mistral/mistral-small",
253
- "mistral/mixtral-8x22b-instruct",
254
- "mistral/pixtral-12b",
255
- "mistral/pixtral-large",
256
183
  "moonshotai/kimi-k2",
257
- "morph/morph-v3-fast",
258
- "morph/morph-v3-large",
259
- "openai/gpt-4-turbo",
260
184
  "openai/gpt-4.1",
261
- "openai/gpt-4.1-mini",
262
- "openai/gpt-4.1-nano",
263
- "openai/gpt-4o",
264
- "openai/gpt-4o-mini",
265
185
  "openai/gpt-5",
266
- "openai/gpt-5-codex",
267
186
  "openai/gpt-5-mini",
268
187
  "openai/gpt-5-nano",
269
188
  "openai/gpt-oss-120b",
270
189
  "openai/gpt-oss-20b",
271
- "openai/o1",
272
- "openai/o3",
273
- "openai/o3-mini",
274
- "openai/o4-mini",
275
- "perplexity/sonar",
276
- "perplexity/sonar-pro",
277
- "perplexity/sonar-reasoning",
278
- "perplexity/sonar-reasoning-pro",
279
- "vercel/v0-1.0-md",
280
- "vercel/v0-1.5-md",
281
- "xai/grok-2",
282
- "xai/grok-2-vision",
283
- "xai/grok-3",
284
- "xai/grok-3-fast",
285
- "xai/grok-3-mini",
286
- "xai/grok-3-mini-fast",
287
- "xai/grok-4",
288
- "xai/grok-4-fast",
289
- "xai/grok-4-fast-non-reasoning",
290
- "xai/grok-code-fast-1",
291
- "zai/glm-4.5",
292
- "zai/glm-4.5-air",
293
- "zai/glm-4.5v",
294
- "zai/glm-4.6"
295
- ],
296
- "docUrl": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
297
- "gateway": "models.dev"
298
- },
299
- "nebius": {
300
- "url": "https://api.studio.nebius.com/v1/",
301
- "apiKeyEnvVar": "NEBIUS_API_KEY",
302
- "apiKeyHeader": "Authorization",
303
- "name": "Nebius AI Studio",
304
- "models": [
305
- "NousResearch/hermes-4-405b",
306
- "NousResearch/hermes-4-70b",
307
- "deepseek-ai/deepseek-v3",
308
- "meta-llama/llama-3.3-70b-instruct-base",
309
- "meta-llama/llama-3.3-70b-instruct-fast",
310
- "meta-llama/llama-3_1-405b-instruct",
311
- "moonshotai/kimi-k2-instruct",
312
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
313
- "openai/gpt-oss-120b",
314
- "openai/gpt-oss-20b",
315
- "qwen/qwen3-235b-a22b-instruct-2507",
316
- "qwen/qwen3-235b-a22b-thinking-2507",
317
- "qwen/qwen3-coder-480b-a35b-instruct",
318
- "zai-org/glm-4.5",
319
- "zai-org/glm-4.5-air"
190
+ "qwen/qwen3-coder",
191
+ "x-ai/grok-4"
320
192
  ],
321
- "docUrl": "https://docs.studio.nebius.com/quickstart",
193
+ "docUrl": "https://fastrouter.ai/models",
322
194
  "gateway": "models.dev"
323
195
  },
324
- "deepseek": {
325
- "url": "https://api.deepseek.com",
326
- "apiKeyEnvVar": "DEEPSEEK_API_KEY",
196
+ "perplexity": {
197
+ "url": "https://api.perplexity.ai",
198
+ "apiKeyEnvVar": "PERPLEXITY_API_KEY",
327
199
  "apiKeyHeader": "Authorization",
328
- "name": "DeepSeek",
329
- "models": ["deepseek-chat", "deepseek-reasoner"],
330
- "docUrl": "https://platform.deepseek.com/api-docs/pricing",
200
+ "name": "Perplexity",
201
+ "models": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
202
+ "docUrl": "https://docs.perplexity.ai",
331
203
  "gateway": "models.dev"
332
204
  },
333
- "alibaba-cn": {
334
- "url": "https://dashscope.aliyuncs.com/compatible-mode/v1",
335
- "apiKeyEnvVar": "DASHSCOPE_API_KEY",
205
+ "morph": {
206
+ "url": "https://api.morphllm.com/v1",
207
+ "apiKeyEnvVar": "MORPH_API_KEY",
336
208
  "apiKeyHeader": "Authorization",
337
- "name": "Alibaba (China)",
338
- "models": [
339
- "deepseek-r1",
340
- "deepseek-r1-0528",
341
- "deepseek-r1-distill-llama-70b",
342
- "deepseek-r1-distill-llama-8b",
343
- "deepseek-r1-distill-qwen-1-5b",
344
- "deepseek-r1-distill-qwen-14b",
345
- "deepseek-r1-distill-qwen-32b",
346
- "deepseek-r1-distill-qwen-7b",
347
- "deepseek-v3",
348
- "deepseek-v3-1",
349
- "deepseek-v3-2-exp",
350
- "moonshot-kimi-k2-instruct",
351
- "qvq-max",
352
- "qwen-deep-research",
353
- "qwen-doc-turbo",
354
- "qwen-flash",
355
- "qwen-long",
356
- "qwen-math-plus",
357
- "qwen-math-turbo",
358
- "qwen-max",
359
- "qwen-mt-plus",
360
- "qwen-mt-turbo",
361
- "qwen-omni-turbo",
362
- "qwen-omni-turbo-realtime",
363
- "qwen-plus",
364
- "qwen-plus-character",
365
- "qwen-turbo",
366
- "qwen-vl-max",
367
- "qwen-vl-ocr",
368
- "qwen-vl-plus",
369
- "qwen2-5-14b-instruct",
370
- "qwen2-5-32b-instruct",
371
- "qwen2-5-72b-instruct",
372
- "qwen2-5-7b-instruct",
373
- "qwen2-5-coder-32b-instruct",
374
- "qwen2-5-coder-7b-instruct",
375
- "qwen2-5-math-72b-instruct",
376
- "qwen2-5-math-7b-instruct",
377
- "qwen2-5-omni-7b",
378
- "qwen2-5-vl-72b-instruct",
379
- "qwen2-5-vl-7b-instruct",
380
- "qwen3-14b",
381
- "qwen3-235b-a22b",
382
- "qwen3-32b",
383
- "qwen3-8b",
384
- "qwen3-asr-flash",
385
- "qwen3-coder-30b-a3b-instruct",
386
- "qwen3-coder-480b-a35b-instruct",
387
- "qwen3-coder-flash",
388
- "qwen3-coder-plus",
389
- "qwen3-max",
390
- "qwen3-next-80b-a3b-instruct",
391
- "qwen3-next-80b-a3b-thinking",
392
- "qwen3-omni-flash",
393
- "qwen3-omni-flash-realtime",
394
- "qwen3-vl-235b-a22b",
395
- "qwen3-vl-30b-a3b",
396
- "qwen3-vl-plus",
397
- "qwq-32b",
398
- "qwq-plus",
399
- "tongyi-intent-detect-v3"
400
- ],
401
- "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
209
+ "name": "Morph",
210
+ "models": ["auto", "morph-v3-fast", "morph-v3-large"],
211
+ "docUrl": "https://docs.morphllm.com/api-reference/introduction",
402
212
  "gateway": "models.dev"
403
213
  },
404
- "venice": {
405
- "url": "https://api.venice.ai/api/v1",
406
- "apiKeyEnvVar": "VENICE_API_KEY",
214
+ "zai-coding-plan": {
215
+ "url": "https://api.z.ai/api/coding/paas/v4",
216
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
407
217
  "apiKeyHeader": "Authorization",
408
- "name": "Venice AI",
409
- "models": [
410
- "deepseek-coder-v2-lite",
411
- "deepseek-r1-671b",
412
- "dolphin-2.9.2-qwen2-72b",
413
- "llama-3.1-405b",
414
- "llama-3.2-3b",
415
- "llama-3.3-70b",
416
- "mistral-31-24b",
417
- "qwen-2.5-coder-32b",
418
- "qwen-2.5-qwq-32b",
419
- "qwen-2.5-vl",
420
- "qwen3-235b",
421
- "qwen3-4b",
422
- "venice-uncensored"
423
- ],
424
- "docUrl": "https://docs.venice.ai",
218
+ "name": "Z.AI Coding Plan",
219
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
220
+ "docUrl": "https://docs.z.ai/devpack/overview",
425
221
  "gateway": "models.dev"
426
222
  },
427
- "chutes": {
428
- "url": "https://llm.chutes.ai/v1",
429
- "apiKeyEnvVar": "CHUTES_API_KEY",
223
+ "huggingface": {
224
+ "url": "https://router.huggingface.co/v1",
225
+ "apiKeyEnvVar": "HF_TOKEN",
430
226
  "apiKeyHeader": "Authorization",
431
- "name": "Chutes",
227
+ "name": "Hugging Face",
432
228
  "models": [
433
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
434
229
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
435
- "Qwen/Qwen3-30B-A3B",
436
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
437
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
438
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
439
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
230
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
440
231
  "Qwen/Qwen3-Next-80B-A3B-Instruct",
441
232
  "Qwen/Qwen3-Next-80B-A3B-Thinking",
442
- "chutesai/Devstral-Small-2505",
443
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
444
233
  "deepseek-ai/DeepSeek-R1-0528",
445
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
446
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
447
- "deepseek-ai/DeepSeek-V3-0324",
448
- "deepseek-ai/DeepSeek-V3.1",
449
- "deepseek-ai/DeepSeek-V3.1-Terminus",
450
- "deepseek-ai/DeepSeek-V3.1-turbo",
451
- "deepseek-ai/DeepSeek-V3.1:THINKING",
452
- "deepseek-ai/DeepSeek-V3.2-Exp",
453
- "meituan-longcat/LongCat-Flash-Chat-FP8",
454
- "moonshotai/Kimi-Dev-72B",
234
+ "deepseek-ai/Deepseek-V3-0324",
235
+ "moonshotai/Kimi-K2-Instruct",
455
236
  "moonshotai/Kimi-K2-Instruct-0905",
456
- "moonshotai/Kimi-K2-Instruct-75k",
457
- "moonshotai/Kimi-VL-A3B-Thinking",
458
- "openai/gpt-oss-120b",
459
- "tngtech/DeepSeek-R1T-Chimera",
460
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
237
+ "zai-org/GLM-4.5",
461
238
  "zai-org/GLM-4.5-Air",
462
- "zai-org/GLM-4.5-FP8",
463
- "zai-org/GLM-4.5-turbo",
464
- "zai-org/GLM-4.6-FP8",
465
- "zai-org/GLM-4.6-turbo"
466
- ],
467
- "docUrl": "https://llm.chutes.ai/v1/models",
468
- "gateway": "models.dev"
469
- },
470
- "cortecs": {
471
- "url": "https://api.cortecs.ai/v1",
472
- "apiKeyEnvVar": "CORTECS_API_KEY",
473
- "apiKeyHeader": "Authorization",
474
- "name": "Cortecs",
475
- "models": [
476
- "claude-4-5-sonnet",
477
- "claude-sonnet-4",
478
- "deepseek-v3-0324",
479
- "gemini-2.5-pro",
480
- "gpt-4.1",
481
- "gpt-oss-120b",
482
- "kimi-k2-instruct",
483
- "llama-3.1-405b-instruct",
484
- "nova-pro-v1",
485
- "qwen3-32b",
486
- "qwen3-coder-480b-a35b-instruct"
239
+ "zai-org/GLM-4.6"
487
240
  ],
488
- "docUrl": "https://api.cortecs.ai/v1/models",
241
+ "docUrl": "https://huggingface.co/docs/inference-providers",
489
242
  "gateway": "models.dev"
490
243
  },
491
- "github-models": {
492
- "url": "https://models.github.ai/inference",
493
- "apiKeyEnvVar": "GITHUB_TOKEN",
494
- "apiKeyHeader": "Authorization",
495
- "name": "GitHub Models",
244
+ "openrouter": {
245
+ "url": "https://openrouter.ai/api/v1",
246
+ "apiKeyEnvVar": "OPENROUTER_API_KEY",
247
+ "name": "OpenRouter",
496
248
  "models": [
497
- "ai21-labs/ai21-jamba-1.5-large",
498
- "ai21-labs/ai21-jamba-1.5-mini",
499
- "cohere/cohere-command-a",
500
- "cohere/cohere-command-r",
501
- "cohere/cohere-command-r-08-2024",
502
- "cohere/cohere-command-r-plus",
503
- "cohere/cohere-command-r-plus-08-2024",
504
- "core42/jais-30b-chat",
505
- "deepseek/deepseek-r1",
506
- "deepseek/deepseek-r1-0528",
507
- "deepseek/deepseek-v3-0324",
508
- "meta/llama-3.2-11b-vision-instruct",
509
- "meta/llama-3.2-90b-vision-instruct",
510
- "meta/llama-3.3-70b-instruct",
511
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
512
- "meta/llama-4-scout-17b-16e-instruct",
513
- "meta/meta-llama-3-70b-instruct",
514
- "meta/meta-llama-3-8b-instruct",
515
- "meta/meta-llama-3.1-405b-instruct",
516
- "meta/meta-llama-3.1-70b-instruct",
517
- "meta/meta-llama-3.1-8b-instruct",
518
- "microsoft/mai-ds-r1",
519
- "microsoft/phi-3-medium-128k-instruct",
520
- "microsoft/phi-3-medium-4k-instruct",
521
- "microsoft/phi-3-mini-128k-instruct",
522
- "microsoft/phi-3-mini-4k-instruct",
523
- "microsoft/phi-3-small-128k-instruct",
524
- "microsoft/phi-3-small-8k-instruct",
525
- "microsoft/phi-3.5-mini-instruct",
526
- "microsoft/phi-3.5-moe-instruct",
527
- "microsoft/phi-3.5-vision-instruct",
528
- "microsoft/phi-4",
529
- "microsoft/phi-4-mini-instruct",
530
- "microsoft/phi-4-mini-reasoning",
531
- "microsoft/phi-4-multimodal-instruct",
532
- "microsoft/phi-4-reasoning",
533
- "mistral-ai/codestral-2501",
534
- "mistral-ai/ministral-3b",
535
- "mistral-ai/mistral-large-2411",
536
- "mistral-ai/mistral-medium-2505",
537
- "mistral-ai/mistral-nemo",
538
- "mistral-ai/mistral-small-2503",
249
+ "anthropic/claude-3.5-haiku",
250
+ "anthropic/claude-3.7-sonnet",
251
+ "anthropic/claude-haiku-4.5",
252
+ "anthropic/claude-opus-4",
253
+ "anthropic/claude-opus-4.1",
254
+ "anthropic/claude-sonnet-4",
255
+ "anthropic/claude-sonnet-4.5",
256
+ "cognitivecomputations/dolphin3.0-mistral-24b",
257
+ "cognitivecomputations/dolphin3.0-r1-mistral-24b",
258
+ "deepseek/deepseek-chat-v3-0324",
259
+ "deepseek/deepseek-chat-v3.1",
260
+ "deepseek/deepseek-r1-0528-qwen3-8b:free",
261
+ "deepseek/deepseek-r1-0528:free",
262
+ "deepseek/deepseek-r1-distill-llama-70b",
263
+ "deepseek/deepseek-r1-distill-qwen-14b",
264
+ "deepseek/deepseek-r1:free",
265
+ "deepseek/deepseek-v3-base:free",
266
+ "deepseek/deepseek-v3.1-terminus",
267
+ "featherless/qwerky-72b",
268
+ "google/gemini-2.0-flash-001",
269
+ "google/gemini-2.0-flash-exp:free",
270
+ "google/gemini-2.5-flash",
271
+ "google/gemini-2.5-flash-lite",
272
+ "google/gemini-2.5-flash-lite-preview-09-2025",
273
+ "google/gemini-2.5-flash-preview-09-2025",
274
+ "google/gemini-2.5-pro",
275
+ "google/gemini-2.5-pro-preview-05-06",
276
+ "google/gemini-2.5-pro-preview-06-05",
277
+ "google/gemma-2-9b-it:free",
278
+ "google/gemma-3-12b-it",
279
+ "google/gemma-3-27b-it",
280
+ "google/gemma-3n-e4b-it",
281
+ "google/gemma-3n-e4b-it:free",
282
+ "meta-llama/llama-3.2-11b-vision-instruct",
283
+ "meta-llama/llama-3.3-70b-instruct:free",
284
+ "meta-llama/llama-4-scout:free",
285
+ "microsoft/mai-ds-r1:free",
286
+ "mistralai/codestral-2508",
287
+ "mistralai/devstral-medium-2507",
288
+ "mistralai/devstral-small-2505",
289
+ "mistralai/devstral-small-2505:free",
290
+ "mistralai/devstral-small-2507",
291
+ "mistralai/mistral-7b-instruct:free",
292
+ "mistralai/mistral-medium-3",
293
+ "mistralai/mistral-medium-3.1",
294
+ "mistralai/mistral-nemo:free",
295
+ "mistralai/mistral-small-3.1-24b-instruct",
296
+ "mistralai/mistral-small-3.2-24b-instruct",
297
+ "mistralai/mistral-small-3.2-24b-instruct:free",
298
+ "moonshotai/kimi-dev-72b:free",
299
+ "moonshotai/kimi-k2",
300
+ "moonshotai/kimi-k2-0905",
301
+ "moonshotai/kimi-k2:free",
302
+ "nousresearch/deephermes-3-llama-3-8b-preview",
303
+ "nousresearch/hermes-4-405b",
304
+ "nousresearch/hermes-4-70b",
539
305
  "openai/gpt-4.1",
540
306
  "openai/gpt-4.1-mini",
541
- "openai/gpt-4.1-nano",
542
- "openai/gpt-4o",
543
307
  "openai/gpt-4o-mini",
544
- "openai/o1",
545
- "openai/o1-mini",
546
- "openai/o1-preview",
547
- "openai/o3",
548
- "openai/o3-mini",
308
+ "openai/gpt-5",
309
+ "openai/gpt-5-chat",
310
+ "openai/gpt-5-codex",
311
+ "openai/gpt-5-image",
312
+ "openai/gpt-5-mini",
313
+ "openai/gpt-5-nano",
314
+ "openai/gpt-oss-120b",
315
+ "openai/gpt-oss-20b",
549
316
  "openai/o4-mini",
550
- "xai/grok-3",
551
- "xai/grok-3-mini"
317
+ "openrouter/cypher-alpha:free",
318
+ "openrouter/horizon-alpha",
319
+ "openrouter/horizon-beta",
320
+ "openrouter/sonoma-dusk-alpha",
321
+ "openrouter/sonoma-sky-alpha",
322
+ "qwen/qwen-2.5-coder-32b-instruct",
323
+ "qwen/qwen2.5-vl-32b-instruct:free",
324
+ "qwen/qwen2.5-vl-72b-instruct",
325
+ "qwen/qwen2.5-vl-72b-instruct:free",
326
+ "qwen/qwen3-14b:free",
327
+ "qwen/qwen3-235b-a22b-07-25",
328
+ "qwen/qwen3-235b-a22b-07-25:free",
329
+ "qwen/qwen3-235b-a22b-thinking-2507",
330
+ "qwen/qwen3-235b-a22b:free",
331
+ "qwen/qwen3-30b-a3b-instruct-2507",
332
+ "qwen/qwen3-30b-a3b-thinking-2507",
333
+ "qwen/qwen3-30b-a3b:free",
334
+ "qwen/qwen3-32b:free",
335
+ "qwen/qwen3-8b:free",
336
+ "qwen/qwen3-coder",
337
+ "qwen/qwen3-coder:free",
338
+ "qwen/qwen3-max",
339
+ "qwen/qwen3-next-80b-a3b-instruct",
340
+ "qwen/qwen3-next-80b-a3b-thinking",
341
+ "qwen/qwq-32b:free",
342
+ "rekaai/reka-flash-3",
343
+ "sarvamai/sarvam-m:free",
344
+ "thudm/glm-z1-32b:free",
345
+ "tngtech/deepseek-r1t2-chimera:free",
346
+ "x-ai/grok-3",
347
+ "x-ai/grok-3-beta",
348
+ "x-ai/grok-3-mini",
349
+ "x-ai/grok-3-mini-beta",
350
+ "x-ai/grok-4",
351
+ "x-ai/grok-4-fast",
352
+ "x-ai/grok-4-fast:free",
353
+ "x-ai/grok-code-fast-1",
354
+ "z-ai/glm-4.5",
355
+ "z-ai/glm-4.5-air",
356
+ "z-ai/glm-4.5-air:free",
357
+ "z-ai/glm-4.5v",
358
+ "z-ai/glm-4.6"
552
359
  ],
553
- "docUrl": "https://docs.github.com/en/github-models",
360
+ "docUrl": "https://openrouter.ai/models",
361
+ "gateway": "models.dev"
362
+ },
363
+ "cerebras": {
364
+ "url": "https://api.cerebras.ai/v1",
365
+ "apiKeyEnvVar": "CEREBRAS_API_KEY",
366
+ "apiKeyHeader": "Authorization",
367
+ "name": "Cerebras",
368
+ "models": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
369
+ "docUrl": "https://inference-docs.cerebras.ai/models/overview",
370
+ "gateway": "models.dev"
371
+ },
372
+ "zhipuai": {
373
+ "url": "https://open.bigmodel.cn/api/paas/v4",
374
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
375
+ "apiKeyHeader": "Authorization",
376
+ "name": "Zhipu AI",
377
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
378
+ "docUrl": "https://docs.z.ai/guides/overview/pricing",
554
379
  "gateway": "models.dev"
555
380
  },
556
381
  "togetherai": {
@@ -569,81 +394,168 @@
569
394
  "docUrl": "https://docs.together.ai/docs/serverless-models",
570
395
  "gateway": "models.dev"
571
396
  },
572
- "baseten": {
573
- "url": "https://inference.baseten.co/v1",
574
- "apiKeyEnvVar": "BASETEN_API_KEY",
575
- "apiKeyHeader": "Authorization",
576
- "name": "Baseten",
577
- "models": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905"],
578
- "docUrl": "https://docs.baseten.co/development/model-apis/overview",
579
- "gateway": "models.dev"
580
- },
581
- "huggingface": {
582
- "url": "https://router.huggingface.co/v1",
583
- "apiKeyEnvVar": "HF_TOKEN",
397
+ "wandb": {
398
+ "url": "https://api.inference.wandb.ai/v1",
399
+ "apiKeyEnvVar": "WANDB_API_KEY",
584
400
  "apiKeyHeader": "Authorization",
585
- "name": "Hugging Face",
401
+ "name": "Weights & Biases",
586
402
  "models": [
403
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
587
404
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
588
405
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
589
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
590
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
591
406
  "deepseek-ai/DeepSeek-R1-0528",
592
- "deepseek-ai/Deepseek-V3-0324",
593
- "moonshotai/Kimi-K2-Instruct",
594
- "moonshotai/Kimi-K2-Instruct-0905",
595
- "zai-org/GLM-4.5",
596
- "zai-org/GLM-4.5-Air",
597
- "zai-org/GLM-4.6"
407
+ "deepseek-ai/DeepSeek-V3-0324",
408
+ "meta-llama/Llama-3.1-8B-Instruct",
409
+ "meta-llama/Llama-3.3-70B-Instruct",
410
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
411
+ "microsoft/Phi-4-mini-instruct",
412
+ "moonshotai/Kimi-K2-Instruct"
598
413
  ],
599
- "docUrl": "https://huggingface.co/docs/inference-providers",
414
+ "docUrl": "https://weave-docs.wandb.ai/guides/integrations/inference/",
600
415
  "gateway": "models.dev"
601
416
  },
602
- "opencode": {
603
- "url": "https://opencode.ai/zen/v1",
604
- "apiKeyEnvVar": "OPENCODE_API_KEY",
417
+ "submodel": {
418
+ "url": "https://llm.submodel.ai/v1",
419
+ "apiKeyEnvVar": "SUBMODEL_INSTAGEN_ACCESS_KEY",
605
420
  "apiKeyHeader": "Authorization",
606
- "name": "OpenCode Zen",
421
+ "name": "submodel",
607
422
  "models": [
608
- "an-g8x",
609
- "claude-3-5-haiku",
610
- "claude-haiku-4-5",
611
- "claude-opus-4-1",
612
- "claude-sonnet-4",
613
- "claude-sonnet-4-5",
614
- "code-supernova",
615
- "glm-4.6",
616
- "gpt-5",
617
- "gpt-5-codex",
618
- "grok-code",
619
- "kimi-k2",
620
- "qwen3-coder"
423
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
424
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
425
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
426
+ "deepseek-ai/DeepSeek-R1-0528",
427
+ "deepseek-ai/DeepSeek-V3-0324",
428
+ "deepseek-ai/DeepSeek-V3.1",
429
+ "openai/gpt-oss-120b",
430
+ "zai-org/GLM-4.5-Air",
431
+ "zai-org/GLM-4.5-FP8"
621
432
  ],
622
- "docUrl": "https://opencode.ai/docs/zen",
433
+ "docUrl": "https://submodel.gitbook.io",
623
434
  "gateway": "models.dev"
624
435
  },
625
- "fastrouter": {
626
- "url": "https://go.fastrouter.ai/api/v1",
627
- "apiKeyEnvVar": "FASTROUTER_API_KEY",
436
+ "vercel": {
437
+ "url": "https://ai-gateway.vercel.sh/v1",
438
+ "apiKeyEnvVar": "AI_GATEWAY_API_KEY",
628
439
  "apiKeyHeader": "Authorization",
629
- "name": "FastRouter",
440
+ "name": "Vercel AI Gateway",
630
441
  "models": [
631
- "anthropic/claude-opus-4.1",
632
- "anthropic/claude-sonnet-4",
633
- "deepseek-ai/deepseek-r1-distill-llama-70b",
442
+ "alibaba/qwen3-coder-plus",
443
+ "alibaba/qwen3-max",
444
+ "alibaba/qwen3-next-80b-a3b-instruct",
445
+ "alibaba/qwen3-next-80b-a3b-thinking",
446
+ "alibaba/qwen3-vl-instruct",
447
+ "alibaba/qwen3-vl-thinking",
448
+ "amazon/nova-lite",
449
+ "amazon/nova-micro",
450
+ "amazon/nova-pro",
451
+ "anthropic/claude-3-5-haiku",
452
+ "anthropic/claude-3-haiku",
453
+ "anthropic/claude-3-opus",
454
+ "anthropic/claude-3.5-sonnet",
455
+ "anthropic/claude-3.7-sonnet",
456
+ "anthropic/claude-4-1-opus",
457
+ "anthropic/claude-4-opus",
458
+ "anthropic/claude-4-sonnet",
459
+ "anthropic/claude-4.5-sonnet",
460
+ "anthropic/claude-haiku-4.5",
461
+ "cerebras/qwen3-coder",
462
+ "deepseek/deepseek-r1",
463
+ "deepseek/deepseek-r1-distill-llama-70b",
464
+ "deepseek/deepseek-v3.1-terminus",
465
+ "deepseek/deepseek-v3.2-exp",
466
+ "deepseek/deepseek-v3.2-exp-thinking",
467
+ "google/gemini-2.0-flash",
468
+ "google/gemini-2.0-flash-lite",
634
469
  "google/gemini-2.5-flash",
470
+ "google/gemini-2.5-flash-lite",
471
+ "google/gemini-2.5-flash-lite-preview-09-2025",
472
+ "google/gemini-2.5-flash-preview-09-2025",
635
473
  "google/gemini-2.5-pro",
474
+ "meta/llama-3.3-70b",
475
+ "meta/llama-4-maverick",
476
+ "meta/llama-4-scout",
477
+ "mistral/codestral",
478
+ "mistral/magistral-medium",
479
+ "mistral/magistral-small",
480
+ "mistral/ministral-3b",
481
+ "mistral/ministral-8b",
482
+ "mistral/mistral-large",
483
+ "mistral/mistral-small",
484
+ "mistral/mixtral-8x22b-instruct",
485
+ "mistral/pixtral-12b",
486
+ "mistral/pixtral-large",
636
487
  "moonshotai/kimi-k2",
488
+ "morph/morph-v3-fast",
489
+ "morph/morph-v3-large",
490
+ "openai/gpt-4-turbo",
637
491
  "openai/gpt-4.1",
492
+ "openai/gpt-4.1-mini",
493
+ "openai/gpt-4.1-nano",
494
+ "openai/gpt-4o",
495
+ "openai/gpt-4o-mini",
638
496
  "openai/gpt-5",
497
+ "openai/gpt-5-codex",
639
498
  "openai/gpt-5-mini",
640
499
  "openai/gpt-5-nano",
641
500
  "openai/gpt-oss-120b",
642
501
  "openai/gpt-oss-20b",
643
- "qwen/qwen3-coder",
644
- "x-ai/grok-4"
502
+ "openai/o1",
503
+ "openai/o3",
504
+ "openai/o3-mini",
505
+ "openai/o4-mini",
506
+ "perplexity/sonar",
507
+ "perplexity/sonar-pro",
508
+ "perplexity/sonar-reasoning",
509
+ "perplexity/sonar-reasoning-pro",
510
+ "vercel/v0-1.0-md",
511
+ "vercel/v0-1.5-md",
512
+ "xai/grok-2",
513
+ "xai/grok-2-vision",
514
+ "xai/grok-3",
515
+ "xai/grok-3-fast",
516
+ "xai/grok-3-mini",
517
+ "xai/grok-3-mini-fast",
518
+ "xai/grok-4",
519
+ "xai/grok-4-fast",
520
+ "xai/grok-4-fast-non-reasoning",
521
+ "xai/grok-code-fast-1",
522
+ "zai/glm-4.5",
523
+ "zai/glm-4.5-air",
524
+ "zai/glm-4.5v",
525
+ "zai/glm-4.6"
645
526
  ],
646
- "docUrl": "https://fastrouter.ai/models",
527
+ "docUrl": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
528
+ "gateway": "models.dev"
529
+ },
530
+ "synthetic": {
531
+ "url": "https://api.synthetic.new/v1",
532
+ "apiKeyEnvVar": "SYNTHETIC_API_KEY",
533
+ "apiKeyHeader": "Authorization",
534
+ "name": "Synthetic",
535
+ "models": [
536
+ "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
537
+ "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
538
+ "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
539
+ "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
540
+ "hf:deepseek-ai/DeepSeek-R1",
541
+ "hf:deepseek-ai/DeepSeek-R1-0528",
542
+ "hf:deepseek-ai/DeepSeek-V3",
543
+ "hf:deepseek-ai/DeepSeek-V3-0324",
544
+ "hf:deepseek-ai/DeepSeek-V3.1",
545
+ "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
546
+ "hf:meta-llama/Llama-3.1-405B-Instruct",
547
+ "hf:meta-llama/Llama-3.1-70B-Instruct",
548
+ "hf:meta-llama/Llama-3.1-8B-Instruct",
549
+ "hf:meta-llama/Llama-3.3-70B-Instruct",
550
+ "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
551
+ "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
552
+ "hf:moonshotai/Kimi-K2-Instruct",
553
+ "hf:moonshotai/Kimi-K2-Instruct-0905",
554
+ "hf:openai/gpt-oss-120b",
555
+ "hf:zai-org/GLM-4.5",
556
+ "hf:zai-org/GLM-4.6"
557
+ ],
558
+ "docUrl": "https://synthetic.new/pricing",
647
559
  "gateway": "models.dev"
648
560
  },
649
561
  "google": {
@@ -677,236 +589,105 @@
677
589
  "docUrl": "https://ai.google.dev/gemini-api/docs/pricing",
678
590
  "gateway": "models.dev"
679
591
  },
680
- "inception": {
681
- "url": "https://api.inceptionlabs.ai/v1/",
682
- "apiKeyEnvVar": "INCEPTION_API_KEY",
683
- "apiKeyHeader": "Authorization",
684
- "name": "Inception",
685
- "models": ["mercury", "mercury-coder"],
686
- "docUrl": "https://platform.inceptionlabs.ai/docs",
687
- "gateway": "models.dev"
688
- },
689
- "wandb": {
690
- "url": "https://api.inference.wandb.ai/v1",
691
- "apiKeyEnvVar": "WANDB_API_KEY",
592
+ "groq": {
593
+ "url": "https://api.groq.com/openai/v1",
594
+ "apiKeyEnvVar": "GROQ_API_KEY",
692
595
  "apiKeyHeader": "Authorization",
693
- "name": "Weights & Biases",
694
- "models": [
695
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
696
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
697
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
698
- "deepseek-ai/DeepSeek-R1-0528",
699
- "deepseek-ai/DeepSeek-V3-0324",
700
- "meta-llama/Llama-3.1-8B-Instruct",
701
- "meta-llama/Llama-3.3-70B-Instruct",
702
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
703
- "microsoft/Phi-4-mini-instruct",
704
- "moonshotai/Kimi-K2-Instruct"
705
- ],
706
- "docUrl": "https://weave-docs.wandb.ai/guides/integrations/inference/",
707
- "gateway": "models.dev"
708
- },
709
- "openai": {
710
- "apiKeyEnvVar": "OPENAI_API_KEY",
711
- "name": "OpenAI",
596
+ "name": "Groq",
712
597
  "models": [
713
- "codex-mini-latest",
714
- "gpt-3.5-turbo",
715
- "gpt-4",
716
- "gpt-4-turbo",
717
- "gpt-4.1",
718
- "gpt-4.1-mini",
719
- "gpt-4.1-nano",
720
- "gpt-4o",
721
- "gpt-4o-2024-05-13",
722
- "gpt-4o-2024-08-06",
723
- "gpt-4o-2024-11-20",
724
- "gpt-4o-mini",
725
- "gpt-5",
726
- "gpt-5-chat-latest",
727
- "gpt-5-codex",
728
- "gpt-5-mini",
729
- "gpt-5-nano",
730
- "o1",
731
- "o1-mini",
732
- "o1-preview",
733
- "o1-pro",
734
- "o3",
735
- "o3-deep-research",
736
- "o3-mini",
737
- "o3-pro",
738
- "o4-mini",
739
- "o4-mini-deep-research"
598
+ "deepseek-r1-distill-llama-70b",
599
+ "gemma2-9b-it",
600
+ "llama-3.1-8b-instant",
601
+ "llama-3.3-70b-versatile",
602
+ "llama-guard-3-8b",
603
+ "llama3-70b-8192",
604
+ "llama3-8b-8192",
605
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
606
+ "meta-llama/llama-4-scout-17b-16e-instruct",
607
+ "meta-llama/llama-guard-4-12b",
608
+ "mistral-saba-24b",
609
+ "moonshotai/kimi-k2-instruct",
610
+ "moonshotai/kimi-k2-instruct-0905",
611
+ "openai/gpt-oss-120b",
612
+ "openai/gpt-oss-20b",
613
+ "qwen-qwq-32b",
614
+ "qwen/qwen3-32b"
740
615
  ],
741
- "docUrl": "https://platform.openai.com/docs/models",
616
+ "docUrl": "https://console.groq.com/docs/models",
742
617
  "gateway": "models.dev"
743
618
  },
744
- "zhipuai-coding-plan": {
745
- "url": "https://open.bigmodel.cn/api/coding/paas/v4",
746
- "apiKeyEnvVar": "ZHIPU_API_KEY",
619
+ "moonshotai-cn": {
620
+ "url": "https://api.moonshot.cn/v1",
621
+ "apiKeyEnvVar": "MOONSHOT_API_KEY",
747
622
  "apiKeyHeader": "Authorization",
748
- "name": "Zhipu AI Coding Plan",
749
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
750
- "docUrl": "https://docs.bigmodel.cn/cn/coding-plan/overview",
623
+ "name": "Moonshot AI (China)",
624
+ "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
625
+ "docUrl": "https://platform.moonshot.cn/docs/api/chat",
751
626
  "gateway": "models.dev"
752
627
  },
753
- "perplexity": {
754
- "url": "https://api.perplexity.ai",
755
- "apiKeyEnvVar": "PERPLEXITY_API_KEY",
628
+ "github-models": {
629
+ "url": "https://models.github.ai/inference",
630
+ "apiKeyEnvVar": "GITHUB_TOKEN",
756
631
  "apiKeyHeader": "Authorization",
757
- "name": "Perplexity",
758
- "models": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
759
- "docUrl": "https://docs.perplexity.ai",
760
- "gateway": "models.dev"
761
- },
762
- "openrouter": {
763
- "url": "https://openrouter.ai/api/v1",
764
- "apiKeyEnvVar": "OPENROUTER_API_KEY",
765
- "name": "OpenRouter",
632
+ "name": "GitHub Models",
766
633
  "models": [
767
- "anthropic/claude-3.5-haiku",
768
- "anthropic/claude-3.7-sonnet",
769
- "anthropic/claude-4.5-haiku",
770
- "anthropic/claude-opus-4",
771
- "anthropic/claude-opus-4.1",
772
- "anthropic/claude-sonnet-4",
773
- "anthropic/claude-sonnet-4.5",
774
- "cognitivecomputations/dolphin3.0-mistral-24b",
775
- "cognitivecomputations/dolphin3.0-r1-mistral-24b",
776
- "deepseek/deepseek-chat-v3-0324",
777
- "deepseek/deepseek-chat-v3.1",
778
- "deepseek/deepseek-r1-0528-qwen3-8b:free",
779
- "deepseek/deepseek-r1-0528:free",
780
- "deepseek/deepseek-r1-distill-llama-70b",
781
- "deepseek/deepseek-r1-distill-qwen-14b",
782
- "deepseek/deepseek-r1:free",
783
- "deepseek/deepseek-v3-base:free",
784
- "deepseek/deepseek-v3.1-terminus",
785
- "featherless/qwerky-72b",
786
- "google/gemini-2.0-flash-001",
787
- "google/gemini-2.0-flash-exp:free",
788
- "google/gemini-2.5-flash",
789
- "google/gemini-2.5-flash-lite",
790
- "google/gemini-2.5-flash-lite-preview-09-2025",
791
- "google/gemini-2.5-flash-preview-09-2025",
792
- "google/gemini-2.5-pro",
793
- "google/gemini-2.5-pro-preview-05-06",
794
- "google/gemini-2.5-pro-preview-06-05",
795
- "google/gemma-2-9b-it:free",
796
- "google/gemma-3-12b-it",
797
- "google/gemma-3-27b-it",
798
- "google/gemma-3n-e4b-it",
799
- "google/gemma-3n-e4b-it:free",
800
- "meta-llama/llama-3.2-11b-vision-instruct",
801
- "meta-llama/llama-3.3-70b-instruct:free",
802
- "meta-llama/llama-4-scout:free",
803
- "microsoft/mai-ds-r1:free",
804
- "mistralai/codestral-2508",
805
- "mistralai/devstral-medium-2507",
806
- "mistralai/devstral-small-2505",
807
- "mistralai/devstral-small-2505:free",
808
- "mistralai/devstral-small-2507",
809
- "mistralai/mistral-7b-instruct:free",
810
- "mistralai/mistral-medium-3",
811
- "mistralai/mistral-medium-3.1",
812
- "mistralai/mistral-nemo:free",
813
- "mistralai/mistral-small-3.1-24b-instruct",
814
- "mistralai/mistral-small-3.2-24b-instruct",
815
- "mistralai/mistral-small-3.2-24b-instruct:free",
816
- "moonshotai/kimi-dev-72b:free",
817
- "moonshotai/kimi-k2",
818
- "moonshotai/kimi-k2-0905",
819
- "moonshotai/kimi-k2:free",
820
- "nousresearch/deephermes-3-llama-3-8b-preview",
821
- "nousresearch/hermes-4-405b",
822
- "nousresearch/hermes-4-70b",
634
+ "ai21-labs/ai21-jamba-1.5-large",
635
+ "ai21-labs/ai21-jamba-1.5-mini",
636
+ "cohere/cohere-command-a",
637
+ "cohere/cohere-command-r",
638
+ "cohere/cohere-command-r-08-2024",
639
+ "cohere/cohere-command-r-plus",
640
+ "cohere/cohere-command-r-plus-08-2024",
641
+ "core42/jais-30b-chat",
642
+ "deepseek/deepseek-r1",
643
+ "deepseek/deepseek-r1-0528",
644
+ "deepseek/deepseek-v3-0324",
645
+ "meta/llama-3.2-11b-vision-instruct",
646
+ "meta/llama-3.2-90b-vision-instruct",
647
+ "meta/llama-3.3-70b-instruct",
648
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
649
+ "meta/llama-4-scout-17b-16e-instruct",
650
+ "meta/meta-llama-3-70b-instruct",
651
+ "meta/meta-llama-3-8b-instruct",
652
+ "meta/meta-llama-3.1-405b-instruct",
653
+ "meta/meta-llama-3.1-70b-instruct",
654
+ "meta/meta-llama-3.1-8b-instruct",
655
+ "microsoft/mai-ds-r1",
656
+ "microsoft/phi-3-medium-128k-instruct",
657
+ "microsoft/phi-3-medium-4k-instruct",
658
+ "microsoft/phi-3-mini-128k-instruct",
659
+ "microsoft/phi-3-mini-4k-instruct",
660
+ "microsoft/phi-3-small-128k-instruct",
661
+ "microsoft/phi-3-small-8k-instruct",
662
+ "microsoft/phi-3.5-mini-instruct",
663
+ "microsoft/phi-3.5-moe-instruct",
664
+ "microsoft/phi-3.5-vision-instruct",
665
+ "microsoft/phi-4",
666
+ "microsoft/phi-4-mini-instruct",
667
+ "microsoft/phi-4-mini-reasoning",
668
+ "microsoft/phi-4-multimodal-instruct",
669
+ "microsoft/phi-4-reasoning",
670
+ "mistral-ai/codestral-2501",
671
+ "mistral-ai/ministral-3b",
672
+ "mistral-ai/mistral-large-2411",
673
+ "mistral-ai/mistral-medium-2505",
674
+ "mistral-ai/mistral-nemo",
675
+ "mistral-ai/mistral-small-2503",
823
676
  "openai/gpt-4.1",
824
677
  "openai/gpt-4.1-mini",
678
+ "openai/gpt-4.1-nano",
679
+ "openai/gpt-4o",
825
680
  "openai/gpt-4o-mini",
826
- "openai/gpt-5",
827
- "openai/gpt-5-chat",
828
- "openai/gpt-5-codex",
829
- "openai/gpt-5-image",
830
- "openai/gpt-5-mini",
831
- "openai/gpt-5-nano",
832
- "openai/gpt-oss-120b",
833
- "openai/gpt-oss-20b",
681
+ "openai/o1",
682
+ "openai/o1-mini",
683
+ "openai/o1-preview",
684
+ "openai/o3",
685
+ "openai/o3-mini",
834
686
  "openai/o4-mini",
835
- "openrouter/cypher-alpha:free",
836
- "openrouter/horizon-alpha",
837
- "openrouter/horizon-beta",
838
- "openrouter/sonoma-dusk-alpha",
839
- "openrouter/sonoma-sky-alpha",
840
- "qwen/qwen-2.5-coder-32b-instruct",
841
- "qwen/qwen2.5-vl-32b-instruct:free",
842
- "qwen/qwen2.5-vl-72b-instruct",
843
- "qwen/qwen2.5-vl-72b-instruct:free",
844
- "qwen/qwen3-14b:free",
845
- "qwen/qwen3-235b-a22b-07-25",
846
- "qwen/qwen3-235b-a22b-07-25:free",
847
- "qwen/qwen3-235b-a22b-thinking-2507",
848
- "qwen/qwen3-235b-a22b:free",
849
- "qwen/qwen3-30b-a3b-instruct-2507",
850
- "qwen/qwen3-30b-a3b-thinking-2507",
851
- "qwen/qwen3-30b-a3b:free",
852
- "qwen/qwen3-32b:free",
853
- "qwen/qwen3-8b:free",
854
- "qwen/qwen3-coder",
855
- "qwen/qwen3-coder:free",
856
- "qwen/qwen3-max",
857
- "qwen/qwen3-next-80b-a3b-instruct",
858
- "qwen/qwen3-next-80b-a3b-thinking",
859
- "qwen/qwq-32b:free",
860
- "rekaai/reka-flash-3",
861
- "sarvamai/sarvam-m:free",
862
- "thudm/glm-z1-32b:free",
863
- "tngtech/deepseek-r1t2-chimera:free",
864
- "x-ai/grok-3",
865
- "x-ai/grok-3-beta",
866
- "x-ai/grok-3-mini",
867
- "x-ai/grok-3-mini-beta",
868
- "x-ai/grok-4",
869
- "x-ai/grok-4-fast",
870
- "x-ai/grok-4-fast:free",
871
- "x-ai/grok-code-fast-1",
872
- "z-ai/glm-4.5",
873
- "z-ai/glm-4.5-air",
874
- "z-ai/glm-4.5-air:free",
875
- "z-ai/glm-4.5v",
876
- "z-ai/glm-4.6"
877
- ],
878
- "docUrl": "https://openrouter.ai/models",
879
- "gateway": "models.dev"
880
- },
881
- "synthetic": {
882
- "url": "https://api.synthetic.new/v1",
883
- "apiKeyEnvVar": "SYNTHETIC_API_KEY",
884
- "apiKeyHeader": "Authorization",
885
- "name": "Synthetic",
886
- "models": [
887
- "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
888
- "hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
889
- "hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
890
- "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
891
- "hf:deepseek-ai/DeepSeek-R1",
892
- "hf:deepseek-ai/DeepSeek-R1-0528",
893
- "hf:deepseek-ai/DeepSeek-V3",
894
- "hf:deepseek-ai/DeepSeek-V3-0324",
895
- "hf:deepseek-ai/DeepSeek-V3.1",
896
- "hf:deepseek-ai/DeepSeek-V3.1-Terminus",
897
- "hf:meta-llama/Llama-3.1-405B-Instruct",
898
- "hf:meta-llama/Llama-3.1-70B-Instruct",
899
- "hf:meta-llama/Llama-3.1-8B-Instruct",
900
- "hf:meta-llama/Llama-3.3-70B-Instruct",
901
- "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
902
- "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
903
- "hf:moonshotai/Kimi-K2-Instruct",
904
- "hf:moonshotai/Kimi-K2-Instruct-0905",
905
- "hf:openai/gpt-oss-120b",
906
- "hf:zai-org/GLM-4.5",
907
- "hf:zai-org/GLM-4.6"
687
+ "xai/grok-3",
688
+ "xai/grok-3-mini"
908
689
  ],
909
- "docUrl": "https://synthetic.new/pricing",
690
+ "docUrl": "https://docs.github.com/en/github-models",
910
691
  "gateway": "models.dev"
911
692
  },
912
693
  "deepinfra": {
@@ -923,32 +704,24 @@
923
704
  "docUrl": "https://deepinfra.com/models",
924
705
  "gateway": "models.dev"
925
706
  },
926
- "zhipuai": {
927
- "url": "https://open.bigmodel.cn/api/paas/v4",
928
- "apiKeyEnvVar": "ZHIPU_API_KEY",
929
- "apiKeyHeader": "Authorization",
930
- "name": "Zhipu AI",
931
- "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
932
- "docUrl": "https://docs.z.ai/guides/overview/pricing",
933
- "gateway": "models.dev"
934
- },
935
- "submodel": {
936
- "url": "https://llm.submodel.ai/v1",
937
- "apiKeyEnvVar": "SUBMODEL_INSTAGEN_ACCESS_KEY",
707
+ "fireworks-ai": {
708
+ "url": "https://api.fireworks.ai/inference/v1/",
709
+ "apiKeyEnvVar": "FIREWORKS_API_KEY",
938
710
  "apiKeyHeader": "Authorization",
939
- "name": "submodel",
711
+ "name": "Fireworks AI",
940
712
  "models": [
941
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
942
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
943
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
944
- "deepseek-ai/DeepSeek-R1-0528",
945
- "deepseek-ai/DeepSeek-V3-0324",
946
- "deepseek-ai/DeepSeek-V3.1",
947
- "openai/gpt-oss-120b",
948
- "zai-org/GLM-4.5-Air",
949
- "zai-org/GLM-4.5-FP8"
713
+ "accounts/fireworks/models/deepseek-r1-0528",
714
+ "accounts/fireworks/models/deepseek-v3-0324",
715
+ "accounts/fireworks/models/deepseek-v3p1",
716
+ "accounts/fireworks/models/glm-4p5",
717
+ "accounts/fireworks/models/glm-4p5-air",
718
+ "accounts/fireworks/models/gpt-oss-120b",
719
+ "accounts/fireworks/models/gpt-oss-20b",
720
+ "accounts/fireworks/models/kimi-k2-instruct",
721
+ "accounts/fireworks/models/qwen3-235b-a22b",
722
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
950
723
  ],
951
- "docUrl": "https://submodel.gitbook.io",
724
+ "docUrl": "https://fireworks.ai/docs/",
952
725
  "gateway": "models.dev"
953
726
  },
954
727
  "zai": {
@@ -960,55 +733,63 @@
960
733
  "docUrl": "https://docs.z.ai/guides/overview/pricing",
961
734
  "gateway": "models.dev"
962
735
  },
963
- "inference": {
964
- "url": "https://inference.net/v1",
965
- "apiKeyEnvVar": "INFERENCE_API_KEY",
736
+ "opencode": {
737
+ "url": "https://opencode.ai/zen/v1",
738
+ "apiKeyEnvVar": "OPENCODE_API_KEY",
966
739
  "apiKeyHeader": "Authorization",
967
- "name": "Inference",
740
+ "name": "OpenCode Zen",
968
741
  "models": [
969
- "google/gemma-3",
970
- "meta/llama-3.1-8b-instruct",
971
- "meta/llama-3.2-11b-vision-instruct",
972
- "meta/llama-3.2-1b-instruct",
973
- "meta/llama-3.2-3b-instruct",
974
- "mistral/mistral-nemo-12b-instruct",
975
- "osmosis/osmosis-structure-0.6b",
976
- "qwen/qwen-2.5-7b-vision-instruct",
977
- "qwen/qwen3-embedding-4b"
742
+ "an-gbt",
743
+ "big-pickle",
744
+ "claude-3-5-haiku",
745
+ "claude-haiku-4-5",
746
+ "claude-opus-4-1",
747
+ "claude-sonnet-4",
748
+ "claude-sonnet-4-5",
749
+ "code-supernova",
750
+ "glm-4.6",
751
+ "gpt-5",
752
+ "gpt-5-codex",
753
+ "grok-code",
754
+ "kimi-k2",
755
+ "qwen3-coder"
978
756
  ],
979
- "docUrl": "https://inference.net/models",
757
+ "docUrl": "https://opencode.ai/docs/zen",
980
758
  "gateway": "models.dev"
981
759
  },
982
- "requesty": {
983
- "url": "https://router.requesty.ai/v1",
984
- "apiKeyEnvVar": "REQUESTY_API_KEY",
760
+ "zhipuai-coding-plan": {
761
+ "url": "https://open.bigmodel.cn/api/coding/paas/v4",
762
+ "apiKeyEnvVar": "ZHIPU_API_KEY",
985
763
  "apiKeyHeader": "Authorization",
986
- "name": "Requesty",
987
- "models": [
988
- "anthropic/claude-3-7-sonnet",
989
- "anthropic/claude-4-sonnet-20250522",
990
- "anthropic/claude-opus-4",
991
- "anthropic/claude-opus-4-1-20250805",
992
- "google/gemini-2.5-flash",
993
- "google/gemini-2.5-pro",
994
- "openai/gpt-4.1",
995
- "openai/gpt-4.1-mini",
996
- "openai/gpt-4o-mini",
997
- "openai/gpt-5",
998
- "openai/gpt-5-mini",
999
- "openai/gpt-5-nano",
1000
- "openai/o4-mini"
1001
- ],
1002
- "docUrl": "https://requesty.ai/solution/llm-routing/models",
764
+ "name": "Zhipu AI Coding Plan",
765
+ "models": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
766
+ "docUrl": "https://docs.bigmodel.cn/cn/coding-plan/overview",
1003
767
  "gateway": "models.dev"
1004
768
  },
1005
- "morph": {
1006
- "url": "https://api.morphllm.com/v1",
1007
- "apiKeyEnvVar": "MORPH_API_KEY",
769
+ "inception": {
770
+ "url": "https://api.inceptionlabs.ai/v1/",
771
+ "apiKeyEnvVar": "INCEPTION_API_KEY",
1008
772
  "apiKeyHeader": "Authorization",
1009
- "name": "Morph",
1010
- "models": ["auto", "morph-v3-fast", "morph-v3-large"],
1011
- "docUrl": "https://docs.morphllm.com/api-reference/introduction",
773
+ "name": "Inception",
774
+ "models": ["mercury", "mercury-coder"],
775
+ "docUrl": "https://platform.inceptionlabs.ai/docs",
776
+ "gateway": "models.dev"
777
+ },
778
+ "llama": {
779
+ "url": "https://api.llama.com/compat/v1/",
780
+ "apiKeyEnvVar": "LLAMA_API_KEY",
781
+ "apiKeyHeader": "Authorization",
782
+ "name": "Llama",
783
+ "models": [
784
+ "cerebras-llama-4-maverick-17b-128e-instruct",
785
+ "cerebras-llama-4-scout-17b-16e-instruct",
786
+ "groq-llama-4-maverick-17b-128e-instruct",
787
+ "llama-3.3-70b-instruct",
788
+ "llama-3.3-8b-instruct",
789
+ "llama-4-maverick-17b-128e-instruct-fp8",
790
+ "llama-4-scout-17b-16e-instruct-fp8"
791
+ ],
792
+ "docUrl": "https://llama.developer.meta.com/docs/models",
1012
793
  "gateway": "models.dev"
1013
794
  },
1014
795
  "lmstudio": {
@@ -1020,118 +801,380 @@
1020
801
  "docUrl": "https://lmstudio.ai/models",
1021
802
  "gateway": "models.dev"
1022
803
  },
804
+ "openai": {
805
+ "apiKeyEnvVar": "OPENAI_API_KEY",
806
+ "name": "OpenAI",
807
+ "models": [
808
+ "codex-mini-latest",
809
+ "gpt-3.5-turbo",
810
+ "gpt-4",
811
+ "gpt-4-turbo",
812
+ "gpt-4.1",
813
+ "gpt-4.1-mini",
814
+ "gpt-4.1-nano",
815
+ "gpt-4o",
816
+ "gpt-4o-2024-05-13",
817
+ "gpt-4o-2024-08-06",
818
+ "gpt-4o-2024-11-20",
819
+ "gpt-4o-mini",
820
+ "gpt-5",
821
+ "gpt-5-chat-latest",
822
+ "gpt-5-codex",
823
+ "gpt-5-mini",
824
+ "gpt-5-nano",
825
+ "o1",
826
+ "o1-mini",
827
+ "o1-preview",
828
+ "o1-pro",
829
+ "o3",
830
+ "o3-deep-research",
831
+ "o3-mini",
832
+ "o3-pro",
833
+ "o4-mini",
834
+ "o4-mini-deep-research"
835
+ ],
836
+ "docUrl": "https://platform.openai.com/docs/models",
837
+ "gateway": "models.dev"
838
+ },
1023
839
  "anthropic": {
1024
840
  "apiKeyEnvVar": "ANTHROPIC_API_KEY",
1025
841
  "name": "Anthropic",
1026
842
  "models": [
1027
843
  "claude-3-5-haiku-20241022",
844
+ "claude-3-5-haiku-latest",
1028
845
  "claude-3-5-sonnet-20240620",
1029
846
  "claude-3-5-sonnet-20241022",
1030
847
  "claude-3-7-sonnet-20250219",
848
+ "claude-3-7-sonnet-latest",
1031
849
  "claude-3-haiku-20240307",
1032
850
  "claude-3-opus-20240229",
1033
851
  "claude-3-sonnet-20240229",
852
+ "claude-haiku-4-5",
1034
853
  "claude-haiku-4-5-20251001",
854
+ "claude-opus-4-0",
855
+ "claude-opus-4-1",
1035
856
  "claude-opus-4-1-20250805",
1036
857
  "claude-opus-4-20250514",
858
+ "claude-sonnet-4-0",
1037
859
  "claude-sonnet-4-20250514",
860
+ "claude-sonnet-4-5",
1038
861
  "claude-sonnet-4-5-20250929"
1039
862
  ],
1040
863
  "docUrl": "https://docs.anthropic.com/en/docs/about-claude/models",
1041
864
  "gateway": "models.dev"
1042
865
  },
1043
- "fireworks-ai": {
1044
- "url": "https://api.fireworks.ai/inference/v1/",
1045
- "apiKeyEnvVar": "FIREWORKS_API_KEY",
866
+ "moonshotai": {
867
+ "url": "https://api.moonshot.ai/v1",
868
+ "apiKeyEnvVar": "MOONSHOT_API_KEY",
1046
869
  "apiKeyHeader": "Authorization",
1047
- "name": "Fireworks AI",
870
+ "name": "Moonshot AI",
871
+ "models": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
872
+ "docUrl": "https://platform.moonshot.ai/docs/api/chat",
873
+ "gateway": "models.dev"
874
+ },
875
+ "inference": {
876
+ "url": "https://inference.net/v1",
877
+ "apiKeyEnvVar": "INFERENCE_API_KEY",
878
+ "apiKeyHeader": "Authorization",
879
+ "name": "Inference",
1048
880
  "models": [
1049
- "accounts/fireworks/models/deepseek-r1-0528",
1050
- "accounts/fireworks/models/deepseek-v3-0324",
1051
- "accounts/fireworks/models/deepseek-v3p1",
1052
- "accounts/fireworks/models/glm-4p5",
1053
- "accounts/fireworks/models/glm-4p5-air",
1054
- "accounts/fireworks/models/gpt-oss-120b",
1055
- "accounts/fireworks/models/gpt-oss-20b",
1056
- "accounts/fireworks/models/kimi-k2-instruct",
1057
- "accounts/fireworks/models/qwen3-235b-a22b",
1058
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
881
+ "google/gemma-3",
882
+ "meta/llama-3.1-8b-instruct",
883
+ "meta/llama-3.2-11b-vision-instruct",
884
+ "meta/llama-3.2-1b-instruct",
885
+ "meta/llama-3.2-3b-instruct",
886
+ "mistral/mistral-nemo-12b-instruct",
887
+ "osmosis/osmosis-structure-0.6b",
888
+ "qwen/qwen-2.5-7b-vision-instruct",
889
+ "qwen/qwen3-embedding-4b"
1059
890
  ],
1060
- "docUrl": "https://fireworks.ai/docs/",
891
+ "docUrl": "https://inference.net/models",
1061
892
  "gateway": "models.dev"
1062
893
  },
1063
- "modelscope": {
1064
- "url": "https://api-inference.modelscope.cn/v1",
1065
- "apiKeyEnvVar": "MODELSCOPE_API_KEY",
894
+ "baseten": {
895
+ "url": "https://inference.baseten.co/v1",
896
+ "apiKeyEnvVar": "BASETEN_API_KEY",
1066
897
  "apiKeyHeader": "Authorization",
1067
- "name": "ModelScope",
898
+ "name": "Baseten",
899
+ "models": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
900
+ "docUrl": "https://docs.baseten.co/development/model-apis/overview",
901
+ "gateway": "models.dev"
902
+ },
903
+ "cortecs": {
904
+ "url": "https://api.cortecs.ai/v1",
905
+ "apiKeyEnvVar": "CORTECS_API_KEY",
906
+ "apiKeyHeader": "Authorization",
907
+ "name": "Cortecs",
1068
908
  "models": [
1069
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1070
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1071
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1072
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1073
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1074
- "ZhipuAI/GLM-4.5"
909
+ "claude-4-5-sonnet",
910
+ "claude-sonnet-4",
911
+ "deepseek-v3-0324",
912
+ "gemini-2.5-pro",
913
+ "gpt-4.1",
914
+ "gpt-oss-120b",
915
+ "kimi-k2-instruct",
916
+ "llama-3.1-405b-instruct",
917
+ "nova-pro-v1",
918
+ "qwen3-32b",
919
+ "qwen3-coder-480b-a35b-instruct"
1075
920
  ],
1076
- "docUrl": "https://modelscope.cn/docs/model-service/API-Inference/intro",
921
+ "docUrl": "https://api.cortecs.ai/v1/models",
1077
922
  "gateway": "models.dev"
1078
923
  },
1079
- "llama": {
1080
- "url": "https://api.llama.com/compat/v1/",
1081
- "apiKeyEnvVar": "LLAMA_API_KEY",
924
+ "mistral": {
925
+ "url": "https://api.mistral.ai/v1",
926
+ "apiKeyEnvVar": "MISTRAL_API_KEY",
1082
927
  "apiKeyHeader": "Authorization",
1083
- "name": "Llama",
928
+ "name": "Mistral",
1084
929
  "models": [
1085
- "cerebras-llama-4-maverick-17b-128e-instruct",
1086
- "cerebras-llama-4-scout-17b-16e-instruct",
1087
- "groq-llama-4-maverick-17b-128e-instruct",
1088
- "llama-3.3-70b-instruct",
1089
- "llama-3.3-8b-instruct",
1090
- "llama-4-maverick-17b-128e-instruct-fp8",
1091
- "llama-4-scout-17b-16e-instruct-fp8"
930
+ "codestral-latest",
931
+ "devstral-medium-2507",
932
+ "devstral-small-2505",
933
+ "devstral-small-2507",
934
+ "magistral-medium-latest",
935
+ "magistral-small",
936
+ "ministral-3b-latest",
937
+ "ministral-8b-latest",
938
+ "mistral-large-latest",
939
+ "mistral-medium-2505",
940
+ "mistral-medium-2508",
941
+ "mistral-medium-latest",
942
+ "mistral-nemo",
943
+ "mistral-small-latest",
944
+ "open-mistral-7b",
945
+ "open-mixtral-8x22b",
946
+ "open-mixtral-8x7b",
947
+ "pixtral-12b",
948
+ "pixtral-large-latest"
1092
949
  ],
1093
- "docUrl": "https://llama.developer.meta.com/docs/models",
950
+ "docUrl": "https://docs.mistral.ai/getting-started/models/",
1094
951
  "gateway": "models.dev"
1095
952
  },
1096
- "cerebras": {
1097
- "url": "https://api.cerebras.ai/v1",
1098
- "apiKeyEnvVar": "CEREBRAS_API_KEY",
953
+ "venice": {
954
+ "url": "https://api.venice.ai/api/v1",
955
+ "apiKeyEnvVar": "VENICE_API_KEY",
1099
956
  "apiKeyHeader": "Authorization",
1100
- "name": "Cerebras",
1101
- "models": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1102
- "docUrl": "https://inference-docs.cerebras.ai/models/overview",
957
+ "name": "Venice AI",
958
+ "models": [
959
+ "deepseek-coder-v2-lite",
960
+ "deepseek-r1-671b",
961
+ "dolphin-2.9.2-qwen2-72b",
962
+ "llama-3.1-405b",
963
+ "llama-3.2-3b",
964
+ "llama-3.3-70b",
965
+ "mistral-31-24b",
966
+ "qwen-2.5-coder-32b",
967
+ "qwen-2.5-qwq-32b",
968
+ "qwen-2.5-vl",
969
+ "qwen3-235b",
970
+ "qwen3-4b",
971
+ "venice-uncensored"
972
+ ],
973
+ "docUrl": "https://docs.venice.ai",
1103
974
  "gateway": "models.dev"
1104
975
  },
1105
- "netlify": {
1106
- "apiKeyEnvVar": ["NETLIFY_TOKEN", "NETLIFY_SITE_ID"],
976
+ "alibaba": {
977
+ "url": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
978
+ "apiKeyEnvVar": "DASHSCOPE_API_KEY",
1107
979
  "apiKeyHeader": "Authorization",
1108
- "name": "Netlify",
1109
- "gateway": "netlify",
980
+ "name": "Alibaba",
1110
981
  "models": [
1111
- "anthropic/claude-3-5-haiku-20241022",
1112
- "anthropic/claude-3-5-haiku-latest",
1113
- "anthropic/claude-3-7-sonnet-20250219",
1114
- "anthropic/claude-3-7-sonnet-latest",
1115
- "anthropic/claude-3-haiku-20240307",
1116
- "anthropic/claude-haiku-4-5-20251001",
1117
- "anthropic/claude-opus-4-1-20250805",
1118
- "anthropic/claude-opus-4-20250514",
1119
- "anthropic/claude-sonnet-4-20250514",
1120
- "anthropic/claude-sonnet-4-5-20250929",
1121
- "gemini/gemini-2.0-flash",
1122
- "gemini/gemini-2.0-flash-lite",
1123
- "gemini/gemini-2.5-flash",
1124
- "gemini/gemini-2.5-flash-image-preview",
1125
- "gemini/gemini-2.5-flash-lite",
1126
- "gemini/gemini-2.5-flash-lite-preview-09-2025",
1127
- "gemini/gemini-2.5-flash-preview-09-2025",
1128
- "gemini/gemini-2.5-pro",
1129
- "gemini/gemini-flash-latest",
1130
- "gemini/gemini-flash-lite-latest",
1131
- "openai/codex-mini-latest",
1132
- "openai/gpt-4.1",
1133
- "openai/gpt-4.1-mini",
1134
- "openai/gpt-4.1-nano",
982
+ "qvq-max",
983
+ "qwen-flash",
984
+ "qwen-max",
985
+ "qwen-mt-plus",
986
+ "qwen-mt-turbo",
987
+ "qwen-omni-turbo",
988
+ "qwen-omni-turbo-realtime",
989
+ "qwen-plus",
990
+ "qwen-plus-character-ja",
991
+ "qwen-turbo",
992
+ "qwen-vl-max",
993
+ "qwen-vl-ocr",
994
+ "qwen-vl-plus",
995
+ "qwen2-5-14b-instruct",
996
+ "qwen2-5-32b-instruct",
997
+ "qwen2-5-72b-instruct",
998
+ "qwen2-5-7b-instruct",
999
+ "qwen2-5-omni-7b",
1000
+ "qwen2-5-vl-72b-instruct",
1001
+ "qwen2-5-vl-7b-instruct",
1002
+ "qwen3-14b",
1003
+ "qwen3-235b-a22b",
1004
+ "qwen3-32b",
1005
+ "qwen3-8b",
1006
+ "qwen3-asr-flash",
1007
+ "qwen3-coder-30b-a3b-instruct",
1008
+ "qwen3-coder-480b-a35b-instruct",
1009
+ "qwen3-coder-flash",
1010
+ "qwen3-coder-plus",
1011
+ "qwen3-livetranslate-flash-realtime",
1012
+ "qwen3-max",
1013
+ "qwen3-next-80b-a3b-instruct",
1014
+ "qwen3-next-80b-a3b-thinking",
1015
+ "qwen3-omni-flash",
1016
+ "qwen3-omni-flash-realtime",
1017
+ "qwen3-vl-235b-a22b",
1018
+ "qwen3-vl-30b-a3b",
1019
+ "qwen3-vl-plus",
1020
+ "qwq-plus"
1021
+ ],
1022
+ "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
1023
+ "gateway": "models.dev"
1024
+ },
1025
+ "alibaba-cn": {
1026
+ "url": "https://dashscope.aliyuncs.com/compatible-mode/v1",
1027
+ "apiKeyEnvVar": "DASHSCOPE_API_KEY",
1028
+ "apiKeyHeader": "Authorization",
1029
+ "name": "Alibaba (China)",
1030
+ "models": [
1031
+ "deepseek-r1",
1032
+ "deepseek-r1-0528",
1033
+ "deepseek-r1-distill-llama-70b",
1034
+ "deepseek-r1-distill-llama-8b",
1035
+ "deepseek-r1-distill-qwen-1-5b",
1036
+ "deepseek-r1-distill-qwen-14b",
1037
+ "deepseek-r1-distill-qwen-32b",
1038
+ "deepseek-r1-distill-qwen-7b",
1039
+ "deepseek-v3",
1040
+ "deepseek-v3-1",
1041
+ "deepseek-v3-2-exp",
1042
+ "moonshot-kimi-k2-instruct",
1043
+ "qvq-max",
1044
+ "qwen-deep-research",
1045
+ "qwen-doc-turbo",
1046
+ "qwen-flash",
1047
+ "qwen-long",
1048
+ "qwen-math-plus",
1049
+ "qwen-math-turbo",
1050
+ "qwen-max",
1051
+ "qwen-mt-plus",
1052
+ "qwen-mt-turbo",
1053
+ "qwen-omni-turbo",
1054
+ "qwen-omni-turbo-realtime",
1055
+ "qwen-plus",
1056
+ "qwen-plus-character",
1057
+ "qwen-turbo",
1058
+ "qwen-vl-max",
1059
+ "qwen-vl-ocr",
1060
+ "qwen-vl-plus",
1061
+ "qwen2-5-14b-instruct",
1062
+ "qwen2-5-32b-instruct",
1063
+ "qwen2-5-72b-instruct",
1064
+ "qwen2-5-7b-instruct",
1065
+ "qwen2-5-coder-32b-instruct",
1066
+ "qwen2-5-coder-7b-instruct",
1067
+ "qwen2-5-math-72b-instruct",
1068
+ "qwen2-5-math-7b-instruct",
1069
+ "qwen2-5-omni-7b",
1070
+ "qwen2-5-vl-72b-instruct",
1071
+ "qwen2-5-vl-7b-instruct",
1072
+ "qwen3-14b",
1073
+ "qwen3-235b-a22b",
1074
+ "qwen3-32b",
1075
+ "qwen3-8b",
1076
+ "qwen3-asr-flash",
1077
+ "qwen3-coder-30b-a3b-instruct",
1078
+ "qwen3-coder-480b-a35b-instruct",
1079
+ "qwen3-coder-flash",
1080
+ "qwen3-coder-plus",
1081
+ "qwen3-max",
1082
+ "qwen3-next-80b-a3b-instruct",
1083
+ "qwen3-next-80b-a3b-thinking",
1084
+ "qwen3-omni-flash",
1085
+ "qwen3-omni-flash-realtime",
1086
+ "qwen3-vl-235b-a22b",
1087
+ "qwen3-vl-30b-a3b",
1088
+ "qwen3-vl-plus",
1089
+ "qwq-32b",
1090
+ "qwq-plus",
1091
+ "tongyi-intent-detect-v3"
1092
+ ],
1093
+ "docUrl": "https://www.alibabacloud.com/help/en/model-studio/models",
1094
+ "gateway": "models.dev"
1095
+ },
1096
+ "chutes": {
1097
+ "url": "https://llm.chutes.ai/v1",
1098
+ "apiKeyEnvVar": "CHUTES_API_KEY",
1099
+ "apiKeyHeader": "Authorization",
1100
+ "name": "Chutes",
1101
+ "models": [
1102
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1103
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1104
+ "Qwen/Qwen3-30B-A3B",
1105
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1106
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1107
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1108
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1109
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1110
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1111
+ "chutesai/Devstral-Small-2505",
1112
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1113
+ "deepseek-ai/DeepSeek-R1-0528",
1114
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1115
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1116
+ "deepseek-ai/DeepSeek-V3-0324",
1117
+ "deepseek-ai/DeepSeek-V3.1",
1118
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1119
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1120
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1121
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1122
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1123
+ "moonshotai/Kimi-Dev-72B",
1124
+ "moonshotai/Kimi-K2-Instruct-0905",
1125
+ "moonshotai/Kimi-K2-Instruct-75k",
1126
+ "moonshotai/Kimi-VL-A3B-Thinking",
1127
+ "openai/gpt-oss-120b",
1128
+ "tngtech/DeepSeek-R1T-Chimera",
1129
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1130
+ "zai-org/GLM-4.5-Air",
1131
+ "zai-org/GLM-4.5-FP8",
1132
+ "zai-org/GLM-4.5-turbo",
1133
+ "zai-org/GLM-4.6-FP8",
1134
+ "zai-org/GLM-4.6-turbo"
1135
+ ],
1136
+ "docUrl": "https://llm.chutes.ai/v1/models",
1137
+ "gateway": "models.dev"
1138
+ },
1139
+ "upstage": {
1140
+ "url": "https://api.upstage.ai",
1141
+ "apiKeyEnvVar": "UPSTAGE_API_KEY",
1142
+ "apiKeyHeader": "Authorization",
1143
+ "name": "Upstage",
1144
+ "models": ["solar-mini", "solar-pro2"],
1145
+ "docUrl": "https://developers.upstage.ai/docs/apis/chat",
1146
+ "gateway": "models.dev"
1147
+ },
1148
+ "netlify": {
1149
+ "apiKeyEnvVar": ["NETLIFY_TOKEN", "NETLIFY_SITE_ID"],
1150
+ "apiKeyHeader": "Authorization",
1151
+ "name": "Netlify",
1152
+ "gateway": "netlify",
1153
+ "models": [
1154
+ "anthropic/claude-3-5-haiku-20241022",
1155
+ "anthropic/claude-3-5-haiku-latest",
1156
+ "anthropic/claude-3-7-sonnet-20250219",
1157
+ "anthropic/claude-3-7-sonnet-latest",
1158
+ "anthropic/claude-3-haiku-20240307",
1159
+ "anthropic/claude-haiku-4-5-20251001",
1160
+ "anthropic/claude-opus-4-1-20250805",
1161
+ "anthropic/claude-opus-4-20250514",
1162
+ "anthropic/claude-sonnet-4-20250514",
1163
+ "anthropic/claude-sonnet-4-5-20250929",
1164
+ "gemini/gemini-2.0-flash",
1165
+ "gemini/gemini-2.0-flash-lite",
1166
+ "gemini/gemini-2.5-flash",
1167
+ "gemini/gemini-2.5-flash-image-preview",
1168
+ "gemini/gemini-2.5-flash-lite",
1169
+ "gemini/gemini-2.5-flash-lite-preview-09-2025",
1170
+ "gemini/gemini-2.5-flash-preview-09-2025",
1171
+ "gemini/gemini-2.5-pro",
1172
+ "gemini/gemini-flash-latest",
1173
+ "gemini/gemini-flash-lite-latest",
1174
+ "openai/codex-mini-latest",
1175
+ "openai/gpt-4.1",
1176
+ "openai/gpt-4.1-mini",
1177
+ "openai/gpt-4.1-nano",
1135
1178
  "openai/gpt-4o",
1136
1179
  "openai/gpt-4o-mini",
1137
1180
  "openai/gpt-5",
@@ -1147,52 +1190,59 @@
1147
1190
  }
1148
1191
  },
1149
1192
  "models": {
1150
- "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1151
- "lucidquery": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1152
- "moonshotai": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1153
- "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1154
- "alibaba": [
1155
- "qvq-max",
1156
- "qwen-flash",
1157
- "qwen-max",
1158
- "qwen-mt-plus",
1159
- "qwen-mt-turbo",
1160
- "qwen-omni-turbo",
1161
- "qwen-omni-turbo-realtime",
1162
- "qwen-plus",
1163
- "qwen-plus-character-ja",
1164
- "qwen-turbo",
1165
- "qwen-vl-max",
1166
- "qwen-vl-ocr",
1167
- "qwen-vl-plus",
1168
- "qwen2-5-14b-instruct",
1169
- "qwen2-5-32b-instruct",
1170
- "qwen2-5-72b-instruct",
1171
- "qwen2-5-7b-instruct",
1172
- "qwen2-5-omni-7b",
1173
- "qwen2-5-vl-72b-instruct",
1174
- "qwen2-5-vl-7b-instruct",
1175
- "qwen3-14b",
1176
- "qwen3-235b-a22b",
1177
- "qwen3-32b",
1178
- "qwen3-8b",
1179
- "qwen3-asr-flash",
1180
- "qwen3-coder-30b-a3b-instruct",
1181
- "qwen3-coder-480b-a35b-instruct",
1182
- "qwen3-coder-flash",
1183
- "qwen3-coder-plus",
1184
- "qwen3-livetranslate-flash-realtime",
1185
- "qwen3-max",
1186
- "qwen3-next-80b-a3b-instruct",
1187
- "qwen3-next-80b-a3b-thinking",
1188
- "qwen3-omni-flash",
1189
- "qwen3-omni-flash-realtime",
1190
- "qwen3-vl-235b-a22b",
1191
- "qwen3-vl-30b-a3b",
1192
- "qwen3-vl-plus",
1193
- "qwq-plus"
1193
+ "nvidia": [
1194
+ "black-forest-labs/flux.1-dev",
1195
+ "deepseek-ai/deepseek-v3.1",
1196
+ "deepseek-ai/deepseek-v3.1-terminus",
1197
+ "google/gemma-3-27b-it",
1198
+ "microsoft/phi-4-mini-instruct",
1199
+ "moonshotai/kimi-k2-instruct",
1200
+ "moonshotai/kimi-k2-instruct-0905",
1201
+ "nvidia/cosmos-nemotron-34b",
1202
+ "nvidia/llama-3.1-nemotron-ultra-253b-v1",
1203
+ "nvidia/nemoretriever-ocr-v1",
1204
+ "nvidia/parakeet-tdt-0.6b-v2",
1205
+ "openai/gpt-oss-120b",
1206
+ "openai/whisper-large-v3",
1207
+ "qwen/qwen3-235b-a22b",
1208
+ "qwen/qwen3-coder-480b-a35b-instruct"
1194
1209
  ],
1195
- "xai": [
1210
+ "modelscope": [
1211
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1212
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1213
+ "Qwen/Qwen3-30B-A3B-Instruct-2507",
1214
+ "Qwen/Qwen3-30B-A3B-Thinking-2507",
1215
+ "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1216
+ "ZhipuAI/GLM-4.5",
1217
+ "ZhipuAI/GLM-4.6"
1218
+ ],
1219
+ "aihubmix": [
1220
+ "DeepSeek-V3.2-Exp",
1221
+ "DeepSeek-V3.2-Exp-Think",
1222
+ "Kimi-K2-0905",
1223
+ "claude-haiku-4-5",
1224
+ "claude-opus-4-1",
1225
+ "claude-sonnet-4-5",
1226
+ "gemini-2.5-flash",
1227
+ "gemini-2.5-pro",
1228
+ "glm-4.6",
1229
+ "gpt-4.1",
1230
+ "gpt-4.1-mini",
1231
+ "gpt-4.1-nano",
1232
+ "gpt-4o",
1233
+ "gpt-4o-2024-11-20",
1234
+ "gpt-5",
1235
+ "gpt-5-codex",
1236
+ "gpt-5-mini",
1237
+ "gpt-5-nano",
1238
+ "gpt-5-pro",
1239
+ "o4-mini",
1240
+ "qwen3-235b-a22b-instruct-2507",
1241
+ "qwen3-235b-a22b-thinking-2507",
1242
+ "qwen3-coder-480b-a35b-instruct"
1243
+ ],
1244
+ "lucidquery": ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
1245
+ "xai": [
1196
1246
  "grok-2",
1197
1247
  "grok-2-1212",
1198
1248
  "grok-2-latest",
@@ -1205,395 +1255,47 @@
1205
1255
  "grok-3-latest",
1206
1256
  "grok-3-mini",
1207
1257
  "grok-3-mini-fast",
1208
- "grok-3-mini-fast-latest",
1209
- "grok-3-mini-latest",
1210
- "grok-4",
1211
- "grok-4-fast",
1212
- "grok-4-fast-non-reasoning",
1213
- "grok-beta",
1214
- "grok-code-fast-1",
1215
- "grok-vision-beta"
1216
- ],
1217
- "nvidia": [
1218
- "black-forest-labs/flux.1-dev",
1219
- "deepseek-ai/deepseek-v3.1",
1220
- "google/gemma-3-27b-it",
1221
- "microsoft/phi-4-mini-instruct",
1222
- "moonshotai/kimi-k2-instruct",
1223
- "moonshotai/kimi-k2-instruct-0905",
1224
- "nvidia/cosmos-nemotron-34b",
1225
- "nvidia/llama-3.1-nemotron-ultra-253b-v1",
1226
- "nvidia/nemoretriever-ocr-v1",
1227
- "nvidia/parakeet-tdt-0.6b-v2",
1228
- "openai/gpt-oss-120b",
1229
- "openai/whisper-large-v3",
1230
- "qwen/qwen3-235b-a22b",
1231
- "qwen/qwen3-coder-480b-a35b-instruct"
1232
- ],
1233
- "upstage": ["solar-mini", "solar-pro2"],
1234
- "groq": [
1235
- "deepseek-r1-distill-llama-70b",
1236
- "gemma2-9b-it",
1237
- "llama-3.1-8b-instant",
1238
- "llama-3.3-70b-versatile",
1239
- "llama-guard-3-8b",
1240
- "llama3-70b-8192",
1241
- "llama3-8b-8192",
1242
- "meta-llama/llama-4-maverick-17b-128e-instruct",
1243
- "meta-llama/llama-4-scout-17b-16e-instruct",
1244
- "meta-llama/llama-guard-4-12b",
1245
- "mistral-saba-24b",
1246
- "moonshotai/kimi-k2-instruct",
1247
- "moonshotai/kimi-k2-instruct-0905",
1248
- "openai/gpt-oss-120b",
1249
- "openai/gpt-oss-20b",
1250
- "qwen-qwq-32b",
1251
- "qwen/qwen3-32b"
1252
- ],
1253
- "mistral": [
1254
- "codestral-latest",
1255
- "devstral-medium-2507",
1256
- "devstral-small-2505",
1257
- "devstral-small-2507",
1258
- "magistral-medium-latest",
1259
- "magistral-small",
1260
- "ministral-3b-latest",
1261
- "ministral-8b-latest",
1262
- "mistral-large-latest",
1263
- "mistral-medium-2505",
1264
- "mistral-medium-2508",
1265
- "mistral-medium-latest",
1266
- "mistral-nemo",
1267
- "mistral-small-latest",
1268
- "open-mistral-7b",
1269
- "open-mixtral-8x22b",
1270
- "open-mixtral-8x7b",
1271
- "pixtral-12b",
1272
- "pixtral-large-latest"
1273
- ],
1274
- "vercel": [
1275
- "alibaba/qwen3-coder-plus",
1276
- "alibaba/qwen3-max",
1277
- "alibaba/qwen3-next-80b-a3b-instruct",
1278
- "alibaba/qwen3-next-80b-a3b-thinking",
1279
- "alibaba/qwen3-vl-instruct",
1280
- "alibaba/qwen3-vl-thinking",
1281
- "amazon/nova-lite",
1282
- "amazon/nova-micro",
1283
- "amazon/nova-pro",
1284
- "anthropic/claude-3-5-haiku",
1285
- "anthropic/claude-3-haiku",
1286
- "anthropic/claude-3-opus",
1287
- "anthropic/claude-3.5-sonnet",
1288
- "anthropic/claude-3.7-sonnet",
1289
- "anthropic/claude-4-1-opus",
1290
- "anthropic/claude-4-opus",
1291
- "anthropic/claude-4-sonnet",
1292
- "anthropic/claude-4.5-sonnet",
1293
- "anthropic/claude-haiku-4.5",
1294
- "cerebras/qwen3-coder",
1295
- "deepseek/deepseek-r1",
1296
- "deepseek/deepseek-r1-distill-llama-70b",
1297
- "deepseek/deepseek-v3.1-terminus",
1298
- "deepseek/deepseek-v3.2-exp",
1299
- "deepseek/deepseek-v3.2-exp-thinking",
1300
- "google/gemini-2.0-flash",
1301
- "google/gemini-2.0-flash-lite",
1302
- "google/gemini-2.5-flash",
1303
- "google/gemini-2.5-flash-lite",
1304
- "google/gemini-2.5-flash-lite-preview-09-2025",
1305
- "google/gemini-2.5-flash-preview-09-2025",
1306
- "google/gemini-2.5-pro",
1307
- "meta/llama-3.3-70b",
1308
- "meta/llama-4-maverick",
1309
- "meta/llama-4-scout",
1310
- "mistral/codestral",
1311
- "mistral/magistral-medium",
1312
- "mistral/magistral-small",
1313
- "mistral/ministral-3b",
1314
- "mistral/ministral-8b",
1315
- "mistral/mistral-large",
1316
- "mistral/mistral-small",
1317
- "mistral/mixtral-8x22b-instruct",
1318
- "mistral/pixtral-12b",
1319
- "mistral/pixtral-large",
1320
- "moonshotai/kimi-k2",
1321
- "morph/morph-v3-fast",
1322
- "morph/morph-v3-large",
1323
- "openai/gpt-4-turbo",
1324
- "openai/gpt-4.1",
1325
- "openai/gpt-4.1-mini",
1326
- "openai/gpt-4.1-nano",
1327
- "openai/gpt-4o",
1328
- "openai/gpt-4o-mini",
1329
- "openai/gpt-5",
1330
- "openai/gpt-5-codex",
1331
- "openai/gpt-5-mini",
1332
- "openai/gpt-5-nano",
1333
- "openai/gpt-oss-120b",
1334
- "openai/gpt-oss-20b",
1335
- "openai/o1",
1336
- "openai/o3",
1337
- "openai/o3-mini",
1338
- "openai/o4-mini",
1339
- "perplexity/sonar",
1340
- "perplexity/sonar-pro",
1341
- "perplexity/sonar-reasoning",
1342
- "perplexity/sonar-reasoning-pro",
1343
- "vercel/v0-1.0-md",
1344
- "vercel/v0-1.5-md",
1345
- "xai/grok-2",
1346
- "xai/grok-2-vision",
1347
- "xai/grok-3",
1348
- "xai/grok-3-fast",
1349
- "xai/grok-3-mini",
1350
- "xai/grok-3-mini-fast",
1351
- "xai/grok-4",
1352
- "xai/grok-4-fast",
1353
- "xai/grok-4-fast-non-reasoning",
1354
- "xai/grok-code-fast-1",
1355
- "zai/glm-4.5",
1356
- "zai/glm-4.5-air",
1357
- "zai/glm-4.5v",
1358
- "zai/glm-4.6"
1359
- ],
1360
- "nebius": [
1361
- "NousResearch/hermes-4-405b",
1362
- "NousResearch/hermes-4-70b",
1363
- "deepseek-ai/deepseek-v3",
1364
- "meta-llama/llama-3.3-70b-instruct-base",
1365
- "meta-llama/llama-3.3-70b-instruct-fast",
1366
- "meta-llama/llama-3_1-405b-instruct",
1367
- "moonshotai/kimi-k2-instruct",
1368
- "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1369
- "openai/gpt-oss-120b",
1370
- "openai/gpt-oss-20b",
1371
- "qwen/qwen3-235b-a22b-instruct-2507",
1372
- "qwen/qwen3-235b-a22b-thinking-2507",
1373
- "qwen/qwen3-coder-480b-a35b-instruct",
1374
- "zai-org/glm-4.5",
1375
- "zai-org/glm-4.5-air"
1376
- ],
1377
- "deepseek": ["deepseek-chat", "deepseek-reasoner"],
1378
- "alibaba-cn": [
1379
- "deepseek-r1",
1380
- "deepseek-r1-0528",
1381
- "deepseek-r1-distill-llama-70b",
1382
- "deepseek-r1-distill-llama-8b",
1383
- "deepseek-r1-distill-qwen-1-5b",
1384
- "deepseek-r1-distill-qwen-14b",
1385
- "deepseek-r1-distill-qwen-32b",
1386
- "deepseek-r1-distill-qwen-7b",
1387
- "deepseek-v3",
1388
- "deepseek-v3-1",
1389
- "deepseek-v3-2-exp",
1390
- "moonshot-kimi-k2-instruct",
1391
- "qvq-max",
1392
- "qwen-deep-research",
1393
- "qwen-doc-turbo",
1394
- "qwen-flash",
1395
- "qwen-long",
1396
- "qwen-math-plus",
1397
- "qwen-math-turbo",
1398
- "qwen-max",
1399
- "qwen-mt-plus",
1400
- "qwen-mt-turbo",
1401
- "qwen-omni-turbo",
1402
- "qwen-omni-turbo-realtime",
1403
- "qwen-plus",
1404
- "qwen-plus-character",
1405
- "qwen-turbo",
1406
- "qwen-vl-max",
1407
- "qwen-vl-ocr",
1408
- "qwen-vl-plus",
1409
- "qwen2-5-14b-instruct",
1410
- "qwen2-5-32b-instruct",
1411
- "qwen2-5-72b-instruct",
1412
- "qwen2-5-7b-instruct",
1413
- "qwen2-5-coder-32b-instruct",
1414
- "qwen2-5-coder-7b-instruct",
1415
- "qwen2-5-math-72b-instruct",
1416
- "qwen2-5-math-7b-instruct",
1417
- "qwen2-5-omni-7b",
1418
- "qwen2-5-vl-72b-instruct",
1419
- "qwen2-5-vl-7b-instruct",
1420
- "qwen3-14b",
1421
- "qwen3-235b-a22b",
1422
- "qwen3-32b",
1423
- "qwen3-8b",
1424
- "qwen3-asr-flash",
1425
- "qwen3-coder-30b-a3b-instruct",
1426
- "qwen3-coder-480b-a35b-instruct",
1427
- "qwen3-coder-flash",
1428
- "qwen3-coder-plus",
1429
- "qwen3-max",
1430
- "qwen3-next-80b-a3b-instruct",
1431
- "qwen3-next-80b-a3b-thinking",
1432
- "qwen3-omni-flash",
1433
- "qwen3-omni-flash-realtime",
1434
- "qwen3-vl-235b-a22b",
1435
- "qwen3-vl-30b-a3b",
1436
- "qwen3-vl-plus",
1437
- "qwq-32b",
1438
- "qwq-plus",
1439
- "tongyi-intent-detect-v3"
1440
- ],
1441
- "venice": [
1442
- "deepseek-coder-v2-lite",
1443
- "deepseek-r1-671b",
1444
- "dolphin-2.9.2-qwen2-72b",
1445
- "llama-3.1-405b",
1446
- "llama-3.2-3b",
1447
- "llama-3.3-70b",
1448
- "mistral-31-24b",
1449
- "qwen-2.5-coder-32b",
1450
- "qwen-2.5-qwq-32b",
1451
- "qwen-2.5-vl",
1452
- "qwen3-235b",
1453
- "qwen3-4b",
1454
- "venice-uncensored"
1455
- ],
1456
- "chutes": [
1457
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1458
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1459
- "Qwen/Qwen3-30B-A3B",
1460
- "Qwen/Qwen3-30B-A3B-Instruct-2507",
1461
- "Qwen/Qwen3-30B-A3B-Thinking-2507",
1462
- "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1463
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1464
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1465
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1466
- "chutesai/Devstral-Small-2505",
1467
- "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1468
- "deepseek-ai/DeepSeek-R1-0528",
1469
- "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1470
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1471
- "deepseek-ai/DeepSeek-V3-0324",
1472
- "deepseek-ai/DeepSeek-V3.1",
1473
- "deepseek-ai/DeepSeek-V3.1-Terminus",
1474
- "deepseek-ai/DeepSeek-V3.1-turbo",
1475
- "deepseek-ai/DeepSeek-V3.1:THINKING",
1476
- "deepseek-ai/DeepSeek-V3.2-Exp",
1477
- "meituan-longcat/LongCat-Flash-Chat-FP8",
1478
- "moonshotai/Kimi-Dev-72B",
1479
- "moonshotai/Kimi-K2-Instruct-0905",
1480
- "moonshotai/Kimi-K2-Instruct-75k",
1481
- "moonshotai/Kimi-VL-A3B-Thinking",
1482
- "openai/gpt-oss-120b",
1483
- "tngtech/DeepSeek-R1T-Chimera",
1484
- "tngtech/DeepSeek-TNG-R1T2-Chimera",
1485
- "zai-org/GLM-4.5-Air",
1486
- "zai-org/GLM-4.5-FP8",
1487
- "zai-org/GLM-4.5-turbo",
1488
- "zai-org/GLM-4.6-FP8",
1489
- "zai-org/GLM-4.6-turbo"
1490
- ],
1491
- "cortecs": [
1492
- "claude-4-5-sonnet",
1493
- "claude-sonnet-4",
1494
- "deepseek-v3-0324",
1495
- "gemini-2.5-pro",
1496
- "gpt-4.1",
1497
- "gpt-oss-120b",
1498
- "kimi-k2-instruct",
1499
- "llama-3.1-405b-instruct",
1500
- "nova-pro-v1",
1501
- "qwen3-32b",
1502
- "qwen3-coder-480b-a35b-instruct"
1503
- ],
1504
- "github-models": [
1505
- "ai21-labs/ai21-jamba-1.5-large",
1506
- "ai21-labs/ai21-jamba-1.5-mini",
1507
- "cohere/cohere-command-a",
1508
- "cohere/cohere-command-r",
1509
- "cohere/cohere-command-r-08-2024",
1510
- "cohere/cohere-command-r-plus",
1511
- "cohere/cohere-command-r-plus-08-2024",
1512
- "core42/jais-30b-chat",
1513
- "deepseek/deepseek-r1",
1514
- "deepseek/deepseek-r1-0528",
1515
- "deepseek/deepseek-v3-0324",
1516
- "meta/llama-3.2-11b-vision-instruct",
1517
- "meta/llama-3.2-90b-vision-instruct",
1518
- "meta/llama-3.3-70b-instruct",
1519
- "meta/llama-4-maverick-17b-128e-instruct-fp8",
1520
- "meta/llama-4-scout-17b-16e-instruct",
1521
- "meta/meta-llama-3-70b-instruct",
1522
- "meta/meta-llama-3-8b-instruct",
1523
- "meta/meta-llama-3.1-405b-instruct",
1524
- "meta/meta-llama-3.1-70b-instruct",
1525
- "meta/meta-llama-3.1-8b-instruct",
1526
- "microsoft/mai-ds-r1",
1527
- "microsoft/phi-3-medium-128k-instruct",
1528
- "microsoft/phi-3-medium-4k-instruct",
1529
- "microsoft/phi-3-mini-128k-instruct",
1530
- "microsoft/phi-3-mini-4k-instruct",
1531
- "microsoft/phi-3-small-128k-instruct",
1532
- "microsoft/phi-3-small-8k-instruct",
1533
- "microsoft/phi-3.5-mini-instruct",
1534
- "microsoft/phi-3.5-moe-instruct",
1535
- "microsoft/phi-3.5-vision-instruct",
1536
- "microsoft/phi-4",
1537
- "microsoft/phi-4-mini-instruct",
1538
- "microsoft/phi-4-mini-reasoning",
1539
- "microsoft/phi-4-multimodal-instruct",
1540
- "microsoft/phi-4-reasoning",
1541
- "mistral-ai/codestral-2501",
1542
- "mistral-ai/ministral-3b",
1543
- "mistral-ai/mistral-large-2411",
1544
- "mistral-ai/mistral-medium-2505",
1545
- "mistral-ai/mistral-nemo",
1546
- "mistral-ai/mistral-small-2503",
1547
- "openai/gpt-4.1",
1548
- "openai/gpt-4.1-mini",
1549
- "openai/gpt-4.1-nano",
1550
- "openai/gpt-4o",
1551
- "openai/gpt-4o-mini",
1552
- "openai/o1",
1553
- "openai/o1-mini",
1554
- "openai/o1-preview",
1555
- "openai/o3",
1556
- "openai/o3-mini",
1557
- "openai/o4-mini",
1558
- "xai/grok-3",
1559
- "xai/grok-3-mini"
1560
- ],
1561
- "togetherai": [
1562
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1563
- "deepseek-ai/DeepSeek-R1",
1564
- "deepseek-ai/DeepSeek-V3",
1565
- "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1566
- "moonshotai/Kimi-K2-Instruct",
1567
- "openai/gpt-oss-120b"
1568
- ],
1569
- "baseten": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905"],
1570
- "huggingface": [
1571
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1572
- "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1573
- "Qwen/Qwen3-Next-80B-A3B-Instruct",
1574
- "Qwen/Qwen3-Next-80B-A3B-Thinking",
1575
- "deepseek-ai/DeepSeek-R1-0528",
1576
- "deepseek-ai/Deepseek-V3-0324",
1577
- "moonshotai/Kimi-K2-Instruct",
1578
- "moonshotai/Kimi-K2-Instruct-0905",
1579
- "zai-org/GLM-4.5",
1580
- "zai-org/GLM-4.5-Air",
1581
- "zai-org/GLM-4.6"
1258
+ "grok-3-mini-fast-latest",
1259
+ "grok-3-mini-latest",
1260
+ "grok-4",
1261
+ "grok-4-fast",
1262
+ "grok-4-fast-non-reasoning",
1263
+ "grok-beta",
1264
+ "grok-code-fast-1",
1265
+ "grok-vision-beta"
1582
1266
  ],
1583
- "opencode": [
1584
- "an-g8x",
1585
- "claude-3-5-haiku",
1586
- "claude-haiku-4-5",
1587
- "claude-opus-4-1",
1588
- "claude-sonnet-4",
1589
- "claude-sonnet-4-5",
1590
- "code-supernova",
1591
- "glm-4.6",
1592
- "gpt-5",
1593
- "gpt-5-codex",
1594
- "grok-code",
1595
- "kimi-k2",
1596
- "qwen3-coder"
1267
+ "deepseek": ["deepseek-chat", "deepseek-reasoner"],
1268
+ "requesty": [
1269
+ "anthropic/claude-3-7-sonnet",
1270
+ "anthropic/claude-4-sonnet-20250522",
1271
+ "anthropic/claude-opus-4",
1272
+ "anthropic/claude-opus-4-1-20250805",
1273
+ "google/gemini-2.5-flash",
1274
+ "google/gemini-2.5-pro",
1275
+ "openai/gpt-4.1",
1276
+ "openai/gpt-4.1-mini",
1277
+ "openai/gpt-4o-mini",
1278
+ "openai/gpt-5",
1279
+ "openai/gpt-5-mini",
1280
+ "openai/gpt-5-nano",
1281
+ "openai/o4-mini"
1282
+ ],
1283
+ "nebius": [
1284
+ "NousResearch/hermes-4-405b",
1285
+ "NousResearch/hermes-4-70b",
1286
+ "deepseek-ai/deepseek-v3",
1287
+ "meta-llama/llama-3.3-70b-instruct-base",
1288
+ "meta-llama/llama-3.3-70b-instruct-fast",
1289
+ "meta-llama/llama-3_1-405b-instruct",
1290
+ "moonshotai/kimi-k2-instruct",
1291
+ "nvidia/llama-3_1-nemotron-ultra-253b-v1",
1292
+ "openai/gpt-oss-120b",
1293
+ "openai/gpt-oss-20b",
1294
+ "qwen/qwen3-235b-a22b-instruct-2507",
1295
+ "qwen/qwen3-235b-a22b-thinking-2507",
1296
+ "qwen/qwen3-coder-480b-a35b-instruct",
1297
+ "zai-org/glm-4.5",
1298
+ "zai-org/glm-4.5-air"
1597
1299
  ],
1598
1300
  "fastrouter": [
1599
1301
  "anthropic/claude-opus-4.1",
@@ -1611,79 +1313,26 @@
1611
1313
  "qwen/qwen3-coder",
1612
1314
  "x-ai/grok-4"
1613
1315
  ],
1614
- "google": [
1615
- "gemini-1.5-flash",
1616
- "gemini-1.5-flash-8b",
1617
- "gemini-1.5-pro",
1618
- "gemini-2.0-flash",
1619
- "gemini-2.0-flash-lite",
1620
- "gemini-2.5-flash",
1621
- "gemini-2.5-flash-image",
1622
- "gemini-2.5-flash-image-preview",
1623
- "gemini-2.5-flash-lite",
1624
- "gemini-2.5-flash-lite-preview-06-17",
1625
- "gemini-2.5-flash-lite-preview-09-2025",
1626
- "gemini-2.5-flash-preview-04-17",
1627
- "gemini-2.5-flash-preview-05-20",
1628
- "gemini-2.5-flash-preview-09-2025",
1629
- "gemini-2.5-flash-preview-tts",
1630
- "gemini-2.5-pro",
1631
- "gemini-2.5-pro-preview-05-06",
1632
- "gemini-2.5-pro-preview-06-05",
1633
- "gemini-2.5-pro-preview-tts",
1634
- "gemini-flash-latest",
1635
- "gemini-flash-lite-latest",
1636
- "gemini-live-2.5-flash",
1637
- "gemini-live-2.5-flash-preview-native-audio"
1638
- ],
1639
- "inception": ["mercury", "mercury-coder"],
1640
- "wandb": [
1641
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1316
+ "perplexity": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1317
+ "morph": ["auto", "morph-v3-fast", "morph-v3-large"],
1318
+ "zai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1319
+ "huggingface": [
1642
1320
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1643
1321
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1322
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1323
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1644
1324
  "deepseek-ai/DeepSeek-R1-0528",
1645
- "deepseek-ai/DeepSeek-V3-0324",
1646
- "meta-llama/Llama-3.1-8B-Instruct",
1647
- "meta-llama/Llama-3.3-70B-Instruct",
1648
- "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1649
- "microsoft/Phi-4-mini-instruct",
1650
- "moonshotai/Kimi-K2-Instruct"
1651
- ],
1652
- "openai": [
1653
- "codex-mini-latest",
1654
- "gpt-3.5-turbo",
1655
- "gpt-4",
1656
- "gpt-4-turbo",
1657
- "gpt-4.1",
1658
- "gpt-4.1-mini",
1659
- "gpt-4.1-nano",
1660
- "gpt-4o",
1661
- "gpt-4o-2024-05-13",
1662
- "gpt-4o-2024-08-06",
1663
- "gpt-4o-2024-11-20",
1664
- "gpt-4o-mini",
1665
- "gpt-5",
1666
- "gpt-5-chat-latest",
1667
- "gpt-5-codex",
1668
- "gpt-5-mini",
1669
- "gpt-5-nano",
1670
- "o1",
1671
- "o1-mini",
1672
- "o1-preview",
1673
- "o1-pro",
1674
- "o3",
1675
- "o3-deep-research",
1676
- "o3-mini",
1677
- "o3-pro",
1678
- "o4-mini",
1679
- "o4-mini-deep-research"
1325
+ "deepseek-ai/Deepseek-V3-0324",
1326
+ "moonshotai/Kimi-K2-Instruct",
1327
+ "moonshotai/Kimi-K2-Instruct-0905",
1328
+ "zai-org/GLM-4.5",
1329
+ "zai-org/GLM-4.5-Air",
1330
+ "zai-org/GLM-4.6"
1680
1331
  ],
1681
- "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1682
- "perplexity": ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
1683
1332
  "openrouter": [
1684
1333
  "anthropic/claude-3.5-haiku",
1685
1334
  "anthropic/claude-3.7-sonnet",
1686
- "anthropic/claude-4.5-haiku",
1335
+ "anthropic/claude-haiku-4.5",
1687
1336
  "anthropic/claude-opus-4",
1688
1337
  "anthropic/claude-opus-4.1",
1689
1338
  "anthropic/claude-sonnet-4",
@@ -1732,65 +1381,184 @@
1732
1381
  "mistralai/mistral-small-3.2-24b-instruct:free",
1733
1382
  "moonshotai/kimi-dev-72b:free",
1734
1383
  "moonshotai/kimi-k2",
1735
- "moonshotai/kimi-k2-0905",
1736
- "moonshotai/kimi-k2:free",
1737
- "nousresearch/deephermes-3-llama-3-8b-preview",
1738
- "nousresearch/hermes-4-405b",
1739
- "nousresearch/hermes-4-70b",
1384
+ "moonshotai/kimi-k2-0905",
1385
+ "moonshotai/kimi-k2:free",
1386
+ "nousresearch/deephermes-3-llama-3-8b-preview",
1387
+ "nousresearch/hermes-4-405b",
1388
+ "nousresearch/hermes-4-70b",
1389
+ "openai/gpt-4.1",
1390
+ "openai/gpt-4.1-mini",
1391
+ "openai/gpt-4o-mini",
1392
+ "openai/gpt-5",
1393
+ "openai/gpt-5-chat",
1394
+ "openai/gpt-5-codex",
1395
+ "openai/gpt-5-image",
1396
+ "openai/gpt-5-mini",
1397
+ "openai/gpt-5-nano",
1398
+ "openai/gpt-oss-120b",
1399
+ "openai/gpt-oss-20b",
1400
+ "openai/o4-mini",
1401
+ "openrouter/cypher-alpha:free",
1402
+ "openrouter/horizon-alpha",
1403
+ "openrouter/horizon-beta",
1404
+ "openrouter/sonoma-dusk-alpha",
1405
+ "openrouter/sonoma-sky-alpha",
1406
+ "qwen/qwen-2.5-coder-32b-instruct",
1407
+ "qwen/qwen2.5-vl-32b-instruct:free",
1408
+ "qwen/qwen2.5-vl-72b-instruct",
1409
+ "qwen/qwen2.5-vl-72b-instruct:free",
1410
+ "qwen/qwen3-14b:free",
1411
+ "qwen/qwen3-235b-a22b-07-25",
1412
+ "qwen/qwen3-235b-a22b-07-25:free",
1413
+ "qwen/qwen3-235b-a22b-thinking-2507",
1414
+ "qwen/qwen3-235b-a22b:free",
1415
+ "qwen/qwen3-30b-a3b-instruct-2507",
1416
+ "qwen/qwen3-30b-a3b-thinking-2507",
1417
+ "qwen/qwen3-30b-a3b:free",
1418
+ "qwen/qwen3-32b:free",
1419
+ "qwen/qwen3-8b:free",
1420
+ "qwen/qwen3-coder",
1421
+ "qwen/qwen3-coder:free",
1422
+ "qwen/qwen3-max",
1423
+ "qwen/qwen3-next-80b-a3b-instruct",
1424
+ "qwen/qwen3-next-80b-a3b-thinking",
1425
+ "qwen/qwq-32b:free",
1426
+ "rekaai/reka-flash-3",
1427
+ "sarvamai/sarvam-m:free",
1428
+ "thudm/glm-z1-32b:free",
1429
+ "tngtech/deepseek-r1t2-chimera:free",
1430
+ "x-ai/grok-3",
1431
+ "x-ai/grok-3-beta",
1432
+ "x-ai/grok-3-mini",
1433
+ "x-ai/grok-3-mini-beta",
1434
+ "x-ai/grok-4",
1435
+ "x-ai/grok-4-fast",
1436
+ "x-ai/grok-4-fast:free",
1437
+ "x-ai/grok-code-fast-1",
1438
+ "z-ai/glm-4.5",
1439
+ "z-ai/glm-4.5-air",
1440
+ "z-ai/glm-4.5-air:free",
1441
+ "z-ai/glm-4.5v",
1442
+ "z-ai/glm-4.6"
1443
+ ],
1444
+ "cerebras": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1445
+ "zhipuai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1446
+ "togetherai": [
1447
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1448
+ "deepseek-ai/DeepSeek-R1",
1449
+ "deepseek-ai/DeepSeek-V3",
1450
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo",
1451
+ "moonshotai/Kimi-K2-Instruct",
1452
+ "openai/gpt-oss-120b"
1453
+ ],
1454
+ "wandb": [
1455
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1456
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1457
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1458
+ "deepseek-ai/DeepSeek-R1-0528",
1459
+ "deepseek-ai/DeepSeek-V3-0324",
1460
+ "meta-llama/Llama-3.1-8B-Instruct",
1461
+ "meta-llama/Llama-3.3-70B-Instruct",
1462
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct",
1463
+ "microsoft/Phi-4-mini-instruct",
1464
+ "moonshotai/Kimi-K2-Instruct"
1465
+ ],
1466
+ "submodel": [
1467
+ "Qwen/Qwen3-235B-A22B-Instruct-2507",
1468
+ "Qwen/Qwen3-235B-A22B-Thinking-2507",
1469
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1470
+ "deepseek-ai/DeepSeek-R1-0528",
1471
+ "deepseek-ai/DeepSeek-V3-0324",
1472
+ "deepseek-ai/DeepSeek-V3.1",
1473
+ "openai/gpt-oss-120b",
1474
+ "zai-org/GLM-4.5-Air",
1475
+ "zai-org/GLM-4.5-FP8"
1476
+ ],
1477
+ "vercel": [
1478
+ "alibaba/qwen3-coder-plus",
1479
+ "alibaba/qwen3-max",
1480
+ "alibaba/qwen3-next-80b-a3b-instruct",
1481
+ "alibaba/qwen3-next-80b-a3b-thinking",
1482
+ "alibaba/qwen3-vl-instruct",
1483
+ "alibaba/qwen3-vl-thinking",
1484
+ "amazon/nova-lite",
1485
+ "amazon/nova-micro",
1486
+ "amazon/nova-pro",
1487
+ "anthropic/claude-3-5-haiku",
1488
+ "anthropic/claude-3-haiku",
1489
+ "anthropic/claude-3-opus",
1490
+ "anthropic/claude-3.5-sonnet",
1491
+ "anthropic/claude-3.7-sonnet",
1492
+ "anthropic/claude-4-1-opus",
1493
+ "anthropic/claude-4-opus",
1494
+ "anthropic/claude-4-sonnet",
1495
+ "anthropic/claude-4.5-sonnet",
1496
+ "anthropic/claude-haiku-4.5",
1497
+ "cerebras/qwen3-coder",
1498
+ "deepseek/deepseek-r1",
1499
+ "deepseek/deepseek-r1-distill-llama-70b",
1500
+ "deepseek/deepseek-v3.1-terminus",
1501
+ "deepseek/deepseek-v3.2-exp",
1502
+ "deepseek/deepseek-v3.2-exp-thinking",
1503
+ "google/gemini-2.0-flash",
1504
+ "google/gemini-2.0-flash-lite",
1505
+ "google/gemini-2.5-flash",
1506
+ "google/gemini-2.5-flash-lite",
1507
+ "google/gemini-2.5-flash-lite-preview-09-2025",
1508
+ "google/gemini-2.5-flash-preview-09-2025",
1509
+ "google/gemini-2.5-pro",
1510
+ "meta/llama-3.3-70b",
1511
+ "meta/llama-4-maverick",
1512
+ "meta/llama-4-scout",
1513
+ "mistral/codestral",
1514
+ "mistral/magistral-medium",
1515
+ "mistral/magistral-small",
1516
+ "mistral/ministral-3b",
1517
+ "mistral/ministral-8b",
1518
+ "mistral/mistral-large",
1519
+ "mistral/mistral-small",
1520
+ "mistral/mixtral-8x22b-instruct",
1521
+ "mistral/pixtral-12b",
1522
+ "mistral/pixtral-large",
1523
+ "moonshotai/kimi-k2",
1524
+ "morph/morph-v3-fast",
1525
+ "morph/morph-v3-large",
1526
+ "openai/gpt-4-turbo",
1740
1527
  "openai/gpt-4.1",
1741
1528
  "openai/gpt-4.1-mini",
1529
+ "openai/gpt-4.1-nano",
1530
+ "openai/gpt-4o",
1742
1531
  "openai/gpt-4o-mini",
1743
1532
  "openai/gpt-5",
1744
- "openai/gpt-5-chat",
1745
1533
  "openai/gpt-5-codex",
1746
- "openai/gpt-5-image",
1747
1534
  "openai/gpt-5-mini",
1748
1535
  "openai/gpt-5-nano",
1749
1536
  "openai/gpt-oss-120b",
1750
1537
  "openai/gpt-oss-20b",
1538
+ "openai/o1",
1539
+ "openai/o3",
1540
+ "openai/o3-mini",
1751
1541
  "openai/o4-mini",
1752
- "openrouter/cypher-alpha:free",
1753
- "openrouter/horizon-alpha",
1754
- "openrouter/horizon-beta",
1755
- "openrouter/sonoma-dusk-alpha",
1756
- "openrouter/sonoma-sky-alpha",
1757
- "qwen/qwen-2.5-coder-32b-instruct",
1758
- "qwen/qwen2.5-vl-32b-instruct:free",
1759
- "qwen/qwen2.5-vl-72b-instruct",
1760
- "qwen/qwen2.5-vl-72b-instruct:free",
1761
- "qwen/qwen3-14b:free",
1762
- "qwen/qwen3-235b-a22b-07-25",
1763
- "qwen/qwen3-235b-a22b-07-25:free",
1764
- "qwen/qwen3-235b-a22b-thinking-2507",
1765
- "qwen/qwen3-235b-a22b:free",
1766
- "qwen/qwen3-30b-a3b-instruct-2507",
1767
- "qwen/qwen3-30b-a3b-thinking-2507",
1768
- "qwen/qwen3-30b-a3b:free",
1769
- "qwen/qwen3-32b:free",
1770
- "qwen/qwen3-8b:free",
1771
- "qwen/qwen3-coder",
1772
- "qwen/qwen3-coder:free",
1773
- "qwen/qwen3-max",
1774
- "qwen/qwen3-next-80b-a3b-instruct",
1775
- "qwen/qwen3-next-80b-a3b-thinking",
1776
- "qwen/qwq-32b:free",
1777
- "rekaai/reka-flash-3",
1778
- "sarvamai/sarvam-m:free",
1779
- "thudm/glm-z1-32b:free",
1780
- "tngtech/deepseek-r1t2-chimera:free",
1781
- "x-ai/grok-3",
1782
- "x-ai/grok-3-beta",
1783
- "x-ai/grok-3-mini",
1784
- "x-ai/grok-3-mini-beta",
1785
- "x-ai/grok-4",
1786
- "x-ai/grok-4-fast",
1787
- "x-ai/grok-4-fast:free",
1788
- "x-ai/grok-code-fast-1",
1789
- "z-ai/glm-4.5",
1790
- "z-ai/glm-4.5-air",
1791
- "z-ai/glm-4.5-air:free",
1792
- "z-ai/glm-4.5v",
1793
- "z-ai/glm-4.6"
1542
+ "perplexity/sonar",
1543
+ "perplexity/sonar-pro",
1544
+ "perplexity/sonar-reasoning",
1545
+ "perplexity/sonar-reasoning-pro",
1546
+ "vercel/v0-1.0-md",
1547
+ "vercel/v0-1.5-md",
1548
+ "xai/grok-2",
1549
+ "xai/grok-2-vision",
1550
+ "xai/grok-3",
1551
+ "xai/grok-3-fast",
1552
+ "xai/grok-3-mini",
1553
+ "xai/grok-3-mini-fast",
1554
+ "xai/grok-4",
1555
+ "xai/grok-4-fast",
1556
+ "xai/grok-4-fast-non-reasoning",
1557
+ "xai/grok-code-fast-1",
1558
+ "zai/glm-4.5",
1559
+ "zai/glm-4.5-air",
1560
+ "zai/glm-4.5v",
1561
+ "zai/glm-4.6"
1794
1562
  ],
1795
1563
  "synthetic": [
1796
1564
  "hf:Qwen/Qwen2.5-Coder-32B-Instruct",
@@ -1815,97 +1583,407 @@
1815
1583
  "hf:zai-org/GLM-4.5",
1816
1584
  "hf:zai-org/GLM-4.6"
1817
1585
  ],
1586
+ "google": [
1587
+ "gemini-1.5-flash",
1588
+ "gemini-1.5-flash-8b",
1589
+ "gemini-1.5-pro",
1590
+ "gemini-2.0-flash",
1591
+ "gemini-2.0-flash-lite",
1592
+ "gemini-2.5-flash",
1593
+ "gemini-2.5-flash-image",
1594
+ "gemini-2.5-flash-image-preview",
1595
+ "gemini-2.5-flash-lite",
1596
+ "gemini-2.5-flash-lite-preview-06-17",
1597
+ "gemini-2.5-flash-lite-preview-09-2025",
1598
+ "gemini-2.5-flash-preview-04-17",
1599
+ "gemini-2.5-flash-preview-05-20",
1600
+ "gemini-2.5-flash-preview-09-2025",
1601
+ "gemini-2.5-flash-preview-tts",
1602
+ "gemini-2.5-pro",
1603
+ "gemini-2.5-pro-preview-05-06",
1604
+ "gemini-2.5-pro-preview-06-05",
1605
+ "gemini-2.5-pro-preview-tts",
1606
+ "gemini-flash-latest",
1607
+ "gemini-flash-lite-latest",
1608
+ "gemini-live-2.5-flash",
1609
+ "gemini-live-2.5-flash-preview-native-audio"
1610
+ ],
1611
+ "groq": [
1612
+ "deepseek-r1-distill-llama-70b",
1613
+ "gemma2-9b-it",
1614
+ "llama-3.1-8b-instant",
1615
+ "llama-3.3-70b-versatile",
1616
+ "llama-guard-3-8b",
1617
+ "llama3-70b-8192",
1618
+ "llama3-8b-8192",
1619
+ "meta-llama/llama-4-maverick-17b-128e-instruct",
1620
+ "meta-llama/llama-4-scout-17b-16e-instruct",
1621
+ "meta-llama/llama-guard-4-12b",
1622
+ "mistral-saba-24b",
1623
+ "moonshotai/kimi-k2-instruct",
1624
+ "moonshotai/kimi-k2-instruct-0905",
1625
+ "openai/gpt-oss-120b",
1626
+ "openai/gpt-oss-20b",
1627
+ "qwen-qwq-32b",
1628
+ "qwen/qwen3-32b"
1629
+ ],
1630
+ "moonshotai-cn": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1631
+ "github-models": [
1632
+ "ai21-labs/ai21-jamba-1.5-large",
1633
+ "ai21-labs/ai21-jamba-1.5-mini",
1634
+ "cohere/cohere-command-a",
1635
+ "cohere/cohere-command-r",
1636
+ "cohere/cohere-command-r-08-2024",
1637
+ "cohere/cohere-command-r-plus",
1638
+ "cohere/cohere-command-r-plus-08-2024",
1639
+ "core42/jais-30b-chat",
1640
+ "deepseek/deepseek-r1",
1641
+ "deepseek/deepseek-r1-0528",
1642
+ "deepseek/deepseek-v3-0324",
1643
+ "meta/llama-3.2-11b-vision-instruct",
1644
+ "meta/llama-3.2-90b-vision-instruct",
1645
+ "meta/llama-3.3-70b-instruct",
1646
+ "meta/llama-4-maverick-17b-128e-instruct-fp8",
1647
+ "meta/llama-4-scout-17b-16e-instruct",
1648
+ "meta/meta-llama-3-70b-instruct",
1649
+ "meta/meta-llama-3-8b-instruct",
1650
+ "meta/meta-llama-3.1-405b-instruct",
1651
+ "meta/meta-llama-3.1-70b-instruct",
1652
+ "meta/meta-llama-3.1-8b-instruct",
1653
+ "microsoft/mai-ds-r1",
1654
+ "microsoft/phi-3-medium-128k-instruct",
1655
+ "microsoft/phi-3-medium-4k-instruct",
1656
+ "microsoft/phi-3-mini-128k-instruct",
1657
+ "microsoft/phi-3-mini-4k-instruct",
1658
+ "microsoft/phi-3-small-128k-instruct",
1659
+ "microsoft/phi-3-small-8k-instruct",
1660
+ "microsoft/phi-3.5-mini-instruct",
1661
+ "microsoft/phi-3.5-moe-instruct",
1662
+ "microsoft/phi-3.5-vision-instruct",
1663
+ "microsoft/phi-4",
1664
+ "microsoft/phi-4-mini-instruct",
1665
+ "microsoft/phi-4-mini-reasoning",
1666
+ "microsoft/phi-4-multimodal-instruct",
1667
+ "microsoft/phi-4-reasoning",
1668
+ "mistral-ai/codestral-2501",
1669
+ "mistral-ai/ministral-3b",
1670
+ "mistral-ai/mistral-large-2411",
1671
+ "mistral-ai/mistral-medium-2505",
1672
+ "mistral-ai/mistral-nemo",
1673
+ "mistral-ai/mistral-small-2503",
1674
+ "openai/gpt-4.1",
1675
+ "openai/gpt-4.1-mini",
1676
+ "openai/gpt-4.1-nano",
1677
+ "openai/gpt-4o",
1678
+ "openai/gpt-4o-mini",
1679
+ "openai/o1",
1680
+ "openai/o1-mini",
1681
+ "openai/o1-preview",
1682
+ "openai/o3",
1683
+ "openai/o3-mini",
1684
+ "openai/o4-mini",
1685
+ "xai/grok-3",
1686
+ "xai/grok-3-mini"
1687
+ ],
1818
1688
  "deepinfra": [
1819
1689
  "Qwen/Qwen3-Coder-480B-A35B-Instruct",
1820
1690
  "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
1821
1691
  "moonshotai/Kimi-K2-Instruct",
1822
1692
  "zai-org/GLM-4.5"
1823
1693
  ],
1824
- "zhipuai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1825
- "submodel": [
1826
- "Qwen/Qwen3-235B-A22B-Instruct-2507",
1827
- "Qwen/Qwen3-235B-A22B-Thinking-2507",
1828
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1829
- "deepseek-ai/DeepSeek-R1-0528",
1830
- "deepseek-ai/DeepSeek-V3-0324",
1831
- "deepseek-ai/DeepSeek-V3.1",
1832
- "openai/gpt-oss-120b",
1833
- "zai-org/GLM-4.5-Air",
1834
- "zai-org/GLM-4.5-FP8"
1694
+ "fireworks-ai": [
1695
+ "accounts/fireworks/models/deepseek-r1-0528",
1696
+ "accounts/fireworks/models/deepseek-v3-0324",
1697
+ "accounts/fireworks/models/deepseek-v3p1",
1698
+ "accounts/fireworks/models/glm-4p5",
1699
+ "accounts/fireworks/models/glm-4p5-air",
1700
+ "accounts/fireworks/models/gpt-oss-120b",
1701
+ "accounts/fireworks/models/gpt-oss-20b",
1702
+ "accounts/fireworks/models/kimi-k2-instruct",
1703
+ "accounts/fireworks/models/qwen3-235b-a22b",
1704
+ "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1835
1705
  ],
1836
1706
  "zai": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1837
- "inference": [
1838
- "google/gemma-3",
1839
- "meta/llama-3.1-8b-instruct",
1840
- "meta/llama-3.2-11b-vision-instruct",
1841
- "meta/llama-3.2-1b-instruct",
1842
- "meta/llama-3.2-3b-instruct",
1843
- "mistral/mistral-nemo-12b-instruct",
1844
- "osmosis/osmosis-structure-0.6b",
1845
- "qwen/qwen-2.5-7b-vision-instruct",
1846
- "qwen/qwen3-embedding-4b"
1707
+ "opencode": [
1708
+ "an-gbt",
1709
+ "big-pickle",
1710
+ "claude-3-5-haiku",
1711
+ "claude-haiku-4-5",
1712
+ "claude-opus-4-1",
1713
+ "claude-sonnet-4",
1714
+ "claude-sonnet-4-5",
1715
+ "code-supernova",
1716
+ "glm-4.6",
1717
+ "gpt-5",
1718
+ "gpt-5-codex",
1719
+ "grok-code",
1720
+ "kimi-k2",
1721
+ "qwen3-coder"
1847
1722
  ],
1848
- "requesty": [
1849
- "anthropic/claude-3-7-sonnet",
1850
- "anthropic/claude-4-sonnet-20250522",
1851
- "anthropic/claude-opus-4",
1852
- "anthropic/claude-opus-4-1-20250805",
1853
- "google/gemini-2.5-flash",
1854
- "google/gemini-2.5-pro",
1855
- "openai/gpt-4.1",
1856
- "openai/gpt-4.1-mini",
1857
- "openai/gpt-4o-mini",
1858
- "openai/gpt-5",
1859
- "openai/gpt-5-mini",
1860
- "openai/gpt-5-nano",
1861
- "openai/o4-mini"
1723
+ "zhipuai-coding-plan": ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
1724
+ "inception": ["mercury", "mercury-coder"],
1725
+ "llama": [
1726
+ "cerebras-llama-4-maverick-17b-128e-instruct",
1727
+ "cerebras-llama-4-scout-17b-16e-instruct",
1728
+ "groq-llama-4-maverick-17b-128e-instruct",
1729
+ "llama-3.3-70b-instruct",
1730
+ "llama-3.3-8b-instruct",
1731
+ "llama-4-maverick-17b-128e-instruct-fp8",
1732
+ "llama-4-scout-17b-16e-instruct-fp8"
1862
1733
  ],
1863
- "morph": ["auto", "morph-v3-fast", "morph-v3-large"],
1864
1734
  "lmstudio": ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
1735
+ "openai": [
1736
+ "codex-mini-latest",
1737
+ "gpt-3.5-turbo",
1738
+ "gpt-4",
1739
+ "gpt-4-turbo",
1740
+ "gpt-4.1",
1741
+ "gpt-4.1-mini",
1742
+ "gpt-4.1-nano",
1743
+ "gpt-4o",
1744
+ "gpt-4o-2024-05-13",
1745
+ "gpt-4o-2024-08-06",
1746
+ "gpt-4o-2024-11-20",
1747
+ "gpt-4o-mini",
1748
+ "gpt-5",
1749
+ "gpt-5-chat-latest",
1750
+ "gpt-5-codex",
1751
+ "gpt-5-mini",
1752
+ "gpt-5-nano",
1753
+ "o1",
1754
+ "o1-mini",
1755
+ "o1-preview",
1756
+ "o1-pro",
1757
+ "o3",
1758
+ "o3-deep-research",
1759
+ "o3-mini",
1760
+ "o3-pro",
1761
+ "o4-mini",
1762
+ "o4-mini-deep-research"
1763
+ ],
1865
1764
  "anthropic": [
1866
1765
  "claude-3-5-haiku-20241022",
1766
+ "claude-3-5-haiku-latest",
1867
1767
  "claude-3-5-sonnet-20240620",
1868
1768
  "claude-3-5-sonnet-20241022",
1869
1769
  "claude-3-7-sonnet-20250219",
1770
+ "claude-3-7-sonnet-latest",
1870
1771
  "claude-3-haiku-20240307",
1871
1772
  "claude-3-opus-20240229",
1872
1773
  "claude-3-sonnet-20240229",
1774
+ "claude-haiku-4-5",
1873
1775
  "claude-haiku-4-5-20251001",
1776
+ "claude-opus-4-0",
1777
+ "claude-opus-4-1",
1874
1778
  "claude-opus-4-1-20250805",
1875
1779
  "claude-opus-4-20250514",
1780
+ "claude-sonnet-4-0",
1876
1781
  "claude-sonnet-4-20250514",
1782
+ "claude-sonnet-4-5",
1877
1783
  "claude-sonnet-4-5-20250929"
1878
1784
  ],
1879
- "fireworks-ai": [
1880
- "accounts/fireworks/models/deepseek-r1-0528",
1881
- "accounts/fireworks/models/deepseek-v3-0324",
1882
- "accounts/fireworks/models/deepseek-v3p1",
1883
- "accounts/fireworks/models/glm-4p5",
1884
- "accounts/fireworks/models/glm-4p5-air",
1885
- "accounts/fireworks/models/gpt-oss-120b",
1886
- "accounts/fireworks/models/gpt-oss-20b",
1887
- "accounts/fireworks/models/kimi-k2-instruct",
1888
- "accounts/fireworks/models/qwen3-235b-a22b",
1889
- "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
1785
+ "moonshotai": ["kimi-k2-0711-preview", "kimi-k2-0905-preview", "kimi-k2-turbo-preview"],
1786
+ "inference": [
1787
+ "google/gemma-3",
1788
+ "meta/llama-3.1-8b-instruct",
1789
+ "meta/llama-3.2-11b-vision-instruct",
1790
+ "meta/llama-3.2-1b-instruct",
1791
+ "meta/llama-3.2-3b-instruct",
1792
+ "mistral/mistral-nemo-12b-instruct",
1793
+ "osmosis/osmosis-structure-0.6b",
1794
+ "qwen/qwen-2.5-7b-vision-instruct",
1795
+ "qwen/qwen3-embedding-4b"
1890
1796
  ],
1891
- "modelscope": [
1797
+ "baseten": ["Qwen3/Qwen3-Coder-480B-A35B-Instruct", "moonshotai/Kimi-K2-Instruct-0905", "zai-org/GLM-4.6"],
1798
+ "cortecs": [
1799
+ "claude-4-5-sonnet",
1800
+ "claude-sonnet-4",
1801
+ "deepseek-v3-0324",
1802
+ "gemini-2.5-pro",
1803
+ "gpt-4.1",
1804
+ "gpt-oss-120b",
1805
+ "kimi-k2-instruct",
1806
+ "llama-3.1-405b-instruct",
1807
+ "nova-pro-v1",
1808
+ "qwen3-32b",
1809
+ "qwen3-coder-480b-a35b-instruct"
1810
+ ],
1811
+ "mistral": [
1812
+ "codestral-latest",
1813
+ "devstral-medium-2507",
1814
+ "devstral-small-2505",
1815
+ "devstral-small-2507",
1816
+ "magistral-medium-latest",
1817
+ "magistral-small",
1818
+ "ministral-3b-latest",
1819
+ "ministral-8b-latest",
1820
+ "mistral-large-latest",
1821
+ "mistral-medium-2505",
1822
+ "mistral-medium-2508",
1823
+ "mistral-medium-latest",
1824
+ "mistral-nemo",
1825
+ "mistral-small-latest",
1826
+ "open-mistral-7b",
1827
+ "open-mixtral-8x22b",
1828
+ "open-mixtral-8x7b",
1829
+ "pixtral-12b",
1830
+ "pixtral-large-latest"
1831
+ ],
1832
+ "venice": [
1833
+ "deepseek-coder-v2-lite",
1834
+ "deepseek-r1-671b",
1835
+ "dolphin-2.9.2-qwen2-72b",
1836
+ "llama-3.1-405b",
1837
+ "llama-3.2-3b",
1838
+ "llama-3.3-70b",
1839
+ "mistral-31-24b",
1840
+ "qwen-2.5-coder-32b",
1841
+ "qwen-2.5-qwq-32b",
1842
+ "qwen-2.5-vl",
1843
+ "qwen3-235b",
1844
+ "qwen3-4b",
1845
+ "venice-uncensored"
1846
+ ],
1847
+ "alibaba": [
1848
+ "qvq-max",
1849
+ "qwen-flash",
1850
+ "qwen-max",
1851
+ "qwen-mt-plus",
1852
+ "qwen-mt-turbo",
1853
+ "qwen-omni-turbo",
1854
+ "qwen-omni-turbo-realtime",
1855
+ "qwen-plus",
1856
+ "qwen-plus-character-ja",
1857
+ "qwen-turbo",
1858
+ "qwen-vl-max",
1859
+ "qwen-vl-ocr",
1860
+ "qwen-vl-plus",
1861
+ "qwen2-5-14b-instruct",
1862
+ "qwen2-5-32b-instruct",
1863
+ "qwen2-5-72b-instruct",
1864
+ "qwen2-5-7b-instruct",
1865
+ "qwen2-5-omni-7b",
1866
+ "qwen2-5-vl-72b-instruct",
1867
+ "qwen2-5-vl-7b-instruct",
1868
+ "qwen3-14b",
1869
+ "qwen3-235b-a22b",
1870
+ "qwen3-32b",
1871
+ "qwen3-8b",
1872
+ "qwen3-asr-flash",
1873
+ "qwen3-coder-30b-a3b-instruct",
1874
+ "qwen3-coder-480b-a35b-instruct",
1875
+ "qwen3-coder-flash",
1876
+ "qwen3-coder-plus",
1877
+ "qwen3-livetranslate-flash-realtime",
1878
+ "qwen3-max",
1879
+ "qwen3-next-80b-a3b-instruct",
1880
+ "qwen3-next-80b-a3b-thinking",
1881
+ "qwen3-omni-flash",
1882
+ "qwen3-omni-flash-realtime",
1883
+ "qwen3-vl-235b-a22b",
1884
+ "qwen3-vl-30b-a3b",
1885
+ "qwen3-vl-plus",
1886
+ "qwq-plus"
1887
+ ],
1888
+ "alibaba-cn": [
1889
+ "deepseek-r1",
1890
+ "deepseek-r1-0528",
1891
+ "deepseek-r1-distill-llama-70b",
1892
+ "deepseek-r1-distill-llama-8b",
1893
+ "deepseek-r1-distill-qwen-1-5b",
1894
+ "deepseek-r1-distill-qwen-14b",
1895
+ "deepseek-r1-distill-qwen-32b",
1896
+ "deepseek-r1-distill-qwen-7b",
1897
+ "deepseek-v3",
1898
+ "deepseek-v3-1",
1899
+ "deepseek-v3-2-exp",
1900
+ "moonshot-kimi-k2-instruct",
1901
+ "qvq-max",
1902
+ "qwen-deep-research",
1903
+ "qwen-doc-turbo",
1904
+ "qwen-flash",
1905
+ "qwen-long",
1906
+ "qwen-math-plus",
1907
+ "qwen-math-turbo",
1908
+ "qwen-max",
1909
+ "qwen-mt-plus",
1910
+ "qwen-mt-turbo",
1911
+ "qwen-omni-turbo",
1912
+ "qwen-omni-turbo-realtime",
1913
+ "qwen-plus",
1914
+ "qwen-plus-character",
1915
+ "qwen-turbo",
1916
+ "qwen-vl-max",
1917
+ "qwen-vl-ocr",
1918
+ "qwen-vl-plus",
1919
+ "qwen2-5-14b-instruct",
1920
+ "qwen2-5-32b-instruct",
1921
+ "qwen2-5-72b-instruct",
1922
+ "qwen2-5-7b-instruct",
1923
+ "qwen2-5-coder-32b-instruct",
1924
+ "qwen2-5-coder-7b-instruct",
1925
+ "qwen2-5-math-72b-instruct",
1926
+ "qwen2-5-math-7b-instruct",
1927
+ "qwen2-5-omni-7b",
1928
+ "qwen2-5-vl-72b-instruct",
1929
+ "qwen2-5-vl-7b-instruct",
1930
+ "qwen3-14b",
1931
+ "qwen3-235b-a22b",
1932
+ "qwen3-32b",
1933
+ "qwen3-8b",
1934
+ "qwen3-asr-flash",
1935
+ "qwen3-coder-30b-a3b-instruct",
1936
+ "qwen3-coder-480b-a35b-instruct",
1937
+ "qwen3-coder-flash",
1938
+ "qwen3-coder-plus",
1939
+ "qwen3-max",
1940
+ "qwen3-next-80b-a3b-instruct",
1941
+ "qwen3-next-80b-a3b-thinking",
1942
+ "qwen3-omni-flash",
1943
+ "qwen3-omni-flash-realtime",
1944
+ "qwen3-vl-235b-a22b",
1945
+ "qwen3-vl-30b-a3b",
1946
+ "qwen3-vl-plus",
1947
+ "qwq-32b",
1948
+ "qwq-plus",
1949
+ "tongyi-intent-detect-v3"
1950
+ ],
1951
+ "chutes": [
1892
1952
  "Qwen/Qwen3-235B-A22B-Instruct-2507",
1893
1953
  "Qwen/Qwen3-235B-A22B-Thinking-2507",
1954
+ "Qwen/Qwen3-30B-A3B",
1894
1955
  "Qwen/Qwen3-30B-A3B-Instruct-2507",
1895
1956
  "Qwen/Qwen3-30B-A3B-Thinking-2507",
1896
1957
  "Qwen/Qwen3-Coder-30B-A3B-Instruct",
1897
- "ZhipuAI/GLM-4.5"
1898
- ],
1899
- "llama": [
1900
- "cerebras-llama-4-maverick-17b-128e-instruct",
1901
- "cerebras-llama-4-scout-17b-16e-instruct",
1902
- "groq-llama-4-maverick-17b-128e-instruct",
1903
- "llama-3.3-70b-instruct",
1904
- "llama-3.3-8b-instruct",
1905
- "llama-4-maverick-17b-128e-instruct-fp8",
1906
- "llama-4-scout-17b-16e-instruct-fp8"
1958
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
1959
+ "Qwen/Qwen3-Next-80B-A3B-Instruct",
1960
+ "Qwen/Qwen3-Next-80B-A3B-Thinking",
1961
+ "chutesai/Devstral-Small-2505",
1962
+ "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
1963
+ "deepseek-ai/DeepSeek-R1-0528",
1964
+ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
1965
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1966
+ "deepseek-ai/DeepSeek-V3-0324",
1967
+ "deepseek-ai/DeepSeek-V3.1",
1968
+ "deepseek-ai/DeepSeek-V3.1-Terminus",
1969
+ "deepseek-ai/DeepSeek-V3.1-turbo",
1970
+ "deepseek-ai/DeepSeek-V3.1:THINKING",
1971
+ "deepseek-ai/DeepSeek-V3.2-Exp",
1972
+ "meituan-longcat/LongCat-Flash-Chat-FP8",
1973
+ "moonshotai/Kimi-Dev-72B",
1974
+ "moonshotai/Kimi-K2-Instruct-0905",
1975
+ "moonshotai/Kimi-K2-Instruct-75k",
1976
+ "moonshotai/Kimi-VL-A3B-Thinking",
1977
+ "openai/gpt-oss-120b",
1978
+ "tngtech/DeepSeek-R1T-Chimera",
1979
+ "tngtech/DeepSeek-TNG-R1T2-Chimera",
1980
+ "zai-org/GLM-4.5-Air",
1981
+ "zai-org/GLM-4.5-FP8",
1982
+ "zai-org/GLM-4.5-turbo",
1983
+ "zai-org/GLM-4.6-FP8",
1984
+ "zai-org/GLM-4.6-turbo"
1907
1985
  ],
1908
- "cerebras": ["gpt-oss-120b", "qwen-3-235b-a22b-instruct-2507", "qwen-3-coder-480b"],
1986
+ "upstage": ["solar-mini", "solar-pro2"],
1909
1987
  "netlify": [
1910
1988
  "anthropic/claude-3-5-haiku-20241022",
1911
1989
  "anthropic/claude-3-5-haiku-latest",