@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,255 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "protocol_version": "1.1",
4
+ "models": {
5
+ "hunyuan-pro": {
6
+ "provider": "hunyuan",
7
+ "model_id": "hunyuan-pro",
8
+ "display_name": "混元 Pro",
9
+ "verification": {
10
+ "status": "unverified",
11
+ "verified_at": "2026-01-31",
12
+ "source": "documentation",
13
+ "notes": "Hunyuan flagship model with best quality."
14
+ },
15
+ "context_window": 32768,
16
+ "capabilities": [
17
+ "chat",
18
+ "tools",
19
+ "streaming"
20
+ ],
21
+ "status": "active",
22
+ "tags": [
23
+ "tencent",
24
+ "hunyuan",
25
+ "pro",
26
+ "flagship",
27
+ "cn"
28
+ ],
29
+ "pricing": {
30
+ "input_per_token": 0.00003,
31
+ "output_per_token": 0.0001
32
+ }
33
+ },
34
+ "hunyuan-standard": {
35
+ "provider": "hunyuan",
36
+ "model_id": "hunyuan-standard",
37
+ "display_name": "混元 Standard",
38
+ "verification": {
39
+ "status": "unverified",
40
+ "verified_at": "2026-01-31",
41
+ "source": "documentation"
42
+ },
43
+ "context_window": 32768,
44
+ "capabilities": [
45
+ "chat",
46
+ "tools",
47
+ "streaming"
48
+ ],
49
+ "status": "active",
50
+ "tags": [
51
+ "tencent",
52
+ "hunyuan",
53
+ "standard",
54
+ "cn"
55
+ ],
56
+ "pricing": {
57
+ "input_per_token": 0.0000045,
58
+ "output_per_token": 0.000005
59
+ }
60
+ },
61
+ "hunyuan-standard-256k": {
62
+ "provider": "hunyuan",
63
+ "model_id": "hunyuan-standard-256K",
64
+ "display_name": "混元 Standard 256K",
65
+ "verification": {
66
+ "status": "unverified",
67
+ "verified_at": "2026-01-31",
68
+ "source": "documentation"
69
+ },
70
+ "context_window": 262144,
71
+ "capabilities": [
72
+ "chat",
73
+ "tools",
74
+ "streaming"
75
+ ],
76
+ "status": "active",
77
+ "tags": [
78
+ "tencent",
79
+ "hunyuan",
80
+ "standard",
81
+ "ultra_long_context",
82
+ "cn"
83
+ ],
84
+ "pricing": {
85
+ "input_per_token": 0.000015,
86
+ "output_per_token": 0.00006
87
+ }
88
+ },
89
+ "hunyuan-lite": {
90
+ "provider": "hunyuan",
91
+ "model_id": "hunyuan-lite",
92
+ "display_name": "混元 Lite",
93
+ "verification": {
94
+ "status": "unverified",
95
+ "verified_at": "2026-01-31",
96
+ "source": "documentation",
97
+ "notes": "Free tier available with rate limits."
98
+ },
99
+ "context_window": 4096,
100
+ "capabilities": [
101
+ "chat",
102
+ "streaming"
103
+ ],
104
+ "status": "active",
105
+ "tags": [
106
+ "tencent",
107
+ "hunyuan",
108
+ "lite",
109
+ "free_tier",
110
+ "cn"
111
+ ],
112
+ "pricing": {
113
+ "input_per_token": 0,
114
+ "output_per_token": 0
115
+ }
116
+ },
117
+ "hunyuan-turbo": {
118
+ "provider": "hunyuan",
119
+ "model_id": "hunyuan-turbo",
120
+ "display_name": "混元 Turbo",
121
+ "verification": {
122
+ "status": "unverified",
123
+ "verified_at": "2026-01-31",
124
+ "source": "documentation"
125
+ },
126
+ "context_window": 32768,
127
+ "capabilities": [
128
+ "chat",
129
+ "tools",
130
+ "streaming"
131
+ ],
132
+ "status": "active",
133
+ "tags": [
134
+ "tencent",
135
+ "hunyuan",
136
+ "turbo",
137
+ "cn"
138
+ ],
139
+ "pricing": {
140
+ "input_per_token": 0.000015,
141
+ "output_per_token": 0.00005
142
+ }
143
+ },
144
+ "hunyuan-turbo-latest": {
145
+ "provider": "hunyuan",
146
+ "model_id": "hunyuan-turbo-latest",
147
+ "display_name": "混元 Turbo Latest",
148
+ "verification": {
149
+ "status": "unverified",
150
+ "verified_at": "2026-01-31",
151
+ "source": "documentation"
152
+ },
153
+ "context_window": 32768,
154
+ "capabilities": [
155
+ "chat",
156
+ "tools",
157
+ "streaming"
158
+ ],
159
+ "status": "active",
160
+ "tags": [
161
+ "tencent",
162
+ "hunyuan",
163
+ "turbo",
164
+ "latest",
165
+ "cn"
166
+ ],
167
+ "pricing": {
168
+ "input_per_token": 0.000015,
169
+ "output_per_token": 0.00005
170
+ }
171
+ },
172
+ "hunyuan-vision": {
173
+ "provider": "hunyuan",
174
+ "model_id": "hunyuan-vision",
175
+ "display_name": "混元 Vision",
176
+ "verification": {
177
+ "status": "unverified",
178
+ "verified_at": "2026-01-31",
179
+ "source": "documentation"
180
+ },
181
+ "context_window": 8192,
182
+ "capabilities": [
183
+ "chat",
184
+ "vision",
185
+ "streaming"
186
+ ],
187
+ "status": "active",
188
+ "tags": [
189
+ "tencent",
190
+ "hunyuan",
191
+ "vision",
192
+ "multimodal",
193
+ "cn"
194
+ ],
195
+ "pricing": {
196
+ "input_per_token": 0.00002,
197
+ "output_per_token": 0.00002
198
+ }
199
+ },
200
+ "hunyuan-code": {
201
+ "provider": "hunyuan",
202
+ "model_id": "hunyuan-code",
203
+ "display_name": "混元 Code",
204
+ "verification": {
205
+ "status": "unverified",
206
+ "verified_at": "2026-01-31",
207
+ "source": "documentation"
208
+ },
209
+ "context_window": 8192,
210
+ "capabilities": [
211
+ "chat",
212
+ "code",
213
+ "streaming"
214
+ ],
215
+ "status": "active",
216
+ "tags": [
217
+ "tencent",
218
+ "hunyuan",
219
+ "code",
220
+ "cn"
221
+ ],
222
+ "pricing": {
223
+ "input_per_token": 0.0000045,
224
+ "output_per_token": 0.000005
225
+ }
226
+ },
227
+ "hunyuan-role": {
228
+ "provider": "hunyuan",
229
+ "model_id": "hunyuan-role",
230
+ "display_name": "混元 Role",
231
+ "verification": {
232
+ "status": "unverified",
233
+ "verified_at": "2026-01-31",
234
+ "source": "documentation"
235
+ },
236
+ "context_window": 32768,
237
+ "capabilities": [
238
+ "chat",
239
+ "streaming"
240
+ ],
241
+ "status": "active",
242
+ "tags": [
243
+ "tencent",
244
+ "hunyuan",
245
+ "role",
246
+ "roleplay",
247
+ "cn"
248
+ ],
249
+ "pricing": {
250
+ "input_per_token": 0.0000045,
251
+ "output_per_token": 0.000005
252
+ }
253
+ }
254
+ }
255
+ }
@@ -0,0 +1,139 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "protocol_version": "1.5",
4
+ "models": {
5
+ "jina-embeddings-v3": {
6
+ "provider": "jina",
7
+ "model_id": "jina-embeddings-v3",
8
+ "display_name": "Jina Embeddings v3",
9
+ "verification": {
10
+ "status": "unverified",
11
+ "source": "manual",
12
+ "notes": "State-of-the-art text embeddings"
13
+ },
14
+ "context_window": 8192,
15
+ "capabilities": [
16
+ "embeddings"
17
+ ],
18
+ "modality": "text",
19
+ "pricing": {
20
+ "input_per_token": null,
21
+ "output_per_token": null
22
+ },
23
+ "status": "active",
24
+ "tags": [
25
+ "jina",
26
+ "embeddings",
27
+ "rag",
28
+ "search"
29
+ ],
30
+ "dimensions": 1024
31
+ },
32
+ "jina-embeddings-v2-base-en": {
33
+ "provider": "jina",
34
+ "model_id": "jina-embeddings-v2-base-en",
35
+ "display_name": "Jina Embeddings v2 Base EN",
36
+ "verification": {
37
+ "status": "unverified",
38
+ "source": "manual",
39
+ "notes": "English-only embeddings model"
40
+ },
41
+ "context_window": 8192,
42
+ "capabilities": [
43
+ "embeddings"
44
+ ],
45
+ "modality": "text",
46
+ "pricing": {
47
+ "input_per_token": null,
48
+ "output_per_token": null
49
+ },
50
+ "status": "active",
51
+ "tags": [
52
+ "jina",
53
+ "embeddings",
54
+ "en",
55
+ "fast"
56
+ ],
57
+ "dimensions": 768
58
+ },
59
+ "jina-embeddings-v2-base-code": {
60
+ "provider": "jina",
61
+ "model_id": "jina-embeddings-v2-base-code",
62
+ "display_name": "Jina Embeddings v2 Base Code",
63
+ "verification": {
64
+ "status": "unverified",
65
+ "source": "manual",
66
+ "notes": "Code embeddings for semantic code search"
67
+ },
68
+ "context_window": 8192,
69
+ "capabilities": [
70
+ "embeddings"
71
+ ],
72
+ "modality": "code",
73
+ "pricing": {
74
+ "input_per_token": null,
75
+ "output_per_token": null
76
+ },
77
+ "status": "active",
78
+ "tags": [
79
+ "jina",
80
+ "embeddings",
81
+ "code",
82
+ "search"
83
+ ],
84
+ "dimensions": 768
85
+ },
86
+ "jina-reranker-v2-base-en": {
87
+ "provider": "jina",
88
+ "model_id": "jina-reranker-v2-base-en",
89
+ "display_name": "Jina Reranker v2 Base EN",
90
+ "verification": {
91
+ "status": "unverified",
92
+ "source": "manual",
93
+ "notes": "Re-ranking model for RAG"
94
+ },
95
+ "context_window": 512,
96
+ "capabilities": [
97
+ "rerank"
98
+ ],
99
+ "modality": "text",
100
+ "pricing": {
101
+ "input_per_token": null,
102
+ "output_per_token": null
103
+ },
104
+ "status": "active",
105
+ "tags": [
106
+ "jina",
107
+ "rerank",
108
+ "rag",
109
+ "search"
110
+ ]
111
+ },
112
+ "jina-colbert-v2": {
113
+ "provider": "jina",
114
+ "model_id": "jina-colbert-v2",
115
+ "display_name": "Jina ColBERT v2",
116
+ "verification": {
117
+ "status": "unverified",
118
+ "source": "manual",
119
+ "notes": "Late interaction reranking"
120
+ },
121
+ "context_window": 512,
122
+ "capabilities": [
123
+ "rerank"
124
+ ],
125
+ "modality": "text",
126
+ "pricing": {
127
+ "input_per_token": null,
128
+ "output_per_token": null
129
+ },
130
+ "status": "active",
131
+ "tags": [
132
+ "jina",
133
+ "rerank",
134
+ "colbert",
135
+ "rag"
136
+ ]
137
+ }
138
+ }
139
+ }
@@ -0,0 +1,188 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "protocol_version": "1.1",
4
+ "models": {
5
+ "llama3-1-8b": {
6
+ "provider": "lepton",
7
+ "model_id": "llama3-1-8b",
8
+ "display_name": "Llama 3.1 8B",
9
+ "verification": {
10
+ "status": "unverified",
11
+ "verified_at": "2026-01-29",
12
+ "source": "documentation",
13
+ "notes": "Endpoint: https://llama3-1-8b.lepton.run/api/v1"
14
+ },
15
+ "context_window": 131072,
16
+ "capabilities": [
17
+ "chat",
18
+ "tools",
19
+ "streaming"
20
+ ],
21
+ "status": "active",
22
+ "tags": [
23
+ "meta",
24
+ "llama",
25
+ "lepton"
26
+ ]
27
+ },
28
+ "llama3-1-70b": {
29
+ "provider": "lepton",
30
+ "model_id": "llama3-1-70b",
31
+ "display_name": "Llama 3.1 70B",
32
+ "verification": {
33
+ "status": "unverified",
34
+ "verified_at": "2026-01-29",
35
+ "source": "documentation",
36
+ "notes": "Endpoint: https://llama3-1-70b.lepton.run/api/v1"
37
+ },
38
+ "context_window": 131072,
39
+ "capabilities": [
40
+ "chat",
41
+ "tools",
42
+ "streaming"
43
+ ],
44
+ "status": "active",
45
+ "tags": [
46
+ "meta",
47
+ "llama",
48
+ "lepton"
49
+ ]
50
+ },
51
+ "llama3-1-405b": {
52
+ "provider": "lepton",
53
+ "model_id": "llama3-1-405b",
54
+ "display_name": "Llama 3.1 405B",
55
+ "verification": {
56
+ "status": "unverified",
57
+ "verified_at": "2026-01-29",
58
+ "source": "documentation",
59
+ "notes": "Endpoint: https://llama3-1-405b.lepton.run/api/v1"
60
+ },
61
+ "context_window": 131072,
62
+ "capabilities": [
63
+ "chat",
64
+ "tools",
65
+ "streaming"
66
+ ],
67
+ "status": "active",
68
+ "tags": [
69
+ "meta",
70
+ "llama",
71
+ "lepton",
72
+ "flagship"
73
+ ]
74
+ },
75
+ "mixtral-8x7b": {
76
+ "provider": "lepton",
77
+ "model_id": "mixtral-8x7b",
78
+ "display_name": "Mixtral 8x7B",
79
+ "verification": {
80
+ "status": "unverified",
81
+ "verified_at": "2026-01-29",
82
+ "source": "documentation",
83
+ "notes": "Endpoint: https://mixtral-8x7b.lepton.run/api/v1"
84
+ },
85
+ "context_window": 32768,
86
+ "capabilities": [
87
+ "chat",
88
+ "streaming"
89
+ ],
90
+ "status": "active",
91
+ "tags": [
92
+ "mistral",
93
+ "mixtral",
94
+ "moe",
95
+ "lepton"
96
+ ]
97
+ },
98
+ "qwen2-72b": {
99
+ "provider": "lepton",
100
+ "model_id": "qwen2-72b",
101
+ "display_name": "Qwen 2 72B",
102
+ "verification": {
103
+ "status": "unverified",
104
+ "verified_at": "2026-01-29",
105
+ "source": "documentation",
106
+ "notes": "Endpoint: https://qwen2-72b.lepton.run/api/v1"
107
+ },
108
+ "context_window": 32768,
109
+ "capabilities": [
110
+ "chat",
111
+ "tools",
112
+ "streaming"
113
+ ],
114
+ "status": "active",
115
+ "tags": [
116
+ "alibaba",
117
+ "qwen",
118
+ "lepton"
119
+ ]
120
+ },
121
+ "mistral-7b": {
122
+ "provider": "lepton",
123
+ "model_id": "mistral-7b",
124
+ "display_name": "Mistral 7B",
125
+ "verification": {
126
+ "status": "unverified",
127
+ "verified_at": "2026-01-29",
128
+ "source": "documentation",
129
+ "notes": "Endpoint: https://mistral-7b.lepton.run/api/v1"
130
+ },
131
+ "context_window": 8192,
132
+ "capabilities": [
133
+ "chat",
134
+ "streaming"
135
+ ],
136
+ "status": "active",
137
+ "tags": [
138
+ "mistral",
139
+ "lepton"
140
+ ]
141
+ },
142
+ "wizardlm-2-8x22b": {
143
+ "provider": "lepton",
144
+ "model_id": "wizardlm-2-8x22b",
145
+ "display_name": "WizardLM 2 8x22B",
146
+ "verification": {
147
+ "status": "unverified",
148
+ "verified_at": "2026-01-29",
149
+ "source": "documentation",
150
+ "notes": "Endpoint: https://wizardlm-2-8x22b.lepton.run/api/v1"
151
+ },
152
+ "context_window": 65536,
153
+ "capabilities": [
154
+ "chat",
155
+ "streaming"
156
+ ],
157
+ "status": "active",
158
+ "tags": [
159
+ "wizardlm",
160
+ "moe",
161
+ "lepton"
162
+ ]
163
+ },
164
+ "dolphin-mixtral-8x7b": {
165
+ "provider": "lepton",
166
+ "model_id": "dolphin-mixtral-8x7b",
167
+ "display_name": "Dolphin Mixtral 8x7B",
168
+ "verification": {
169
+ "status": "unverified",
170
+ "verified_at": "2026-01-29",
171
+ "source": "documentation",
172
+ "notes": "Endpoint: https://dolphin-mixtral-8x7b.lepton.run/api/v1"
173
+ },
174
+ "context_window": 32768,
175
+ "capabilities": [
176
+ "chat",
177
+ "streaming"
178
+ ],
179
+ "status": "active",
180
+ "tags": [
181
+ "dolphin",
182
+ "mixtral",
183
+ "lepton",
184
+ "uncensored"
185
+ ]
186
+ }
187
+ }
188
+ }