@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,164 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # 腾讯混元 (Tencent Hunyuan) Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (reviewed against public Tencent Cloud documentation only; entries below remain status: unverified)
7
+ #
8
+ # Notes:
9
+ # - Hunyuan (混元) is Tencent's flagship LLM series.
10
+ # - Strong performance in Chinese language tasks.
11
+
12
+ models:
13
+ # Hunyuan Pro (flagship)
14
+ hunyuan-pro:
15
+ provider: hunyuan
16
+ model_id: "hunyuan-pro"
17
+ display_name: "混元 Pro"
18
+ verification:
19
+ status: unverified
20
+ verified_at: "2026-01-31"
21
+ source: "documentation"
22
+ notes: "Hunyuan flagship model with best quality."
23
+ context_window: 32768
24
+ capabilities: [chat, tools, streaming]
25
+ status: active
26
+ tags: ["tencent", "hunyuan", "pro", "flagship", "cn"]
27
+ pricing:
28
+ input_per_token: 0.00003
29
+ output_per_token: 0.0001
30
+
31
+ # Hunyuan Standard
32
+ hunyuan-standard:
33
+ provider: hunyuan
34
+ model_id: "hunyuan-standard"
35
+ display_name: "混元 Standard"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-31"
39
+ source: "documentation"
40
+ context_window: 32768
41
+ capabilities: [chat, tools, streaming]
42
+ status: active
43
+ tags: ["tencent", "hunyuan", "standard", "cn"]
44
+ pricing:
45
+ input_per_token: 0.0000045
46
+ output_per_token: 0.000005
47
+
48
+ hunyuan-standard-256k:
49
+ provider: hunyuan
50
+ model_id: "hunyuan-standard-256K"
51
+ display_name: "混元 Standard 256K"
52
+ verification:
53
+ status: unverified
54
+ verified_at: "2026-01-31"
55
+ source: "documentation"
56
+ context_window: 262144
57
+ capabilities: [chat, tools, streaming]
58
+ status: active
59
+ tags: ["tencent", "hunyuan", "standard", "ultra_long_context", "cn"]
60
+ pricing:
61
+ input_per_token: 0.000015
62
+ output_per_token: 0.00006
63
+
64
+ # Hunyuan Lite (cost-effective)
65
+ hunyuan-lite:
66
+ provider: hunyuan
67
+ model_id: "hunyuan-lite"
68
+ display_name: "混元 Lite"
69
+ verification:
70
+ status: unverified
71
+ verified_at: "2026-01-31"
72
+ source: "documentation"
73
+ notes: "Free tier available with rate limits."
74
+ context_window: 4096
75
+ capabilities: [chat, streaming]
76
+ status: active
77
+ tags: ["tencent", "hunyuan", "lite", "free_tier", "cn"]
78
+ pricing:
79
+ input_per_token: 0
80
+ output_per_token: 0
81
+
82
+ # Hunyuan Turbo (balanced speed and quality)
83
+ hunyuan-turbo:
84
+ provider: hunyuan
85
+ model_id: "hunyuan-turbo"
86
+ display_name: "混元 Turbo"
87
+ verification:
88
+ status: unverified
89
+ verified_at: "2026-01-31"
90
+ source: "documentation"
91
+ context_window: 32768
92
+ capabilities: [chat, tools, streaming]
93
+ status: active
94
+ tags: ["tencent", "hunyuan", "turbo", "cn"]
95
+ pricing:
96
+ input_per_token: 0.000015
97
+ output_per_token: 0.00005
98
+
99
+ hunyuan-turbo-latest:
100
+ provider: hunyuan
101
+ model_id: "hunyuan-turbo-latest"
102
+ display_name: "混元 Turbo Latest"
103
+ verification:
104
+ status: unverified
105
+ verified_at: "2026-01-31"
106
+ source: "documentation"
107
+ context_window: 32768
108
+ capabilities: [chat, tools, streaming]
109
+ status: active
110
+ tags: ["tencent", "hunyuan", "turbo", "latest", "cn"]
111
+ pricing:
112
+ input_per_token: 0.000015
113
+ output_per_token: 0.00005
114
+
115
+ # Hunyuan Vision
116
+ hunyuan-vision:
117
+ provider: hunyuan
118
+ model_id: "hunyuan-vision"
119
+ display_name: "混元 Vision"
120
+ verification:
121
+ status: unverified
122
+ verified_at: "2026-01-31"
123
+ source: "documentation"
124
+ context_window: 8192
125
+ capabilities: [chat, vision, streaming]
126
+ status: active
127
+ tags: ["tencent", "hunyuan", "vision", "multimodal", "cn"]
128
+ pricing:
129
+ input_per_token: 0.00002
130
+ output_per_token: 0.00002
131
+
132
+ # Hunyuan Code
133
+ hunyuan-code:
134
+ provider: hunyuan
135
+ model_id: "hunyuan-code"
136
+ display_name: "混元 Code"
137
+ verification:
138
+ status: unverified
139
+ verified_at: "2026-01-31"
140
+ source: "documentation"
141
+ context_window: 8192
142
+ capabilities: [chat, code, streaming]
143
+ status: active
144
+ tags: ["tencent", "hunyuan", "code", "cn"]
145
+ pricing:
146
+ input_per_token: 0.0000045
147
+ output_per_token: 0.000005
148
+
149
+ # Hunyuan Role (角色扮演)
150
+ hunyuan-role:
151
+ provider: hunyuan
152
+ model_id: "hunyuan-role"
153
+ display_name: "混元 Role"
154
+ verification:
155
+ status: unverified
156
+ verified_at: "2026-01-31"
157
+ source: "documentation"
158
+ context_window: 32768
159
+ capabilities: [chat, streaming]
160
+ status: active
161
+ tags: ["tencent", "hunyuan", "role", "roleplay", "cn"]
162
+ pricing:
163
+ input_per_token: 0.0000045
164
+ output_per_token: 0.000005
@@ -0,0 +1,98 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.5"
3
+
4
+ # Jina AI Model Instances
5
+ # Notes: Jina AI provides embeddings, rerank, and reader APIs (not chat LLMs)
6
+ # These models are primarily for RAG (Retrieval-Augmented Generation) infrastructure
7
+
8
+ models:
9
+ # Text Embeddings
10
+ jina-embeddings-v3:
11
+ provider: jina
12
+ model_id: "jina-embeddings-v3"
13
+ display_name: "Jina Embeddings v3"
14
+ verification:
15
+ status: unverified
16
+ source: "manual"
17
+ notes: "State-of-the-art text embeddings"
18
+ context_window: 8192
19
+ capabilities: [embeddings]
20
+ modality: "text"
21
+ pricing:
22
+ input_per_token: null
23
+ output_per_token: null
24
+ status: active
25
+ tags: ["jina", "embeddings", "rag", "search"]
26
+ dimensions: 1024
27
+
28
+ jina-embeddings-v2-base-en:
29
+ provider: jina
30
+ model_id: "jina-embeddings-v2-base-en"
31
+ display_name: "Jina Embeddings v2 Base EN"
32
+ verification:
33
+ status: unverified
34
+ source: "manual"
35
+ notes: "English-only embeddings model"
36
+ context_window: 8192
37
+ capabilities: [embeddings]
38
+ modality: "text"
39
+ pricing:
40
+ input_per_token: null
41
+ output_per_token: null
42
+ status: active
43
+ tags: ["jina", "embeddings", "en", "fast"]
44
+ dimensions: 768
45
+
46
+ # Code Embeddings
47
+ jina-embeddings-v2-base-code:
48
+ provider: jina
49
+ model_id: "jina-embeddings-v2-base-code"
50
+ display_name: "Jina Embeddings v2 Base Code"
51
+ verification:
52
+ status: unverified
53
+ source: "manual"
54
+ notes: "Code embeddings for semantic code search"
55
+ context_window: 8192
56
+ capabilities: [embeddings]
57
+ modality: "code"
58
+ pricing:
59
+ input_per_token: null
60
+ output_per_token: null
61
+ status: active
62
+ tags: ["jina", "embeddings", "code", "search"]
63
+ dimensions: 768
64
+
65
+ # Rerank Models
66
+ jina-reranker-v2-base-en:
67
+ provider: jina
68
+ model_id: "jina-reranker-v2-base-en"
69
+ display_name: "Jina Reranker v2 Base EN"
70
+ verification:
71
+ status: unverified
72
+ source: "manual"
73
+ notes: "Re-ranking model for RAG"
74
+ context_window: 512
75
+ capabilities: [rerank]
76
+ modality: "text"
77
+ pricing:
78
+ input_per_token: null
79
+ output_per_token: null
80
+ status: active
81
+ tags: ["jina", "rerank", "rag", "search"]
82
+
83
+ jina-colbert-v2:
84
+ provider: jina
85
+ model_id: "jina-colbert-v2"
86
+ display_name: "Jina ColBERT v2"
87
+ verification:
88
+ status: unverified
89
+ source: "manual"
90
+ notes: "Late interaction reranking"
91
+ context_window: 512
92
+ capabilities: [rerank]
93
+ modality: "text"
94
+ pricing:
95
+ input_per_token: null
96
+ output_per_token: null
97
+ status: active
98
+ tags: ["jina", "rerank", "colbert", "rag"]
@@ -0,0 +1,130 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Lepton AI Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-29 (reviewed against public Lepton AI documentation only; entries below remain status: unverified)
7
+ #
8
+ # Notes:
9
+ # - Lepton AI provides serverless inference for various models.
10
+ # - Each model has its own subdomain endpoint.
11
+ # - Base URL pattern: https://{model_id}.lepton.run/api/v1
12
+
13
+ models:
14
+ # Llama 3.1 models
15
+ llama3-1-8b:
16
+ provider: lepton
17
+ model_id: "llama3-1-8b"
18
+ display_name: "Llama 3.1 8B"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-29"
22
+ source: "documentation"
23
+ notes: "Endpoint: https://llama3-1-8b.lepton.run/api/v1"
24
+ context_window: 131072
25
+ capabilities: [chat, tools, streaming]
26
+ status: active
27
+ tags: ["meta", "llama", "lepton"]
28
+
29
+ llama3-1-70b:
30
+ provider: lepton
31
+ model_id: "llama3-1-70b"
32
+ display_name: "Llama 3.1 70B"
33
+ verification:
34
+ status: unverified
35
+ verified_at: "2026-01-29"
36
+ source: "documentation"
37
+ notes: "Endpoint: https://llama3-1-70b.lepton.run/api/v1"
38
+ context_window: 131072
39
+ capabilities: [chat, tools, streaming]
40
+ status: active
41
+ tags: ["meta", "llama", "lepton"]
42
+
43
+ llama3-1-405b:
44
+ provider: lepton
45
+ model_id: "llama3-1-405b"
46
+ display_name: "Llama 3.1 405B"
47
+ verification:
48
+ status: unverified
49
+ verified_at: "2026-01-29"
50
+ source: "documentation"
51
+ notes: "Endpoint: https://llama3-1-405b.lepton.run/api/v1"
52
+ context_window: 131072
53
+ capabilities: [chat, tools, streaming]
54
+ status: active
55
+ tags: ["meta", "llama", "lepton", "flagship"]
56
+
57
+ # Mixtral models
58
+ mixtral-8x7b:
59
+ provider: lepton
60
+ model_id: "mixtral-8x7b"
61
+ display_name: "Mixtral 8x7B"
62
+ verification:
63
+ status: unverified
64
+ verified_at: "2026-01-29"
65
+ source: "documentation"
66
+ notes: "Endpoint: https://mixtral-8x7b.lepton.run/api/v1"
67
+ context_window: 32768
68
+ capabilities: [chat, streaming]
69
+ status: active
70
+ tags: ["mistral", "mixtral", "moe", "lepton"]
71
+
72
+ # Qwen models
73
+ qwen2-72b:
74
+ provider: lepton
75
+ model_id: "qwen2-72b"
76
+ display_name: "Qwen 2 72B"
77
+ verification:
78
+ status: unverified
79
+ verified_at: "2026-01-29"
80
+ source: "documentation"
81
+ notes: "Endpoint: https://qwen2-72b.lepton.run/api/v1"
82
+ context_window: 32768
83
+ capabilities: [chat, tools, streaming]
84
+ status: active
85
+ tags: ["alibaba", "qwen", "lepton"]
86
+
87
+ # Mistral models
88
+ mistral-7b:
89
+ provider: lepton
90
+ model_id: "mistral-7b"
91
+ display_name: "Mistral 7B"
92
+ verification:
93
+ status: unverified
94
+ verified_at: "2026-01-29"
95
+ source: "documentation"
96
+ notes: "Endpoint: https://mistral-7b.lepton.run/api/v1"
97
+ context_window: 8192
98
+ capabilities: [chat, streaming]
99
+ status: active
100
+ tags: ["mistral", "lepton"]
101
+
102
+ # WizardLM models
103
+ wizardlm-2-8x22b:
104
+ provider: lepton
105
+ model_id: "wizardlm-2-8x22b"
106
+ display_name: "WizardLM 2 8x22B"
107
+ verification:
108
+ status: unverified
109
+ verified_at: "2026-01-29"
110
+ source: "documentation"
111
+ notes: "Endpoint: https://wizardlm-2-8x22b.lepton.run/api/v1"
112
+ context_window: 65536
113
+ capabilities: [chat, streaming]
114
+ status: active
115
+ tags: ["wizardlm", "moe", "lepton"]
116
+
117
+ # Dolphin models (uncensored)
118
+ dolphin-mixtral-8x7b:
119
+ provider: lepton
120
+ model_id: "dolphin-mixtral-8x7b"
121
+ display_name: "Dolphin Mixtral 8x7B"
122
+ verification:
123
+ status: unverified
124
+ verified_at: "2026-01-29"
125
+ source: "documentation"
126
+ notes: "Endpoint: https://dolphin-mixtral-8x7b.lepton.run/api/v1"
127
+ context_window: 32768
128
+ capabilities: [chat, streaming]
129
+ status: active
130
+ tags: ["dolphin", "mixtral", "lepton", "uncensored"]
@@ -0,0 +1,91 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Groq Llama Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-28 (via Groq list_models: GET /openai/v1/models)
7
+ #
8
+ # Notes:
9
+ # - Groq model ids evolve over time; keep deprecated entries for historical reference.
10
+ models:
11
+ # Historical ids (no longer present in current /models list for this key)
12
+ llama3-8b-8192:
13
+ provider: groq
14
+ model_id: "llama3-8b-8192"
15
+ display_name: "Llama 3 8B (legacy id)"
16
+ verification:
17
+ status: verified
18
+ verified_at: "2026-01-28"
19
+ source: "list_models:/models"
20
+ notes: "Legacy id (not present in current /models list); kept for reference."
21
+ context_window: 8192
22
+ capabilities: [chat, tools, streaming]
23
+ status: deprecated
24
+ tags: ["meta", "llama", "groq", "legacy"]
25
+
26
+ llama3-70b-8192:
27
+ provider: groq
28
+ model_id: "llama3-70b-8192"
29
+ display_name: "Llama 3 70B (legacy id)"
30
+ verification:
31
+ status: verified
32
+ verified_at: "2026-01-28"
33
+ source: "list_models:/models"
34
+ notes: "Legacy id (not present in current /models list); kept for reference."
35
+ context_window: 8192
36
+ capabilities: [chat, tools, streaming]
37
+ status: deprecated
38
+ tags: ["meta", "llama", "groq", "legacy"]
39
+
40
+ # Current Groq-available Llama family (examples)
41
+ llama-3.1-8b-instant:
42
+ provider: groq
43
+ model_id: "llama-3.1-8b-instant"
44
+ display_name: "Llama 3.1 8B Instant"
45
+ verification:
46
+ status: verified
47
+ verified_at: "2026-01-28"
48
+ source: "list_models:/models"
49
+ context_window: 8192
50
+ capabilities: [chat, tools, streaming]
51
+ status: active
52
+ tags: ["meta", "llama", "fast", "groq"]
53
+
54
+ llama-3.3-70b-versatile:
55
+ provider: groq
56
+ model_id: "llama-3.3-70b-versatile"
57
+ display_name: "Llama 3.3 70B Versatile"
58
+ verification:
59
+ status: verified
60
+ verified_at: "2026-01-28"
61
+ source: "list_models:/models"
62
+ context_window: 8192
63
+ capabilities: [chat, tools, streaming]
64
+ status: active
65
+ tags: ["meta", "llama", "groq"]
66
+
67
+ "meta-llama/llama-4-maverick-17b-128e-instruct":
68
+ provider: groq
69
+ model_id: "meta-llama/llama-4-maverick-17b-128e-instruct"
70
+ display_name: "Llama 4 Maverick 17B (128e) Instruct"
71
+ verification:
72
+ status: verified
73
+ verified_at: "2026-01-28"
74
+ source: "list_models:/models"
75
+ context_window: 8192
76
+ capabilities: [chat, tools, streaming]
77
+ status: active
78
+ tags: ["meta", "llama", "groq"]
79
+
80
+ "meta-llama/llama-4-scout-17b-16e-instruct":
81
+ provider: groq
82
+ model_id: "meta-llama/llama-4-scout-17b-16e-instruct"
83
+ display_name: "Llama 4 Scout 17B (16e) Instruct"
84
+ verification:
85
+ status: verified
86
+ verified_at: "2026-01-28"
87
+ source: "list_models:/models"
88
+ context_window: 8192
89
+ capabilities: [chat, tools, streaming]
90
+ status: active
91
+ tags: ["meta", "llama", "groq"]
@@ -0,0 +1,132 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # MiniMax Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (reviewed against public MiniMax platform documentation only; entries below remain status: unverified)
7
+ #
8
+ # Notes:
9
+ # - MiniMax is a leading Chinese AI company.
10
+ # - The abab series is their flagship LLM family.
11
+ # - Official docs: https://platform.minimaxi.com/document/ChatCompletion%20v2
12
+
13
+ models:
14
+ # abab 6.5 series (latest flagship)
15
+ abab6.5s-chat:
16
+ provider: minimax
17
+ model_id: "abab6.5s-chat"
18
+ display_name: "MiniMax abab 6.5s Chat"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-31"
22
+ source: "documentation"
23
+ notes: "Latest flagship model with enhanced capabilities."
24
+ context_window: 245760
25
+ capabilities: [chat, tools, streaming]
26
+ status: active
27
+ tags: ["minimax", "abab", "flagship", "long_context", "cn"]
28
+ pricing:
29
+ input_per_token: 0.000001
30
+ output_per_token: 0.000001
31
+
32
+ abab6.5g-chat:
33
+ provider: minimax
34
+ model_id: "abab6.5g-chat"
35
+ display_name: "MiniMax abab 6.5g Chat"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-31"
39
+ source: "documentation"
40
+ notes: "General purpose flagship model."
41
+ context_window: 8192
42
+ capabilities: [chat, tools, streaming]
43
+ status: active
44
+ tags: ["minimax", "abab", "flagship", "cn"]
45
+ pricing:
46
+ input_per_token: 0.000001
47
+ output_per_token: 0.000001
48
+
49
+ abab6.5t-chat:
50
+ provider: minimax
51
+ model_id: "abab6.5t-chat"
52
+ display_name: "MiniMax abab 6.5t Chat"
53
+ verification:
54
+ status: unverified
55
+ verified_at: "2026-01-31"
56
+ source: "documentation"
57
+ notes: "Optimized for specific tasks."
58
+ context_window: 8192
59
+ capabilities: [chat, tools, streaming]
60
+ status: active
61
+ tags: ["minimax", "abab", "cn"]
62
+ pricing:
63
+ input_per_token: 0.000001
64
+ output_per_token: 0.000001
65
+
66
+ # abab 5.5 series (stable)
67
+ abab5.5s-chat:
68
+ provider: minimax
69
+ model_id: "abab5.5s-chat"
70
+ display_name: "MiniMax abab 5.5s Chat"
71
+ verification:
72
+ status: unverified
73
+ verified_at: "2026-01-31"
74
+ source: "documentation"
75
+ context_window: 16384
76
+ capabilities: [chat, tools, streaming]
77
+ status: active
78
+ tags: ["minimax", "abab", "stable", "cn"]
79
+ pricing:
80
+ input_per_token: 0.000001
81
+ output_per_token: 0.000001
82
+
83
+ abab5.5-chat:
84
+ provider: minimax
85
+ model_id: "abab5.5-chat"
86
+ display_name: "MiniMax abab 5.5 Chat"
87
+ verification:
88
+ status: unverified
89
+ verified_at: "2026-01-31"
90
+ source: "documentation"
91
+ context_window: 16384
92
+ capabilities: [chat, tools, streaming]
93
+ status: active
94
+ tags: ["minimax", "abab", "stable", "cn"]
95
+ pricing:
96
+ input_per_token: 0.0000005
97
+ output_per_token: 0.0000005
98
+
99
+ # Embedding model
100
+ embo-01:
101
+ provider: minimax
102
+ model_id: "embo-01"
103
+ display_name: "MiniMax Embedding"
104
+ verification:
105
+ status: unverified
106
+ verified_at: "2026-01-31"
107
+ source: "documentation"
108
+ context_window: 4096
109
+ capabilities: [embedding]
110
+ status: active
111
+ tags: ["minimax", "embedding", "cn"]
112
+ pricing:
113
+ input_per_token: 0.0000001
114
+ output_per_token: 0
115
+
116
+ # Speech model (T2A - Text to Audio)
117
+ speech-01-turbo:
118
+ provider: minimax
119
+ model_id: "speech-01-turbo"
120
+ display_name: "MiniMax Speech Turbo"
121
+ verification:
122
+ status: unverified
123
+ verified_at: "2026-01-31"
124
+ source: "documentation"
125
+ notes: "Text-to-speech model with multiple voice options."
126
+ context_window: 10000
127
+ capabilities: [speech_synthesis]
128
+ status: active
129
+ tags: ["minimax", "speech", "tts", "cn"]
130
+ pricing:
131
+ input_per_token: 0.000001
132
+ output_per_token: 0