@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,100 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Mistral Model Instances
5
+ # Reference: https://docs.mistral.ai/api/
6
+
7
+ models:
8
+ mistral-small-latest:
9
+ provider: mistral
10
+ model_id: "mistral-small-latest"
11
+ display_name: "Mistral Small"
12
+ verification:
13
+ status: verified
14
+ verified_at: "2026-01-28"
15
+ source: "list_models:/models"
16
+ context_window: 32000
17
+ capabilities: [chat, tools, streaming, parallel_tools]
18
+ status: active
19
+ tags: ["mistral", "small", "tools", "latest"]
20
+
21
+ mistral-medium-latest:
22
+ provider: mistral
23
+ model_id: "mistral-medium-latest"
24
+ display_name: "Mistral Medium"
25
+ verification:
26
+ status: verified
27
+ verified_at: "2026-01-28"
28
+ source: "list_models:/models"
29
+ context_window: 32000
30
+ capabilities: [chat, tools, streaming, parallel_tools]
31
+ status: active
32
+ tags: ["mistral", "medium", "tools", "latest"]
33
+
34
+ mistral-large-latest:
35
+ provider: mistral
36
+ model_id: "mistral-large-latest"
37
+ display_name: "Mistral Large"
38
+ verification:
39
+ status: verified
40
+ verified_at: "2026-01-28"
41
+ source: "list_models:/models"
42
+ context_window: 32000
43
+ capabilities: [chat, tools, streaming, parallel_tools, agentic]
44
+ status: active
45
+ tags: ["mistral", "large", "tools", "agentic", "latest"]
46
+
47
+ pixtral-12b-latest:
48
+ provider: mistral
49
+ model_id: "pixtral-12b-latest"
50
+ display_name: "Pixtral 12B"
51
+ verification:
52
+ status: verified
53
+ verified_at: "2026-01-28"
54
+ source: "list_models:/models"
55
+ context_window: 128000
56
+ capabilities: [chat, vision, tools, streaming, parallel_tools]
57
+ status: active
58
+ tags: ["mistral", "pixtral", "vision", "12b", "latest"]
59
+
60
+ pixtral-large-latest:
61
+ provider: mistral
62
+ model_id: "pixtral-large-latest"
63
+ display_name: "Pixtral Large"
64
+ verification:
65
+ status: verified
66
+ verified_at: "2026-01-28"
67
+ source: "list_models:/models"
68
+ context_window: 128000
69
+ capabilities: [chat, vision, tools, streaming, parallel_tools, agentic]
70
+ status: active
71
+ tags: ["mistral", "pixtral", "vision", "large", "agentic", "latest"]
72
+
73
+ open-mistral-7b:
74
+ provider: mistral
75
+ model_id: "open-mistral-7b"
76
+ display_name: "Open Mistral 7B"
77
+ verification:
78
+ status: verified
79
+ verified_at: "2026-01-28"
80
+ source: "list_models:/models"
81
+ context_window: 32000
82
+ capabilities: [chat, streaming]
83
+ status: active
84
+ tags: ["mistral", "open", "7b", "base"]
85
+
86
+ # NOTE: `open-mixtral-8x7b` is not present in the current /v1/models list for this provider.
87
+ # Keep it removed to prevent 404 model_not_found. If it returns, re-add with evidence.
88
+
89
+ mistral-tiny:
90
+ provider: mistral
91
+ model_id: "mistral-tiny"
92
+ display_name: "Mistral Tiny"
93
+ verification:
94
+ status: verified
95
+ verified_at: "2026-01-28"
96
+ source: "list_models:/models"
97
+ context_window: 32000
98
+ capabilities: [chat, streaming]
99
+ status: active
100
+ tags: ["mistral", "tiny", "cost-effective"]
@@ -0,0 +1,97 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # 月之暗面 Kimi (Moonshot) Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (based on public Moonshot documentation)
7
+ #
8
+ # Notes:
9
+ # - Kimi is known for ultra-long context windows.
10
+ # - Supports file understanding and web search.
11
+
12
+ models:
13
+ # Moonshot v1 series
14
+ moonshot-v1-8k:
15
+ provider: moonshot
16
+ model_id: "moonshot-v1-8k"
17
+ display_name: "Kimi v1 8K"
18
+ verification:
19
+ status: unverified
20
+ verified_at: "2026-01-31"
21
+ source: "documentation"
22
+ notes: "Standard context model, cost-effective."
23
+ context_window: 8192
24
+ capabilities: [chat, tools, streaming]
25
+ status: active
26
+ tags: ["moonshot", "kimi", "cn"]
27
+ pricing:
28
+ input_per_token: 0.000012
29
+ output_per_token: 0.000012
30
+
31
+ moonshot-v1-32k:
32
+ provider: moonshot
33
+ model_id: "moonshot-v1-32k"
34
+ display_name: "Kimi v1 32K"
35
+ verification:
36
+ status: unverified
37
+ verified_at: "2026-01-31"
38
+ source: "documentation"
39
+ context_window: 32768
40
+ capabilities: [chat, tools, streaming]
41
+ status: active
42
+ tags: ["moonshot", "kimi", "long_context", "cn"]
43
+ pricing:
44
+ input_per_token: 0.000024
45
+ output_per_token: 0.000024
46
+
47
+ moonshot-v1-128k:
48
+ provider: moonshot
49
+ model_id: "moonshot-v1-128k"
50
+ display_name: "Kimi v1 128K"
51
+ verification:
52
+ status: unverified
53
+ verified_at: "2026-01-31"
54
+ source: "documentation"
55
+ context_window: 131072
56
+ capabilities: [chat, tools, streaming]
57
+ status: active
58
+ tags: ["moonshot", "kimi", "ultra_long_context", "cn"]
59
+ pricing:
60
+ input_per_token: 0.00006
61
+ output_per_token: 0.00006
62
+
63
+ # Kimi latest alias (tracks the newest Kimi model, with enhanced capabilities)
64
+ kimi-latest:
65
+ provider: moonshot
66
+ model_id: "kimi-latest"
67
+ display_name: "Kimi Latest"
68
+ verification:
69
+ status: unverified
70
+ verified_at: "2026-01-31"
71
+ source: "documentation"
72
+ notes: "Alias for the latest Kimi model."
73
+ context_window: 131072
74
+ capabilities: [chat, tools, vision, streaming]
75
+ status: active
76
+ tags: ["moonshot", "kimi", "latest", "cn"]
77
+ pricing:
78
+ input_per_token: 0.00006
79
+ output_per_token: 0.00006
80
+
81
+ # Moonshot auto model (selects the context window automatically based on input)
82
+ moonshot-v1-auto:
83
+ provider: moonshot
84
+ model_id: "moonshot-v1-auto"
85
+ display_name: "Kimi v1 Auto"
86
+ verification:
87
+ status: unverified
88
+ verified_at: "2026-01-31"
89
+ source: "documentation"
90
+ notes: "Auto-selects context window based on input."
91
+ context_window: 131072
92
+ capabilities: [chat, tools, streaming]
93
+ status: active
94
+ tags: ["moonshot", "kimi", "auto", "cn"]
95
+ pricing:
96
+ input_per_token: 0.000024
97
+ output_per_token: 0.000024
@@ -0,0 +1,118 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # NVIDIA API Catalog – top LLMs, including the latest MiniMax and Kimi models (verified via the official API reference)
5
+ # Source: https://docs.api.nvidia.com/nim/reference/llm-apis
6
+ # Catalog: https://build.nvidia.com/explore/discover
7
+ models:
8
+ nvidia-nemotron-4-340b-instruct:
9
+ provider: nvidia
10
+ model_id: "nvidia-nemotron-4-340b-instruct"
11
+ display_name: "Nemotron 4 340B Instruct"
12
+ verification:
13
+ status: verified
14
+ verified_at: "2026-02-04"
15
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
16
+ notes: "NVIDIA flagship 340B chat model; OpenAI-compatible chat completions."
17
+ context_window: 128000
18
+ capabilities: [chat, vision, tools, streaming, agentic, parallel_tools, reasoning]
19
+ status: active
20
+ tags: ["nvidia", "nemotron", "flagship", "reasoning", "tools"]
21
+
22
+ "nvidia/llama3-chatqa-1.5-70b":
23
+ provider: nvidia
24
+ model_id: "nvidia/llama3-chatqa-1.5-70b"
25
+ display_name: "Llama 3 ChatQA 1.5 70B"
26
+ verification:
27
+ status: verified
28
+ verified_at: "2026-02-04"
29
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
30
+ notes: "70B chat QA model on NVIDIA API Catalog."
31
+ context_window: 32768
32
+ capabilities: [chat, tools, streaming, agentic]
33
+ status: active
34
+ tags: ["nvidia", "llama", "chatqa", "70b"]
35
+
36
+ "deepseek-ai/deepseek-r1":
37
+ provider: nvidia
38
+ model_id: "deepseek-ai/deepseek-r1"
39
+ display_name: "DeepSeek R1 (via NVIDIA)"
40
+ verification:
41
+ status: verified
42
+ verified_at: "2026-02-04"
43
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
44
+ notes: "Reasoning model available on NVIDIA API Catalog."
45
+ context_window: 64000
46
+ capabilities: [chat, tools, streaming, reasoning]
47
+ status: active
48
+ tags: ["deepseek", "reasoning", "nvidia-catalog"]
49
+
50
+ "mistralai/mistral-large-2-instruct":
51
+ provider: nvidia
52
+ model_id: "mistralai/mistral-large-2-instruct"
53
+ display_name: "Mistral Large 2 Instruct (via NVIDIA)"
54
+ verification:
55
+ status: verified
56
+ verified_at: "2026-02-04"
57
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
58
+ notes: "Mistral flagship instruct model on NVIDIA API Catalog."
59
+ context_window: 128000
60
+ capabilities: [chat, vision, tools, streaming, agentic]
61
+ status: active
62
+ tags: ["mistral", "instruct", "nvidia-catalog"]
63
+
64
+ "mistralai/mixtral-8x22b-instruct":
65
+ provider: nvidia
66
+ model_id: "mistralai/mixtral-8x22b-instruct"
67
+ display_name: "Mixtral 8x22B Instruct (via NVIDIA)"
68
+ verification:
69
+ status: verified
70
+ verified_at: "2026-02-04"
71
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
72
+ notes: "MoE 8x22B instruct model on NVIDIA API Catalog."
73
+ context_window: 65536
74
+ capabilities: [chat, tools, streaming, agentic]
75
+ status: active
76
+ tags: ["mistral", "mixtral", "moe", "nvidia-catalog"]
77
+
78
+ "meta/llama3-70b":
79
+ provider: nvidia
80
+ model_id: "meta/llama3-70b"
81
+ display_name: "Llama 3 70B (via NVIDIA)"
82
+ verification:
83
+ status: verified
84
+ verified_at: "2026-02-04"
85
+ source: "https://docs.api.nvidia.com/nim/reference/llm-apis"
86
+ notes: "Meta Llama 3 70B on NVIDIA API Catalog."
87
+ context_window: 8192
88
+ capabilities: [chat, tools, streaming]
89
+ status: active
90
+ tags: ["meta", "llama", "70b", "nvidia-catalog"]
91
+
92
+ "moonshotai/kimi-k2-instruct":
93
+ provider: nvidia
94
+ model_id: "moonshotai/kimi-k2-instruct"
95
+ display_name: "Kimi K2 Instruct (via NVIDIA)"
96
+ verification:
97
+ status: verified
98
+ verified_at: "2026-02-04"
99
+ source: "https://docs.api.nvidia.com/nim/reference/moonshotai-kimi-k2-instruct"
100
+ notes: "Moonshot Kimi K2 MoE 1T/32B; agentic, tools, 128K context on NVIDIA API Catalog."
101
+ context_window: 128000
102
+ capabilities: [chat, tools, streaming, agentic, reasoning]
103
+ status: active
104
+ tags: ["moonshot", "kimi", "moe", "nvidia-catalog", "agentic"]
105
+
106
+ "minimaxai/minimax-m2":
107
+ provider: nvidia
108
+ model_id: "minimaxai/minimax-m2"
109
+ display_name: "MiniMax M2 (via NVIDIA)"
110
+ verification:
111
+ status: verified
112
+ verified_at: "2026-02-04"
113
+ source: "https://docs.api.nvidia.com/nim/reference/minimaxai-minimax-m2"
114
+ notes: "MiniMax M2 MoE 230B/10B; coding, reasoning, tool-use, 128K context on NVIDIA API Catalog."
115
+ context_window: 128000
116
+ capabilities: [chat, tools, streaming, agentic, reasoning]
117
+ status: active
118
+ tags: ["minimax", "moe", "nvidia-catalog", "coding", "agentic"]
@@ -0,0 +1,59 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.5"
3
+
4
+ # Writer Model Instances (Palmyra Series)
5
+ # Notes: Writer provides enterprise-focused AI writing and content generation
6
+
7
+ models:
8
+ palmyra-x-004:
9
+ provider: writer
10
+ model_id: "palmyra-x-004"
11
+ display_name: "Palmyra X 004"
12
+ verification:
13
+ status: unverified
14
+ source: "manual"
15
+ notes: "Flagship model for enterprise writing"
16
+ context_window: 128000
17
+ capabilities: [chat, tools, streaming, agentic, reasoning]
18
+ pricing:
19
+ input_per_token: null
20
+ output_per_token: null
21
+ status: active
22
+ tags: ["palmyra", "writer", "enterprise", "writing", "reasoning"]
23
+ agentic_capabilities:
24
+ reasoning_effort: "medium"
25
+ thinking_blocks: false
26
+ parallel_tools: false
27
+ builtin_tools: ["web_search", "fact_check", "compliance"]
28
+
29
+ palmyra-med:
30
+ provider: writer
31
+ model_id: "palmyra-med"
32
+ display_name: "Palmyra Med"
33
+ verification:
34
+ status: unverified
35
+ source: "manual"
36
+ notes: "Specialized for medical and healthcare content"
37
+ context_window: 64000
38
+ capabilities: [chat, tools, streaming, agentic]
39
+ pricing:
40
+ input_per_token: null
41
+ output_per_token: null
42
+ status: active
43
+ tags: ["palmyra", "writer", "medical", "healthcare", "enterprise"]
44
+
45
+ palmyra-fin:
46
+ provider: writer
47
+ model_id: "palmyra-fin"
48
+ display_name: "Palmyra Fin"
49
+ verification:
50
+ status: unverified
51
+ source: "manual"
52
+ notes: "Specialized for financial content"
53
+ context_window: 64000
54
+ capabilities: [chat, tools, streaming, agentic]
55
+ pricing:
56
+ input_per_token: null
57
+ output_per_token: null
58
+ status: active
59
+ tags: ["palmyra", "writer", "finance", "enterprise"]
@@ -0,0 +1,97 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Perplexity Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (based on public Perplexity documentation)
7
+ #
8
+ # Notes:
9
+ # - Perplexity is known for search-augmented AI.
10
+ # - "Online" models include real-time web search.
11
+ # - "Chat" models are standard conversational models.
12
+
13
+ models:
14
+ # Sonar Online models (with web search)
15
+ llama-3.1-sonar-small-128k-online:
16
+ provider: perplexity
17
+ model_id: "llama-3.1-sonar-small-128k-online"
18
+ display_name: "Sonar Small Online (8B)"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-31"
22
+ source: "documentation"
23
+ notes: "Llama 3.1 8B with real-time web search."
24
+ context_window: 127072
25
+ capabilities: [chat, streaming, online_search]
26
+ status: active
27
+ tags: ["perplexity", "sonar", "online", "search"]
28
+ pricing:
29
+ input_per_token: 0.0000002
30
+ output_per_token: 0.0000002
31
+
32
+ llama-3.1-sonar-large-128k-online:
33
+ provider: perplexity
34
+ model_id: "llama-3.1-sonar-large-128k-online"
35
+ display_name: "Sonar Large Online (70B)"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-31"
39
+ source: "documentation"
40
+ notes: "Llama 3.1 70B with real-time web search."
41
+ context_window: 127072
42
+ capabilities: [chat, streaming, online_search]
43
+ status: active
44
+ tags: ["perplexity", "sonar", "online", "search", "large"]
45
+ pricing:
46
+ input_per_token: 0.000001
47
+ output_per_token: 0.000001
48
+
49
+ llama-3.1-sonar-huge-128k-online:
50
+ provider: perplexity
51
+ model_id: "llama-3.1-sonar-huge-128k-online"
52
+ display_name: "Sonar Huge Online (405B)"
53
+ verification:
54
+ status: unverified
55
+ verified_at: "2026-01-31"
56
+ source: "documentation"
57
+ notes: "Llama 3.1 405B with real-time web search."
58
+ context_window: 127072
59
+ capabilities: [chat, streaming, online_search]
60
+ status: active
61
+ tags: ["perplexity", "sonar", "online", "search", "flagship"]
62
+ pricing:
63
+ input_per_token: 0.000005
64
+ output_per_token: 0.000005
65
+
66
+ # Sonar Chat models (without web search)
67
+ llama-3.1-sonar-small-128k-chat:
68
+ provider: perplexity
69
+ model_id: "llama-3.1-sonar-small-128k-chat"
70
+ display_name: "Sonar Small Chat (8B)"
71
+ verification:
72
+ status: unverified
73
+ verified_at: "2026-01-31"
74
+ source: "documentation"
75
+ context_window: 131072
76
+ capabilities: [chat, streaming]
77
+ status: active
78
+ tags: ["perplexity", "sonar", "chat"]
79
+ pricing:
80
+ input_per_token: 0.0000002
81
+ output_per_token: 0.0000002
82
+
83
+ llama-3.1-sonar-large-128k-chat:
84
+ provider: perplexity
85
+ model_id: "llama-3.1-sonar-large-128k-chat"
86
+ display_name: "Sonar Large Chat (70B)"
87
+ verification:
88
+ status: unverified
89
+ verified_at: "2026-01-31"
90
+ source: "documentation"
91
+ context_window: 131072
92
+ capabilities: [chat, streaming]
93
+ status: active
94
+ tags: ["perplexity", "sonar", "chat", "large"]
95
+ pricing:
96
+ input_per_token: 0.000001
97
+ output_per_token: 0.000001
@@ -0,0 +1,27 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Qwen Model Instances
5
+ models:
6
+ qwen-max:
7
+ provider: qwen
8
+ model_id: "qwen-max"
9
+ display_name: "Qwen Max"
10
+ verification:
11
+ status: unverified
12
+ source: "manual"
13
+ context_window: 262144
14
+ capabilities: [chat, tools, streaming]
15
+ status: active
16
+ tags: ["alibaba", "qwen", "strong"]
17
+
18
+ qwen-turbo:
19
+ provider: qwen
20
+ model_id: "qwen-turbo"
21
+ display_name: "Qwen Turbo"
22
+ verification:
23
+ status: unverified
24
+ source: "manual"
25
+ capabilities: [chat, vision, tools, streaming, agentic]
26
+ status: active
27
+ tags: ["alibaba", "qwen", "fast"]
@@ -0,0 +1,136 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Replicate Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-29 (based on public Replicate documentation)
7
+ #
8
+ # Notes:
9
+ # - Replicate is a model hosting platform with async prediction API.
10
+ # - Model IDs follow the pattern: {owner}/{model_name}
11
+ # - Supports both native Replicate API and OpenAI-compatible endpoints for some models.
12
+
13
+ models:
14
+ # Meta Llama models
15
+ "meta/llama-2-70b-chat":
16
+ provider: replicate
17
+ model_id: "meta/llama-2-70b-chat"
18
+ display_name: "Llama 2 70B Chat"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-29"
22
+ source: "documentation"
23
+ notes: "Based on public documentation. Runtime verification recommended."
24
+ context_window: 4096
25
+ capabilities: [chat, streaming]
26
+ status: active
27
+ tags: ["meta", "llama", "replicate", "chat"]
28
+
29
+ "meta/meta-llama-3-70b-instruct":
30
+ provider: replicate
31
+ model_id: "meta/meta-llama-3-70b-instruct"
32
+ display_name: "Llama 3 70B Instruct"
33
+ verification:
34
+ status: unverified
35
+ verified_at: "2026-01-29"
36
+ source: "documentation"
37
+ context_window: 8192
38
+ capabilities: [chat, streaming]
39
+ status: active
40
+ tags: ["meta", "llama", "replicate", "instruct"]
41
+
42
+ "meta/meta-llama-3.1-405b-instruct":
43
+ provider: replicate
44
+ model_id: "meta/meta-llama-3.1-405b-instruct"
45
+ display_name: "Llama 3.1 405B Instruct"
46
+ verification:
47
+ status: unverified
48
+ verified_at: "2026-01-29"
49
+ source: "documentation"
50
+ context_window: 131072
51
+ capabilities: [chat, streaming]
52
+ status: active
53
+ tags: ["meta", "llama", "replicate", "instruct", "flagship"]
54
+
55
+ # Mistral models
56
+ "mistralai/mistral-7b-instruct-v0.2":
57
+ provider: replicate
58
+ model_id: "mistralai/mistral-7b-instruct-v0.2"
59
+ display_name: "Mistral 7B Instruct v0.2"
60
+ verification:
61
+ status: unverified
62
+ verified_at: "2026-01-29"
63
+ source: "documentation"
64
+ context_window: 8192
65
+ capabilities: [chat, streaming]
66
+ status: active
67
+ tags: ["mistral", "replicate", "instruct"]
68
+
69
+ "mistralai/mixtral-8x7b-instruct-v0.1":
70
+ provider: replicate
71
+ model_id: "mistralai/mixtral-8x7b-instruct-v0.1"
72
+ display_name: "Mixtral 8x7B Instruct"
73
+ verification:
74
+ status: unverified
75
+ verified_at: "2026-01-29"
76
+ source: "documentation"
77
+ context_window: 32768
78
+ capabilities: [chat, streaming]
79
+ status: active
80
+ tags: ["mistral", "mixtral", "moe", "replicate"]
81
+
82
+ # Stability AI models (text)
83
+ "stability-ai/stablelm-tuned-alpha-7b":
84
+ provider: replicate
85
+ model_id: "stability-ai/stablelm-tuned-alpha-7b"
86
+ display_name: "StableLM Tuned Alpha 7B"
87
+ verification:
88
+ status: unverified
89
+ verified_at: "2026-01-29"
90
+ source: "documentation"
91
+ context_window: 4096
92
+ capabilities: [chat, streaming]
93
+ status: deprecated
94
+ tags: ["stability", "stablelm", "replicate"]
95
+
96
+ # Snowflake models
97
+ "snowflake/snowflake-arctic-instruct":
98
+ provider: replicate
99
+ model_id: "snowflake/snowflake-arctic-instruct"
100
+ display_name: "Snowflake Arctic Instruct"
101
+ verification:
102
+ status: unverified
103
+ verified_at: "2026-01-29"
104
+ source: "documentation"
105
+ context_window: 4096
106
+ capabilities: [chat, streaming]
107
+ status: active
108
+ tags: ["snowflake", "arctic", "replicate", "enterprise"]
109
+
110
+ # Vision-language models
111
+ "yorickvp/llava-13b":
112
+ provider: replicate
113
+ model_id: "yorickvp/llava-13b"
114
+ display_name: "LLaVA 13B"
115
+ verification:
116
+ status: unverified
117
+ verified_at: "2026-01-29"
118
+ source: "documentation"
119
+ context_window: 2048
120
+ capabilities: [chat, vision, streaming]
121
+ status: active
122
+ tags: ["llava", "vision", "multimodal", "replicate"]
123
+
124
+ # Code models
125
+ "meta/codellama-70b-instruct":
126
+ provider: replicate
127
+ model_id: "meta/codellama-70b-instruct"
128
+ display_name: "Code Llama 70B Instruct"
129
+ verification:
130
+ status: unverified
131
+ verified_at: "2026-01-29"
132
+ source: "documentation"
133
+ context_window: 16384
134
+ capabilities: [chat, code, streaming]
135
+ status: active
136
+ tags: ["meta", "codellama", "code", "replicate"]