@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,95 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # 百川智能 (Baichuan) Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (based on public Baichuan documentation)
7
+ #
8
+ # Notes:
9
+ # - Baichuan is a leading Chinese AI company.
10
+ # - Known for strong Chinese language understanding.
11
+
12
+ models:
13
+ # Baichuan 4 series (latest)
14
+ Baichuan4:
15
+ provider: baichuan
16
+ model_id: "Baichuan4"
17
+ display_name: "百川 4"
18
+ verification:
19
+ status: unverified
20
+ verified_at: "2026-01-31"
21
+ source: "documentation"
22
+ notes: "Latest flagship model with best performance."
23
+ context_window: 32768
24
+ capabilities: [chat, tools, streaming]
25
+ status: active
26
+ tags: ["baichuan", "flagship", "cn"]
27
+ pricing:
28
+ input_per_token: 0.0001
29
+ output_per_token: 0.0001
30
+
31
+ # Baichuan 3 Turbo series
32
+ Baichuan3-Turbo:
33
+ provider: baichuan
34
+ model_id: "Baichuan3-Turbo"
35
+ display_name: "百川 3 Turbo"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-31"
39
+ source: "documentation"
40
+ context_window: 32768
41
+ capabilities: [chat, tools, streaming]
42
+ status: active
43
+ tags: ["baichuan", "turbo", "cn"]
44
+ pricing:
45
+ input_per_token: 0.000012
46
+ output_per_token: 0.000012
47
+
48
+ Baichuan3-Turbo-128k:
49
+ provider: baichuan
50
+ model_id: "Baichuan3-Turbo-128k"
51
+ display_name: "百川 3 Turbo 128K"
52
+ verification:
53
+ status: unverified
54
+ verified_at: "2026-01-31"
55
+ source: "documentation"
56
+ context_window: 131072
57
+ capabilities: [chat, tools, streaming]
58
+ status: active
59
+ tags: ["baichuan", "turbo", "long_context", "cn"]
60
+ pricing:
61
+ input_per_token: 0.000024
62
+ output_per_token: 0.000024
63
+
64
+ # Baichuan 2 series (legacy)
65
+ Baichuan2-Turbo:
66
+ provider: baichuan
67
+ model_id: "Baichuan2-Turbo"
68
+ display_name: "百川 2 Turbo"
69
+ verification:
70
+ status: unverified
71
+ verified_at: "2026-01-31"
72
+ source: "documentation"
73
+ context_window: 8192
74
+ capabilities: [chat, streaming]
75
+ status: active
76
+ tags: ["baichuan", "turbo", "legacy", "cn"]
77
+ pricing:
78
+ input_per_token: 0.000008
79
+ output_per_token: 0.000008
80
+
81
+ Baichuan2-Turbo-192k:
82
+ provider: baichuan
83
+ model_id: "Baichuan2-Turbo-192k"
84
+ display_name: "百川 2 Turbo 192K"
85
+ verification:
86
+ status: unverified
87
+ verified_at: "2026-01-31"
88
+ source: "documentation"
89
+ context_window: 196608
90
+ capabilities: [chat, streaming]
91
+ status: active
92
+ tags: ["baichuan", "turbo", "ultra_long_context", "cn"]
93
+ pricing:
94
+ input_per_token: 0.000016
95
+ output_per_token: 0.000016
@@ -0,0 +1,99 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Cerebras Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-29 (based on public Cerebras documentation)
7
+ #
8
+ # Notes:
9
+ # - Cerebras offers extremely fast inference using Wafer-Scale Engine technology.
10
+ # - Known for achieving thousands of tokens per second.
11
+ # - Primarily hosts Llama models.
12
+
13
+ models:
14
+ # Llama 3.1 models
15
+ llama3.1-8b:
16
+ provider: cerebras
17
+ model_id: "llama3.1-8b"
18
+ display_name: "Llama 3.1 8B"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-29"
22
+ source: "documentation"
23
+ notes: "Based on public documentation. Cerebras achieves ~2100 tokens/sec."
24
+ context_window: 8192
25
+ capabilities: [chat, tools, streaming]
26
+ status: active
27
+ tags: ["meta", "llama", "cerebras", "fast"]
28
+ pricing:
29
+ input_per_token: 0.0000001
30
+ output_per_token: 0.0000001
31
+
32
+ llama3.1-70b:
33
+ provider: cerebras
34
+ model_id: "llama3.1-70b"
35
+ display_name: "Llama 3.1 70B"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-29"
39
+ source: "documentation"
40
+ notes: "Cerebras achieves ~450 tokens/sec for this model."
41
+ context_window: 8192
42
+ capabilities: [chat, tools, streaming]
43
+ status: active
44
+ tags: ["meta", "llama", "cerebras", "fast"]
45
+ pricing:
46
+ input_per_token: 0.0000006
47
+ output_per_token: 0.0000006
48
+
49
+ # Llama 3.3 models
50
+ llama-3.3-70b:
51
+ provider: cerebras
52
+ model_id: "llama-3.3-70b"
53
+ display_name: "Llama 3.3 70B"
54
+ verification:
55
+ status: unverified
56
+ verified_at: "2026-01-29"
57
+ source: "documentation"
58
+ notes: "Cerebras achieves ~970 tokens/sec for this model."
59
+ context_window: 8192
60
+ capabilities: [chat, tools, streaming]
61
+ status: active
62
+ tags: ["meta", "llama", "cerebras", "fast", "latest"]
63
+ pricing:
64
+ input_per_token: 0.00000085
65
+ output_per_token: 0.00000085
66
+
67
+ # Qwen models
68
+ qwen-2.5-32b:
69
+ provider: cerebras
70
+ model_id: "qwen-2.5-32b"
71
+ display_name: "Qwen 2.5 32B"
72
+ verification:
73
+ status: unverified
74
+ verified_at: "2026-01-29"
75
+ source: "documentation"
76
+ context_window: 8192
77
+ capabilities: [chat, tools, streaming]
78
+ status: active
79
+ tags: ["alibaba", "qwen", "cerebras", "fast"]
80
+ pricing:
81
+ input_per_token: 0.0000003
82
+ output_per_token: 0.0000003
83
+
84
+ # DeepSeek models
85
+ deepseek-r1-distill-llama-70b:
86
+ provider: cerebras
87
+ model_id: "deepseek-r1-distill-llama-70b"
88
+ display_name: "DeepSeek R1 Distill Llama 70B"
89
+ verification:
90
+ status: unverified
91
+ verified_at: "2026-01-29"
92
+ source: "documentation"
93
+ context_window: 8192
94
+ capabilities: [chat, tools, streaming, reasoning]
95
+ status: active
96
+ tags: ["deepseek", "distill", "cerebras", "fast", "reasoning"]
97
+ pricing:
98
+ input_per_token: 0.00000085
99
+ output_per_token: 0.00000085
@@ -0,0 +1,59 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Claude Model Instances
5
+ models:
6
+ claude-3-5-sonnet:
7
+ provider: anthropic
8
+ model_id: "claude-3-5-sonnet-20241022"
9
+ display_name: "Claude 3.5 Sonnet"
10
+ verification:
11
+ status: unverified
12
+ source: "manual"
13
+ context_window: 200000
14
+ capabilities: [chat, vision, tools, streaming, agentic, reasoning]
15
+ pricing:
16
+ input_per_token: 0.000003
17
+ output_per_token: 0.000015
18
+ status: active
19
+ tags: ["claude", "vision", "reasoning", "agentic", "thinking"]
20
+ agentic_capabilities:
21
+ reasoning_effort: "high"
22
+ thinking_blocks: true
23
+ parallel_tools: false
24
+ builtin_tools: ["web_search", "document_analysis"]
25
+
26
+ claude-3-5-haiku:
27
+ provider: anthropic
28
+ model_id: "claude-3-5-haiku-20241022"
29
+ display_name: "Claude 3.5 Haiku"
30
+ verification:
31
+ status: unverified
32
+ source: "manual"
33
+ context_window: 200000
34
+ capabilities: [chat, vision, tools, streaming, agentic]
35
+ pricing:
36
+ input_per_token: 0.0000008
37
+ output_per_token: 0.000004
38
+ status: active
39
+ tags: ["claude", "vision", "fast", "cost-effective", "agentic"]
40
+
41
+ claude-3-opus:
42
+ provider: anthropic
43
+ model_id: "claude-3-opus-20240229"
44
+ display_name: "Claude 3 Opus"
45
+ verification:
46
+ status: unverified
47
+ source: "manual"
48
+ context_window: 200000
49
+ capabilities: [chat, vision, tools, streaming, agentic, reasoning]
50
+ pricing:
51
+ input_per_token: 0.000015
52
+ output_per_token: 0.000075
53
+ status: active
54
+ tags: ["claude", "vision", "premium", "reasoning", "agentic"]
55
+ agentic_capabilities:
56
+ reasoning_effort: "high"
57
+ thinking_blocks: true
58
+ parallel_tools: true
59
+ builtin_tools: ["web_search", "code_execution", "document_analysis"]
@@ -0,0 +1,165 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # Cohere Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (based on public Cohere documentation)
7
+ # FACT-CHECK 2026-02: https://docs.cohere.com/docs/models — command-r, command-r-plus
8
+ # deprecated Sept 15, 2025. Use command-r-plus-08-2024 or command-r-08-2024 (Live).
9
+ #
10
+ # Notes:
11
+ # - Cohere is known for enterprise-grade LLMs.
12
+ # - For Chat API use Live models: command-r-plus-08-2024, command-r-08-2024, command-a-03-2025, etc.
13
+
14
+ models:
15
+ # Command R+ (deprecated Sept 15, 2025 — use command-r-plus-08-2024)
16
+ command-r-plus:
17
+ provider: cohere
18
+ model_id: "command-r-plus"
19
+ display_name: "Command R+ (deprecated)"
20
+ verification:
21
+ status: unverified
22
+ verified_at: "2026-02-04"
23
+ source: "https://docs.cohere.com/docs/models"
24
+ notes: "Deprecated Sept 15, 2025. Use command-r-plus-08-2024."
25
+ context_window: 131072
26
+ capabilities: [chat, tools, streaming]
27
+ status: deprecated
28
+ tags: ["cohere", "command", "flagship", "rag"]
29
+ pricing:
30
+ input_per_token: 0.000003
31
+ output_per_token: 0.000015
32
+
33
+ command-r-plus-08-2024:
34
+ provider: cohere
35
+ model_id: "command-r-plus-08-2024"
36
+ display_name: "Command R+ (08-2024)"
37
+ verification:
38
+ status: unverified
39
+ verified_at: "2026-01-31"
40
+ source: "documentation"
41
+ context_window: 131072
42
+ capabilities: [chat, tools, streaming]
43
+ status: active
44
+ tags: ["cohere", "command", "flagship"]
45
+ pricing:
46
+ input_per_token: 0.0000025
47
+ output_per_token: 0.00001
48
+
49
+ # Command R (deprecated Sept 15, 2025 — use command-r-08-2024)
50
+ command-r:
51
+ provider: cohere
52
+ model_id: "command-r"
53
+ display_name: "Command R (deprecated)"
54
+ verification:
55
+ status: unverified
56
+ verified_at: "2026-02-04"
57
+ source: "https://docs.cohere.com/docs/models"
58
+ notes: "Deprecated Sept 15, 2025. Use command-r-08-2024."
59
+ context_window: 131072
60
+ capabilities: [chat, tools, streaming]
61
+ status: deprecated
62
+ tags: ["cohere", "command", "standard"]
63
+ pricing:
64
+ input_per_token: 0.0000005
65
+ output_per_token: 0.0000015
66
+
67
+ command-r-08-2024:
68
+ provider: cohere
69
+ model_id: "command-r-08-2024"
70
+ display_name: "Command R (08-2024)"
71
+ verification:
72
+ status: unverified
73
+ verified_at: "2026-01-31"
74
+ source: "documentation"
75
+ context_window: 131072
76
+ capabilities: [chat, tools, streaming]
77
+ status: active
78
+ tags: ["cohere", "command"]
79
+ pricing:
80
+ input_per_token: 0.00000015
81
+ output_per_token: 0.0000006
82
+
83
+ # Command Light (legacy)
84
+ command-light:
85
+ provider: cohere
86
+ model_id: "command-light"
87
+ display_name: "Command Light"
88
+ verification:
89
+ status: unverified
90
+ verified_at: "2026-01-31"
91
+ source: "documentation"
92
+ notes: "Lightweight model, being deprecated in favor of Command R."
93
+ context_window: 4096
94
+ capabilities: [chat, streaming]
95
+ status: deprecated
96
+ tags: ["cohere", "command", "light", "legacy"]
97
+ pricing:
98
+ input_per_token: 0.0000003
99
+ output_per_token: 0.0000006
100
+
101
+ # Embed models
102
+ embed-english-v3.0:
103
+ provider: cohere
104
+ model_id: "embed-english-v3.0"
105
+ display_name: "Embed English v3"
106
+ verification:
107
+ status: unverified
108
+ verified_at: "2026-01-31"
109
+ source: "documentation"
110
+ context_window: 512
111
+ capabilities: [embedding]
112
+ status: active
113
+ tags: ["cohere", "embed", "english"]
114
+ pricing:
115
+ input_per_token: 0.0000001
116
+ output_per_token: 0
117
+
118
+ embed-multilingual-v3.0:
119
+ provider: cohere
120
+ model_id: "embed-multilingual-v3.0"
121
+ display_name: "Embed Multilingual v3"
122
+ verification:
123
+ status: unverified
124
+ verified_at: "2026-01-31"
125
+ source: "documentation"
126
+ context_window: 512
127
+ capabilities: [embedding]
128
+ status: active
129
+ tags: ["cohere", "embed", "multilingual"]
130
+ pricing:
131
+ input_per_token: 0.0000001
132
+ output_per_token: 0
133
+
134
+ # Rerank models
135
+ rerank-english-v3.0:
136
+ provider: cohere
137
+ model_id: "rerank-english-v3.0"
138
+ display_name: "Rerank English v3"
139
+ verification:
140
+ status: unverified
141
+ verified_at: "2026-01-31"
142
+ source: "documentation"
143
+ context_window: 4096
144
+ capabilities: [rerank]
145
+ status: active
146
+ tags: ["cohere", "rerank", "english"]
147
+ pricing:
148
+ input_per_token: 0.000002
149
+ output_per_token: 0
150
+
151
+ rerank-multilingual-v3.0:
152
+ provider: cohere
153
+ model_id: "rerank-multilingual-v3.0"
154
+ display_name: "Rerank Multilingual v3"
155
+ verification:
156
+ status: unverified
157
+ verified_at: "2026-01-31"
158
+ source: "documentation"
159
+ context_window: 4096
160
+ capabilities: [rerank]
161
+ status: active
162
+ tags: ["cohere", "rerank", "multilingual"]
163
+ pricing:
164
+ input_per_token: 0.000002
165
+ output_per_token: 0
@@ -0,0 +1,29 @@
1
+ $schema: ../../schemas/v1.json
2
+ protocol_version: "1.1"
3
+ models:
4
+ "deepinfra/meta-llama/Meta-Llama-3-8B-Instruct":
5
+ provider: "deepinfra"
6
+ model_id: "meta-llama/Meta-Llama-3-8B-Instruct"
7
+ verification:
8
+ status: unverified
9
+ source: "manual"
10
+ context_window: 8192
11
+ capabilities: ["chat"]
12
+
13
+ "deepinfra/mistralai/Mistral-7B-Instruct-v0.3":
14
+ provider: "deepinfra"
15
+ model_id: "mistralai/Mistral-7B-Instruct-v0.3"
16
+ verification:
17
+ status: unverified
18
+ source: "manual"
19
+ context_window: 32768
20
+ capabilities: ["chat", "tools"]
21
+
22
+ "deepinfra/microsoft/WizardLM-2-8x22B":
23
+ provider: "deepinfra"
24
+ model_id: "microsoft/WizardLM-2-8x22B"
25
+ verification:
26
+ status: unverified
27
+ source: "manual"
28
+ context_window: 65536
29
+ capabilities: ["chat"]
@@ -0,0 +1,32 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ models:
5
+ deepseek-chat:
6
+ provider: deepseek
7
+ model_id: "deepseek-chat"
8
+ display_name: "DeepSeek Chat"
9
+ verification:
10
+ status: verified
11
+ verified_at: "2026-01-28"
12
+ source: "list_models:/models"
13
+ context_window: 32768
14
+ capabilities: [chat, streaming, tools]
15
+ pricing:
16
+ input_per_token: 0.00000014 # example value (illustrative; confirm against official pricing)
17
+ output_per_token: 0.00000028 # example value (illustrative; confirm against official pricing)
18
+ status: active
19
+ tags: ["deepseek", "chat", "tools"]
20
+
21
+ deepseek-reasoner:
22
+ provider: deepseek
23
+ model_id: "deepseek-reasoner"
24
+ display_name: "DeepSeek Reasoner"
25
+ verification:
26
+ status: verified
27
+ verified_at: "2026-03-06"
28
+ source: "deepseek-console"
29
+ context_window: 64000
30
+ capabilities: [chat, streaming, tools, reasoning]
31
+ status: active
32
+ tags: ["deepseek", "reasoning", "tools"]
@@ -0,0 +1,129 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+ protocol_version: "1.1"
3
+
4
+ # 字节跳动豆包 (Doubao) Model Instances
5
+ #
6
+ # VERIFIED_AT: 2026-01-31 (based on public Volcengine documentation)
7
+ #
8
+ # Notes:
9
+ # - Doubao (豆包) is ByteDance's flagship LLM series.
10
+ # - Accessed via the Volcengine (火山引擎) platform.
11
+ # - Model IDs are endpoint IDs that must first be created in the Volcengine console.
12
+
13
+ models:
14
+ # Doubao Pro series
15
+ doubao-pro-32k:
16
+ provider: doubao
17
+ model_id: "doubao-pro-32k"
18
+ display_name: "豆包 Pro 32K"
19
+ verification:
20
+ status: unverified
21
+ verified_at: "2026-01-31"
22
+ source: "documentation"
23
+ notes: "Based on Volcengine documentation. Endpoint ID required."
24
+ context_window: 32768
25
+ capabilities: [chat, tools, streaming]
26
+ status: active
27
+ tags: ["bytedance", "doubao", "pro", "cn"]
28
+ pricing:
29
+ input_per_token: 0.0000008
30
+ output_per_token: 0.000002
31
+
32
+ doubao-pro-128k:
33
+ provider: doubao
34
+ model_id: "doubao-pro-128k"
35
+ display_name: "豆包 Pro 128K"
36
+ verification:
37
+ status: unverified
38
+ verified_at: "2026-01-31"
39
+ source: "documentation"
40
+ context_window: 131072
41
+ capabilities: [chat, tools, streaming]
42
+ status: active
43
+ tags: ["bytedance", "doubao", "pro", "long_context", "cn"]
44
+ pricing:
45
+ input_per_token: 0.000005
46
+ output_per_token: 0.000009
47
+
48
+ doubao-pro-256k:
49
+ provider: doubao
50
+ model_id: "doubao-pro-256k"
51
+ display_name: "豆包 Pro 256K"
52
+ verification:
53
+ status: unverified
54
+ verified_at: "2026-01-31"
55
+ source: "documentation"
56
+ context_window: 262144
57
+ capabilities: [chat, tools, streaming]
58
+ status: active
59
+ tags: ["bytedance", "doubao", "pro", "ultra_long_context", "cn"]
60
+ pricing:
61
+ input_per_token: 0.000005
62
+ output_per_token: 0.000009
63
+
64
+ # Doubao Lite series (cost-effective)
65
+ doubao-lite-32k:
66
+ provider: doubao
67
+ model_id: "doubao-lite-32k"
68
+ display_name: "豆包 Lite 32K"
69
+ verification:
70
+ status: unverified
71
+ verified_at: "2026-01-31"
72
+ source: "documentation"
73
+ context_window: 32768
74
+ capabilities: [chat, streaming]
75
+ status: active
76
+ tags: ["bytedance", "doubao", "lite", "cost_effective", "cn"]
77
+ pricing:
78
+ input_per_token: 0.0000003
79
+ output_per_token: 0.0000006
80
+
81
+ doubao-lite-128k:
82
+ provider: doubao
83
+ model_id: "doubao-lite-128k"
84
+ display_name: "豆包 Lite 128K"
85
+ verification:
86
+ status: unverified
87
+ verified_at: "2026-01-31"
88
+ source: "documentation"
89
+ context_window: 131072
90
+ capabilities: [chat, streaming]
91
+ status: active
92
+ tags: ["bytedance", "doubao", "lite", "long_context", "cn"]
93
+ pricing:
94
+ input_per_token: 0.0000008
95
+ output_per_token: 0.000001
96
+
97
+ # Doubao Vision
98
+ doubao-vision-pro-32k:
99
+ provider: doubao
100
+ model_id: "doubao-vision-pro-32k"
101
+ display_name: "豆包 Vision Pro 32K"
102
+ verification:
103
+ status: unverified
104
+ verified_at: "2026-01-31"
105
+ source: "documentation"
106
+ context_window: 32768
107
+ capabilities: [chat, vision, streaming]
108
+ status: active
109
+ tags: ["bytedance", "doubao", "vision", "multimodal", "cn"]
110
+ pricing:
111
+ input_per_token: 0.000003
112
+ output_per_token: 0.000009
113
+
114
+ # Doubao Embedding
115
+ doubao-embedding:
116
+ provider: doubao
117
+ model_id: "doubao-embedding"
118
+ display_name: "豆包 Embedding"
119
+ verification:
120
+ status: unverified
121
+ verified_at: "2026-01-31"
122
+ source: "documentation"
123
+ context_window: 4096
124
+ capabilities: [embedding]
125
+ status: active
126
+ tags: ["bytedance", "doubao", "embedding", "cn"]
127
+ pricing:
128
+ input_per_token: 0.0000005
129
+ output_per_token: 0