@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,172 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: minimax
4
+ protocol_version: "1.5"
5
+
6
+ name: MiniMax
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://platform.minimaxi.com/document/ChatCompletion%20v2"
11
+ support_contact: "https://www.minimaxi.com/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://api.minimax.chat/v1"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "MINIMAX_API_KEY"
21
+
22
+ payload_format: "openai_style"
23
+
24
+ # MiniMax uses OpenAI-compatible API
25
+ api_families: ["chat_completions"]
26
+ default_api_family: "chat_completions"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+
40
+ termination:
41
+ source_field: "finish_reason"
42
+ mapping:
43
+ stop: "end_turn"
44
+ length: "max_tokens"
45
+ tool_calls: "tool_use"
46
+ content_filter: "refusal"
47
+ notes:
48
+ - "OpenAI-compatible finish_reason."
49
+ - "MiniMax is a leading Chinese AI company known for abab model series."
50
+
51
+ tooling:
52
+ source_model: "openai_tool_calls"
53
+ tool_use:
54
+ id_path: "id"
55
+ name_path: "function.name"
56
+ input_path: "function.arguments"
57
+ input_format: "json_string"
58
+ notes:
59
+ - "Supports OpenAI-compatible function calling."
60
+
61
+ retry_policy:
62
+ strategy: "exponential_backoff"
63
+ max_retries: 3
64
+ min_delay_ms: 1000
65
+ max_delay_ms: 30000
66
+ jitter: "full"
67
+ retry_on_http_status: [429, 500, 502, 503]
68
+
69
+ error_classification:
70
+ by_http_status:
71
+ "400": "invalid_request"
72
+ "401": "authentication"
73
+ "403": "permission_denied"
74
+ "404": "not_found"
75
+ "429": "rate_limited"
76
+ "500": "server_error"
77
+ "503": "overloaded"
78
+
79
+ parameter_mappings:
80
+ temperature: "temperature"
81
+ max_tokens: "max_tokens"
82
+ stream: "stream"
83
+ top_p: "top_p"
84
+ stop_sequences: "stop"
85
+ tools: "tools"
86
+ tool_choice: "tool_choice"
87
+ n: "n"
88
+
89
+ response_format: "openai_style"
90
+
91
+ response_paths:
92
+ content: "choices[0].message.content"
93
+ tool_calls: "choices[0].message.tool_calls"
94
+ usage: "usage"
95
+ finish_reason: "choices[0].finish_reason"
96
+
97
+ streaming:
98
+ event_format: "data_lines"
99
+ decoder:
100
+ format: "sse"
101
+ delimiter: "\n\n"
102
+ prefix: "data: "
103
+ done_signal: "[DONE]"
104
+ content_path: "choices[0].delta.content"
105
+ tool_call_path: "choices[0].delta.tool_calls"
106
+ usage_path: "usage"
107
+ frame_selector: "exists($.choices) || exists($.error)"
108
+ event_map:
109
+ - match: "exists($.choices[*].delta.content)"
110
+ emit: "PartialContentDelta"
111
+ fields:
112
+ content: "$.choices[*].delta.content"
113
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
114
+ emit: "ToolCallStarted"
115
+ fields:
116
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
117
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
118
+ index: "$.choices[*].delta.tool_calls[*].index"
119
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
120
+ emit: "PartialToolCall"
121
+ fields:
122
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
123
+ index: "$.choices[*].delta.tool_calls[*].index"
124
+ - match: "exists($.usage)"
125
+ emit: "Metadata"
126
+ fields:
127
+ usage: "$.usage"
128
+ - match: "exists($.choices[*].finish_reason)"
129
+ emit: "FinalCandidate"
130
+ fields:
131
+ finish_reason: "$.choices[*].finish_reason"
132
+ stop_condition: "$.choices[0].finish_reason != null"
133
+
134
+ features:
135
+ multi_candidate:
136
+ support_type: "native"
137
+ param_name: "n"
138
+ response_mapping:
139
+ tool_calls:
140
+ path: "choices[0].message.tool_calls"
141
+ fields:
142
+ id: "id"
143
+ name: "function.name"
144
+ args: "function.arguments"
145
+ error:
146
+ message_path: "error.message"
147
+ code_path: "error.code"
148
+ type_path: "error.type"
149
+
150
+ capabilities:
151
+ streaming: true
152
+ tools: true
153
+ vision: true
154
+ agentic: true
155
+ parallel_tools: true
156
+ reasoning: false
157
+
158
+ availability:
159
+ required: false
160
+ regions:
161
+ - cn
162
+ - global
163
+ check:
164
+ method: GET
165
+ path: "/models"
166
+ expected_status: [200, 401]
167
+ timeout_ms: 5000
168
+
169
+ experimental_features:
170
+ - "voice_synthesis"
171
+ - "music_generation"
172
+ - "video_generation"
@@ -0,0 +1,186 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: mistral
4
+ protocol_version: "1.5"
5
+
6
+ name: Mistral AI
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://docs.mistral.ai"
11
+ support_contact: "https://mistral.ai/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://api.mistral.ai/v1"
15
+ protocol: https
16
+ timeout_ms: 10000
17
+ auth:
18
+ type: bearer
19
+ token_env: "MISTRAL_API_KEY"
20
+ payload_format: "openai_style"
21
+
22
+ # OpenAI-compatible API families
23
+ api_families: ["chat_completions"]
24
+ default_api_family: "chat_completions"
25
+ endpoints:
26
+ # Runtime uses UnifiedRequest.operation (currently "chat") to resolve endpoints.
27
+ # Keep keys aligned with runtime expectations.
28
+ chat:
29
+ path: "/chat/completions"
30
+ method: "POST"
31
+ adapter: "openai"
32
+
33
+ # Optional service endpoints (OpenAI-compatible).
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+
40
+ # Termination reason normalization (see v1/spec.yaml: standard_schema.streaming_events.termination_reasons)
41
+ termination:
42
+ source_field: "finish_reason"
43
+ mapping:
44
+ stop: "end_turn"
45
+ length: "max_tokens"
46
+ tool_calls: "tool_use"
47
+ content_filter: "refusal"
48
+ notes:
49
+ - "OpenAI-compatible: finish_reason is reported per candidate."
50
+
51
+ # Tool invocation normalization (see v1/spec.yaml: standard_schema.content_blocks)
52
+ tooling:
53
+ source_model: "openai_tool_calls"
54
+ tool_use:
55
+ id_path: "id"
56
+ name_path: "function.name"
57
+ input_path: "function.arguments"
58
+ input_format: "json_string"
59
+ notes:
60
+ - "OpenAI-compatible tool_calls.function.arguments is typically a JSON string; runtimes SHOULD parse it into an object when normalizing."
61
+
62
+ # Rate limits (Mistral uses standard HTTP headers)
63
+ # Note: Mistral may use different header names, but we follow OpenAI-compatible pattern
64
+ rate_limit_headers:
65
+ requests_limit: "x-ratelimit-limit-requests"
66
+ requests_remaining: "x-ratelimit-remaining-requests"
67
+ requests_reset: "x-ratelimit-reset-requests"
68
+ tokens_limit: "x-ratelimit-limit-tokens"
69
+ tokens_remaining: "x-ratelimit-remaining-tokens"
70
+ tokens_reset: "x-ratelimit-reset-tokens"
71
+ retry_after: "retry-after"
72
+
73
+ # Retry policy (OpenAI-compatible guidance: exponential backoff for 429; retry 5xx after brief wait)
74
+ retry_policy:
75
+ max_retries: 3
76
+ max_delay_ms: 30000
77
+ strategy: "exponential_backoff"
78
+ min_delay_ms: 1000
79
+ jitter: "full"
80
+ retry_on_http_status: [429, 500, 502, 503]
81
+ notes:
82
+ - "OpenAI-compatible: exponential backoff is recommended for rate limit errors (429)."
83
+ - "Retry 500 after a brief wait."
84
+
85
+ parameter_mappings:
86
+ temperature: "temperature"
87
+ max_tokens: "max_tokens"
88
+ stream: "stream"
89
+ stop_sequences: "stop"
90
+ tools: "tools"
91
+ tool_choice: "tool_choice"
92
+ frequency_penalty: "frequency_penalty"
93
+ presence_penalty: "presence_penalty"
94
+ top_p: "top_p"
95
+ random_seed: "random_seed"
96
+ n: "n"
97
+ parallel_tool_calls: "parallel_tool_calls"
98
+ safe_prompt: "safe_prompt"
99
+ response_format: "response_format"
100
+ prompt_mode: "prompt_mode"
101
+ prediction: "prediction"
102
+ metadata: "metadata"
103
+
104
+ response_format: "openai_style"
105
+ response_paths:
106
+ content: "choices[0].message.content"
107
+ tool_calls: "choices[0].message.tool_calls"
108
+ usage: "usage"
109
+
110
+ streaming:
111
+ event_format: "data_lines"
112
+ decoder:
113
+ format: "sse"
114
+ delimiter: "\n\n"
115
+ prefix: "data: "
116
+ done_signal: "[DONE]"
117
+ content_path: "choices[0].delta.content"
118
+ tool_call_path: "choices[0].delta.tool_calls"
119
+ usage_path: "usage"
120
+ frame_selector: "exists($.choices) || exists($.error)"
121
+ event_map:
122
+ # Text content delta
123
+ - match: "exists($.choices[*].delta.content)"
124
+ emit: "PartialContentDelta"
125
+ fields:
126
+ content: "$.choices[*].delta.content"
127
+ # Tool call start
128
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
129
+ emit: "ToolCallStarted"
130
+ fields:
131
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
132
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
133
+ index: "$.choices[*].delta.tool_calls[*].index"
134
+ # Tool call arguments streaming
135
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
136
+ emit: "PartialToolCall"
137
+ fields:
138
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
139
+ index: "$.choices[*].delta.tool_calls[*].index"
140
+ # Usage metadata
141
+ - match: "exists($.usage)"
142
+ emit: "Metadata"
143
+ fields:
144
+ usage: "$.usage"
145
+ # Finish with reason
146
+ - match: "exists($.choices[*].finish_reason)"
147
+ emit: "FinalCandidate"
148
+ fields:
149
+ finish_reason: "$.choices[*].finish_reason"
150
+ candidate_index: "$.choices[*].index"
151
+ stop_condition: "$.choices[0].finish_reason != null"
152
+
153
+ features:
154
+ multi_candidate:
155
+ support_type: "native"
156
+ param_name: "n"
157
+ response_mapping:
158
+ tool_calls:
159
+ path: "choices[0].message.tool_calls"
160
+ fields:
161
+ id: "id"
162
+ name: "function.name"
163
+ args: "function.arguments"
164
+ error:
165
+ message_path: "error.message"
166
+ code_path: "error.code"
167
+ type_path: "error.type"
168
+ param_path: "error.param"
169
+
170
+ capabilities:
171
+ streaming: true
172
+ tools: true
173
+ vision: false
174
+ agentic: true
175
+ parallel_tools: true
176
+ reasoning: false
177
+
178
+ availability:
179
+ required: false
180
+ regions:
181
+ - global
182
+ check:
183
+ method: GET
184
+ path: "/models"
185
+ expected_status: [200, 401]
186
+ timeout_ms: 3000
@@ -0,0 +1,176 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: moonshot
4
+ protocol_version: "1.5"
5
+
6
+ name: 月之暗面 Kimi (Moonshot)
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://platform.moonshot.cn/docs"
11
+ support_contact: "https://www.moonshot.cn/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://api.moonshot.cn/v1"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "MOONSHOT_API_KEY"
21
+
22
+ payload_format: "openai_style"
23
+
24
+ # OpenAI-compatible API
25
+ api_families: ["chat_completions"]
26
+ default_api_family: "chat_completions"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+ # Kimi supports file upload for context
40
+ upload_file:
41
+ path: "/files"
42
+ method: "POST"
43
+ list_files:
44
+ path: "/files"
45
+ method: "GET"
46
+
47
+ termination:
48
+ source_field: "finish_reason"
49
+ mapping:
50
+ stop: "end_turn"
51
+ length: "max_tokens"
52
+ tool_calls: "tool_use"
53
+ notes:
54
+ - "OpenAI-compatible finish_reason."
55
+ - "Kimi is known for ultra-long context (up to 200K tokens) and file understanding."
56
+
57
+ tooling:
58
+ source_model: "openai_tool_calls"
59
+ tool_use:
60
+ id_path: "id"
61
+ name_path: "function.name"
62
+ input_path: "function.arguments"
63
+ input_format: "json_string"
64
+ notes:
65
+ - "Supports OpenAI-compatible function calling."
66
+
67
+ retry_policy:
68
+ strategy: "exponential_backoff"
69
+ max_retries: 3
70
+ min_delay_ms: 1000
71
+ max_delay_ms: 30000
72
+ jitter: "full"
73
+ retry_on_http_status: [429, 500, 502, 503]
74
+
75
+ error_classification:
76
+ by_http_status:
77
+ "400": "invalid_request"
78
+ "401": "authentication"
79
+ "403": "permission_denied"
80
+ "404": "not_found"
81
+ "429": "rate_limited"
82
+ "500": "server_error"
83
+ "503": "overloaded"
84
+
85
+ parameter_mappings:
86
+ temperature: "temperature"
87
+ max_tokens: "max_tokens"
88
+ stream: "stream"
89
+ top_p: "top_p"
90
+ stop_sequences: "stop"
91
+ tools: "tools"
92
+ tool_choice: "tool_choice"
93
+ n: "n"
94
+
95
+ response_format: "openai_style"
96
+
97
+ response_paths:
98
+ content: "choices[0].message.content"
99
+ tool_calls: "choices[0].message.tool_calls"
100
+ usage: "usage"
101
+ finish_reason: "choices[0].finish_reason"
102
+
103
+ streaming:
104
+ event_format: "data_lines"
105
+ decoder:
106
+ format: "sse"
107
+ delimiter: "\n\n"
108
+ prefix: "data: "
109
+ done_signal: "[DONE]"
110
+ content_path: "choices[0].delta.content"
111
+ tool_call_path: "choices[0].delta.tool_calls"
112
+ usage_path: "usage"
113
+ frame_selector: "exists($.choices) || exists($.error)"
114
+ event_map:
115
+ - match: "exists($.choices[*].delta.content)"
116
+ emit: "PartialContentDelta"
117
+ fields:
118
+ content: "$.choices[*].delta.content"
119
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
120
+ emit: "ToolCallStarted"
121
+ fields:
122
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
123
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
124
+ index: "$.choices[*].delta.tool_calls[*].index"
125
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
126
+ emit: "PartialToolCall"
127
+ fields:
128
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
129
+ index: "$.choices[*].delta.tool_calls[*].index"
130
+ - match: "exists($.usage)"
131
+ emit: "Metadata"
132
+ fields:
133
+ usage: "$.usage"
134
+ - match: "exists($.choices[*].finish_reason)"
135
+ emit: "FinalCandidate"
136
+ fields:
137
+ finish_reason: "$.choices[*].finish_reason"
138
+ stop_condition: "$.choices[0].finish_reason != null"
139
+
140
+ features:
141
+ multi_candidate:
142
+ support_type: "native"
143
+ param_name: "n"
144
+ response_mapping:
145
+ tool_calls:
146
+ path: "choices[0].message.tool_calls"
147
+ fields:
148
+ id: "id"
149
+ name: "function.name"
150
+ args: "function.arguments"
151
+ error:
152
+ message_path: "error.message"
153
+ code_path: "error.code"
154
+
155
+ capabilities:
156
+ streaming: true
157
+ tools: true
158
+ vision: true
159
+ agentic: true
160
+ parallel_tools: true
161
+ reasoning: false
162
+
163
+ availability:
164
+ required: false
165
+ regions:
166
+ - cn
167
+ check:
168
+ method: GET
169
+ path: "/models"
170
+ expected_status: [200, 401]
171
+ timeout_ms: 5000
172
+
173
+ experimental_features:
174
+ - "file_upload"
175
+ - "web_search"
176
+ - "long_context"
@@ -0,0 +1,172 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: nvidia
4
+ protocol_version: "1.5"
5
+
6
+ name: NVIDIA API Catalog
7
+ version: "v1"
8
+ status: stable
9
+ category: third_party_aggregator
10
+ official_url: "https://build.nvidia.com/explore/discover"
11
+ support_contact: "https://docs.api.nvidia.com/nim/docs"
12
+
13
+ # NVIDIA API Catalog (NVIDIA Build) - OpenAI-compatible chat completions
14
+ # Base URL: https://integrate.api.nvidia.com (docs.api.nvidia.com/nim/reference/llm-apis)
15
+ endpoint:
16
+ base_url: "https://integrate.api.nvidia.com/v1"
17
+ protocol: https
18
+ timeout_ms: 60000
19
+
20
+ auth:
21
+ type: bearer
22
+ token_env: "NVIDIA_API_KEY"
23
+
24
+ payload_format: "openai_style"
25
+
26
+ api_families: ["chat_completions", "completions"]
27
+ default_api_family: "chat_completions"
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+ completions:
34
+ path: "/completions"
35
+ method: "POST"
36
+ adapter: "openai"
37
+
38
+ services:
39
+ list_models:
40
+ path: "/models"
41
+ method: "GET"
42
+ response_binding: "data"
43
+
44
+ termination:
45
+ source_field: "finish_reason"
46
+ mapping:
47
+ stop: "end_turn"
48
+ length: "max_tokens"
49
+ tool_calls: "tool_use"
50
+ content_filter: "refusal"
51
+ notes:
52
+ - "OpenAI-compatible: finish_reason is reported per candidate."
53
+
54
+ tooling:
55
+ source_model: "openai_tool_calls"
56
+ tool_use:
57
+ id_path: "id"
58
+ name_path: "function.name"
59
+ input_path: "function.arguments"
60
+ input_format: "json_string"
61
+ notes:
62
+ - "OpenAI-compatible tool_calls.function.arguments is typically a JSON string."
63
+
64
+ retry_policy:
65
+ max_retries: 3
66
+ max_delay_ms: 30000
67
+ strategy: "exponential_backoff"
68
+ min_delay_ms: 1000
69
+ jitter: "full"
70
+ retry_on_http_status: [429, 500, 502, 503]
71
+ notes:
72
+ - "Exponential backoff recommended for 429; retry 5xx after brief wait."
73
+
74
+ error_classification:
75
+ by_http_status:
76
+ "400": "invalid_request"
77
+ "401": "authentication"
78
+ "403": "permission_denied"
79
+ "404": "not_found"
80
+ "429": "rate_limited"
81
+ "500": "server_error"
82
+
83
+ parameter_mappings:
84
+ temperature: "temperature"
85
+ max_tokens: "max_tokens"
86
+ stream: "stream"
87
+ stop_sequences: "stop"
88
+ tools: "tools"
89
+ tool_choice: "tool_choice"
90
+ frequency_penalty: "frequency_penalty"
91
+ presence_penalty: "presence_penalty"
92
+ top_p: "top_p"
93
+
94
+ response_format: "openai_style"
95
+ response_paths:
96
+ content: "choices[0].message.content"
97
+ tool_calls: "choices[0].message.tool_calls"
98
+ usage: "usage"
99
+ finish_reason: "choices[0].finish_reason"
100
+
101
+ streaming:
102
+ event_format: "data_lines"
103
+ decoder:
104
+ format: "sse"
105
+ delimiter: "\n\n"
106
+ prefix: "data: "
107
+ done_signal: "[DONE]"
108
+ content_path: "choices[0].delta.content"
109
+ tool_call_path: "choices[0].delta.tool_calls"
110
+ usage_path: "usage"
111
+ frame_selector: "exists($.choices) || exists($.error)"
112
+ event_map:
113
+ - match: "exists($.choices[*].delta.content)"
114
+ emit: "PartialContentDelta"
115
+ fields:
116
+ content: "$.choices[*].delta.content"
117
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
118
+ emit: "ToolCallStarted"
119
+ fields:
120
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
121
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
122
+ index: "$.choices[*].delta.tool_calls[*].index"
123
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
124
+ emit: "PartialToolCall"
125
+ fields:
126
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
127
+ index: "$.choices[*].delta.tool_calls[*].index"
128
+ - match: "exists($.usage)"
129
+ emit: "Metadata"
130
+ fields:
131
+ usage: "$.usage"
132
+ - match: "exists($.choices[*].finish_reason)"
133
+ emit: "FinalCandidate"
134
+ fields:
135
+ finish_reason: "$.choices[*].finish_reason"
136
+ candidate_index: "$.choices[*].index"
137
+ stop_condition: "$.choices[0].finish_reason != null"
138
+
139
+ features:
140
+ multi_candidate:
141
+ support_type: "native"
142
+ param_name: "n"
143
+ response_mapping:
144
+ tool_calls:
145
+ path: "choices[0].message.tool_calls"
146
+ fields:
147
+ id: "id"
148
+ name: "function.name"
149
+ args: "function.arguments"
150
+ error:
151
+ message_path: "error.message"
152
+ code_path: "error.code"
153
+ type_path: "error.type"
154
+ param_path: "error.param"
155
+
156
+ capabilities:
157
+ streaming: true
158
+ tools: true
159
+ vision: true
160
+ agentic: true
161
+ parallel_tools: true
162
+ reasoning: true
163
+
164
+ availability:
165
+ required: false
166
+ regions:
167
+ - global
168
+ check:
169
+ method: GET
170
+ path: "/models"
171
+ expected_status: [200, 401]
172
+ timeout_ms: 5000