@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194)
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,245 @@
1
+ # Google Gemini V2 official provider manifest — full multimodal support (audio/video/computer use), merging v2-alpha with in-depth research data
2
+ # AI-Protocol V2 Provider Manifest
3
+ # Provider: Google | Models: Gemini 3 Pro / Flash
4
+ # Last Updated: 2026-02-16
5
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v2/provider.json"
6
+
7
+ # === Ring 1: Core Skeleton ===
8
+ id: google
9
+ protocol_version: "2.0"
10
+ name: "Google Gemini"
11
+ version: "3.0.0"
12
+ status: stable
13
+ category: ai_provider
14
+ official_url: "https://ai.google.dev/docs"
15
+ support_contact: "https://support.google.com/gemini"
16
+
17
+ endpoint:
18
+ base_url: "https://generativelanguage.googleapis.com/v1beta"
19
+ chat: "/models/{model}:generateContent"
20
+ embeddings: "/models/{model}:embedContent"
21
+ auth:
22
+ type: "query_param"
23
+ param_name: "key"
24
+ token_env: "GEMINI_API_KEY"
25
+
26
+ error_classification:
27
+ by_http_status:
28
+ "400": "invalid_request"
29
+ "401": "authentication"
30
+ "403": "permission_denied"
31
+ "404": "not_found"
32
+ "429": "rate_limited"
33
+ "500": "server_error"
34
+ "503": "overloaded"
35
+ by_error_code:
36
+ "INVALID_ARGUMENT": "invalid_request"
37
+ "UNAUTHENTICATED": "authentication"
38
+ "PERMISSION_DENIED": "permission_denied"
39
+ "NOT_FOUND": "not_found"
40
+ "RESOURCE_EXHAUSTED": "rate_limited"
41
+ "INTERNAL": "server_error"
42
+ "UNAVAILABLE": "overloaded"
43
+ "DEADLINE_EXCEEDED": "timeout"
44
+
45
+ # === Ring 2: Capability Mapping ===
46
+ capabilities:
47
+ required:
48
+ - text
49
+ - streaming
50
+ - tools
51
+ optional:
52
+ - vision
53
+ - audio
54
+ - video
55
+ - parallel_tools
56
+ - reasoning
57
+ - embeddings
58
+ - structured_output
59
+ - computer_use
60
+ - mcp_client
61
+ feature_flags:
62
+ structured_output: true
63
+ parallel_tool_calls: true
64
+ extended_thinking: true
65
+ streaming_usage: false
66
+ system_messages: true
67
+
68
+ capability_profile:
69
+ phase: "ios_v1"
70
+ inputs:
71
+ modalities: ["text", "image", "audio", "video"]
72
+ outcomes:
73
+ types: ["text_completion", "structured_json", "tool_call_sequence"]
74
+ systems:
75
+ requires: ["mcp", "search"]
76
+
77
+ parameters:
78
+ temperature: { type: float, range: [0.0, 2.0], default: 1.0 }
79
+ maxOutputTokens: { type: integer, min: 1, max: 65536, alias: "max_tokens" }
80
+ topP: { type: float, range: [0.0, 1.0], alias: "top_p" }
81
+ topK: { type: integer, min: 0, alias: "top_k" }
82
+
83
+ streaming:
84
+ decoder:
85
+ format: "gemini_sse"
86
+ strategy: "gemini_generate"
87
+ event_map:
88
+ - match: "$.candidates[0].content.parts[0].text"
89
+ emit: "PartialContentDelta"
90
+ extract:
91
+ content: "$.candidates[0].content.parts[0].text"
92
+ - match: "$.candidates[0].content.parts[0].functionCall"
93
+ emit: "PartialToolCall"
94
+ extract:
95
+ tool_call: "$.candidates[0].content.parts[0].functionCall"
96
+ - match: "$.candidates[0].finishReason"
97
+ emit: "StreamEnd"
98
+ extract:
99
+ finish_reason: "$.candidates[0].finishReason"
100
+ candidate:
101
+ candidate_id_path: "$.candidates[*].index"
102
+ fan_out: true
103
+
104
+ multimodal:
105
+ input:
106
+ vision:
107
+ supported: true
108
+ formats: [jpeg, png, gif, bmp, tiff, webp]
109
+ max_file_size: "20MB"
110
+ max_resolution: "4096x4096"
111
+ encoding_methods: [base64_inline, url, file_uri]
112
+ document_understanding: true
113
+ audio:
114
+ supported: true
115
+ formats: [mp3, wav, flac, ogg, aac, m4a]
116
+ max_duration: "8h"
117
+ speech_recognition: true
118
+ video:
119
+ supported: true
120
+ formats: [mp4, mov, avi, flv, wmv]
121
+ max_duration: "1h"
122
+ frame_extraction: automatic
123
+ audio_track: true
124
+ temporal_reasoning: true
125
+ output:
126
+ text: true
127
+ audio:
128
+ supported: false
129
+ image:
130
+ supported: true
131
+ formats: [png, jpeg]
132
+ omni_mode:
133
+ supported: false
134
+
135
+ computer_use:
136
+ supported: true
137
+ status: ga
138
+ implementation: tool_based
139
+ actions:
140
+ screenshot:
141
+ supported: true
142
+ formats: [png, jpeg]
143
+ mouse:
144
+ supported: true
145
+ operations: [click, double_click, drag, scroll]
146
+ keyboard:
147
+ supported: true
148
+ operations: [type, key_press, shortcut]
149
+ browser:
150
+ supported: true
151
+ operations: [navigate, fill_form, click_element, scroll]
152
+ safety:
153
+ confirmation_required: true
154
+ sandbox_mode: recommended
155
+ action_logging: true
156
+ domain_allowlist: false
157
+ sensitive_data_protection: true
158
+ environment:
159
+ browser: true
160
+ desktop: true
161
+ provider_mapping:
162
+ tool_type: "computer_use"
163
+ config_method: sdk_config
164
+
165
+ mcp:
166
+ client:
167
+ supported: true
168
+ protocol_version: "2025-11-25"
169
+ transports: [streamable_http, sse]
170
+ auth_methods: [bearer, oauth2, api_key]
171
+ capabilities:
172
+ tools: true
173
+ resources: false
174
+ prompts: false
175
+ sampling: false
176
+ provider_mapping:
177
+ config_method: sdk_config
178
+ server:
179
+ supported: false
180
+
181
+ # === Ring 3: Advanced Extensions ===
182
+ api_families: ["generate_content"]
183
+ default_api_family: "generate_content"
184
+
185
+ endpoints:
186
+ chat:
187
+ path: "/models/{model}:generateContent"
188
+ method: "POST"
189
+ adapter: "gemini"
190
+ stream_chat:
191
+ path: "/models/{model}:streamGenerateContent"
192
+ method: "POST"
193
+ adapter: "gemini"
194
+ embeddings:
195
+ path: "/models/{model}:embedContent"
196
+ method: "POST"
197
+ adapter: "gemini"
198
+
199
+ services:
200
+ list_models:
201
+ path: "/models"
202
+ method: "GET"
203
+ response_binding: "models"
204
+ get_model:
205
+ path: "/models/{model}"
206
+ method: "GET"
207
+
208
+ retry_policy:
209
+ strategy: "exponential_backoff"
210
+ max_retries: 3
211
+ min_delay_ms: 1000
212
+ max_delay_ms: 30000
213
+ jitter: "full"
214
+ retry_on_http_status: [429, 500, 503]
215
+
216
+ termination:
217
+ source_field: "finishReason"
218
+ mapping:
219
+ STOP: "end_turn"
220
+ MAX_TOKENS: "max_tokens"
221
+ SAFETY: "refusal"
222
+ RECITATION: "refusal"
223
+ OTHER: "other"
224
+ BLOCKLIST: "refusal"
225
+ PROHIBITED_CONTENT: "refusal"
226
+
227
+ metadata:
228
+ models:
229
+ gemini-3-pro:
230
+ context_window: 1000000
231
+ max_output_tokens: 64000
232
+ status: public_preview
233
+ pricing: { input_per_1m: 2.00, output_per_1m: 12.00 }
234
+ gemini-3-flash:
235
+ context_window: 1000000
236
+ max_output_tokens: 64000
237
+ status: public_preview
238
+ pricing: { input_per_1m: 0.15, output_per_1m: 0.60 }
239
+ context_caching:
240
+ supported: true
241
+ pricing: "$0.20-0.40 per 1M tokens/hour"
242
+ sdk:
243
+ python: google-genai
244
+ javascript: "@google/genai"
245
+ go: "google.golang.org/genai"
@@ -0,0 +1,55 @@
1
+ # Jina AI V2 Provider Manifest — rerank only
2
+ # AI-Protocol V2 Provider Manifest
3
+ # Provider: Jina AI | Reranker v2/v3 (multilingual)
4
+ # Last Updated: 2026-02-19
5
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v2/provider.json"
6
+
7
+ # === Ring 1: Core Skeleton ===
8
+ id: jina
9
+ protocol_version: "2.0"
10
+ name: "Jina AI"
11
+ version: "v3"
12
+ status: stable
13
+ category: ai_provider
14
+ official_url: "https://jina.ai"
15
+ support_contact: "https://jina.ai/contact"
16
+
17
+ endpoint:
18
+ base_url: "https://api.jina.ai"
19
+ rerank: "/v1/rerank"
20
+ auth:
21
+ type: "bearer"
22
+ header: "Authorization"
23
+ prefix: "Bearer"
24
+ token_env: "JINA_API_KEY"
25
+
26
+ error_classification:
27
+ by_http_status:
28
+ "400": "invalid_request"
29
+ "401": "authentication"
30
+ "403": "permission_denied"
31
+ "404": "not_found"
32
+ "429": "rate_limited"
33
+ "500": "server_error"
34
+
35
+ # === Ring 2: Capability Mapping ===
36
+ capabilities:
37
+ required:
38
+ - rerank
39
+ optional: []
40
+
41
+ capability_profile:
42
+ phase: "ios_v1"
43
+ inputs:
44
+ modalities: ["text"]
45
+ outcomes:
46
+ types: ["other"]
47
+ systems:
48
+ requires: ["search"]
49
+
50
+ parameters:
51
+ top_n: { type: integer, min: 1 }
52
+ model: { type: string, default: "jina-reranker-v2-base-multilingual" }
53
+
54
+ metadata:
55
+ rerank_models: [jina-reranker-v2-base-multilingual, jina-reranker-v3]
@@ -0,0 +1,186 @@
1
+ # Moonshot Kimi V2 official provider manifest — Agent Swarm pioneer, OpenAI-compatible API
2
+ # AI-Protocol V2 Provider Manifest
3
+ # Provider: Moonshot AI | Models: Kimi K2.5 / K2-Thinking
4
+ # Last Updated: 2026-02-16
5
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v2/provider.json"
6
+
7
+ # === Ring 1: Core Skeleton ===
8
+ id: moonshot
9
+ protocol_version: "2.0"
10
+ name: "Moonshot AI"
11
+ version: "2.5.0"
12
+ status: stable
13
+ category: ai_provider
14
+ official_url: "https://platform.moonshot.ai/docs/"
15
+ support_contact: "https://platform.moonshot.ai/"
16
+
17
+ endpoint:
18
+ base_url: "https://api.moonshot.cn/v1"
19
+ chat: "/chat/completions"
20
+ auth:
21
+ type: "bearer"
22
+ header: "Authorization"
23
+ prefix: "Bearer"
24
+ token_env: "MOONSHOT_API_KEY"
25
+
26
+ error_classification:
27
+ by_http_status:
28
+ "400": "invalid_request"
29
+ "401": "authentication"
30
+ "403": "permission_denied"
31
+ "404": "not_found"
32
+ "429": "rate_limited"
33
+ "500": "server_error"
34
+ "503": "overloaded"
35
+ by_error_code:
36
+ "context_length_exceeded": "request_too_large"
37
+ "model_not_found": "not_found"
38
+ "rate_limit_exceeded": "rate_limited"
39
+ "insufficient_quota": "quota_exhausted"
40
+
41
+ # === Ring 2: Capability Mapping ===
42
+ capabilities:
43
+ required:
44
+ - text
45
+ - streaming
46
+ - tools
47
+ optional:
48
+ - vision
49
+ - video
50
+ - parallel_tools
51
+ - agentic
52
+ - reasoning
53
+ - structured_output
54
+ feature_flags:
55
+ structured_output: true
56
+ parallel_tool_calls: true
57
+ streaming_usage: true
58
+ system_messages: true
59
+
60
+ capability_profile:
61
+ phase: "ios_v1"
62
+ inputs:
63
+ modalities: ["text", "image", "video"]
64
+ outcomes:
65
+ types: ["text_completion", "structured_json", "tool_call_sequence"]
66
+ systems:
67
+ requires: ["mcp", "search"]
68
+
69
+ parameters:
70
+ temperature: { type: float, range: [0.0, 2.0], default: 1.0 }
71
+ max_tokens: { type: integer, min: 1, max: 33000 }
72
+ top_p: { type: float, range: [0.0, 1.0] }
73
+ stream: { type: boolean }
74
+
75
+ parameter_mappings:
76
+ temperature: "temperature"
77
+ max_tokens: "max_tokens"
78
+ stream: "stream"
79
+ top_p: "top_p"
80
+ tools: "tools"
81
+ tool_choice: "tool_choice"
82
+
83
+ streaming:
84
+ decoder:
85
+ format: "sse"
86
+ strategy: "openai_chat"
87
+ done_signal: "[DONE]"
88
+ prefix: "data: "
89
+ content_path: "$.choices[0].delta.content"
90
+ tool_call_path: "$.choices[0].delta.tool_calls"
91
+ usage_path: "$.usage"
92
+ event_map:
93
+ - match: "exists($.choices[*].delta.content)"
94
+ emit: "PartialContentDelta"
95
+ fields:
96
+ content: "$.choices[*].delta.content"
97
+ - match: "exists($.choices[*].delta.tool_calls)"
98
+ emit: "PartialToolCall"
99
+ fields:
100
+ tool_calls: "$.choices[*].delta.tool_calls"
101
+ - match: "exists($.usage)"
102
+ emit: "Metadata"
103
+ fields:
104
+ usage: "$.usage"
105
+ - match: "$.choices[*].finish_reason != null"
106
+ emit: "StreamEnd"
107
+ fields:
108
+ finish_reason: "$.choices[*].finish_reason"
109
+ stop_condition: "$.choices[0].finish_reason != null"
110
+
111
+ multimodal:
112
+ input:
113
+ vision:
114
+ supported: true
115
+ formats: [jpeg, png, webp, gif]
116
+ encoding_methods: [base64_inline, url]
117
+ audio:
118
+ supported: false
119
+ video:
120
+ supported: true
121
+ formats: [mp4, avi, mov]
122
+ output:
123
+ text: true
124
+ audio:
125
+ supported: false
126
+ image:
127
+ supported: false
128
+
129
+ # === Ring 3: Advanced Extensions ===
130
+ api_families: ["chat_completions"]
131
+ default_api_family: "chat_completions"
132
+
133
+ endpoints:
134
+ chat:
135
+ path: "/chat/completions"
136
+ method: "POST"
137
+ adapter: "openai"
138
+
139
+ services:
140
+ list_models:
141
+ path: "/models"
142
+ method: "GET"
143
+
144
+ retry_policy:
145
+ strategy: "exponential_backoff"
146
+ max_retries: 3
147
+ min_delay_ms: 1000
148
+ max_delay_ms: 30000
149
+ jitter: "full"
150
+ retry_on_http_status: [429, 500, 502, 503]
151
+
152
+ termination:
153
+ source_field: "finish_reason"
154
+ mapping:
155
+ stop: "end_turn"
156
+ length: "max_tokens"
157
+ tool_calls: "tool_use"
158
+
159
+ metadata:
160
+ api_compatibility: openai
161
+ open_source:
162
+ license: "Modified MIT"
163
+ hugging_face: "https://huggingface.co/moonshotai/Kimi-K2.5"
164
+ agent_swarm:
165
+ supported: true
166
+ status: beta
167
+ max_agents: 100
168
+ max_tool_calls: 1500
169
+ coordination: "PARL (Parallel Agent RL)"
170
+ models:
171
+ kimi-k2-5:
172
+ context_window: 256000
173
+ max_output_tokens: 33000
174
+ architecture: { type: moe, total: "1T", active: "32B", experts: 384 }
175
+ pricing: { input_per_1m: 0.60, output_per_1m: 3.00 }
176
+ kimi-k2-thinking:
177
+ context_window: 256000
178
+ max_output_tokens: 33000
179
+ pricing: { input_per_1m: 0.60, output_per_1m: 2.50 }
180
+ regional:
181
+ primary: china
182
+ international_partners: [fireworks_ai, together_ai, openrouter, nvidia_nim]
183
+ sdk:
184
+ note: "OpenAI-compatible — use openai SDK with base_url override"
185
+ python: openai
186
+ typescript: openai