@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,175 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: cohere
4
+ protocol_version: "1.5"
5
+
6
+ name: Cohere
7
+ version: "v2"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://docs.cohere.com"
11
+ support_contact: "https://cohere.com/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://api.cohere.com/v2"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "COHERE_API_KEY"
21
+
22
+ payload_format: "cohere_v2"
23
+
24
+ # Cohere V2 API
25
+ api_families: ["chat"]
26
+ default_api_family: "chat"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat"
31
+ method: "POST"
32
+ adapter: "cohere_v2"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "models"
39
+
40
+ termination:
41
+ source_field: "finish_reason"
42
+ mapping:
43
+ COMPLETE: "end_turn"
44
+ MAX_TOKENS: "max_tokens"
45
+ STOP_SEQUENCE: "stop_sequence"
46
+ TOOL_CALL: "tool_use"
47
+ ERROR: "error"
48
+ notes:
49
+ - "Cohere uses uppercase finish reasons."
50
+ - "Known for Command R+ and enterprise-grade RAG capabilities."
51
+
52
+ tooling:
53
+ source_model: "openai_tool_calls"
54
+ tool_use:
55
+ id_path: "id"
56
+ name_path: "name"
57
+ input_path: "parameters"
58
+ input_format: "json_object"
59
+ notes:
60
+ - "Cohere V2 uses 'tools' array similar to OpenAI."
61
+
62
+ rate_limit_headers:
63
+ requests_limit: "x-ratelimit-limit"
64
+ requests_remaining: "x-ratelimit-remaining"
65
+ requests_reset: "x-ratelimit-reset"
66
+
67
+ retry_policy:
68
+ strategy: "exponential_backoff"
69
+ max_retries: 3
70
+ min_delay_ms: 500
71
+ max_delay_ms: 30000
72
+ jitter: "full"
73
+ retry_on_http_status: [429, 500, 502, 503]
74
+
75
+ error_classification:
76
+ by_http_status:
77
+ "400": "invalid_request"
78
+ "401": "authentication"
79
+ "403": "permission_denied"
80
+ "404": "not_found"
81
+ "422": "invalid_request"
82
+ "429": "rate_limited"
83
+ "500": "server_error"
84
+ "503": "overloaded"
85
+
86
+ parameter_mappings:
87
+ temperature: "temperature"
88
+ max_tokens: "max_tokens"
89
+ stream: "stream"
90
+ top_p: "p"
91
+ top_k: "k"
92
+ stop_sequences: "stop_sequences"
93
+ tools: "tools"
94
+ frequency_penalty: "frequency_penalty"
95
+ presence_penalty: "presence_penalty"
96
+ seed: "seed"
97
+
98
+ response_format: "cohere_v2"
99
+
100
+ response_paths:
101
+ content: "message.content[0].text"
102
+ tool_calls: "message.tool_calls"
103
+ usage: "usage"
104
+ finish_reason: "finish_reason"
105
+
106
+ streaming:
107
+ event_format: "sse"
108
+ decoder:
109
+ format: "sse"
110
+ delimiter: "\n"
111
+ prefix: "data: "
112
+ done_signal: ""
113
+ content_path: "delta.message.content.text"
114
+ tool_call_path: "delta.message.tool_calls"
115
+ usage_path: "usage"
116
+ frame_selector: "exists($.type)"
117
+ event_map:
118
+ - match: "$.type == 'content-delta'"
119
+ emit: "PartialContentDelta"
120
+ fields:
121
+ content: "$.delta.message.content.text"
122
+ - match: "$.type == 'tool-call-start'"
123
+ emit: "ToolCallStarted"
124
+ fields:
125
+ tool_call_id: "$.delta.message.tool_calls.id"
126
+ tool_name: "$.delta.message.tool_calls.name"
127
+ - match: "$.type == 'tool-call-delta'"
128
+ emit: "PartialToolCall"
129
+ fields:
130
+ arguments: "$.delta.message.tool_calls.parameters"
131
+ - match: "$.type == 'message-end'"
132
+ emit: "FinalCandidate"
133
+ fields:
134
+ finish_reason: "$.delta.finish_reason"
135
+ usage: "$.delta.usage"
136
+ stop_condition: "$.type == 'message-end'"
137
+
138
+ features:
139
+ multi_candidate:
140
+ support_type: "simulated"
141
+ max_concurrent: 1
142
+ response_mapping:
143
+ tool_calls:
144
+ path: "message.tool_calls"
145
+ fields:
146
+ id: "id"
147
+ name: "name"
148
+ args: "parameters"
149
+ error:
150
+ message_path: "message"
151
+ code_path: "code"
152
+
153
+ capabilities:
154
+ streaming: true
155
+ tools: true
156
+ vision: false
157
+ agentic: true
158
+ parallel_tools: false
159
+ reasoning: false
160
+
161
+ availability:
162
+ required: false
163
+ regions:
164
+ - global
165
+ check:
166
+ method: GET
167
+ path: "/models"
168
+ expected_status: [200, 401]
169
+ timeout_ms: 5000
170
+
171
+ experimental_features:
172
+ - "rag"
173
+ - "connectors"
174
+ - "rerank"
175
+ - "embed"
@@ -0,0 +1,156 @@
1
+ $schema: ../../schemas/v1.json
2
+ protocol_version: "1.5"
3
+ id: "deepinfra"
4
+ name: "DeepInfra"
5
+ status: "stable"
6
+ category: "model_provider"
7
+ official_url: "https://deepinfra.com/"
8
+ support_contact: "https://deepinfra.com/support"
9
+
10
+ endpoint:
11
+ base_url: "https://api.deepinfra.com/v1/openai"
12
+ protocol: "https"
13
+ timeout_ms: 60000
14
+
15
+ # Auth + payload format are required for online model fact-checking.
16
+ auth:
17
+ type: bearer
18
+ token_env: "DEEPINFRA_API_KEY"
19
+ payload_format: "openai_style"
20
+
21
+ services:
22
+ list_models:
23
+ path: "/models"
24
+ method: "GET"
25
+ response_binding: "data"
26
+
27
+ availability:
28
+ required: false
29
+ regions: ["global"]
30
+ check:
31
+ method: "GET"
32
+ path: "/models"
33
+ expected_status: [200]
34
+
35
+ capabilities:
36
+ streaming: true
37
+ tools: true
38
+ vision: true
39
+ agentic: false
40
+ reasoning: false
41
+ parallel_tools: true
42
+
43
+ # DeepInfra is OpenAI-compatible
44
+ streaming:
45
+ event_format: "data_lines"
46
+ decoder:
47
+ format: "sse"
48
+ delimiter: "\n\n"
49
+ prefix: "data: "
50
+ done_signal: "[DONE]"
51
+ frame_selector: "exists($.choices) || exists($.error)"
52
+ candidate:
53
+ candidate_id_path: "$.choices[*].index"
54
+ fan_out: true
55
+ event_map:
56
+ - match: "exists($.error)"
57
+ emit: "StreamError"
58
+ fields:
59
+ error: "$.error"
60
+ - match: "exists($.choices[*].delta.content)"
61
+ emit: "PartialContentDelta"
62
+ fields:
63
+ content: "$.choices[*].delta.content"
64
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
65
+ emit: "ToolCallStarted"
66
+ fields:
67
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
68
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
69
+ index: "$.choices[*].delta.tool_calls[*].index"
70
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
71
+ emit: "PartialToolCall"
72
+ fields:
73
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
74
+ index: "$.choices[*].delta.tool_calls[*].index"
75
+ - match: "exists($.usage)"
76
+ emit: "Metadata"
77
+ fields:
78
+ usage: "$.usage"
79
+ - match: "exists($.choices[*].finish_reason)"
80
+ emit: "FinalCandidate"
81
+ fields:
82
+ finish_reason: "$.choices[*].finish_reason"
83
+ candidate_index: "$.choices[*].index"
84
+ stop_condition: "$.choices[0].finish_reason != null"
85
+ extra_metadata_path: "$.usage"
86
+ content_path: "$.choices[0].delta.content"
87
+ tool_call_path: "$.choices[0].delta.tool_calls"
88
+
89
+ # Termination reason normalization (DeepInfra uses OpenAI-compatible finish_reason)
90
+ termination:
91
+ source_field: "finish_reason"
92
+ mapping:
93
+ stop: "end_turn"
94
+ length: "max_tokens"
95
+ tool_calls: "tool_use"
96
+ content_filter: "refusal"
97
+ notes:
98
+ - "finish_reason is reported per candidate."
99
+
100
+ # Tool invocation normalization (DeepInfra is OpenAI-compatible)
101
+ tooling:
102
+ source_model: "openai_tool_calls"
103
+ tool_use:
104
+ id_path: "id"
105
+ name_path: "function.name"
106
+ input_path: "function.arguments"
107
+ input_format: "json_string"
108
+ notes:
109
+ - "DeepInfra tool_calls.function.arguments is typically a JSON string."
110
+
111
+ features:
112
+ multi_candidate:
113
+ support_type: "native"
114
+ param_name: "n"
115
+ response_mapping:
116
+ tool_calls:
117
+ path: "choices[0].message.tool_calls"
118
+ fields:
119
+ id: "id"
120
+ name: "function.name"
121
+ args: "function.arguments"
122
+ error:
123
+ message_path: "error.message"
124
+ code_path: "error.code"
125
+
126
+ response_paths:
127
+ content: "choices[0].message.content"
128
+ tool_calls: "choices[0].message.tool_calls"
129
+ usage: "usage"
130
+ finish_reason: "choices[0].finish_reason"
131
+
132
+ parameter_mappings:
133
+ temperature: "temperature"
134
+ max_tokens: "max_tokens"
135
+ stream: "stream"
136
+ top_p: "top_p"
137
+ stop_sequences: "stop"
138
+ tools: "tools"
139
+ tool_choice: "tool_choice"
140
+
141
+ retry_policy:
142
+ max_retries: 3
143
+ max_delay_ms: 30000
144
+ strategy: "exponential_backoff"
145
+ min_delay_ms: 1000
146
+ jitter: "full"
147
+ retry_on_http_status: [429, 500, 502, 503]
148
+
149
+ error_classification:
150
+ by_http_status:
151
+ "400": "invalid_request"
152
+ "401": "authentication"
153
+ "422": "invalid_request"
154
+ "429": "rate_limited"
155
+ "500": "server_error"
156
+ "503": "overloaded"
@@ -0,0 +1,189 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: deepseek
4
+ provider_id: deepseek
5
+ protocol_version: "1.5"
6
+
7
+ name: DeepSeek
8
+ version: "v1"
9
+ status: stable
10
+ category: ai_provider
11
+ official_url: "https://platform.deepseek.com/docs"
12
+ support_contact: "https://support.deepseek.com"
13
+
14
+ endpoint:
15
+ base_url: "https://api.deepseek.com/v1"
16
+ protocol: https
17
+ timeout_ms: 10000
18
+ auth:
19
+ type: bearer
20
+ token_env: "DEEPSEEK_API_KEY"
21
+ payload_format: "openai_style"
22
+
23
+ # V1.5 Structured Endpoints
24
+ endpoints:
25
+ chat:
26
+ path: "/chat/completions"
27
+ method: "POST"
28
+ adapter: "openai"
29
+ completions:
30
+ path: "/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ # V1.5 Service Endpoints
35
+ services:
36
+ list_models:
37
+ path: "/models"
38
+ method: "GET"
39
+ response_binding: "data"
40
+ get_balance:
41
+ path: "/user/balance"
42
+ method: "GET"
43
+
44
+ # Legacy support
45
+ api_families: ["chat_completions"]
46
+ default_api_family: "chat_completions"
47
+
48
+ termination:
49
+ source_field: "finish_reason"
50
+ mapping:
51
+ stop: "end_turn"
52
+ length: "max_tokens"
53
+ tool_calls: "tool_use"
54
+ content_filter: "refusal"
55
+
56
+ tooling:
57
+ source_model: "openai_tool_calls"
58
+ tool_use:
59
+ id_path: "id"
60
+ name_path: "function.name"
61
+ input_path: "function.arguments"
62
+ input_format: "json_string"
63
+
64
+ retry_policy:
65
+ strategy: "exponential_backoff"
66
+ max_retries: 2
67
+ min_delay_ms: 1000
68
+ max_delay_ms: 8000
69
+ jitter: "full"
70
+ retry_on_http_status: [429, 500, 502, 503]
71
+
72
+ # Rate limit headers (OpenAI-compatible)
73
+ rate_limit_headers:
74
+ requests_limit: "x-ratelimit-limit-requests"
75
+ requests_remaining: "x-ratelimit-remaining-requests"
76
+ requests_reset: "x-ratelimit-reset-requests"
77
+ tokens_limit: "x-ratelimit-limit-tokens"
78
+ tokens_remaining: "x-ratelimit-remaining-tokens"
79
+ tokens_reset: "x-ratelimit-reset-tokens"
80
+ retry_after: "retry-after"
81
+
82
+ error_classification:
83
+ by_http_status:
84
+ "400": "invalid_request"
85
+ "401": "authentication"
86
+ "402": "quota_exhausted"
87
+ "422": "invalid_request"
88
+ "429": "rate_limited"
89
+ "500": "server_error"
90
+ "503": "overloaded"
91
+
92
+ parameter_mappings:
93
+ temperature: "temperature"
94
+ max_tokens: "max_tokens"
95
+ stream: "stream"
96
+ top_p: "top_p"
97
+ stop_sequences: "stop"
98
+ tools: "tools"
99
+ tool_choice: "tool_choice"
100
+
101
+ response_format: "openai_style"
102
+ response_paths:
103
+ content: "choices[0].message.content"
104
+ # Non-stream fallback when `content` is null (e.g. some reasoner / thinking payloads).
105
+ reasoning_content: "choices[0].message.reasoning_content"
106
+ tool_calls: "choices[0].message.tool_calls"
107
+ usage: "usage"
108
+ finish_reason: "choices[0].finish_reason"
109
+
110
+ streaming:
111
+ event_format: "data_lines"
112
+ decoder:
113
+ format: "sse"
114
+ delimiter: "\n\n"
115
+ prefix: "data: "
116
+ done_signal: "[DONE]"
117
+ strategy: "sse_ignore_comments"
118
+ content_path: "choices[0].delta.content"
119
+ tool_call_path: "choices[0].delta.tool_calls"
120
+ usage_path: "usage"
121
+ frame_selector: "exists($.choices) || exists($.error)"
122
+ event_map:
123
+ # Text content delta
124
+ - match: "exists($.choices[*].delta.content)"
125
+ emit: "PartialContentDelta"
126
+ fields:
127
+ content: "$.choices[*].delta.content"
128
+ # Tool call start
129
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
130
+ emit: "ToolCallStarted"
131
+ fields:
132
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
133
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
134
+ index: "$.choices[*].delta.tool_calls[*].index"
135
+ # Tool call arguments streaming
136
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
137
+ emit: "PartialToolCall"
138
+ fields:
139
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
140
+ index: "$.choices[*].delta.tool_calls[*].index"
141
+ # Usage metadata
142
+ - match: "exists($.usage)"
143
+ emit: "Metadata"
144
+ fields:
145
+ usage: "$.usage"
146
+ # Stream end with finish reason
147
+ - match: "$.choices[*].finish_reason != null"
148
+ emit: "StreamEnd"
149
+ fields:
150
+ finish_reason: "$.choices[*].finish_reason"
151
+ stop_condition: "$.choices[0].finish_reason != null"
152
+
153
+ features:
154
+ multi_candidate:
155
+ support_type: "native"
156
+ param_name: "n"
157
+ response_mapping:
158
+ tool_calls:
159
+ path: "choices[0].message.tool_calls"
160
+ fields:
161
+ id: "id"
162
+ name: "function.name"
163
+ args: "function.arguments"
164
+ error:
165
+ message_path: "error.message"
166
+ code_path: "error.code"
167
+ type_path: "error.type"
168
+ param_path: "error.param"
169
+
170
+ capabilities:
171
+ streaming: true
172
+ tools: true
173
+ vision: false
174
+ agentic: true
175
+ parallel_tools: false
176
+ reasoning: true
177
+
178
+ availability:
179
+ required: false
180
+ regions:
181
+ - cn
182
+ - global
183
+ check:
184
+ method: GET
185
+ path: "/models"
186
+ expected_status: [200, 401]
187
+ timeout_ms: 3000
188
+ experimental_features:
189
+ - "deep_thinking"
@@ -0,0 +1,172 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: doubao
4
+ protocol_version: "1.5"
5
+
6
+ name: 字节跳动豆包 (Doubao)
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://www.volcengine.com/docs/82379"
11
+ support_contact: "https://www.volcengine.com/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://ark.cn-beijing.volces.com/api/v3"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "VOLCENGINE_API_KEY"
21
+
22
+ payload_format: "openai_style"
23
+
24
+ # OpenAI-compatible API
25
+ api_families: ["chat_completions"]
26
+ default_api_family: "chat_completions"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+
40
+ termination:
41
+ source_field: "finish_reason"
42
+ mapping:
43
+ stop: "end_turn"
44
+ length: "max_tokens"
45
+ tool_calls: "tool_use"
46
+ content_filter: "refusal"
47
+ notes:
48
+ - "OpenAI-compatible finish_reason."
49
+ - "Doubao (豆包) is ByteDance's flagship LLM accessed via Volcengine."
50
+
51
+ tooling:
52
+ source_model: "openai_tool_calls"
53
+ tool_use:
54
+ id_path: "id"
55
+ name_path: "function.name"
56
+ input_path: "function.arguments"
57
+ input_format: "json_string"
58
+ notes:
59
+ - "Supports OpenAI-compatible function calling."
60
+
61
+ retry_policy:
62
+ strategy: "exponential_backoff"
63
+ max_retries: 3
64
+ min_delay_ms: 1000
65
+ max_delay_ms: 30000
66
+ jitter: "full"
67
+ retry_on_http_status: [429, 500, 502, 503]
68
+
69
+ error_classification:
70
+ by_http_status:
71
+ "400": "invalid_request"
72
+ "401": "authentication"
73
+ "403": "permission_denied"
74
+ "404": "not_found"
75
+ "429": "rate_limited"
76
+ "500": "server_error"
77
+ "503": "overloaded"
78
+
79
+ parameter_mappings:
80
+ temperature: "temperature"
81
+ max_tokens: "max_tokens"
82
+ stream: "stream"
83
+ top_p: "top_p"
84
+ stop_sequences: "stop"
85
+ tools: "tools"
86
+ tool_choice: "tool_choice"
87
+ frequency_penalty: "frequency_penalty"
88
+ presence_penalty: "presence_penalty"
89
+
90
+ response_format: "openai_style"
91
+
92
+ response_paths:
93
+ content: "choices[0].message.content"
94
+ tool_calls: "choices[0].message.tool_calls"
95
+ usage: "usage"
96
+ finish_reason: "choices[0].finish_reason"
97
+
98
+ streaming:
99
+ event_format: "data_lines"
100
+ decoder:
101
+ format: "sse"
102
+ delimiter: "\n\n"
103
+ prefix: "data: "
104
+ done_signal: "[DONE]"
105
+ content_path: "choices[0].delta.content"
106
+ tool_call_path: "choices[0].delta.tool_calls"
107
+ usage_path: "usage"
108
+ frame_selector: "exists($.choices) || exists($.error)"
109
+ event_map:
110
+ - match: "exists($.choices[*].delta.content)"
111
+ emit: "PartialContentDelta"
112
+ fields:
113
+ content: "$.choices[*].delta.content"
114
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
115
+ emit: "ToolCallStarted"
116
+ fields:
117
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
118
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
119
+ index: "$.choices[*].delta.tool_calls[*].index"
120
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
121
+ emit: "PartialToolCall"
122
+ fields:
123
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
124
+ index: "$.choices[*].delta.tool_calls[*].index"
125
+ - match: "exists($.usage)"
126
+ emit: "Metadata"
127
+ fields:
128
+ usage: "$.usage"
129
+ - match: "exists($.choices[*].finish_reason)"
130
+ emit: "FinalCandidate"
131
+ fields:
132
+ finish_reason: "$.choices[*].finish_reason"
133
+ stop_condition: "$.choices[0].finish_reason != null"
134
+
135
+ features:
136
+ multi_candidate:
137
+ support_type: "native"
138
+ param_name: "n"
139
+ response_mapping:
140
+ tool_calls:
141
+ path: "choices[0].message.tool_calls"
142
+ fields:
143
+ id: "id"
144
+ name: "function.name"
145
+ args: "function.arguments"
146
+ error:
147
+ message_path: "error.message"
148
+ code_path: "error.code"
149
+ type_path: "error.type"
150
+
151
+ capabilities:
152
+ streaming: true
153
+ tools: true
154
+ vision: true
155
+ agentic: true
156
+ parallel_tools: true
157
+ reasoning: true
158
+
159
+ availability:
160
+ required: false
161
+ regions:
162
+ - cn
163
+ check:
164
+ method: GET
165
+ path: "/models"
166
+ expected_status: [200, 401]
167
+ timeout_ms: 5000
168
+
169
+ experimental_features:
170
+ - "bot_chat"
171
+ - "embeddings"
172
+ - "image_generation"