@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,167 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: spark
4
+ protocol_version: "1.5"
5
+
6
+ name: 讯飞星火 (iFlytek Spark)
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://www.xfyun.cn/doc/spark/Web.html"
11
+ support_contact: "https://www.xfyun.cn/services"
12
+
13
+ endpoint:
14
+ base_url: "https://spark-api-open.xf-yun.com/v1"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "SPARK_API_KEY"
21
+
22
+ payload_format: "openai_style"
23
+
24
+ # Spark uses OpenAI-compatible API
25
+ api_families: ["chat_completions"]
26
+ default_api_family: "chat_completions"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+
40
+ termination:
41
+ source_field: "finish_reason"
42
+ mapping:
43
+ stop: "end_turn"
44
+ length: "max_tokens"
45
+ tool_calls: "tool_use"
46
+ notes:
47
+ - "OpenAI-compatible finish_reason."
48
+ - "星火大模型 (Spark) is iFlytek's flagship LLM series."
49
+
50
+ tooling:
51
+ source_model: "openai_tool_calls"
52
+ tool_use:
53
+ id_path: "id"
54
+ name_path: "function.name"
55
+ input_path: "function.arguments"
56
+ input_format: "json_string"
57
+ notes:
58
+ - "Supports OpenAI-compatible function calling."
59
+
60
+ retry_policy:
61
+ strategy: "exponential_backoff"
62
+ max_retries: 3
63
+ min_delay_ms: 1000
64
+ max_delay_ms: 30000
65
+ jitter: "full"
66
+ retry_on_http_status: [429, 500, 502, 503]
67
+
68
+ error_classification:
69
+ by_http_status:
70
+ "400": "invalid_request"
71
+ "401": "authentication"
72
+ "403": "permission_denied"
73
+ "404": "not_found"
74
+ "429": "rate_limited"
75
+ "500": "server_error"
76
+ "503": "overloaded"
77
+
78
+ parameter_mappings:
79
+ temperature: "temperature"
80
+ max_tokens: "max_tokens"
81
+ stream: "stream"
82
+ top_k: "top_k"
83
+ tools: "tools"
84
+ tool_choice: "tool_choice"
85
+
86
+ response_format: "openai_style"
87
+
88
+ response_paths:
89
+ content: "choices[0].message.content"
90
+ tool_calls: "choices[0].message.tool_calls"
91
+ usage: "usage"
92
+ finish_reason: "choices[0].finish_reason"
93
+
94
+ streaming:
95
+ event_format: "data_lines"
96
+ decoder:
97
+ format: "sse"
98
+ delimiter: "\n\n"
99
+ prefix: "data: "
100
+ done_signal: "[DONE]"
101
+ content_path: "choices[0].delta.content"
102
+ tool_call_path: "choices[0].delta.tool_calls"
103
+ usage_path: "usage"
104
+ frame_selector: "exists($.choices) || exists($.error)"
105
+ event_map:
106
+ - match: "exists($.choices[*].delta.content)"
107
+ emit: "PartialContentDelta"
108
+ fields:
109
+ content: "$.choices[*].delta.content"
110
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
111
+ emit: "ToolCallStarted"
112
+ fields:
113
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
114
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
115
+ index: "$.choices[*].delta.tool_calls[*].index"
116
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
117
+ emit: "PartialToolCall"
118
+ fields:
119
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
120
+ index: "$.choices[*].delta.tool_calls[*].index"
121
+ - match: "exists($.usage)"
122
+ emit: "Metadata"
123
+ fields:
124
+ usage: "$.usage"
125
+ - match: "exists($.choices[*].finish_reason)"
126
+ emit: "FinalCandidate"
127
+ fields:
128
+ finish_reason: "$.choices[*].finish_reason"
129
+ stop_condition: "$.choices[0].finish_reason != null"
130
+
131
+ features:
132
+ multi_candidate:
133
+ support_type: "simulated"
134
+ max_concurrent: 1
135
+ response_mapping:
136
+ tool_calls:
137
+ path: "choices[0].message.tool_calls"
138
+ fields:
139
+ id: "id"
140
+ name: "function.name"
141
+ args: "function.arguments"
142
+ error:
143
+ message_path: "error.message"
144
+ code_path: "error.code"
145
+
146
+ capabilities:
147
+ streaming: true
148
+ tools: true
149
+ vision: true
150
+ agentic: true
151
+ parallel_tools: false
152
+ reasoning: false
153
+
154
+ availability:
155
+ required: false
156
+ regions:
157
+ - cn
158
+ check:
159
+ method: GET
160
+ path: "/models"
161
+ expected_status: [200, 401]
162
+ timeout_ms: 5000
163
+
164
+ experimental_features:
165
+ - "document_qa"
166
+ - "image_generation"
167
+ - "speech_synthesis"
@@ -0,0 +1,185 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: stability
4
+ protocol_version: "1.5"
5
+
6
+ name: Stability AI
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://platform.stability.ai/docs"
11
+ support_contact: "https://stability.ai/contact"
12
+
13
+ # Structured endpoint definition (v1.1+ extension)
14
+ endpoint:
15
+ base_url: "https://api.stability.ai"
16
+ protocol: https
17
+ timeout_ms: 60000
18
+
19
+ auth:
20
+ type: bearer
21
+ token_env: "STABILITY_API_KEY"
22
+ extra_headers:
23
+ - name: "Content-Type"
24
+ value: "application/json"
25
+ - name: "Accept"
26
+ value: "application/json"
27
+ payload_format: "stability_api"
28
+
29
+ # Stability AI supports multiple creative AI APIs
30
+ api_families: ["text_to_image", "image_to_image", "image_to_image_masking", "inpainting", "outpainting", "image_upscale", "video_generation"]
31
+ default_api_family: "text_to_image"
32
+ endpoints:
33
+ text_to_image:
34
+ path: "/v2beta/stable-image/generate/sd3"
35
+ method: "POST"
36
+ adapter: "stability"
37
+ image_to_image:
38
+ path: "/v2beta/stable-image/generate/sd3"
39
+ method: "POST"
40
+ adapter: "stability"
41
+ image_edit:
42
+ path: "/v2beta/stable-image/edit/erase"
43
+ method: "POST"
44
+ adapter: "stability"
45
+ image_search_and_replace:
46
+ path: "/v2beta/stable-image/edit/search-and-replace"
47
+ method: "POST"
48
+ adapter: "stability"
49
+ upscale:
50
+ path: "/v2beta/stable-image/upscale/conservative"
51
+ method: "POST"
52
+ adapter: "stability"
53
+
54
+ # V1.5 Service Endpoints
55
+ services:
56
+ list_models:
57
+ path: "/v2beta/models/list"
58
+ method: "GET"
59
+ response_binding: "data"
60
+
61
+ # Stability AI doesn't use finish_reason in the same way as LLMs
62
+ termination:
63
+ source_field: "finish"
64
+ mapping:
65
+ complete: "completed"
66
+ failed: "error"
67
+ notes:
68
+ - "Image generation uses async workflow with job IDs"
69
+ - "finish_field indicates completion status"
70
+
71
+ # Tool invocation normalization
72
+ tooling:
73
+ source_model: "unknown"
74
+ notes:
75
+ - "Stability AI is not designed for text-based tool calling"
76
+ - "Focuses on image/video generation workflows"
77
+
78
+ # Retry policy
79
+ retry_policy:
80
+ strategy: "exponential_backoff"
81
+ max_retries: 3
82
+ min_delay_ms: 1000
83
+ max_delay_ms: 10000
84
+ jitter: "full"
85
+ retry_on_http_status: [429, 500, 502, 503]
86
+ notes:
87
+ - "Image generation can be resource-intensive"
88
+ - "502/503 common during high load"
89
+ - "429 indicates rate limit exceeded"
90
+
91
+ # Error classification hints
92
+ error_classification:
93
+ by_http_status:
94
+ "400": "invalid_request"
95
+ "401": "authentication"
96
+ "403": "permission_denied"
97
+ "404": "not_found"
98
+ "429": "rate_limited"
99
+ "500": "server_error"
100
+ "502": "overloaded"
101
+ "503": "overloaded"
102
+ notes:
103
+ - "502/503 often indicate generation queue or resource constraints"
104
+ - "Error messages may include quota information"
105
+
106
+ parameter_mappings:
107
+ prompt: "prompt"
108
+ negative_prompt: "negative_prompt"
109
+ aspect_ratio: "aspect_ratio"
110
+ seed: "seed"
111
+ steps: "steps"
112
+ cfg_scale: "cfg_scale"
113
+ mode: "mode"
114
+ output_format: "output_format"
115
+ strength: "strength"
116
+ image: "image"
117
+ init_image_mode: "init_image_mode"
118
+
119
+ response_format: "stability_image"
120
+ response_paths:
121
+ content: "image"
122
+ artifacts: "artifacts"
123
+ finish_reason: "finish"
124
+ image_url: "image"
125
+
126
+ streaming:
127
+ event_format: "stability_async"
128
+ decoder:
129
+ format: "sse"
130
+ delimiter: "\n\n"
131
+ prefix: "data: "
132
+ done_signal: "[DONE]"
133
+ # Stability uses job-based async generation
134
+ frame_selector: "exists($.id) || exists($.image) || exists($.artifacts)"
135
+ event_map:
136
+ - match: "exists($.id) && !exists($.image)"
137
+ emit: "Metadata"
138
+ fields:
139
+ job_id: "$.id"
140
+ status: "$.status"
141
+ timestamp: "$.timestamp"
142
+ - match: "exists($.image)"
143
+ emit: "FinalCandidate"
144
+ fields:
145
+ image: "$.image"
146
+ finish_reason: "finish"
147
+ - match: "exists($.artifacts)"
148
+ emit: "FinalCandidate"
149
+ fields:
150
+ artifacts: "$.artifacts"
151
+ finish: "$.finish"
152
+ stop_condition: "exists($.image) || exists($.artifacts) || exists($.finish) && $.finish == 'complete'"
153
+ extra_metadata_path: "$.finish"
154
+
155
+ capabilities:
156
+ streaming: false
157
+ tools: false
158
+ vision: true
159
+ agentic: false
160
+ parallel_tools: false
161
+ reasoning: false
162
+
163
+ experimental_features:
164
+ - "async_generation"
165
+ - "video_generation"
166
+ - "3d_generation"
167
+ - "inpainting"
168
+ - "outpainting"
169
+
170
+ # Connection vars for model selection
171
+ connection_vars:
172
+ model: "model_id"
173
+
174
+ # Availability and health checking (v1.1+ extension)
175
+ availability:
176
+ required: false
177
+ regions:
178
+ - global
179
+ check:
180
+ method: GET
181
+ path: "/v2beta/models/list"
182
+ expected_status: [200]
183
+ timeout_ms: 5000
184
+ notes:
185
+ - "Check models/list endpoint to verify service health"
@@ -0,0 +1,170 @@
1
+ $schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
2
+
3
+ id: tiangong
4
+ protocol_version: "1.5"
5
+
6
+ name: 昆仑万维天工 (Kunlun Tiangong)
7
+ version: "v1"
8
+ status: stable
9
+ category: ai_provider
10
+ official_url: "https://model-platform.tiangong.cn/api-reference"
11
+ support_contact: "https://www.kunlun.com/contact"
12
+
13
+ endpoint:
14
+ base_url: "https://sky-api.singularity-ai.com/saas/api/v4"
15
+ protocol: https
16
+ timeout_ms: 60000
17
+
18
+ auth:
19
+ type: bearer
20
+ token_env: "TIANGONG_API_KEY"
21
+
22
+ payload_format: "openai_style"
23
+
24
+ # Tiangong uses OpenAI-compatible API
25
+ api_families: ["chat_completions"]
26
+ default_api_family: "chat_completions"
27
+
28
+ endpoints:
29
+ chat:
30
+ path: "/chat/completions"
31
+ method: "POST"
32
+ adapter: "openai"
33
+
34
+ services:
35
+ list_models:
36
+ path: "/models"
37
+ method: "GET"
38
+ response_binding: "data"
39
+
40
+ termination:
41
+ source_field: "finish_reason"
42
+ mapping:
43
+ stop: "end_turn"
44
+ length: "max_tokens"
45
+ tool_calls: "tool_use"
46
+ notes:
47
+ - "OpenAI-compatible finish_reason."
48
+ - "天工 (Tiangong) is Kunlun's flagship AI assistant."
49
+
50
+ tooling:
51
+ source_model: "openai_tool_calls"
52
+ tool_use:
53
+ id_path: "id"
54
+ name_path: "function.name"
55
+ input_path: "function.arguments"
56
+ input_format: "json_string"
57
+ notes:
58
+ - "Supports OpenAI-compatible function calling."
59
+
60
+ retry_policy:
61
+ strategy: "exponential_backoff"
62
+ max_retries: 3
63
+ min_delay_ms: 1000
64
+ max_delay_ms: 30000
65
+ jitter: "full"
66
+ retry_on_http_status: [429, 500, 502, 503]
67
+
68
+ error_classification:
69
+ by_http_status:
70
+ "400": "invalid_request"
71
+ "401": "authentication"
72
+ "403": "permission_denied"
73
+ "404": "not_found"
74
+ "429": "rate_limited"
75
+ "500": "server_error"
76
+ "503": "overloaded"
77
+
78
+ parameter_mappings:
79
+ temperature: "temperature"
80
+ max_tokens: "max_tokens"
81
+ stream: "stream"
82
+ top_p: "top_p"
83
+ stop_sequences: "stop"
84
+ tools: "tools"
85
+ tool_choice: "tool_choice"
86
+ frequency_penalty: "frequency_penalty"
87
+ presence_penalty: "presence_penalty"
88
+
89
+ response_format: "openai_style"
90
+
91
+ response_paths:
92
+ content: "choices[0].message.content"
93
+ tool_calls: "choices[0].message.tool_calls"
94
+ usage: "usage"
95
+ finish_reason: "choices[0].finish_reason"
96
+
97
+ streaming:
98
+ event_format: "data_lines"
99
+ decoder:
100
+ format: "sse"
101
+ delimiter: "\n\n"
102
+ prefix: "data: "
103
+ done_signal: "[DONE]"
104
+ content_path: "choices[0].delta.content"
105
+ tool_call_path: "choices[0].delta.tool_calls"
106
+ usage_path: "usage"
107
+ frame_selector: "exists($.choices) || exists($.error)"
108
+ event_map:
109
+ - match: "exists($.choices[*].delta.content)"
110
+ emit: "PartialContentDelta"
111
+ fields:
112
+ content: "$.choices[*].delta.content"
113
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
114
+ emit: "ToolCallStarted"
115
+ fields:
116
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
117
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
118
+ index: "$.choices[*].delta.tool_calls[*].index"
119
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
120
+ emit: "PartialToolCall"
121
+ fields:
122
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
123
+ index: "$.choices[*].delta.tool_calls[*].index"
124
+ - match: "exists($.usage)"
125
+ emit: "Metadata"
126
+ fields:
127
+ usage: "$.usage"
128
+ - match: "exists($.choices[*].finish_reason)"
129
+ emit: "FinalCandidate"
130
+ fields:
131
+ finish_reason: "$.choices[*].finish_reason"
132
+ stop_condition: "$.choices[0].finish_reason != null"
133
+
134
+ features:
135
+ multi_candidate:
136
+ support_type: "native"
137
+ param_name: "n"
138
+ response_mapping:
139
+ tool_calls:
140
+ path: "choices[0].message.tool_calls"
141
+ fields:
142
+ id: "id"
143
+ name: "function.name"
144
+ args: "function.arguments"
145
+ error:
146
+ message_path: "error.message"
147
+ code_path: "error.code"
148
+
149
+ capabilities:
150
+ streaming: true
151
+ tools: true
152
+ vision: true
153
+ agentic: true
154
+ parallel_tools: true
155
+ reasoning: false
156
+
157
+ availability:
158
+ required: false
159
+ regions:
160
+ - cn
161
+ check:
162
+ method: GET
163
+ path: "/models"
164
+ expected_status: [200, 401]
165
+ timeout_ms: 5000
166
+
167
+ experimental_features:
168
+ - "web_search"
169
+ - "music_generation"
170
+ - "image_generation"
@@ -0,0 +1,156 @@
1
+ $schema: ../../schemas/v1.json
2
+ protocol_version: "1.5"
3
+ id: "together"
4
+ name: "Together AI"
5
+ status: "stable"
6
+ category: "model_provider"
7
+ official_url: "https://www.together.ai/"
8
+ support_contact: "https://www.together.ai/contact"
9
+
10
+ endpoint:
11
+ base_url: "https://api.together.xyz/v1"
12
+ protocol: "https"
13
+ timeout_ms: 60000
14
+
15
+ # Auth + payload format are required for online model fact-checking.
16
+ auth:
17
+ type: bearer
18
+ token_env: "TOGETHER_API_KEY"
19
+ payload_format: "openai_style"
20
+
21
+ services:
22
+ list_models:
23
+ path: "/models"
24
+ method: "GET"
25
+ response_binding: "data"
26
+
27
+ availability:
28
+ required: false
29
+ regions: ["global"]
30
+ check:
31
+ method: "GET"
32
+ path: "/models"
33
+ expected_status: [200]
34
+
35
+ capabilities:
36
+ streaming: true
37
+ tools: true
38
+ vision: true
39
+ agentic: false
40
+ reasoning: false
41
+ parallel_tools: false
42
+
43
+ # Together AI is OpenAI-compatible
44
+ streaming:
45
+ event_format: "data_lines"
46
+ decoder:
47
+ format: "sse"
48
+ delimiter: "\n\n"
49
+ prefix: "data: "
50
+ done_signal: "[DONE]"
51
+ frame_selector: "exists($.choices) || exists($.error)"
52
+ candidate:
53
+ candidate_id_path: "$.choices[*].index"
54
+ fan_out: true
55
+ event_map:
56
+ - match: "exists($.error)"
57
+ emit: "StreamError"
58
+ fields:
59
+ error: "$.error"
60
+ - match: "exists($.choices[*].delta.content)"
61
+ emit: "PartialContentDelta"
62
+ fields:
63
+ content: "$.choices[*].delta.content"
64
+ - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
65
+ emit: "ToolCallStarted"
66
+ fields:
67
+ tool_call_id: "$.choices[*].delta.tool_calls[*].id"
68
+ tool_name: "$.choices[*].delta.tool_calls[*].function.name"
69
+ index: "$.choices[*].delta.tool_calls[*].index"
70
+ - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
71
+ emit: "PartialToolCall"
72
+ fields:
73
+ arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
74
+ index: "$.choices[*].delta.tool_calls[*].index"
75
+ - match: "exists($.usage)"
76
+ emit: "Metadata"
77
+ fields:
78
+ usage: "$.usage"
79
+ - match: "exists($.choices[*].finish_reason)"
80
+ emit: "FinalCandidate"
81
+ fields:
82
+ finish_reason: "$.choices[*].finish_reason"
83
+ candidate_index: "$.choices[*].index"
84
+ stop_condition: "$.choices[0].finish_reason != null"
85
+ extra_metadata_path: "$.usage"
86
+ content_path: "$.choices[0].delta.content"
87
+ tool_call_path: "$.choices[0].delta.tool_calls"
88
+
89
+ # Termination reason normalization (Together AI uses OpenAI-compatible finish_reason)
90
+ termination:
91
+ source_field: "finish_reason"
92
+ mapping:
93
+ stop: "end_turn"
94
+ length: "max_tokens"
95
+ tool_calls: "tool_use"
96
+ content_filter: "refusal"
97
+ notes:
98
+ - "finish_reason is reported per candidate."
99
+
100
+ # Tool invocation normalization (Together AI is OpenAI-compatible)
101
+ tooling:
102
+ source_model: "openai_tool_calls"
103
+ tool_use:
104
+ id_path: "id"
105
+ name_path: "function.name"
106
+ input_path: "function.arguments"
107
+ input_format: "json_string"
108
+ notes:
109
+ - "Together AI tool_calls.function.arguments is typically a JSON string."
110
+
111
+ features:
112
+ multi_candidate:
113
+ support_type: "native"
114
+ param_name: "n"
115
+ response_mapping:
116
+ tool_calls:
117
+ path: "choices[0].message.tool_calls"
118
+ fields:
119
+ id: "id"
120
+ name: "function.name"
121
+ args: "function.arguments"
122
+ error:
123
+ message_path: "error.message"
124
+ code_path: "error.code"
125
+ type_path: "error.type"
126
+
127
+ response_paths:
128
+ content: "choices[0].message.content"
129
+ tool_calls: "choices[0].message.tool_calls"
130
+ usage: "usage"
131
+ finish_reason: "choices[0].finish_reason"
132
+
133
+ parameter_mappings:
134
+ temperature: "temperature"
135
+ max_tokens: "max_tokens"
136
+ stream: "stream"
137
+ top_p: "top_p"
138
+ stop_sequences: "stop"
139
+ tools: "tools"
140
+ tool_choice: "tool_choice"
141
+
142
+ retry_policy:
143
+ max_retries: 3
144
+ max_delay_ms: 30000
145
+ strategy: "exponential_backoff"
146
+ min_delay_ms: 1000
147
+ jitter: "full"
148
+ retry_on_http_status: [429, 500, 502, 503]
149
+
150
+ error_classification:
151
+ by_http_status:
152
+ "400": "invalid_request"
153
+ "401": "authentication"
154
+ "429": "rate_limited"
155
+ "500": "server_error"
156
+ "503": "overloaded"