@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194)
  1. package/LICENSE +6 -0
  2. package/README.md +415 -0
  3. package/dist/index.json +8 -0
  4. package/dist/v1/models/ai21.json +140 -0
  5. package/dist/v1/models/baichuan.json +138 -0
  6. package/dist/v1/models/cerebras.json +147 -0
  7. package/dist/v1/models/claude.json +114 -0
  8. package/dist/v1/models/cohere.json +235 -0
  9. package/dist/v1/models/deepinfra.json +43 -0
  10. package/dist/v1/models/deepseek-chat.json +55 -0
  11. package/dist/v1/models/doubao.json +197 -0
  12. package/dist/v1/models/ernie.json +223 -0
  13. package/dist/v1/models/fireworks.json +222 -0
  14. package/dist/v1/models/gemini.json +58 -0
  15. package/dist/v1/models/gpt.json +166 -0
  16. package/dist/v1/models/grok.json +138 -0
  17. package/dist/v1/models/huggingface.json +183 -0
  18. package/dist/v1/models/hunyuan.json +255 -0
  19. package/dist/v1/models/jina.json +139 -0
  20. package/dist/v1/models/lepton.json +188 -0
  21. package/dist/v1/models/llama.json +143 -0
  22. package/dist/v1/models/minimax.json +194 -0
  23. package/dist/v1/models/mistral.json +177 -0
  24. package/dist/v1/models/moonshot.json +144 -0
  25. package/dist/v1/models/nvidia.json +212 -0
  26. package/dist/v1/models/palmyra.json +103 -0
  27. package/dist/v1/models/perplexity.json +143 -0
  28. package/dist/v1/models/qwen.json +49 -0
  29. package/dist/v1/models/replicate.json +206 -0
  30. package/dist/v1/models/sensenova.json +144 -0
  31. package/dist/v1/models/siliconflow.json +44 -0
  32. package/dist/v1/models/spark.json +173 -0
  33. package/dist/v1/models/stable-diffusion.json +161 -0
  34. package/dist/v1/models/tiangong.json +169 -0
  35. package/dist/v1/models/together.json +43 -0
  36. package/dist/v1/models/yi.json +199 -0
  37. package/dist/v1/models/zhipu.json +250 -0
  38. package/dist/v1/providers/ai21.json +215 -0
  39. package/dist/v1/providers/anthropic.json +253 -0
  40. package/dist/v1/providers/anyscale.json +115 -0
  41. package/dist/v1/providers/azure.json +188 -0
  42. package/dist/v1/providers/baichuan.json +205 -0
  43. package/dist/v1/providers/baidu.json +205 -0
  44. package/dist/v1/providers/cerebras.json +216 -0
  45. package/dist/v1/providers/cohere.json +209 -0
  46. package/dist/v1/providers/deepinfra.json +196 -0
  47. package/dist/v1/providers/deepseek.json +221 -0
  48. package/dist/v1/providers/doubao.json +209 -0
  49. package/dist/v1/providers/fireworks.json +227 -0
  50. package/dist/v1/providers/gemini.json +279 -0
  51. package/dist/v1/providers/groq.json +218 -0
  52. package/dist/v1/providers/huggingface.json +181 -0
  53. package/dist/v1/providers/hunyuan.json +198 -0
  54. package/dist/v1/providers/jina.json +202 -0
  55. package/dist/v1/providers/lepton.json +221 -0
  56. package/dist/v1/providers/minimax.json +209 -0
  57. package/dist/v1/providers/mistral.json +214 -0
  58. package/dist/v1/providers/moonshot.json +214 -0
  59. package/dist/v1/providers/nvidia.json +213 -0
  60. package/dist/v1/providers/openai.json +267 -0
  61. package/dist/v1/providers/openrouter.json +220 -0
  62. package/dist/v1/providers/perplexity.json +172 -0
  63. package/dist/v1/providers/qwen.json +231 -0
  64. package/dist/v1/providers/replicate.json +192 -0
  65. package/dist/v1/providers/sensenova.json +185 -0
  66. package/dist/v1/providers/siliconflow.json +197 -0
  67. package/dist/v1/providers/spark.json +204 -0
  68. package/dist/v1/providers/stability.json +221 -0
  69. package/dist/v1/providers/tiangong.json +207 -0
  70. package/dist/v1/providers/together.json +196 -0
  71. package/dist/v1/providers/writer.json +253 -0
  72. package/dist/v1/providers/xai.json +238 -0
  73. package/dist/v1/providers/yi.json +205 -0
  74. package/dist/v1/providers/zhipu.json +208 -0
  75. package/dist/v1/spec.json +783 -0
  76. package/dist/v2/providers/anthropic.json +372 -0
  77. package/dist/v2/providers/cohere.json +109 -0
  78. package/dist/v2/providers/deepseek.json +272 -0
  79. package/dist/v2/providers/doubao.json +260 -0
  80. package/dist/v2/providers/google.json +388 -0
  81. package/dist/v2/providers/jina.json +71 -0
  82. package/dist/v2/providers/moonshot.json +284 -0
  83. package/dist/v2/providers/openai.json +419 -0
  84. package/dist/v2/providers/qwen.json +274 -0
  85. package/dist/v2/providers/zhipu.json +257 -0
  86. package/dist/v2-alpha/providers/anthropic.json +182 -0
  87. package/dist/v2-alpha/providers/gemini.json +187 -0
  88. package/dist/v2-alpha/providers/openai.json +215 -0
  89. package/dist/v2-alpha/spec.json +644 -0
  90. package/package.json +61 -0
  91. package/schemas/spec.json +186 -0
  92. package/schemas/v1.json +1116 -0
  93. package/schemas/v2/availability.json +66 -0
  94. package/schemas/v2/capabilities.json +182 -0
  95. package/schemas/v2/capability-profile.json +174 -0
  96. package/schemas/v2/computer-use.json +222 -0
  97. package/schemas/v2/context-policy.json +148 -0
  98. package/schemas/v2/endpoint.json +2 -0
  99. package/schemas/v2/error-codes.yaml +225 -0
  100. package/schemas/v2/errors.json +250 -0
  101. package/schemas/v2/execution-metadata.json +59 -0
  102. package/schemas/v2/mcp.json +225 -0
  103. package/schemas/v2/message-roles.json +10 -0
  104. package/schemas/v2/multimodal.json +297 -0
  105. package/schemas/v2/pricing.json +14 -0
  106. package/schemas/v2/provider-contract.json +317 -0
  107. package/schemas/v2/provider.json +203 -0
  108. package/schemas/v2/regions.json +14 -0
  109. package/v1/models/ai21.yaml +97 -0
  110. package/v1/models/baichuan.yaml +95 -0
  111. package/v1/models/cerebras.yaml +99 -0
  112. package/v1/models/claude.yaml +59 -0
  113. package/v1/models/cohere.yaml +165 -0
  114. package/v1/models/deepinfra.yaml +29 -0
  115. package/v1/models/deepseek-chat.yaml +32 -0
  116. package/v1/models/doubao.yaml +129 -0
  117. package/v1/models/ernie.yaml +146 -0
  118. package/v1/models/fireworks.yaml +145 -0
  119. package/v1/models/gemini.yaml +32 -0
  120. package/v1/models/gpt.yaml +90 -0
  121. package/v1/models/grok.yaml +74 -0
  122. package/v1/models/huggingface.yaml +110 -0
  123. package/v1/models/hunyuan.yaml +164 -0
  124. package/v1/models/jina.yaml +98 -0
  125. package/v1/models/lepton.yaml +130 -0
  126. package/v1/models/llama.yaml +91 -0
  127. package/v1/models/minimax.yaml +132 -0
  128. package/v1/models/mistral.yaml +100 -0
  129. package/v1/models/moonshot.yaml +97 -0
  130. package/v1/models/nvidia.yaml +118 -0
  131. package/v1/models/palmyra.yaml +59 -0
  132. package/v1/models/perplexity.yaml +97 -0
  133. package/v1/models/qwen.yaml +27 -0
  134. package/v1/models/replicate.yaml +136 -0
  135. package/v1/models/sensenova.yaml +97 -0
  136. package/v1/models/siliconflow.yaml +29 -0
  137. package/v1/models/spark.yaml +114 -0
  138. package/v1/models/stable-diffusion.yaml +113 -0
  139. package/v1/models/tiangong.yaml +114 -0
  140. package/v1/models/together.yaml +29 -0
  141. package/v1/models/yi.yaml +132 -0
  142. package/v1/models/zhipu.yaml +163 -0
  143. package/v1/providers/ai21.yaml +176 -0
  144. package/v1/providers/anthropic.yaml +209 -0
  145. package/v1/providers/anyscale.yaml +106 -0
  146. package/v1/providers/azure.yaml +155 -0
  147. package/v1/providers/baichuan.yaml +168 -0
  148. package/v1/providers/baidu.yaml +173 -0
  149. package/v1/providers/cerebras.yaml +178 -0
  150. package/v1/providers/cohere.yaml +175 -0
  151. package/v1/providers/deepinfra.yaml +156 -0
  152. package/v1/providers/deepseek.yaml +189 -0
  153. package/v1/providers/doubao.yaml +172 -0
  154. package/v1/providers/fireworks.yaml +187 -0
  155. package/v1/providers/gemini.yaml +229 -0
  156. package/v1/providers/groq.yaml +181 -0
  157. package/v1/providers/huggingface.yaml +157 -0
  158. package/v1/providers/hunyuan.yaml +162 -0
  159. package/v1/providers/jina.yaml +171 -0
  160. package/v1/providers/lepton.yaml +183 -0
  161. package/v1/providers/minimax.yaml +172 -0
  162. package/v1/providers/mistral.yaml +186 -0
  163. package/v1/providers/moonshot.yaml +176 -0
  164. package/v1/providers/nvidia.yaml +172 -0
  165. package/v1/providers/openai.yaml +224 -0
  166. package/v1/providers/openrouter.yaml +181 -0
  167. package/v1/providers/perplexity.yaml +144 -0
  168. package/v1/providers/qwen.yaml +192 -0
  169. package/v1/providers/replicate.yaml +159 -0
  170. package/v1/providers/sensenova.yaml +153 -0
  171. package/v1/providers/siliconflow.yaml +156 -0
  172. package/v1/providers/spark.yaml +167 -0
  173. package/v1/providers/stability.yaml +185 -0
  174. package/v1/providers/tiangong.yaml +170 -0
  175. package/v1/providers/together.yaml +156 -0
  176. package/v1/providers/writer.yaml +212 -0
  177. package/v1/providers/xai.yaml +206 -0
  178. package/v1/providers/yi.yaml +168 -0
  179. package/v1/providers/zhipu.yaml +171 -0
  180. package/v1/spec.yaml +637 -0
  181. package/v2/providers/anthropic.yaml +244 -0
  182. package/v2/providers/cohere.yaml +75 -0
  183. package/v2/providers/deepseek.yaml +176 -0
  184. package/v2/providers/doubao.yaml +169 -0
  185. package/v2/providers/google.yaml +245 -0
  186. package/v2/providers/jina.yaml +55 -0
  187. package/v2/providers/moonshot.yaml +186 -0
  188. package/v2/providers/openai.yaml +266 -0
  189. package/v2/providers/qwen.yaml +174 -0
  190. package/v2/providers/zhipu.yaml +176 -0
  191. package/v2-alpha/providers/anthropic.yaml +134 -0
  192. package/v2-alpha/providers/gemini.yaml +144 -0
  193. package/v2-alpha/providers/openai.yaml +154 -0
  194. package/v2-alpha/spec.yaml +512 -0
@@ -0,0 +1,198 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "id": "hunyuan",
4
+ "protocol_version": "1.5",
5
+ "name": "腾讯混元 (Tencent Hunyuan)",
6
+ "version": "v1",
7
+ "status": "stable",
8
+ "category": "ai_provider",
9
+ "official_url": "https://cloud.tencent.com/document/product/1729",
10
+ "support_contact": "https://cloud.tencent.com/online-service",
11
+ "endpoint": {
12
+ "base_url": "https://api.hunyuan.cloud.tencent.com",
13
+ "protocol": "https",
14
+ "timeout_ms": 60000
15
+ },
16
+ "auth": {
17
+ "type": "bearer",
18
+ "token_env": "HUNYUAN_API_KEY"
19
+ },
20
+ "payload_format": "openai_style",
21
+ "api_families": [
22
+ "chat_completions"
23
+ ],
24
+ "default_api_family": "chat_completions",
25
+ "endpoints": {
26
+ "chat": {
27
+ "path": "/v1/chat/completions",
28
+ "method": "POST",
29
+ "adapter": "openai"
30
+ }
31
+ },
32
+ "termination": {
33
+ "source_field": "finish_reason",
34
+ "mapping": {
35
+ "stop": "end_turn",
36
+ "length": "max_tokens",
37
+ "tool_calls": "tool_use",
38
+ "sensitive": "refusal"
39
+ },
40
+ "notes": [
41
+ "OpenAI-compatible finish_reason.",
42
+ "混元大模型 (Hunyuan) is Tencent's flagship LLM."
43
+ ]
44
+ },
45
+ "tooling": {
46
+ "source_model": "openai_tool_calls",
47
+ "tool_use": {
48
+ "id_path": "id",
49
+ "name_path": "function.name",
50
+ "input_path": "function.arguments",
51
+ "input_format": "json_string"
52
+ },
53
+ "notes": [
54
+ "Supports OpenAI-compatible function calling."
55
+ ]
56
+ },
57
+ "retry_policy": {
58
+ "strategy": "exponential_backoff",
59
+ "max_retries": 3,
60
+ "min_delay_ms": 1000,
61
+ "max_delay_ms": 30000,
62
+ "jitter": "full",
63
+ "retry_on_http_status": [
64
+ 429,
65
+ 500,
66
+ 502,
67
+ 503
68
+ ]
69
+ },
70
+ "error_classification": {
71
+ "by_http_status": {
72
+ "400": "invalid_request",
73
+ "401": "authentication",
74
+ "403": "permission_denied",
75
+ "404": "not_found",
76
+ "429": "rate_limited",
77
+ "500": "server_error",
78
+ "503": "overloaded"
79
+ }
80
+ },
81
+ "parameter_mappings": {
82
+ "temperature": "temperature",
83
+ "max_tokens": "max_tokens",
84
+ "stream": "stream",
85
+ "top_p": "top_p",
86
+ "tools": "tools",
87
+ "tool_choice": "tool_choice"
88
+ },
89
+ "response_format": "openai_style",
90
+ "response_paths": {
91
+ "content": "choices[0].message.content",
92
+ "tool_calls": "choices[0].message.tool_calls",
93
+ "usage": "usage",
94
+ "finish_reason": "choices[0].finish_reason"
95
+ },
96
+ "streaming": {
97
+ "event_format": "data_lines",
98
+ "decoder": {
99
+ "format": "sse",
100
+ "delimiter": "\n\n",
101
+ "prefix": "data: ",
102
+ "done_signal": "[DONE]"
103
+ },
104
+ "content_path": "choices[0].delta.content",
105
+ "tool_call_path": "choices[0].delta.tool_calls",
106
+ "usage_path": "usage",
107
+ "frame_selector": "exists($.choices) || exists($.error)",
108
+ "event_map": [
109
+ {
110
+ "match": "exists($.choices[*].delta.content)",
111
+ "emit": "PartialContentDelta",
112
+ "fields": {
113
+ "content": "$.choices[*].delta.content"
114
+ }
115
+ },
116
+ {
117
+ "match": "exists($.choices[*].delta.tool_calls[*].function.name)",
118
+ "emit": "ToolCallStarted",
119
+ "fields": {
120
+ "tool_call_id": "$.choices[*].delta.tool_calls[*].id",
121
+ "tool_name": "$.choices[*].delta.tool_calls[*].function.name",
122
+ "index": "$.choices[*].delta.tool_calls[*].index"
123
+ }
124
+ },
125
+ {
126
+ "match": "exists($.choices[*].delta.tool_calls[*].function.arguments)",
127
+ "emit": "PartialToolCall",
128
+ "fields": {
129
+ "arguments": "$.choices[*].delta.tool_calls[*].function.arguments",
130
+ "index": "$.choices[*].delta.tool_calls[*].index"
131
+ }
132
+ },
133
+ {
134
+ "match": "exists($.usage)",
135
+ "emit": "Metadata",
136
+ "fields": {
137
+ "usage": "$.usage"
138
+ }
139
+ },
140
+ {
141
+ "match": "exists($.choices[*].finish_reason)",
142
+ "emit": "FinalCandidate",
143
+ "fields": {
144
+ "finish_reason": "$.choices[*].finish_reason"
145
+ }
146
+ }
147
+ ],
148
+ "stop_condition": "$.choices[0].finish_reason != null"
149
+ },
150
+ "features": {
151
+ "multi_candidate": {
152
+ "support_type": "native",
153
+ "param_name": "n"
154
+ },
155
+ "response_mapping": {
156
+ "tool_calls": {
157
+ "path": "choices[0].message.tool_calls",
158
+ "fields": {
159
+ "id": "id",
160
+ "name": "function.name",
161
+ "args": "function.arguments"
162
+ }
163
+ },
164
+ "error": {
165
+ "message_path": "error.message",
166
+ "code_path": "error.code"
167
+ }
168
+ }
169
+ },
170
+ "capabilities": {
171
+ "streaming": true,
172
+ "tools": true,
173
+ "vision": true,
174
+ "agentic": true,
175
+ "parallel_tools": true,
176
+ "reasoning": true
177
+ },
178
+ "availability": {
179
+ "required": false,
180
+ "regions": [
181
+ "cn"
182
+ ],
183
+ "check": {
184
+ "method": "GET",
185
+ "path": "/v1/models",
186
+ "expected_status": [
187
+ 200,
188
+ 401
189
+ ],
190
+ "timeout_ms": 5000
191
+ }
192
+ },
193
+ "experimental_features": [
194
+ "search_enhancement",
195
+ "image_understanding",
196
+ "role_play"
197
+ ]
198
+ }
@@ -0,0 +1,202 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "id": "jina",
4
+ "protocol_version": "1.5",
5
+ "name": "Jina AI",
6
+ "version": "v1",
7
+ "status": "stable",
8
+ "category": "ai_provider",
9
+ "official_url": "https://jina.ai/docs",
10
+ "support_contact": "https://jina.ai/contact",
11
+ "endpoint": {
12
+ "base_url": "https://api.jina.ai",
13
+ "protocol": "https",
14
+ "timeout_ms": 30000
15
+ },
16
+ "auth": {
17
+ "type": "bearer",
18
+ "token_env": "JINA_API_KEY"
19
+ },
20
+ "payload_format": "jina_api",
21
+ "api_families": [
22
+ "embeddings",
23
+ "rerank",
24
+ "reader",
25
+ "search"
26
+ ],
27
+ "default_api_family": "embeddings",
28
+ "endpoints": {
29
+ "embeddings": {
30
+ "path": "/v1/embeddings",
31
+ "method": "POST",
32
+ "adapter": "openai"
33
+ },
34
+ "rerank": {
35
+ "path": "/v1/rerank",
36
+ "method": "POST",
37
+ "adapter": "jina"
38
+ },
39
+ "reader": {
40
+ "path": "/v1/reader",
41
+ "method": "POST",
42
+ "adapter": "jina"
43
+ }
44
+ },
45
+ "services": {
46
+ "list_models": {
47
+ "path": "/v1/models",
48
+ "method": "GET",
49
+ "response_binding": "data"
50
+ }
51
+ },
52
+ "termination": {
53
+ "source_field": "finish_reason",
54
+ "mapping": {
55
+ "stop": "end_turn",
56
+ "length": "max_tokens"
57
+ },
58
+ "notes": [
59
+ "Jina Reader uses finish_reason for completion",
60
+ "Embeddings API does not use finish_reason"
61
+ ]
62
+ },
63
+ "tooling": {
64
+ "source_model": "unknown",
65
+ "notes": [
66
+ "Jina AI is primarily embeddings and search",
67
+ "Does not support traditional tool calling"
68
+ ]
69
+ },
70
+ "retry_policy": {
71
+ "strategy": "exponential_backoff",
72
+ "max_retries": 3,
73
+ "max_delay_ms": 30000,
74
+ "min_delay_ms": 1000,
75
+ "jitter": "full",
76
+ "retry_on_http_status": [
77
+ 429,
78
+ 500,
79
+ 502,
80
+ 503
81
+ ],
82
+ "notes": [
83
+ "Jina API is generally fast but may experience spikes",
84
+ "Exponential backoff recommended for rate limits"
85
+ ]
86
+ },
87
+ "error_classification": {
88
+ "by_http_status": {
89
+ "400": "invalid_request",
90
+ "401": "authentication",
91
+ "403": "permission_denied",
92
+ "404": "not_found",
93
+ "429": "rate_limited",
94
+ "500": "server_error",
95
+ "502": "overloaded",
96
+ "503": "overloaded"
97
+ },
98
+ "notes": [
99
+ "Jina returns clear error messages in JSON format",
100
+ "Rate limit info included in error responses"
101
+ ]
102
+ },
103
+ "parameter_mappings": {
104
+ "model": "model",
105
+ "input": "input",
106
+ "encoding_format": "encoding_format",
107
+ "dimensions": "dimensions",
108
+ "top_n": "top_n",
109
+ "query": "query",
110
+ "documents": "documents",
111
+ "return_documents": "return_documents",
112
+ "url": "url",
113
+ "question": "question"
114
+ },
115
+ "response_format": "jina_style",
116
+ "response_paths": {
117
+ "content": "output",
118
+ "embedding": "data.embedding",
119
+ "data": "data",
120
+ "results": "results"
121
+ },
122
+ "streaming": {
123
+ "event_format": "jina_stream",
124
+ "decoder": {
125
+ "format": "sse",
126
+ "delimiter": "\n\n",
127
+ "prefix": "data: ",
128
+ "done_signal": "[DONE]"
129
+ },
130
+ "frame_selector": "exists($.delta) || exists($.embedding) || exists($.results)",
131
+ "event_map": [
132
+ {
133
+ "match": "exists($.delta)",
134
+ "emit": "PartialContentDelta",
135
+ "fields": {
136
+ "content": "$.delta.content"
137
+ }
138
+ },
139
+ {
140
+ "match": "exists($.embedding)",
141
+ "emit": "Metadata",
142
+ "fields": {
143
+ "embedding": "$.embedding",
144
+ "index": "$.index"
145
+ }
146
+ },
147
+ {
148
+ "match": "exists($.results)",
149
+ "emit": "FinalCandidate",
150
+ "fields": {
151
+ "results": "$.results"
152
+ }
153
+ }
154
+ ],
155
+ "stop_condition": "exists($.finish_reason) || exists($.results)",
156
+ "extra_metadata_path": "$.usage"
157
+ },
158
+ "features": {
159
+ "multi_candidate": {
160
+ "support_type": "native",
161
+ "param_name": "top_n"
162
+ },
163
+ "response_mapping": {
164
+ "error": {
165
+ "message_path": "message",
166
+ "code_path": "code",
167
+ "type_path": "error"
168
+ }
169
+ }
170
+ },
171
+ "capabilities": {
172
+ "streaming": false,
173
+ "tools": false,
174
+ "vision": false,
175
+ "agentic": false,
176
+ "parallel_tools": false,
177
+ "reasoning": false
178
+ },
179
+ "experimental_features": [
180
+ "rerank_api",
181
+ "reader_api",
182
+ "multimodal_embeddings",
183
+ "code_embeddings"
184
+ ],
185
+ "availability": {
186
+ "required": false,
187
+ "regions": [
188
+ "global"
189
+ ],
190
+ "check": {
191
+ "method": "GET",
192
+ "path": "/v1/models",
193
+ "expected_status": [
194
+ 200
195
+ ],
196
+ "timeout_ms": 3000
197
+ },
198
+ "notes": [
199
+ "Check v1/models endpoint to verify service health"
200
+ ]
201
+ }
202
+ }
@@ -0,0 +1,221 @@
1
+ {
2
+ "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
3
+ "id": "lepton",
4
+ "protocol_version": "1.5",
5
+ "name": "Lepton AI",
6
+ "version": "v1",
7
+ "status": "stable",
8
+ "category": "ai_provider",
9
+ "official_url": "https://www.lepton.ai/docs",
10
+ "support_contact": "https://www.lepton.ai/contact",
11
+ "endpoint": {
12
+ "base_url": "https://llama3-1-8b.lepton.run/api/v1",
13
+ "protocol": "https",
14
+ "timeout_ms": 30000
15
+ },
16
+ "base_url_template": "https://{model_id}.lepton.run/api/v1",
17
+ "auth": {
18
+ "type": "bearer",
19
+ "token_env": "LEPTON_API_TOKEN"
20
+ },
21
+ "payload_format": "openai_style",
22
+ "api_families": [
23
+ "chat_completions",
24
+ "completions"
25
+ ],
26
+ "default_api_family": "chat_completions",
27
+ "endpoints": {
28
+ "chat": {
29
+ "path": "/chat/completions",
30
+ "method": "POST",
31
+ "adapter": "openai"
32
+ },
33
+ "completions": {
34
+ "path": "/completions",
35
+ "method": "POST",
36
+ "adapter": "openai"
37
+ }
38
+ },
39
+ "services": {
40
+ "list_models": {
41
+ "path": "/models",
42
+ "method": "GET",
43
+ "response_binding": "data"
44
+ }
45
+ },
46
+ "termination": {
47
+ "source_field": "finish_reason",
48
+ "mapping": {
49
+ "stop": "end_turn",
50
+ "length": "max_tokens",
51
+ "tool_calls": "tool_use"
52
+ },
53
+ "notes": [
54
+ "OpenAI-compatible finish_reason."
55
+ ]
56
+ },
57
+ "tooling": {
58
+ "source_model": "openai_tool_calls",
59
+ "tool_use": {
60
+ "id_path": "id",
61
+ "name_path": "function.name",
62
+ "input_path": "function.arguments",
63
+ "input_format": "json_string"
64
+ },
65
+ "notes": [
66
+ "OpenAI-compatible tool calling for supported models."
67
+ ]
68
+ },
69
+ "retry_policy": {
70
+ "strategy": "exponential_backoff",
71
+ "max_retries": 3,
72
+ "min_delay_ms": 1000,
73
+ "max_delay_ms": 30000,
74
+ "jitter": "full",
75
+ "retry_on_http_status": [
76
+ 429,
77
+ 500,
78
+ 502,
79
+ 503
80
+ ],
81
+ "notes": [
82
+ "Standard exponential backoff for rate limits and transient errors."
83
+ ]
84
+ },
85
+ "error_classification": {
86
+ "by_http_status": {
87
+ "400": "invalid_request",
88
+ "401": "authentication",
89
+ "403": "permission_denied",
90
+ "404": "not_found",
91
+ "429": "rate_limited",
92
+ "500": "server_error",
93
+ "502": "server_error",
94
+ "503": "overloaded"
95
+ }
96
+ },
97
+ "parameter_mappings": {
98
+ "temperature": "temperature",
99
+ "max_tokens": "max_tokens",
100
+ "stream": "stream",
101
+ "top_p": "top_p",
102
+ "stop_sequences": "stop",
103
+ "frequency_penalty": "frequency_penalty",
104
+ "presence_penalty": "presence_penalty",
105
+ "tools": "tools",
106
+ "tool_choice": "tool_choice",
107
+ "seed": "seed",
108
+ "top_k": "top_k"
109
+ },
110
+ "response_format": "openai_style",
111
+ "response_paths": {
112
+ "content": "choices[0].message.content",
113
+ "tool_calls": "choices[0].message.tool_calls",
114
+ "usage": "usage",
115
+ "finish_reason": "choices[0].finish_reason"
116
+ },
117
+ "streaming": {
118
+ "event_format": "data_lines",
119
+ "decoder": {
120
+ "format": "sse",
121
+ "delimiter": "\n\n",
122
+ "prefix": "data: ",
123
+ "done_signal": "[DONE]"
124
+ },
125
+ "content_path": "choices[0].delta.content",
126
+ "tool_call_path": "choices[0].delta.tool_calls",
127
+ "usage_path": "usage",
128
+ "frame_selector": "exists($.choices) || exists($.error)",
129
+ "event_map": [
130
+ {
131
+ "match": "exists($.choices[*].delta.content)",
132
+ "emit": "PartialContentDelta",
133
+ "fields": {
134
+ "content": "$.choices[*].delta.content"
135
+ }
136
+ },
137
+ {
138
+ "match": "exists($.choices[*].delta.tool_calls[*].function.name)",
139
+ "emit": "ToolCallStarted",
140
+ "fields": {
141
+ "tool_call_id": "$.choices[*].delta.tool_calls[*].id",
142
+ "tool_name": "$.choices[*].delta.tool_calls[*].function.name",
143
+ "index": "$.choices[*].delta.tool_calls[*].index"
144
+ }
145
+ },
146
+ {
147
+ "match": "exists($.choices[*].delta.tool_calls[*].function.arguments)",
148
+ "emit": "PartialToolCall",
149
+ "fields": {
150
+ "arguments": "$.choices[*].delta.tool_calls[*].function.arguments",
151
+ "index": "$.choices[*].delta.tool_calls[*].index"
152
+ }
153
+ },
154
+ {
155
+ "match": "exists($.usage)",
156
+ "emit": "Metadata",
157
+ "fields": {
158
+ "usage": "$.usage"
159
+ }
160
+ },
161
+ {
162
+ "match": "exists($.choices[*].finish_reason)",
163
+ "emit": "FinalCandidate",
164
+ "fields": {
165
+ "finish_reason": "$.choices[*].finish_reason",
166
+ "candidate_index": "$.choices[*].index"
167
+ }
168
+ }
169
+ ],
170
+ "stop_condition": "$.choices[0].finish_reason != null"
171
+ },
172
+ "features": {
173
+ "multi_candidate": {
174
+ "support_type": "native",
175
+ "param_name": "n"
176
+ },
177
+ "response_mapping": {
178
+ "tool_calls": {
179
+ "path": "choices[0].message.tool_calls",
180
+ "fields": {
181
+ "id": "id",
182
+ "name": "function.name",
183
+ "args": "function.arguments"
184
+ }
185
+ },
186
+ "error": {
187
+ "message_path": "error.message",
188
+ "code_path": "error.code",
189
+ "type_path": "error.type"
190
+ }
191
+ }
192
+ },
193
+ "capabilities": {
194
+ "streaming": true,
195
+ "tools": true,
196
+ "vision": true,
197
+ "agentic": true,
198
+ "parallel_tools": true,
199
+ "reasoning": false
200
+ },
201
+ "availability": {
202
+ "required": false,
203
+ "regions": [
204
+ "global"
205
+ ],
206
+ "check": {
207
+ "method": "GET",
208
+ "path": "/models",
209
+ "expected_status": [
210
+ 200,
211
+ 401
212
+ ],
213
+ "timeout_ms": 5000
214
+ }
215
+ },
216
+ "experimental_features": [
217
+ "photon_deployment",
218
+ "auto_scaling",
219
+ "custom_models"
220
+ ]
221
+ }