@ailib-official/ai-protocol 0.8.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +6 -0
- package/README.md +415 -0
- package/dist/index.json +8 -0
- package/dist/v1/models/ai21.json +140 -0
- package/dist/v1/models/baichuan.json +138 -0
- package/dist/v1/models/cerebras.json +147 -0
- package/dist/v1/models/claude.json +114 -0
- package/dist/v1/models/cohere.json +235 -0
- package/dist/v1/models/deepinfra.json +43 -0
- package/dist/v1/models/deepseek-chat.json +55 -0
- package/dist/v1/models/doubao.json +197 -0
- package/dist/v1/models/ernie.json +223 -0
- package/dist/v1/models/fireworks.json +222 -0
- package/dist/v1/models/gemini.json +58 -0
- package/dist/v1/models/gpt.json +166 -0
- package/dist/v1/models/grok.json +138 -0
- package/dist/v1/models/huggingface.json +183 -0
- package/dist/v1/models/hunyuan.json +255 -0
- package/dist/v1/models/jina.json +139 -0
- package/dist/v1/models/lepton.json +188 -0
- package/dist/v1/models/llama.json +143 -0
- package/dist/v1/models/minimax.json +194 -0
- package/dist/v1/models/mistral.json +177 -0
- package/dist/v1/models/moonshot.json +144 -0
- package/dist/v1/models/nvidia.json +212 -0
- package/dist/v1/models/palmyra.json +103 -0
- package/dist/v1/models/perplexity.json +143 -0
- package/dist/v1/models/qwen.json +49 -0
- package/dist/v1/models/replicate.json +206 -0
- package/dist/v1/models/sensenova.json +144 -0
- package/dist/v1/models/siliconflow.json +44 -0
- package/dist/v1/models/spark.json +173 -0
- package/dist/v1/models/stable-diffusion.json +161 -0
- package/dist/v1/models/tiangong.json +169 -0
- package/dist/v1/models/together.json +43 -0
- package/dist/v1/models/yi.json +199 -0
- package/dist/v1/models/zhipu.json +250 -0
- package/dist/v1/providers/ai21.json +215 -0
- package/dist/v1/providers/anthropic.json +253 -0
- package/dist/v1/providers/anyscale.json +115 -0
- package/dist/v1/providers/azure.json +188 -0
- package/dist/v1/providers/baichuan.json +205 -0
- package/dist/v1/providers/baidu.json +205 -0
- package/dist/v1/providers/cerebras.json +216 -0
- package/dist/v1/providers/cohere.json +209 -0
- package/dist/v1/providers/deepinfra.json +196 -0
- package/dist/v1/providers/deepseek.json +221 -0
- package/dist/v1/providers/doubao.json +209 -0
- package/dist/v1/providers/fireworks.json +227 -0
- package/dist/v1/providers/gemini.json +279 -0
- package/dist/v1/providers/groq.json +218 -0
- package/dist/v1/providers/huggingface.json +181 -0
- package/dist/v1/providers/hunyuan.json +198 -0
- package/dist/v1/providers/jina.json +202 -0
- package/dist/v1/providers/lepton.json +221 -0
- package/dist/v1/providers/minimax.json +209 -0
- package/dist/v1/providers/mistral.json +214 -0
- package/dist/v1/providers/moonshot.json +214 -0
- package/dist/v1/providers/nvidia.json +213 -0
- package/dist/v1/providers/openai.json +267 -0
- package/dist/v1/providers/openrouter.json +220 -0
- package/dist/v1/providers/perplexity.json +172 -0
- package/dist/v1/providers/qwen.json +231 -0
- package/dist/v1/providers/replicate.json +192 -0
- package/dist/v1/providers/sensenova.json +185 -0
- package/dist/v1/providers/siliconflow.json +197 -0
- package/dist/v1/providers/spark.json +204 -0
- package/dist/v1/providers/stability.json +221 -0
- package/dist/v1/providers/tiangong.json +207 -0
- package/dist/v1/providers/together.json +196 -0
- package/dist/v1/providers/writer.json +253 -0
- package/dist/v1/providers/xai.json +238 -0
- package/dist/v1/providers/yi.json +205 -0
- package/dist/v1/providers/zhipu.json +208 -0
- package/dist/v1/spec.json +783 -0
- package/dist/v2/providers/anthropic.json +372 -0
- package/dist/v2/providers/cohere.json +109 -0
- package/dist/v2/providers/deepseek.json +272 -0
- package/dist/v2/providers/doubao.json +260 -0
- package/dist/v2/providers/google.json +388 -0
- package/dist/v2/providers/jina.json +71 -0
- package/dist/v2/providers/moonshot.json +284 -0
- package/dist/v2/providers/openai.json +419 -0
- package/dist/v2/providers/qwen.json +274 -0
- package/dist/v2/providers/zhipu.json +257 -0
- package/dist/v2-alpha/providers/anthropic.json +182 -0
- package/dist/v2-alpha/providers/gemini.json +187 -0
- package/dist/v2-alpha/providers/openai.json +215 -0
- package/dist/v2-alpha/spec.json +644 -0
- package/package.json +61 -0
- package/schemas/spec.json +186 -0
- package/schemas/v1.json +1116 -0
- package/schemas/v2/availability.json +66 -0
- package/schemas/v2/capabilities.json +182 -0
- package/schemas/v2/capability-profile.json +174 -0
- package/schemas/v2/computer-use.json +222 -0
- package/schemas/v2/context-policy.json +148 -0
- package/schemas/v2/endpoint.json +2 -0
- package/schemas/v2/error-codes.yaml +225 -0
- package/schemas/v2/errors.json +250 -0
- package/schemas/v2/execution-metadata.json +59 -0
- package/schemas/v2/mcp.json +225 -0
- package/schemas/v2/message-roles.json +10 -0
- package/schemas/v2/multimodal.json +297 -0
- package/schemas/v2/pricing.json +14 -0
- package/schemas/v2/provider-contract.json +317 -0
- package/schemas/v2/provider.json +203 -0
- package/schemas/v2/regions.json +14 -0
- package/v1/models/ai21.yaml +97 -0
- package/v1/models/baichuan.yaml +95 -0
- package/v1/models/cerebras.yaml +99 -0
- package/v1/models/claude.yaml +59 -0
- package/v1/models/cohere.yaml +165 -0
- package/v1/models/deepinfra.yaml +29 -0
- package/v1/models/deepseek-chat.yaml +32 -0
- package/v1/models/doubao.yaml +129 -0
- package/v1/models/ernie.yaml +146 -0
- package/v1/models/fireworks.yaml +145 -0
- package/v1/models/gemini.yaml +32 -0
- package/v1/models/gpt.yaml +90 -0
- package/v1/models/grok.yaml +74 -0
- package/v1/models/huggingface.yaml +110 -0
- package/v1/models/hunyuan.yaml +164 -0
- package/v1/models/jina.yaml +98 -0
- package/v1/models/lepton.yaml +130 -0
- package/v1/models/llama.yaml +91 -0
- package/v1/models/minimax.yaml +132 -0
- package/v1/models/mistral.yaml +100 -0
- package/v1/models/moonshot.yaml +97 -0
- package/v1/models/nvidia.yaml +118 -0
- package/v1/models/palmyra.yaml +59 -0
- package/v1/models/perplexity.yaml +97 -0
- package/v1/models/qwen.yaml +27 -0
- package/v1/models/replicate.yaml +136 -0
- package/v1/models/sensenova.yaml +97 -0
- package/v1/models/siliconflow.yaml +29 -0
- package/v1/models/spark.yaml +114 -0
- package/v1/models/stable-diffusion.yaml +113 -0
- package/v1/models/tiangong.yaml +114 -0
- package/v1/models/together.yaml +29 -0
- package/v1/models/yi.yaml +132 -0
- package/v1/models/zhipu.yaml +163 -0
- package/v1/providers/ai21.yaml +176 -0
- package/v1/providers/anthropic.yaml +209 -0
- package/v1/providers/anyscale.yaml +106 -0
- package/v1/providers/azure.yaml +155 -0
- package/v1/providers/baichuan.yaml +168 -0
- package/v1/providers/baidu.yaml +173 -0
- package/v1/providers/cerebras.yaml +178 -0
- package/v1/providers/cohere.yaml +175 -0
- package/v1/providers/deepinfra.yaml +156 -0
- package/v1/providers/deepseek.yaml +189 -0
- package/v1/providers/doubao.yaml +172 -0
- package/v1/providers/fireworks.yaml +187 -0
- package/v1/providers/gemini.yaml +229 -0
- package/v1/providers/groq.yaml +181 -0
- package/v1/providers/huggingface.yaml +157 -0
- package/v1/providers/hunyuan.yaml +162 -0
- package/v1/providers/jina.yaml +171 -0
- package/v1/providers/lepton.yaml +183 -0
- package/v1/providers/minimax.yaml +172 -0
- package/v1/providers/mistral.yaml +186 -0
- package/v1/providers/moonshot.yaml +176 -0
- package/v1/providers/nvidia.yaml +172 -0
- package/v1/providers/openai.yaml +224 -0
- package/v1/providers/openrouter.yaml +181 -0
- package/v1/providers/perplexity.yaml +144 -0
- package/v1/providers/qwen.yaml +192 -0
- package/v1/providers/replicate.yaml +159 -0
- package/v1/providers/sensenova.yaml +153 -0
- package/v1/providers/siliconflow.yaml +156 -0
- package/v1/providers/spark.yaml +167 -0
- package/v1/providers/stability.yaml +185 -0
- package/v1/providers/tiangong.yaml +170 -0
- package/v1/providers/together.yaml +156 -0
- package/v1/providers/writer.yaml +212 -0
- package/v1/providers/xai.yaml +206 -0
- package/v1/providers/yi.yaml +168 -0
- package/v1/providers/zhipu.yaml +171 -0
- package/v1/spec.yaml +637 -0
- package/v2/providers/anthropic.yaml +244 -0
- package/v2/providers/cohere.yaml +75 -0
- package/v2/providers/deepseek.yaml +176 -0
- package/v2/providers/doubao.yaml +169 -0
- package/v2/providers/google.yaml +245 -0
- package/v2/providers/jina.yaml +55 -0
- package/v2/providers/moonshot.yaml +186 -0
- package/v2/providers/openai.yaml +266 -0
- package/v2/providers/qwen.yaml +174 -0
- package/v2/providers/zhipu.yaml +176 -0
- package/v2-alpha/providers/anthropic.yaml +134 -0
- package/v2-alpha/providers/gemini.yaml +144 -0
- package/v2-alpha/providers/openai.yaml +154 -0
- package/v2-alpha/spec.yaml +512 -0
|
@@ -0,0 +1,198 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
|
|
3
|
+
"id": "hunyuan",
|
|
4
|
+
"protocol_version": "1.5",
|
|
5
|
+
"name": "腾讯混元 (Tencent Hunyuan)",
|
|
6
|
+
"version": "v1",
|
|
7
|
+
"status": "stable",
|
|
8
|
+
"category": "ai_provider",
|
|
9
|
+
"official_url": "https://cloud.tencent.com/document/product/1729",
|
|
10
|
+
"support_contact": "https://cloud.tencent.com/online-service",
|
|
11
|
+
"endpoint": {
|
|
12
|
+
"base_url": "https://hunyuan.tencentcloudapi.com",
|
|
13
|
+
"protocol": "https",
|
|
14
|
+
"timeout_ms": 60000
|
|
15
|
+
},
|
|
16
|
+
"auth": {
|
|
17
|
+
"type": "bearer",
|
|
18
|
+
"token_env": "HUNYUAN_API_KEY"
|
|
19
|
+
},
|
|
20
|
+
"payload_format": "openai_style",
|
|
21
|
+
"api_families": [
|
|
22
|
+
"chat_completions"
|
|
23
|
+
],
|
|
24
|
+
"default_api_family": "chat_completions",
|
|
25
|
+
"endpoints": {
|
|
26
|
+
"chat": {
|
|
27
|
+
"path": "/v1/chat/completions",
|
|
28
|
+
"method": "POST",
|
|
29
|
+
"adapter": "openai"
|
|
30
|
+
}
|
|
31
|
+
},
|
|
32
|
+
"termination": {
|
|
33
|
+
"source_field": "finish_reason",
|
|
34
|
+
"mapping": {
|
|
35
|
+
"stop": "end_turn",
|
|
36
|
+
"length": "max_tokens",
|
|
37
|
+
"tool_calls": "tool_use",
|
|
38
|
+
"sensitive": "refusal"
|
|
39
|
+
},
|
|
40
|
+
"notes": [
|
|
41
|
+
"OpenAI-compatible finish_reason.",
|
|
42
|
+
"混元大模型 (Hunyuan) is Tencent's flagship LLM."
|
|
43
|
+
]
|
|
44
|
+
},
|
|
45
|
+
"tooling": {
|
|
46
|
+
"source_model": "openai_tool_calls",
|
|
47
|
+
"tool_use": {
|
|
48
|
+
"id_path": "id",
|
|
49
|
+
"name_path": "function.name",
|
|
50
|
+
"input_path": "function.arguments",
|
|
51
|
+
"input_format": "json_string"
|
|
52
|
+
},
|
|
53
|
+
"notes": [
|
|
54
|
+
"Supports OpenAI-compatible function calling."
|
|
55
|
+
]
|
|
56
|
+
},
|
|
57
|
+
"retry_policy": {
|
|
58
|
+
"strategy": "exponential_backoff",
|
|
59
|
+
"max_retries": 3,
|
|
60
|
+
"min_delay_ms": 1000,
|
|
61
|
+
"max_delay_ms": 30000,
|
|
62
|
+
"jitter": "full",
|
|
63
|
+
"retry_on_http_status": [
|
|
64
|
+
429,
|
|
65
|
+
500,
|
|
66
|
+
502,
|
|
67
|
+
503
|
|
68
|
+
]
|
|
69
|
+
},
|
|
70
|
+
"error_classification": {
|
|
71
|
+
"by_http_status": {
|
|
72
|
+
"400": "invalid_request",
|
|
73
|
+
"401": "authentication",
|
|
74
|
+
"403": "permission_denied",
|
|
75
|
+
"404": "not_found",
|
|
76
|
+
"429": "rate_limited",
|
|
77
|
+
"500": "server_error",
|
|
78
|
+
"503": "overloaded"
|
|
79
|
+
}
|
|
80
|
+
},
|
|
81
|
+
"parameter_mappings": {
|
|
82
|
+
"temperature": "temperature",
|
|
83
|
+
"max_tokens": "max_tokens",
|
|
84
|
+
"stream": "stream",
|
|
85
|
+
"top_p": "top_p",
|
|
86
|
+
"tools": "tools",
|
|
87
|
+
"tool_choice": "tool_choice"
|
|
88
|
+
},
|
|
89
|
+
"response_format": "openai_style",
|
|
90
|
+
"response_paths": {
|
|
91
|
+
"content": "choices[0].message.content",
|
|
92
|
+
"tool_calls": "choices[0].message.tool_calls",
|
|
93
|
+
"usage": "usage",
|
|
94
|
+
"finish_reason": "choices[0].finish_reason"
|
|
95
|
+
},
|
|
96
|
+
"streaming": {
|
|
97
|
+
"event_format": "data_lines",
|
|
98
|
+
"decoder": {
|
|
99
|
+
"format": "sse",
|
|
100
|
+
"delimiter": "\n\n",
|
|
101
|
+
"prefix": "data: ",
|
|
102
|
+
"done_signal": "[DONE]"
|
|
103
|
+
},
|
|
104
|
+
"content_path": "choices[0].delta.content",
|
|
105
|
+
"tool_call_path": "choices[0].delta.tool_calls",
|
|
106
|
+
"usage_path": "usage",
|
|
107
|
+
"frame_selector": "exists($.choices) || exists($.error)",
|
|
108
|
+
"event_map": [
|
|
109
|
+
{
|
|
110
|
+
"match": "exists($.choices[*].delta.content)",
|
|
111
|
+
"emit": "PartialContentDelta",
|
|
112
|
+
"fields": {
|
|
113
|
+
"content": "$.choices[*].delta.content"
|
|
114
|
+
}
|
|
115
|
+
},
|
|
116
|
+
{
|
|
117
|
+
"match": "exists($.choices[*].delta.tool_calls[*].function.name)",
|
|
118
|
+
"emit": "ToolCallStarted",
|
|
119
|
+
"fields": {
|
|
120
|
+
"tool_call_id": "$.choices[*].delta.tool_calls[*].id",
|
|
121
|
+
"tool_name": "$.choices[*].delta.tool_calls[*].function.name",
|
|
122
|
+
"index": "$.choices[*].delta.tool_calls[*].index"
|
|
123
|
+
}
|
|
124
|
+
},
|
|
125
|
+
{
|
|
126
|
+
"match": "exists($.choices[*].delta.tool_calls[*].function.arguments)",
|
|
127
|
+
"emit": "PartialToolCall",
|
|
128
|
+
"fields": {
|
|
129
|
+
"arguments": "$.choices[*].delta.tool_calls[*].function.arguments",
|
|
130
|
+
"index": "$.choices[*].delta.tool_calls[*].index"
|
|
131
|
+
}
|
|
132
|
+
},
|
|
133
|
+
{
|
|
134
|
+
"match": "exists($.usage)",
|
|
135
|
+
"emit": "Metadata",
|
|
136
|
+
"fields": {
|
|
137
|
+
"usage": "$.usage"
|
|
138
|
+
}
|
|
139
|
+
},
|
|
140
|
+
{
|
|
141
|
+
"match": "exists($.choices[*].finish_reason)",
|
|
142
|
+
"emit": "FinalCandidate",
|
|
143
|
+
"fields": {
|
|
144
|
+
"finish_reason": "$.choices[*].finish_reason"
|
|
145
|
+
}
|
|
146
|
+
}
|
|
147
|
+
],
|
|
148
|
+
"stop_condition": "$.choices[0].finish_reason != null"
|
|
149
|
+
},
|
|
150
|
+
"features": {
|
|
151
|
+
"multi_candidate": {
|
|
152
|
+
"support_type": "native",
|
|
153
|
+
"param_name": "n"
|
|
154
|
+
},
|
|
155
|
+
"response_mapping": {
|
|
156
|
+
"tool_calls": {
|
|
157
|
+
"path": "choices[0].message.tool_calls",
|
|
158
|
+
"fields": {
|
|
159
|
+
"id": "id",
|
|
160
|
+
"name": "function.name",
|
|
161
|
+
"args": "function.arguments"
|
|
162
|
+
}
|
|
163
|
+
},
|
|
164
|
+
"error": {
|
|
165
|
+
"message_path": "error.message",
|
|
166
|
+
"code_path": "error.code"
|
|
167
|
+
}
|
|
168
|
+
}
|
|
169
|
+
},
|
|
170
|
+
"capabilities": {
|
|
171
|
+
"streaming": true,
|
|
172
|
+
"tools": true,
|
|
173
|
+
"vision": true,
|
|
174
|
+
"agentic": true,
|
|
175
|
+
"parallel_tools": true,
|
|
176
|
+
"reasoning": true
|
|
177
|
+
},
|
|
178
|
+
"availability": {
|
|
179
|
+
"required": false,
|
|
180
|
+
"regions": [
|
|
181
|
+
"cn"
|
|
182
|
+
],
|
|
183
|
+
"check": {
|
|
184
|
+
"method": "GET",
|
|
185
|
+
"path": "/v1/models",
|
|
186
|
+
"expected_status": [
|
|
187
|
+
200,
|
|
188
|
+
401
|
|
189
|
+
],
|
|
190
|
+
"timeout_ms": 5000
|
|
191
|
+
}
|
|
192
|
+
},
|
|
193
|
+
"experimental_features": [
|
|
194
|
+
"search_enhancement",
|
|
195
|
+
"image_understanding",
|
|
196
|
+
"role_play"
|
|
197
|
+
]
|
|
198
|
+
}
|
|
@@ -0,0 +1,202 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
|
|
3
|
+
"id": "jina",
|
|
4
|
+
"protocol_version": "1.5",
|
|
5
|
+
"name": "Jina AI",
|
|
6
|
+
"version": "v1",
|
|
7
|
+
"status": "stable",
|
|
8
|
+
"category": "ai_provider",
|
|
9
|
+
"official_url": "https://jina.ai/docs",
|
|
10
|
+
"support_contact": "https://jina.ai/contact",
|
|
11
|
+
"endpoint": {
|
|
12
|
+
"base_url": "https://api.jina.ai",
|
|
13
|
+
"protocol": "https",
|
|
14
|
+
"timeout_ms": 30000
|
|
15
|
+
},
|
|
16
|
+
"auth": {
|
|
17
|
+
"type": "bearer",
|
|
18
|
+
"token_env": "JINA_API_KEY",
|
|
19
|
+
"payload_format": "jina_api"
|
|
20
|
+
},
|
|
21
|
+
"api_families": [
|
|
22
|
+
"embeddings",
|
|
23
|
+
"rerank",
|
|
24
|
+
"reader",
|
|
25
|
+
"search"
|
|
26
|
+
],
|
|
27
|
+
"default_api_family": "embeddings",
|
|
28
|
+
"endpoints": {
|
|
29
|
+
"embeddings": {
|
|
30
|
+
"path": "/v1/embeddings",
|
|
31
|
+
"method": "POST",
|
|
32
|
+
"adapter": "openai"
|
|
33
|
+
},
|
|
34
|
+
"rerank": {
|
|
35
|
+
"path": "/v1/rerank",
|
|
36
|
+
"method": "POST",
|
|
37
|
+
"adapter": "jina"
|
|
38
|
+
},
|
|
39
|
+
"reader": {
|
|
40
|
+
"path": "/v1/reader",
|
|
41
|
+
"method": "POST",
|
|
42
|
+
"adapter": "jina"
|
|
43
|
+
}
|
|
44
|
+
},
|
|
45
|
+
"services": {
|
|
46
|
+
"list_models": {
|
|
47
|
+
"path": "/v1/models",
|
|
48
|
+
"method": "GET",
|
|
49
|
+
"response_binding": "data"
|
|
50
|
+
}
|
|
51
|
+
},
|
|
52
|
+
"termination": {
|
|
53
|
+
"source_field": "finish_reason",
|
|
54
|
+
"mapping": {
|
|
55
|
+
"stop": "end_turn",
|
|
56
|
+
"length": "max_tokens"
|
|
57
|
+
},
|
|
58
|
+
"notes": [
|
|
59
|
+
"Jina Reader uses finish_reason for completion",
|
|
60
|
+
"Embeddings API does not use finish_reason"
|
|
61
|
+
]
|
|
62
|
+
},
|
|
63
|
+
"tooling": {
|
|
64
|
+
"source_model": "unknown",
|
|
65
|
+
"notes": [
|
|
66
|
+
"Jina AI is primarily embeddings and search",
|
|
67
|
+
"Does not support traditional tool calling"
|
|
68
|
+
]
|
|
69
|
+
},
|
|
70
|
+
"retry_policy": {
|
|
71
|
+
"strategy": "exponential_backoff",
|
|
72
|
+
"max_retries": 3,
|
|
73
|
+
"max_delay_ms": 30000,
|
|
74
|
+
"min_delay_ms": 1000,
|
|
75
|
+
"jitter": "full",
|
|
76
|
+
"retry_on_http_status": [
|
|
77
|
+
429,
|
|
78
|
+
500,
|
|
79
|
+
502,
|
|
80
|
+
503
|
|
81
|
+
],
|
|
82
|
+
"notes": [
|
|
83
|
+
"Jina API is generally fast but may experience spikes",
|
|
84
|
+
"Exponential backoff recommended for rate limits"
|
|
85
|
+
]
|
|
86
|
+
},
|
|
87
|
+
"error_classification": {
|
|
88
|
+
"by_http_status": {
|
|
89
|
+
"400": "invalid_request",
|
|
90
|
+
"401": "authentication",
|
|
91
|
+
"403": "permission_denied",
|
|
92
|
+
"404": "not_found",
|
|
93
|
+
"429": "rate_limited",
|
|
94
|
+
"500": "server_error",
|
|
95
|
+
"502": "overloaded",
|
|
96
|
+
"503": "overloaded"
|
|
97
|
+
},
|
|
98
|
+
"notes": [
|
|
99
|
+
"Jina returns clear error messages in JSON format",
|
|
100
|
+
"Rate limit info included in error responses"
|
|
101
|
+
]
|
|
102
|
+
},
|
|
103
|
+
"parameter_mappings": {
|
|
104
|
+
"model": "model",
|
|
105
|
+
"input": "input",
|
|
106
|
+
"encoding_format": "encoding_format",
|
|
107
|
+
"dimensions": "dimensions",
|
|
108
|
+
"top_n": "top_n",
|
|
109
|
+
"query": "query",
|
|
110
|
+
"documents": "documents",
|
|
111
|
+
"return_documents": "return_documents",
|
|
112
|
+
"url": "url",
|
|
113
|
+
"question": "question"
|
|
114
|
+
},
|
|
115
|
+
"response_format": "jina_style",
|
|
116
|
+
"response_paths": {
|
|
117
|
+
"content": "output",
|
|
118
|
+
"embedding": "data.embedding",
|
|
119
|
+
"data": "data",
|
|
120
|
+
"results": "results"
|
|
121
|
+
},
|
|
122
|
+
"streaming": {
|
|
123
|
+
"event_format": "jina_stream",
|
|
124
|
+
"decoder": {
|
|
125
|
+
"format": "sse",
|
|
126
|
+
"delimiter": "\n\n",
|
|
127
|
+
"prefix": "data: ",
|
|
128
|
+
"done_signal": "[DONE]"
|
|
129
|
+
},
|
|
130
|
+
"frame_selector": "exists($.delta) || exists($.embedding) || exists($.results)",
|
|
131
|
+
"event_map": [
|
|
132
|
+
{
|
|
133
|
+
"match": "exists($.delta)",
|
|
134
|
+
"emit": "PartialContentDelta",
|
|
135
|
+
"fields": {
|
|
136
|
+
"content": "$.delta.content"
|
|
137
|
+
}
|
|
138
|
+
},
|
|
139
|
+
{
|
|
140
|
+
"match": "exists($.embedding)",
|
|
141
|
+
"emit": "Metadata",
|
|
142
|
+
"fields": {
|
|
143
|
+
"embedding": "$.embedding",
|
|
144
|
+
"index": "$.index"
|
|
145
|
+
}
|
|
146
|
+
},
|
|
147
|
+
{
|
|
148
|
+
"match": "exists($.results)",
|
|
149
|
+
"emit": "FinalCandidate",
|
|
150
|
+
"fields": {
|
|
151
|
+
"results": "$.results"
|
|
152
|
+
}
|
|
153
|
+
}
|
|
154
|
+
],
|
|
155
|
+
"stop_condition": "exists($.finish_reason) || exists($.results)",
|
|
156
|
+
"extra_metadata_path": "$.usage"
|
|
157
|
+
},
|
|
158
|
+
"features": {
|
|
159
|
+
"multi_candidate": {
|
|
160
|
+
"support_type": "native",
|
|
161
|
+
"param_name": "top_n"
|
|
162
|
+
},
|
|
163
|
+
"response_mapping": {
|
|
164
|
+
"error": {
|
|
165
|
+
"message_path": "message",
|
|
166
|
+
"code_path": "code",
|
|
167
|
+
"type_path": "error"
|
|
168
|
+
}
|
|
169
|
+
}
|
|
170
|
+
},
|
|
171
|
+
"capabilities": {
|
|
172
|
+
"streaming": false,
|
|
173
|
+
"tools": false,
|
|
174
|
+
"vision": false,
|
|
175
|
+
"agentic": false,
|
|
176
|
+
"parallel_tools": false,
|
|
177
|
+
"reasoning": false
|
|
178
|
+
},
|
|
179
|
+
"experimental_features": [
|
|
180
|
+
"rerank_api",
|
|
181
|
+
"reader_api",
|
|
182
|
+
"multimodal_embeddings",
|
|
183
|
+
"code_embeddings"
|
|
184
|
+
],
|
|
185
|
+
"availability": {
|
|
186
|
+
"required": false,
|
|
187
|
+
"regions": [
|
|
188
|
+
"global"
|
|
189
|
+
],
|
|
190
|
+
"check": {
|
|
191
|
+
"method": "GET",
|
|
192
|
+
"path": "/v1/models",
|
|
193
|
+
"expected_status": [
|
|
194
|
+
200
|
|
195
|
+
],
|
|
196
|
+
"timeout_ms": 3000
|
|
197
|
+
},
|
|
198
|
+
"notes": [
|
|
199
|
+
"Check v1/models endpoint to verify service health"
|
|
200
|
+
]
|
|
201
|
+
}
|
|
202
|
+
}
|
|
@@ -0,0 +1,221 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
|
|
3
|
+
"id": "lepton",
|
|
4
|
+
"protocol_version": "1.5",
|
|
5
|
+
"name": "Lepton AI",
|
|
6
|
+
"version": "v1",
|
|
7
|
+
"status": "stable",
|
|
8
|
+
"category": "ai_provider",
|
|
9
|
+
"official_url": "https://www.lepton.ai/docs",
|
|
10
|
+
"support_contact": "https://www.lepton.ai/contact",
|
|
11
|
+
"endpoint": {
|
|
12
|
+
"base_url": "https://llama3-1-8b.lepton.run/api/v1",
|
|
13
|
+
"protocol": "https",
|
|
14
|
+
"timeout_ms": 30000
|
|
15
|
+
},
|
|
16
|
+
"base_url_template": "https://{model_id}.lepton.run/api/v1",
|
|
17
|
+
"auth": {
|
|
18
|
+
"type": "bearer",
|
|
19
|
+
"token_env": "LEPTON_API_TOKEN"
|
|
20
|
+
},
|
|
21
|
+
"payload_format": "openai_style",
|
|
22
|
+
"api_families": [
|
|
23
|
+
"chat_completions",
|
|
24
|
+
"completions"
|
|
25
|
+
],
|
|
26
|
+
"default_api_family": "chat_completions",
|
|
27
|
+
"endpoints": {
|
|
28
|
+
"chat": {
|
|
29
|
+
"path": "/chat/completions",
|
|
30
|
+
"method": "POST",
|
|
31
|
+
"adapter": "openai"
|
|
32
|
+
},
|
|
33
|
+
"completions": {
|
|
34
|
+
"path": "/completions",
|
|
35
|
+
"method": "POST",
|
|
36
|
+
"adapter": "openai"
|
|
37
|
+
}
|
|
38
|
+
},
|
|
39
|
+
"services": {
|
|
40
|
+
"list_models": {
|
|
41
|
+
"path": "/models",
|
|
42
|
+
"method": "GET",
|
|
43
|
+
"response_binding": "data"
|
|
44
|
+
}
|
|
45
|
+
},
|
|
46
|
+
"termination": {
|
|
47
|
+
"source_field": "finish_reason",
|
|
48
|
+
"mapping": {
|
|
49
|
+
"stop": "end_turn",
|
|
50
|
+
"length": "max_tokens",
|
|
51
|
+
"tool_calls": "tool_use"
|
|
52
|
+
},
|
|
53
|
+
"notes": [
|
|
54
|
+
"OpenAI-compatible finish_reason."
|
|
55
|
+
]
|
|
56
|
+
},
|
|
57
|
+
"tooling": {
|
|
58
|
+
"source_model": "openai_tool_calls",
|
|
59
|
+
"tool_use": {
|
|
60
|
+
"id_path": "id",
|
|
61
|
+
"name_path": "function.name",
|
|
62
|
+
"input_path": "function.arguments",
|
|
63
|
+
"input_format": "json_string"
|
|
64
|
+
},
|
|
65
|
+
"notes": [
|
|
66
|
+
"OpenAI-compatible tool calling for supported models."
|
|
67
|
+
]
|
|
68
|
+
},
|
|
69
|
+
"retry_policy": {
|
|
70
|
+
"strategy": "exponential_backoff",
|
|
71
|
+
"max_retries": 3,
|
|
72
|
+
"min_delay_ms": 1000,
|
|
73
|
+
"max_delay_ms": 30000,
|
|
74
|
+
"jitter": "full",
|
|
75
|
+
"retry_on_http_status": [
|
|
76
|
+
429,
|
|
77
|
+
500,
|
|
78
|
+
502,
|
|
79
|
+
503
|
|
80
|
+
],
|
|
81
|
+
"notes": [
|
|
82
|
+
"Standard exponential backoff for rate limits and transient errors."
|
|
83
|
+
]
|
|
84
|
+
},
|
|
85
|
+
"error_classification": {
|
|
86
|
+
"by_http_status": {
|
|
87
|
+
"400": "invalid_request",
|
|
88
|
+
"401": "authentication",
|
|
89
|
+
"403": "permission_denied",
|
|
90
|
+
"404": "not_found",
|
|
91
|
+
"429": "rate_limited",
|
|
92
|
+
"500": "server_error",
|
|
93
|
+
"502": "server_error",
|
|
94
|
+
"503": "overloaded"
|
|
95
|
+
}
|
|
96
|
+
},
|
|
97
|
+
"parameter_mappings": {
|
|
98
|
+
"temperature": "temperature",
|
|
99
|
+
"max_tokens": "max_tokens",
|
|
100
|
+
"stream": "stream",
|
|
101
|
+
"top_p": "top_p",
|
|
102
|
+
"stop_sequences": "stop",
|
|
103
|
+
"frequency_penalty": "frequency_penalty",
|
|
104
|
+
"presence_penalty": "presence_penalty",
|
|
105
|
+
"tools": "tools",
|
|
106
|
+
"tool_choice": "tool_choice",
|
|
107
|
+
"seed": "seed",
|
|
108
|
+
"top_k": "top_k"
|
|
109
|
+
},
|
|
110
|
+
"response_format": "openai_style",
|
|
111
|
+
"response_paths": {
|
|
112
|
+
"content": "choices[0].message.content",
|
|
113
|
+
"tool_calls": "choices[0].message.tool_calls",
|
|
114
|
+
"usage": "usage",
|
|
115
|
+
"finish_reason": "choices[0].finish_reason"
|
|
116
|
+
},
|
|
117
|
+
"streaming": {
|
|
118
|
+
"event_format": "data_lines",
|
|
119
|
+
"decoder": {
|
|
120
|
+
"format": "sse",
|
|
121
|
+
"delimiter": "\n\n",
|
|
122
|
+
"prefix": "data: ",
|
|
123
|
+
"done_signal": "[DONE]"
|
|
124
|
+
},
|
|
125
|
+
"content_path": "choices[0].delta.content",
|
|
126
|
+
"tool_call_path": "choices[0].delta.tool_calls",
|
|
127
|
+
"usage_path": "usage",
|
|
128
|
+
"frame_selector": "exists($.choices) || exists($.error)",
|
|
129
|
+
"event_map": [
|
|
130
|
+
{
|
|
131
|
+
"match": "exists($.choices[*].delta.content)",
|
|
132
|
+
"emit": "PartialContentDelta",
|
|
133
|
+
"fields": {
|
|
134
|
+
"content": "$.choices[*].delta.content"
|
|
135
|
+
}
|
|
136
|
+
},
|
|
137
|
+
{
|
|
138
|
+
"match": "exists($.choices[*].delta.tool_calls[*].function.name)",
|
|
139
|
+
"emit": "ToolCallStarted",
|
|
140
|
+
"fields": {
|
|
141
|
+
"tool_call_id": "$.choices[*].delta.tool_calls[*].id",
|
|
142
|
+
"tool_name": "$.choices[*].delta.tool_calls[*].function.name",
|
|
143
|
+
"index": "$.choices[*].delta.tool_calls[*].index"
|
|
144
|
+
}
|
|
145
|
+
},
|
|
146
|
+
{
|
|
147
|
+
"match": "exists($.choices[*].delta.tool_calls[*].function.arguments)",
|
|
148
|
+
"emit": "PartialToolCall",
|
|
149
|
+
"fields": {
|
|
150
|
+
"arguments": "$.choices[*].delta.tool_calls[*].function.arguments",
|
|
151
|
+
"index": "$.choices[*].delta.tool_calls[*].index"
|
|
152
|
+
}
|
|
153
|
+
},
|
|
154
|
+
{
|
|
155
|
+
"match": "exists($.usage)",
|
|
156
|
+
"emit": "Metadata",
|
|
157
|
+
"fields": {
|
|
158
|
+
"usage": "$.usage"
|
|
159
|
+
}
|
|
160
|
+
},
|
|
161
|
+
{
|
|
162
|
+
"match": "exists($.choices[*].finish_reason)",
|
|
163
|
+
"emit": "FinalCandidate",
|
|
164
|
+
"fields": {
|
|
165
|
+
"finish_reason": "$.choices[*].finish_reason",
|
|
166
|
+
"candidate_index": "$.choices[*].index"
|
|
167
|
+
}
|
|
168
|
+
}
|
|
169
|
+
],
|
|
170
|
+
"stop_condition": "$.choices[0].finish_reason != null"
|
|
171
|
+
},
|
|
172
|
+
"features": {
|
|
173
|
+
"multi_candidate": {
|
|
174
|
+
"support_type": "native",
|
|
175
|
+
"param_name": "n"
|
|
176
|
+
},
|
|
177
|
+
"response_mapping": {
|
|
178
|
+
"tool_calls": {
|
|
179
|
+
"path": "choices[0].message.tool_calls",
|
|
180
|
+
"fields": {
|
|
181
|
+
"id": "id",
|
|
182
|
+
"name": "function.name",
|
|
183
|
+
"args": "function.arguments"
|
|
184
|
+
}
|
|
185
|
+
},
|
|
186
|
+
"error": {
|
|
187
|
+
"message_path": "error.message",
|
|
188
|
+
"code_path": "error.code",
|
|
189
|
+
"type_path": "error.type"
|
|
190
|
+
}
|
|
191
|
+
}
|
|
192
|
+
},
|
|
193
|
+
"capabilities": {
|
|
194
|
+
"streaming": true,
|
|
195
|
+
"tools": true,
|
|
196
|
+
"vision": true,
|
|
197
|
+
"agentic": true,
|
|
198
|
+
"parallel_tools": true,
|
|
199
|
+
"reasoning": false
|
|
200
|
+
},
|
|
201
|
+
"availability": {
|
|
202
|
+
"required": false,
|
|
203
|
+
"regions": [
|
|
204
|
+
"global"
|
|
205
|
+
],
|
|
206
|
+
"check": {
|
|
207
|
+
"method": "GET",
|
|
208
|
+
"path": "/models",
|
|
209
|
+
"expected_status": [
|
|
210
|
+
200,
|
|
211
|
+
401
|
|
212
|
+
],
|
|
213
|
+
"timeout_ms": 5000
|
|
214
|
+
}
|
|
215
|
+
},
|
|
216
|
+
"experimental_features": [
|
|
217
|
+
"photon_deployment",
|
|
218
|
+
"auto_scaling",
|
|
219
|
+
"custom_models"
|
|
220
|
+
]
|
|
221
|
+
}
|