npm - @ailib-official/ai-protocol - Versions diffs - 0.8.4 - Mend

@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (194) hide show

package/LICENSE +6 -0
package/README.md +415 -0
package/dist/index.json +8 -0
package/dist/v1/models/ai21.json +140 -0
package/dist/v1/models/baichuan.json +138 -0
package/dist/v1/models/cerebras.json +147 -0
package/dist/v1/models/claude.json +114 -0
package/dist/v1/models/cohere.json +235 -0
package/dist/v1/models/deepinfra.json +43 -0
package/dist/v1/models/deepseek-chat.json +55 -0
package/dist/v1/models/doubao.json +197 -0
package/dist/v1/models/ernie.json +223 -0
package/dist/v1/models/fireworks.json +222 -0
package/dist/v1/models/gemini.json +58 -0
package/dist/v1/models/gpt.json +166 -0
package/dist/v1/models/grok.json +138 -0
package/dist/v1/models/huggingface.json +183 -0
package/dist/v1/models/hunyuan.json +255 -0
package/dist/v1/models/jina.json +139 -0
package/dist/v1/models/lepton.json +188 -0
package/dist/v1/models/llama.json +143 -0
package/dist/v1/models/minimax.json +194 -0
package/dist/v1/models/mistral.json +177 -0
package/dist/v1/models/moonshot.json +144 -0
package/dist/v1/models/nvidia.json +212 -0
package/dist/v1/models/palmyra.json +103 -0
package/dist/v1/models/perplexity.json +143 -0
package/dist/v1/models/qwen.json +49 -0
package/dist/v1/models/replicate.json +206 -0
package/dist/v1/models/sensenova.json +144 -0
package/dist/v1/models/siliconflow.json +44 -0
package/dist/v1/models/spark.json +173 -0
package/dist/v1/models/stable-diffusion.json +161 -0
package/dist/v1/models/tiangong.json +169 -0
package/dist/v1/models/together.json +43 -0
package/dist/v1/models/yi.json +199 -0
package/dist/v1/models/zhipu.json +250 -0
package/dist/v1/providers/ai21.json +215 -0
package/dist/v1/providers/anthropic.json +253 -0
package/dist/v1/providers/anyscale.json +115 -0
package/dist/v1/providers/azure.json +188 -0
package/dist/v1/providers/baichuan.json +205 -0
package/dist/v1/providers/baidu.json +205 -0
package/dist/v1/providers/cerebras.json +216 -0
package/dist/v1/providers/cohere.json +209 -0
package/dist/v1/providers/deepinfra.json +196 -0
package/dist/v1/providers/deepseek.json +221 -0
package/dist/v1/providers/doubao.json +209 -0
package/dist/v1/providers/fireworks.json +227 -0
package/dist/v1/providers/gemini.json +279 -0
package/dist/v1/providers/groq.json +218 -0
package/dist/v1/providers/huggingface.json +181 -0
package/dist/v1/providers/hunyuan.json +198 -0
package/dist/v1/providers/jina.json +202 -0
package/dist/v1/providers/lepton.json +221 -0
package/dist/v1/providers/minimax.json +209 -0
package/dist/v1/providers/mistral.json +214 -0
package/dist/v1/providers/moonshot.json +214 -0
package/dist/v1/providers/nvidia.json +213 -0
package/dist/v1/providers/openai.json +267 -0
package/dist/v1/providers/openrouter.json +220 -0
package/dist/v1/providers/perplexity.json +172 -0
package/dist/v1/providers/qwen.json +231 -0
package/dist/v1/providers/replicate.json +192 -0
package/dist/v1/providers/sensenova.json +185 -0
package/dist/v1/providers/siliconflow.json +197 -0
package/dist/v1/providers/spark.json +204 -0
package/dist/v1/providers/stability.json +221 -0
package/dist/v1/providers/tiangong.json +207 -0
package/dist/v1/providers/together.json +196 -0
package/dist/v1/providers/writer.json +253 -0
package/dist/v1/providers/xai.json +238 -0
package/dist/v1/providers/yi.json +205 -0
package/dist/v1/providers/zhipu.json +208 -0
package/dist/v1/spec.json +783 -0
package/dist/v2/providers/anthropic.json +372 -0
package/dist/v2/providers/cohere.json +109 -0
package/dist/v2/providers/deepseek.json +272 -0
package/dist/v2/providers/doubao.json +260 -0
package/dist/v2/providers/google.json +388 -0
package/dist/v2/providers/jina.json +71 -0
package/dist/v2/providers/moonshot.json +284 -0
package/dist/v2/providers/openai.json +419 -0
package/dist/v2/providers/qwen.json +274 -0
package/dist/v2/providers/zhipu.json +257 -0
package/dist/v2-alpha/providers/anthropic.json +182 -0
package/dist/v2-alpha/providers/gemini.json +187 -0
package/dist/v2-alpha/providers/openai.json +215 -0
package/dist/v2-alpha/spec.json +644 -0
package/package.json +61 -0
package/schemas/spec.json +186 -0
package/schemas/v1.json +1116 -0
package/schemas/v2/availability.json +66 -0
package/schemas/v2/capabilities.json +182 -0
package/schemas/v2/capability-profile.json +174 -0
package/schemas/v2/computer-use.json +222 -0
package/schemas/v2/context-policy.json +148 -0
package/schemas/v2/endpoint.json +2 -0
package/schemas/v2/error-codes.yaml +225 -0
package/schemas/v2/errors.json +250 -0
package/schemas/v2/execution-metadata.json +59 -0
package/schemas/v2/mcp.json +225 -0
package/schemas/v2/message-roles.json +10 -0
package/schemas/v2/multimodal.json +297 -0
package/schemas/v2/pricing.json +14 -0
package/schemas/v2/provider-contract.json +317 -0
package/schemas/v2/provider.json +203 -0
package/schemas/v2/regions.json +14 -0
package/v1/models/ai21.yaml +97 -0
package/v1/models/baichuan.yaml +95 -0
package/v1/models/cerebras.yaml +99 -0
package/v1/models/claude.yaml +59 -0
package/v1/models/cohere.yaml +165 -0
package/v1/models/deepinfra.yaml +29 -0
package/v1/models/deepseek-chat.yaml +32 -0
package/v1/models/doubao.yaml +129 -0
package/v1/models/ernie.yaml +146 -0
package/v1/models/fireworks.yaml +145 -0
package/v1/models/gemini.yaml +32 -0
package/v1/models/gpt.yaml +90 -0
package/v1/models/grok.yaml +74 -0
package/v1/models/huggingface.yaml +110 -0
package/v1/models/hunyuan.yaml +164 -0
package/v1/models/jina.yaml +98 -0
package/v1/models/lepton.yaml +130 -0
package/v1/models/llama.yaml +91 -0
package/v1/models/minimax.yaml +132 -0
package/v1/models/mistral.yaml +100 -0
package/v1/models/moonshot.yaml +97 -0
package/v1/models/nvidia.yaml +118 -0
package/v1/models/palmyra.yaml +59 -0
package/v1/models/perplexity.yaml +97 -0
package/v1/models/qwen.yaml +27 -0
package/v1/models/replicate.yaml +136 -0
package/v1/models/sensenova.yaml +97 -0
package/v1/models/siliconflow.yaml +29 -0
package/v1/models/spark.yaml +114 -0
package/v1/models/stable-diffusion.yaml +113 -0
package/v1/models/tiangong.yaml +114 -0
package/v1/models/together.yaml +29 -0
package/v1/models/yi.yaml +132 -0
package/v1/models/zhipu.yaml +163 -0
package/v1/providers/ai21.yaml +176 -0
package/v1/providers/anthropic.yaml +209 -0
package/v1/providers/anyscale.yaml +106 -0
package/v1/providers/azure.yaml +155 -0
package/v1/providers/baichuan.yaml +168 -0
package/v1/providers/baidu.yaml +173 -0
package/v1/providers/cerebras.yaml +178 -0
package/v1/providers/cohere.yaml +175 -0
package/v1/providers/deepinfra.yaml +156 -0
package/v1/providers/deepseek.yaml +189 -0
package/v1/providers/doubao.yaml +172 -0
package/v1/providers/fireworks.yaml +187 -0
package/v1/providers/gemini.yaml +229 -0
package/v1/providers/groq.yaml +181 -0
package/v1/providers/huggingface.yaml +157 -0
package/v1/providers/hunyuan.yaml +162 -0
package/v1/providers/jina.yaml +171 -0
package/v1/providers/lepton.yaml +183 -0
package/v1/providers/minimax.yaml +172 -0
package/v1/providers/mistral.yaml +186 -0
package/v1/providers/moonshot.yaml +176 -0
package/v1/providers/nvidia.yaml +172 -0
package/v1/providers/openai.yaml +224 -0
package/v1/providers/openrouter.yaml +181 -0
package/v1/providers/perplexity.yaml +144 -0
package/v1/providers/qwen.yaml +192 -0
package/v1/providers/replicate.yaml +159 -0
package/v1/providers/sensenova.yaml +153 -0
package/v1/providers/siliconflow.yaml +156 -0
package/v1/providers/spark.yaml +167 -0
package/v1/providers/stability.yaml +185 -0
package/v1/providers/tiangong.yaml +170 -0
package/v1/providers/together.yaml +156 -0
package/v1/providers/writer.yaml +212 -0
package/v1/providers/xai.yaml +206 -0
package/v1/providers/yi.yaml +168 -0
package/v1/providers/zhipu.yaml +171 -0
package/v1/spec.yaml +637 -0
package/v2/providers/anthropic.yaml +244 -0
package/v2/providers/cohere.yaml +75 -0
package/v2/providers/deepseek.yaml +176 -0
package/v2/providers/doubao.yaml +169 -0
package/v2/providers/google.yaml +245 -0
package/v2/providers/jina.yaml +55 -0
package/v2/providers/moonshot.yaml +186 -0
package/v2/providers/openai.yaml +266 -0
package/v2/providers/qwen.yaml +174 -0
package/v2/providers/zhipu.yaml +176 -0
package/v2-alpha/providers/anthropic.yaml +134 -0
package/v2-alpha/providers/gemini.yaml +144 -0
package/v2-alpha/providers/openai.yaml +154 -0
package/v2-alpha/spec.yaml +512 -0

package/v1/providers/minimax.yaml ADDED Viewed

@@ -0,0 +1,172 @@
+# MiniMax provider manifest: connection settings, OpenAI-style request and
+# response mappings, SSE stream decoding rules, and declared capabilities.
+$schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
+id: minimax
+protocol_version: "1.5"
+name: MiniMax
+version: "v1"
+status: stable
+category: ai_provider
+official_url: "https://platform.minimaxi.com/document/ChatCompletion%20v2"
+support_contact: "https://www.minimaxi.com/contact"
+# Connection settings; timeout_ms is expressed in milliseconds (60000 = 60 s).
+endpoint:
+  base_url: "https://api.minimax.chat/v1"
+  protocol: https
+  timeout_ms: 60000
+# Bearer auth; token_env names the environment variable expected to hold the
+# API key (presumably read by the runtime - confirm against the consumer).
+auth:
+  type: bearer
+  token_env: "MINIMAX_API_KEY"
+payload_format: "openai_style"
+# MiniMax uses OpenAI-compatible API
+api_families: ["chat_completions"]
+default_api_family: "chat_completions"
+# Operation endpoints; only "chat" is declared for this provider.
+endpoints:
+  chat:
+    path: "/chat/completions"
+    method: "POST"
+    adapter: "openai"
+# Auxiliary service endpoints.
+services:
+  list_models:
+    path: "/models"
+    method: "GET"
+    response_binding: "data"
+# Termination normalization: provider finish_reason value (key) mapped to the
+# normalized termination reason (value).
+termination:
+  source_field: "finish_reason"
+  mapping:
+    stop: "end_turn"
+    length: "max_tokens"
+    tool_calls: "tool_use"
+    content_filter: "refusal"
+  notes:
+    - "OpenAI-compatible finish_reason."
+    - "MiniMax is a leading Chinese AI company known for abab model series."
+# Tool-call normalization; arguments are declared as a JSON-encoded string.
+tooling:
+  source_model: "openai_tool_calls"
+  tool_use:
+    id_path: "id"
+    name_path: "function.name"
+    input_path: "function.arguments"
+    input_format: "json_string"
+  notes:
+    - "Supports OpenAI-compatible function calling."
+# Retry settings; delays are in milliseconds (1 s minimum, 30 s maximum).
+retry_policy:
+  strategy: "exponential_backoff"
+  max_retries: 3
+  min_delay_ms: 1000
+  max_delay_ms: 30000
+  jitter: "full"
+  retry_on_http_status: [429, 500, 502, 503]
+# HTTP status to error class. Keys are quoted so they stay strings rather
+# than being parsed as integers.
+error_classification:
+  by_http_status:
+    "400": "invalid_request"
+    "401": "authentication"
+    "403": "permission_denied"
+    "404": "not_found"
+    "429": "rate_limited"
+    "500": "server_error"
+    "503": "overloaded"
+# Protocol parameter name (key) to provider request field (value).
+parameter_mappings:
+  temperature: "temperature"
+  max_tokens: "max_tokens"
+  stream: "stream"
+  top_p: "top_p"
+  stop_sequences: "stop"
+  tools: "tools"
+  tool_choice: "tool_choice"
+  n: "n"
+response_format: "openai_style"
+# Paths into a non-streaming response body.
+response_paths:
+  content: "choices[0].message.content"
+  tool_calls: "choices[0].message.tool_calls"
+  usage: "usage"
+  finish_reason: "choices[0].finish_reason"
+# Streaming: SSE frames prefixed with "data: ", separated by a blank line,
+# with "[DONE]" as the end-of-stream signal.
+streaming:
+  event_format: "data_lines"
+  decoder:
+    format: "sse"
+    delimiter: "\n\n"
+    prefix: "data: "
+    done_signal: "[DONE]"
+  content_path: "choices[0].delta.content"
+  tool_call_path: "choices[0].delta.tool_calls"
+  usage_path: "usage"
+  frame_selector: "exists($.choices) || exists($.error)"
+  # Each rule pairs a match expression with the event to emit and the fields
+  # to extract from the frame.
+  event_map:
+    - match: "exists($.choices[*].delta.content)"
+      emit: "PartialContentDelta"
+      fields:
+        content: "$.choices[*].delta.content"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
+      emit: "ToolCallStarted"
+      fields:
+        tool_call_id: "$.choices[*].delta.tool_calls[*].id"
+        tool_name: "$.choices[*].delta.tool_calls[*].function.name"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
+      emit: "PartialToolCall"
+      fields:
+        arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.usage)"
+      emit: "Metadata"
+      fields:
+        usage: "$.usage"
+    - match: "exists($.choices[*].finish_reason)"
+      emit: "FinalCandidate"
+      fields:
+        finish_reason: "$.choices[*].finish_reason"
+        # Identifies which choice finished; needed because multi_candidate
+        # ("n") is declared as natively supported under features.
+        candidate_index: "$.choices[*].index"
+  stop_condition: "$.choices[0].finish_reason != null"
+features:
+  multi_candidate:
+    support_type: "native"
+    param_name: "n"
+  response_mapping:
+    tool_calls:
+      path: "choices[0].message.tool_calls"
+      fields:
+        id: "id"
+        name: "function.name"
+        args: "function.arguments"
+    error:
+      message_path: "error.message"
+      code_path: "error.code"
+      type_path: "error.type"
+# Declared capability flags.
+capabilities:
+  streaming: true
+  tools: true
+  vision: true
+  agentic: true
+  parallel_tools: true
+  reasoning: false
+# Availability probe: GET /models with a 5 s timeout. 401 is listed as an
+# expected status alongside 200 (presumably so an unauthenticated probe still
+# counts as reachable - confirm against the runtime).
+availability:
+  required: false
+  regions:
+    - cn
+    - global
+  check:
+    method: GET
+    path: "/models"
+    expected_status: [200, 401]
+    timeout_ms: 5000
+experimental_features:
+  - "voice_synthesis"
+  - "music_generation"
+  - "video_generation"

package/v1/providers/mistral.yaml ADDED Viewed

@@ -0,0 +1,186 @@
+# Mistral AI provider manifest: connection settings, OpenAI-style request and
+# response mappings, SSE stream decoding rules, and declared capabilities.
+$schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
+id: mistral
+protocol_version: "1.5"
+name: Mistral AI
+version: "v1"
+status: stable
+category: ai_provider
+official_url: "https://docs.mistral.ai"
+support_contact: "https://mistral.ai/contact"
+# Connection settings; timeout_ms is expressed in milliseconds (10000 = 10 s).
+# NOTE(review): 10 s is short for long chat completions - confirm it is intended.
+endpoint:
+  base_url: "https://api.mistral.ai/v1"
+  protocol: https
+  timeout_ms: 10000
+# Bearer auth; token_env names the environment variable expected to hold the
+# API key (presumably read by the runtime - confirm against the consumer).
+auth:
+  type: bearer
+  token_env: "MISTRAL_API_KEY"
+payload_format: "openai_style"
+# OpenAI-compatible API families
+api_families: ["chat_completions"]
+default_api_family: "chat_completions"
+endpoints:
+  # Runtime uses UnifiedRequest.operation (currently "chat") to resolve endpoints.
+  # Keep keys aligned with runtime expectations.
+  chat:
+    path: "/chat/completions"
+    method: "POST"
+    adapter: "openai"
+# Optional service endpoints (OpenAI-compatible).
+services:
+  list_models:
+    path: "/models"
+    method: "GET"
+    response_binding: "data"
+# Termination reason normalization (see v1/spec.yaml: standard_schema.streaming_events.termination_reasons)
+termination:
+  source_field: "finish_reason"
+  mapping:
+    stop: "end_turn"
+    length: "max_tokens"
+    tool_calls: "tool_use"
+    content_filter: "refusal"
+  notes:
+    - "OpenAI-compatible: finish_reason is reported per candidate."
+# Tool invocation normalization (see v1/spec.yaml: standard_schema.content_blocks)
+tooling:
+  source_model: "openai_tool_calls"
+  tool_use:
+    id_path: "id"
+    name_path: "function.name"
+    input_path: "function.arguments"
+    input_format: "json_string"
+  notes:
+    - "OpenAI-compatible tool_calls.function.arguments is typically a JSON string; runtimes SHOULD parse it into an object when normalizing."
+# Rate limits (Mistral uses standard HTTP headers)
+# Note: Mistral may use different header names, but we follow OpenAI-compatible pattern
+rate_limit_headers:
+  requests_limit: "x-ratelimit-limit-requests"
+  requests_remaining: "x-ratelimit-remaining-requests"
+  requests_reset: "x-ratelimit-reset-requests"
+  tokens_limit: "x-ratelimit-limit-tokens"
+  tokens_remaining: "x-ratelimit-remaining-tokens"
+  tokens_reset: "x-ratelimit-reset-tokens"
+  retry_after: "retry-after"
+# Retry policy (OpenAI-compatible guidance: exponential backoff for 429; retry 5xx after brief wait)
+# Delays are in milliseconds (1 s minimum, 30 s maximum).
+retry_policy:
+  max_retries: 3
+  max_delay_ms: 30000
+  strategy: "exponential_backoff"
+  min_delay_ms: 1000
+  jitter: "full"
+  retry_on_http_status: [429, 500, 502, 503]
+  notes:
+    - "OpenAI-compatible: exponential backoff is recommended for rate limit errors (429)."
+    - "Retry 500 after a brief wait."
+# HTTP status to error class. Keys are quoted so they stay strings rather
+# than being parsed as integers.
+# NOTE(review): confirm these classes against Mistral's documented error responses.
+error_classification:
+  by_http_status:
+    "400": "invalid_request"
+    "401": "authentication"
+    "403": "permission_denied"
+    "404": "not_found"
+    "429": "rate_limited"
+    "500": "server_error"
+    "503": "overloaded"
+# Protocol parameter name (key) to provider request field (value).
+parameter_mappings:
+  temperature: "temperature"
+  max_tokens: "max_tokens"
+  stream: "stream"
+  stop_sequences: "stop"
+  tools: "tools"
+  tool_choice: "tool_choice"
+  frequency_penalty: "frequency_penalty"
+  presence_penalty: "presence_penalty"
+  top_p: "top_p"
+  random_seed: "random_seed"
+  n: "n"
+  parallel_tool_calls: "parallel_tool_calls"
+  safe_prompt: "safe_prompt"
+  response_format: "response_format"
+  prompt_mode: "prompt_mode"
+  prediction: "prediction"
+  metadata: "metadata"
+response_format: "openai_style"
+# Paths into a non-streaming response body.
+response_paths:
+  content: "choices[0].message.content"
+  tool_calls: "choices[0].message.tool_calls"
+  usage: "usage"
+  # Same field that termination.source_field names, addressed on the first choice.
+  finish_reason: "choices[0].finish_reason"
+# Streaming: SSE frames prefixed with "data: ", separated by a blank line,
+# with "[DONE]" as the end-of-stream signal.
+streaming:
+  event_format: "data_lines"
+  decoder:
+    format: "sse"
+    delimiter: "\n\n"
+    prefix: "data: "
+    done_signal: "[DONE]"
+  content_path: "choices[0].delta.content"
+  tool_call_path: "choices[0].delta.tool_calls"
+  usage_path: "usage"
+  frame_selector: "exists($.choices) || exists($.error)"
+  event_map:
+    # Text content delta
+    - match: "exists($.choices[*].delta.content)"
+      emit: "PartialContentDelta"
+      fields:
+        content: "$.choices[*].delta.content"
+    # Tool call start
+    - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
+      emit: "ToolCallStarted"
+      fields:
+        tool_call_id: "$.choices[*].delta.tool_calls[*].id"
+        tool_name: "$.choices[*].delta.tool_calls[*].function.name"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    # Tool call arguments streaming
+    - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
+      emit: "PartialToolCall"
+      fields:
+        arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    # Usage metadata
+    - match: "exists($.usage)"
+      emit: "Metadata"
+      fields:
+        usage: "$.usage"
+    # Finish with reason
+    - match: "exists($.choices[*].finish_reason)"
+      emit: "FinalCandidate"
+      fields:
+        finish_reason: "$.choices[*].finish_reason"
+        candidate_index: "$.choices[*].index"
+  stop_condition: "$.choices[0].finish_reason != null"
+features:
+  multi_candidate:
+    support_type: "native"
+    param_name: "n"
+  response_mapping:
+    tool_calls:
+      path: "choices[0].message.tool_calls"
+      fields:
+        id: "id"
+        name: "function.name"
+        args: "function.arguments"
+    error:
+      message_path: "error.message"
+      code_path: "error.code"
+      type_path: "error.type"
+      param_path: "error.param"
+# Declared capability flags.
+capabilities:
+  streaming: true
+  tools: true
+  vision: false
+  agentic: true
+  parallel_tools: true
+  reasoning: false
+# Availability probe: GET /models with a 3 s timeout. 401 is listed as an
+# expected status alongside 200 (presumably so an unauthenticated probe still
+# counts as reachable - confirm against the runtime).
+availability:
+  required: false
+  regions:
+    - global
+  check:
+    method: GET
+    path: "/models"
+    expected_status: [200, 401]
+    timeout_ms: 3000

package/v1/providers/moonshot.yaml ADDED Viewed

@@ -0,0 +1,176 @@
+# Moonshot (Kimi) provider manifest: connection settings, OpenAI-style request
+# and response mappings, SSE stream decoding rules, and declared capabilities.
+$schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
+id: moonshot
+protocol_version: "1.5"
+name: 月之暗面 Kimi (Moonshot)
+version: "v1"
+status: stable
+category: ai_provider
+official_url: "https://platform.moonshot.cn/docs"
+support_contact: "https://www.moonshot.cn/contact"
+# Connection settings; timeout_ms is expressed in milliseconds (60000 = 60 s).
+endpoint:
+  base_url: "https://api.moonshot.cn/v1"
+  protocol: https
+  timeout_ms: 60000
+# Bearer auth; token_env names the environment variable expected to hold the
+# API key (presumably read by the runtime - confirm against the consumer).
+auth:
+  type: bearer
+  token_env: "MOONSHOT_API_KEY"
+payload_format: "openai_style"
+# OpenAI-compatible API
+api_families: ["chat_completions"]
+default_api_family: "chat_completions"
+# Operation endpoints; only "chat" is declared for this provider.
+endpoints:
+  chat:
+    path: "/chat/completions"
+    method: "POST"
+    adapter: "openai"
+# Auxiliary service endpoints.
+services:
+  list_models:
+    path: "/models"
+    method: "GET"
+    response_binding: "data"
+  # Kimi supports file upload for context
+  upload_file:
+    path: "/files"
+    method: "POST"
+  list_files:
+    path: "/files"
+    method: "GET"
+# Termination normalization: provider finish_reason value (key) mapped to the
+# normalized termination reason (value).
+# NOTE(review): no content_filter entry is mapped here - confirm whether
+# Moonshot ever reports it as a finish_reason.
+termination:
+  source_field: "finish_reason"
+  mapping:
+    stop: "end_turn"
+    length: "max_tokens"
+    tool_calls: "tool_use"
+  notes:
+    - "OpenAI-compatible finish_reason."
+    - "Kimi is known for ultra-long context (up to 200K tokens) and file understanding."
+# Tool-call normalization; arguments are declared as a JSON-encoded string.
+tooling:
+  source_model: "openai_tool_calls"
+  tool_use:
+    id_path: "id"
+    name_path: "function.name"
+    input_path: "function.arguments"
+    input_format: "json_string"
+  notes:
+    - "Supports OpenAI-compatible function calling."
+# Retry settings; delays are in milliseconds (1 s minimum, 30 s maximum).
+retry_policy:
+  strategy: "exponential_backoff"
+  max_retries: 3
+  min_delay_ms: 1000
+  max_delay_ms: 30000
+  jitter: "full"
+  retry_on_http_status: [429, 500, 502, 503]
+# HTTP status to error class. Keys are quoted so they stay strings rather
+# than being parsed as integers.
+error_classification:
+  by_http_status:
+    "400": "invalid_request"
+    "401": "authentication"
+    "403": "permission_denied"
+    "404": "not_found"
+    "429": "rate_limited"
+    "500": "server_error"
+    "503": "overloaded"
+# Protocol parameter name (key) to provider request field (value).
+parameter_mappings:
+  temperature: "temperature"
+  max_tokens: "max_tokens"
+  stream: "stream"
+  top_p: "top_p"
+  stop_sequences: "stop"
+  tools: "tools"
+  tool_choice: "tool_choice"
+  n: "n"
+response_format: "openai_style"
+# Paths into a non-streaming response body.
+response_paths:
+  content: "choices[0].message.content"
+  tool_calls: "choices[0].message.tool_calls"
+  usage: "usage"
+  finish_reason: "choices[0].finish_reason"
+# Streaming: SSE frames prefixed with "data: ", separated by a blank line,
+# with "[DONE]" as the end-of-stream signal.
+streaming:
+  event_format: "data_lines"
+  decoder:
+    format: "sse"
+    delimiter: "\n\n"
+    prefix: "data: "
+    done_signal: "[DONE]"
+  content_path: "choices[0].delta.content"
+  tool_call_path: "choices[0].delta.tool_calls"
+  usage_path: "usage"
+  frame_selector: "exists($.choices) || exists($.error)"
+  # Each rule pairs a match expression with the event to emit and the fields
+  # to extract from the frame.
+  event_map:
+    - match: "exists($.choices[*].delta.content)"
+      emit: "PartialContentDelta"
+      fields:
+        content: "$.choices[*].delta.content"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
+      emit: "ToolCallStarted"
+      fields:
+        tool_call_id: "$.choices[*].delta.tool_calls[*].id"
+        tool_name: "$.choices[*].delta.tool_calls[*].function.name"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
+      emit: "PartialToolCall"
+      fields:
+        arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.usage)"
+      emit: "Metadata"
+      fields:
+        usage: "$.usage"
+    - match: "exists($.choices[*].finish_reason)"
+      emit: "FinalCandidate"
+      fields:
+        finish_reason: "$.choices[*].finish_reason"
+        # Identifies which choice finished; needed because multi_candidate
+        # ("n") is declared as natively supported under features.
+        candidate_index: "$.choices[*].index"
+  stop_condition: "$.choices[0].finish_reason != null"
+features:
+  multi_candidate:
+    support_type: "native"
+    param_name: "n"
+  response_mapping:
+    tool_calls:
+      path: "choices[0].message.tool_calls"
+      fields:
+        id: "id"
+        name: "function.name"
+        args: "function.arguments"
+    error:
+      message_path: "error.message"
+      code_path: "error.code"
+      # Exposes the error body's "type" field.
+      # NOTE(review): confirm the field name against Moonshot's error format.
+      type_path: "error.type"
+# Declared capability flags.
+capabilities:
+  streaming: true
+  tools: true
+  vision: true
+  agentic: true
+  parallel_tools: true
+  reasoning: false
+# Availability probe: GET /models with a 5 s timeout. 401 is listed as an
+# expected status alongside 200 (presumably so an unauthenticated probe still
+# counts as reachable - confirm against the runtime).
+availability:
+  required: false
+  regions:
+    - cn
+  check:
+    method: GET
+    path: "/models"
+    expected_status: [200, 401]
+    timeout_ms: 5000
+experimental_features:
+  - "file_upload"
+  - "web_search"
+  - "long_context"

package/v1/providers/nvidia.yaml ADDED Viewed

@@ -0,0 +1,172 @@
+# NVIDIA API Catalog provider manifest: connection settings, OpenAI-style
+# request and response mappings, SSE stream decoding rules, and declared
+# capabilities.
+$schema: "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json"
+id: nvidia
+protocol_version: "1.5"
+name: NVIDIA API Catalog
+version: "v1"
+status: stable
+category: third_party_aggregator
+official_url: "https://build.nvidia.com/explore/discover"
+support_contact: "https://docs.api.nvidia.com/nim/docs"
+# NVIDIA API Catalog (NVIDIA Build) - OpenAI-compatible chat completions
+# Base URL: https://integrate.api.nvidia.com (docs.api.nvidia.com/nim/reference/llm-apis)
+# timeout_ms is expressed in milliseconds (60000 = 60 s).
+endpoint:
+  base_url: "https://integrate.api.nvidia.com/v1"
+  protocol: https
+  timeout_ms: 60000
+# Bearer auth; token_env names the environment variable expected to hold the
+# API key (presumably read by the runtime - confirm against the consumer).
+auth:
+  type: bearer
+  token_env: "NVIDIA_API_KEY"
+payload_format: "openai_style"
+api_families: ["chat_completions", "completions"]
+default_api_family: "chat_completions"
+# Operation endpoints: chat completions and plain completions.
+endpoints:
+  chat:
+    path: "/chat/completions"
+    method: "POST"
+    adapter: "openai"
+  completions:
+    path: "/completions"
+    method: "POST"
+    adapter: "openai"
+# Auxiliary service endpoints.
+services:
+  list_models:
+    path: "/models"
+    method: "GET"
+    response_binding: "data"
+# Termination normalization: provider finish_reason value (key) mapped to the
+# normalized termination reason (value).
+termination:
+  source_field: "finish_reason"
+  mapping:
+    stop: "end_turn"
+    length: "max_tokens"
+    tool_calls: "tool_use"
+    content_filter: "refusal"
+  notes:
+    - "OpenAI-compatible: finish_reason is reported per candidate."
+# Tool-call normalization; arguments are declared as a JSON-encoded string.
+tooling:
+  source_model: "openai_tool_calls"
+  tool_use:
+    id_path: "id"
+    name_path: "function.name"
+    input_path: "function.arguments"
+    input_format: "json_string"
+  notes:
+    - "OpenAI-compatible tool_calls.function.arguments is typically a JSON string."
+# Retry settings; delays are in milliseconds (1 s minimum, 30 s maximum).
+retry_policy:
+  max_retries: 3
+  max_delay_ms: 30000
+  strategy: "exponential_backoff"
+  min_delay_ms: 1000
+  jitter: "full"
+  retry_on_http_status: [429, 500, 502, 503]
+  notes:
+    - "Exponential backoff recommended for 429; retry 5xx after brief wait."
+# HTTP status to error class. Keys are quoted so they stay strings rather
+# than being parsed as integers.
+error_classification:
+  by_http_status:
+    "400": "invalid_request"
+    "401": "authentication"
+    "403": "permission_denied"
+    "404": "not_found"
+    "429": "rate_limited"
+    "500": "server_error"
+    # 503 is listed in retry_policy.retry_on_http_status, so classify it too.
+    "503": "overloaded"
+# Protocol parameter name (key) to provider request field (value).
+# NOTE(review): features.multi_candidate names param "n", but no "n" mapping
+# is listed here - confirm whether one should be added.
+parameter_mappings:
+  temperature: "temperature"
+  max_tokens: "max_tokens"
+  stream: "stream"
+  stop_sequences: "stop"
+  tools: "tools"
+  tool_choice: "tool_choice"
+  frequency_penalty: "frequency_penalty"
+  presence_penalty: "presence_penalty"
+  top_p: "top_p"
+response_format: "openai_style"
+# Paths into a non-streaming response body.
+response_paths:
+  content: "choices[0].message.content"
+  tool_calls: "choices[0].message.tool_calls"
+  usage: "usage"
+  finish_reason: "choices[0].finish_reason"
+# Streaming: SSE frames prefixed with "data: ", separated by a blank line,
+# with "[DONE]" as the end-of-stream signal.
+streaming:
+  event_format: "data_lines"
+  decoder:
+    format: "sse"
+    delimiter: "\n\n"
+    prefix: "data: "
+    done_signal: "[DONE]"
+  content_path: "choices[0].delta.content"
+  tool_call_path: "choices[0].delta.tool_calls"
+  usage_path: "usage"
+  frame_selector: "exists($.choices) || exists($.error)"
+  # Each rule pairs a match expression with the event to emit and the fields
+  # to extract from the frame.
+  event_map:
+    - match: "exists($.choices[*].delta.content)"
+      emit: "PartialContentDelta"
+      fields:
+        content: "$.choices[*].delta.content"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.name)"
+      emit: "ToolCallStarted"
+      fields:
+        tool_call_id: "$.choices[*].delta.tool_calls[*].id"
+        tool_name: "$.choices[*].delta.tool_calls[*].function.name"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.choices[*].delta.tool_calls[*].function.arguments)"
+      emit: "PartialToolCall"
+      fields:
+        arguments: "$.choices[*].delta.tool_calls[*].function.arguments"
+        index: "$.choices[*].delta.tool_calls[*].index"
+    - match: "exists($.usage)"
+      emit: "Metadata"
+      fields:
+        usage: "$.usage"
+    - match: "exists($.choices[*].finish_reason)"
+      emit: "FinalCandidate"
+      fields:
+        finish_reason: "$.choices[*].finish_reason"
+        candidate_index: "$.choices[*].index"
+  stop_condition: "$.choices[0].finish_reason != null"
+features:
+  multi_candidate:
+    support_type: "native"
+    param_name: "n"
+  response_mapping:
+    tool_calls:
+      path: "choices[0].message.tool_calls"
+      fields:
+        id: "id"
+        name: "function.name"
+        args: "function.arguments"
+    error:
+      message_path: "error.message"
+      code_path: "error.code"
+      type_path: "error.type"
+      param_path: "error.param"
+# Declared capability flags.
+capabilities:
+  streaming: true
+  tools: true
+  vision: true
+  agentic: true
+  parallel_tools: true
+  reasoning: true
+# Availability probe: GET /models with a 5 s timeout. 401 is listed as an
+# expected status alongside 200 (presumably so an unauthenticated probe still
+# counts as reachable - confirm against the runtime).
+availability:
+  required: false
+  regions:
+    - global
+  check:
+    method: GET
+    path: "/models"
+    expected_status: [200, 401]
+    timeout_ms: 5000