npm - @ailib-official/ai-protocol - Versions diffs - 0.8.4 - Mend

@ailib-official/ai-protocol 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (194) hide show

package/LICENSE +6 -0
package/README.md +415 -0
package/dist/index.json +8 -0
package/dist/v1/models/ai21.json +140 -0
package/dist/v1/models/baichuan.json +138 -0
package/dist/v1/models/cerebras.json +147 -0
package/dist/v1/models/claude.json +114 -0
package/dist/v1/models/cohere.json +235 -0
package/dist/v1/models/deepinfra.json +43 -0
package/dist/v1/models/deepseek-chat.json +55 -0
package/dist/v1/models/doubao.json +197 -0
package/dist/v1/models/ernie.json +223 -0
package/dist/v1/models/fireworks.json +222 -0
package/dist/v1/models/gemini.json +58 -0
package/dist/v1/models/gpt.json +166 -0
package/dist/v1/models/grok.json +138 -0
package/dist/v1/models/huggingface.json +183 -0
package/dist/v1/models/hunyuan.json +255 -0
package/dist/v1/models/jina.json +139 -0
package/dist/v1/models/lepton.json +188 -0
package/dist/v1/models/llama.json +143 -0
package/dist/v1/models/minimax.json +194 -0
package/dist/v1/models/mistral.json +177 -0
package/dist/v1/models/moonshot.json +144 -0
package/dist/v1/models/nvidia.json +212 -0
package/dist/v1/models/palmyra.json +103 -0
package/dist/v1/models/perplexity.json +143 -0
package/dist/v1/models/qwen.json +49 -0
package/dist/v1/models/replicate.json +206 -0
package/dist/v1/models/sensenova.json +144 -0
package/dist/v1/models/siliconflow.json +44 -0
package/dist/v1/models/spark.json +173 -0
package/dist/v1/models/stable-diffusion.json +161 -0
package/dist/v1/models/tiangong.json +169 -0
package/dist/v1/models/together.json +43 -0
package/dist/v1/models/yi.json +199 -0
package/dist/v1/models/zhipu.json +250 -0
package/dist/v1/providers/ai21.json +215 -0
package/dist/v1/providers/anthropic.json +253 -0
package/dist/v1/providers/anyscale.json +115 -0
package/dist/v1/providers/azure.json +188 -0
package/dist/v1/providers/baichuan.json +205 -0
package/dist/v1/providers/baidu.json +205 -0
package/dist/v1/providers/cerebras.json +216 -0
package/dist/v1/providers/cohere.json +209 -0
package/dist/v1/providers/deepinfra.json +196 -0
package/dist/v1/providers/deepseek.json +221 -0
package/dist/v1/providers/doubao.json +209 -0
package/dist/v1/providers/fireworks.json +227 -0
package/dist/v1/providers/gemini.json +279 -0
package/dist/v1/providers/groq.json +218 -0
package/dist/v1/providers/huggingface.json +181 -0
package/dist/v1/providers/hunyuan.json +198 -0
package/dist/v1/providers/jina.json +202 -0
package/dist/v1/providers/lepton.json +221 -0
package/dist/v1/providers/minimax.json +209 -0
package/dist/v1/providers/mistral.json +214 -0
package/dist/v1/providers/moonshot.json +214 -0
package/dist/v1/providers/nvidia.json +213 -0
package/dist/v1/providers/openai.json +267 -0
package/dist/v1/providers/openrouter.json +220 -0
package/dist/v1/providers/perplexity.json +172 -0
package/dist/v1/providers/qwen.json +231 -0
package/dist/v1/providers/replicate.json +192 -0
package/dist/v1/providers/sensenova.json +185 -0
package/dist/v1/providers/siliconflow.json +197 -0
package/dist/v1/providers/spark.json +204 -0
package/dist/v1/providers/stability.json +221 -0
package/dist/v1/providers/tiangong.json +207 -0
package/dist/v1/providers/together.json +196 -0
package/dist/v1/providers/writer.json +253 -0
package/dist/v1/providers/xai.json +238 -0
package/dist/v1/providers/yi.json +205 -0
package/dist/v1/providers/zhipu.json +208 -0
package/dist/v1/spec.json +783 -0
package/dist/v2/providers/anthropic.json +372 -0
package/dist/v2/providers/cohere.json +109 -0
package/dist/v2/providers/deepseek.json +272 -0
package/dist/v2/providers/doubao.json +260 -0
package/dist/v2/providers/google.json +388 -0
package/dist/v2/providers/jina.json +71 -0
package/dist/v2/providers/moonshot.json +284 -0
package/dist/v2/providers/openai.json +419 -0
package/dist/v2/providers/qwen.json +274 -0
package/dist/v2/providers/zhipu.json +257 -0
package/dist/v2-alpha/providers/anthropic.json +182 -0
package/dist/v2-alpha/providers/gemini.json +187 -0
package/dist/v2-alpha/providers/openai.json +215 -0
package/dist/v2-alpha/spec.json +644 -0
package/package.json +61 -0
package/schemas/spec.json +186 -0
package/schemas/v1.json +1116 -0
package/schemas/v2/availability.json +66 -0
package/schemas/v2/capabilities.json +182 -0
package/schemas/v2/capability-profile.json +174 -0
package/schemas/v2/computer-use.json +222 -0
package/schemas/v2/context-policy.json +148 -0
package/schemas/v2/endpoint.json +2 -0
package/schemas/v2/error-codes.yaml +225 -0
package/schemas/v2/errors.json +250 -0
package/schemas/v2/execution-metadata.json +59 -0
package/schemas/v2/mcp.json +225 -0
package/schemas/v2/message-roles.json +10 -0
package/schemas/v2/multimodal.json +297 -0
package/schemas/v2/pricing.json +14 -0
package/schemas/v2/provider-contract.json +317 -0
package/schemas/v2/provider.json +203 -0
package/schemas/v2/regions.json +14 -0
package/v1/models/ai21.yaml +97 -0
package/v1/models/baichuan.yaml +95 -0
package/v1/models/cerebras.yaml +99 -0
package/v1/models/claude.yaml +59 -0
package/v1/models/cohere.yaml +165 -0
package/v1/models/deepinfra.yaml +29 -0
package/v1/models/deepseek-chat.yaml +32 -0
package/v1/models/doubao.yaml +129 -0
package/v1/models/ernie.yaml +146 -0
package/v1/models/fireworks.yaml +145 -0
package/v1/models/gemini.yaml +32 -0
package/v1/models/gpt.yaml +90 -0
package/v1/models/grok.yaml +74 -0
package/v1/models/huggingface.yaml +110 -0
package/v1/models/hunyuan.yaml +164 -0
package/v1/models/jina.yaml +98 -0
package/v1/models/lepton.yaml +130 -0
package/v1/models/llama.yaml +91 -0
package/v1/models/minimax.yaml +132 -0
package/v1/models/mistral.yaml +100 -0
package/v1/models/moonshot.yaml +97 -0
package/v1/models/nvidia.yaml +118 -0
package/v1/models/palmyra.yaml +59 -0
package/v1/models/perplexity.yaml +97 -0
package/v1/models/qwen.yaml +27 -0
package/v1/models/replicate.yaml +136 -0
package/v1/models/sensenova.yaml +97 -0
package/v1/models/siliconflow.yaml +29 -0
package/v1/models/spark.yaml +114 -0
package/v1/models/stable-diffusion.yaml +113 -0
package/v1/models/tiangong.yaml +114 -0
package/v1/models/together.yaml +29 -0
package/v1/models/yi.yaml +132 -0
package/v1/models/zhipu.yaml +163 -0
package/v1/providers/ai21.yaml +176 -0
package/v1/providers/anthropic.yaml +209 -0
package/v1/providers/anyscale.yaml +106 -0
package/v1/providers/azure.yaml +155 -0
package/v1/providers/baichuan.yaml +168 -0
package/v1/providers/baidu.yaml +173 -0
package/v1/providers/cerebras.yaml +178 -0
package/v1/providers/cohere.yaml +175 -0
package/v1/providers/deepinfra.yaml +156 -0
package/v1/providers/deepseek.yaml +189 -0
package/v1/providers/doubao.yaml +172 -0
package/v1/providers/fireworks.yaml +187 -0
package/v1/providers/gemini.yaml +229 -0
package/v1/providers/groq.yaml +181 -0
package/v1/providers/huggingface.yaml +157 -0
package/v1/providers/hunyuan.yaml +162 -0
package/v1/providers/jina.yaml +171 -0
package/v1/providers/lepton.yaml +183 -0
package/v1/providers/minimax.yaml +172 -0
package/v1/providers/mistral.yaml +186 -0
package/v1/providers/moonshot.yaml +176 -0
package/v1/providers/nvidia.yaml +172 -0
package/v1/providers/openai.yaml +224 -0
package/v1/providers/openrouter.yaml +181 -0
package/v1/providers/perplexity.yaml +144 -0
package/v1/providers/qwen.yaml +192 -0
package/v1/providers/replicate.yaml +159 -0
package/v1/providers/sensenova.yaml +153 -0
package/v1/providers/siliconflow.yaml +156 -0
package/v1/providers/spark.yaml +167 -0
package/v1/providers/stability.yaml +185 -0
package/v1/providers/tiangong.yaml +170 -0
package/v1/providers/together.yaml +156 -0
package/v1/providers/writer.yaml +212 -0
package/v1/providers/xai.yaml +206 -0
package/v1/providers/yi.yaml +168 -0
package/v1/providers/zhipu.yaml +171 -0
package/v1/spec.yaml +637 -0
package/v2/providers/anthropic.yaml +244 -0
package/v2/providers/cohere.yaml +75 -0
package/v2/providers/deepseek.yaml +176 -0
package/v2/providers/doubao.yaml +169 -0
package/v2/providers/google.yaml +245 -0
package/v2/providers/jina.yaml +55 -0
package/v2/providers/moonshot.yaml +186 -0
package/v2/providers/openai.yaml +266 -0
package/v2/providers/qwen.yaml +174 -0
package/v2/providers/zhipu.yaml +176 -0
package/v2-alpha/providers/anthropic.yaml +134 -0
package/v2-alpha/providers/gemini.yaml +144 -0
package/v2-alpha/providers/openai.yaml +154 -0
package/v2-alpha/spec.yaml +512 -0

package/dist/v1/providers/perplexity.json ADDED Viewed

@@ -0,0 +1,172 @@
+{
+  "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
+  "id": "perplexity",
+  "protocol_version": "1.5",
+  "name": "Perplexity",
+  "version": "v1",
+  "status": "stable",
+  "category": "ai_provider",
+  "official_url": "https://docs.perplexity.ai",
+  "support_contact": "https://www.perplexity.ai/contact",
+  "endpoint": {
+    "base_url": "https://api.perplexity.ai",
+    "protocol": "https",
+    "timeout_ms": 60000
+  },
+  "auth": {
+    "type": "bearer",
+    "token_env": "PPLX_API_KEY"
+  },
+  "payload_format": "openai_style",
+  "api_families": [
+    "chat_completions"
+  ],
+  "default_api_family": "chat_completions",
+  "endpoints": {
+    "chat": {
+      "path": "/chat/completions",
+      "method": "POST",
+      "adapter": "openai"
+    }
+  },
+  "services": {
+    "list_models": {
+      "path": "/models",
+      "method": "GET",
+      "response_binding": "data"
+    }
+  },
+  "termination": {
+    "source_field": "finish_reason",
+    "mapping": {
+      "stop": "end_turn",
+      "length": "max_tokens"
+    },
+    "notes": [
+      "Perplexity is known for search-augmented AI responses.",
+      "Returns citations in responses when using online models."
+    ]
+  },
+  "tooling": {
+    "source_model": "unknown",
+    "notes": [
+      "Perplexity focuses on search/RAG, limited tool support."
+    ]
+  },
+  "retry_policy": {
+    "strategy": "exponential_backoff",
+    "max_retries": 3,
+    "min_delay_ms": 1000,
+    "max_delay_ms": 30000,
+    "jitter": "full",
+    "retry_on_http_status": [
+      429,
+      500,
+      502,
+      503
+    ]
+  },
+  "error_classification": {
+    "by_http_status": {
+      "400": "invalid_request",
+      "401": "authentication",
+      "403": "permission_denied",
+      "404": "not_found",
+      "429": "rate_limited",
+      "500": "server_error",
+      "503": "overloaded"
+    }
+  },
+  "parameter_mappings": {
+    "temperature": "temperature",
+    "max_tokens": "max_tokens",
+    "stream": "stream",
+    "top_p": "top_p",
+    "frequency_penalty": "frequency_penalty",
+    "presence_penalty": "presence_penalty"
+  },
+  "response_format": "openai_style",
+  "response_paths": {
+    "content": "choices[0].message.content",
+    "usage": "usage",
+    "finish_reason": "choices[0].finish_reason",
+    "citations": "citations"
+  },
+  "streaming": {
+    "event_format": "data_lines",
+    "decoder": {
+      "format": "sse",
+      "delimiter": "\n\n",
+      "prefix": "data: ",
+      "done_signal": "[DONE]"
+    },
+    "content_path": "choices[0].delta.content",
+    "usage_path": "usage",
+    "frame_selector": "exists($.choices) || exists($.error)",
+    "event_map": [
+      {
+        "match": "exists($.choices[*].delta.content)",
+        "emit": "PartialContentDelta",
+        "fields": {
+          "content": "$.choices[*].delta.content"
+        }
+      },
+      {
+        "match": "exists($.usage)",
+        "emit": "Metadata",
+        "fields": {
+          "usage": "$.usage"
+        }
+      },
+      {
+        "match": "exists($.choices[*].finish_reason)",
+        "emit": "FinalCandidate",
+        "fields": {
+          "finish_reason": "$.choices[*].finish_reason"
+        }
+      }
+    ],
+    "stop_condition": "$.choices[0].finish_reason != null"
+  },
+  "features": {
+    "multi_candidate": {
+      "support_type": "simulated",
+      "max_concurrent": 1
+    },
+    "response_mapping": {
+      "error": {
+        "message_path": "error.message",
+        "code_path": "error.code",
+        "type_path": "error.type"
+      }
+    }
+  },
+  "capabilities": {
+    "streaming": true,
+    "tools": false,
+    "vision": false,
+    "agentic": false,
+    "parallel_tools": false,
+    "reasoning": false
+  },
+  "availability": {
+    "required": false,
+    "regions": [
+      "global"
+    ],
+    "check": {
+      "method": "GET",
+      "path": "/models",
+      "expected_status": [
+        200,
+        401
+      ],
+      "timeout_ms": 5000
+    }
+  },
+  "experimental_features": [
+    "online_search",
+    "citations",
+    "related_questions"
+  ]
+}

package/dist/v1/providers/qwen.json ADDED Viewed

@@ -0,0 +1,231 @@
+{
+  "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
+  "id": "qwen",
+  "protocol_version": "1.5",
+  "name": "Qwen (DashScope)",
+  "version": "v1",
+  "status": "stable",
+  "category": "ai_provider",
+  "official_url": "https://help.aliyun.com/zh/model-studio",
+  "support_contact": "https://help.aliyun.com",
+  "endpoint": {
+    "base_url": "https://dashscope.aliyuncs.com/compatible-mode/v1",
+    "protocol": "https",
+    "timeout_ms": 10000
+  },
+  "auth": {
+    "type": "bearer",
+    "token_env": "QWEN_API_KEY"
+  },
+  "payload_format": "openai_style",
+  "api_families": [
+    "chat_completions",
+    "completions"
+  ],
+  "default_api_family": "chat_completions",
+  "endpoints": {
+    "chat": {
+      "path": "/chat/completions",
+      "method": "POST",
+      "adapter": "openai"
+    },
+    "completions": {
+      "path": "/completions",
+      "method": "POST",
+      "adapter": "openai"
+    }
+  },
+  "services": {
+    "list_models": {
+      "path": "/models",
+      "method": "GET",
+      "response_binding": "data"
+    }
+  },
+  "termination": {
+    "source_field": "finish_reason",
+    "mapping": {
+      "stop": "end_turn",
+      "length": "max_tokens",
+      "tool_calls": "tool_use",
+      "content_filter": "refusal"
+    },
+    "notes": [
+      "OpenAI-compatible: finish_reason is reported per candidate."
+    ]
+  },
+  "tooling": {
+    "source_model": "openai_tool_calls",
+    "tool_use": {
+      "id_path": "id",
+      "name_path": "function.name",
+      "input_path": "function.arguments",
+      "input_format": "json_string"
+    },
+    "notes": [
+      "OpenAI-compatible tool_calls.function.arguments is typically a JSON string; runtimes SHOULD parse it into an object when normalizing."
+    ]
+  },
+  "rate_limit_headers": {
+    "requests_limit": "x-ratelimit-limit-requests",
+    "tokens_limit": "x-ratelimit-limit-tokens",
+    "requests_remaining": "x-ratelimit-remaining-requests",
+    "tokens_remaining": "x-ratelimit-remaining-tokens",
+    "requests_reset": "x-ratelimit-reset-requests",
+    "tokens_reset": "x-ratelimit-reset-tokens",
+    "retry_after": "retry-after"
+  },
+  "retry_policy": {
+    "strategy": "exponential_backoff",
+    "max_retries": 2,
+    "min_delay_ms": 1000,
+    "max_delay_ms": 8000,
+    "jitter": "full",
+    "retry_on_http_status": [
+      408,
+      409,
+      429,
+      500,
+      503
+    ],
+    "notes": [
+      "429 can mean rate limit exceeded (QPS/QPM/other limits) OR quota/payment issue; runtimes SHOULD inspect error messages and avoid infinite retries on quota/payment problems.",
+      "On 429, runtimes SHOULD respect Retry-After when present.",
+      "500/503 are server-side/transient; retry after a brief wait.",
+      "408/409 are commonly retried by client libraries with short exponential backoff."
+    ]
+  },
+  "error_classification": {
+    "by_http_status": {
+      "400": "invalid_request",
+      "401": "authentication",
+      "429": "rate_limited",
+      "500": "server_error",
+      "503": "overloaded"
+    },
+    "notes": [
+      "Qwen/DashScope 429 may indicate quota/payment issue; runtimes SHOULD treat as quota_exhausted when the message indicates quota/payment."
+    ]
+  },
+  "parameter_mappings": {
+    "temperature": "temperature",
+    "max_tokens": "max_tokens",
+    "stream": "stream",
+    "top_p": "top_p",
+    "stop_sequences": "stop",
+    "tools": "tools",
+    "tool_choice": "tool_choice"
+  },
+  "response_format": "openai_style",
+  "response_paths": {
+    "content": "choices[0].message.content",
+    "tool_calls": "choices[0].message.tool_calls",
+    "usage": "usage",
+    "finish_reason": "choices[0].finish_reason"
+  },
+  "streaming": {
+    "event_format": "data_lines",
+    "decoder": {
+      "format": "sse",
+      "delimiter": "\n\n",
+      "prefix": "data: ",
+      "done_signal": "[DONE]"
+    },
+    "content_path": "choices[0].delta.content",
+    "tool_call_path": "choices[0].delta.tool_calls",
+    "usage_path": "usage",
+    "frame_selector": "exists($.choices) || exists($.error)",
+    "event_map": [
+      {
+        "match": "exists($.choices[*].delta.content)",
+        "emit": "PartialContentDelta",
+        "fields": {
+          "content": "$.choices[*].delta.content"
+        }
+      },
+      {
+        "match": "exists($.choices[*].delta.tool_calls[*].function.name)",
+        "emit": "ToolCallStarted",
+        "fields": {
+          "tool_call_id": "$.choices[*].delta.tool_calls[*].id",
+          "tool_name": "$.choices[*].delta.tool_calls[*].function.name",
+          "index": "$.choices[*].delta.tool_calls[*].index"
+        }
+      },
+      {
+        "match": "exists($.choices[*].delta.tool_calls[*].function.arguments)",
+        "emit": "PartialToolCall",
+        "fields": {
+          "arguments": "$.choices[*].delta.tool_calls[*].function.arguments",
+          "index": "$.choices[*].delta.tool_calls[*].index"
+        }
+      },
+      {
+        "match": "exists($.usage)",
+        "emit": "Metadata",
+        "fields": {
+          "usage": "$.usage"
+        }
+      },
+      {
+        "match": "exists($.choices[*].finish_reason)",
+        "emit": "FinalCandidate",
+        "fields": {
+          "finish_reason": "$.choices[*].finish_reason",
+          "candidate_index": "$.choices[*].index"
+        }
+      }
+    ],
+    "stop_condition": "$.choices[0].finish_reason != null"
+  },
+  "features": {
+    "multi_candidate": {
+      "support_type": "native",
+      "param_name": "n"
+    },
+    "response_mapping": {
+      "tool_calls": {
+        "path": "choices[0].message.tool_calls",
+        "fields": {
+          "id": "id",
+          "name": "function.name",
+          "args": "function.arguments"
+        }
+      },
+      "error": {
+        "message_path": "error.message",
+        "code_path": "error.code",
+        "type_path": "error.type",
+        "param_path": "error.param"
+      }
+    }
+  },
+  "capabilities": {
+    "streaming": true,
+    "tools": true,
+    "vision": true,
+    "agentic": true,
+    "parallel_tools": false,
+    "reasoning": false
+  },
+  "availability": {
+    "required": false,
+    "regions": [
+      "cn",
+      "global"
+    ],
+    "check": {
+      "method": "GET",
+      "path": "/models",
+      "expected_status": [
+        200,
+        401
+      ],
+      "timeout_ms": 3000
+    }
+  },
+  "experimental_features": [
+    "multilingual_support",
+    "qwen_agent"
+  ]
+}

package/dist/v1/providers/replicate.json ADDED Viewed

@@ -0,0 +1,192 @@
+{
+  "$schema": "https://raw.githubusercontent.com/ailib-official/ai-protocol/main/schemas/v1.json",
+  "id": "replicate",
+  "protocol_version": "1.5",
+  "name": "Replicate",
+  "version": "v1",
+  "status": "stable",
+  "category": "model_provider",
+  "official_url": "https://replicate.com/docs",
+  "support_contact": "https://replicate.com/contact",
+  "endpoint": {
+    "base_url": "https://api.replicate.com/v1",
+    "protocol": "https",
+    "timeout_ms": 60000
+  },
+  "auth": {
+    "type": "bearer",
+    "token_env": "REPLICATE_API_TOKEN"
+  },
+  "payload_format": "replicate_style",
+  "api_families": [
+    "predictions",
+    "openai_compatible"
+  ],
+  "default_api_family": "predictions",
+  "endpoints": {
+    "chat": {
+      "path": "/models/{owner}/{model}/predictions",
+      "method": "POST",
+      "adapter": "replicate"
+    },
+    "openai_chat": {
+      "path": "/openai/v1/chat/completions",
+      "method": "POST",
+      "adapter": "openai"
+    }
+  },
+  "services": {
+    "list_models": {
+      "path": "/models",
+      "method": "GET",
+      "response_binding": "results"
+    },
+    "get_prediction": {
+      "path": "/predictions/{id}",
+      "method": "GET"
+    },
+    "cancel_prediction": {
+      "path": "/predictions/{id}/cancel",
+      "method": "POST"
+    }
+  },
+  "termination": {
+    "source_field": "status",
+    "mapping": {
+      "succeeded": "end_turn",
+      "failed": "other",
+      "canceled": "cancelled"
+    },
+    "notes": [
+      "Replicate uses async predictions with status polling.",
+      "For streaming, use the stream parameter."
+    ]
+  },
+  "tooling": {
+    "source_model": "unknown",
+    "notes": [
+      "Tool calling support varies by model.",
+      "Some models support OpenAI-compatible function calling via the openai endpoint."
+    ]
+  },
+  "retry_policy": {
+    "strategy": "exponential_backoff",
+    "max_retries": 3,
+    "min_delay_ms": 1000,
+    "max_delay_ms": 30000,
+    "jitter": "full",
+    "retry_on_http_status": [
+      429,
+      500,
+      502,
+      503,
+      504
+    ],
+    "notes": [
+      "Replicate may return 503 when models are cold-starting.",
+      "Consider longer timeouts for initial requests."
+    ]
+  },
+  "error_classification": {
+    "by_http_status": {
+      "400": "invalid_request",
+      "401": "authentication",
+      "402": "quota_exhausted",
+      "403": "permission_denied",
+      "404": "not_found",
+      "422": "invalid_request",
+      "429": "rate_limited",
+      "500": "server_error",
+      "503": "overloaded"
+    }
+  },
+  "parameter_mappings": {
+    "temperature": "input.temperature",
+    "max_tokens": "input.max_tokens",
+    "stream": "stream",
+    "top_p": "input.top_p",
+    "stop_sequences": "input.stop",
+    "prompt": "input.prompt",
+    "system_message": "input.system_prompt"
+  },
+  "response_format": "replicate_style",
+  "response_paths": {
+    "content": "output",
+    "status": "status",
+    "error": "error"
+  },
+  "streaming": {
+    "event_format": "sse",
+    "decoder": {
+      "format": "sse",
+      "delimiter": "\n\n",
+      "prefix": "data: ",
+      "done_signal": "done"
+    },
+    "content_path": "output",
+    "event_map": [
+      {
+        "match": "$.event == 'output'",
+        "emit": "PartialContentDelta",
+        "fields": {
+          "content": "$.data"
+        }
+      },
+      {
+        "match": "$.event == 'done'",
+        "emit": "StreamEnd",
+        "fields": {
+          "finish_reason": "end_turn"
+        }
+      },
+      {
+        "match": "$.event == 'error'",
+        "emit": "StreamError",
+        "fields": {
+          "error": "$.data"
+        }
+      }
+    ],
+    "stop_condition": "$.event == 'done'"
+  },
+  "features": {
+    "multi_candidate": {
+      "support_type": "simulated",
+      "max_concurrent": 4
+    },
+    "response_mapping": {
+      "error": {
+        "message_path": "detail",
+        "type_path": "type"
+      }
+    }
+  },
+  "capabilities": {
+    "streaming": true,
+    "tools": false,
+    "vision": true,
+    "agentic": false,
+    "parallel_tools": false,
+    "reasoning": false
+  },
+  "availability": {
+    "required": false,
+    "regions": [
+      "global"
+    ],
+    "check": {
+      "method": "GET",
+      "path": "/models",
+      "expected_status": [
+        200,
+        401
+      ],
+      "timeout_ms": 5000
+    }
+  },
+  "experimental_features": [
+    "async_predictions",
+    "webhooks",
+    "cold_boot_optimization"
+  ]
+}