npm - @hermespilot/link - Versions diffs - 0.7.9-beta.0 → 0.7.9 - Mend

@hermespilot/link 0.7.9-beta.0 → 0.7.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/.env.example +27 -0
package/README.md +2 -0
package/dist/{chunk-Y5S7U77X.js → chunk-LUGNDJU3.js} +3128 -528
package/dist/cli/index.js +1 -1
package/dist/http/app.d.ts +52 -0
package/dist/http/app.js +1 -1
package/model-capabilities/catalog.json +1228 -0
package/package.json +3 -1

package/model-capabilities/catalog.json ADDED Viewed

@@ -0,0 +1,1228 @@
+{
+  "schemaVersion": 1,
+  "updatedAt": "2026-06-22T00:00:00.000Z",
+  "templateGuide": {
+    "purpose": "Template only. Replace the sample rows with verified model capability records before publishing to R2.",
+    "matching": "Use canonicalId only. Link performs conservative normalization when matching model IDs.",
+    "reasoningSupportPolicy": {
+      "supported": "Use when official/provider docs clearly say this model supports reasoning controls.",
+      "unsupported": "Use when official/provider docs clearly say this model does not support reasoning controls.",
+      "null": "Use when reasoning support has not been verified. Do not write auto in the catalog; auto is only a Profile/App configuration policy."
+    },
+    "supportedReasoningEfforts": {
+      "allowedValues": ["none", "minimal", "low", "medium", "high", "xhigh"],
+      "forSupportedModels": "Use the exact verified subset. The sample reasoning row shows the complete possible list.",
+      "forUnsupportedModels": [],
+      "forUnknownModels": null
+    }
+  },
+  "models": [
+    {
+      "canonicalId": "deepseek-v4-flash",
+      "contextLength": 1000000,
+      "maxOutputTokens": 384000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://api-docs.deepseek.com/quick_start/pricing",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Current DeepSeek API model. Official docs list 1M context and 384K max output, with both non-thinking and thinking modes. DeepSeek's official docs also say deepseek-chat and deepseek-reasoner are compatibility names that will be deprecated on 2026/07/24 15:59 UTC and correspond to the non-thinking/thinking modes of this model. I did not find a current official image-input declaration, so supportsVision is left null."
+    },
+    {
+      "canonicalId": "deepseek-v4-pro",
+      "contextLength": 1000000,
+      "maxOutputTokens": 384000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://api-docs.deepseek.com/quick_start/pricing",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Current DeepSeek API model. Official docs show the same public capability envelope as deepseek-v4-flash: 1M context, 384K max output, and both non-thinking and thinking modes. I did not find a current official image-input declaration, so supportsVision is left null."
+    },
+    {
+      "canonicalId": "gpt-4.1",
+      "contextLength": 1047576,
+      "maxOutputTokens": 32768,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-4.1",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "OpenAI's current non-reasoning GPT-4.1 model. Official docs list text/image input, text output, a 1,047,576-token context window, and 32,768 max output tokens."
+    },
+    {
+      "canonicalId": "gpt-4.1-mini",
+      "contextLength": 1047576,
+      "maxOutputTokens": 32768,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-4.1-mini",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Smaller, faster GPT-4.1 variant. Official docs list text/image input, text output, a 1,047,576-token context window, and 32,768 max output tokens."
+    },
+    {
+      "canonicalId": "gpt-4.1-nano",
+      "contextLength": 1047576,
+      "maxOutputTokens": 32768,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-4.1-nano",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Fastest GPT-4.1 variant. Official docs list text/image input, text output, a 1,047,576-token context window, and 32,768 max output tokens. The page says it runs without a reasoning step."
+    },
+    {
+      "canonicalId": "gpt-4o",
+      "contextLength": 128000,
+      "maxOutputTokens": 16384,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-4o",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Fast, intelligent, flexible GPT model. Official docs list text/image input, text output, a 128k context window, and 16,384 max output tokens. I did not find a page-level reasoning-effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-4o-mini",
+      "contextLength": 128000,
+      "maxOutputTokens": 16384,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-4o-mini",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Fast, affordable small GPT model. Official docs list text/image input, text output, a 128k context window, and 16,384 max output tokens. I did not find a page-level reasoning-effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-5",
+      "contextLength": 400000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Previous GPT-5 generation flagship model. Official docs list text/image input, text output, a 400,000-token context window, 128,000 max output tokens, and reasoning.effort support for minimal, low, medium, and high."
+    },
+    {
+      "canonicalId": "gpt-5-mini",
+      "contextLength": 400000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5-mini",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Faster, lower-cost GPT-5 variant. Official docs list text/image input, text output, a 400,000-token context window, and 128,000 max output tokens. The page surfaces reasoning token support but does not clearly publish a reasoning.effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-5-nano",
+      "contextLength": 400000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5-nano",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Fastest and cheapest GPT-5 variant. Official docs list text/image input, text output, a 400,000-token context window, and 128,000 max output tokens. The page surfaces reasoning token support but does not clearly publish a reasoning.effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-5.4",
+      "contextLength": 1050000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.4",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "OpenAI's frontier model for complex professional work. Official docs list text/image input, text output, a 1,050,000-token context window, 128,000 max output tokens, and reasoning.effort support for none, low, medium, high, and xhigh."
+    },
+    {
+      "canonicalId": "gpt-5.4-pro",
+      "contextLength": 1050000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.4-pro",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "GPT-5.4 Pro is available in the Responses API only. Official docs list text/image input, text output, a 1,050,000-token context window, 128,000 max output tokens, and reasoning.effort support for medium, high, and xhigh."
+    },
+    {
+      "canonicalId": "gpt-5.4-mini",
+      "contextLength": 400000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.4-mini",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "OpenAI's strongest mini model for coding, computer use, and subagents. Official docs list text/image input, text output, a 400,000-token context window, and 128,000 max output tokens. The page does not explicitly surface an effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-5.4-nano",
+      "contextLength": 400000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.4-nano",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "OpenAI's cheapest GPT-5.4-class model for simple high-volume tasks. Official docs list text/image input, text output, a 400,000-token context window, and 128,000 max output tokens. The page does not explicitly surface an effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gpt-5.5",
+      "contextLength": 1050000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.5",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "OpenAI's newest frontier model for coding and professional work. Official docs list text/image input, text output, a 1,050,000-token context window, 128,000 max output tokens, and reasoning.effort support for none, low, medium, high, and xhigh."
+    },
+    {
+      "canonicalId": "gpt-5.5-pro",
+      "contextLength": 1050000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://developers.openai.com/api/docs/models/gpt-5.5-pro",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Higher-compute GPT-5.5 Pro variant. Official docs list text/image input, text output, a 1,050,000-token context window, 128,000 max output tokens, and Responses API availability. I did not find a page-level reasoning.effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "gemini-2.5-pro",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio", "pdf"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-2.5-pro",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Gemini 2.5 Pro is Google's current thinking model. Official docs list 1,048,576 input tokens, 65,536 output tokens, and multimodal input including PDF. Google's OpenAI compatibility guide says Gemini 2.5 Pro cannot turn thinking off, so this catalog keeps the verified minimal/low/medium/high subset."
+    },
+    {
+      "canonicalId": "gemini-2.5-flash",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Gemini 2.5 Flash supports thinking and Google's OpenAI compatibility guide allows reasoning_effort none/minimal/low/medium/high for Gemini 2.5 models. Official docs list text, image, video, and audio input with 65,536 max output tokens."
+    },
+    {
+      "canonicalId": "gemini-2.5-flash-lite",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio", "pdf"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-lite",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Gemini 2.5 Flash-Lite is Google's most cost-efficient multimodal model. Official docs list text, image, video, audio, and PDF input, 1,048,576 input tokens, 65,536 output tokens, and thinking support. Google's OpenAI compatibility guide says reasoning_effort none disables thinking on Gemini 2.5 models."
+    },
+    {
+      "canonicalId": "gemini-3.1-flash-lite",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio", "pdf"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Current stable Gemini 3.1 Flash-Lite model. Official docs list text, image, video, audio, and PDF input, 1,048,576 input tokens, 65,536 output tokens, and thinking support. Google's OpenAI compatibility guide maps reasoning_effort minimal/low/medium/high to Gemini 3.1 Flash-Lite and says Gemini 3 models cannot disable thinking."
+    },
+    {
+      "canonicalId": "gemini-3.1-pro-preview",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio", "pdf"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-3.1-pro-preview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Gemini 3.1 Pro preview model. Official docs list text, image, video, audio, and PDF input, 1,048,576 input tokens, 65,536 output tokens, and thinking support. Google's OpenAI compatibility guide maps reasoning_effort low/medium/high to Gemini 3.1 Pro and says Gemini 3 models cannot disable thinking."
+    },
+    {
+      "canonicalId": "gemini-3.5-flash",
+      "contextLength": 1048576,
+      "maxOutputTokens": 65536,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "audio", "pdf"],
+      "outputModalities": ["text"],
+      "source": "https://ai.google.dev/gemini-api/docs/models/gemini-3.5-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Gemini 3.5 Flash is Google's current stable Gemini 3.5 model. Official docs list text, image, video, audio, and PDF input, 1,048,576 input tokens, 65,536 output tokens, and thinking support. Google's OpenAI compatibility docs show reasoning_effort low on gemini-3.5-flash and do not allow turning thinking off on Gemini 3 models."
+    },
+    {
+      "canonicalId": "claude-fable-5",
+      "contextLength": 1000000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.anthropic.com/en/docs/about-claude/models/overview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Anthropic's most capable widely released model. Official docs list 1M context, 128k max output, text/image input, vision support, and always-on adaptive thinking. Anthropic's model-config docs expose low, medium, high, xhigh, and max effort on Fable 5; this catalog records the normalized subset and omits max because the schema does not include it."
+    },
+    {
+      "canonicalId": "claude-opus-4-8",
+      "contextLength": 1000000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.anthropic.com/en/docs/about-claude/models/overview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Anthropic's current Opus-tier model. Official docs list 1M context, 128k max output, and vision support. Anthropic docs expose low, medium, high, xhigh, and max effort on Opus 4.8; this catalog records the normalized subset and omits max because the schema does not include it."
+    },
+    {
+      "canonicalId": "claude-sonnet-4-6",
+      "contextLength": 1000000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.anthropic.com/en/docs/about-claude/models/overview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Anthropic's current Sonnet-tier model. Official docs list 1M context, 64k max output, and vision support. Anthropic docs expose low, medium, high, and max effort on Sonnet 4.6; this catalog keeps the normalized low/medium/high subset and omits max because the schema does not include it."
+    },
+    {
+      "canonicalId": "claude-haiku-4-5",
+      "contextLength": 200000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.anthropic.com/en/docs/about-claude/models/overview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Anthropic's current Haiku-tier model. Official docs list 200k context, 64k max output, and vision support. Anthropic docs clearly describe extended thinking support on Haiku 4.5, but I did not find a clean official effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "qwen3.7-max",
+      "contextLength": 1000000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://help.aliyun.com/document_detail/3026903.html",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Alibaba Cloud Model Studio docs list qwen3.7-max with a 1M context window and 64k max output. The OpenAI Responses API compatibility docs expose reasoning.effort values none, minimal, low, medium, and high for Qwen3.7 models. Official multimodal docs list Qwen3.7 Max snapshots with text, image, and video input, so the base alias is recorded as vision-capable."
+    },
+    {
+      "canonicalId": "qwen3.7-plus",
+      "contextLength": 1000000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://help.aliyun.com/document_detail/3026903.html",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Alibaba Cloud Model Studio docs list qwen3.7-plus with a 1M context window, 64k max output, and text, image, and video input with text output. The OpenAI Responses API compatibility docs expose reasoning.effort values none, minimal, low, medium, and high for Qwen3.7 models."
+    },
+    {
+      "canonicalId": "qwen3.6-flash",
+      "contextLength": 1000000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://help.aliyun.com/document_detail/3026903.html",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Alibaba Cloud Model Studio docs list qwen3.6-flash with a 1M context window, 64k max output, and text, image, and video input with text output. The OpenAI Responses API compatibility docs expose reasoning.effort values none, minimal, low, medium, and high for the supported Qwen thinking models."
+    },
+    {
+      "canonicalId": "doubao-seed-2.0-code",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-2.0-code as a multimodal model with context cache, enabling/disabling deep thinking, and adjustable thinking depth. I did not find a clear context window, max output ceiling, or schema-compatible effort subset for this exact model, so those fields are left null."
+    },
+    {
+      "canonicalId": "doubao-seed-2.0-pro",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-2.0-pro as a flagship multimodal model for agentic complex reasoning, multimodal understanding, long-context reasoning, structured generation, and video understanding. The same page says it supports enabling/disabling deep thinking and adjustable thinking depth, but does not publish a clear context window, max output ceiling, or schema-compatible effort subset."
+    },
+    {
+      "canonicalId": "doubao-seed-2.0-lite",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-2.0-lite as a multimodal model with context cache, enabling/disabling deep thinking, and adjustable thinking depth. The page says it supports long context but does not publish a clear numeric context window, max output ceiling, or schema-compatible effort subset."
+    },
+    {
+      "canonicalId": "doubao-seed-2.0-mini",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-2.0-mini as a multimodal model that supports 256k context and four thinking lengths. Because the documented four levels match minimal, low, medium, and high in adjacent Doubao entries, this catalog records those normalized efforts. I did not find a clear max output ceiling."
+    },
+    {
+      "canonicalId": "doubao-seed-1.8-251228",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-Seed-1.8-251228 as a multimodal deep-thinking model and explicitly say it supports minimal, low, medium, and high modes. I did not find a clear context window or max output ceiling for this exact model."
+    },
+    {
+      "canonicalId": "doubao-seed-code",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-Seed-Code as a multimodal model optimized for agentic programming tasks, with deep thinking enable/disable support and Responses API context cache. I did not find a clear context window, max output ceiling, or schema-compatible effort subset."
+    },
+    {
+      "canonicalId": "doubao-seed-1.6-flash-250828",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-seed-1.6-flash-250828 as a multimodal model with deep thinking enable/disable support and context cache. The page describes it as an improved flash version but does not publish a clear context window, max output ceiling, or schema-compatible effort subset for this exact model."
+    },
+    {
+      "canonicalId": "doubao-seed-1-6-251015",
+      "contextLength": null,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "minimal",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-1-6-251015 as a multimodal model that supports the reasoning_effort field with minimal, low, medium, and high. I did not find a clear context window or max output ceiling for this exact model."
+    },
+    {
+      "canonicalId": "doubao-seed-1.6-250615",
+      "contextLength": 256000,
+      "maxOutputTokens": 16000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-Seed-1.6-250615 as a multimodal deep-thinking model with 256k context and 16k max output. It supports enabling/disabling deep thinking or auto mode, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "doubao-1-6-flash-250615",
+      "contextLength": 256000,
+      "maxOutputTokens": 16000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-1-6-flash-250615 as a fast multimodal deep-thinking model with text and vision understanding, 256k context, and 16k max output. It supports enabling/disabling deep thinking, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "doubao-seed-1-6-vision-250815",
+      "contextLength": 256000,
+      "maxOutputTokens": 64000,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list doubao-seed-1-6-vision-250815 as a multimodal model for video understanding, grounding, and GUI Agent scenarios, with 256k max context and 64k max output. Its advanced function list only shows context cache, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "doubao-1.5-pro-32k",
+      "contextLength": 32000,
+      "maxOutputTokens": 12000,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-1.5-pro-32k as a text model with 32k context and 12k max output. The advanced function list shows context cache only, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "doubao-1.5-lite-32k-250115",
+      "contextLength": 32000,
+      "maxOutputTokens": 12000,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-1.5-lite-32k/250115 as a text model with 32k context and 12k max output. The slash in the displayed model version is normalized to a hyphen here because model IDs are matched conservatively by canonicalId. The advanced function list shows context cache only, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "doubao-1.5-pro-vision-32k-250115",
+      "contextLength": 32000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-1.5-pro-vision-32k/250115 as a multimodal vision-understanding model. The version name itself indicates 32k context, but I did not find a clear max output ceiling. The advanced function list says no advanced features, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "doubao-1.5-pro-32k-character-250715",
+      "contextLength": 32000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-1.5-pro-32k-character-250715 as a text role-play model. The version name itself indicates 32k context, but I did not find a clear max output ceiling. The advanced function list says no advanced features, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "doubao-lite",
+      "contextLength": 32000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.coze.cn/api/open/docs/guides/model_service",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "ByteDance Coze official model-service docs list Doubao-lite as a text model that supports 32k context inference and fine-tuning. I did not find a clear max output ceiling. The advanced function list says no advanced features, so reasoning is recorded as unsupported."
+    },
+    {
+      "canonicalId": "kimi-k2.7-code",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://platform.kimi.com/docs/models.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Moonshot's Kimi model list describes kimi-k2.7-code as the current coding model with a 256k context window. The Kimi K2.7 Code guide documents text, image, and video input and text output. The model is thinking-oriented, but I did not find a clean effort-level mapping that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "kimi-k2.7-code-highspeed",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://platform.kimi.com/docs/models.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Moonshot's Kimi model list describes kimi-k2.7-code-highspeed as the high-speed version of Kimi K2.7 Code. It shares that model's 256k context window and its multimodal text, image, and video input capability. No official max output ceiling or schema-compatible reasoning effort matrix was found."
+    },
+    {
+      "canonicalId": "kimi-k2.6",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://platform.kimi.com/docs/models.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Moonshot's Kimi model list describes kimi-k2.6 as a current 256k-context multimodal model. The Kimi K2.6 guide documents text, image, and video input and supports thinking and non-thinking modes, but the control does not map cleanly to this catalog's effort enum, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-5.2",
+      "contextLength": 1000000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/start/model-overview",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official model overview lists GLM-5.2 in the text model table with 1M context and 128K max output. I did not find a clean official reasoning-effort subset for this model that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-5.1",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-5.1",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-5.1 model page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-5",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-5",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-5 model page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-5-turbo",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-5-turbo",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-5-Turbo model page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-4.7",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-4.7",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-4.7 model page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-4.7-flashx",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-4.7",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's GLM-4.7 page lists GLM-4.7-FlashX as a text-input, text-output GLM-4.7 family variant with a 200K context window and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-4.7-flash",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/free/glm-4.7-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-4.7-Flash page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents thinking modes, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-4.6",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/text/glm-4.6",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-4.6 model page lists text input, text output, a 200K context window, and 128K max output tokens. The page documents deep thinking support, but I did not find a clean effort-level subset that matches this catalog schema, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "glm-5v-turbo",
+      "contextLength": 200000,
+      "maxOutputTokens": 128000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "file"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/vlm/glm-5v-turbo",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official GLM-5V-Turbo page lists video, image, text, and file input with text output, a 200K context window, and 128K max output tokens. It supports enabling or disabling thinking mode, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "glm-4.6v",
+      "contextLength": 128000,
+      "maxOutputTokens": 32000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "file"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/vlm/glm-4.6v",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official model overview lists GLM-4.6V with 128K context and 32K max output, and the GLM-4.6V page lists video, image, text, and file input with text output. It supports enabling or disabling thinking mode, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "glm-4.6v-flash",
+      "contextLength": 128000,
+      "maxOutputTokens": 32000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video", "file"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/free/glm-4.6v-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official model overview lists GLM-4.6V-Flash with 128K context and 32K max output, and the GLM-4.6V-Flash page lists video, image, text, and file input with text output. It supports enabling or disabling thinking mode, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "glm-4.1v-thinking",
+      "contextLength": 64000,
+      "maxOutputTokens": 16000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/vlm/glm-4.1v-thinking",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official model overview lists GLM-4.1V-Thinking with 64K context and 16K max output, and the model page lists video, image, and text input with text output. It has built-in deep thinking, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "glm-4.1v-thinking-flash",
+      "contextLength": 64000,
+      "maxOutputTokens": 16000,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://docs.bigmodel.cn/cn/guide/models/free/glm-4.1v-thinking-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Zhipu's official model overview lists GLM-4.1V-Thinking-Flash with 64K context and 16K max output, and the model page describes it as a visual reasoning model for image and video understanding. It has built-in deep thinking, but I did not find a clean effort-level subset that matches this catalog schema."
+    },
+    {
+      "canonicalId": "MiniMax-M3",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M3 as a native multimodal 1M-context model. The same page says OpenAI-compatible Chat Completions support text, image, and video input. Thinking is available in MiniMax-compatible protocol surfaces, but I did not find a schema-compatible reasoning effort matrix, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "MiniMax-M2.7",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.7 with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2.7-highspeed",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.7-highspeed with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2.5",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.5 with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2.5-highspeed",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.5-highspeed with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2.1",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.1 with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2.1-highspeed",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2.1-highspeed with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "MiniMax-M2",
+      "contextLength": 204800,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list MiniMax-M2 with a 204,800-token context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "M2-her",
+      "contextLength": 64000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": null,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.minimaxi.com/docs/guides/text-generation.md",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "MiniMax official text generation docs list M2-her as a chat model with a 64K context window. I did not find an official max output ceiling, vision declaration, or schema-compatible reasoning effort matrix for this model."
+    },
+    {
+      "canonicalId": "step-3.7-flash",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image", "video"],
+      "outputModalities": ["text"],
+      "source": "https://platform.stepfun.com/docs/zh/guides/models/step-3.7-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "StepFun official docs describe step-3.7-flash as a 256K-context native multimodal reasoning model with image and video understanding. The same page documents reasoning_effort levels low, medium, and high for Chat Completions, plus output_config.effort for the Messages API. I did not find a clear max output ceiling."
+    },
+    {
+      "canonicalId": "step-3.5-flash",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": false,
+      "inputModalities": ["text"],
+      "outputModalities": ["text"],
+      "source": "https://platform.stepfun.com/docs/zh/guides/models/step-3.5-flash",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "StepFun official docs describe step-3.5-flash as a 256K-context pure text reasoning model. Variant-specific pages expose some reasoning strengths, but I did not find a clean base-model effort subset for this canonical ID, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "grok-4.3",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "none",
+        "low",
+        "medium",
+        "high"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.3",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.3 with text and image input, text output, and a 1,000,000-token max prompt length. The model page describes configurable reasoning and links to the effort levels none, low, medium, and high. I did not find a clear max output ceiling."
+    },
+    {
+      "canonicalId": "grok-4.20",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-reasoning",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20 as an alias for model name grok-4.20-0309-reasoning, with text and image input, text output, a 1,000,000-token context window, and reasoning capability. I did not find an official reasoning.effort matrix for this reasoning-model alias, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "grok-4.20-0309-reasoning",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-reasoning",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20-0309-reasoning with text and image input, text output, a 1,000,000-token context window, and reasoning capability. I did not find an official reasoning.effort matrix for this exact model name, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "grok-4.20-non-reasoning",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-0309-non-reasoning",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20-non-reasoning as an alias for model name grok-4.20-0309-non-reasoning, with text and image input, text output, a 1,000,000-token context window, and Reasoning: No."
+    },
+    {
+      "canonicalId": "grok-4.20-0309-non-reasoning",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "unsupported",
+      "supportedReasoningEfforts": [],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-0309-non-reasoning",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20-0309-non-reasoning with text and image input, text output, a 1,000,000-token context window, and Reasoning: No."
+    },
+    {
+      "canonicalId": "grok-4.20-multi-agent",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-multi-agent-0309",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20-multi-agent as an alias for model name grok-4.20-multi-agent-0309, with text and image input, text output, a 1,000,000-token context window, and reasoning capability. xAI's reasoning guide says reasoning.effort values low, medium, high, and xhigh are supported for grok-4.20-multi-agent, but this controls agent count rather than reasoning depth."
+    },
+    {
+      "canonicalId": "grok-4.20-multi-agent-0309",
+      "contextLength": 1000000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": "supported",
+      "supportedReasoningEfforts": [
+        "low",
+        "medium",
+        "high",
+        "xhigh"
+      ],
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-4.20-multi-agent-0309",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-4.20-multi-agent-0309 with text and image input, text output, a 1,000,000-token context window, and reasoning capability. xAI's reasoning guide says reasoning.effort values low, medium, high, and xhigh are supported for grok-4.20-multi-agent, but this controls agent count rather than reasoning depth."
+    },
+    {
+      "canonicalId": "grok-build-0.1",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.x.ai/developers/models/grok-build-0.1",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "xAI official docs list grok-build-0.1 as an early-access fast coding model with text and image input, text output, a 256,000-token context window, and reasoning capability. I did not find an official reasoning.effort matrix for this model, so reasoning fields are left null."
+    },
+    {
+      "canonicalId": "mistral-medium-3-5-26-04",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.mistral.ai/models/model-cards/mistral-medium-3-5-26-04",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Mistral official model card identifies Mistral Medium 3.5 as a frontier-class multimodal model and shows a 256k context window. I did not find a clear max output ceiling or schema-compatible reasoning effort matrix."
+    },
+    {
+      "canonicalId": "mistral-large-3-25-12",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.mistral.ai/models/model-cards/mistral-large-3-25-12",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Mistral official model card identifies Mistral Large 3 as a general-purpose multimodal model and shows a 256k context window. I did not find a clear max output ceiling or schema-compatible reasoning effort matrix."
+    },
+    {
+      "canonicalId": "mistral-small-4-0-26-03",
+      "contextLength": 256000,
+      "maxOutputTokens": null,
+      "reasoningSupportPolicy": null,
+      "supportedReasoningEfforts": null,
+      "supportsVision": true,
+      "inputModalities": ["text", "image"],
+      "outputModalities": ["text"],
+      "source": "https://docs.mistral.ai/models/model-cards/mistral-small-4-0-26-03",
+      "updatedAt": "2026-06-22T00:00:00.000Z",
+      "notes": "Mistral official model card identifies Mistral Small 4.0 as a multimodal model and shows a 256k context window. I did not find a clear max output ceiling or schema-compatible reasoning effort matrix."
+    }
+  ]
+}