@mastra/mcp-docs-server 1.1.26-alpha.8 → 1.1.26
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.docs/docs/agents/structured-output.md +22 -0
- package/.docs/docs/agents/supervisor-agents.md +18 -0
- package/.docs/docs/editor/overview.md +69 -0
- package/.docs/docs/memory/storage.md +1 -0
- package/.docs/docs/observability/tracing/exporters/langfuse.md +31 -0
- package/.docs/guides/deployment/netlify.md +16 -1
- package/.docs/guides/getting-started/next-js.md +0 -4
- package/.docs/guides/migrations/mastra-cloud.md +2 -2
- package/.docs/models/gateways/netlify.md +2 -3
- package/.docs/models/gateways/openrouter.md +3 -1
- package/.docs/models/index.md +1 -1
- package/.docs/models/providers/302ai.md +32 -1
- package/.docs/models/providers/berget.md +9 -12
- package/.docs/models/providers/cloudflare-workers-ai.md +2 -1
- package/.docs/models/providers/cortecs.md +2 -1
- package/.docs/models/providers/deepinfra.md +4 -1
- package/.docs/models/providers/digitalocean.md +116 -0
- package/.docs/models/providers/fireworks-ai.md +2 -1
- package/.docs/models/providers/helicone.md +1 -2
- package/.docs/models/providers/huggingface.md +2 -1
- package/.docs/models/providers/kilo.md +2 -1
- package/.docs/models/providers/kimi-for-coding.md +2 -1
- package/.docs/models/providers/llmgateway.md +59 -77
- package/.docs/models/providers/moonshotai-cn.md +3 -2
- package/.docs/models/providers/moonshotai.md +3 -2
- package/.docs/models/providers/nano-gpt.md +8 -1
- package/.docs/models/providers/nvidia.md +2 -1
- package/.docs/models/providers/ollama-cloud.md +2 -1
- package/.docs/models/providers/openai.md +1 -2
- package/.docs/models/providers/opencode-go.md +2 -1
- package/.docs/models/providers/opencode.md +4 -1
- package/.docs/models/providers/ovhcloud.md +4 -7
- package/.docs/models/providers/poe.md +2 -1
- package/.docs/models/providers/tencent-token-plan.md +71 -0
- package/.docs/models/providers/tencent-tokenhub.md +71 -0
- package/.docs/models/providers/wafer.ai.md +72 -0
- package/.docs/models/providers/zenmux.md +2 -1
- package/.docs/models/providers.md +4 -0
- package/.docs/reference/agents/generate.md +8 -0
- package/.docs/reference/client-js/workflows.md +12 -0
- package/.docs/reference/core/mastra-class.md +9 -1
- package/.docs/reference/deployer/cloudflare.md +14 -1
- package/.docs/reference/deployer/netlify.md +50 -2
- package/.docs/reference/harness/harness-class.md +72 -49
- package/.docs/reference/index.md +2 -0
- package/.docs/reference/observability/tracing/exporters/langfuse.md +2 -0
- package/.docs/reference/processors/prefill-error-handler.md +5 -5
- package/.docs/reference/storage/cloudflare-d1.md +42 -42
- package/.docs/reference/storage/redis.md +266 -0
- package/.docs/reference/streaming/agents/stream.md +8 -0
- package/.docs/reference/streaming/workflows/resumeStream.md +2 -0
- package/.docs/reference/tools/tavily.md +307 -0
- package/.docs/reference/workflows/run-methods/resume.md +24 -0
- package/.docs/reference/workflows/workflow-methods/foreach.md +14 -1
- package/CHANGELOG.md +71 -0
- package/package.json +10 -10
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Fireworks AI
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 18 Fireworks AI models through Mastra's model router. Authentication is handled automatically using the `FIREWORKS_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Fireworks AI documentation](https://fireworks.ai/docs/).
|
|
6
6
|
|
|
@@ -46,6 +46,7 @@ for await (const chunk of stream) {
|
|
|
46
46
|
| `fireworks-ai/accounts/fireworks/models/kimi-k2-instruct` | 128K | | | | | | $1 | $3 |
|
|
47
47
|
| `fireworks-ai/accounts/fireworks/models/kimi-k2-thinking` | 256K | | | | | | $0.60 | $3 |
|
|
48
48
|
| `fireworks-ai/accounts/fireworks/models/kimi-k2p5` | 256K | | | | | | $0.60 | $3 |
|
|
49
|
+
| `fireworks-ai/accounts/fireworks/models/kimi-k2p6` | 262K | | | | | | $0.95 | $4 |
|
|
49
50
|
| `fireworks-ai/accounts/fireworks/models/minimax-m2p1` | 200K | | | | | | $0.30 | $1 |
|
|
50
51
|
| `fireworks-ai/accounts/fireworks/models/minimax-m2p5` | 197K | | | | | | $0.30 | $1 |
|
|
51
52
|
| `fireworks-ai/accounts/fireworks/models/minimax-m2p7` | 197K | | | | | | $0.30 | $1 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Helicone
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 90 Helicone models through Mastra's model router. Authentication is handled automatically using the `HELICONE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Helicone documentation](https://helicone.ai/models).
|
|
6
6
|
|
|
@@ -48,7 +48,6 @@ for await (const chunk of stream) {
|
|
|
48
48
|
| `helicone/claude-opus-4-1-20250805` | 200K | | | | | | $15 | $75 |
|
|
49
49
|
| `helicone/claude-sonnet-4` | 200K | | | | | | $3 | $15 |
|
|
50
50
|
| `helicone/claude-sonnet-4-5-20250929` | 200K | | | | | | $3 | $15 |
|
|
51
|
-
| `helicone/codex-mini-latest` | 200K | | | | | | $2 | $6 |
|
|
52
51
|
| `helicone/deepseek-r1-distill-llama-70b` | 128K | | | | | | $0.03 | $0.13 |
|
|
53
52
|
| `helicone/deepseek-reasoner` | 128K | | | | | | $0.56 | $2 |
|
|
54
53
|
| `helicone/deepseek-tng-r1t2-chimera` | 130K | | | | | | $0.30 | $1 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Hugging Face
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 23 Hugging Face models through Mastra's model router. Authentication is handled automatically using the `HF_TOKEN` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Hugging Face documentation](https://huggingface.co).
|
|
6
6
|
|
|
@@ -43,6 +43,7 @@ for await (const chunk of stream) {
|
|
|
43
43
|
| `huggingface/moonshotai/Kimi-K2-Instruct-0905` | 262K | | | | | | $1 | $3 |
|
|
44
44
|
| `huggingface/moonshotai/Kimi-K2-Thinking` | 262K | | | | | | $0.60 | $3 |
|
|
45
45
|
| `huggingface/moonshotai/Kimi-K2.5` | 262K | | | | | | $0.60 | $3 |
|
|
46
|
+
| `huggingface/moonshotai/Kimi-K2.6` | 262K | | | | | | $0.95 | $4 |
|
|
46
47
|
| `huggingface/Qwen/Qwen3-235B-A22B-Thinking-2507` | 262K | | | | | | $0.30 | $3 |
|
|
47
48
|
| `huggingface/Qwen/Qwen3-Coder-480B-A35B-Instruct` | 262K | | | | | | $2 | $2 |
|
|
48
49
|
| `huggingface/Qwen/Qwen3-Coder-Next` | 262K | | | | | | $0.20 | $2 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Kilo Gateway
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 335 Kilo Gateway models through Mastra's model router. Authentication is handled automatically using the `KILO_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Kilo Gateway documentation](https://kilo.ai).
|
|
6
6
|
|
|
@@ -189,6 +189,7 @@ for await (const chunk of stream) {
|
|
|
189
189
|
| `kilo/moonshotai/kimi-k2-0905` | 131K | | | | | | $0.40 | $2 |
|
|
190
190
|
| `kilo/moonshotai/kimi-k2-thinking` | 131K | | | | | | $0.47 | $2 |
|
|
191
191
|
| `kilo/moonshotai/kimi-k2.5` | 262K | | | | | | $0.45 | $2 |
|
|
192
|
+
| `kilo/moonshotai/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
192
193
|
| `kilo/morph/morph-v3-fast` | 82K | | | | | | $0.80 | $1 |
|
|
193
194
|
| `kilo/morph/morph-v3-large` | 262K | | | | | | $0.90 | $2 |
|
|
194
195
|
| `kilo/nex-agi/deepseek-v3.1-nex-n1` | 131K | | | | | | $0.27 | $1 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Kimi For Coding
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 3 Kimi For Coding models through Mastra's model router. Authentication is handled automatically using the `KIMI_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Kimi For Coding documentation](https://www.kimi.com/coding/docs/en/third-party-agents.html).
|
|
6
6
|
|
|
@@ -35,6 +35,7 @@ for await (const chunk of stream) {
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| ---------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
37
|
| `kimi-for-coding/k2p5` | 262K | | | | | | — | — |
|
|
38
|
+
| `kimi-for-coding/k2p6` | 262K | | | | | | — | — |
|
|
38
39
|
| `kimi-for-coding/kimi-k2-thinking` | 262K | | | | | | — | — |
|
|
39
40
|
|
|
40
41
|
## Advanced configuration
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# LLM Gateway
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 181 LLM Gateway models through Mastra's model router. Authentication is handled automatically using the `LLMGATEWAY_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [LLM Gateway documentation](https://llmgateway.io/docs).
|
|
6
6
|
|
|
@@ -35,11 +35,9 @@ for await (const chunk of stream) {
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| -------------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
37
|
| `llmgateway/auto` | 128K | | | | | | — | — |
|
|
38
|
-
| `llmgateway/claude-3-5-sonnet`
|
|
38
|
+
| `llmgateway/claude-3-5-sonnet-20241022` | 200K | | | | | | $3 | $15 |
|
|
39
39
|
| `llmgateway/claude-3-7-sonnet` | 200K | | | | | | $3 | $15 |
|
|
40
40
|
| `llmgateway/claude-3-7-sonnet-20250219` | 200K | | | | | | $3 | $15 |
|
|
41
|
-
| `llmgateway/claude-3-haiku` | 200K | | | | | | $0.25 | $1 |
|
|
42
|
-
| `llmgateway/claude-3-haiku-20240307` | 200K | | | | | | $0.25 | $1 |
|
|
43
41
|
| `llmgateway/claude-3-opus` | 200K | | | | | | $15 | $75 |
|
|
44
42
|
| `llmgateway/claude-haiku-4-5` | 200K | | | | | | $1 | $5 |
|
|
45
43
|
| `llmgateway/claude-haiku-4-5-20251001` | 200K | | | | | | $1 | $5 |
|
|
@@ -47,53 +45,51 @@ for await (const chunk of stream) {
|
|
|
47
45
|
| `llmgateway/claude-opus-4-20250514` | 200K | | | | | | $15 | $75 |
|
|
48
46
|
| `llmgateway/claude-opus-4-5-20251101` | 200K | | | | | | $5 | $25 |
|
|
49
47
|
| `llmgateway/claude-opus-4-6` | 1.0M | | | | | | $5 | $25 |
|
|
48
|
+
| `llmgateway/claude-opus-4-7` | 1.0M | | | | | | $5 | $25 |
|
|
50
49
|
| `llmgateway/claude-sonnet-4-20250514` | 200K | | | | | | $3 | $15 |
|
|
51
50
|
| `llmgateway/claude-sonnet-4-5` | 200K | | | | | | $3 | $15 |
|
|
52
51
|
| `llmgateway/claude-sonnet-4-5-20250929` | 200K | | | | | | $3 | $15 |
|
|
53
|
-
| `llmgateway/claude-sonnet-4-6` |
|
|
52
|
+
| `llmgateway/claude-sonnet-4-6` | 1.0M | | | | | | $3 | $15 |
|
|
54
53
|
| `llmgateway/codestral-2508` | 256K | | | | | | $0.30 | $0.90 |
|
|
55
|
-
| `llmgateway/cogview-4` | 2K | | | | | | — | — |
|
|
56
54
|
| `llmgateway/custom` | 128K | | | | | | — | — |
|
|
57
55
|
| `llmgateway/deepseek-r1-0528` | 64K | | | | | | $0.80 | $2 |
|
|
58
56
|
| `llmgateway/deepseek-v3.1` | 128K | | | | | | $0.56 | $2 |
|
|
59
57
|
| `llmgateway/deepseek-v3.2` | 164K | | | | | | $0.28 | $0.42 |
|
|
60
58
|
| `llmgateway/devstral-2512` | 262K | | | | | | $0.40 | $2 |
|
|
61
|
-
| `llmgateway/devstral-small-2507` |
|
|
59
|
+
| `llmgateway/devstral-small-2507` | 128K | | | | | | $0.10 | $0.30 |
|
|
60
|
+
| `llmgateway/gemini-2.0-flash` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
61
|
+
| `llmgateway/gemini-2.0-flash-lite` | 1.0M | | | | | | $0.07 | $0.30 |
|
|
62
62
|
| `llmgateway/gemini-2.5-flash` | 1.0M | | | | | | $0.30 | $3 |
|
|
63
|
-
| `llmgateway/gemini-2.5-flash-image` | 33K | | | | | | $0.30 | $30 |
|
|
64
|
-
| `llmgateway/gemini-2.5-flash-image-preview` | 33K | | | | | | $0.30 | $3 |
|
|
65
63
|
| `llmgateway/gemini-2.5-flash-lite` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
66
64
|
| `llmgateway/gemini-2.5-flash-lite-preview-09-2025` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
67
65
|
| `llmgateway/gemini-2.5-pro` | 1.0M | | | | | | $1 | $10 |
|
|
68
66
|
| `llmgateway/gemini-3-flash-preview` | 1.0M | | | | | | $0.50 | $3 |
|
|
69
|
-
| `llmgateway/gemini-3-pro-image-preview` | 66K | | | | | | $2 | $12 |
|
|
70
|
-
| `llmgateway/gemini-3.1-flash-image-preview` | 66K | | | | | | $0.25 | $2 |
|
|
71
67
|
| `llmgateway/gemini-3.1-flash-lite-preview` | 1.0M | | | | | | $0.25 | $2 |
|
|
72
68
|
| `llmgateway/gemini-3.1-pro-preview` | 1.0M | | | | | | $2 | $12 |
|
|
73
69
|
| `llmgateway/gemini-pro-latest` | 1.0M | | | | | | $2 | $12 |
|
|
74
70
|
| `llmgateway/gemma-2-27b-it-together` | 8K | | | | | | $0.08 | $0.08 |
|
|
75
|
-
| `llmgateway/gemma-3-12b-it` |
|
|
71
|
+
| `llmgateway/gemma-3-12b-it` | 33K | | | | | | — | — |
|
|
76
72
|
| `llmgateway/gemma-3-1b-it` | 1.0M | | | | | | $0.08 | $0.30 |
|
|
77
73
|
| `llmgateway/gemma-3-27b` | 128K | | | | | | $0.27 | $0.27 |
|
|
78
|
-
| `llmgateway/gemma-3-4b-it` |
|
|
79
|
-
| `llmgateway/gemma-3n-e2b-it` |
|
|
80
|
-
| `llmgateway/gemma-3n-e4b-it` |
|
|
74
|
+
| `llmgateway/gemma-3-4b-it` | 33K | | | | | | — | — |
|
|
75
|
+
| `llmgateway/gemma-3n-e2b-it` | 8K | | | | | | — | — |
|
|
76
|
+
| `llmgateway/gemma-3n-e4b-it` | 8K | | | | | | — | — |
|
|
81
77
|
| `llmgateway/glm-4-32b-0414-128k` | 128K | | | | | | $0.10 | $0.10 |
|
|
82
|
-
| `llmgateway/glm-4.5` |
|
|
83
|
-
| `llmgateway/glm-4.5-air` |
|
|
78
|
+
| `llmgateway/glm-4.5` | 131K | | | | | | $0.60 | $2 |
|
|
79
|
+
| `llmgateway/glm-4.5-air` | 131K | | | | | | $0.20 | $1 |
|
|
84
80
|
| `llmgateway/glm-4.5-airx` | 128K | | | | | | $1 | $5 |
|
|
85
|
-
| `llmgateway/glm-4.5-flash` |
|
|
81
|
+
| `llmgateway/glm-4.5-flash` | 131K | | | | | | — | — |
|
|
86
82
|
| `llmgateway/glm-4.5-x` | 128K | | | | | | $2 | $9 |
|
|
87
|
-
| `llmgateway/glm-4.5v` |
|
|
88
|
-
| `llmgateway/glm-4.6` |
|
|
83
|
+
| `llmgateway/glm-4.5v` | 64K | | | | | | $0.60 | $2 |
|
|
84
|
+
| `llmgateway/glm-4.6` | 205K | | | | | | $0.60 | $2 |
|
|
89
85
|
| `llmgateway/glm-4.6v` | 128K | | | | | | $0.30 | $0.90 |
|
|
90
86
|
| `llmgateway/glm-4.6v-flash` | 128K | | | | | | — | — |
|
|
91
87
|
| `llmgateway/glm-4.6v-flashx` | 128K | | | | | | $0.04 | $0.40 |
|
|
92
|
-
| `llmgateway/glm-4.7` |
|
|
88
|
+
| `llmgateway/glm-4.7` | 205K | | | | | | $0.60 | $2 |
|
|
93
89
|
| `llmgateway/glm-4.7-flash` | 200K | | | | | | — | — |
|
|
94
90
|
| `llmgateway/glm-4.7-flashx` | 200K | | | | | | $0.07 | $0.40 |
|
|
95
|
-
| `llmgateway/glm-5` |
|
|
96
|
-
| `llmgateway/glm-
|
|
91
|
+
| `llmgateway/glm-5` | 205K | | | | | | $1 | $3 |
|
|
92
|
+
| `llmgateway/glm-5.1` | 200K | | | | | | $6 | $24 |
|
|
97
93
|
| `llmgateway/gpt-3.5-turbo` | 16K | | | | | | $0.50 | $2 |
|
|
98
94
|
| `llmgateway/gpt-4` | 8K | | | | | | $30 | $60 |
|
|
99
95
|
| `llmgateway/gpt-4-turbo` | 128K | | | | | | $10 | $30 |
|
|
@@ -132,13 +128,10 @@ for await (const chunk of stream) {
|
|
|
132
128
|
| `llmgateway/grok-4-1-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
133
129
|
| `llmgateway/grok-4-20-beta-0309-non-reasoning` | 2.0M | | | | | | $2 | $6 |
|
|
134
130
|
| `llmgateway/grok-4-20-beta-0309-reasoning` | 2.0M | | | | | | $2 | $6 |
|
|
135
|
-
| `llmgateway/grok-4-20-multi-agent-beta-0309` | 2.0M | | | | | | $2 | $6 |
|
|
136
131
|
| `llmgateway/grok-4-fast` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
137
132
|
| `llmgateway/grok-4-fast-non-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
138
133
|
| `llmgateway/grok-4-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
139
134
|
| `llmgateway/grok-code-fast-1` | 256K | | | | | | $0.20 | $2 |
|
|
140
|
-
| `llmgateway/grok-imagine-image` | 2K | | | | | | — | — |
|
|
141
|
-
| `llmgateway/grok-imagine-image-pro` | 2K | | | | | | — | — |
|
|
142
135
|
| `llmgateway/hermes-2-pro-llama-3-8b` | 8K | | | | | | $0.14 | $0.14 |
|
|
143
136
|
| `llmgateway/kimi-k2` | 131K | | | | | | $1 | $3 |
|
|
144
137
|
| `llmgateway/kimi-k2-thinking` | 262K | | | | | | $0.60 | $3 |
|
|
@@ -151,13 +144,13 @@ for await (const chunk of stream) {
|
|
|
151
144
|
| `llmgateway/llama-3.1-nemotron-ultra-253b` | 128K | | | | | | $0.60 | $2 |
|
|
152
145
|
| `llmgateway/llama-3.2-11b-instruct` | 128K | | | | | | $0.07 | $0.33 |
|
|
153
146
|
| `llmgateway/llama-3.2-3b-instruct` | 33K | | | | | | $0.03 | $0.05 |
|
|
154
|
-
| `llmgateway/llama-3.3-70b-instruct` | 128K | | | | | |
|
|
147
|
+
| `llmgateway/llama-3.3-70b-instruct` | 128K | | | | | | — | — |
|
|
155
148
|
| `llmgateway/llama-4-maverick-17b-instruct` | 8K | | | | | | $0.24 | $0.97 |
|
|
156
149
|
| `llmgateway/llama-4-scout` | 33K | | | | | | $0.18 | $0.59 |
|
|
157
150
|
| `llmgateway/llama-4-scout-17b-instruct` | 8K | | | | | | $0.17 | $0.66 |
|
|
158
|
-
| `llmgateway/
|
|
159
|
-
| `llmgateway/minimax-m2` | 197K | | | | | | $0.
|
|
160
|
-
| `llmgateway/minimax-m2.1` |
|
|
151
|
+
| `llmgateway/mimo-v2-flash` | 256K | | | | | | $0.10 | $0.30 |
|
|
152
|
+
| `llmgateway/minimax-m2` | 197K | | | | | | $0.30 | $1 |
|
|
153
|
+
| `llmgateway/minimax-m2.1` | 205K | | | | | | $0.30 | $1 |
|
|
161
154
|
| `llmgateway/minimax-m2.1-lightning` | 197K | | | | | | $0.12 | $0.48 |
|
|
162
155
|
| `llmgateway/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
163
156
|
| `llmgateway/minimax-m2.5-highspeed` | 205K | | | | | | $0.60 | $2 |
|
|
@@ -168,57 +161,50 @@ for await (const chunk of stream) {
|
|
|
168
161
|
| `llmgateway/ministral-3b-2512` | 131K | | | | | | $0.10 | $0.10 |
|
|
169
162
|
| `llmgateway/ministral-8b-2512` | 262K | | | | | | $0.15 | $0.15 |
|
|
170
163
|
| `llmgateway/mistral-large-2512` | 262K | | | | | | $0.50 | $2 |
|
|
171
|
-
| `llmgateway/mistral-large-latest` |
|
|
164
|
+
| `llmgateway/mistral-large-latest` | 262K | | | | | | $0.50 | $2 |
|
|
172
165
|
| `llmgateway/mistral-small-2506` | 128K | | | | | | $0.10 | $0.30 |
|
|
173
|
-
| `llmgateway/mixtral-8x7b-instruct-together` | 33K | | | | | | $0.06 | $0.06 |
|
|
174
166
|
| `llmgateway/o1` | 200K | | | | | | $15 | $60 |
|
|
175
167
|
| `llmgateway/o3` | 200K | | | | | | $2 | $8 |
|
|
176
168
|
| `llmgateway/o3-mini` | 200K | | | | | | $1 | $4 |
|
|
177
169
|
| `llmgateway/o4-mini` | 200K | | | | | | $1 | $4 |
|
|
178
|
-
| `llmgateway/pixtral-large-latest` | 128K | | | | | | $
|
|
179
|
-
| `llmgateway/qwen-coder-plus` | 131K | | | | | | $
|
|
170
|
+
| `llmgateway/pixtral-large-latest` | 128K | | | | | | $2 | $6 |
|
|
171
|
+
| `llmgateway/qwen-coder-plus` | 131K | | | | | | $0.50 | $1 |
|
|
180
172
|
| `llmgateway/qwen-flash` | 1.0M | | | | | | $0.05 | $0.40 |
|
|
181
|
-
| `llmgateway/qwen-
|
|
182
|
-
| `llmgateway/qwen-
|
|
183
|
-
| `llmgateway/qwen-
|
|
184
|
-
| `llmgateway/qwen-
|
|
185
|
-
| `llmgateway/qwen-
|
|
186
|
-
| `llmgateway/qwen-image-plus` | 2K | | | | | | — | — |
|
|
187
|
-
| `llmgateway/qwen-max` | 131K | | | | | | $2 | $6 |
|
|
188
|
-
| `llmgateway/qwen-max-latest` | 131K | | | | | | $2 | $6 |
|
|
189
|
-
| `llmgateway/qwen-omni-turbo` | 33K | | | | | | $0.20 | $0.80 |
|
|
190
|
-
| `llmgateway/qwen-plus` | 131K | | | | | | $0.40 | $1 |
|
|
191
|
-
| `llmgateway/qwen-plus-latest` | 1.0M | | | | | | $0.40 | $1 |
|
|
173
|
+
| `llmgateway/qwen-max` | 33K | | | | | | $2 | $6 |
|
|
174
|
+
| `llmgateway/qwen-max-latest` | 33K | | | | | | $2 | $6 |
|
|
175
|
+
| `llmgateway/qwen-omni-turbo` | 33K | | | | | | $0.07 | $0.27 |
|
|
176
|
+
| `llmgateway/qwen-plus` | 1.0M | | | | | | $0.40 | $1 |
|
|
177
|
+
| `llmgateway/qwen-plus-latest` | 131K | | | | | | $0.30 | $0.90 |
|
|
192
178
|
| `llmgateway/qwen-turbo` | 1.0M | | | | | | $0.05 | $0.20 |
|
|
193
179
|
| `llmgateway/qwen-vl-max` | 131K | | | | | | $0.80 | $3 |
|
|
194
|
-
| `llmgateway/qwen-vl-plus` | 131K | | | | | | $0.21 | $0.
|
|
195
|
-
| `llmgateway/qwen2-5-vl-32b-instruct` | 131K | | | | | | $
|
|
196
|
-
| `llmgateway/qwen2-5-vl-72b-instruct` |
|
|
197
|
-
| `llmgateway/qwen25-coder-7b` |
|
|
198
|
-
| `llmgateway/qwen3-235b-a22b-fp8` |
|
|
199
|
-
| `llmgateway/qwen3-235b-a22b-instruct-2507` |
|
|
200
|
-
| `llmgateway/qwen3-235b-a22b-thinking-2507` |
|
|
201
|
-
| `llmgateway/qwen3-30b-a3b-fp8` |
|
|
202
|
-
| `llmgateway/qwen3-30b-a3b-instruct-2507` |
|
|
203
|
-
| `llmgateway/qwen3-30b-a3b-thinking-2507` |
|
|
204
|
-
| `llmgateway/qwen3-32b` |
|
|
205
|
-
| `llmgateway/qwen3-32b-fp8` |
|
|
206
|
-
| `llmgateway/qwen3-4b-fp8` |
|
|
207
|
-
| `llmgateway/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.
|
|
208
|
-
| `llmgateway/qwen3-coder-480b-a35b-instruct` | 262K | | | | | | $
|
|
180
|
+
| `llmgateway/qwen-vl-plus` | 131K | | | | | | $0.21 | $0.63 |
|
|
181
|
+
| `llmgateway/qwen2-5-vl-32b-instruct` | 131K | | | | | | $0.30 | $0.30 |
|
|
182
|
+
| `llmgateway/qwen2-5-vl-72b-instruct` | 131K | | | | | | $3 | $8 |
|
|
183
|
+
| `llmgateway/qwen25-coder-7b` | 131K | | | | | | $0.05 | $0.05 |
|
|
184
|
+
| `llmgateway/qwen3-235b-a22b-fp8` | 131K | | | | | | $0.50 | $3 |
|
|
185
|
+
| `llmgateway/qwen3-235b-a22b-instruct-2507` | 131K | | | | | | $0.80 | $2 |
|
|
186
|
+
| `llmgateway/qwen3-235b-a22b-thinking-2507` | 131K | | | | | | $0.80 | $2 |
|
|
187
|
+
| `llmgateway/qwen3-30b-a3b-fp8` | 131K | | | | | | $0.10 | $0.10 |
|
|
188
|
+
| `llmgateway/qwen3-30b-a3b-instruct-2507` | 131K | | | | | | $0.10 | $0.10 |
|
|
189
|
+
| `llmgateway/qwen3-30b-a3b-thinking-2507` | 131K | | | | | | $0.10 | $0.10 |
|
|
190
|
+
| `llmgateway/qwen3-32b` | 131K | | | | | | $0.70 | $3 |
|
|
191
|
+
| `llmgateway/qwen3-32b-fp8` | 131K | | | | | | $0.10 | $0.10 |
|
|
192
|
+
| `llmgateway/qwen3-4b-fp8` | 131K | | | | | | $0.03 | $0.05 |
|
|
193
|
+
| `llmgateway/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.45 | $2 |
|
|
194
|
+
| `llmgateway/qwen3-coder-480b-a35b-instruct` | 262K | | | | | | $2 | $8 |
|
|
209
195
|
| `llmgateway/qwen3-coder-flash` | 1.0M | | | | | | $0.30 | $2 |
|
|
210
|
-
| `llmgateway/qwen3-coder-next` | 262K | | | | | | $0.
|
|
211
|
-
| `llmgateway/qwen3-coder-plus` | 1.0M | | | | | | $
|
|
212
|
-
| `llmgateway/qwen3-max` |
|
|
213
|
-
| `llmgateway/qwen3-max-2026-01-23` |
|
|
214
|
-
| `llmgateway/qwen3-next-80b-a3b-instruct` |
|
|
196
|
+
| `llmgateway/qwen3-coder-next` | 262K | | | | | | $0.80 | $4 |
|
|
197
|
+
| `llmgateway/qwen3-coder-plus` | 1.0M | | | | | | $1 | $5 |
|
|
198
|
+
| `llmgateway/qwen3-max` | 262K | | | | | | $1 | $6 |
|
|
199
|
+
| `llmgateway/qwen3-max-2026-01-23` | 256K | | | | | | $3 | $15 |
|
|
200
|
+
| `llmgateway/qwen3-next-80b-a3b-instruct` | 131K | | | | | | $0.50 | $2 |
|
|
215
201
|
| `llmgateway/qwen3-next-80b-a3b-thinking` | 131K | | | | | | $0.50 | $6 |
|
|
216
|
-
| `llmgateway/qwen3-vl-235b-a22b-instruct` | 131K | | | | | | $0.
|
|
217
|
-
| `llmgateway/qwen3-vl-235b-a22b-thinking` | 131K | | | | | | $0.
|
|
218
|
-
| `llmgateway/qwen3-vl-30b-a3b-instruct` | 131K | | | | | | $0.
|
|
219
|
-
| `llmgateway/qwen3-vl-30b-a3b-thinking` | 131K | | | | | | $0.
|
|
220
|
-
| `llmgateway/qwen3-vl-8b-instruct` | 131K | | | | | | $0.
|
|
221
|
-
| `llmgateway/qwen3-vl-flash` |
|
|
202
|
+
| `llmgateway/qwen3-vl-235b-a22b-instruct` | 131K | | | | | | $0.80 | $2 |
|
|
203
|
+
| `llmgateway/qwen3-vl-235b-a22b-thinking` | 131K | | | | | | $0.80 | $2 |
|
|
204
|
+
| `llmgateway/qwen3-vl-30b-a3b-instruct` | 131K | | | | | | $0.10 | $0.10 |
|
|
205
|
+
| `llmgateway/qwen3-vl-30b-a3b-thinking` | 131K | | | | | | $0.10 | $0.10 |
|
|
206
|
+
| `llmgateway/qwen3-vl-8b-instruct` | 131K | | | | | | $0.10 | $0.10 |
|
|
207
|
+
| `llmgateway/qwen3-vl-flash` | 1.0M | | | | | | $0.05 | $0.40 |
|
|
222
208
|
| `llmgateway/qwen3-vl-plus` | 262K | | | | | | $0.20 | $2 |
|
|
223
209
|
| `llmgateway/qwen35-397b-a17b` | 262K | | | | | | $0.60 | $4 |
|
|
224
210
|
| `llmgateway/qwq-plus` | 131K | | | | | | $0.80 | $2 |
|
|
@@ -226,13 +212,9 @@ for await (const chunk of stream) {
|
|
|
226
212
|
| `llmgateway/seed-1-6-250915` | 256K | | | | | | $0.25 | $2 |
|
|
227
213
|
| `llmgateway/seed-1-6-flash-250715` | 256K | | | | | | $0.07 | $0.30 |
|
|
228
214
|
| `llmgateway/seed-1-8-251228` | 256K | | | | | | $0.25 | $2 |
|
|
229
|
-
| `llmgateway/
|
|
230
|
-
| `llmgateway/seedream-4-5` | 2K | | | | | | — | — |
|
|
231
|
-
| `llmgateway/sonar` | 130K | | | | | | $1 | $1 |
|
|
215
|
+
| `llmgateway/sonar` | 128K | | | | | | $1 | $1 |
|
|
232
216
|
| `llmgateway/sonar-pro` | 200K | | | | | | $3 | $15 |
|
|
233
217
|
| `llmgateway/sonar-reasoning-pro` | 128K | | | | | | $2 | $8 |
|
|
234
|
-
| `llmgateway/veo-3.1-fast-generate-preview` | 33K | | | | | | — | — |
|
|
235
|
-
| `llmgateway/veo-3.1-generate-preview` | 33K | | | | | | — | — |
|
|
236
218
|
|
|
237
219
|
## Advanced configuration
|
|
238
220
|
|
|
@@ -262,7 +244,7 @@ const agent = new Agent({
|
|
|
262
244
|
model: ({ requestContext }) => {
|
|
263
245
|
const useAdvanced = requestContext.task === "complex";
|
|
264
246
|
return useAdvanced
|
|
265
|
-
? "llmgateway/
|
|
247
|
+
? "llmgateway/sonar-reasoning-pro"
|
|
266
248
|
: "llmgateway/auto";
|
|
267
249
|
}
|
|
268
250
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Moonshot AI (China)
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 7 Moonshot AI (China) models through Mastra's model router. Authentication is handled automatically using the `MOONSHOT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Moonshot AI (China) documentation](https://platform.moonshot.cn).
|
|
6
6
|
|
|
@@ -40,6 +40,7 @@ for await (const chunk of stream) {
|
|
|
40
40
|
| `moonshotai-cn/kimi-k2-thinking-turbo` | 262K | | | | | | $1 | $8 |
|
|
41
41
|
| `moonshotai-cn/kimi-k2-turbo-preview` | 262K | | | | | | $2 | $10 |
|
|
42
42
|
| `moonshotai-cn/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
43
|
+
| `moonshotai-cn/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
43
44
|
|
|
44
45
|
## Advanced configuration
|
|
45
46
|
|
|
@@ -69,7 +70,7 @@ const agent = new Agent({
|
|
|
69
70
|
model: ({ requestContext }) => {
|
|
70
71
|
const useAdvanced = requestContext.task === "complex";
|
|
71
72
|
return useAdvanced
|
|
72
|
-
? "moonshotai-cn/kimi-k2.
|
|
73
|
+
? "moonshotai-cn/kimi-k2.6"
|
|
73
74
|
: "moonshotai-cn/kimi-k2-0711-preview";
|
|
74
75
|
}
|
|
75
76
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Moonshot AI
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 7 Moonshot AI models through Mastra's model router. Authentication is handled automatically using the `MOONSHOT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Moonshot AI documentation](https://platform.moonshot.ai).
|
|
6
6
|
|
|
@@ -40,6 +40,7 @@ for await (const chunk of stream) {
|
|
|
40
40
|
| `moonshotai/kimi-k2-thinking-turbo` | 262K | | | | | | $1 | $8 |
|
|
41
41
|
| `moonshotai/kimi-k2-turbo-preview` | 262K | | | | | | $2 | $10 |
|
|
42
42
|
| `moonshotai/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
43
|
+
| `moonshotai/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
43
44
|
|
|
44
45
|
## Advanced configuration
|
|
45
46
|
|
|
@@ -69,7 +70,7 @@ const agent = new Agent({
|
|
|
69
70
|
model: ({ requestContext }) => {
|
|
70
71
|
const useAdvanced = requestContext.task === "complex";
|
|
71
72
|
return useAdvanced
|
|
72
|
-
? "moonshotai/kimi-k2.
|
|
73
|
+
? "moonshotai/kimi-k2.6"
|
|
73
74
|
: "moonshotai/kimi-k2-0711-preview";
|
|
74
75
|
}
|
|
75
76
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# NanoGPT
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 525 NanoGPT models through Mastra's model router. Authentication is handled automatically using the `NANO_GPT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [NanoGPT documentation](https://docs.nano-gpt.com).
|
|
6
6
|
|
|
@@ -39,6 +39,7 @@ for await (const chunk of stream) {
|
|
|
39
39
|
| `nano-gpt/aion-labs/aion-1.0-mini` | 131K | | | | | | $0.80 | $1 |
|
|
40
40
|
| `nano-gpt/aion-labs/aion-rp-llama-3.1-8b` | 33K | | | | | | $0.20 | $0.20 |
|
|
41
41
|
| `nano-gpt/Alibaba-NLP/Tongyi-DeepResearch-30B-A3B` | 128K | | | | | | $0.08 | $0.24 |
|
|
42
|
+
| `nano-gpt/alibaba/qwen3.6-flash` | 992K | | | | | | $0.19 | $1 |
|
|
42
43
|
| `nano-gpt/allenai/molmo-2-8b` | 37K | | | | | | $0.20 | $0.20 |
|
|
43
44
|
| `nano-gpt/allenai/olmo-3-32b-think` | 128K | | | | | | $0.30 | $0.45 |
|
|
44
45
|
| `nano-gpt/allenai/olmo-3.1-32b-instruct` | 66K | | | | | | $0.20 | $0.60 |
|
|
@@ -367,6 +368,8 @@ for await (const chunk of stream) {
|
|
|
367
368
|
| `nano-gpt/moonshotai/kimi-k2-thinking-turbo-original` | 256K | | | | | | $1 | $8 |
|
|
368
369
|
| `nano-gpt/moonshotai/kimi-k2.5` | 256K | | | | | | $0.30 | $2 |
|
|
369
370
|
| `nano-gpt/moonshotai/kimi-k2.5:thinking` | 256K | | | | | | $0.30 | $2 |
|
|
371
|
+
| `nano-gpt/moonshotai/kimi-k2.6` | 256K | | | | | | $0.53 | $3 |
|
|
372
|
+
| `nano-gpt/moonshotai/kimi-k2.6:thinking` | 256K | | | | | | $0.53 | $3 |
|
|
370
373
|
| `nano-gpt/NeverSleep/Llama-3-Lumimaid-70B-v0.1` | 16K | | | | | | $2 | $2 |
|
|
371
374
|
| `nano-gpt/NeverSleep/Lumimaid-v0.2-70B` | 16K | | | | | | $1 | $2 |
|
|
372
375
|
| `nano-gpt/nex-agi/deepseek-v3.1-nex-n1` | 128K | | | | | | $0.28 | $0.42 |
|
|
@@ -432,12 +435,15 @@ for await (const chunk of stream) {
|
|
|
432
435
|
| `nano-gpt/phi-4-mini-instruct` | 128K | | | | | | $0.17 | $0.68 |
|
|
433
436
|
| `nano-gpt/phi-4-multimodal-instruct` | 128K | | | | | | $0.07 | $0.11 |
|
|
434
437
|
| `nano-gpt/qvq-max` | 128K | | | | | | $1 | $5 |
|
|
438
|
+
| `nano-gpt/qwen-3.6-plus` | 992K | | | | | | $0.45 | $3 |
|
|
435
439
|
| `nano-gpt/qwen-image` | — | | | | | | — | — |
|
|
436
440
|
| `nano-gpt/qwen-long` | 10.0M | | | | | | $0.10 | $0.41 |
|
|
437
441
|
| `nano-gpt/qwen-max` | 32K | | | | | | $2 | $6 |
|
|
438
442
|
| `nano-gpt/qwen-plus` | 996K | | | | | | $0.40 | $1 |
|
|
439
443
|
| `nano-gpt/qwen-turbo` | 1.0M | | | | | | $0.05 | $0.20 |
|
|
440
444
|
| `nano-gpt/qwen/qwen3.5-397b-a17b` | 258K | | | | | | $0.60 | $4 |
|
|
445
|
+
| `nano-gpt/qwen/Qwen3.6-35B-A3B` | 262K | | | | | | $0.29 | $2 |
|
|
446
|
+
| `nano-gpt/qwen/Qwen3.6-35B-A3B:thinking` | 262K | | | | | | $0.29 | $2 |
|
|
441
447
|
| `nano-gpt/Qwen2.5-32B-EVA-v0.2` | 25K | | | | | | $0.49 | $0.49 |
|
|
442
448
|
| `nano-gpt/qwen25-vl-72b-instruct` | 32K | | | | | | $0.70 | $0.70 |
|
|
443
449
|
| `nano-gpt/qwen3-30b-a3b-instruct-2507` | 256K | | | | | | $0.20 | $0.50 |
|
|
@@ -445,6 +451,7 @@ for await (const chunk of stream) {
|
|
|
445
451
|
| `nano-gpt/qwen3-max-2026-01-23` | 256K | | | | | | $1 | $6 |
|
|
446
452
|
| `nano-gpt/qwen3-vl-235b-a22b-instruct-original` | 33K | | | | | | $0.50 | $1 |
|
|
447
453
|
| `nano-gpt/qwen3-vl-235b-a22b-thinking` | 33K | | | | | | $0.50 | $6 |
|
|
454
|
+
| `nano-gpt/qwen3.6-max-preview` | 246K | | | | | | $1 | $8 |
|
|
448
455
|
| `nano-gpt/qwq-32b` | 128K | | | | | | $0.26 | $0.30 |
|
|
449
456
|
| `nano-gpt/QwQ-32B-ArliAI-RpR-v1` | 33K | | | | | | $0.20 | $0.20 |
|
|
450
457
|
| `nano-gpt/raifle/sorcererlm-8x22b` | 16K | | | | | | $5 | $5 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Nvidia
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 77 Nvidia models through Mastra's model router. Authentication is handled automatically using the `NVIDIA_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Nvidia documentation](https://docs.api.nvidia.com/nim/).
|
|
6
6
|
|
|
@@ -108,6 +108,7 @@ for await (const chunk of stream) {
|
|
|
108
108
|
| `nvidia/qwen/qwen3.5-397b-a17b` | 262K | | | | | | — | — |
|
|
109
109
|
| `nvidia/qwen/qwq-32b` | 128K | | | | | | — | — |
|
|
110
110
|
| `nvidia/stepfun-ai/step-3.5-flash` | 256K | | | | | | — | — |
|
|
111
|
+
| `nvidia/z-ai/glm-5.1` | 131K | | | | | | — | — |
|
|
111
112
|
| `nvidia/z-ai/glm4.7` | 205K | | | | | | — | — |
|
|
112
113
|
| `nvidia/z-ai/glm5` | 203K | | | | | | — | — |
|
|
113
114
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Ollama Cloud
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 37 Ollama Cloud models through Mastra's model router. Authentication is handled automatically using the `OLLAMA_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Ollama Cloud documentation](https://docs.ollama.com/cloud).
|
|
6
6
|
|
|
@@ -53,6 +53,7 @@ for await (const chunk of stream) {
|
|
|
53
53
|
| `ollama-cloud/kimi-k2-thinking` | 262K | | | | | | — | — |
|
|
54
54
|
| `ollama-cloud/kimi-k2:1t` | 262K | | | | | | — | — |
|
|
55
55
|
| `ollama-cloud/kimi-k2.5` | 262K | | | | | | — | — |
|
|
56
|
+
| `ollama-cloud/kimi-k2.6:cloud` | 262K | | | | | | — | — |
|
|
56
57
|
| `ollama-cloud/minimax-m2` | 205K | | | | | | — | — |
|
|
57
58
|
| `ollama-cloud/minimax-m2.1` | 205K | | | | | | — | — |
|
|
58
59
|
| `ollama-cloud/minimax-m2.5` | 205K | | | | | | — | — |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenAI
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 50 OpenAI models through Mastra's model router. Authentication is handled automatically using the `OPENAI_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenAI documentation](https://platform.openai.com/docs/models).
|
|
6
6
|
|
|
@@ -33,7 +33,6 @@ for await (const chunk of stream) {
|
|
|
33
33
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
34
34
|
| ------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
35
35
|
| `openai/chatgpt-image-latest` | — | | | | | | — | — |
|
|
36
|
-
| `openai/codex-mini-latest` | 200K | | | | | | $2 | $6 |
|
|
37
36
|
| `openai/gpt-3.5-turbo` | 16K | | | | | | $0.50 | $2 |
|
|
38
37
|
| `openai/gpt-4` | 8K | | | | | | $30 | $60 |
|
|
39
38
|
| `openai/gpt-4-turbo` | 128K | | | | | | $10 | $30 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenCode Go
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 10 OpenCode Go models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenCode Go documentation](https://opencode.ai/docs/zen).
|
|
6
6
|
|
|
@@ -37,6 +37,7 @@ for await (const chunk of stream) {
|
|
|
37
37
|
| `opencode-go/glm-5` | 205K | | | | | | $1 | $3 |
|
|
38
38
|
| `opencode-go/glm-5.1` | 205K | | | | | | $1 | $4 |
|
|
39
39
|
| `opencode-go/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
40
|
+
| `opencode-go/kimi-k2.6` | 262K | | | | | | $0.32 | $1 |
|
|
40
41
|
| `opencode-go/mimo-v2-omni` | 262K | | | | | | $0.40 | $2 |
|
|
41
42
|
| `opencode-go/mimo-v2-pro` | 1.0M | | | | | | $1 | $3 |
|
|
42
43
|
| `opencode-go/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenCode Zen
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 38 OpenCode Zen models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenCode Zen documentation](https://opencode.ai/docs/zen).
|
|
6
6
|
|
|
@@ -64,8 +64,11 @@ for await (const chunk of stream) {
|
|
|
64
64
|
| `opencode/gpt-5.4-nano` | 400K | | | | | | $0.20 | $1 |
|
|
65
65
|
| `opencode/gpt-5.4-pro` | 1.1M | | | | | | $30 | $180 |
|
|
66
66
|
| `opencode/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
67
|
+
| `opencode/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
68
|
+
| `opencode/ling-2.6-flash-free` | 262K | | | | | | — | — |
|
|
67
69
|
| `opencode/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
68
70
|
| `opencode/minimax-m2.5-free` | 205K | | | | | | — | — |
|
|
71
|
+
| `opencode/minimax-m2.7` | 205K | | | | | | $0.30 | $1 |
|
|
69
72
|
| `opencode/nemotron-3-super-free` | 205K | | | | | | — | — |
|
|
70
73
|
| `opencode/qwen3.5-plus` | 262K | | | | | | $0.20 | $1 |
|
|
71
74
|
| `opencode/qwen3.6-plus` | 262K | | | | | | $0.50 | $3 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OVHcloud AI Endpoints
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 10 OVHcloud AI Endpoints models through Mastra's model router. Authentication is handled automatically using the `OVHCLOUD_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OVHcloud AI Endpoints documentation](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/).
|
|
6
6
|
|
|
@@ -15,7 +15,7 @@ const agent = new Agent({
|
|
|
15
15
|
id: "my-agent",
|
|
16
16
|
name: "My Agent",
|
|
17
17
|
instructions: "You are a helpful assistant",
|
|
18
|
-
model: "ovhcloud/
|
|
18
|
+
model: "ovhcloud/gpt-oss-120b"
|
|
19
19
|
});
|
|
20
20
|
|
|
21
21
|
// Generate a response
|
|
@@ -34,7 +34,6 @@ for await (const chunk of stream) {
|
|
|
34
34
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| ---------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
-
| `ovhcloud/deepseek-r1-distill-llama-70b` | 131K | | | | | | $0.74 | $0.74 |
|
|
38
37
|
| `ovhcloud/gpt-oss-120b` | 131K | | | | | | $0.09 | $0.47 |
|
|
39
38
|
| `ovhcloud/gpt-oss-20b` | 131K | | | | | | $0.05 | $0.18 |
|
|
40
39
|
| `ovhcloud/llama-3.1-8b-instruct` | 131K | | | | | | $0.11 | $0.11 |
|
|
@@ -42,8 +41,6 @@ for await (const chunk of stream) {
|
|
|
42
41
|
| `ovhcloud/mistral-7b-instruct-v0.3` | 66K | | | | | | $0.11 | $0.11 |
|
|
43
42
|
| `ovhcloud/mistral-nemo-instruct-2407` | 66K | | | | | | $0.14 | $0.14 |
|
|
44
43
|
| `ovhcloud/mistral-small-3.2-24b-instruct-2506` | 131K | | | | | | $0.10 | $0.31 |
|
|
45
|
-
| `ovhcloud/mixtral-8x7b-instruct-v0.1` | 33K | | | | | | $0.70 | $0.70 |
|
|
46
|
-
| `ovhcloud/qwen2.5-coder-32b-instruct` | 33K | | | | | | $0.96 | $0.96 |
|
|
47
44
|
| `ovhcloud/qwen2.5-vl-72b-instruct` | 33K | | | | | | $1 | $1 |
|
|
48
45
|
| `ovhcloud/qwen3-32b` | 33K | | | | | | $0.09 | $0.25 |
|
|
49
46
|
| `ovhcloud/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.07 | $0.26 |
|
|
@@ -58,7 +55,7 @@ const agent = new Agent({
|
|
|
58
55
|
name: "custom-agent",
|
|
59
56
|
model: {
|
|
60
57
|
url: "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1",
|
|
61
|
-
id: "ovhcloud/
|
|
58
|
+
id: "ovhcloud/gpt-oss-120b",
|
|
62
59
|
apiKey: process.env.OVHCLOUD_API_KEY,
|
|
63
60
|
headers: {
|
|
64
61
|
"X-Custom-Header": "value"
|
|
@@ -77,7 +74,7 @@ const agent = new Agent({
|
|
|
77
74
|
const useAdvanced = requestContext.task === "complex";
|
|
78
75
|
return useAdvanced
|
|
79
76
|
? "ovhcloud/qwen3-coder-30b-a3b-instruct"
|
|
80
|
-
: "ovhcloud/
|
|
77
|
+
: "ovhcloud/gpt-oss-120b";
|
|
81
78
|
}
|
|
82
79
|
});
|
|
83
80
|
```
|