@mastra/mcp-docs-server 1.1.26-alpha.6 → 1.1.26
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.docs/docs/agents/structured-output.md +22 -0
- package/.docs/docs/agents/supervisor-agents.md +18 -0
- package/.docs/docs/editor/overview.md +69 -0
- package/.docs/docs/memory/observational-memory.md +4 -0
- package/.docs/docs/memory/storage.md +1 -0
- package/.docs/docs/observability/tracing/exporters/langfuse.md +31 -0
- package/.docs/guides/deployment/netlify.md +16 -1
- package/.docs/guides/getting-started/next-js.md +0 -4
- package/.docs/guides/migrations/mastra-cloud.md +128 -3
- package/.docs/models/gateways/netlify.md +2 -2
- package/.docs/models/gateways/openrouter.md +3 -1
- package/.docs/models/gateways/vercel.md +4 -1
- package/.docs/models/index.md +36 -1
- package/.docs/models/providers/302ai.md +32 -1
- package/.docs/models/providers/alibaba-cn.md +2 -1
- package/.docs/models/providers/anthropic.md +2 -1
- package/.docs/models/providers/berget.md +9 -12
- package/.docs/models/providers/cloudflare-workers-ai.md +2 -1
- package/.docs/models/providers/cortecs.md +4 -1
- package/.docs/models/providers/deepinfra.md +4 -1
- package/.docs/models/providers/digitalocean.md +116 -0
- package/.docs/models/providers/fireworks-ai.md +2 -1
- package/.docs/models/providers/firmware.md +2 -3
- package/.docs/models/providers/helicone.md +1 -2
- package/.docs/models/providers/huggingface.md +2 -1
- package/.docs/models/providers/kilo.md +2 -1
- package/.docs/models/providers/kimi-for-coding.md +2 -1
- package/.docs/models/providers/llmgateway.md +59 -77
- package/.docs/models/providers/moonshotai-cn.md +3 -2
- package/.docs/models/providers/moonshotai.md +3 -2
- package/.docs/models/providers/nano-gpt.md +8 -1
- package/.docs/models/providers/nvidia.md +2 -1
- package/.docs/models/providers/ollama-cloud.md +2 -1
- package/.docs/models/providers/openai.md +1 -2
- package/.docs/models/providers/opencode-go.md +2 -1
- package/.docs/models/providers/opencode.md +5 -1
- package/.docs/models/providers/ovhcloud.md +4 -7
- package/.docs/models/providers/poe.md +2 -1
- package/.docs/models/providers/tencent-token-plan.md +71 -0
- package/.docs/models/providers/tencent-tokenhub.md +71 -0
- package/.docs/models/providers/wafer.ai.md +72 -0
- package/.docs/models/providers/zenmux.md +3 -1
- package/.docs/models/providers.md +4 -0
- package/.docs/reference/agents/generate.md +8 -0
- package/.docs/reference/client-js/workflows.md +12 -0
- package/.docs/reference/core/mastra-class.md +9 -1
- package/.docs/reference/deployer/cloudflare.md +14 -1
- package/.docs/reference/deployer/netlify.md +50 -2
- package/.docs/reference/harness/harness-class.md +72 -49
- package/.docs/reference/index.md +3 -0
- package/.docs/reference/observability/tracing/exporters/langfuse.md +2 -0
- package/.docs/reference/processors/prefill-error-handler.md +5 -5
- package/.docs/reference/storage/cloudflare-d1.md +42 -42
- package/.docs/reference/storage/redis.md +266 -0
- package/.docs/reference/streaming/agents/stream.md +8 -0
- package/.docs/reference/streaming/workflows/resumeStream.md +2 -0
- package/.docs/reference/tools/tavily.md +307 -0
- package/.docs/reference/workflows/run-methods/resume.md +24 -0
- package/.docs/reference/workflows/workflow-methods/foreach.md +14 -1
- package/.docs/reference/workspace/docker-sandbox.md +196 -0
- package/CHANGELOG.md +78 -0
- package/package.json +10 -10
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# LLM Gateway
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 181 LLM Gateway models through Mastra's model router. Authentication is handled automatically using the `LLMGATEWAY_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [LLM Gateway documentation](https://llmgateway.io/docs).
|
|
6
6
|
|
|
@@ -35,11 +35,9 @@ for await (const chunk of stream) {
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| -------------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
37
|
| `llmgateway/auto` | 128K | | | | | | — | — |
|
|
38
|
-
| `llmgateway/claude-3-5-sonnet`
|
|
38
|
+
| `llmgateway/claude-3-5-sonnet-20241022` | 200K | | | | | | $3 | $15 |
|
|
39
39
|
| `llmgateway/claude-3-7-sonnet` | 200K | | | | | | $3 | $15 |
|
|
40
40
|
| `llmgateway/claude-3-7-sonnet-20250219` | 200K | | | | | | $3 | $15 |
|
|
41
|
-
| `llmgateway/claude-3-haiku` | 200K | | | | | | $0.25 | $1 |
|
|
42
|
-
| `llmgateway/claude-3-haiku-20240307` | 200K | | | | | | $0.25 | $1 |
|
|
43
41
|
| `llmgateway/claude-3-opus` | 200K | | | | | | $15 | $75 |
|
|
44
42
|
| `llmgateway/claude-haiku-4-5` | 200K | | | | | | $1 | $5 |
|
|
45
43
|
| `llmgateway/claude-haiku-4-5-20251001` | 200K | | | | | | $1 | $5 |
|
|
@@ -47,53 +45,51 @@ for await (const chunk of stream) {
|
|
|
47
45
|
| `llmgateway/claude-opus-4-20250514` | 200K | | | | | | $15 | $75 |
|
|
48
46
|
| `llmgateway/claude-opus-4-5-20251101` | 200K | | | | | | $5 | $25 |
|
|
49
47
|
| `llmgateway/claude-opus-4-6` | 1.0M | | | | | | $5 | $25 |
|
|
48
|
+
| `llmgateway/claude-opus-4-7` | 1.0M | | | | | | $5 | $25 |
|
|
50
49
|
| `llmgateway/claude-sonnet-4-20250514` | 200K | | | | | | $3 | $15 |
|
|
51
50
|
| `llmgateway/claude-sonnet-4-5` | 200K | | | | | | $3 | $15 |
|
|
52
51
|
| `llmgateway/claude-sonnet-4-5-20250929` | 200K | | | | | | $3 | $15 |
|
|
53
|
-
| `llmgateway/claude-sonnet-4-6` |
|
|
52
|
+
| `llmgateway/claude-sonnet-4-6` | 1.0M | | | | | | $3 | $15 |
|
|
54
53
|
| `llmgateway/codestral-2508` | 256K | | | | | | $0.30 | $0.90 |
|
|
55
|
-
| `llmgateway/cogview-4` | 2K | | | | | | — | — |
|
|
56
54
|
| `llmgateway/custom` | 128K | | | | | | — | — |
|
|
57
55
|
| `llmgateway/deepseek-r1-0528` | 64K | | | | | | $0.80 | $2 |
|
|
58
56
|
| `llmgateway/deepseek-v3.1` | 128K | | | | | | $0.56 | $2 |
|
|
59
57
|
| `llmgateway/deepseek-v3.2` | 164K | | | | | | $0.28 | $0.42 |
|
|
60
58
|
| `llmgateway/devstral-2512` | 262K | | | | | | $0.40 | $2 |
|
|
61
|
-
| `llmgateway/devstral-small-2507` |
|
|
59
|
+
| `llmgateway/devstral-small-2507` | 128K | | | | | | $0.10 | $0.30 |
|
|
60
|
+
| `llmgateway/gemini-2.0-flash` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
61
|
+
| `llmgateway/gemini-2.0-flash-lite` | 1.0M | | | | | | $0.07 | $0.30 |
|
|
62
62
|
| `llmgateway/gemini-2.5-flash` | 1.0M | | | | | | $0.30 | $3 |
|
|
63
|
-
| `llmgateway/gemini-2.5-flash-image` | 33K | | | | | | $0.30 | $30 |
|
|
64
|
-
| `llmgateway/gemini-2.5-flash-image-preview` | 33K | | | | | | $0.30 | $3 |
|
|
65
63
|
| `llmgateway/gemini-2.5-flash-lite` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
66
64
|
| `llmgateway/gemini-2.5-flash-lite-preview-09-2025` | 1.0M | | | | | | $0.10 | $0.40 |
|
|
67
65
|
| `llmgateway/gemini-2.5-pro` | 1.0M | | | | | | $1 | $10 |
|
|
68
66
|
| `llmgateway/gemini-3-flash-preview` | 1.0M | | | | | | $0.50 | $3 |
|
|
69
|
-
| `llmgateway/gemini-3-pro-image-preview` | 66K | | | | | | $2 | $12 |
|
|
70
|
-
| `llmgateway/gemini-3.1-flash-image-preview` | 66K | | | | | | $0.25 | $2 |
|
|
71
67
|
| `llmgateway/gemini-3.1-flash-lite-preview` | 1.0M | | | | | | $0.25 | $2 |
|
|
72
68
|
| `llmgateway/gemini-3.1-pro-preview` | 1.0M | | | | | | $2 | $12 |
|
|
73
69
|
| `llmgateway/gemini-pro-latest` | 1.0M | | | | | | $2 | $12 |
|
|
74
70
|
| `llmgateway/gemma-2-27b-it-together` | 8K | | | | | | $0.08 | $0.08 |
|
|
75
|
-
| `llmgateway/gemma-3-12b-it` |
|
|
71
|
+
| `llmgateway/gemma-3-12b-it` | 33K | | | | | | — | — |
|
|
76
72
|
| `llmgateway/gemma-3-1b-it` | 1.0M | | | | | | $0.08 | $0.30 |
|
|
77
73
|
| `llmgateway/gemma-3-27b` | 128K | | | | | | $0.27 | $0.27 |
|
|
78
|
-
| `llmgateway/gemma-3-4b-it` |
|
|
79
|
-
| `llmgateway/gemma-3n-e2b-it` |
|
|
80
|
-
| `llmgateway/gemma-3n-e4b-it` |
|
|
74
|
+
| `llmgateway/gemma-3-4b-it` | 33K | | | | | | — | — |
|
|
75
|
+
| `llmgateway/gemma-3n-e2b-it` | 8K | | | | | | — | — |
|
|
76
|
+
| `llmgateway/gemma-3n-e4b-it` | 8K | | | | | | — | — |
|
|
81
77
|
| `llmgateway/glm-4-32b-0414-128k` | 128K | | | | | | $0.10 | $0.10 |
|
|
82
|
-
| `llmgateway/glm-4.5` |
|
|
83
|
-
| `llmgateway/glm-4.5-air` |
|
|
78
|
+
| `llmgateway/glm-4.5` | 131K | | | | | | $0.60 | $2 |
|
|
79
|
+
| `llmgateway/glm-4.5-air` | 131K | | | | | | $0.20 | $1 |
|
|
84
80
|
| `llmgateway/glm-4.5-airx` | 128K | | | | | | $1 | $5 |
|
|
85
|
-
| `llmgateway/glm-4.5-flash` |
|
|
81
|
+
| `llmgateway/glm-4.5-flash` | 131K | | | | | | — | — |
|
|
86
82
|
| `llmgateway/glm-4.5-x` | 128K | | | | | | $2 | $9 |
|
|
87
|
-
| `llmgateway/glm-4.5v` |
|
|
88
|
-
| `llmgateway/glm-4.6` |
|
|
83
|
+
| `llmgateway/glm-4.5v` | 64K | | | | | | $0.60 | $2 |
|
|
84
|
+
| `llmgateway/glm-4.6` | 205K | | | | | | $0.60 | $2 |
|
|
89
85
|
| `llmgateway/glm-4.6v` | 128K | | | | | | $0.30 | $0.90 |
|
|
90
86
|
| `llmgateway/glm-4.6v-flash` | 128K | | | | | | — | — |
|
|
91
87
|
| `llmgateway/glm-4.6v-flashx` | 128K | | | | | | $0.04 | $0.40 |
|
|
92
|
-
| `llmgateway/glm-4.7` |
|
|
88
|
+
| `llmgateway/glm-4.7` | 205K | | | | | | $0.60 | $2 |
|
|
93
89
|
| `llmgateway/glm-4.7-flash` | 200K | | | | | | — | — |
|
|
94
90
|
| `llmgateway/glm-4.7-flashx` | 200K | | | | | | $0.07 | $0.40 |
|
|
95
|
-
| `llmgateway/glm-5` |
|
|
96
|
-
| `llmgateway/glm-
|
|
91
|
+
| `llmgateway/glm-5` | 205K | | | | | | $1 | $3 |
|
|
92
|
+
| `llmgateway/glm-5.1` | 200K | | | | | | $6 | $24 |
|
|
97
93
|
| `llmgateway/gpt-3.5-turbo` | 16K | | | | | | $0.50 | $2 |
|
|
98
94
|
| `llmgateway/gpt-4` | 8K | | | | | | $30 | $60 |
|
|
99
95
|
| `llmgateway/gpt-4-turbo` | 128K | | | | | | $10 | $30 |
|
|
@@ -132,13 +128,10 @@ for await (const chunk of stream) {
|
|
|
132
128
|
| `llmgateway/grok-4-1-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
133
129
|
| `llmgateway/grok-4-20-beta-0309-non-reasoning` | 2.0M | | | | | | $2 | $6 |
|
|
134
130
|
| `llmgateway/grok-4-20-beta-0309-reasoning` | 2.0M | | | | | | $2 | $6 |
|
|
135
|
-
| `llmgateway/grok-4-20-multi-agent-beta-0309` | 2.0M | | | | | | $2 | $6 |
|
|
136
131
|
| `llmgateway/grok-4-fast` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
137
132
|
| `llmgateway/grok-4-fast-non-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
138
133
|
| `llmgateway/grok-4-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
|
|
139
134
|
| `llmgateway/grok-code-fast-1` | 256K | | | | | | $0.20 | $2 |
|
|
140
|
-
| `llmgateway/grok-imagine-image` | 2K | | | | | | — | — |
|
|
141
|
-
| `llmgateway/grok-imagine-image-pro` | 2K | | | | | | — | — |
|
|
142
135
|
| `llmgateway/hermes-2-pro-llama-3-8b` | 8K | | | | | | $0.14 | $0.14 |
|
|
143
136
|
| `llmgateway/kimi-k2` | 131K | | | | | | $1 | $3 |
|
|
144
137
|
| `llmgateway/kimi-k2-thinking` | 262K | | | | | | $0.60 | $3 |
|
|
@@ -151,13 +144,13 @@ for await (const chunk of stream) {
|
|
|
151
144
|
| `llmgateway/llama-3.1-nemotron-ultra-253b` | 128K | | | | | | $0.60 | $2 |
|
|
152
145
|
| `llmgateway/llama-3.2-11b-instruct` | 128K | | | | | | $0.07 | $0.33 |
|
|
153
146
|
| `llmgateway/llama-3.2-3b-instruct` | 33K | | | | | | $0.03 | $0.05 |
|
|
154
|
-
| `llmgateway/llama-3.3-70b-instruct` | 128K | | | | | |
|
|
147
|
+
| `llmgateway/llama-3.3-70b-instruct` | 128K | | | | | | — | — |
|
|
155
148
|
| `llmgateway/llama-4-maverick-17b-instruct` | 8K | | | | | | $0.24 | $0.97 |
|
|
156
149
|
| `llmgateway/llama-4-scout` | 33K | | | | | | $0.18 | $0.59 |
|
|
157
150
|
| `llmgateway/llama-4-scout-17b-instruct` | 8K | | | | | | $0.17 | $0.66 |
|
|
158
|
-
| `llmgateway/
|
|
159
|
-
| `llmgateway/minimax-m2` | 197K | | | | | | $0.
|
|
160
|
-
| `llmgateway/minimax-m2.1` |
|
|
151
|
+
| `llmgateway/mimo-v2-flash` | 256K | | | | | | $0.10 | $0.30 |
|
|
152
|
+
| `llmgateway/minimax-m2` | 197K | | | | | | $0.30 | $1 |
|
|
153
|
+
| `llmgateway/minimax-m2.1` | 205K | | | | | | $0.30 | $1 |
|
|
161
154
|
| `llmgateway/minimax-m2.1-lightning` | 197K | | | | | | $0.12 | $0.48 |
|
|
162
155
|
| `llmgateway/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
163
156
|
| `llmgateway/minimax-m2.5-highspeed` | 205K | | | | | | $0.60 | $2 |
|
|
@@ -168,57 +161,50 @@ for await (const chunk of stream) {
|
|
|
168
161
|
| `llmgateway/ministral-3b-2512` | 131K | | | | | | $0.10 | $0.10 |
|
|
169
162
|
| `llmgateway/ministral-8b-2512` | 262K | | | | | | $0.15 | $0.15 |
|
|
170
163
|
| `llmgateway/mistral-large-2512` | 262K | | | | | | $0.50 | $2 |
|
|
171
|
-
| `llmgateway/mistral-large-latest` |
|
|
164
|
+
| `llmgateway/mistral-large-latest` | 262K | | | | | | $0.50 | $2 |
|
|
172
165
|
| `llmgateway/mistral-small-2506` | 128K | | | | | | $0.10 | $0.30 |
|
|
173
|
-
| `llmgateway/mixtral-8x7b-instruct-together` | 33K | | | | | | $0.06 | $0.06 |
|
|
174
166
|
| `llmgateway/o1` | 200K | | | | | | $15 | $60 |
|
|
175
167
|
| `llmgateway/o3` | 200K | | | | | | $2 | $8 |
|
|
176
168
|
| `llmgateway/o3-mini` | 200K | | | | | | $1 | $4 |
|
|
177
169
|
| `llmgateway/o4-mini` | 200K | | | | | | $1 | $4 |
|
|
178
|
-
| `llmgateway/pixtral-large-latest` | 128K | | | | | | $
|
|
179
|
-
| `llmgateway/qwen-coder-plus` | 131K | | | | | | $
|
|
170
|
+
| `llmgateway/pixtral-large-latest` | 128K | | | | | | $2 | $6 |
|
|
171
|
+
| `llmgateway/qwen-coder-plus` | 131K | | | | | | $0.50 | $1 |
|
|
180
172
|
| `llmgateway/qwen-flash` | 1.0M | | | | | | $0.05 | $0.40 |
|
|
181
|
-
| `llmgateway/qwen-
|
|
182
|
-
| `llmgateway/qwen-
|
|
183
|
-
| `llmgateway/qwen-
|
|
184
|
-
| `llmgateway/qwen-
|
|
185
|
-
| `llmgateway/qwen-
|
|
186
|
-
| `llmgateway/qwen-image-plus` | 2K | | | | | | — | — |
|
|
187
|
-
| `llmgateway/qwen-max` | 131K | | | | | | $2 | $6 |
|
|
188
|
-
| `llmgateway/qwen-max-latest` | 131K | | | | | | $2 | $6 |
|
|
189
|
-
| `llmgateway/qwen-omni-turbo` | 33K | | | | | | $0.20 | $0.80 |
|
|
190
|
-
| `llmgateway/qwen-plus` | 131K | | | | | | $0.40 | $1 |
|
|
191
|
-
| `llmgateway/qwen-plus-latest` | 1.0M | | | | | | $0.40 | $1 |
|
|
173
|
+
| `llmgateway/qwen-max` | 33K | | | | | | $2 | $6 |
|
|
174
|
+
| `llmgateway/qwen-max-latest` | 33K | | | | | | $2 | $6 |
|
|
175
|
+
| `llmgateway/qwen-omni-turbo` | 33K | | | | | | $0.07 | $0.27 |
|
|
176
|
+
| `llmgateway/qwen-plus` | 1.0M | | | | | | $0.40 | $1 |
|
|
177
|
+
| `llmgateway/qwen-plus-latest` | 131K | | | | | | $0.30 | $0.90 |
|
|
192
178
|
| `llmgateway/qwen-turbo` | 1.0M | | | | | | $0.05 | $0.20 |
|
|
193
179
|
| `llmgateway/qwen-vl-max` | 131K | | | | | | $0.80 | $3 |
|
|
194
|
-
| `llmgateway/qwen-vl-plus` | 131K | | | | | | $0.21 | $0.
|
|
195
|
-
| `llmgateway/qwen2-5-vl-32b-instruct` | 131K | | | | | | $
|
|
196
|
-
| `llmgateway/qwen2-5-vl-72b-instruct` |
|
|
197
|
-
| `llmgateway/qwen25-coder-7b` |
|
|
198
|
-
| `llmgateway/qwen3-235b-a22b-fp8` |
|
|
199
|
-
| `llmgateway/qwen3-235b-a22b-instruct-2507` |
|
|
200
|
-
| `llmgateway/qwen3-235b-a22b-thinking-2507` |
|
|
201
|
-
| `llmgateway/qwen3-30b-a3b-fp8` |
|
|
202
|
-
| `llmgateway/qwen3-30b-a3b-instruct-2507` |
|
|
203
|
-
| `llmgateway/qwen3-30b-a3b-thinking-2507` |
|
|
204
|
-
| `llmgateway/qwen3-32b` |
|
|
205
|
-
| `llmgateway/qwen3-32b-fp8` |
|
|
206
|
-
| `llmgateway/qwen3-4b-fp8` |
|
|
207
|
-
| `llmgateway/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.
|
|
208
|
-
| `llmgateway/qwen3-coder-480b-a35b-instruct` | 262K | | | | | | $
|
|
180
|
+
| `llmgateway/qwen-vl-plus` | 131K | | | | | | $0.21 | $0.63 |
|
|
181
|
+
| `llmgateway/qwen2-5-vl-32b-instruct` | 131K | | | | | | $0.30 | $0.30 |
|
|
182
|
+
| `llmgateway/qwen2-5-vl-72b-instruct` | 131K | | | | | | $3 | $8 |
|
|
183
|
+
| `llmgateway/qwen25-coder-7b` | 131K | | | | | | $0.05 | $0.05 |
|
|
184
|
+
| `llmgateway/qwen3-235b-a22b-fp8` | 131K | | | | | | $0.50 | $3 |
|
|
185
|
+
| `llmgateway/qwen3-235b-a22b-instruct-2507` | 131K | | | | | | $0.80 | $2 |
|
|
186
|
+
| `llmgateway/qwen3-235b-a22b-thinking-2507` | 131K | | | | | | $0.80 | $2 |
|
|
187
|
+
| `llmgateway/qwen3-30b-a3b-fp8` | 131K | | | | | | $0.10 | $0.10 |
|
|
188
|
+
| `llmgateway/qwen3-30b-a3b-instruct-2507` | 131K | | | | | | $0.10 | $0.10 |
|
|
189
|
+
| `llmgateway/qwen3-30b-a3b-thinking-2507` | 131K | | | | | | $0.10 | $0.10 |
|
|
190
|
+
| `llmgateway/qwen3-32b` | 131K | | | | | | $0.70 | $3 |
|
|
191
|
+
| `llmgateway/qwen3-32b-fp8` | 131K | | | | | | $0.10 | $0.10 |
|
|
192
|
+
| `llmgateway/qwen3-4b-fp8` | 131K | | | | | | $0.03 | $0.05 |
|
|
193
|
+
| `llmgateway/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.45 | $2 |
|
|
194
|
+
| `llmgateway/qwen3-coder-480b-a35b-instruct` | 262K | | | | | | $2 | $8 |
|
|
209
195
|
| `llmgateway/qwen3-coder-flash` | 1.0M | | | | | | $0.30 | $2 |
|
|
210
|
-
| `llmgateway/qwen3-coder-next` | 262K | | | | | | $0.
|
|
211
|
-
| `llmgateway/qwen3-coder-plus` | 1.0M | | | | | | $
|
|
212
|
-
| `llmgateway/qwen3-max` |
|
|
213
|
-
| `llmgateway/qwen3-max-2026-01-23` |
|
|
214
|
-
| `llmgateway/qwen3-next-80b-a3b-instruct` |
|
|
196
|
+
| `llmgateway/qwen3-coder-next` | 262K | | | | | | $0.80 | $4 |
|
|
197
|
+
| `llmgateway/qwen3-coder-plus` | 1.0M | | | | | | $1 | $5 |
|
|
198
|
+
| `llmgateway/qwen3-max` | 262K | | | | | | $1 | $6 |
|
|
199
|
+
| `llmgateway/qwen3-max-2026-01-23` | 256K | | | | | | $3 | $15 |
|
|
200
|
+
| `llmgateway/qwen3-next-80b-a3b-instruct` | 131K | | | | | | $0.50 | $2 |
|
|
215
201
|
| `llmgateway/qwen3-next-80b-a3b-thinking` | 131K | | | | | | $0.50 | $6 |
|
|
216
|
-
| `llmgateway/qwen3-vl-235b-a22b-instruct` | 131K | | | | | | $0.
|
|
217
|
-
| `llmgateway/qwen3-vl-235b-a22b-thinking` | 131K | | | | | | $0.
|
|
218
|
-
| `llmgateway/qwen3-vl-30b-a3b-instruct` | 131K | | | | | | $0.
|
|
219
|
-
| `llmgateway/qwen3-vl-30b-a3b-thinking` | 131K | | | | | | $0.
|
|
220
|
-
| `llmgateway/qwen3-vl-8b-instruct` | 131K | | | | | | $0.
|
|
221
|
-
| `llmgateway/qwen3-vl-flash` |
|
|
202
|
+
| `llmgateway/qwen3-vl-235b-a22b-instruct` | 131K | | | | | | $0.80 | $2 |
|
|
203
|
+
| `llmgateway/qwen3-vl-235b-a22b-thinking` | 131K | | | | | | $0.80 | $2 |
|
|
204
|
+
| `llmgateway/qwen3-vl-30b-a3b-instruct` | 131K | | | | | | $0.10 | $0.10 |
|
|
205
|
+
| `llmgateway/qwen3-vl-30b-a3b-thinking` | 131K | | | | | | $0.10 | $0.10 |
|
|
206
|
+
| `llmgateway/qwen3-vl-8b-instruct` | 131K | | | | | | $0.10 | $0.10 |
|
|
207
|
+
| `llmgateway/qwen3-vl-flash` | 1.0M | | | | | | $0.05 | $0.40 |
|
|
222
208
|
| `llmgateway/qwen3-vl-plus` | 262K | | | | | | $0.20 | $2 |
|
|
223
209
|
| `llmgateway/qwen35-397b-a17b` | 262K | | | | | | $0.60 | $4 |
|
|
224
210
|
| `llmgateway/qwq-plus` | 131K | | | | | | $0.80 | $2 |
|
|
@@ -226,13 +212,9 @@ for await (const chunk of stream) {
|
|
|
226
212
|
| `llmgateway/seed-1-6-250915` | 256K | | | | | | $0.25 | $2 |
|
|
227
213
|
| `llmgateway/seed-1-6-flash-250715` | 256K | | | | | | $0.07 | $0.30 |
|
|
228
214
|
| `llmgateway/seed-1-8-251228` | 256K | | | | | | $0.25 | $2 |
|
|
229
|
-
| `llmgateway/
|
|
230
|
-
| `llmgateway/seedream-4-5` | 2K | | | | | | — | — |
|
|
231
|
-
| `llmgateway/sonar` | 130K | | | | | | $1 | $1 |
|
|
215
|
+
| `llmgateway/sonar` | 128K | | | | | | $1 | $1 |
|
|
232
216
|
| `llmgateway/sonar-pro` | 200K | | | | | | $3 | $15 |
|
|
233
217
|
| `llmgateway/sonar-reasoning-pro` | 128K | | | | | | $2 | $8 |
|
|
234
|
-
| `llmgateway/veo-3.1-fast-generate-preview` | 33K | | | | | | — | — |
|
|
235
|
-
| `llmgateway/veo-3.1-generate-preview` | 33K | | | | | | — | — |
|
|
236
218
|
|
|
237
219
|
## Advanced configuration
|
|
238
220
|
|
|
@@ -262,7 +244,7 @@ const agent = new Agent({
|
|
|
262
244
|
model: ({ requestContext }) => {
|
|
263
245
|
const useAdvanced = requestContext.task === "complex";
|
|
264
246
|
return useAdvanced
|
|
265
|
-
? "llmgateway/
|
|
247
|
+
? "llmgateway/sonar-reasoning-pro"
|
|
266
248
|
: "llmgateway/auto";
|
|
267
249
|
}
|
|
268
250
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Moonshot AI (China)
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 7 Moonshot AI (China) models through Mastra's model router. Authentication is handled automatically using the `MOONSHOT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Moonshot AI (China) documentation](https://platform.moonshot.cn).
|
|
6
6
|
|
|
@@ -40,6 +40,7 @@ for await (const chunk of stream) {
|
|
|
40
40
|
| `moonshotai-cn/kimi-k2-thinking-turbo` | 262K | | | | | | $1 | $8 |
|
|
41
41
|
| `moonshotai-cn/kimi-k2-turbo-preview` | 262K | | | | | | $2 | $10 |
|
|
42
42
|
| `moonshotai-cn/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
43
|
+
| `moonshotai-cn/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
43
44
|
|
|
44
45
|
## Advanced configuration
|
|
45
46
|
|
|
@@ -69,7 +70,7 @@ const agent = new Agent({
|
|
|
69
70
|
model: ({ requestContext }) => {
|
|
70
71
|
const useAdvanced = requestContext.task === "complex";
|
|
71
72
|
return useAdvanced
|
|
72
|
-
? "moonshotai-cn/kimi-k2.
|
|
73
|
+
? "moonshotai-cn/kimi-k2.6"
|
|
73
74
|
: "moonshotai-cn/kimi-k2-0711-preview";
|
|
74
75
|
}
|
|
75
76
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Moonshot AI
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 7 Moonshot AI models through Mastra's model router. Authentication is handled automatically using the `MOONSHOT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Moonshot AI documentation](https://platform.moonshot.ai).
|
|
6
6
|
|
|
@@ -40,6 +40,7 @@ for await (const chunk of stream) {
|
|
|
40
40
|
| `moonshotai/kimi-k2-thinking-turbo` | 262K | | | | | | $1 | $8 |
|
|
41
41
|
| `moonshotai/kimi-k2-turbo-preview` | 262K | | | | | | $2 | $10 |
|
|
42
42
|
| `moonshotai/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
43
|
+
| `moonshotai/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
43
44
|
|
|
44
45
|
## Advanced configuration
|
|
45
46
|
|
|
@@ -69,7 +70,7 @@ const agent = new Agent({
|
|
|
69
70
|
model: ({ requestContext }) => {
|
|
70
71
|
const useAdvanced = requestContext.task === "complex";
|
|
71
72
|
return useAdvanced
|
|
72
|
-
? "moonshotai/kimi-k2.
|
|
73
|
+
? "moonshotai/kimi-k2.6"
|
|
73
74
|
: "moonshotai/kimi-k2-0711-preview";
|
|
74
75
|
}
|
|
75
76
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# NanoGPT
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 525 NanoGPT models through Mastra's model router. Authentication is handled automatically using the `NANO_GPT_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [NanoGPT documentation](https://docs.nano-gpt.com).
|
|
6
6
|
|
|
@@ -39,6 +39,7 @@ for await (const chunk of stream) {
|
|
|
39
39
|
| `nano-gpt/aion-labs/aion-1.0-mini` | 131K | | | | | | $0.80 | $1 |
|
|
40
40
|
| `nano-gpt/aion-labs/aion-rp-llama-3.1-8b` | 33K | | | | | | $0.20 | $0.20 |
|
|
41
41
|
| `nano-gpt/Alibaba-NLP/Tongyi-DeepResearch-30B-A3B` | 128K | | | | | | $0.08 | $0.24 |
|
|
42
|
+
| `nano-gpt/alibaba/qwen3.6-flash` | 992K | | | | | | $0.19 | $1 |
|
|
42
43
|
| `nano-gpt/allenai/molmo-2-8b` | 37K | | | | | | $0.20 | $0.20 |
|
|
43
44
|
| `nano-gpt/allenai/olmo-3-32b-think` | 128K | | | | | | $0.30 | $0.45 |
|
|
44
45
|
| `nano-gpt/allenai/olmo-3.1-32b-instruct` | 66K | | | | | | $0.20 | $0.60 |
|
|
@@ -367,6 +368,8 @@ for await (const chunk of stream) {
|
|
|
367
368
|
| `nano-gpt/moonshotai/kimi-k2-thinking-turbo-original` | 256K | | | | | | $1 | $8 |
|
|
368
369
|
| `nano-gpt/moonshotai/kimi-k2.5` | 256K | | | | | | $0.30 | $2 |
|
|
369
370
|
| `nano-gpt/moonshotai/kimi-k2.5:thinking` | 256K | | | | | | $0.30 | $2 |
|
|
371
|
+
| `nano-gpt/moonshotai/kimi-k2.6` | 256K | | | | | | $0.53 | $3 |
|
|
372
|
+
| `nano-gpt/moonshotai/kimi-k2.6:thinking` | 256K | | | | | | $0.53 | $3 |
|
|
370
373
|
| `nano-gpt/NeverSleep/Llama-3-Lumimaid-70B-v0.1` | 16K | | | | | | $2 | $2 |
|
|
371
374
|
| `nano-gpt/NeverSleep/Lumimaid-v0.2-70B` | 16K | | | | | | $1 | $2 |
|
|
372
375
|
| `nano-gpt/nex-agi/deepseek-v3.1-nex-n1` | 128K | | | | | | $0.28 | $0.42 |
|
|
@@ -432,12 +435,15 @@ for await (const chunk of stream) {
|
|
|
432
435
|
| `nano-gpt/phi-4-mini-instruct` | 128K | | | | | | $0.17 | $0.68 |
|
|
433
436
|
| `nano-gpt/phi-4-multimodal-instruct` | 128K | | | | | | $0.07 | $0.11 |
|
|
434
437
|
| `nano-gpt/qvq-max` | 128K | | | | | | $1 | $5 |
|
|
438
|
+
| `nano-gpt/qwen-3.6-plus` | 992K | | | | | | $0.45 | $3 |
|
|
435
439
|
| `nano-gpt/qwen-image` | — | | | | | | — | — |
|
|
436
440
|
| `nano-gpt/qwen-long` | 10.0M | | | | | | $0.10 | $0.41 |
|
|
437
441
|
| `nano-gpt/qwen-max` | 32K | | | | | | $2 | $6 |
|
|
438
442
|
| `nano-gpt/qwen-plus` | 996K | | | | | | $0.40 | $1 |
|
|
439
443
|
| `nano-gpt/qwen-turbo` | 1.0M | | | | | | $0.05 | $0.20 |
|
|
440
444
|
| `nano-gpt/qwen/qwen3.5-397b-a17b` | 258K | | | | | | $0.60 | $4 |
|
|
445
|
+
| `nano-gpt/qwen/Qwen3.6-35B-A3B` | 262K | | | | | | $0.29 | $2 |
|
|
446
|
+
| `nano-gpt/qwen/Qwen3.6-35B-A3B:thinking` | 262K | | | | | | $0.29 | $2 |
|
|
441
447
|
| `nano-gpt/Qwen2.5-32B-EVA-v0.2` | 25K | | | | | | $0.49 | $0.49 |
|
|
442
448
|
| `nano-gpt/qwen25-vl-72b-instruct` | 32K | | | | | | $0.70 | $0.70 |
|
|
443
449
|
| `nano-gpt/qwen3-30b-a3b-instruct-2507` | 256K | | | | | | $0.20 | $0.50 |
|
|
@@ -445,6 +451,7 @@ for await (const chunk of stream) {
|
|
|
445
451
|
| `nano-gpt/qwen3-max-2026-01-23` | 256K | | | | | | $1 | $6 |
|
|
446
452
|
| `nano-gpt/qwen3-vl-235b-a22b-instruct-original` | 33K | | | | | | $0.50 | $1 |
|
|
447
453
|
| `nano-gpt/qwen3-vl-235b-a22b-thinking` | 33K | | | | | | $0.50 | $6 |
|
|
454
|
+
| `nano-gpt/qwen3.6-max-preview` | 246K | | | | | | $1 | $8 |
|
|
448
455
|
| `nano-gpt/qwq-32b` | 128K | | | | | | $0.26 | $0.30 |
|
|
449
456
|
| `nano-gpt/QwQ-32B-ArliAI-RpR-v1` | 33K | | | | | | $0.20 | $0.20 |
|
|
450
457
|
| `nano-gpt/raifle/sorcererlm-8x22b` | 16K | | | | | | $5 | $5 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Nvidia
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 77 Nvidia models through Mastra's model router. Authentication is handled automatically using the `NVIDIA_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Nvidia documentation](https://docs.api.nvidia.com/nim/).
|
|
6
6
|
|
|
@@ -108,6 +108,7 @@ for await (const chunk of stream) {
|
|
|
108
108
|
| `nvidia/qwen/qwen3.5-397b-a17b` | 262K | | | | | | — | — |
|
|
109
109
|
| `nvidia/qwen/qwq-32b` | 128K | | | | | | — | — |
|
|
110
110
|
| `nvidia/stepfun-ai/step-3.5-flash` | 256K | | | | | | — | — |
|
|
111
|
+
| `nvidia/z-ai/glm-5.1` | 131K | | | | | | — | — |
|
|
111
112
|
| `nvidia/z-ai/glm4.7` | 205K | | | | | | — | — |
|
|
112
113
|
| `nvidia/z-ai/glm5` | 203K | | | | | | — | — |
|
|
113
114
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Ollama Cloud
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 37 Ollama Cloud models through Mastra's model router. Authentication is handled automatically using the `OLLAMA_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Ollama Cloud documentation](https://docs.ollama.com/cloud).
|
|
6
6
|
|
|
@@ -53,6 +53,7 @@ for await (const chunk of stream) {
|
|
|
53
53
|
| `ollama-cloud/kimi-k2-thinking` | 262K | | | | | | — | — |
|
|
54
54
|
| `ollama-cloud/kimi-k2:1t` | 262K | | | | | | — | — |
|
|
55
55
|
| `ollama-cloud/kimi-k2.5` | 262K | | | | | | — | — |
|
|
56
|
+
| `ollama-cloud/kimi-k2.6:cloud` | 262K | | | | | | — | — |
|
|
56
57
|
| `ollama-cloud/minimax-m2` | 205K | | | | | | — | — |
|
|
57
58
|
| `ollama-cloud/minimax-m2.1` | 205K | | | | | | — | — |
|
|
58
59
|
| `ollama-cloud/minimax-m2.5` | 205K | | | | | | — | — |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenAI
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 50 OpenAI models through Mastra's model router. Authentication is handled automatically using the `OPENAI_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenAI documentation](https://platform.openai.com/docs/models).
|
|
6
6
|
|
|
@@ -33,7 +33,6 @@ for await (const chunk of stream) {
|
|
|
33
33
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
34
34
|
| ------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
35
35
|
| `openai/chatgpt-image-latest` | — | | | | | | — | — |
|
|
36
|
-
| `openai/codex-mini-latest` | 200K | | | | | | $2 | $6 |
|
|
37
36
|
| `openai/gpt-3.5-turbo` | 16K | | | | | | $0.50 | $2 |
|
|
38
37
|
| `openai/gpt-4` | 8K | | | | | | $30 | $60 |
|
|
39
38
|
| `openai/gpt-4-turbo` | 128K | | | | | | $10 | $30 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenCode Go
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 10 OpenCode Go models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenCode Go documentation](https://opencode.ai/docs/zen).
|
|
6
6
|
|
|
@@ -37,6 +37,7 @@ for await (const chunk of stream) {
|
|
|
37
37
|
| `opencode-go/glm-5` | 205K | | | | | | $1 | $3 |
|
|
38
38
|
| `opencode-go/glm-5.1` | 205K | | | | | | $1 | $4 |
|
|
39
39
|
| `opencode-go/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
40
|
+
| `opencode-go/kimi-k2.6` | 262K | | | | | | $0.32 | $1 |
|
|
40
41
|
| `opencode-go/mimo-v2-omni` | 262K | | | | | | $0.40 | $2 |
|
|
41
42
|
| `opencode-go/mimo-v2-pro` | 1.0M | | | | | | $1 | $3 |
|
|
42
43
|
| `opencode-go/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenCode Zen
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 38 OpenCode Zen models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenCode Zen documentation](https://opencode.ai/docs/zen).
|
|
6
6
|
|
|
@@ -40,6 +40,7 @@ for await (const chunk of stream) {
|
|
|
40
40
|
| `opencode/claude-opus-4-1` | 200K | | | | | | $15 | $75 |
|
|
41
41
|
| `opencode/claude-opus-4-5` | 200K | | | | | | $5 | $25 |
|
|
42
42
|
| `opencode/claude-opus-4-6` | 1.0M | | | | | | $5 | $25 |
|
|
43
|
+
| `opencode/claude-opus-4-7` | 1.0M | | | | | | $5 | $25 |
|
|
43
44
|
| `opencode/claude-sonnet-4` | 1.0M | | | | | | $3 | $15 |
|
|
44
45
|
| `opencode/claude-sonnet-4-5` | 1.0M | | | | | | $3 | $15 |
|
|
45
46
|
| `opencode/claude-sonnet-4-6` | 1.0M | | | | | | $3 | $15 |
|
|
@@ -63,8 +64,11 @@ for await (const chunk of stream) {
|
|
|
63
64
|
| `opencode/gpt-5.4-nano` | 400K | | | | | | $0.20 | $1 |
|
|
64
65
|
| `opencode/gpt-5.4-pro` | 1.1M | | | | | | $30 | $180 |
|
|
65
66
|
| `opencode/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
67
|
+
| `opencode/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
68
|
+
| `opencode/ling-2.6-flash-free` | 262K | | | | | | — | — |
|
|
66
69
|
| `opencode/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
67
70
|
| `opencode/minimax-m2.5-free` | 205K | | | | | | — | — |
|
|
71
|
+
| `opencode/minimax-m2.7` | 205K | | | | | | $0.30 | $1 |
|
|
68
72
|
| `opencode/nemotron-3-super-free` | 205K | | | | | | — | — |
|
|
69
73
|
| `opencode/qwen3.5-plus` | 262K | | | | | | $0.20 | $1 |
|
|
70
74
|
| `opencode/qwen3.6-plus` | 262K | | | | | | $0.50 | $3 |
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OVHcloud AI Endpoints
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 10 OVHcloud AI Endpoints models through Mastra's model router. Authentication is handled automatically using the `OVHCLOUD_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OVHcloud AI Endpoints documentation](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//).
|
|
6
6
|
|
|
@@ -15,7 +15,7 @@ const agent = new Agent({
|
|
|
15
15
|
id: "my-agent",
|
|
16
16
|
name: "My Agent",
|
|
17
17
|
instructions: "You are a helpful assistant",
|
|
18
|
-
model: "ovhcloud/
|
|
18
|
+
model: "ovhcloud/gpt-oss-120b"
|
|
19
19
|
});
|
|
20
20
|
|
|
21
21
|
// Generate a response
|
|
@@ -34,7 +34,6 @@ for await (const chunk of stream) {
|
|
|
34
34
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| ---------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
-
| `ovhcloud/deepseek-r1-distill-llama-70b` | 131K | | | | | | $0.74 | $0.74 |
|
|
38
37
|
| `ovhcloud/gpt-oss-120b` | 131K | | | | | | $0.09 | $0.47 |
|
|
39
38
|
| `ovhcloud/gpt-oss-20b` | 131K | | | | | | $0.05 | $0.18 |
|
|
40
39
|
| `ovhcloud/llama-3.1-8b-instruct` | 131K | | | | | | $0.11 | $0.11 |
|
|
@@ -42,8 +41,6 @@ for await (const chunk of stream) {
|
|
|
42
41
|
| `ovhcloud/mistral-7b-instruct-v0.3` | 66K | | | | | | $0.11 | $0.11 |
|
|
43
42
|
| `ovhcloud/mistral-nemo-instruct-2407` | 66K | | | | | | $0.14 | $0.14 |
|
|
44
43
|
| `ovhcloud/mistral-small-3.2-24b-instruct-2506` | 131K | | | | | | $0.10 | $0.31 |
|
|
45
|
-
| `ovhcloud/mixtral-8x7b-instruct-v0.1` | 33K | | | | | | $0.70 | $0.70 |
|
|
46
|
-
| `ovhcloud/qwen2.5-coder-32b-instruct` | 33K | | | | | | $0.96 | $0.96 |
|
|
47
44
|
| `ovhcloud/qwen2.5-vl-72b-instruct` | 33K | | | | | | $1 | $1 |
|
|
48
45
|
| `ovhcloud/qwen3-32b` | 33K | | | | | | $0.09 | $0.25 |
|
|
49
46
|
| `ovhcloud/qwen3-coder-30b-a3b-instruct` | 262K | | | | | | $0.07 | $0.26 |
|
|
@@ -58,7 +55,7 @@ const agent = new Agent({
|
|
|
58
55
|
name: "custom-agent",
|
|
59
56
|
model: {
|
|
60
57
|
url: "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1",
|
|
61
|
-
id: "ovhcloud/
|
|
58
|
+
id: "ovhcloud/gpt-oss-120b",
|
|
62
59
|
apiKey: process.env.OVHCLOUD_API_KEY,
|
|
63
60
|
headers: {
|
|
64
61
|
"X-Custom-Header": "value"
|
|
@@ -77,7 +74,7 @@ const agent = new Agent({
|
|
|
77
74
|
const useAdvanced = requestContext.task === "complex";
|
|
78
75
|
return useAdvanced
|
|
79
76
|
? "ovhcloud/qwen3-coder-30b-a3b-instruct"
|
|
80
|
-
: "ovhcloud/
|
|
77
|
+
: "ovhcloud/gpt-oss-120b";
|
|
81
78
|
}
|
|
82
79
|
});
|
|
83
80
|
```
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Poe
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 118 Poe models through Mastra's model router. Authentication is handled automatically using the `POE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Poe documentation](https://creator.poe.com/docs/external-applications/openai-compatible-api).
|
|
6
6
|
|
|
@@ -41,6 +41,7 @@ for await (const chunk of stream) {
|
|
|
41
41
|
| `poe/anthropic/claude-opus-4.1` | 197K | | | | | | $13 | $64 |
|
|
42
42
|
| `poe/anthropic/claude-opus-4.5` | 197K | | | | | | $4 | $21 |
|
|
43
43
|
| `poe/anthropic/claude-opus-4.6` | 983K | | | | | | $4 | $21 |
|
|
44
|
+
| `poe/anthropic/claude-opus-4.7` | 1.0M | | | | | | $4 | $21 |
|
|
44
45
|
| `poe/anthropic/claude-sonnet-3.7` | 197K | | | | | | $3 | $13 |
|
|
45
46
|
| `poe/anthropic/claude-sonnet-4` | 983K | | | | | | $3 | $13 |
|
|
46
47
|
| `poe/anthropic/claude-sonnet-4.5` | 983K | | | | | | $3 | $13 |
|
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
# Tencent Token Plan
|
|
2
|
+
|
|
3
|
+
Access 1 Tencent Token Plan model through Mastra's model router. Authentication is handled automatically using the `TENCENT_TOKEN_PLAN_API_KEY` environment variable.
|
|
4
|
+
|
|
5
|
+
Learn more in the [Tencent Token Plan documentation](https://cloud.tencent.com/document/product/1823/130060).
|
|
6
|
+
|
|
7
|
+
```bash
|
|
8
|
+
TENCENT_TOKEN_PLAN_API_KEY=your-api-key
|
|
9
|
+
```
|
|
10
|
+
|
|
11
|
+
```typescript
|
|
12
|
+
import { Agent } from "@mastra/core/agent";
|
|
13
|
+
|
|
14
|
+
const agent = new Agent({
|
|
15
|
+
id: "my-agent",
|
|
16
|
+
name: "My Agent",
|
|
17
|
+
instructions: "You are a helpful assistant",
|
|
18
|
+
model: "tencent-token-plan/hy3-preview"
|
|
19
|
+
});
|
|
20
|
+
|
|
21
|
+
// Generate a response
|
|
22
|
+
const response = await agent.generate("Hello!");
|
|
23
|
+
|
|
24
|
+
// Stream a response
|
|
25
|
+
const stream = await agent.stream("Tell me a story");
|
|
26
|
+
for await (const chunk of stream) {
|
|
27
|
+
console.log(chunk);
|
|
28
|
+
}
|
|
29
|
+
```
|
|
30
|
+
|
|
31
|
+
> **Info:** Mastra uses the OpenAI-compatible `/chat/completions` endpoint. Some provider-specific features may not be available. Check the [Tencent Token Plan documentation](https://cloud.tencent.com/document/product/1823/130060) for details.
|
|
32
|
+
|
|
33
|
+
## Models
|
|
34
|
+
|
|
35
|
+
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
|
+
| -------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
+
| `tencent-token-plan/hy3-preview` | 256K | | | | | | — | — |
|
|
38
|
+
|
|
39
|
+
## Advanced configuration
|
|
40
|
+
|
|
41
|
+
### Custom headers
|
|
42
|
+
|
|
43
|
+
```typescript
|
|
44
|
+
const agent = new Agent({
|
|
45
|
+
id: "custom-agent",
|
|
46
|
+
name: "custom-agent",
|
|
47
|
+
model: {
|
|
48
|
+
url: "https://api.lkeap.cloud.tencent.com/plan/v3",
|
|
49
|
+
id: "tencent-token-plan/hy3-preview",
|
|
50
|
+
apiKey: process.env.TENCENT_TOKEN_PLAN_API_KEY,
|
|
51
|
+
headers: {
|
|
52
|
+
"X-Custom-Header": "value"
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
});
|
|
56
|
+
```
|
|
57
|
+
|
|
58
|
+
### Dynamic model selection
|
|
59
|
+
|
|
60
|
+
```typescript
|
|
61
|
+
const agent = new Agent({
|
|
62
|
+
id: "dynamic-agent",
|
|
63
|
+
name: "Dynamic Agent",
|
|
64
|
+
model: ({ requestContext }) => {
|
|
65
|
+
const useAdvanced = requestContext.task === "complex";
|
|
66
|
+
return useAdvanced
|
|
67
|
+
? "tencent-token-plan/hy3-preview"
|
|
68
|
+
: "tencent-token-plan/hy3-preview";
|
|
69
|
+
}
|
|
70
|
+
});
|
|
71
|
+
```
|