@mastra/mcp-docs-server 1.1.35-alpha.6 → 1.1.35
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.docs/course/03-agent-memory/18-advanced-configuration-semantic-recall.md +48 -4
- package/.docs/docs/agents/background-tasks.md +62 -2
- package/.docs/docs/agents/processors.md +9 -1
- package/.docs/docs/agents/response-caching.md +148 -0
- package/.docs/docs/agents/signals.md +151 -0
- package/.docs/docs/agents/using-tools.md +8 -0
- package/.docs/docs/browser/agent-browser.md +15 -0
- package/.docs/docs/browser/stagehand.md +25 -1
- package/.docs/docs/editor/tools.md +1 -1
- package/.docs/docs/index.md +2 -2
- package/.docs/docs/mastra-platform/configuration.md +1 -1
- package/.docs/docs/mastra-platform/overview.md +1 -1
- package/.docs/docs/memory/observational-memory.md +61 -13
- package/.docs/docs/memory/semantic-recall.md +68 -6
- package/.docs/docs/observability/logging.md +2 -2
- package/.docs/docs/observability/metrics/overview.md +4 -4
- package/.docs/docs/observability/overview.md +6 -6
- package/.docs/docs/observability/tracing/bridges/otel.md +25 -0
- package/.docs/docs/observability/tracing/exporters/arize.md +5 -5
- package/.docs/docs/observability/tracing/exporters/braintrust.md +37 -0
- package/.docs/docs/observability/tracing/exporters/langfuse.md +21 -0
- package/.docs/docs/observability/tracing/exporters/{cloud.md → mastra-platform.md} +28 -26
- package/.docs/docs/observability/tracing/exporters/{default.md → mastra-storage.md} +56 -19
- package/.docs/docs/observability/tracing/exporters/otel.md +79 -2
- package/.docs/docs/observability/tracing/overview.md +30 -29
- package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +6 -6
- package/.docs/docs/server/mastra-server.md +30 -19
- package/.docs/docs/studio/observability.md +4 -4
- package/.docs/docs/studio/overview.md +6 -0
- package/.docs/docs/voice/overview.md +84 -0
- package/.docs/docs/workflows/suspend-and-resume.md +28 -1
- package/.docs/guides/deployment/inngest.md +23 -0
- package/.docs/guides/guide/web-search.md +7 -7
- package/.docs/guides/migrations/mastra-cloud.md +6 -6
- package/.docs/guides/migrations/upgrade-to-v1/tracing.md +19 -17
- package/.docs/models/gateways/azure-openai.md +94 -23
- package/.docs/models/gateways/netlify.md +2 -1
- package/.docs/models/gateways/openrouter.md +4 -1
- package/.docs/models/gateways/vercel.md +2 -1
- package/.docs/models/index.md +1 -1
- package/.docs/models/providers/chutes.md +23 -54
- package/.docs/models/providers/databricks.md +96 -0
- package/.docs/models/providers/deepseek.md +3 -1
- package/.docs/models/providers/digitalocean.md +9 -2
- package/.docs/models/providers/firepass.md +71 -0
- package/.docs/models/providers/google.md +3 -2
- package/.docs/models/providers/kilo.md +5 -3
- package/.docs/models/providers/llmgateway.md +7 -1
- package/.docs/models/providers/nebius.md +37 -55
- package/.docs/models/providers/novita-ai.md +5 -5
- package/.docs/models/providers/nvidia.md +59 -49
- package/.docs/models/providers/ollama-cloud.md +1 -1
- package/.docs/models/providers/openai.md +2 -0
- package/.docs/models/providers/opencode.md +44 -43
- package/.docs/models/providers/poe.md +4 -1
- package/.docs/models/providers/sarvam.md +72 -0
- package/.docs/models/providers/wafer.ai.md +2 -1
- package/.docs/models/providers/xiaomi-token-plan-ams.md +6 -5
- package/.docs/models/providers/xiaomi-token-plan-cn.md +6 -5
- package/.docs/models/providers/xiaomi-token-plan-sgp.md +6 -5
- package/.docs/models/providers.md +3 -1
- package/.docs/reference/agents/agent.md +85 -0
- package/.docs/reference/browser/agent-browser.md +37 -11
- package/.docs/reference/browser/stagehand-browser.md +35 -9
- package/.docs/reference/cli/mastra.md +497 -1
- package/.docs/reference/client-js/agents.md +115 -1
- package/.docs/reference/client-js/responses.md +4 -0
- package/.docs/reference/configuration.md +6 -6
- package/.docs/reference/editor/tool-provider.md +3 -3
- package/.docs/reference/harness/harness-class.md +21 -8
- package/.docs/reference/index.md +5 -0
- package/.docs/reference/memory/observational-memory.md +11 -1
- package/.docs/reference/observability/metrics/automatic-metrics.md +2 -4
- package/.docs/reference/observability/tracing/bridges/datadog.md +2 -2
- package/.docs/reference/observability/tracing/bridges/otel.md +26 -4
- package/.docs/reference/observability/tracing/configuration.md +6 -3
- package/.docs/reference/observability/tracing/exporters/arize.md +1 -1
- package/.docs/reference/observability/tracing/exporters/braintrust.md +2 -0
- package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +3 -1
- package/.docs/reference/observability/tracing/exporters/console-exporter.md +2 -2
- package/.docs/reference/observability/tracing/exporters/default-exporter.md +7 -1
- package/.docs/reference/observability/tracing/exporters/mastra-platform-exporter.md +263 -0
- package/.docs/reference/observability/tracing/exporters/mastra-storage-exporter.md +194 -0
- package/.docs/reference/observability/tracing/exporters/otel.md +12 -8
- package/.docs/reference/observability/tracing/instances.md +2 -2
- package/.docs/reference/observability/tracing/interfaces.md +37 -2
- package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +22 -0
- package/.docs/reference/observability/tracing/span-filtering.md +2 -2
- package/.docs/reference/processors/prefill-error-handler.md +3 -3
- package/.docs/reference/processors/response-cache.md +114 -0
- package/.docs/reference/processors/tool-call-filter.md +28 -0
- package/.docs/reference/storage/clickhouse.md +8 -8
- package/.docs/reference/storage/cloudflare-d1.md +1 -1
- package/.docs/reference/storage/cloudflare.md +1 -1
- package/.docs/reference/storage/composite.md +1 -1
- package/.docs/reference/storage/convex.md +1 -1
- package/.docs/reference/storage/dsql.md +428 -0
- package/.docs/reference/storage/duckdb.md +3 -3
- package/.docs/reference/storage/dynamodb.md +1 -1
- package/.docs/reference/storage/lance.md +1 -1
- package/.docs/reference/storage/libsql.md +1 -1
- package/.docs/reference/storage/postgresql.md +1 -1
- package/.docs/reference/storage/upstash.md +1 -1
- package/.docs/reference/streaming/ChunkType.md +44 -0
- package/.docs/reference/streaming/agents/stream.md +18 -2
- package/.docs/reference/tools/brightdata.md +167 -0
- package/.docs/reference/tools/create-tool.md +46 -0
- package/.docs/reference/voice/inworld.md +133 -0
- package/.docs/reference/workflows/workflow-state-reader.md +113 -0
- package/CHANGELOG.md +113 -0
- package/package.json +6 -6
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Nebius Token Factory
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 31 Nebius Token Factory models through Mastra's model router. Authentication is handled automatically using the `NEBIUS_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Nebius Token Factory documentation](https://docs.tokenfactory.nebius.com/).
|
|
6
6
|
|
|
@@ -15,7 +15,7 @@ const agent = new Agent({
|
|
|
15
15
|
id: "my-agent",
|
|
16
16
|
name: "My Agent",
|
|
17
17
|
instructions: "You are a helpful assistant",
|
|
18
|
-
model: "nebius/
|
|
18
|
+
model: "nebius/MiniMaxAI/MiniMax-M2.5"
|
|
19
19
|
});
|
|
20
20
|
|
|
21
21
|
// Generate a response
|
|
@@ -32,57 +32,39 @@ for await (const chunk of stream) {
|
|
|
32
32
|
|
|
33
33
|
## Models
|
|
34
34
|
|
|
35
|
-
| Model
|
|
36
|
-
|
|
|
37
|
-
| `nebius/
|
|
38
|
-
| `nebius/
|
|
39
|
-
| `nebius/
|
|
40
|
-
| `nebius/
|
|
41
|
-
| `nebius/
|
|
42
|
-
| `nebius/
|
|
43
|
-
| `nebius/
|
|
44
|
-
| `nebius/
|
|
45
|
-
| `nebius/
|
|
46
|
-
| `nebius/
|
|
47
|
-
| `nebius/
|
|
48
|
-
| `nebius/
|
|
49
|
-
| `nebius/
|
|
50
|
-
| `nebius/
|
|
51
|
-
| `nebius/
|
|
52
|
-
| `nebius/
|
|
53
|
-
| `nebius/
|
|
54
|
-
| `nebius/
|
|
55
|
-
| `nebius/
|
|
56
|
-
| `nebius/
|
|
57
|
-
| `nebius/
|
|
58
|
-
| `nebius/
|
|
59
|
-
| `nebius/
|
|
60
|
-
| `nebius/
|
|
61
|
-
| `nebius/
|
|
62
|
-
| `nebius/
|
|
63
|
-
| `nebius/
|
|
64
|
-
| `nebius/
|
|
65
|
-
| `nebius/
|
|
66
|
-
| `nebius/
|
|
67
|
-
| `nebius/
|
|
68
|
-
| `nebius/openai/gpt-oss-20b` | 128K | | | | | | $0.05 | $0.20 |
|
|
69
|
-
| `nebius/PrimeIntellect/INTELLECT-3` | 128K | | | | | | $0.20 | $1 |
|
|
70
|
-
| `nebius/Qwen/Qwen2.5-Coder-7B-fast` | 128K | | | | | | $0.03 | $0.09 |
|
|
71
|
-
| `nebius/Qwen/Qwen2.5-VL-72B-Instruct` | 128K | | | | | | $0.25 | $0.75 |
|
|
72
|
-
| `nebius/Qwen/Qwen3-235B-A22B-Instruct-2507` | 262K | | | | | | $0.20 | $0.60 |
|
|
73
|
-
| `nebius/Qwen/Qwen3-235B-A22B-Thinking-2507` | 262K | | | | | | $0.20 | $0.80 |
|
|
74
|
-
| `nebius/Qwen/Qwen3-30B-A3B-Instruct-2507` | 128K | | | | | | $0.10 | $0.30 |
|
|
75
|
-
| `nebius/Qwen/Qwen3-30B-A3B-Thinking-2507` | 128K | | | | | | $0.10 | $0.30 |
|
|
76
|
-
| `nebius/Qwen/Qwen3-32B` | 128K | | | | | | $0.10 | $0.30 |
|
|
77
|
-
| `nebius/Qwen/Qwen3-32B-fast` | 128K | | | | | | $0.20 | $0.60 |
|
|
78
|
-
| `nebius/Qwen/Qwen3-Coder-30B-A3B-Instruct` | 128K | | | | | | $0.10 | $0.30 |
|
|
79
|
-
| `nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct` | 262K | | | | | | $0.40 | $2 |
|
|
80
|
-
| `nebius/Qwen/Qwen3-Embedding-8B` | 33K | | | | | | $0.01 | — |
|
|
81
|
-
| `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking` | 128K | | | | | | $0.15 | $1 |
|
|
82
|
-
| `nebius/zai-org/GLM-4.5` | 128K | | | | | | $0.60 | $2 |
|
|
83
|
-
| `nebius/zai-org/GLM-4.5-Air` | 128K | | | | | | $0.20 | $1 |
|
|
84
|
-
| `nebius/zai-org/GLM-4.7-FP8` | 128K | | | | | | $0.40 | $2 |
|
|
85
|
-
| `nebius/zai-org/GLM-5` | 200K | | | | | | $1 | $3 |
|
|
35
|
+
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
|
+
| ------------------------------------------------ | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
+
| `nebius/deepseek-ai/DeepSeek-V3.2` | 163K | | | | | | $0.30 | $0.45 |
|
|
38
|
+
| `nebius/deepseek-ai/DeepSeek-V3.2-fast` | 8K | | | | | | $0.40 | $2 |
|
|
39
|
+
| `nebius/deepseek-ai/DeepSeek-V4-Pro` | 1.0M | | | | | | $2 | $4 |
|
|
40
|
+
| `nebius/google/gemma-2-2b-it` | 8K | | | | | | $0.02 | $0.06 |
|
|
41
|
+
| `nebius/google/gemma-3-27b-it` | 110K | | | | | | $0.10 | $0.30 |
|
|
42
|
+
| `nebius/meta-llama/Llama-3.3-70B-Instruct` | 128K | | | | | | $0.13 | $0.40 |
|
|
43
|
+
| `nebius/meta-llama/Meta-Llama-3.1-8B-Instruct` | 128K | | | | | | $0.02 | $0.06 |
|
|
44
|
+
| `nebius/MiniMaxAI/MiniMax-M2.5` | 197K | | | | | | $0.30 | $1 |
|
|
45
|
+
| `nebius/MiniMaxAI/MiniMax-M2.5-fast` | 8K | | | | | | $0.30 | $1 |
|
|
46
|
+
| `nebius/moonshotai/Kimi-K2.5` | 256K | | | | | | $0.50 | $3 |
|
|
47
|
+
| `nebius/moonshotai/Kimi-K2.5-fast` | 256K | | | | | | $0.50 | $3 |
|
|
48
|
+
| `nebius/NousResearch/Hermes-4-405B` | 128K | | | | | | $1 | $3 |
|
|
49
|
+
| `nebius/NousResearch/Hermes-4-70B` | 128K | | | | | | $0.13 | $0.40 |
|
|
50
|
+
| `nebius/nvidia/Llama-3_1-Nemotron-Ultra-253B-v1` | 128K | | | | | | $0.60 | $2 |
|
|
51
|
+
| `nebius/nvidia/Nemotron-3-Nano-Omni` | 66K | | | | | | $0.06 | $0.24 |
|
|
52
|
+
| `nebius/nvidia/nemotron-3-super-120b-a12b` | 256K | | | | | | $0.30 | $0.90 |
|
|
53
|
+
| `nebius/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B` | 32K | | | | | | $0.06 | $0.24 |
|
|
54
|
+
| `nebius/openai/gpt-oss-120b` | 128K | | | | | | $0.15 | $0.60 |
|
|
55
|
+
| `nebius/openai/gpt-oss-120b-fast` | 8K | | | | | | $0.10 | $0.50 |
|
|
56
|
+
| `nebius/PrimeIntellect/INTELLECT-3` | 128K | | | | | | $0.20 | $1 |
|
|
57
|
+
| `nebius/Qwen/Qwen2.5-VL-72B-Instruct` | 128K | | | | | | $0.25 | $0.75 |
|
|
58
|
+
| `nebius/Qwen/Qwen3-235B-A22B-Instruct-2507` | 262K | | | | | | $0.20 | $0.60 |
|
|
59
|
+
| `nebius/Qwen/Qwen3-235B-A22B-Thinking-2507-fast` | 8K | | | | | | $0.50 | $2 |
|
|
60
|
+
| `nebius/Qwen/Qwen3-30B-A3B-Instruct-2507` | 128K | | | | | | $0.10 | $0.30 |
|
|
61
|
+
| `nebius/Qwen/Qwen3-32B` | 128K | | | | | | $0.10 | $0.30 |
|
|
62
|
+
| `nebius/Qwen/Qwen3-Embedding-8B` | 33K | | | | | | $0.01 | — |
|
|
63
|
+
| `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking` | 128K | | | | | | $0.15 | $1 |
|
|
64
|
+
| `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking-fast` | 8K | | | | | | $0.15 | $1 |
|
|
65
|
+
| `nebius/Qwen/Qwen3.5-397B-A17B` | 262K | | | | | | $0.60 | $4 |
|
|
66
|
+
| `nebius/Qwen/Qwen3.5-397B-A17B-fast` | 8K | | | | | | $0.60 | $4 |
|
|
67
|
+
| `nebius/zai-org/GLM-5` | 200K | | | | | | $1 | $3 |
|
|
86
68
|
|
|
87
69
|
## Advanced configuration
|
|
88
70
|
|
|
@@ -94,7 +76,7 @@ const agent = new Agent({
|
|
|
94
76
|
name: "custom-agent",
|
|
95
77
|
model: {
|
|
96
78
|
url: "https://api.tokenfactory.nebius.com/v1",
|
|
97
|
-
id: "nebius/
|
|
79
|
+
id: "nebius/MiniMaxAI/MiniMax-M2.5",
|
|
98
80
|
apiKey: process.env.NEBIUS_API_KEY,
|
|
99
81
|
headers: {
|
|
100
82
|
"X-Custom-Header": "value"
|
|
@@ -113,7 +95,7 @@ const agent = new Agent({
|
|
|
113
95
|
const useAdvanced = requestContext.task === "complex";
|
|
114
96
|
return useAdvanced
|
|
115
97
|
? "nebius/zai-org/GLM-5"
|
|
116
|
-
: "nebius/
|
|
98
|
+
: "nebius/MiniMaxAI/MiniMax-M2.5";
|
|
117
99
|
}
|
|
118
100
|
});
|
|
119
101
|
```
|
|
@@ -15,7 +15,7 @@ const agent = new Agent({
|
|
|
15
15
|
id: "my-agent",
|
|
16
16
|
name: "My Agent",
|
|
17
17
|
instructions: "You are a helpful assistant",
|
|
18
|
-
model: "novita-ai/
|
|
18
|
+
model: "novita-ai/Sao10K/L3-8B-Stheno-v3.2"
|
|
19
19
|
});
|
|
20
20
|
|
|
21
21
|
// Generate a response
|
|
@@ -64,6 +64,7 @@ for await (const chunk of stream) {
|
|
|
64
64
|
| `novita-ai/google/gemma-4-31b-it` | 262K | | | | | | $0.14 | $0.40 |
|
|
65
65
|
| `novita-ai/gryphe/mythomax-l2-13b` | 4K | | | | | | $0.09 | $0.09 |
|
|
66
66
|
| `novita-ai/inclusionai/ling-2.6-1t` | 262K | | | | | | — | — |
|
|
67
|
+
| `novita-ai/inclusionai/ling-2.6-flash` | 262K | | | | | | $0.10 | $0.30 |
|
|
67
68
|
| `novita-ai/kwaipilot/kat-coder-pro` | 256K | | | | | | $0.30 | $1 |
|
|
68
69
|
| `novita-ai/meta-llama/llama-3-70b-instruct` | 8K | | | | | | $0.51 | $0.74 |
|
|
69
70
|
| `novita-ai/meta-llama/llama-3-8b-instruct` | 8K | | | | | | $0.04 | $0.04 |
|
|
@@ -117,10 +118,9 @@ for await (const chunk of stream) {
|
|
|
117
118
|
| `novita-ai/qwen/qwen3.5-27b` | 262K | | | | | | $0.30 | $2 |
|
|
118
119
|
| `novita-ai/qwen/qwen3.5-35b-a3b` | 262K | | | | | | $0.25 | $2 |
|
|
119
120
|
| `novita-ai/qwen/qwen3.5-397b-a17b` | 262K | | | | | | $0.60 | $4 |
|
|
120
|
-
| `novita-ai/qwen/qwen3.6-27b` | 262K | | | | | | $0.60 | $4 |
|
|
121
121
|
| `novita-ai/sao10k/l3-70b-euryale-v2.1` | 8K | | | | | | $1 | $1 |
|
|
122
122
|
| `novita-ai/sao10k/l3-8b-lunaris` | 8K | | | | | | $0.05 | $0.05 |
|
|
123
|
-
| `novita-ai/
|
|
123
|
+
| `novita-ai/Sao10K/L3-8B-Stheno-v3.2` | 8K | | | | | | $0.05 | $0.05 |
|
|
124
124
|
| `novita-ai/sao10k/l31-70b-euryale-v2.2` | 8K | | | | | | $1 | $1 |
|
|
125
125
|
| `novita-ai/xiaomimimo/mimo-v2-flash` | 262K | | | | | | $0.10 | $0.30 |
|
|
126
126
|
| `novita-ai/zai-org/autoglm-phone-9b-multilingual` | 66K | | | | | | $0.04 | $0.14 |
|
|
@@ -144,7 +144,7 @@ const agent = new Agent({
|
|
|
144
144
|
name: "custom-agent",
|
|
145
145
|
model: {
|
|
146
146
|
url: "https://api.novita.ai/openai",
|
|
147
|
-
id: "novita-ai/
|
|
147
|
+
id: "novita-ai/Sao10K/L3-8B-Stheno-v3.2",
|
|
148
148
|
apiKey: process.env.NOVITA_API_KEY,
|
|
149
149
|
headers: {
|
|
150
150
|
"X-Custom-Header": "value"
|
|
@@ -163,7 +163,7 @@ const agent = new Agent({
|
|
|
163
163
|
const useAdvanced = requestContext.task === "complex";
|
|
164
164
|
return useAdvanced
|
|
165
165
|
? "novita-ai/zai-org/glm-5.1"
|
|
166
|
-
: "novita-ai/
|
|
166
|
+
: "novita-ai/Sao10K/L3-8B-Stheno-v3.2";
|
|
167
167
|
}
|
|
168
168
|
});
|
|
169
169
|
```
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Nvidia
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 92 Nvidia models through Mastra's model router. Authentication is handled automatically using the `NVIDIA_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Nvidia documentation](https://docs.api.nvidia.com/nim/).
|
|
6
6
|
|
|
@@ -15,7 +15,7 @@ const agent = new Agent({
|
|
|
15
15
|
id: "my-agent",
|
|
16
16
|
name: "My Agent",
|
|
17
17
|
instructions: "You are a helpful assistant",
|
|
18
|
-
model: "nvidia/
|
|
18
|
+
model: "nvidia/abacusai/dracarys-llama-3_1-70b-instruct"
|
|
19
19
|
});
|
|
20
20
|
|
|
21
21
|
// Generate a response
|
|
@@ -34,88 +34,98 @@ for await (const chunk of stream) {
|
|
|
34
34
|
|
|
35
35
|
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
36
|
| ------------------------------------------------------ | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
+
| `nvidia/abacusai/dracarys-llama-3_1-70b-instruct` | 128K | | | | | | — | — |
|
|
38
|
+
| `nvidia/baai/bge-m3` | 8K | | | | | | — | — |
|
|
39
|
+
| `nvidia/black-forest-labs/flux_1-kontext-dev` | 41K | | | | | | — | — |
|
|
40
|
+
| `nvidia/black-forest-labs/flux_1-schnell` | 77 | | | | | | — | — |
|
|
41
|
+
| `nvidia/black-forest-labs/flux_2-klein-4b` | 41K | | | | | | — | — |
|
|
37
42
|
| `nvidia/black-forest-labs/flux.1-dev` | 4K | | | | | | — | — |
|
|
38
|
-
| `nvidia/
|
|
39
|
-
| `nvidia/deepseek-ai/deepseek-r1` | 128K | | | | | | — | — |
|
|
40
|
-
| `nvidia/deepseek-ai/deepseek-r1-0528` | 128K | | | | | | — | — |
|
|
41
|
-
| `nvidia/deepseek-ai/deepseek-v3.1` | 128K | | | | | | — | — |
|
|
43
|
+
| `nvidia/bytedance/seed-oss-36b-instruct` | 262K | | | | | | — | — |
|
|
42
44
|
| `nvidia/deepseek-ai/deepseek-v3.1-terminus` | 128K | | | | | | — | — |
|
|
43
45
|
| `nvidia/deepseek-ai/deepseek-v3.2` | 164K | | | | | | — | — |
|
|
44
46
|
| `nvidia/deepseek-ai/deepseek-v4-flash` | 1.0M | | | | | | $0.14 | $0.28 |
|
|
45
47
|
| `nvidia/deepseek-ai/deepseek-v4-pro` | 1.0M | | | | | | $2 | $3 |
|
|
46
|
-
| `nvidia/google/codegemma-1.1-7b` | 128K | | | | | | — | — |
|
|
47
|
-
| `nvidia/google/codegemma-7b` | 128K | | | | | | — | — |
|
|
48
|
-
| `nvidia/google/gemma-2-27b-it` | 128K | | | | | | — | — |
|
|
49
48
|
| `nvidia/google/gemma-2-2b-it` | 128K | | | | | | — | — |
|
|
50
|
-
| `nvidia/google/gemma-3-12b-it` | 128K | | | | | | — | — |
|
|
51
|
-
| `nvidia/google/gemma-3-1b-it` | 128K | | | | | | — | — |
|
|
52
49
|
| `nvidia/google/gemma-3-27b-it` | 131K | | | | | | — | — |
|
|
53
50
|
| `nvidia/google/gemma-3n-e2b-it` | 128K | | | | | | — | — |
|
|
54
51
|
| `nvidia/google/gemma-3n-e4b-it` | 128K | | | | | | — | — |
|
|
55
52
|
| `nvidia/google/gemma-4-31b-it` | 256K | | | | | | — | — |
|
|
56
|
-
| `nvidia/
|
|
57
|
-
| `nvidia/meta/
|
|
53
|
+
| `nvidia/google/google-paligemma` | 128K | | | | | | — | — |
|
|
54
|
+
| `nvidia/meta/esm2-650m` | 128K | | | | | | — | — |
|
|
55
|
+
| `nvidia/meta/esmfold` | 128K | | | | | | — | — |
|
|
58
56
|
| `nvidia/meta/llama-3.1-70b-instruct` | 128K | | | | | | — | — |
|
|
57
|
+
| `nvidia/meta/llama-3.1-8b-instruct` | 16K | | | | | | — | — |
|
|
59
58
|
| `nvidia/meta/llama-3.2-11b-vision-instruct` | 128K | | | | | | — | — |
|
|
60
59
|
| `nvidia/meta/llama-3.2-1b-instruct` | 128K | | | | | | — | — |
|
|
60
|
+
| `nvidia/meta/llama-3.2-3b-instruct` | 33K | | | | | | — | — |
|
|
61
|
+
| `nvidia/meta/llama-3.2-90b-vision-instruct` | 128K | | | | | | — | — |
|
|
61
62
|
| `nvidia/meta/llama-3.3-70b-instruct` | 128K | | | | | | — | — |
|
|
62
63
|
| `nvidia/meta/llama-4-maverick-17b-128e-instruct` | 128K | | | | | | — | — |
|
|
63
|
-
| `nvidia/meta/llama-4-
|
|
64
|
-
| `nvidia/meta/llama3-70b-instruct` | 128K | | | | | | — | — |
|
|
65
|
-
| `nvidia/meta/llama3-8b-instruct` | 128K | | | | | | — | — |
|
|
66
|
-
| `nvidia/microsoft/phi-3-medium-128k-instruct` | 128K | | | | | | — | — |
|
|
67
|
-
| `nvidia/microsoft/phi-3-medium-4k-instruct` | 4K | | | | | | — | — |
|
|
68
|
-
| `nvidia/microsoft/phi-3-small-128k-instruct` | 128K | | | | | | — | — |
|
|
69
|
-
| `nvidia/microsoft/phi-3-small-8k-instruct` | 8K | | | | | | — | — |
|
|
70
|
-
| `nvidia/microsoft/phi-3-vision-128k-instruct` | 128K | | | | | | — | — |
|
|
71
|
-
| `nvidia/microsoft/phi-3.5-moe-instruct` | 128K | | | | | | — | — |
|
|
72
|
-
| `nvidia/microsoft/phi-3.5-vision-instruct` | 128K | | | | | | — | — |
|
|
64
|
+
| `nvidia/meta/llama-guard-4-12b` | 128K | | | | | | — | — |
|
|
73
65
|
| `nvidia/microsoft/phi-4-mini-instruct` | 131K | | | | | | — | — |
|
|
74
|
-
| `nvidia/
|
|
66
|
+
| `nvidia/microsoft/phi-4-multimodal-instruct` | 128K | | | | | | — | — |
|
|
75
67
|
| `nvidia/minimaxai/minimax-m2.5` | 205K | | | | | | — | — |
|
|
76
68
|
| `nvidia/minimaxai/minimax-m2.7` | 205K | | | | | | — | — |
|
|
77
|
-
| `nvidia/mistralai/codestral-22b-instruct-v0.1` | 128K | | | | | | — | — |
|
|
78
69
|
| `nvidia/mistralai/devstral-2-123b-instruct-2512` | 262K | | | | | | — | — |
|
|
79
|
-
| `nvidia/mistralai/
|
|
80
|
-
| `nvidia/mistralai/
|
|
81
|
-
| `nvidia/mistralai/mistral-large-2-instruct` | 128K | | | | | | — | — |
|
|
70
|
+
| `nvidia/mistralai/magistral-small-2506` | 33K | | | | | | — | — |
|
|
71
|
+
| `nvidia/mistralai/mistral-7b-instruct-v03` | 66K | | | | | | — | — |
|
|
82
72
|
| `nvidia/mistralai/mistral-large-3-675b-instruct-2512` | 262K | | | | | | — | — |
|
|
83
|
-
| `nvidia/mistralai/mistral-medium-3
|
|
84
|
-
| `nvidia/mistralai/mistral-
|
|
73
|
+
| `nvidia/mistralai/mistral-medium-3-instruct` | 131K | | | | | | — | — |
|
|
74
|
+
| `nvidia/mistralai/mistral-nemotron` | 128K | | | | | | — | — |
|
|
75
|
+
| `nvidia/mistralai/mistral-small-4-119b-2603` | 128K | | | | | | — | — |
|
|
76
|
+
| `nvidia/mistralai/mixtral-8x22b-instruct` | 66K | | | | | | — | — |
|
|
77
|
+
| `nvidia/mistralai/mixtral-8x7b-instruct` | 33K | | | | | | — | — |
|
|
85
78
|
| `nvidia/moonshotai/kimi-k2-instruct` | 128K | | | | | | — | — |
|
|
86
79
|
| `nvidia/moonshotai/kimi-k2-instruct-0905` | 262K | | | | | | — | — |
|
|
87
80
|
| `nvidia/moonshotai/kimi-k2-thinking` | 262K | | | | | | — | — |
|
|
88
|
-
| `nvidia/moonshotai/kimi-k2.5` | 262K | | | | | | — | — |
|
|
89
81
|
| `nvidia/moonshotai/kimi-k2.6` | 262K | | | | | | — | — |
|
|
90
|
-
| `nvidia/nvidia/
|
|
91
|
-
| `nvidia/nvidia/
|
|
92
|
-
| `nvidia/nvidia/
|
|
93
|
-
| `nvidia/nvidia/
|
|
94
|
-
| `nvidia/nvidia/
|
|
95
|
-
| `nvidia/nvidia/
|
|
96
|
-
| `nvidia/nvidia/llama-
|
|
97
|
-
| `nvidia/nvidia/
|
|
98
|
-
| `nvidia/nvidia/
|
|
82
|
+
| `nvidia/nvidia/active-speaker-detection` | — | | | | | | — | — |
|
|
83
|
+
| `nvidia/nvidia/bevformer` | 128K | | | | | | — | — |
|
|
84
|
+
| `nvidia/nvidia/cosmos-predict1-5b` | — | | | | | | — | — |
|
|
85
|
+
| `nvidia/nvidia/cosmos-transfer1-7b` | — | | | | | | — | — |
|
|
86
|
+
| `nvidia/nvidia/cosmos-transfer2_5-2b` | — | | | | | | — | — |
|
|
87
|
+
| `nvidia/nvidia/gliner-pii` | 128K | | | | | | — | — |
|
|
88
|
+
| `nvidia/nvidia/llama-3_1-nemotron-safety-guard-8b-v3` | 128K | | | | | | — | — |
|
|
89
|
+
| `nvidia/nvidia/llama-3_2-nemoretriever-300m-embed-v1` | 33K | | | | | | — | — |
|
|
90
|
+
| `nvidia/nvidia/llama-3_3-nemotron-super-49b-v1` | 131K | | | | | | — | — |
|
|
91
|
+
| `nvidia/nvidia/llama-3_3-nemotron-super-49b-v1_5` | 131K | | | | | | — | — |
|
|
92
|
+
| `nvidia/nvidia/llama-nemotron-embed-vl-1b-v2` | 33K | | | | | | — | — |
|
|
93
|
+
| `nvidia/nvidia/llama-nemotron-rerank-vl-1b-v2` | 128K | | | | | | — | — |
|
|
94
|
+
| `nvidia/nvidia/magpie-tts-zeroshot` | — | | | | | | — | — |
|
|
95
|
+
| `nvidia/nvidia/nemotron-3-content-safety` | 128K | | | | | | — | — |
|
|
99
96
|
| `nvidia/nvidia/nemotron-3-nano-30b-a3b` | 131K | | | | | | — | — |
|
|
100
97
|
| `nvidia/nvidia/nemotron-3-nano-omni-30b-a3b-reasoning` | 256K | | | | | | — | — |
|
|
101
98
|
| `nvidia/nvidia/nemotron-3-super-120b-a12b` | 262K | | | | | | $0.20 | $0.80 |
|
|
102
|
-
| `nvidia/nvidia/nemotron-
|
|
99
|
+
| `nvidia/nvidia/nemotron-content-safety-reasoning-4b` | 128K | | | | | | — | — |
|
|
100
|
+
| `nvidia/nvidia/nemotron-mini-4b-instruct` | 128K | | | | | | — | — |
|
|
101
|
+
| `nvidia/nvidia/nemotron-voicechat` | 128K | | | | | | — | — |
|
|
102
|
+
| `nvidia/nvidia/nv-embed-v1` | 33K | | | | | | — | — |
|
|
103
|
+
| `nvidia/nvidia/nv-embedcode-7b-v1` | 33K | | | | | | — | — |
|
|
103
104
|
| `nvidia/nvidia/nvidia-nemotron-nano-9b-v2` | 131K | | | | | | — | — |
|
|
104
|
-
| `nvidia/nvidia/
|
|
105
|
+
| `nvidia/nvidia/rerank-qa-mistral-4b` | 128K | | | | | | — | — |
|
|
106
|
+
| `nvidia/nvidia/riva-translate-4b-instruct-v1_1` | 128K | | | | | | — | — |
|
|
107
|
+
| `nvidia/nvidia/sparsedrive` | 128K | | | | | | — | — |
|
|
108
|
+
| `nvidia/nvidia/streampetr` | 128K | | | | | | — | — |
|
|
109
|
+
| `nvidia/nvidia/studiovoice` | 128K | | | | | | — | — |
|
|
110
|
+
| `nvidia/nvidia/synthetic-video-detector` | — | | | | | | — | — |
|
|
111
|
+
| `nvidia/nvidia/usdcode` | 128K | | | | | | — | — |
|
|
112
|
+
| `nvidia/nvidia/usdvalidate` | — | | | | | | — | — |
|
|
105
113
|
| `nvidia/openai/gpt-oss-120b` | 128K | | | | | | — | — |
|
|
114
|
+
| `nvidia/openai/gpt-oss-20b` | 131K | | | | | | — | — |
|
|
106
115
|
| `nvidia/openai/whisper-large-v3` | — | | | | | | — | — |
|
|
116
|
+
| `nvidia/qwen/qwen-image` | — | | | | | | — | — |
|
|
117
|
+
| `nvidia/qwen/qwen-image-edit` | — | | | | | | — | — |
|
|
107
118
|
| `nvidia/qwen/qwen2.5-coder-32b-instruct` | 128K | | | | | | — | — |
|
|
108
|
-
| `nvidia/qwen/qwen2.5-coder-7b-instruct` | 128K | | | | | | — | — |
|
|
109
|
-
| `nvidia/qwen/qwen3-235b-a22b` | 131K | | | | | | — | — |
|
|
110
119
|
| `nvidia/qwen/qwen3-coder-480b-a35b-instruct` | 262K | | | | | | — | — |
|
|
111
120
|
| `nvidia/qwen/qwen3-next-80b-a3b-instruct` | 262K | | | | | | — | — |
|
|
112
121
|
| `nvidia/qwen/qwen3-next-80b-a3b-thinking` | 262K | | | | | | — | — |
|
|
122
|
+
| `nvidia/qwen/qwen3.5-122b-a10b` | 262K | | | | | | — | — |
|
|
113
123
|
| `nvidia/qwen/qwen3.5-397b-a17b` | 262K | | | | | | — | — |
|
|
114
|
-
| `nvidia/
|
|
124
|
+
| `nvidia/sarvamai/sarvam-m` | 128K | | | | | | — | — |
|
|
115
125
|
| `nvidia/stepfun-ai/step-3.5-flash` | 256K | | | | | | — | — |
|
|
126
|
+
| `nvidia/upstage/solar-10_7b-instruct` | 128K | | | | | | — | — |
|
|
116
127
|
| `nvidia/z-ai/glm-5.1` | 131K | | | | | | — | — |
|
|
117
128
|
| `nvidia/z-ai/glm4.7` | 205K | | | | | | — | — |
|
|
118
|
-
| `nvidia/z-ai/glm5` | 203K | | | | | | — | — |
|
|
119
129
|
|
|
120
130
|
## Advanced configuration
|
|
121
131
|
|
|
@@ -127,7 +137,7 @@ const agent = new Agent({
|
|
|
127
137
|
name: "custom-agent",
|
|
128
138
|
model: {
|
|
129
139
|
url: "https://integrate.api.nvidia.com/v1",
|
|
130
|
-
id: "nvidia/
|
|
140
|
+
id: "nvidia/abacusai/dracarys-llama-3_1-70b-instruct",
|
|
131
141
|
apiKey: process.env.NVIDIA_API_KEY,
|
|
132
142
|
headers: {
|
|
133
143
|
"X-Custom-Header": "value"
|
|
@@ -145,8 +155,8 @@ const agent = new Agent({
|
|
|
145
155
|
model: ({ requestContext }) => {
|
|
146
156
|
const useAdvanced = requestContext.task === "complex";
|
|
147
157
|
return useAdvanced
|
|
148
|
-
? "nvidia/z-ai/
|
|
149
|
-
: "nvidia/
|
|
158
|
+
? "nvidia/z-ai/glm4.7"
|
|
159
|
+
: "nvidia/abacusai/dracarys-llama-3_1-70b-instruct";
|
|
150
160
|
}
|
|
151
161
|
});
|
|
152
162
|
```
|
|
@@ -55,7 +55,7 @@ for await (const chunk of stream) {
|
|
|
55
55
|
| `ollama-cloud/kimi-k2-thinking` | 262K | | | | | | — | — |
|
|
56
56
|
| `ollama-cloud/kimi-k2:1t` | 262K | | | | | | — | — |
|
|
57
57
|
| `ollama-cloud/kimi-k2.5` | 262K | | | | | | — | — |
|
|
58
|
-
| `ollama-cloud/kimi-k2.6
|
|
58
|
+
| `ollama-cloud/kimi-k2.6` | 262K | | | | | | — | — |
|
|
59
59
|
| `ollama-cloud/minimax-m2` | 205K | | | | | | — | — |
|
|
60
60
|
| `ollama-cloud/minimax-m2.1` | 205K | | | | | | — | — |
|
|
61
61
|
| `ollama-cloud/minimax-m2.5` | 205K | | | | | | — | — |
|
|
@@ -176,6 +176,8 @@ const response = await agent.generate("Hello!", {
|
|
|
176
176
|
|
|
177
177
|
**forceReasoning** (`boolean | undefined`)
|
|
178
178
|
|
|
179
|
+
**allowedTools** (`{ toolNames: string[]; mode?: "auto" | "required" | undefined; } | undefined`)
|
|
180
|
+
|
|
179
181
|
## Direct provider installation
|
|
180
182
|
|
|
181
183
|
This provider can also be installed directly as a standalone package, which can be used instead of the Mastra model router string. View the [package documentation](https://www.npmjs.com/package/@ai-sdk/openai) for more details.
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# OpenCode Zen
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 40 OpenCode Zen models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [OpenCode Zen documentation](https://opencode.ai/docs/zen).
|
|
6
6
|
|
|
@@ -32,47 +32,48 @@ for await (const chunk of stream) {
|
|
|
32
32
|
|
|
33
33
|
## Models
|
|
34
34
|
|
|
35
|
-
| Model
|
|
36
|
-
|
|
|
37
|
-
| `opencode/big-pickle`
|
|
38
|
-
| `opencode/claude-haiku-4-5`
|
|
39
|
-
| `opencode/claude-opus-4-1`
|
|
40
|
-
| `opencode/claude-opus-4-5`
|
|
41
|
-
| `opencode/claude-opus-4-6`
|
|
42
|
-
| `opencode/claude-opus-4-7`
|
|
43
|
-
| `opencode/claude-sonnet-4`
|
|
44
|
-
| `opencode/claude-sonnet-4-5`
|
|
45
|
-
| `opencode/claude-sonnet-4-6`
|
|
46
|
-
| `opencode/
|
|
47
|
-
| `opencode/gemini-3
|
|
48
|
-
| `opencode/
|
|
49
|
-
| `opencode/glm-5
|
|
50
|
-
| `opencode/
|
|
51
|
-
| `opencode/gpt-5
|
|
52
|
-
| `opencode/gpt-5-
|
|
53
|
-
| `opencode/gpt-5
|
|
54
|
-
| `opencode/gpt-5.1
|
|
55
|
-
| `opencode/gpt-5.1-codex
|
|
56
|
-
| `opencode/gpt-5.1-codex-
|
|
57
|
-
| `opencode/gpt-5.
|
|
58
|
-
| `opencode/gpt-5.2
|
|
59
|
-
| `opencode/gpt-5.
|
|
60
|
-
| `opencode/gpt-5.3-codex
|
|
61
|
-
| `opencode/gpt-5.
|
|
62
|
-
| `opencode/gpt-5.4
|
|
63
|
-
| `opencode/gpt-5.4-
|
|
64
|
-
| `opencode/gpt-5.4-
|
|
65
|
-
| `opencode/gpt-5.
|
|
66
|
-
| `opencode/gpt-5.5
|
|
67
|
-
| `opencode/
|
|
68
|
-
| `opencode/kimi-k2.5`
|
|
69
|
-
| `opencode/kimi-k2.6`
|
|
70
|
-
| `opencode/minimax-m2.5`
|
|
71
|
-
| `opencode/minimax-m2.5-free`
|
|
72
|
-
| `opencode/minimax-m2.7`
|
|
73
|
-
| `opencode/nemotron-3-super-free`
|
|
74
|
-
| `opencode/qwen3.5-plus`
|
|
75
|
-
| `opencode/qwen3.6-plus`
|
|
35
|
+
| Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
|
|
36
|
+
| --------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
|
|
37
|
+
| `opencode/big-pickle` | 200K | | | | | | — | — |
|
|
38
|
+
| `opencode/claude-haiku-4-5` | 200K | | | | | | $1 | $5 |
|
|
39
|
+
| `opencode/claude-opus-4-1` | 200K | | | | | | $15 | $75 |
|
|
40
|
+
| `opencode/claude-opus-4-5` | 200K | | | | | | $5 | $25 |
|
|
41
|
+
| `opencode/claude-opus-4-6` | 1.0M | | | | | | $5 | $25 |
|
|
42
|
+
| `opencode/claude-opus-4-7` | 1.0M | | | | | | $5 | $25 |
|
|
43
|
+
| `opencode/claude-sonnet-4` | 1.0M | | | | | | $3 | $15 |
|
|
44
|
+
| `opencode/claude-sonnet-4-5` | 1.0M | | | | | | $3 | $15 |
|
|
45
|
+
| `opencode/claude-sonnet-4-6` | 1.0M | | | | | | $3 | $15 |
|
|
46
|
+
| `opencode/deepseek-v4-flash-free` | 1.0M | | | | | | — | — |
|
|
47
|
+
| `opencode/gemini-3-flash` | 1.0M | | | | | | $0.50 | $3 |
|
|
48
|
+
| `opencode/gemini-3.1-pro` | 1.0M | | | | | | $2 | $12 |
|
|
49
|
+
| `opencode/glm-5` | 205K | | | | | | $1 | $3 |
|
|
50
|
+
| `opencode/glm-5.1` | 205K | | | | | | $1 | $4 |
|
|
51
|
+
| `opencode/gpt-5` | 400K | | | | | | $1 | $9 |
|
|
52
|
+
| `opencode/gpt-5-codex` | 400K | | | | | | $1 | $9 |
|
|
53
|
+
| `opencode/gpt-5-nano` | 400K | | | | | | $0.05 | $0.40 |
|
|
54
|
+
| `opencode/gpt-5.1` | 400K | | | | | | $1 | $9 |
|
|
55
|
+
| `opencode/gpt-5.1-codex` | 400K | | | | | | $1 | $9 |
|
|
56
|
+
| `opencode/gpt-5.1-codex-max` | 400K | | | | | | $1 | $10 |
|
|
57
|
+
| `opencode/gpt-5.1-codex-mini` | 400K | | | | | | $0.25 | $2 |
|
|
58
|
+
| `opencode/gpt-5.2` | 400K | | | | | | $2 | $14 |
|
|
59
|
+
| `opencode/gpt-5.2-codex` | 400K | | | | | | $2 | $14 |
|
|
60
|
+
| `opencode/gpt-5.3-codex` | 400K | | | | | | $2 | $14 |
|
|
61
|
+
| `opencode/gpt-5.3-codex-spark` | 128K | | | | | | $2 | $14 |
|
|
62
|
+
| `opencode/gpt-5.4` | 1.1M | | | | | | $3 | $15 |
|
|
63
|
+
| `opencode/gpt-5.4-mini` | 400K | | | | | | $0.75 | $5 |
|
|
64
|
+
| `opencode/gpt-5.4-nano` | 400K | | | | | | $0.20 | $1 |
|
|
65
|
+
| `opencode/gpt-5.4-pro` | 1.1M | | | | | | $30 | $180 |
|
|
66
|
+
| `opencode/gpt-5.5` | 1.1M | | | | | | $5 | $30 |
|
|
67
|
+
| `opencode/gpt-5.5-pro` | 1.1M | | | | | | $30 | $180 |
|
|
68
|
+
| `opencode/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
|
|
69
|
+
| `opencode/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
|
|
70
|
+
| `opencode/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
|
|
71
|
+
| `opencode/minimax-m2.5-free` | 205K | | | | | | — | — |
|
|
72
|
+
| `opencode/minimax-m2.7` | 205K | | | | | | $0.30 | $1 |
|
|
73
|
+
| `opencode/nemotron-3-super-free` | 205K | | | | | | — | — |
|
|
74
|
+
| `opencode/qwen3.5-plus` | 262K | | | | | | $0.20 | $1 |
|
|
75
|
+
| `opencode/qwen3.6-plus` | 262K | | | | | | $0.50 | $3 |
|
|
76
|
+
| `opencode/ring-2.6-1t-free` | 262K | | | | | | — | — |
|
|
76
77
|
|
|
77
78
|
## Advanced configuration
|
|
78
79
|
|
|
@@ -102,7 +103,7 @@ const agent = new Agent({
|
|
|
102
103
|
model: ({ requestContext }) => {
|
|
103
104
|
const useAdvanced = requestContext.task === "complex";
|
|
104
105
|
return useAdvanced
|
|
105
|
-
? "opencode/
|
|
106
|
+
? "opencode/ring-2.6-1t-free"
|
|
106
107
|
: "opencode/big-pickle";
|
|
107
108
|
}
|
|
108
109
|
});
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# Poe
|
|
2
2
|
|
|
3
|
-
Access
|
|
3
|
+
Access 124 Poe models through Mastra's model router. Authentication is handled automatically using the `POE_API_KEY` environment variable.
|
|
4
4
|
|
|
5
5
|
Learn more in the [Poe documentation](https://creator.poe.com/docs/external-applications/openai-compatible-api).
|
|
6
6
|
|
|
@@ -51,6 +51,8 @@ for await (const chunk of stream) {
|
|
|
51
51
|
| `poe/elevenlabs/elevenlabs-music` | 2K | | | | | | — | — |
|
|
52
52
|
| `poe/elevenlabs/elevenlabs-v2.5-turbo` | 128K | | | | | | — | — |
|
|
53
53
|
| `poe/elevenlabs/elevenlabs-v3` | 128K | | | | | | — | — |
|
|
54
|
+
| `poe/empiriolabs/deepseek-v4-flash-el` | 1.0M | | | | | | $0.14 | $0.28 |
|
|
55
|
+
| `poe/empiriolabs/deepseek-v4-pro-el` | 1.0M | | | | | | $2 | $3 |
|
|
54
56
|
| `poe/fireworks-ai/kimi-k2.5-fw` | 262K | | | | | | — | — |
|
|
55
57
|
| `poe/google/gemini-2.0-flash` | 990K | | | | | | $0.10 | $0.42 |
|
|
56
58
|
| `poe/google/gemini-2.0-flash-lite` | 990K | | | | | | $0.05 | $0.21 |
|
|
@@ -87,6 +89,7 @@ for await (const chunk of stream) {
|
|
|
87
89
|
| `poe/novita/glm-5` | 205K | | | | | | $1 | $3 |
|
|
88
90
|
| `poe/novita/kimi-k2-thinking` | 256K | | | | | | — | — |
|
|
89
91
|
| `poe/novita/kimi-k2.5` | 128K | | | | | | $0.60 | $3 |
|
|
92
|
+
| `poe/novita/kimi-k2.6` | 262K | | | | | | $0.96 | $4 |
|
|
90
93
|
| `poe/novita/minimax-m2.1` | 205K | | | | | | — | — |
|
|
91
94
|
| `poe/openai/dall-e-3` | 800 | | | | | | — | — |
|
|
92
95
|
| `poe/openai/gpt-3.5-turbo` | 16K | | | | | | $0.45 | $1 |
|