@mastra/mcp-docs-server 1.1.35-alpha.2 → 1.1.35-alpha.21

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (105)
  1. package/.docs/course/03-agent-memory/18-advanced-configuration-semantic-recall.md +48 -4
  2. package/.docs/docs/agents/background-tasks.md +62 -2
  3. package/.docs/docs/agents/processors.md +34 -2
  4. package/.docs/docs/agents/response-caching.md +148 -0
  5. package/.docs/docs/agents/using-tools.md +8 -0
  6. package/.docs/docs/editor/tools.md +1 -1
  7. package/.docs/docs/index.md +2 -2
  8. package/.docs/docs/mastra-platform/configuration.md +1 -1
  9. package/.docs/docs/mastra-platform/overview.md +1 -1
  10. package/.docs/docs/memory/observational-memory.md +63 -14
  11. package/.docs/docs/memory/overview.md +2 -1
  12. package/.docs/docs/memory/semantic-recall.md +68 -6
  13. package/.docs/docs/observability/logging.md +2 -2
  14. package/.docs/docs/observability/metrics/overview.md +4 -4
  15. package/.docs/docs/observability/overview.md +6 -6
  16. package/.docs/docs/observability/tracing/bridges/otel.md +25 -0
  17. package/.docs/docs/observability/tracing/exporters/arize.md +5 -5
  18. package/.docs/docs/observability/tracing/exporters/braintrust.md +37 -0
  19. package/.docs/docs/observability/tracing/exporters/langfuse.md +21 -0
  20. package/.docs/docs/observability/tracing/exporters/{cloud.md → mastra-platform.md} +28 -26
  21. package/.docs/docs/observability/tracing/exporters/{default.md → mastra-storage.md} +56 -19
  22. package/.docs/docs/observability/tracing/exporters/otel.md +79 -2
  23. package/.docs/docs/observability/tracing/overview.md +30 -29
  24. package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +6 -6
  25. package/.docs/docs/server/mastra-server.md +30 -19
  26. package/.docs/docs/studio/observability.md +4 -4
  27. package/.docs/docs/studio/overview.md +4 -0
  28. package/.docs/docs/workflows/suspend-and-resume.md +28 -1
  29. package/.docs/guides/deployment/inngest.md +29 -8
  30. package/.docs/guides/guide/web-search.md +7 -7
  31. package/.docs/guides/migrations/mastra-cloud.md +6 -6
  32. package/.docs/guides/migrations/upgrade-to-v1/tracing.md +19 -17
  33. package/.docs/models/gateways/azure-openai.md +94 -23
  34. package/.docs/models/gateways/netlify.md +3 -1
  35. package/.docs/models/gateways/openrouter.md +5 -1
  36. package/.docs/models/gateways/vercel.md +2 -1
  37. package/.docs/models/index.md +1 -1
  38. package/.docs/models/providers/deepinfra.md +2 -1
  39. package/.docs/models/providers/deepseek.md +3 -1
  40. package/.docs/models/providers/digitalocean.md +10 -2
  41. package/.docs/models/providers/firepass.md +71 -0
  42. package/.docs/models/providers/google.md +3 -2
  43. package/.docs/models/providers/kilo.md +5 -3
  44. package/.docs/models/providers/kiro.md +110 -0
  45. package/.docs/models/providers/llmgateway.md +8 -2
  46. package/.docs/models/providers/nebius.md +37 -55
  47. package/.docs/models/providers/openai.md +2 -0
  48. package/.docs/models/providers/opencode-go.md +2 -4
  49. package/.docs/models/providers/opencode.md +3 -3
  50. package/.docs/models/providers/poe.md +4 -1
  51. package/.docs/models/providers/qiniu-ai.md +2 -2
  52. package/.docs/models/providers/wafer.ai.md +2 -1
  53. package/.docs/models/providers/xiaomi-token-plan-ams.md +6 -5
  54. package/.docs/models/providers/xiaomi-token-plan-cn.md +6 -5
  55. package/.docs/models/providers/xiaomi-token-plan-sgp.md +6 -5
  56. package/.docs/models/providers/xiaomi.md +2 -2
  57. package/.docs/models/providers/zenmux.md +1 -1
  58. package/.docs/models/providers.md +1 -0
  59. package/.docs/reference/agents/agent.md +2 -0
  60. package/.docs/reference/cli/mastra.md +464 -0
  61. package/.docs/reference/client-js/agents.md +26 -1
  62. package/.docs/reference/client-js/responses.md +4 -0
  63. package/.docs/reference/configuration.md +6 -6
  64. package/.docs/reference/editor/tool-provider.md +3 -3
  65. package/.docs/reference/harness/harness-class.md +23 -8
  66. package/.docs/reference/index.md +3 -0
  67. package/.docs/reference/memory/observational-memory.md +11 -1
  68. package/.docs/reference/observability/metrics/automatic-metrics.md +2 -4
  69. package/.docs/reference/observability/tracing/bridges/datadog.md +2 -2
  70. package/.docs/reference/observability/tracing/bridges/otel.md +26 -4
  71. package/.docs/reference/observability/tracing/configuration.md +6 -3
  72. package/.docs/reference/observability/tracing/exporters/arize.md +1 -1
  73. package/.docs/reference/observability/tracing/exporters/braintrust.md +2 -0
  74. package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +3 -1
  75. package/.docs/reference/observability/tracing/exporters/console-exporter.md +2 -2
  76. package/.docs/reference/observability/tracing/exporters/default-exporter.md +7 -1
  77. package/.docs/reference/observability/tracing/exporters/mastra-platform-exporter.md +263 -0
  78. package/.docs/reference/observability/tracing/exporters/mastra-storage-exporter.md +194 -0
  79. package/.docs/reference/observability/tracing/exporters/otel.md +12 -8
  80. package/.docs/reference/observability/tracing/instances.md +2 -2
  81. package/.docs/reference/observability/tracing/interfaces.md +37 -2
  82. package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +22 -0
  83. package/.docs/reference/observability/tracing/span-filtering.md +2 -2
  84. package/.docs/reference/processors/processor-interface.md +74 -12
  85. package/.docs/reference/processors/provider-history-compat.md +132 -0
  86. package/.docs/reference/processors/response-cache.md +114 -0
  87. package/.docs/reference/processors/tool-call-filter.md +28 -0
  88. package/.docs/reference/storage/clickhouse.md +8 -8
  89. package/.docs/reference/storage/cloudflare-d1.md +1 -1
  90. package/.docs/reference/storage/cloudflare.md +1 -1
  91. package/.docs/reference/storage/composite.md +1 -1
  92. package/.docs/reference/storage/convex.md +1 -1
  93. package/.docs/reference/storage/duckdb.md +3 -3
  94. package/.docs/reference/storage/dynamodb.md +1 -1
  95. package/.docs/reference/storage/lance.md +1 -1
  96. package/.docs/reference/storage/libsql.md +1 -1
  97. package/.docs/reference/storage/postgresql.md +1 -1
  98. package/.docs/reference/storage/upstash.md +1 -1
  99. package/.docs/reference/streaming/ChunkType.md +44 -0
  100. package/.docs/reference/streaming/agents/stream.md +18 -2
  101. package/.docs/reference/tools/create-tool.md +46 -0
  102. package/.docs/reference/tools/mcp-client.md +47 -0
  103. package/.docs/reference/workflows/workflow-state-reader.md +113 -0
  104. package/CHANGELOG.md +71 -0
  105. package/package.json +4 -4
@@ -0,0 +1,71 @@
1
+ # ![Fireworks (Firepass) logo](https://models.dev/logos/firepass.svg)Fireworks (Firepass)
2
+
3
+ Access 1 Fireworks (Firepass) model through Mastra's model router. Authentication is handled automatically using the `FIREPASS_API_KEY` environment variable.
4
+
5
+ Learn more in the [Fireworks (Firepass) documentation](https://docs.fireworks.ai/firepass).
6
+
7
+ ```bash
8
+ FIREPASS_API_KEY=your-api-key
9
+ ```
10
+
11
+ ```typescript
12
+ import { Agent } from "@mastra/core/agent";
13
+
14
+ const agent = new Agent({
15
+ id: "my-agent",
16
+ name: "My Agent",
17
+ instructions: "You are a helpful assistant",
18
+ model: "firepass/accounts/fireworks/routers/kimi-k2p6-turbo"
19
+ });
20
+
21
+ // Generate a response
22
+ const response = await agent.generate("Hello!");
23
+
24
+ // Stream a response
25
+ const stream = await agent.stream("Tell me a story");
26
+ for await (const chunk of stream) {
27
+ console.log(chunk);
28
+ }
29
+ ```
30
+
31
+ > **Info:** Mastra uses the OpenAI-compatible `/chat/completions` endpoint. Some provider-specific features may not be available. Check the [Fireworks (Firepass) documentation](https://docs.fireworks.ai/firepass) for details.
32
+
33
+ ## Models
34
+
35
+ | Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
36
+ | ----------------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
+ | `firepass/accounts/fireworks/routers/kimi-k2p6-turbo` | 262K | | | | | | — | — |
38
+
39
+ ## Advanced configuration
40
+
41
+ ### Custom headers
42
+
43
+ ```typescript
44
+ const agent = new Agent({
45
+ id: "custom-agent",
46
+ name: "custom-agent",
47
+ model: {
48
+ url: "https://api.fireworks.ai/inference/v1/",
49
+ id: "firepass/accounts/fireworks/routers/kimi-k2p6-turbo",
50
+ apiKey: process.env.FIREPASS_API_KEY,
51
+ headers: {
52
+ "X-Custom-Header": "value"
53
+ }
54
+ }
55
+ });
56
+ ```
57
+
58
+ ### Dynamic model selection
59
+
60
+ ```typescript
61
+ const agent = new Agent({
62
+ id: "dynamic-agent",
63
+ name: "Dynamic Agent",
64
+ model: ({ requestContext }) => {
65
+ const useAdvanced = requestContext.task === "complex";
66
+ return useAdvanced
67
+ ? "firepass/accounts/fireworks/routers/kimi-k2p6-turbo"
68
+ : "firepass/accounts/fireworks/routers/kimi-k2p6-turbo";
69
+ }
70
+ });
71
+ ```
@@ -1,8 +1,8 @@
1
1
  # ![Google logo](https://models.dev/logos/google.svg)Google
2
2
 
3
- Access 37 Google models through Mastra's model router. Authentication is handled automatically using the `GOOGLE_GENERATIVE_AI_API_KEY` environment variable.
3
+ Access 38 Google models through Mastra's model router. Authentication is handled automatically using the `GOOGLE_GENERATIVE_AI_API_KEY` environment variable.
4
4
 
5
- Learn more in the [Google documentation](https://ai.google.dev/gemini-api/docs/pricing).
5
+ Learn more in the [Google documentation](https://ai.google.dev/gemini-api/docs/models).
6
6
 
7
7
  ```bash
8
8
  GOOGLE_GENERATIVE_AI_API_KEY=your-api-key
@@ -54,6 +54,7 @@ for await (const chunk of stream) {
54
54
  | `google/gemini-3-flash-preview` | 1.0M | | | | | | $0.50 | $3 |
55
55
  | `google/gemini-3-pro-preview` | 1.0M | | | | | | $2 | $12 |
56
56
  | `google/gemini-3.1-flash-image-preview` | 131K | | | | | | $0.25 | $60 |
57
+ | `google/gemini-3.1-flash-lite` | 1.0M | | | | | | $0.25 | $2 |
57
58
  | `google/gemini-3.1-flash-lite-preview` | 1.0M | | | | | | $0.25 | $2 |
58
59
  | `google/gemini-3.1-pro-preview` | 1.0M | | | | | | $2 | $12 |
59
60
  | `google/gemini-3.1-pro-preview-customtools` | 1.0M | | | | | | $2 | $12 |
@@ -1,6 +1,6 @@
1
1
  # ![Kilo Gateway logo](https://models.dev/logos/kilo.svg)Kilo Gateway
2
2
 
3
- Access 355 Kilo Gateway models through Mastra's model router. Authentication is handled automatically using the `KILO_API_KEY` environment variable.
3
+ Access 357 Kilo Gateway models through Mastra's model router. Authentication is handled automatically using the `KILO_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [Kilo Gateway documentation](https://kilo.ai).
6
6
 
@@ -50,7 +50,6 @@ for await (const chunk of stream) {
50
50
  | `kilo/alfredpros/codellama-7b-instruct-solidity` | 4K | | | | | | $0.80 | $1 |
51
51
  | `kilo/alibaba/tongyi-deepresearch-30b-a3b` | 131K | | | | | | $0.09 | $0.45 |
52
52
  | `kilo/allenai/olmo-3-32b-think` | 66K | | | | | | $0.15 | $0.50 |
53
- | `kilo/allenai/olmo-3.1-32b-instruct` | 66K | | | | | | $0.20 | $0.60 |
54
53
  | `kilo/alpindale/goliath-120b` | 6K | | | | | | $4 | $8 |
55
54
  | `kilo/amazon/nova-2-lite-v1` | 1.0M | | | | | | $0.30 | $3 |
56
55
  | `kilo/amazon/nova-lite-v1` | 300K | | | | | | $0.06 | $0.24 |
@@ -79,6 +78,7 @@ for await (const chunk of stream) {
79
78
  | `kilo/arcee-ai/trinity-large-thinking` | 262K | | | | | | $0.22 | $0.85 |
80
79
  | `kilo/arcee-ai/trinity-mini` | 131K | | | | | | $0.04 | $0.15 |
81
80
  | `kilo/arcee-ai/virtuoso-large` | 131K | | | | | | $0.75 | $1 |
81
+ | `kilo/baidu/cobuddy:free` | 131K | | | | | | — | — |
82
82
  | `kilo/baidu/ernie-4.5-21b-a3b` | 120K | | | | | | $0.07 | $0.28 |
83
83
  | `kilo/baidu/ernie-4.5-21b-a3b-thinking` | 131K | | | | | | $0.07 | $0.28 |
84
84
  | `kilo/baidu/ernie-4.5-300b-a47b` | 123K | | | | | | $0.28 | $1 |
@@ -161,6 +161,7 @@ for await (const chunk of stream) {
161
161
  | `kilo/meta-llama/llama-guard-3-8b` | 131K | | | | | | $0.02 | $0.06 |
162
162
  | `kilo/meta-llama/llama-guard-4-12b` | 164K | | | | | | $0.18 | $0.18 |
163
163
  | `kilo/microsoft/phi-4` | 16K | | | | | | $0.06 | $0.14 |
164
+ | `kilo/microsoft/phi-4-mini-instruct` | 128K | | | | | | $0.08 | $0.35 |
164
165
  | `kilo/microsoft/wizardlm-2-8x22b` | 66K | | | | | | $0.62 | $0.62 |
165
166
  | `kilo/minimax/minimax-01` | 1.0M | | | | | | $0.20 | $1 |
166
167
  | `kilo/minimax/minimax-m1` | 1.0M | | | | | | $0.40 | $2 |
@@ -182,6 +183,7 @@ for await (const chunk of stream) {
182
183
  | `kilo/mistralai/mistral-large-2411` | 131K | | | | | | $2 | $6 |
183
184
  | `kilo/mistralai/mistral-large-2512` | 262K | | | | | | $0.50 | $2 |
184
185
  | `kilo/mistralai/mistral-medium-3` | 131K | | | | | | $0.40 | $2 |
186
+ | `kilo/mistralai/mistral-medium-3-5` | 262K | | | | | | $2 | $8 |
185
187
  | `kilo/mistralai/mistral-medium-3.1` | 131K | | | | | | $0.40 | $2 |
186
188
  | `kilo/mistralai/mistral-nemo` | 131K | | | | | | $0.02 | $0.04 |
187
189
  | `kilo/mistralai/mistral-saba` | 33K | | | | | | $0.20 | $0.60 |
@@ -212,7 +214,6 @@ for await (const chunk of stream) {
212
214
  | `kilo/nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free` | 256K | | | | | | — | — |
213
215
  | `kilo/nvidia/nemotron-3-super-120b-a12b` | 262K | | | | | | $0.10 | $0.50 |
214
216
  | `kilo/nvidia/nemotron-3-super-120b-a12b:free` | 262K | | | | | | — | — |
215
- | `kilo/nvidia/nemotron-nano-12b-v2-vl` | 131K | | | | | | $0.20 | $0.60 |
216
217
  | `kilo/nvidia/nemotron-nano-9b-v2` | 131K | | | | | | $0.04 | $0.16 |
217
218
  | `kilo/openai/gpt-3.5-turbo` | 16K | | | | | | $0.50 | $2 |
218
219
  | `kilo/openai/gpt-3.5-turbo-0613` | 4K | | | | | | $1 | $2 |
@@ -263,6 +264,7 @@ for await (const chunk of stream) {
263
264
  | `kilo/openai/gpt-5.5-pro` | 1.1M | | | | | | $30 | $180 |
264
265
  | `kilo/openai/gpt-audio` | 128K | | | | | | $3 | $10 |
265
266
  | `kilo/openai/gpt-audio-mini` | 128K | | | | | | $0.60 | $2 |
267
+ | `kilo/openai/gpt-chat-latest` | 400K | | | | | | $5 | $30 |
266
268
  | `kilo/openai/gpt-oss-120b` | 131K | | | | | | $0.04 | $0.19 |
267
269
  | `kilo/openai/gpt-oss-20b` | 131K | | | | | | $0.03 | $0.14 |
268
270
  | `kilo/openai/gpt-oss-safeguard-20b` | 131K | | | | | | $0.07 | $0.30 |
@@ -0,0 +1,110 @@
1
+ # ![Kiro logo](https://models.dev/logos/kiro.svg)Kiro
2
+
3
+ Access 12 Kiro models through Mastra's model router. Authentication is handled automatically using the `KIRO_API_KEY` environment variable.
4
+
5
+ Learn more in the [Kiro documentation](https://kiro.dev).
6
+
7
+ ```bash
8
+ KIRO_API_KEY=your-api-key
9
+ ```
10
+
11
+ ```typescript
12
+ import { Agent } from "@mastra/core/agent";
13
+
14
+ const agent = new Agent({
15
+ id: "my-agent",
16
+ name: "My Agent",
17
+ instructions: "You are a helpful assistant",
18
+ model: "kiro/auto"
19
+ });
20
+
21
+ // Generate a response
22
+ const response = await agent.generate("Hello!");
23
+
24
+ // Stream a response
25
+ const stream = await agent.stream("Tell me a story");
26
+ for await (const chunk of stream) {
27
+ console.log(chunk);
28
+ }
29
+ ```
30
+
31
+ > **Info:** Mastra uses the OpenAI-compatible `/chat/completions` endpoint. Some provider-specific features may not be available. Check the [Kiro documentation](https://kiro.dev) for details.
32
+
33
+ ## Models
34
+
35
+ | Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
36
+ | ------------------------ | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
+ | `kiro/auto` | 1.0M | | | | | | — | — |
38
+ | `kiro/claude-haiku-4.5` | 200K | | | | | | — | — |
39
+ | `kiro/claude-opus-4.5` | 200K | | | | | | — | — |
40
+ | `kiro/claude-opus-4.6` | 1.0M | | | | | | — | — |
41
+ | `kiro/claude-opus-4.7` | 1.0M | | | | | | — | — |
42
+ | `kiro/claude-sonnet-4` | 200K | | | | | | — | — |
43
+ | `kiro/claude-sonnet-4.5` | 200K | | | | | | — | — |
44
+ | `kiro/claude-sonnet-4.6` | 1.0M | | | | | | — | — |
45
+ | `kiro/deepseek-3.2` | 164K | | | | | | — | — |
46
+ | `kiro/minimax-m2.1` | 196K | | | | | | — | — |
47
+ | `kiro/minimax-m2.5` | 196K | | | | | | — | — |
48
+ | `kiro/qwen3-coder-next` | 256K | | | | | | — | — |
49
+
50
+ ## Advanced configuration
51
+
52
+ ### Custom headers
53
+
54
+ ```typescript
55
+ const agent = new Agent({
56
+ id: "custom-agent",
57
+ name: "custom-agent",
58
+ model: {
59
+ url: "https://q.us-east-1.amazonaws.com",
60
+ id: "kiro/auto",
61
+ apiKey: process.env.KIRO_API_KEY,
62
+ headers: {
63
+ "X-Custom-Header": "value"
64
+ }
65
+ }
66
+ });
67
+ ```
68
+
69
+ ### Dynamic model selection
70
+
71
+ ```typescript
72
+ const agent = new Agent({
73
+ id: "dynamic-agent",
74
+ name: "Dynamic Agent",
75
+ model: ({ requestContext }) => {
76
+ const useAdvanced = requestContext.task === "complex";
77
+ return useAdvanced
78
+ ? "kiro/qwen3-coder-next"
79
+ : "kiro/auto";
80
+ }
81
+ });
82
+ ```
83
+
84
+ ## Direct provider installation
85
+
86
+ This provider can also be installed directly as a standalone package, which can be used instead of the Mastra model router string. View the [package documentation](https://www.npmjs.com/package/kiro-acp-ai-provider) for more details.
87
+
88
+ **npm**:
89
+
90
+ ```bash
91
+ npm install kiro-acp-ai-provider
92
+ ```
93
+
94
+ **pnpm**:
95
+
96
+ ```bash
97
+ pnpm add kiro-acp-ai-provider
98
+ ```
99
+
100
+ **Yarn**:
101
+
102
+ ```bash
103
+ yarn add kiro-acp-ai-provider
104
+ ```
105
+
106
+ **Bun**:
107
+
108
+ ```bash
109
+ bun add kiro-acp-ai-provider
110
+ ```
@@ -1,6 +1,6 @@
1
1
  # ![LLM Gateway logo](https://models.dev/logos/llmgateway.svg)LLM Gateway
2
2
 
3
- Access 189 LLM Gateway models through Mastra's model router. Authentication is handled automatically using the `LLMGATEWAY_API_KEY` environment variable.
3
+ Access 195 LLM Gateway models through Mastra's model router. Authentication is handled automatically using the `LLMGATEWAY_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [LLM Gateway documentation](https://llmgateway.io/docs).
6
6
 
@@ -66,6 +66,7 @@ for await (const chunk of stream) {
66
66
  | `llmgateway/gemini-2.5-flash-lite-preview-09-2025` | 1.0M | | | | | | $0.10 | $0.40 |
67
67
  | `llmgateway/gemini-2.5-pro` | 1.0M | | | | | | $1 | $10 |
68
68
  | `llmgateway/gemini-3-flash-preview` | 1.0M | | | | | | $0.50 | $3 |
69
+ | `llmgateway/gemini-3.1-flash-lite` | 1.0M | | | | | | $0.25 | $2 |
69
70
  | `llmgateway/gemini-3.1-flash-lite-preview` | 1.0M | | | | | | $0.25 | $2 |
70
71
  | `llmgateway/gemini-3.1-pro-preview` | 1.0M | | | | | | $2 | $12 |
71
72
  | `llmgateway/gemini-pro-latest` | 1.0M | | | | | | $2 | $12 |
@@ -132,6 +133,7 @@ for await (const chunk of stream) {
132
133
  | `llmgateway/grok-4-1-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
133
134
  | `llmgateway/grok-4-20-beta-0309-non-reasoning` | 2.0M | | | | | | $2 | $6 |
134
135
  | `llmgateway/grok-4-20-beta-0309-reasoning` | 2.0M | | | | | | $2 | $6 |
136
+ | `llmgateway/grok-4-3` | 1.0M | | | | | | $1 | $3 |
135
137
  | `llmgateway/grok-4-fast` | 2.0M | | | | | | $0.20 | $0.50 |
136
138
  | `llmgateway/grok-4-fast-non-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
137
139
  | `llmgateway/grok-4-fast-reasoning` | 2.0M | | | | | | $0.20 | $0.50 |
@@ -153,7 +155,11 @@ for await (const chunk of stream) {
153
155
  | `llmgateway/llama-4-maverick-17b-instruct` | 8K | | | | | | $0.24 | $0.97 |
154
156
  | `llmgateway/llama-4-scout` | 33K | | | | | | $0.18 | $0.59 |
155
157
  | `llmgateway/llama-4-scout-17b-instruct` | 8K | | | | | | $0.17 | $0.66 |
156
- | `llmgateway/mimo-v2-flash` | 256K | | | | | | $0.10 | $0.30 |
158
+ | `llmgateway/mimo-v2-flash` | 262K | | | | | | $0.10 | $0.30 |
159
+ | `llmgateway/mimo-v2-omni` | 262K | | | | | | $0.40 | $2 |
160
+ | `llmgateway/mimo-v2-pro` | 1.0M | | | | | | $1 | $3 |
161
+ | `llmgateway/mimo-v2.5` | 1.0M | | | | | | $0.40 | $2 |
162
+ | `llmgateway/mimo-v2.5-pro` | 1.0M | | | | | | $1 | $3 |
157
163
  | `llmgateway/minimax-m2` | 197K | | | | | | $0.30 | $1 |
158
164
  | `llmgateway/minimax-m2.1` | 205K | | | | | | $0.30 | $1 |
159
165
  | `llmgateway/minimax-m2.1-lightning` | 197K | | | | | | $0.12 | $0.48 |
@@ -1,6 +1,6 @@
1
1
  # ![Nebius Token Factory logo](https://models.dev/logos/nebius.svg)Nebius Token Factory
2
2
 
3
- Access 49 Nebius Token Factory models through Mastra's model router. Authentication is handled automatically using the `NEBIUS_API_KEY` environment variable.
3
+ Access 31 Nebius Token Factory models through Mastra's model router. Authentication is handled automatically using the `NEBIUS_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [Nebius Token Factory documentation](https://docs.tokenfactory.nebius.com/).
6
6
 
@@ -15,7 +15,7 @@ const agent = new Agent({
15
15
  id: "my-agent",
16
16
  name: "My Agent",
17
17
  instructions: "You are a helpful assistant",
18
- model: "nebius/BAAI/bge-en-icl"
18
+ model: "nebius/MiniMaxAI/MiniMax-M2.5"
19
19
  });
20
20
 
21
21
  // Generate a response
@@ -32,57 +32,39 @@ for await (const chunk of stream) {
32
32
 
33
33
  ## Models
34
34
 
35
- | Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
36
- | --------------------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
- | `nebius/BAAI/bge-en-icl` | 33K | | | | | | $0.01 | |
38
- | `nebius/BAAI/bge-multilingual-gemma2` | 8K | | | | | | $0.01 | |
39
- | `nebius/black-forest-labs/flux-dev` | 77 | | | | | | | |
40
- | `nebius/black-forest-labs/flux-schnell` | 77 | | | | | | | |
41
- | `nebius/deepseek-ai/DeepSeek-R1-0528` | 128K | | | | | | $0.80 | $2 |
42
- | `nebius/deepseek-ai/DeepSeek-R1-0528-fast` | 131K | | | | | | $2 | $6 |
43
- | `nebius/deepseek-ai/DeepSeek-V3-0324` | 128K | | | | | | $0.50 | $2 |
44
- | `nebius/deepseek-ai/DeepSeek-V3-0324-fast` | 128K | | | | | | $0.75 | $2 |
45
- | `nebius/deepseek-ai/DeepSeek-V3.2` | 163K | | | | | | $0.30 | $0.45 |
46
- | `nebius/google/gemma-2-2b-it` | 8K | | | | | | $0.02 | $0.06 |
47
- | `nebius/google/gemma-2-9b-it-fast` | 8K | | | | | | $0.03 | $0.09 |
48
- | `nebius/google/gemma-3-27b-it` | 110K | | | | | | $0.10 | $0.30 |
49
- | `nebius/google/gemma-3-27b-it-fast` | 110K | | | | | | $0.20 | $0.60 |
50
- | `nebius/intfloat/e5-mistral-7b-instruct` | 33K | | | | | | $0.01 | |
51
- | `nebius/meta-llama/Llama-3.3-70B-Instruct` | 128K | | | | | | $0.13 | $0.40 |
52
- | `nebius/meta-llama/Llama-3.3-70B-Instruct-fast` | 128K | | | | | | $0.25 | $0.75 |
53
- | `nebius/meta-llama/Llama-Guard-3-8B` | 8K | | | | | | $0.02 | $0.06 |
54
- | `nebius/meta-llama/Meta-Llama-3.1-8B-Instruct` | 128K | | | | | | $0.02 | $0.06 |
55
- | `nebius/meta-llama/Meta-Llama-3.1-8B-Instruct-fast` | 128K | | | | | | $0.03 | $0.09 |
56
- | `nebius/MiniMaxAI/MiniMax-M2.1` | 128K | | | | | | $0.30 | $1 |
57
- | `nebius/moonshotai/Kimi-K2-Instruct` | 200K | | | | | | $0.50 | $2 |
58
- | `nebius/moonshotai/Kimi-K2-Thinking` | 128K | | | | | | $0.60 | $3 |
59
- | `nebius/moonshotai/Kimi-K2.5` | 256K | | | | | | $0.50 | $3 |
60
- | `nebius/moonshotai/Kimi-K2.5-fast` | 256K | | | | | | $0.50 | $3 |
61
- | `nebius/NousResearch/Hermes-4-405B` | 128K | | | | | | $1 | $3 |
62
- | `nebius/NousResearch/Hermes-4-70B` | 128K | | | | | | $0.13 | $0.40 |
63
- | `nebius/nvidia/Llama-3_1-Nemotron-Ultra-253B-v1` | 128K | | | | | | $0.60 | $2 |
64
- | `nebius/nvidia/nemotron-3-super-120b-a12b` | 256K | | | | | | $0.30 | $0.90 |
65
- | `nebius/nvidia/Nemotron-Nano-V2-12b` | 32K | | | | | | $0.07 | $0.20 |
66
- | `nebius/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B` | 32K | | | | | | $0.06 | $0.24 |
67
- | `nebius/openai/gpt-oss-120b` | 128K | | | | | | $0.15 | $0.60 |
68
- | `nebius/openai/gpt-oss-20b` | 128K | | | | | | $0.05 | $0.20 |
69
- | `nebius/PrimeIntellect/INTELLECT-3` | 128K | | | | | | $0.20 | $1 |
70
- | `nebius/Qwen/Qwen2.5-Coder-7B-fast` | 128K | | | | | | $0.03 | $0.09 |
71
- | `nebius/Qwen/Qwen2.5-VL-72B-Instruct` | 128K | | | | | | $0.25 | $0.75 |
72
- | `nebius/Qwen/Qwen3-235B-A22B-Instruct-2507` | 262K | | | | | | $0.20 | $0.60 |
73
- | `nebius/Qwen/Qwen3-235B-A22B-Thinking-2507` | 262K | | | | | | $0.20 | $0.80 |
74
- | `nebius/Qwen/Qwen3-30B-A3B-Instruct-2507` | 128K | | | | | | $0.10 | $0.30 |
75
- | `nebius/Qwen/Qwen3-30B-A3B-Thinking-2507` | 128K | | | | | | $0.10 | $0.30 |
76
- | `nebius/Qwen/Qwen3-32B` | 128K | | | | | | $0.10 | $0.30 |
77
- | `nebius/Qwen/Qwen3-32B-fast` | 128K | | | | | | $0.20 | $0.60 |
78
- | `nebius/Qwen/Qwen3-Coder-30B-A3B-Instruct` | 128K | | | | | | $0.10 | $0.30 |
79
- | `nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct` | 262K | | | | | | $0.40 | $2 |
80
- | `nebius/Qwen/Qwen3-Embedding-8B` | 33K | | | | | | $0.01 | — |
81
- | `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking` | 128K | | | | | | $0.15 | $1 |
82
- | `nebius/zai-org/GLM-4.5` | 128K | | | | | | $0.60 | $2 |
83
- | `nebius/zai-org/GLM-4.5-Air` | 128K | | | | | | $0.20 | $1 |
84
- | `nebius/zai-org/GLM-4.7-FP8` | 128K | | | | | | $0.40 | $2 |
85
- | `nebius/zai-org/GLM-5` | 200K | | | | | | $1 | $3 |
35
+ | Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
36
+ | ------------------------------------------------ | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
+ | `nebius/deepseek-ai/DeepSeek-V3.2` | 163K | | | | | | $0.30 | $0.45 |
38
+ | `nebius/deepseek-ai/DeepSeek-V3.2-fast` | 8K | | | | | | $0.40 | $2 |
39
+ | `nebius/deepseek-ai/DeepSeek-V4-Pro` | 1.0M | | | | | | $2 | $4 |
40
+ | `nebius/google/gemma-2-2b-it` | 8K | | | | | | $0.02 | $0.06 |
41
+ | `nebius/google/gemma-3-27b-it` | 110K | | | | | | $0.10 | $0.30 |
42
+ | `nebius/meta-llama/Llama-3.3-70B-Instruct` | 128K | | | | | | $0.13 | $0.40 |
43
+ | `nebius/meta-llama/Meta-Llama-3.1-8B-Instruct` | 128K | | | | | | $0.02 | $0.06 |
44
+ | `nebius/MiniMaxAI/MiniMax-M2.5` | 197K | | | | | | $0.30 | $1 |
45
+ | `nebius/MiniMaxAI/MiniMax-M2.5-fast` | 8K | | | | | | $0.30 | $1 |
46
+ | `nebius/moonshotai/Kimi-K2.5` | 256K | | | | | | $0.50 | $3 |
47
+ | `nebius/moonshotai/Kimi-K2.5-fast` | 256K | | | | | | $0.50 | $3 |
48
+ | `nebius/NousResearch/Hermes-4-405B` | 128K | | | | | | $1 | $3 |
49
+ | `nebius/NousResearch/Hermes-4-70B` | 128K | | | | | | $0.13 | $0.40 |
50
+ | `nebius/nvidia/Llama-3_1-Nemotron-Ultra-253B-v1` | 128K | | | | | | $0.60 | $2 |
51
+ | `nebius/nvidia/Nemotron-3-Nano-Omni` | 66K | | | | | | $0.06 | $0.24 |
52
+ | `nebius/nvidia/nemotron-3-super-120b-a12b` | 256K | | | | | | $0.30 | $0.90 |
53
+ | `nebius/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B` | 32K | | | | | | $0.06 | $0.24 |
54
+ | `nebius/openai/gpt-oss-120b` | 128K | | | | | | $0.15 | $0.60 |
55
+ | `nebius/openai/gpt-oss-120b-fast` | 8K | | | | | | $0.10 | $0.50 |
56
+ | `nebius/PrimeIntellect/INTELLECT-3` | 128K | | | | | | $0.20 | $1 |
57
+ | `nebius/Qwen/Qwen2.5-VL-72B-Instruct` | 128K | | | | | | $0.25 | $0.75 |
58
+ | `nebius/Qwen/Qwen3-235B-A22B-Instruct-2507` | 262K | | | | | | $0.20 | $0.60 |
59
+ | `nebius/Qwen/Qwen3-235B-A22B-Thinking-2507-fast` | 8K | | | | | | $0.50 | $2 |
60
+ | `nebius/Qwen/Qwen3-30B-A3B-Instruct-2507` | 128K | | | | | | $0.10 | $0.30 |
61
+ | `nebius/Qwen/Qwen3-32B` | 128K | | | | | | $0.10 | $0.30 |
62
+ | `nebius/Qwen/Qwen3-Embedding-8B` | 33K | | | | | | $0.01 | |
63
+ | `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking` | 128K | | | | | | $0.15 | $1 |
64
+ | `nebius/Qwen/Qwen3-Next-80B-A3B-Thinking-fast` | 8K | | | | | | $0.15 | $1 |
65
+ | `nebius/Qwen/Qwen3.5-397B-A17B` | 262K | | | | | | $0.60 | $4 |
66
+ | `nebius/Qwen/Qwen3.5-397B-A17B-fast` | 8K | | | | | | $0.60 | $4 |
67
+ | `nebius/zai-org/GLM-5` | 200K | | | | | | $1 | $3 |
86
68
 
87
69
  ## Advanced configuration
88
70
 
@@ -94,7 +76,7 @@ const agent = new Agent({
94
76
  name: "custom-agent",
95
77
  model: {
96
78
  url: "https://api.tokenfactory.nebius.com/v1",
97
- id: "nebius/BAAI/bge-en-icl",
79
+ id: "nebius/MiniMaxAI/MiniMax-M2.5",
98
80
  apiKey: process.env.NEBIUS_API_KEY,
99
81
  headers: {
100
82
  "X-Custom-Header": "value"
@@ -113,7 +95,7 @@ const agent = new Agent({
113
95
  const useAdvanced = requestContext.task === "complex";
114
96
  return useAdvanced
115
97
  ? "nebius/zai-org/GLM-5"
116
- : "nebius/BAAI/bge-en-icl";
98
+ : "nebius/MiniMaxAI/MiniMax-M2.5";
117
99
  }
118
100
  });
119
101
  ```
@@ -176,6 +176,8 @@ const response = await agent.generate("Hello!", {
176
176
 
177
177
  **forceReasoning** (`boolean | undefined`)
178
178
 
179
+ **allowedTools** (`{ toolNames: string[]; mode?: "auto" | "required" | undefined; } | undefined`)
180
+
179
181
  ## Direct provider installation
180
182
 
181
183
  This provider can also be installed directly as a standalone package, which can be used instead of the Mastra model router string. View the [package documentation](https://www.npmjs.com/package/@ai-sdk/openai) for more details.
@@ -1,6 +1,6 @@
1
1
  # ![OpenCode Go logo](https://models.dev/logos/opencode-go.svg)OpenCode Go
2
2
 
3
- Access 14 OpenCode Go models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
3
+ Access 12 OpenCode Go models through Mastra's model router. Authentication is handled automatically using the `OPENCODE_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [OpenCode Go documentation](https://opencode.ai/docs/zen).
6
6
 
@@ -39,9 +39,7 @@ for await (const chunk of stream) {
39
39
  | `opencode-go/glm-5` | 203K | | | | | | $1 | $3 |
40
40
  | `opencode-go/glm-5.1` | 203K | | | | | | $1 | $4 |
41
41
  | `opencode-go/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
42
- | `opencode-go/kimi-k2.6` | 262K | | | | | | $0.32 | $1 |
43
- | `opencode-go/mimo-v2-omni` | 262K | | | | | | $0.40 | $2 |
44
- | `opencode-go/mimo-v2-pro` | 1.0M | | | | | | $1 | $3 |
42
+ | `opencode-go/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
45
43
  | `opencode-go/mimo-v2.5` | 1.0M | | | | | | $0.40 | $2 |
46
44
  | `opencode-go/mimo-v2.5-pro` | 1.0M | | | | | | $1 | $3 |
47
45
  | `opencode-go/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
@@ -49,7 +49,7 @@ for await (const chunk of stream) {
49
49
  | `opencode/glm-5.1` | 205K | | | | | | $1 | $4 |
50
50
  | `opencode/gpt-5` | 400K | | | | | | $1 | $9 |
51
51
  | `opencode/gpt-5-codex` | 400K | | | | | | $1 | $9 |
52
- | `opencode/gpt-5-nano` | 400K | | | | | | | |
52
+ | `opencode/gpt-5-nano` | 400K | | | | | | $0.05 | $0.40 |
53
53
  | `opencode/gpt-5.1` | 400K | | | | | | $1 | $9 |
54
54
  | `opencode/gpt-5.1-codex` | 400K | | | | | | $1 | $9 |
55
55
  | `opencode/gpt-5.1-codex-max` | 400K | | | | | | $1 | $10 |
@@ -64,7 +64,6 @@ for await (const chunk of stream) {
64
64
  | `opencode/gpt-5.4-pro` | 1.1M | | | | | | $30 | $180 |
65
65
  | `opencode/gpt-5.5` | 1.1M | | | | | | $5 | $30 |
66
66
  | `opencode/gpt-5.5-pro` | 1.1M | | | | | | $30 | $180 |
67
- | `opencode/hy3-preview-free` | 256K | | | | | | — | — |
68
67
  | `opencode/kimi-k2.5` | 262K | | | | | | $0.60 | $3 |
69
68
  | `opencode/kimi-k2.6` | 262K | | | | | | $0.95 | $4 |
70
69
  | `opencode/minimax-m2.5` | 205K | | | | | | $0.30 | $1 |
@@ -73,6 +72,7 @@ for await (const chunk of stream) {
73
72
  | `opencode/nemotron-3-super-free` | 205K | | | | | | — | — |
74
73
  | `opencode/qwen3.5-plus` | 262K | | | | | | $0.20 | $1 |
75
74
  | `opencode/qwen3.6-plus` | 262K | | | | | | $0.50 | $3 |
75
+ | `opencode/ring-2.6-1t-free` | 262K | | | | | | — | — |
76
76
 
77
77
  ## Advanced configuration
78
78
 
@@ -102,7 +102,7 @@ const agent = new Agent({
102
102
  model: ({ requestContext }) => {
103
103
  const useAdvanced = requestContext.task === "complex";
104
104
  return useAdvanced
105
- ? "opencode/qwen3.6-plus"
105
+ ? "opencode/ring-2.6-1t-free"
106
106
  : "opencode/big-pickle";
107
107
  }
108
108
  });
@@ -1,6 +1,6 @@
1
1
  # ![Poe logo](https://models.dev/logos/poe.svg)Poe
2
2
 
3
- Access 121 Poe models through Mastra's model router. Authentication is handled automatically using the `POE_API_KEY` environment variable.
3
+ Access 124 Poe models through Mastra's model router. Authentication is handled automatically using the `POE_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [Poe documentation](https://creator.poe.com/docs/external-applications/openai-compatible-api).
6
6
 
@@ -51,6 +51,8 @@ for await (const chunk of stream) {
51
51
  | `poe/elevenlabs/elevenlabs-music` | 2K | | | | | | — | — |
52
52
  | `poe/elevenlabs/elevenlabs-v2.5-turbo` | 128K | | | | | | — | — |
53
53
  | `poe/elevenlabs/elevenlabs-v3` | 128K | | | | | | — | — |
54
+ | `poe/empiriolabs/deepseek-v4-flash-el` | 1.0M | | | | | | $0.14 | $0.28 |
55
+ | `poe/empiriolabs/deepseek-v4-pro-el` | 1.0M | | | | | | $2 | $3 |
54
56
  | `poe/fireworks-ai/kimi-k2.5-fw` | 262K | | | | | | — | — |
55
57
  | `poe/google/gemini-2.0-flash` | 990K | | | | | | $0.10 | $0.42 |
56
58
  | `poe/google/gemini-2.0-flash-lite` | 990K | | | | | | $0.05 | $0.21 |
@@ -87,6 +89,7 @@ for await (const chunk of stream) {
87
89
  | `poe/novita/glm-5` | 205K | | | | | | $1 | $3 |
88
90
  | `poe/novita/kimi-k2-thinking` | 256K | | | | | | — | — |
89
91
  | `poe/novita/kimi-k2.5` | 128K | | | | | | $0.60 | $3 |
92
+ | `poe/novita/kimi-k2.6` | 262K | | | | | | $0.96 | $4 |
90
93
  | `poe/novita/minimax-m2.1` | 205K | | | | | | — | — |
91
94
  | `poe/openai/dall-e-3` | 800 | | | | | | — | — |
92
95
  | `poe/openai/gpt-3.5-turbo` | 16K | | | | | | $0.45 | $1 |
@@ -81,7 +81,7 @@ for await (const chunk of stream) {
81
81
  | `qiniu-ai/kling-v2-6` | 100.0M | | | | | | — | — |
82
82
  | `qiniu-ai/meituan/longcat-flash-chat` | 131K | | | | | | — | — |
83
83
  | `qiniu-ai/meituan/longcat-flash-lite` | 256K | | | | | | — | — |
84
- | `qiniu-ai/mimo-v2-flash` | 256K | | | | | | | |
84
+ | `qiniu-ai/mimo-v2-flash` | 256K | | | | | | $0.10 | $0.30 |
85
85
  | `qiniu-ai/MiniMax-M1` | 1.0M | | | | | | — | — |
86
86
  | `qiniu-ai/minimax/minimax-m2` | 200K | | | | | | — | — |
87
87
  | `qiniu-ai/minimax/minimax-m2.1` | 205K | | | | | | — | — |
@@ -120,7 +120,7 @@ for await (const chunk of stream) {
120
120
  | `qiniu-ai/x-ai/grok-4.1-fast-non-reasoning` | 2.0M | | | | | | — | — |
121
121
  | `qiniu-ai/x-ai/grok-4.1-fast-reasoning` | 20.0M | | | | | | — | — |
122
122
  | `qiniu-ai/x-ai/grok-code-fast-1` | 256K | | | | | | — | — |
123
- | `qiniu-ai/xiaomi/mimo-v2-flash` | 256K | | | | | | | |
123
+ | `qiniu-ai/xiaomi/mimo-v2-flash` | 256K | | | | | | $0.10 | $0.30 |
124
124
  | `qiniu-ai/z-ai/autoglm-phone-9b` | 13K | | | | | | — | — |
125
125
  | `qiniu-ai/z-ai/glm-4.6` | 200K | | | | | | — | — |
126
126
  | `qiniu-ai/z-ai/glm-4.7` | 200K | | | | | | — | — |
@@ -1,6 +1,6 @@
1
1
  # ![Wafer logo](https://models.dev/logos/wafer.ai.svg)Wafer
2
2
 
3
- Access 3 Wafer models through Mastra's model router. Authentication is handled automatically using the `WAFER_API_KEY` environment variable.
3
+ Access 4 Wafer models through Mastra's model router. Authentication is handled automatically using the `WAFER_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [Wafer documentation](https://docs.wafer.ai/wafer-pass).
6
6
 
@@ -36,6 +36,7 @@ for await (const chunk of stream) {
36
36
  | ---------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
37
  | `wafer.ai/DeepSeek-V4-Pro` | 1.0M | | | | | | — | — |
38
38
  | `wafer.ai/GLM-5.1` | 203K | | | | | | — | — |
39
+ | `wafer.ai/MiniMax-M2.7` | 205K | | | | | | — | — |
39
40
  | `wafer.ai/Qwen3.5-397B-A17B` | 262K | | | | | | — | — |
40
41
 
41
42
  ## Advanced configuration
@@ -1,6 +1,6 @@
1
1
  # ![Xiaomi Token Plan (Europe) logo](https://models.dev/logos/xiaomi-token-plan-ams.svg)Xiaomi Token Plan (Europe)
2
2
 
3
- Access 5 Xiaomi Token Plan (Europe) models through Mastra's model router. Authentication is handled automatically using the `XIAOMI_API_KEY` environment variable.
3
+ Access 6 Xiaomi Token Plan (Europe) models through Mastra's model router. Authentication is handled automatically using the `XIAOMI_API_KEY` environment variable.
4
4
 
5
5
  Learn more in the [Xiaomi Token Plan (Europe) documentation](https://platform.xiaomimimo.com/#/docs).
6
6
 
@@ -15,7 +15,7 @@ const agent = new Agent({
15
15
  id: "my-agent",
16
16
  name: "My Agent",
17
17
  instructions: "You are a helpful assistant",
18
- model: "xiaomi-token-plan-ams/mimo-v2-omni"
18
+ model: "xiaomi-token-plan-ams/mimo-v2-flash"
19
19
  });
20
20
 
21
21
  // Generate a response
@@ -34,7 +34,8 @@ for await (const chunk of stream) {
34
34
 
35
35
  | Model | Context | Tools | Reasoning | Image | Audio | Video | Input $/1M | Output $/1M |
36
36
  | ------------------------------------- | ------- | ----- | --------- | ----- | ----- | ----- | ---------- | ----------- |
37
- | `xiaomi-token-plan-ams/mimo-v2-omni` | 256K | | | | | | — | — |
37
+ | `xiaomi-token-plan-ams/mimo-v2-flash` | 262K | | | | | | — | — |
38
+ | `xiaomi-token-plan-ams/mimo-v2-omni` | 262K | | | | | | — | — |
38
39
  | `xiaomi-token-plan-ams/mimo-v2-pro` | 1.0M | | | | | | — | — |
39
40
  | `xiaomi-token-plan-ams/mimo-v2-tts` | 8K | | | | | | — | — |
40
41
  | `xiaomi-token-plan-ams/mimo-v2.5` | 1.0M | | | | | | — | — |
@@ -50,7 +51,7 @@ const agent = new Agent({
50
51
  name: "custom-agent",
51
52
  model: {
52
53
  url: "https://token-plan-ams.xiaomimimo.com/v1",
53
- id: "xiaomi-token-plan-ams/mimo-v2-omni",
54
+ id: "xiaomi-token-plan-ams/mimo-v2-flash",
54
55
  apiKey: process.env.XIAOMI_API_KEY,
55
56
  headers: {
56
57
  "X-Custom-Header": "value"
@@ -69,7 +70,7 @@ const agent = new Agent({
69
70
  const useAdvanced = requestContext.task === "complex";
70
71
  return useAdvanced
71
72
  ? "xiaomi-token-plan-ams/mimo-v2.5-pro"
72
- : "xiaomi-token-plan-ams/mimo-v2-omni";
73
+ : "xiaomi-token-plan-ams/mimo-v2-flash";
73
74
  }
74
75
  });
75
76
  ```