@mastra/mcp-docs-server 1.1.4 → 1.1.5-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (547)
  1. package/CHANGELOG.md +7 -0
  2. package/package.json +3 -3
  3. package/.docs/docs/agents/adding-voice.md +0 -353
  4. package/.docs/docs/agents/agent-approval.md +0 -377
  5. package/.docs/docs/agents/agent-memory.md +0 -212
  6. package/.docs/docs/agents/guardrails.md +0 -382
  7. package/.docs/docs/agents/network-approval.md +0 -275
  8. package/.docs/docs/agents/networks.md +0 -290
  9. package/.docs/docs/agents/overview.md +0 -309
  10. package/.docs/docs/agents/processors.md +0 -632
  11. package/.docs/docs/agents/structured-output.md +0 -271
  12. package/.docs/docs/agents/using-tools.md +0 -214
  13. package/.docs/docs/build-with-ai/mcp-docs-server.md +0 -241
  14. package/.docs/docs/build-with-ai/skills.md +0 -35
  15. package/.docs/docs/community/contributing-templates.md +0 -3
  16. package/.docs/docs/community/discord.md +0 -9
  17. package/.docs/docs/community/licensing.md +0 -66
  18. package/.docs/docs/deployment/cloud-providers.md +0 -15
  19. package/.docs/docs/deployment/mastra-server.md +0 -122
  20. package/.docs/docs/deployment/monorepo.md +0 -142
  21. package/.docs/docs/deployment/overview.md +0 -62
  22. package/.docs/docs/deployment/studio.md +0 -234
  23. package/.docs/docs/deployment/web-framework.md +0 -52
  24. package/.docs/docs/deployment/workflow-runners.md +0 -9
  25. package/.docs/docs/evals/built-in-scorers.md +0 -47
  26. package/.docs/docs/evals/custom-scorers.md +0 -519
  27. package/.docs/docs/evals/overview.md +0 -146
  28. package/.docs/docs/evals/running-in-ci.md +0 -106
  29. package/.docs/docs/getting-started/build-with-ai.md +0 -68
  30. package/.docs/docs/getting-started/manual-install.md +0 -226
  31. package/.docs/docs/getting-started/project-structure.md +0 -60
  32. package/.docs/docs/getting-started/start.md +0 -28
  33. package/.docs/docs/getting-started/studio.md +0 -101
  34. package/.docs/docs/index.md +0 -43
  35. package/.docs/docs/mastra-cloud/deployment.md +0 -77
  36. package/.docs/docs/mastra-cloud/observability.md +0 -38
  37. package/.docs/docs/mastra-cloud/overview.md +0 -23
  38. package/.docs/docs/mastra-cloud/setup.md +0 -42
  39. package/.docs/docs/mastra-cloud/studio.md +0 -24
  40. package/.docs/docs/mcp/overview.md +0 -370
  41. package/.docs/docs/mcp/publishing-mcp-server.md +0 -95
  42. package/.docs/docs/memory/memory-processors.md +0 -316
  43. package/.docs/docs/memory/message-history.md +0 -260
  44. package/.docs/docs/memory/observational-memory.md +0 -246
  45. package/.docs/docs/memory/overview.md +0 -45
  46. package/.docs/docs/memory/semantic-recall.md +0 -272
  47. package/.docs/docs/memory/storage.md +0 -261
  48. package/.docs/docs/memory/working-memory.md +0 -400
  49. package/.docs/docs/observability/datasets/overview.md +0 -188
  50. package/.docs/docs/observability/datasets/running-experiments.md +0 -266
  51. package/.docs/docs/observability/logging.md +0 -99
  52. package/.docs/docs/observability/overview.md +0 -70
  53. package/.docs/docs/observability/tracing/bridges/otel.md +0 -209
  54. package/.docs/docs/observability/tracing/exporters/arize.md +0 -274
  55. package/.docs/docs/observability/tracing/exporters/braintrust.md +0 -111
  56. package/.docs/docs/observability/tracing/exporters/cloud.md +0 -129
  57. package/.docs/docs/observability/tracing/exporters/datadog.md +0 -187
  58. package/.docs/docs/observability/tracing/exporters/default.md +0 -211
  59. package/.docs/docs/observability/tracing/exporters/laminar.md +0 -100
  60. package/.docs/docs/observability/tracing/exporters/langfuse.md +0 -217
  61. package/.docs/docs/observability/tracing/exporters/langsmith.md +0 -202
  62. package/.docs/docs/observability/tracing/exporters/otel.md +0 -479
  63. package/.docs/docs/observability/tracing/exporters/posthog.md +0 -148
  64. package/.docs/docs/observability/tracing/exporters/sentry.md +0 -208
  65. package/.docs/docs/observability/tracing/overview.md +0 -1114
  66. package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +0 -303
  67. package/.docs/docs/rag/chunking-and-embedding.md +0 -183
  68. package/.docs/docs/rag/graph-rag.md +0 -215
  69. package/.docs/docs/rag/overview.md +0 -72
  70. package/.docs/docs/rag/retrieval.md +0 -521
  71. package/.docs/docs/rag/vector-databases.md +0 -648
  72. package/.docs/docs/server/auth/auth0.md +0 -222
  73. package/.docs/docs/server/auth/better-auth.md +0 -203
  74. package/.docs/docs/server/auth/clerk.md +0 -132
  75. package/.docs/docs/server/auth/composite-auth.md +0 -234
  76. package/.docs/docs/server/auth/custom-auth-provider.md +0 -513
  77. package/.docs/docs/server/auth/firebase.md +0 -272
  78. package/.docs/docs/server/auth/jwt.md +0 -110
  79. package/.docs/docs/server/auth/simple-auth.md +0 -178
  80. package/.docs/docs/server/auth/supabase.md +0 -117
  81. package/.docs/docs/server/auth/workos.md +0 -190
  82. package/.docs/docs/server/auth.md +0 -38
  83. package/.docs/docs/server/custom-adapters.md +0 -374
  84. package/.docs/docs/server/custom-api-routes.md +0 -267
  85. package/.docs/docs/server/mastra-client.md +0 -243
  86. package/.docs/docs/server/mastra-server.md +0 -71
  87. package/.docs/docs/server/middleware.md +0 -228
  88. package/.docs/docs/server/request-context.md +0 -478
  89. package/.docs/docs/server/server-adapters.md +0 -547
  90. package/.docs/docs/streaming/events.md +0 -247
  91. package/.docs/docs/streaming/overview.md +0 -181
  92. package/.docs/docs/streaming/tool-streaming.md +0 -178
  93. package/.docs/docs/streaming/workflow-streaming.md +0 -109
  94. package/.docs/docs/voice/overview.md +0 -979
  95. package/.docs/docs/voice/speech-to-speech.md +0 -103
  96. package/.docs/docs/voice/speech-to-text.md +0 -80
  97. package/.docs/docs/voice/text-to-speech.md +0 -84
  98. package/.docs/docs/workflows/agents-and-tools.md +0 -170
  99. package/.docs/docs/workflows/control-flow.md +0 -823
  100. package/.docs/docs/workflows/error-handling.md +0 -360
  101. package/.docs/docs/workflows/human-in-the-loop.md +0 -213
  102. package/.docs/docs/workflows/overview.md +0 -372
  103. package/.docs/docs/workflows/snapshots.md +0 -238
  104. package/.docs/docs/workflows/suspend-and-resume.md +0 -205
  105. package/.docs/docs/workflows/time-travel.md +0 -309
  106. package/.docs/docs/workflows/workflow-state.md +0 -181
  107. package/.docs/docs/workspace/filesystem.md +0 -162
  108. package/.docs/docs/workspace/overview.md +0 -239
  109. package/.docs/docs/workspace/sandbox.md +0 -63
  110. package/.docs/docs/workspace/search.md +0 -219
  111. package/.docs/docs/workspace/skills.md +0 -126
  112. package/.docs/guides/agent-frameworks/ai-sdk.md +0 -140
  113. package/.docs/guides/build-your-ui/ai-sdk-ui.md +0 -1463
  114. package/.docs/guides/build-your-ui/assistant-ui.md +0 -156
  115. package/.docs/guides/build-your-ui/copilotkit.md +0 -292
  116. package/.docs/guides/deployment/amazon-ec2.md +0 -130
  117. package/.docs/guides/deployment/aws-lambda.md +0 -248
  118. package/.docs/guides/deployment/azure-app-services.md +0 -114
  119. package/.docs/guides/deployment/cloudflare.md +0 -99
  120. package/.docs/guides/deployment/digital-ocean.md +0 -168
  121. package/.docs/guides/deployment/inngest.md +0 -685
  122. package/.docs/guides/deployment/netlify.md +0 -77
  123. package/.docs/guides/deployment/vercel.md +0 -101
  124. package/.docs/guides/getting-started/astro.md +0 -408
  125. package/.docs/guides/getting-started/electron.md +0 -504
  126. package/.docs/guides/getting-started/express.md +0 -251
  127. package/.docs/guides/getting-started/hono.md +0 -191
  128. package/.docs/guides/getting-started/next-js.md +0 -355
  129. package/.docs/guides/getting-started/nuxt.md +0 -476
  130. package/.docs/guides/getting-started/quickstart.md +0 -67
  131. package/.docs/guides/getting-started/sveltekit.md +0 -300
  132. package/.docs/guides/getting-started/vite-react.md +0 -439
  133. package/.docs/guides/guide/ai-recruiter.md +0 -227
  134. package/.docs/guides/guide/chef-michel.md +0 -215
  135. package/.docs/guides/guide/code-review-bot.md +0 -221
  136. package/.docs/guides/guide/dev-assistant.md +0 -304
  137. package/.docs/guides/guide/docs-manager.md +0 -238
  138. package/.docs/guides/guide/github-actions-pr-description.md +0 -236
  139. package/.docs/guides/guide/notes-mcp-server.md +0 -425
  140. package/.docs/guides/guide/research-assistant.md +0 -349
  141. package/.docs/guides/guide/stock-agent.md +0 -134
  142. package/.docs/guides/guide/web-search.md +0 -326
  143. package/.docs/guides/guide/whatsapp-chat-bot.md +0 -416
  144. package/.docs/guides/index.md +0 -3
  145. package/.docs/guides/migrations/agentnetwork.md +0 -101
  146. package/.docs/guides/migrations/ai-sdk-v4-to-v5.md +0 -112
  147. package/.docs/guides/migrations/upgrade-to-v1/agent.md +0 -404
  148. package/.docs/guides/migrations/upgrade-to-v1/cli.md +0 -57
  149. package/.docs/guides/migrations/upgrade-to-v1/client.md +0 -337
  150. package/.docs/guides/migrations/upgrade-to-v1/deployment.md +0 -37
  151. package/.docs/guides/migrations/upgrade-to-v1/evals.md +0 -239
  152. package/.docs/guides/migrations/upgrade-to-v1/mastra.md +0 -143
  153. package/.docs/guides/migrations/upgrade-to-v1/mcp.md +0 -97
  154. package/.docs/guides/migrations/upgrade-to-v1/memory.md +0 -285
  155. package/.docs/guides/migrations/upgrade-to-v1/overview.md +0 -119
  156. package/.docs/guides/migrations/upgrade-to-v1/processors.md +0 -68
  157. package/.docs/guides/migrations/upgrade-to-v1/rag.md +0 -42
  158. package/.docs/guides/migrations/upgrade-to-v1/storage.md +0 -553
  159. package/.docs/guides/migrations/upgrade-to-v1/tools.md +0 -180
  160. package/.docs/guides/migrations/upgrade-to-v1/tracing.md +0 -417
  161. package/.docs/guides/migrations/upgrade-to-v1/vectors.md +0 -87
  162. package/.docs/guides/migrations/upgrade-to-v1/voice.md +0 -30
  163. package/.docs/guides/migrations/upgrade-to-v1/workflows.md +0 -341
  164. package/.docs/guides/migrations/vnext-to-standard-apis.md +0 -364
  165. package/.docs/models/embeddings.md +0 -161
  166. package/.docs/models/gateways/azure-openai.md +0 -128
  167. package/.docs/models/gateways/custom-gateways.md +0 -545
  168. package/.docs/models/gateways/netlify.md +0 -88
  169. package/.docs/models/gateways/openrouter.md +0 -219
  170. package/.docs/models/gateways/vercel.md +0 -225
  171. package/.docs/models/gateways.md +0 -14
  172. package/.docs/models/index.md +0 -286
  173. package/.docs/models/providers/302ai.md +0 -134
  174. package/.docs/models/providers/abacus.md +0 -125
  175. package/.docs/models/providers/agentrouter.md +0 -90
  176. package/.docs/models/providers/aihubmix.md +0 -107
  177. package/.docs/models/providers/alibaba-cn.md +0 -135
  178. package/.docs/models/providers/alibaba.md +0 -111
  179. package/.docs/models/providers/amazon-bedrock.md +0 -33
  180. package/.docs/models/providers/anthropic.md +0 -153
  181. package/.docs/models/providers/azure.md +0 -33
  182. package/.docs/models/providers/bailing.md +0 -72
  183. package/.docs/models/providers/baseten.md +0 -77
  184. package/.docs/models/providers/berget.md +0 -78
  185. package/.docs/models/providers/cerebras.md +0 -101
  186. package/.docs/models/providers/chutes.md +0 -136
  187. package/.docs/models/providers/cloudflare-ai-gateway.md +0 -33
  188. package/.docs/models/providers/cloudflare-workers-ai.md +0 -109
  189. package/.docs/models/providers/cohere.md +0 -33
  190. package/.docs/models/providers/cortecs.md +0 -91
  191. package/.docs/models/providers/deepinfra.md +0 -112
  192. package/.docs/models/providers/deepseek.md +0 -88
  193. package/.docs/models/providers/fastrouter.md +0 -84
  194. package/.docs/models/providers/fireworks-ai.md +0 -89
  195. package/.docs/models/providers/firmware.md +0 -85
  196. package/.docs/models/providers/friendli.md +0 -78
  197. package/.docs/models/providers/github-models.md +0 -125
  198. package/.docs/models/providers/google-vertex.md +0 -33
  199. package/.docs/models/providers/google.md +0 -159
  200. package/.docs/models/providers/groq.md +0 -107
  201. package/.docs/models/providers/helicone.md +0 -161
  202. package/.docs/models/providers/huggingface.md +0 -90
  203. package/.docs/models/providers/iflowcn.md +0 -84
  204. package/.docs/models/providers/inception.md +0 -72
  205. package/.docs/models/providers/inference.md +0 -79
  206. package/.docs/models/providers/io-intelligence.md +0 -87
  207. package/.docs/models/providers/io-net.md +0 -87
  208. package/.docs/models/providers/jiekou.md +0 -131
  209. package/.docs/models/providers/kilo.md +0 -333
  210. package/.docs/models/providers/kimi-for-coding.md +0 -100
  211. package/.docs/models/providers/kuae-cloud-coding-plan.md +0 -71
  212. package/.docs/models/providers/llama.md +0 -77
  213. package/.docs/models/providers/lmstudio.md +0 -73
  214. package/.docs/models/providers/lucidquery.md +0 -72
  215. package/.docs/models/providers/minimax-cn-coding-plan.md +0 -102
  216. package/.docs/models/providers/minimax-cn.md +0 -102
  217. package/.docs/models/providers/minimax-coding-plan.md +0 -102
  218. package/.docs/models/providers/minimax.md +0 -104
  219. package/.docs/models/providers/mistral.md +0 -124
  220. package/.docs/models/providers/moark.md +0 -72
  221. package/.docs/models/providers/modelscope.md +0 -77
  222. package/.docs/models/providers/moonshotai-cn.md +0 -76
  223. package/.docs/models/providers/moonshotai.md +0 -76
  224. package/.docs/models/providers/morph.md +0 -73
  225. package/.docs/models/providers/nano-gpt.md +0 -103
  226. package/.docs/models/providers/nebius.md +0 -116
  227. package/.docs/models/providers/nova.md +0 -72
  228. package/.docs/models/providers/novita-ai.md +0 -154
  229. package/.docs/models/providers/nvidia.md +0 -141
  230. package/.docs/models/providers/ollama-cloud.md +0 -103
  231. package/.docs/models/providers/ollama.md +0 -33
  232. package/.docs/models/providers/openai.md +0 -193
  233. package/.docs/models/providers/opencode.md +0 -100
  234. package/.docs/models/providers/ovhcloud.md +0 -83
  235. package/.docs/models/providers/perplexity.md +0 -100
  236. package/.docs/models/providers/poe.md +0 -183
  237. package/.docs/models/providers/privatemode-ai.md +0 -75
  238. package/.docs/models/providers/requesty.md +0 -90
  239. package/.docs/models/providers/scaleway.md +0 -84
  240. package/.docs/models/providers/siliconflow-cn.md +0 -138
  241. package/.docs/models/providers/siliconflow.md +0 -140
  242. package/.docs/models/providers/stackit.md +0 -78
  243. package/.docs/models/providers/stepfun.md +0 -73
  244. package/.docs/models/providers/submodel.md +0 -79
  245. package/.docs/models/providers/synthetic.md +0 -96
  246. package/.docs/models/providers/togetherai.md +0 -115
  247. package/.docs/models/providers/upstage.md +0 -73
  248. package/.docs/models/providers/venice.md +0 -95
  249. package/.docs/models/providers/vivgrid.md +0 -106
  250. package/.docs/models/providers/vultr.md +0 -75
  251. package/.docs/models/providers/wandb.md +0 -80
  252. package/.docs/models/providers/xai.md +0 -141
  253. package/.docs/models/providers/xiaomi.md +0 -71
  254. package/.docs/models/providers/zai-coding-plan.md +0 -80
  255. package/.docs/models/providers/zai.md +0 -79
  256. package/.docs/models/providers/zenmux.md +0 -161
  257. package/.docs/models/providers/zhipuai-coding-plan.md +0 -79
  258. package/.docs/models/providers/zhipuai.md +0 -79
  259. package/.docs/models/providers.md +0 -81
  260. package/.docs/reference/agents/agent.md +0 -142
  261. package/.docs/reference/agents/generate.md +0 -174
  262. package/.docs/reference/agents/generateLegacy.md +0 -176
  263. package/.docs/reference/agents/getDefaultGenerateOptions.md +0 -36
  264. package/.docs/reference/agents/getDefaultOptions.md +0 -34
  265. package/.docs/reference/agents/getDefaultStreamOptions.md +0 -36
  266. package/.docs/reference/agents/getDescription.md +0 -21
  267. package/.docs/reference/agents/getInstructions.md +0 -34
  268. package/.docs/reference/agents/getLLM.md +0 -37
  269. package/.docs/reference/agents/getMemory.md +0 -34
  270. package/.docs/reference/agents/getModel.md +0 -34
  271. package/.docs/reference/agents/getTools.md +0 -29
  272. package/.docs/reference/agents/getVoice.md +0 -34
  273. package/.docs/reference/agents/listAgents.md +0 -35
  274. package/.docs/reference/agents/listScorers.md +0 -34
  275. package/.docs/reference/agents/listTools.md +0 -34
  276. package/.docs/reference/agents/listWorkflows.md +0 -34
  277. package/.docs/reference/agents/network.md +0 -134
  278. package/.docs/reference/ai-sdk/chat-route.md +0 -82
  279. package/.docs/reference/ai-sdk/handle-chat-stream.md +0 -53
  280. package/.docs/reference/ai-sdk/handle-network-stream.md +0 -37
  281. package/.docs/reference/ai-sdk/handle-workflow-stream.md +0 -55
  282. package/.docs/reference/ai-sdk/network-route.md +0 -74
  283. package/.docs/reference/ai-sdk/to-ai-sdk-stream.md +0 -232
  284. package/.docs/reference/ai-sdk/to-ai-sdk-v4-messages.md +0 -79
  285. package/.docs/reference/ai-sdk/to-ai-sdk-v5-messages.md +0 -73
  286. package/.docs/reference/ai-sdk/with-mastra.md +0 -59
  287. package/.docs/reference/ai-sdk/workflow-route.md +0 -79
  288. package/.docs/reference/auth/auth0.md +0 -73
  289. package/.docs/reference/auth/better-auth.md +0 -71
  290. package/.docs/reference/auth/clerk.md +0 -36
  291. package/.docs/reference/auth/firebase.md +0 -80
  292. package/.docs/reference/auth/jwt.md +0 -26
  293. package/.docs/reference/auth/supabase.md +0 -33
  294. package/.docs/reference/auth/workos.md +0 -84
  295. package/.docs/reference/cli/create-mastra.md +0 -137
  296. package/.docs/reference/cli/mastra.md +0 -336
  297. package/.docs/reference/client-js/agents.md +0 -438
  298. package/.docs/reference/client-js/error-handling.md +0 -16
  299. package/.docs/reference/client-js/logs.md +0 -24
  300. package/.docs/reference/client-js/mastra-client.md +0 -63
  301. package/.docs/reference/client-js/memory.md +0 -225
  302. package/.docs/reference/client-js/observability.md +0 -72
  303. package/.docs/reference/client-js/telemetry.md +0 -20
  304. package/.docs/reference/client-js/tools.md +0 -44
  305. package/.docs/reference/client-js/vectors.md +0 -79
  306. package/.docs/reference/client-js/workflows.md +0 -199
  307. package/.docs/reference/configuration.md +0 -749
  308. package/.docs/reference/core/addGateway.md +0 -42
  309. package/.docs/reference/core/getAgent.md +0 -21
  310. package/.docs/reference/core/getAgentById.md +0 -21
  311. package/.docs/reference/core/getDeployer.md +0 -22
  312. package/.docs/reference/core/getGateway.md +0 -38
  313. package/.docs/reference/core/getGatewayById.md +0 -41
  314. package/.docs/reference/core/getLogger.md +0 -22
  315. package/.docs/reference/core/getMCPServer.md +0 -45
  316. package/.docs/reference/core/getMCPServerById.md +0 -53
  317. package/.docs/reference/core/getMemory.md +0 -50
  318. package/.docs/reference/core/getScorer.md +0 -54
  319. package/.docs/reference/core/getScorerById.md +0 -54
  320. package/.docs/reference/core/getServer.md +0 -22
  321. package/.docs/reference/core/getStorage.md +0 -22
  322. package/.docs/reference/core/getStoredAgentById.md +0 -89
  323. package/.docs/reference/core/getTelemetry.md +0 -22
  324. package/.docs/reference/core/getVector.md +0 -22
  325. package/.docs/reference/core/getWorkflow.md +0 -40
  326. package/.docs/reference/core/listAgents.md +0 -21
  327. package/.docs/reference/core/listGateways.md +0 -40
  328. package/.docs/reference/core/listLogs.md +0 -38
  329. package/.docs/reference/core/listLogsByRunId.md +0 -36
  330. package/.docs/reference/core/listMCPServers.md +0 -51
  331. package/.docs/reference/core/listMemory.md +0 -56
  332. package/.docs/reference/core/listScorers.md +0 -29
  333. package/.docs/reference/core/listStoredAgents.md +0 -93
  334. package/.docs/reference/core/listVectors.md +0 -22
  335. package/.docs/reference/core/listWorkflows.md +0 -21
  336. package/.docs/reference/core/mastra-class.md +0 -66
  337. package/.docs/reference/core/mastra-model-gateway.md +0 -153
  338. package/.docs/reference/core/setLogger.md +0 -26
  339. package/.docs/reference/core/setStorage.md +0 -27
  340. package/.docs/reference/datasets/addItem.md +0 -35
  341. package/.docs/reference/datasets/addItems.md +0 -33
  342. package/.docs/reference/datasets/compareExperiments.md +0 -48
  343. package/.docs/reference/datasets/create.md +0 -49
  344. package/.docs/reference/datasets/dataset.md +0 -78
  345. package/.docs/reference/datasets/datasets-manager.md +0 -84
  346. package/.docs/reference/datasets/delete.md +0 -23
  347. package/.docs/reference/datasets/deleteExperiment.md +0 -25
  348. package/.docs/reference/datasets/deleteItem.md +0 -25
  349. package/.docs/reference/datasets/deleteItems.md +0 -27
  350. package/.docs/reference/datasets/get.md +0 -29
  351. package/.docs/reference/datasets/getDetails.md +0 -45
  352. package/.docs/reference/datasets/getExperiment.md +0 -28
  353. package/.docs/reference/datasets/getItem.md +0 -31
  354. package/.docs/reference/datasets/getItemHistory.md +0 -29
  355. package/.docs/reference/datasets/list.md +0 -29
  356. package/.docs/reference/datasets/listExperimentResults.md +0 -37
  357. package/.docs/reference/datasets/listExperiments.md +0 -31
  358. package/.docs/reference/datasets/listItems.md +0 -44
  359. package/.docs/reference/datasets/listVersions.md +0 -31
  360. package/.docs/reference/datasets/startExperiment.md +0 -60
  361. package/.docs/reference/datasets/startExperimentAsync.md +0 -41
  362. package/.docs/reference/datasets/update.md +0 -46
  363. package/.docs/reference/datasets/updateItem.md +0 -36
  364. package/.docs/reference/deployer/cloudflare.md +0 -79
  365. package/.docs/reference/deployer/netlify.md +0 -82
  366. package/.docs/reference/deployer/vercel.md +0 -91
  367. package/.docs/reference/deployer.md +0 -100
  368. package/.docs/reference/evals/answer-relevancy.md +0 -105
  369. package/.docs/reference/evals/answer-similarity.md +0 -99
  370. package/.docs/reference/evals/bias.md +0 -120
  371. package/.docs/reference/evals/completeness.md +0 -137
  372. package/.docs/reference/evals/content-similarity.md +0 -101
  373. package/.docs/reference/evals/context-precision.md +0 -196
  374. package/.docs/reference/evals/context-relevance.md +0 -536
  375. package/.docs/reference/evals/create-scorer.md +0 -270
  376. package/.docs/reference/evals/faithfulness.md +0 -114
  377. package/.docs/reference/evals/hallucination.md +0 -220
  378. package/.docs/reference/evals/keyword-coverage.md +0 -128
  379. package/.docs/reference/evals/mastra-scorer.md +0 -123
  380. package/.docs/reference/evals/noise-sensitivity.md +0 -685
  381. package/.docs/reference/evals/prompt-alignment.md +0 -619
  382. package/.docs/reference/evals/run-evals.md +0 -138
  383. package/.docs/reference/evals/scorer-utils.md +0 -330
  384. package/.docs/reference/evals/textual-difference.md +0 -113
  385. package/.docs/reference/evals/tone-consistency.md +0 -119
  386. package/.docs/reference/evals/tool-call-accuracy.md +0 -533
  387. package/.docs/reference/evals/toxicity.md +0 -123
  388. package/.docs/reference/harness/harness-class.md +0 -645
  389. package/.docs/reference/index.md +0 -276
  390. package/.docs/reference/logging/pino-logger.md +0 -117
  391. package/.docs/reference/memory/clone-utilities.md +0 -199
  392. package/.docs/reference/memory/cloneThread.md +0 -130
  393. package/.docs/reference/memory/createThread.md +0 -68
  394. package/.docs/reference/memory/deleteMessages.md +0 -40
  395. package/.docs/reference/memory/getThreadById.md +0 -24
  396. package/.docs/reference/memory/listThreads.md +0 -145
  397. package/.docs/reference/memory/memory-class.md +0 -147
  398. package/.docs/reference/memory/observational-memory.md +0 -565
  399. package/.docs/reference/memory/recall.md +0 -91
  400. package/.docs/reference/observability/tracing/bridges/otel.md +0 -131
  401. package/.docs/reference/observability/tracing/configuration.md +0 -178
  402. package/.docs/reference/observability/tracing/exporters/arize.md +0 -141
  403. package/.docs/reference/observability/tracing/exporters/braintrust.md +0 -93
  404. package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +0 -163
  405. package/.docs/reference/observability/tracing/exporters/console-exporter.md +0 -138
  406. package/.docs/reference/observability/tracing/exporters/datadog.md +0 -116
  407. package/.docs/reference/observability/tracing/exporters/default-exporter.md +0 -174
  408. package/.docs/reference/observability/tracing/exporters/laminar.md +0 -78
  409. package/.docs/reference/observability/tracing/exporters/langfuse.md +0 -134
  410. package/.docs/reference/observability/tracing/exporters/langsmith.md +0 -110
  411. package/.docs/reference/observability/tracing/exporters/otel.md +0 -199
  412. package/.docs/reference/observability/tracing/exporters/posthog.md +0 -92
  413. package/.docs/reference/observability/tracing/exporters/sentry.md +0 -184
  414. package/.docs/reference/observability/tracing/instances.md +0 -109
  415. package/.docs/reference/observability/tracing/interfaces.md +0 -749
  416. package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +0 -144
  417. package/.docs/reference/observability/tracing/spans.md +0 -224
  418. package/.docs/reference/processors/batch-parts-processor.md +0 -61
  419. package/.docs/reference/processors/language-detector.md +0 -81
  420. package/.docs/reference/processors/message-history-processor.md +0 -85
  421. package/.docs/reference/processors/moderation-processor.md +0 -104
  422. package/.docs/reference/processors/pii-detector.md +0 -107
  423. package/.docs/reference/processors/processor-interface.md +0 -525
  424. package/.docs/reference/processors/prompt-injection-detector.md +0 -71
  425. package/.docs/reference/processors/semantic-recall-processor.md +0 -123
  426. package/.docs/reference/processors/system-prompt-scrubber.md +0 -80
  427. package/.docs/reference/processors/token-limiter-processor.md +0 -113
  428. package/.docs/reference/processors/tool-call-filter.md +0 -85
  429. package/.docs/reference/processors/tool-search-processor.md +0 -113
  430. package/.docs/reference/processors/unicode-normalizer.md +0 -62
  431. package/.docs/reference/processors/working-memory-processor.md +0 -154
  432. package/.docs/reference/rag/chunk.md +0 -221
  433. package/.docs/reference/rag/database-config.md +0 -264
  434. package/.docs/reference/rag/document.md +0 -114
  435. package/.docs/reference/rag/embeddings.md +0 -92
  436. package/.docs/reference/rag/extract-params.md +0 -168
  437. package/.docs/reference/rag/graph-rag.md +0 -111
  438. package/.docs/reference/rag/metadata-filters.md +0 -216
  439. package/.docs/reference/rag/rerank.md +0 -80
  440. package/.docs/reference/rag/rerankWithScorer.md +0 -80
  441. package/.docs/reference/server/create-route.md +0 -260
  442. package/.docs/reference/server/express-adapter.md +0 -176
  443. package/.docs/reference/server/fastify-adapter.md +0 -90
  444. package/.docs/reference/server/hono-adapter.md +0 -162
  445. package/.docs/reference/server/koa-adapter.md +0 -127
  446. package/.docs/reference/server/mastra-server.md +0 -298
  447. package/.docs/reference/server/register-api-route.md +0 -249
  448. package/.docs/reference/server/routes.md +0 -306
  449. package/.docs/reference/storage/cloudflare-d1.md +0 -218
  450. package/.docs/reference/storage/cloudflare.md +0 -88
  451. package/.docs/reference/storage/composite.md +0 -235
  452. package/.docs/reference/storage/convex.md +0 -161
  453. package/.docs/reference/storage/dynamodb.md +0 -282
  454. package/.docs/reference/storage/lance.md +0 -131
  455. package/.docs/reference/storage/libsql.md +0 -135
  456. package/.docs/reference/storage/mongodb.md +0 -262
  457. package/.docs/reference/storage/mssql.md +0 -155
  458. package/.docs/reference/storage/overview.md +0 -121
  459. package/.docs/reference/storage/postgresql.md +0 -529
  460. package/.docs/reference/storage/upstash.md +0 -160
  461. package/.docs/reference/streaming/ChunkType.md +0 -292
  462. package/.docs/reference/streaming/agents/MastraModelOutput.md +0 -182
  463. package/.docs/reference/streaming/agents/stream.md +0 -212
  464. package/.docs/reference/streaming/agents/streamLegacy.md +0 -142
  465. package/.docs/reference/streaming/workflows/observeStream.md +0 -42
  466. package/.docs/reference/streaming/workflows/resumeStream.md +0 -61
  467. package/.docs/reference/streaming/workflows/stream.md +0 -88
  468. package/.docs/reference/streaming/workflows/timeTravelStream.md +0 -142
  469. package/.docs/reference/templates/overview.md +0 -194
  470. package/.docs/reference/tools/create-tool.md +0 -237
  471. package/.docs/reference/tools/document-chunker-tool.md +0 -89
  472. package/.docs/reference/tools/graph-rag-tool.md +0 -185
  473. package/.docs/reference/tools/mcp-client.md +0 -962
  474. package/.docs/reference/tools/mcp-server.md +0 -1275
  475. package/.docs/reference/tools/vector-query-tool.md +0 -459
  476. package/.docs/reference/vectors/astra.md +0 -121
  477. package/.docs/reference/vectors/chroma.md +0 -267
  478. package/.docs/reference/vectors/convex.md +0 -303
  479. package/.docs/reference/vectors/couchbase.md +0 -226
  480. package/.docs/reference/vectors/duckdb.md +0 -318
  481. package/.docs/reference/vectors/elasticsearch.md +0 -189
  482. package/.docs/reference/vectors/lance.md +0 -220
  483. package/.docs/reference/vectors/libsql.md +0 -305
  484. package/.docs/reference/vectors/mongodb.md +0 -295
  485. package/.docs/reference/vectors/opensearch.md +0 -99
  486. package/.docs/reference/vectors/pg.md +0 -408
  487. package/.docs/reference/vectors/pinecone.md +0 -168
  488. package/.docs/reference/vectors/qdrant.md +0 -222
  489. package/.docs/reference/vectors/s3vectors.md +0 -277
  490. package/.docs/reference/vectors/turbopuffer.md +0 -157
  491. package/.docs/reference/vectors/upstash.md +0 -294
  492. package/.docs/reference/vectors/vectorize.md +0 -147
  493. package/.docs/reference/voice/azure.md +0 -148
  494. package/.docs/reference/voice/cloudflare.md +0 -83
  495. package/.docs/reference/voice/composite-voice.md +0 -121
  496. package/.docs/reference/voice/deepgram.md +0 -79
  497. package/.docs/reference/voice/elevenlabs.md +0 -98
  498. package/.docs/reference/voice/google-gemini-live.md +0 -378
  499. package/.docs/reference/voice/google.md +0 -228
  500. package/.docs/reference/voice/mastra-voice.md +0 -313
  501. package/.docs/reference/voice/murf.md +0 -122
  502. package/.docs/reference/voice/openai-realtime.md +0 -203
  503. package/.docs/reference/voice/openai.md +0 -88
  504. package/.docs/reference/voice/playai.md +0 -80
  505. package/.docs/reference/voice/sarvam.md +0 -126
  506. package/.docs/reference/voice/speechify.md +0 -75
  507. package/.docs/reference/voice/voice.addInstructions.md +0 -56
  508. package/.docs/reference/voice/voice.addTools.md +0 -67
  509. package/.docs/reference/voice/voice.answer.md +0 -54
  510. package/.docs/reference/voice/voice.close.md +0 -51
  511. package/.docs/reference/voice/voice.connect.md +0 -94
  512. package/.docs/reference/voice/voice.events.md +0 -37
  513. package/.docs/reference/voice/voice.getSpeakers.md +0 -129
  514. package/.docs/reference/voice/voice.listen.md +0 -164
  515. package/.docs/reference/voice/voice.off.md +0 -54
  516. package/.docs/reference/voice/voice.on.md +0 -111
  517. package/.docs/reference/voice/voice.send.md +0 -65
  518. package/.docs/reference/voice/voice.speak.md +0 -157
  519. package/.docs/reference/voice/voice.updateConfig.md +0 -60
  520. package/.docs/reference/workflows/run-methods/cancel.md +0 -86
  521. package/.docs/reference/workflows/run-methods/restart.md +0 -33
  522. package/.docs/reference/workflows/run-methods/resume.md +0 -59
  523. package/.docs/reference/workflows/run-methods/start.md +0 -58
  524. package/.docs/reference/workflows/run-methods/startAsync.md +0 -67
  525. package/.docs/reference/workflows/run-methods/timeTravel.md +0 -142
  526. package/.docs/reference/workflows/run.md +0 -59
  527. package/.docs/reference/workflows/step.md +0 -119
  528. package/.docs/reference/workflows/workflow-methods/branch.md +0 -25
  529. package/.docs/reference/workflows/workflow-methods/commit.md +0 -17
  530. package/.docs/reference/workflows/workflow-methods/create-run.md +0 -63
  531. package/.docs/reference/workflows/workflow-methods/dountil.md +0 -25
  532. package/.docs/reference/workflows/workflow-methods/dowhile.md +0 -25
  533. package/.docs/reference/workflows/workflow-methods/foreach.md +0 -118
  534. package/.docs/reference/workflows/workflow-methods/map.md +0 -93
  535. package/.docs/reference/workflows/workflow-methods/parallel.md +0 -21
  536. package/.docs/reference/workflows/workflow-methods/sleep.md +0 -35
  537. package/.docs/reference/workflows/workflow-methods/sleepUntil.md +0 -35
  538. package/.docs/reference/workflows/workflow-methods/then.md +0 -21
  539. package/.docs/reference/workflows/workflow.md +0 -157
  540. package/.docs/reference/workspace/e2b-sandbox.md +0 -288
  541. package/.docs/reference/workspace/filesystem.md +0 -202
  542. package/.docs/reference/workspace/gcs-filesystem.md +0 -170
  543. package/.docs/reference/workspace/local-filesystem.md +0 -327
  544. package/.docs/reference/workspace/local-sandbox.md +0 -285
  545. package/.docs/reference/workspace/s3-filesystem.md +0 -169
  546. package/.docs/reference/workspace/sandbox.md +0 -81
  547. package/.docs/reference/workspace/workspace-class.md +0 -226
@@ -1,138 +0,0 @@
1
- # runEvals
2
-
3
- The `runEvals` function enables batch evaluation of agents and workflows by running multiple test cases against scorers concurrently. This is essential for systematic testing, performance analysis, and validation of AI systems.
4
-
5
- ## Usage Example
6
-
7
- ```typescript
8
- import { runEvals } from "@mastra/core/evals";
9
- import { myAgent } from "./agents/my-agent";
10
- import { myScorer1, myScorer2 } from "./scorers";
11
-
12
- const result = await runEvals({
13
- target: myAgent,
14
- data: [
15
- { input: "What is machine learning?" },
16
- { input: "Explain neural networks" },
17
- { input: "How does AI work?" },
18
- ],
19
- scorers: [myScorer1, myScorer2],
20
- concurrency: 2,
21
- onItemComplete: ({ item, targetResult, scorerResults }) => {
22
- console.log(`Completed: ${item.input}`);
23
- console.log(`Scores:`, scorerResults);
24
- },
25
- });
26
-
27
- console.log(`Average scores:`, result.scores);
28
- console.log(`Processed ${result.summary.totalItems} items`);
29
- ```
30
-
31
- ## Parameters
32
-
33
- **target:** (`Agent | Workflow`): The agent or workflow to evaluate.
34
-
35
- **data:** (`RunEvalsDataItem[]`): Array of test cases with input data and optional ground truth.
36
-
37
- **scorers:** (`MastraScorer[] | WorkflowScorerConfig`): Array of scorers for agents, or configuration object for workflows specifying scorers for the workflow and individual steps.
38
-
39
- **concurrency?:** (`number`): Number of test cases to run concurrently. (Default: `1`)
40
-
41
- **onItemComplete?:** (`function`): Callback function called after each test case completes. Receives item, target result, and scorer results.
42
-
43
- ## Data Item Structure
44
-
45
- **input:** (`string | string[] | CoreMessage[] | any`): Input data for the target. For agents: messages or strings. For workflows: workflow input data.
46
-
47
- **groundTruth?:** (`any`): Expected or reference output for comparison during scoring.
48
-
49
- **requestContext?:** (`RequestContext`): Request context to pass to the target during execution.
50
-
51
- **tracingContext?:** (`TracingContext`): Tracing context for observability and debugging.
52
-
53
- ## Workflow Scorer Configuration
54
-
55
- For workflows, you can specify scorers at different levels using `WorkflowScorerConfig`:
56
-
57
- **workflow?:** (`MastraScorer[]`): Array of scorers to evaluate the entire workflow output.
58
-
59
- **steps?:** (`Record<string, MastraScorer[]>`): Object mapping step IDs to arrays of scorers for evaluating individual step outputs.
60
-
61
- ## Returns
62
-
63
- **scores:** (`Record<string, any>`): Average scores across all test cases, organized by scorer name.
64
-
65
- **summary:** (`object`): Summary information about the experiment execution.
66
-
67
- **summary.totalItems:** (`number`): Total number of test cases processed.
68
-
69
- ## Examples
70
-
71
- ### Agent Evaluation
72
-
73
- ```typescript
74
- import { createScorer, runEvals } from "@mastra/core/evals";
75
-
76
- const myScorer = createScorer({
77
- id: "my-scorer",
78
- description: "Check if Agent's response contains ground truth",
79
- type: "agent",
80
- }).generateScore(({ run }) => {
81
- const response = run.output[0]?.content || "";
82
- const expectedResponse = run.groundTruth;
83
- return response.includes(expectedResponse) ? 1 : 0;
84
- });
85
-
86
- const result = await runEvals({
87
- target: chatAgent,
88
- data: [
89
- {
90
- input: "What is AI?",
91
- groundTruth:
92
- "AI is a field of computer science that creates intelligent machines.",
93
- },
94
- {
95
- input: "How does machine learning work?",
96
- groundTruth:
97
- "Machine learning uses algorithms to learn patterns from data.",
98
- },
99
- ],
100
- scorers: [myScorer],
101
- concurrency: 3,
102
- });
103
- ```
104
-
105
- ### Workflow Evaluation
106
-
107
- ```typescript
108
- const workflowResult = await runEvals({
109
- target: myWorkflow,
110
- data: [
111
- { input: { query: "Process this data", priority: "high" } },
112
- { input: { query: "Another task", priority: "low" } },
113
- ],
114
- scorers: {
115
- workflow: [outputQualityScorer],
116
- steps: {
117
- "validation-step": [validationScorer],
118
- "processing-step": [processingScorer],
119
- },
120
- },
121
- onItemComplete: ({ item, targetResult, scorerResults }) => {
122
- console.log(`Workflow completed for: ${item.input.query}`);
123
- if (scorerResults.workflow) {
124
- console.log("Workflow scores:", scorerResults.workflow);
125
- }
126
- if (scorerResults.steps) {
127
- console.log("Step scores:", scorerResults.steps);
128
- }
129
- },
130
- });
131
- ```
132
-
133
- ## Related
134
-
135
- - [createScorer()](https://mastra.ai/reference/evals/create-scorer) - Create custom scorers for experiments
136
- - [MastraScorer](https://mastra.ai/reference/evals/mastra-scorer) - Learn about scorer structure and methods
137
- - [Custom Scorers](https://mastra.ai/docs/evals/custom-scorers) - Guide to building evaluation logic
138
- - [Scorers Overview](https://mastra.ai/docs/evals/overview) - Understanding scorer concepts
@@ -1,330 +0,0 @@
1
- # Scorer Utils
2
-
3
- Mastra provides utility functions to help extract and process data from scorer run inputs and outputs. These utilities are particularly useful in the `preprocess` step of custom scorers.
4
-
5
- ## Import
6
-
7
- ```typescript
8
- import {
9
- getAssistantMessageFromRunOutput,
10
- getReasoningFromRunOutput,
11
- getUserMessageFromRunInput,
12
- getSystemMessagesFromRunInput,
13
- getCombinedSystemPrompt,
14
- extractToolCalls,
15
- extractInputMessages,
16
- extractAgentResponseMessages,
17
- } from "@mastra/evals/scorers/utils";
18
- ```
19
-
20
- ## Message Extraction
21
-
22
- ### getAssistantMessageFromRunOutput
23
-
24
- Extracts the text content from the first assistant message in the run output.
25
-
26
- ```typescript
27
- const scorer = createScorer({
28
- id: "my-scorer",
29
- description: "My scorer",
30
- type: "agent",
31
- })
32
- .preprocess(({ run }) => {
33
- const response = getAssistantMessageFromRunOutput(run.output);
34
- return { response };
35
- })
36
- .generateScore(({ results }) => {
37
- return results.preprocessStepResult?.response ? 1 : 0;
38
- });
39
- ```
40
-
41
- **output?:** (`ScorerRunOutputForAgent`): The scorer run output (array of MastraDBMessage)
42
-
43
- **Returns:** `string | undefined` - The assistant message text, or undefined if no assistant message is found.
44
-
45
- ### getUserMessageFromRunInput
46
-
47
- Extracts the text content from the first user message in the run input.
48
-
49
- ```typescript
50
- .preprocess(({ run }) => {
51
- const userMessage = getUserMessageFromRunInput(run.input);
52
- return { userMessage };
53
- })
54
- ```
55
-
56
- **input?:** (`ScorerRunInputForAgent`): The scorer run input containing input messages
57
-
58
- **Returns:** `string | undefined` - The user message text, or undefined if no user message is found.
59
-
60
- ### extractInputMessages
61
-
62
- Extracts text content from all input messages as an array.
63
-
64
- ```typescript
65
- .preprocess(({ run }) => {
66
- const allUserMessages = extractInputMessages(run.input);
67
- return { conversationHistory: allUserMessages.join("\n") };
68
- })
69
- ```
70
-
71
- **Returns:** `string[]` - Array of text strings from each input message.
72
-
73
- ### extractAgentResponseMessages
74
-
75
- Extracts text content from all assistant response messages as an array.
76
-
77
- ```typescript
78
- .preprocess(({ run }) => {
79
- const allResponses = extractAgentResponseMessages(run.output);
80
- return { allResponses };
81
- })
82
- ```
83
-
84
- **Returns:** `string[]` - Array of text strings from each assistant message.
85
-
86
- ## Reasoning Extraction
87
-
88
- ### getReasoningFromRunOutput
89
-
90
- Extracts reasoning text from the run output. This is particularly useful when evaluating responses from reasoning models like `deepseek-reasoner` that produce chain-of-thought reasoning.
91
-
92
- Reasoning can be stored in two places:
93
-
94
- 1. `content.reasoning` - a string field on the message content
95
- 2. `content.parts` - as parts with `type: 'reasoning'` containing `details`
96
-
97
- ```typescript
98
- import {
99
- getReasoningFromRunOutput,
100
- getAssistantMessageFromRunOutput
101
- } from "@mastra/evals/scorers/utils";
102
-
103
- const reasoningQualityScorer = createScorer({
104
- id: "reasoning-quality",
105
- name: "Reasoning Quality",
106
- description: "Evaluates the quality of model reasoning",
107
- type: "agent",
108
- })
109
- .preprocess(({ run }) => {
110
- const reasoning = getReasoningFromRunOutput(run.output);
111
- const response = getAssistantMessageFromRunOutput(run.output);
112
- return { reasoning, response };
113
- })
114
- .analyze(({ results }) => {
115
- const { reasoning } = results.preprocessStepResult || {};
116
- return {
117
- hasReasoning: !!reasoning,
118
- reasoningLength: reasoning?.length || 0,
119
- hasStepByStep: reasoning?.includes("step") || false,
120
- };
121
- })
122
- .generateScore(({ results }) => {
123
- const { hasReasoning, reasoningLength } = results.analyzeStepResult || {};
124
- if (!hasReasoning) return 0;
125
- // Score based on reasoning length (normalized to 0-1)
126
- return Math.min(reasoningLength / 500, 1);
127
- })
128
- .generateReason(({ results, score }) => {
129
- const { hasReasoning, reasoningLength } = results.analyzeStepResult || {};
130
- if (!hasReasoning) {
131
- return "No reasoning was provided by the model.";
132
- }
133
- return `Model provided ${reasoningLength} characters of reasoning. Score: ${score}`;
134
- });
135
- ```
136
-
137
- **output?:** (`ScorerRunOutputForAgent`): The scorer run output (array of MastraDBMessage)
138
-
139
- **Returns:** `string | undefined` - The reasoning text, or undefined if no reasoning is present.
140
-
141
- ## System Message Extraction
142
-
143
- ### getSystemMessagesFromRunInput
144
-
145
- Extracts all system messages from the run input, including both standard system messages and tagged system messages (specialized prompts like memory instructions).
146
-
147
- ```typescript
148
- .preprocess(({ run }) => {
149
- const systemMessages = getSystemMessagesFromRunInput(run.input);
150
- return {
151
- systemPromptCount: systemMessages.length,
152
- systemPrompts: systemMessages
153
- };
154
- })
155
- ```
156
-
157
- **Returns:** `string[]` - Array of system message strings.
158
-
159
- ### getCombinedSystemPrompt
160
-
161
- Combines all system messages into a single prompt string, joined with double newlines.
162
-
163
- ```typescript
164
- .preprocess(({ run }) => {
165
- const fullSystemPrompt = getCombinedSystemPrompt(run.input);
166
- return { fullSystemPrompt };
167
- })
168
- ```
169
-
170
- **Returns:** `string` - Combined system prompt string.
171
-
172
- ## Tool Call Extraction
173
-
174
- ### extractToolCalls
175
-
176
- Extracts information about all tool calls from the run output, including tool names, call IDs, and their positions in the message array.
177
-
178
- ```typescript
179
- const toolUsageScorer = createScorer({
180
- id: "tool-usage",
181
- description: "Evaluates tool usage patterns",
182
- type: "agent",
183
- })
184
- .preprocess(({ run }) => {
185
- const { tools, toolCallInfos } = extractToolCalls(run.output);
186
- return {
187
- toolsUsed: tools,
188
- toolCount: tools.length,
189
- toolDetails: toolCallInfos,
190
- };
191
- })
192
- .generateScore(({ results }) => {
193
- const { toolCount } = results.preprocessStepResult || {};
194
- // Score based on appropriate tool usage
195
- return toolCount > 0 ? 1 : 0;
196
- });
197
- ```
198
-
199
- **Returns:**
200
-
201
- ```typescript
202
- {
203
- tools: string[]; // Array of tool names
204
- toolCallInfos: ToolCallInfo[]; // Detailed tool call information
205
- }
206
- ```
207
-
208
- Where `ToolCallInfo` is:
209
-
210
- ```typescript
211
- type ToolCallInfo = {
212
- toolName: string; // Name of the tool
213
- toolCallId: string; // Unique call identifier
214
- messageIndex: number; // Index in the output array
215
- invocationIndex: number; // Index within message's tool invocations
216
- };
217
- ```
218
-
219
- ## Test Utilities
220
-
221
- These utilities help create test data for scorer development.
222
-
223
- ### createTestMessage
224
-
225
- Creates a `MastraDBMessage` object for testing purposes.
226
-
227
- ```typescript
228
- import { createTestMessage } from "@mastra/evals/scorers/utils";
229
-
230
- const userMessage = createTestMessage({
231
- content: "What is the weather?",
232
- role: "user",
233
- });
234
-
235
- const assistantMessage = createTestMessage({
236
- content: "The weather is sunny.",
237
- role: "assistant",
238
- toolInvocations: [
239
- {
240
- toolCallId: "call-1",
241
- toolName: "weatherTool",
242
- args: { location: "London" },
243
- result: { temp: 20 },
244
- state: "result",
245
- },
246
- ],
247
- });
248
- ```
249
-
250
- ### createAgentTestRun
251
-
252
- Creates a complete test run object for testing scorers.
253
-
254
- ```typescript
255
- import { createAgentTestRun, createTestMessage } from "@mastra/evals/scorers/utils";
256
-
257
- const testRun = createAgentTestRun({
258
- inputMessages: [
259
- createTestMessage({ content: "Hello", role: "user" }),
260
- ],
261
- output: [
262
- createTestMessage({ content: "Hi there!", role: "assistant" }),
263
- ],
264
- });
265
-
266
- // Run your scorer with the test data
267
- const result = await myScorer.run({
268
- input: testRun.input,
269
- output: testRun.output,
270
- });
271
- ```
272
-
273
- ## Complete Example
274
-
275
- Here's a complete example showing how to use multiple utilities together:
276
-
277
- ```typescript
278
- import { createScorer } from "@mastra/core/evals";
279
- import {
280
- getAssistantMessageFromRunOutput,
281
- getReasoningFromRunOutput,
282
- getUserMessageFromRunInput,
283
- getCombinedSystemPrompt,
284
- extractToolCalls,
285
- } from "@mastra/evals/scorers/utils";
286
-
287
- const comprehensiveScorer = createScorer({
288
- id: "comprehensive-analysis",
289
- name: "Comprehensive Analysis",
290
- description: "Analyzes all aspects of an agent response",
291
- type: "agent",
292
- })
293
- .preprocess(({ run }) => {
294
- // Extract all relevant data
295
- const userMessage = getUserMessageFromRunInput(run.input);
296
- const response = getAssistantMessageFromRunOutput(run.output);
297
- const reasoning = getReasoningFromRunOutput(run.output);
298
- const systemPrompt = getCombinedSystemPrompt(run.input);
299
- const { tools, toolCallInfos } = extractToolCalls(run.output);
300
-
301
- return {
302
- userMessage,
303
- response,
304
- reasoning,
305
- systemPrompt,
306
- toolsUsed: tools,
307
- toolCount: tools.length,
308
- };
309
- })
310
- .generateScore(({ results }) => {
311
- const { response, reasoning, toolCount } = results.preprocessStepResult || {};
312
-
313
- let score = 0;
314
- if (response && response.length > 0) score += 0.4;
315
- if (reasoning) score += 0.3;
316
- if (toolCount > 0) score += 0.3;
317
-
318
- return score;
319
- })
320
- .generateReason(({ results, score }) => {
321
- const { response, reasoning, toolCount } = results.preprocessStepResult || {};
322
-
323
- const parts = [];
324
- if (response) parts.push("provided a response");
325
- if (reasoning) parts.push("included reasoning");
326
- if (toolCount > 0) parts.push(`used ${toolCount} tool(s)`);
327
-
328
- return `Score: ${score}. The agent ${parts.join(", ")}.`;
329
- });
330
- ```
@@ -1,113 +0,0 @@
1
- # Textual Difference Scorer
2
-
3
- The `createTextualDifferenceScorer()` function uses sequence matching to measure the textual differences between two strings. It provides detailed information about changes, including the number of operations needed to transform one text into another.
4
-
5
- ## Parameters
6
-
7
- The `createTextualDifferenceScorer()` function does not take any options.
8
-
9
- This function returns an instance of the MastraScorer class. See the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer) for details on the `.run()` method and its input/output.
10
-
11
- ## .run() Returns
12
-
13
- **runId:** (`string`): The id of the run (optional).
14
-
15
- **analyzeStepResult:** (`object`): Object with difference metrics: { confidence: number, ratio: number, changes: number, lengthDiff: number }
16
-
17
- **score:** (`number`): Similarity ratio (0-1) where 1 indicates identical texts.
18
-
19
- `.run()` returns a result in the following shape:
20
-
21
- ```typescript
22
- {
23
- runId: string,
24
- analyzeStepResult: {
25
- confidence: number,
26
- ratio: number,
27
- changes: number,
28
- lengthDiff: number
29
- },
30
- score: number
31
- }
32
- ```
33
-
34
- ## Scoring Details
35
-
36
- The scorer calculates several measures:
37
-
38
- - **Similarity Ratio**: Based on sequence matching between texts (0-1)
39
- - **Changes**: Count of non-matching operations needed
40
- - **Length Difference**: Normalized difference in text lengths
41
- - **Confidence**: Inversely proportional to length difference
42
-
43
- ### Scoring Process
44
-
45
- 1. Analyzes textual differences:
46
-
47
- - Performs sequence matching between input and output
48
- - Counts the number of change operations required
49
- - Measures length differences
50
-
51
- 2. Calculates metrics:
52
-
53
- - Computes similarity ratio
54
- - Determines confidence score
55
- - Combines into weighted score
56
-
57
- Final score: `(similarity_ratio * confidence) * scale`
58
-
59
- ### Score interpretation
60
-
61
- A textual difference score between 0 and 1:
62
-
63
- - **1.0**: Identical texts – no differences detected.
64
- - **0.7–0.9**: Minor differences – few changes needed.
65
- - **0.4–0.6**: Moderate differences – noticeable changes required.
66
- - **0.1–0.3**: Major differences – extensive changes needed.
67
- - **0.0**: Completely different texts.
68
-
69
- ## Example
70
-
71
- Measure textual differences between expected and actual agent outputs:
72
-
73
- ```typescript
74
- import { runEvals } from "@mastra/core/evals";
75
- import { createTextualDifferenceScorer } from "@mastra/evals/scorers/prebuilt";
76
- import { myAgent } from "./agent";
77
-
78
- const scorer = createTextualDifferenceScorer();
79
-
80
- const result = await runEvals({
81
- data: [
82
- {
83
- input: "Summarize the concept of recursion",
84
- groundTruth:
85
- "Recursion is when a function calls itself to solve a problem by breaking it into smaller subproblems.",
86
- },
87
- {
88
- input: "What is the capital of France?",
89
- groundTruth: "The capital of France is Paris.",
90
- },
91
- ],
92
- scorers: [scorer],
93
- target: myAgent,
94
- onItemComplete: ({ scorerResults }) => {
95
- console.log({
96
- score: scorerResults[scorer.id].score,
97
- groundTruth: scorerResults[scorer.id].groundTruth,
98
- });
99
- },
100
- });
101
-
102
- console.log(result.scores);
103
- ```
104
-
105
- For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
106
-
107
- To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
108
-
109
- ## Related
110
-
111
- - [Content Similarity Scorer](https://mastra.ai/reference/evals/content-similarity)
112
- - [Completeness Scorer](https://mastra.ai/reference/evals/completeness)
113
- - [Keyword Coverage Scorer](https://mastra.ai/reference/evals/keyword-coverage)
@@ -1,119 +0,0 @@
1
- # Tone Consistency Scorer
2
-
3
- The `createToneScorer()` function evaluates the text's emotional tone and sentiment consistency. It can operate in two modes: comparing tone between input/output pairs or analyzing tone stability within a single text.
4
-
5
- ## Parameters
6
-
7
- The `createToneScorer()` function does not take any options.
8
-
9
- This function returns an instance of the MastraScorer class. See the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer) for details on the `.run()` method and its input/output.
10
-
11
- ## .run() Returns
12
-
13
- **runId:** (`string`): The id of the run (optional).
14
-
15
- **analyzeStepResult:** (`object`): Object with tone metrics: { responseSentiment: number, referenceSentiment: number, difference: number } (for comparison mode) OR { avgSentiment: number, sentimentVariance: number } (for stability mode)
16
-
17
- **score:** (`number`): Tone consistency/stability score (0-1).
18
-
19
- `.run()` returns a result in the following shape:
20
-
21
- ```typescript
22
- {
23
- runId: string,
24
- analyzeStepResult: {
25
- responseSentiment?: number,
26
- referenceSentiment?: number,
27
- difference?: number,
28
- avgSentiment?: number,
29
- sentimentVariance?: number,
30
- },
31
- score: number
32
- }
33
- ```
34
-
35
- ## Scoring Details
36
-
37
- The scorer evaluates sentiment consistency through tone pattern analysis and mode-specific scoring.
38
-
39
- ### Scoring Process
40
-
41
- 1. Analyzes tone patterns:
42
-
43
- - Extracts sentiment features
44
- - Computes sentiment scores
45
- - Measures tone variations
46
-
47
- 2. Calculates mode-specific score: **Tone Consistency** (input and output):
48
-
49
- - Compares sentiment between texts
50
- - Calculates sentiment difference
51
- - Score = 1 - (sentiment\_difference / max\_difference)
-
- **Tone Stability** (single input):
52
- - Analyzes sentiment across sentences
53
- - Calculates sentiment variance
54
- - Score = 1 - (sentiment\_variance / max\_variance)
55
-
56
- Final score: `mode_specific_score * scale`
57
-
58
- ### Score interpretation
59
-
60
- Scores range from 0 to `scale` (0–1 by default):
61
-
62
- - 1.0: Perfect tone consistency/stability
63
- - 0.7-0.9: Strong consistency with minor variations
64
- - 0.4-0.6: Moderate consistency with noticeable shifts
65
- - 0.1-0.3: Poor consistency with major tone changes
66
- - 0.0: No consistency - completely different tones
67
-
68
- ### analyzeStepResult
69
-
70
- Object with tone metrics:
71
-
72
- - **responseSentiment**: Sentiment score for the response (comparison mode).
73
- - **referenceSentiment**: Sentiment score for the input/reference (comparison mode).
74
- - **difference**: Absolute difference between sentiment scores (comparison mode).
75
- - **avgSentiment**: Average sentiment across sentences (stability mode).
76
- - **sentimentVariance**: Variance of sentiment across sentences (stability mode).
77
-
78
- ## Example
79
-
80
- Evaluate tone consistency between related agent responses:
81
-
82
- ```typescript
83
- import { runEvals } from "@mastra/core/evals";
84
- import { createToneScorer } from "@mastra/evals/scorers/prebuilt";
85
- import { myAgent } from "./agent";
86
-
87
- const scorer = createToneScorer();
88
-
89
- const result = await runEvals({
90
- data: [
91
- {
92
- input: "How was your experience with our service?",
93
- groundTruth: "The service was excellent and exceeded expectations!",
94
- },
95
- {
96
- input: "Tell me about the customer support",
97
- groundTruth: "The support team was friendly and very helpful.",
98
- },
99
- ],
100
- scorers: [scorer],
101
- target: myAgent,
102
- onItemComplete: ({ scorerResults }) => {
103
- console.log({
104
- score: scorerResults[scorer.id].score,
105
- });
106
- },
107
- });
108
-
109
- console.log(result.scores);
110
- ```
111
-
112
- For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
113
-
114
- To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
115
-
116
- ## Related
117
-
118
- - [Content Similarity Scorer](https://mastra.ai/reference/evals/content-similarity)
119
- - [Toxicity Scorer](https://mastra.ai/reference/evals/toxicity)