@mastra/mcp-docs-server 1.1.4 → 1.1.5-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (547) hide show
  1. package/CHANGELOG.md +7 -0
  2. package/package.json +3 -3
  3. package/.docs/docs/agents/adding-voice.md +0 -353
  4. package/.docs/docs/agents/agent-approval.md +0 -377
  5. package/.docs/docs/agents/agent-memory.md +0 -212
  6. package/.docs/docs/agents/guardrails.md +0 -382
  7. package/.docs/docs/agents/network-approval.md +0 -275
  8. package/.docs/docs/agents/networks.md +0 -290
  9. package/.docs/docs/agents/overview.md +0 -309
  10. package/.docs/docs/agents/processors.md +0 -632
  11. package/.docs/docs/agents/structured-output.md +0 -271
  12. package/.docs/docs/agents/using-tools.md +0 -214
  13. package/.docs/docs/build-with-ai/mcp-docs-server.md +0 -241
  14. package/.docs/docs/build-with-ai/skills.md +0 -35
  15. package/.docs/docs/community/contributing-templates.md +0 -3
  16. package/.docs/docs/community/discord.md +0 -9
  17. package/.docs/docs/community/licensing.md +0 -66
  18. package/.docs/docs/deployment/cloud-providers.md +0 -15
  19. package/.docs/docs/deployment/mastra-server.md +0 -122
  20. package/.docs/docs/deployment/monorepo.md +0 -142
  21. package/.docs/docs/deployment/overview.md +0 -62
  22. package/.docs/docs/deployment/studio.md +0 -234
  23. package/.docs/docs/deployment/web-framework.md +0 -52
  24. package/.docs/docs/deployment/workflow-runners.md +0 -9
  25. package/.docs/docs/evals/built-in-scorers.md +0 -47
  26. package/.docs/docs/evals/custom-scorers.md +0 -519
  27. package/.docs/docs/evals/overview.md +0 -146
  28. package/.docs/docs/evals/running-in-ci.md +0 -106
  29. package/.docs/docs/getting-started/build-with-ai.md +0 -68
  30. package/.docs/docs/getting-started/manual-install.md +0 -226
  31. package/.docs/docs/getting-started/project-structure.md +0 -60
  32. package/.docs/docs/getting-started/start.md +0 -28
  33. package/.docs/docs/getting-started/studio.md +0 -101
  34. package/.docs/docs/index.md +0 -43
  35. package/.docs/docs/mastra-cloud/deployment.md +0 -77
  36. package/.docs/docs/mastra-cloud/observability.md +0 -38
  37. package/.docs/docs/mastra-cloud/overview.md +0 -23
  38. package/.docs/docs/mastra-cloud/setup.md +0 -42
  39. package/.docs/docs/mastra-cloud/studio.md +0 -24
  40. package/.docs/docs/mcp/overview.md +0 -370
  41. package/.docs/docs/mcp/publishing-mcp-server.md +0 -95
  42. package/.docs/docs/memory/memory-processors.md +0 -316
  43. package/.docs/docs/memory/message-history.md +0 -260
  44. package/.docs/docs/memory/observational-memory.md +0 -246
  45. package/.docs/docs/memory/overview.md +0 -45
  46. package/.docs/docs/memory/semantic-recall.md +0 -272
  47. package/.docs/docs/memory/storage.md +0 -261
  48. package/.docs/docs/memory/working-memory.md +0 -400
  49. package/.docs/docs/observability/datasets/overview.md +0 -188
  50. package/.docs/docs/observability/datasets/running-experiments.md +0 -266
  51. package/.docs/docs/observability/logging.md +0 -99
  52. package/.docs/docs/observability/overview.md +0 -70
  53. package/.docs/docs/observability/tracing/bridges/otel.md +0 -209
  54. package/.docs/docs/observability/tracing/exporters/arize.md +0 -274
  55. package/.docs/docs/observability/tracing/exporters/braintrust.md +0 -111
  56. package/.docs/docs/observability/tracing/exporters/cloud.md +0 -129
  57. package/.docs/docs/observability/tracing/exporters/datadog.md +0 -187
  58. package/.docs/docs/observability/tracing/exporters/default.md +0 -211
  59. package/.docs/docs/observability/tracing/exporters/laminar.md +0 -100
  60. package/.docs/docs/observability/tracing/exporters/langfuse.md +0 -217
  61. package/.docs/docs/observability/tracing/exporters/langsmith.md +0 -202
  62. package/.docs/docs/observability/tracing/exporters/otel.md +0 -479
  63. package/.docs/docs/observability/tracing/exporters/posthog.md +0 -148
  64. package/.docs/docs/observability/tracing/exporters/sentry.md +0 -208
  65. package/.docs/docs/observability/tracing/overview.md +0 -1114
  66. package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +0 -303
  67. package/.docs/docs/rag/chunking-and-embedding.md +0 -183
  68. package/.docs/docs/rag/graph-rag.md +0 -215
  69. package/.docs/docs/rag/overview.md +0 -72
  70. package/.docs/docs/rag/retrieval.md +0 -521
  71. package/.docs/docs/rag/vector-databases.md +0 -648
  72. package/.docs/docs/server/auth/auth0.md +0 -222
  73. package/.docs/docs/server/auth/better-auth.md +0 -203
  74. package/.docs/docs/server/auth/clerk.md +0 -132
  75. package/.docs/docs/server/auth/composite-auth.md +0 -234
  76. package/.docs/docs/server/auth/custom-auth-provider.md +0 -513
  77. package/.docs/docs/server/auth/firebase.md +0 -272
  78. package/.docs/docs/server/auth/jwt.md +0 -110
  79. package/.docs/docs/server/auth/simple-auth.md +0 -178
  80. package/.docs/docs/server/auth/supabase.md +0 -117
  81. package/.docs/docs/server/auth/workos.md +0 -190
  82. package/.docs/docs/server/auth.md +0 -38
  83. package/.docs/docs/server/custom-adapters.md +0 -374
  84. package/.docs/docs/server/custom-api-routes.md +0 -267
  85. package/.docs/docs/server/mastra-client.md +0 -243
  86. package/.docs/docs/server/mastra-server.md +0 -71
  87. package/.docs/docs/server/middleware.md +0 -228
  88. package/.docs/docs/server/request-context.md +0 -478
  89. package/.docs/docs/server/server-adapters.md +0 -547
  90. package/.docs/docs/streaming/events.md +0 -247
  91. package/.docs/docs/streaming/overview.md +0 -181
  92. package/.docs/docs/streaming/tool-streaming.md +0 -178
  93. package/.docs/docs/streaming/workflow-streaming.md +0 -109
  94. package/.docs/docs/voice/overview.md +0 -979
  95. package/.docs/docs/voice/speech-to-speech.md +0 -103
  96. package/.docs/docs/voice/speech-to-text.md +0 -80
  97. package/.docs/docs/voice/text-to-speech.md +0 -84
  98. package/.docs/docs/workflows/agents-and-tools.md +0 -170
  99. package/.docs/docs/workflows/control-flow.md +0 -823
  100. package/.docs/docs/workflows/error-handling.md +0 -360
  101. package/.docs/docs/workflows/human-in-the-loop.md +0 -213
  102. package/.docs/docs/workflows/overview.md +0 -372
  103. package/.docs/docs/workflows/snapshots.md +0 -238
  104. package/.docs/docs/workflows/suspend-and-resume.md +0 -205
  105. package/.docs/docs/workflows/time-travel.md +0 -309
  106. package/.docs/docs/workflows/workflow-state.md +0 -181
  107. package/.docs/docs/workspace/filesystem.md +0 -162
  108. package/.docs/docs/workspace/overview.md +0 -239
  109. package/.docs/docs/workspace/sandbox.md +0 -63
  110. package/.docs/docs/workspace/search.md +0 -219
  111. package/.docs/docs/workspace/skills.md +0 -126
  112. package/.docs/guides/agent-frameworks/ai-sdk.md +0 -140
  113. package/.docs/guides/build-your-ui/ai-sdk-ui.md +0 -1463
  114. package/.docs/guides/build-your-ui/assistant-ui.md +0 -156
  115. package/.docs/guides/build-your-ui/copilotkit.md +0 -292
  116. package/.docs/guides/deployment/amazon-ec2.md +0 -130
  117. package/.docs/guides/deployment/aws-lambda.md +0 -248
  118. package/.docs/guides/deployment/azure-app-services.md +0 -114
  119. package/.docs/guides/deployment/cloudflare.md +0 -99
  120. package/.docs/guides/deployment/digital-ocean.md +0 -168
  121. package/.docs/guides/deployment/inngest.md +0 -685
  122. package/.docs/guides/deployment/netlify.md +0 -77
  123. package/.docs/guides/deployment/vercel.md +0 -101
  124. package/.docs/guides/getting-started/astro.md +0 -408
  125. package/.docs/guides/getting-started/electron.md +0 -504
  126. package/.docs/guides/getting-started/express.md +0 -251
  127. package/.docs/guides/getting-started/hono.md +0 -191
  128. package/.docs/guides/getting-started/next-js.md +0 -355
  129. package/.docs/guides/getting-started/nuxt.md +0 -476
  130. package/.docs/guides/getting-started/quickstart.md +0 -67
  131. package/.docs/guides/getting-started/sveltekit.md +0 -300
  132. package/.docs/guides/getting-started/vite-react.md +0 -439
  133. package/.docs/guides/guide/ai-recruiter.md +0 -227
  134. package/.docs/guides/guide/chef-michel.md +0 -215
  135. package/.docs/guides/guide/code-review-bot.md +0 -221
  136. package/.docs/guides/guide/dev-assistant.md +0 -304
  137. package/.docs/guides/guide/docs-manager.md +0 -238
  138. package/.docs/guides/guide/github-actions-pr-description.md +0 -236
  139. package/.docs/guides/guide/notes-mcp-server.md +0 -425
  140. package/.docs/guides/guide/research-assistant.md +0 -349
  141. package/.docs/guides/guide/stock-agent.md +0 -134
  142. package/.docs/guides/guide/web-search.md +0 -326
  143. package/.docs/guides/guide/whatsapp-chat-bot.md +0 -416
  144. package/.docs/guides/index.md +0 -3
  145. package/.docs/guides/migrations/agentnetwork.md +0 -101
  146. package/.docs/guides/migrations/ai-sdk-v4-to-v5.md +0 -112
  147. package/.docs/guides/migrations/upgrade-to-v1/agent.md +0 -404
  148. package/.docs/guides/migrations/upgrade-to-v1/cli.md +0 -57
  149. package/.docs/guides/migrations/upgrade-to-v1/client.md +0 -337
  150. package/.docs/guides/migrations/upgrade-to-v1/deployment.md +0 -37
  151. package/.docs/guides/migrations/upgrade-to-v1/evals.md +0 -239
  152. package/.docs/guides/migrations/upgrade-to-v1/mastra.md +0 -143
  153. package/.docs/guides/migrations/upgrade-to-v1/mcp.md +0 -97
  154. package/.docs/guides/migrations/upgrade-to-v1/memory.md +0 -285
  155. package/.docs/guides/migrations/upgrade-to-v1/overview.md +0 -119
  156. package/.docs/guides/migrations/upgrade-to-v1/processors.md +0 -68
  157. package/.docs/guides/migrations/upgrade-to-v1/rag.md +0 -42
  158. package/.docs/guides/migrations/upgrade-to-v1/storage.md +0 -553
  159. package/.docs/guides/migrations/upgrade-to-v1/tools.md +0 -180
  160. package/.docs/guides/migrations/upgrade-to-v1/tracing.md +0 -417
  161. package/.docs/guides/migrations/upgrade-to-v1/vectors.md +0 -87
  162. package/.docs/guides/migrations/upgrade-to-v1/voice.md +0 -30
  163. package/.docs/guides/migrations/upgrade-to-v1/workflows.md +0 -341
  164. package/.docs/guides/migrations/vnext-to-standard-apis.md +0 -364
  165. package/.docs/models/embeddings.md +0 -161
  166. package/.docs/models/gateways/azure-openai.md +0 -128
  167. package/.docs/models/gateways/custom-gateways.md +0 -545
  168. package/.docs/models/gateways/netlify.md +0 -88
  169. package/.docs/models/gateways/openrouter.md +0 -219
  170. package/.docs/models/gateways/vercel.md +0 -225
  171. package/.docs/models/gateways.md +0 -14
  172. package/.docs/models/index.md +0 -286
  173. package/.docs/models/providers/302ai.md +0 -134
  174. package/.docs/models/providers/abacus.md +0 -125
  175. package/.docs/models/providers/agentrouter.md +0 -90
  176. package/.docs/models/providers/aihubmix.md +0 -107
  177. package/.docs/models/providers/alibaba-cn.md +0 -135
  178. package/.docs/models/providers/alibaba.md +0 -111
  179. package/.docs/models/providers/amazon-bedrock.md +0 -33
  180. package/.docs/models/providers/anthropic.md +0 -153
  181. package/.docs/models/providers/azure.md +0 -33
  182. package/.docs/models/providers/bailing.md +0 -72
  183. package/.docs/models/providers/baseten.md +0 -77
  184. package/.docs/models/providers/berget.md +0 -78
  185. package/.docs/models/providers/cerebras.md +0 -101
  186. package/.docs/models/providers/chutes.md +0 -136
  187. package/.docs/models/providers/cloudflare-ai-gateway.md +0 -33
  188. package/.docs/models/providers/cloudflare-workers-ai.md +0 -109
  189. package/.docs/models/providers/cohere.md +0 -33
  190. package/.docs/models/providers/cortecs.md +0 -91
  191. package/.docs/models/providers/deepinfra.md +0 -112
  192. package/.docs/models/providers/deepseek.md +0 -88
  193. package/.docs/models/providers/fastrouter.md +0 -84
  194. package/.docs/models/providers/fireworks-ai.md +0 -89
  195. package/.docs/models/providers/firmware.md +0 -85
  196. package/.docs/models/providers/friendli.md +0 -78
  197. package/.docs/models/providers/github-models.md +0 -125
  198. package/.docs/models/providers/google-vertex.md +0 -33
  199. package/.docs/models/providers/google.md +0 -159
  200. package/.docs/models/providers/groq.md +0 -107
  201. package/.docs/models/providers/helicone.md +0 -161
  202. package/.docs/models/providers/huggingface.md +0 -90
  203. package/.docs/models/providers/iflowcn.md +0 -84
  204. package/.docs/models/providers/inception.md +0 -72
  205. package/.docs/models/providers/inference.md +0 -79
  206. package/.docs/models/providers/io-intelligence.md +0 -87
  207. package/.docs/models/providers/io-net.md +0 -87
  208. package/.docs/models/providers/jiekou.md +0 -131
  209. package/.docs/models/providers/kilo.md +0 -333
  210. package/.docs/models/providers/kimi-for-coding.md +0 -100
  211. package/.docs/models/providers/kuae-cloud-coding-plan.md +0 -71
  212. package/.docs/models/providers/llama.md +0 -77
  213. package/.docs/models/providers/lmstudio.md +0 -73
  214. package/.docs/models/providers/lucidquery.md +0 -72
  215. package/.docs/models/providers/minimax-cn-coding-plan.md +0 -102
  216. package/.docs/models/providers/minimax-cn.md +0 -102
  217. package/.docs/models/providers/minimax-coding-plan.md +0 -102
  218. package/.docs/models/providers/minimax.md +0 -104
  219. package/.docs/models/providers/mistral.md +0 -124
  220. package/.docs/models/providers/moark.md +0 -72
  221. package/.docs/models/providers/modelscope.md +0 -77
  222. package/.docs/models/providers/moonshotai-cn.md +0 -76
  223. package/.docs/models/providers/moonshotai.md +0 -76
  224. package/.docs/models/providers/morph.md +0 -73
  225. package/.docs/models/providers/nano-gpt.md +0 -103
  226. package/.docs/models/providers/nebius.md +0 -116
  227. package/.docs/models/providers/nova.md +0 -72
  228. package/.docs/models/providers/novita-ai.md +0 -154
  229. package/.docs/models/providers/nvidia.md +0 -141
  230. package/.docs/models/providers/ollama-cloud.md +0 -103
  231. package/.docs/models/providers/ollama.md +0 -33
  232. package/.docs/models/providers/openai.md +0 -193
  233. package/.docs/models/providers/opencode.md +0 -100
  234. package/.docs/models/providers/ovhcloud.md +0 -83
  235. package/.docs/models/providers/perplexity.md +0 -100
  236. package/.docs/models/providers/poe.md +0 -183
  237. package/.docs/models/providers/privatemode-ai.md +0 -75
  238. package/.docs/models/providers/requesty.md +0 -90
  239. package/.docs/models/providers/scaleway.md +0 -84
  240. package/.docs/models/providers/siliconflow-cn.md +0 -138
  241. package/.docs/models/providers/siliconflow.md +0 -140
  242. package/.docs/models/providers/stackit.md +0 -78
  243. package/.docs/models/providers/stepfun.md +0 -73
  244. package/.docs/models/providers/submodel.md +0 -79
  245. package/.docs/models/providers/synthetic.md +0 -96
  246. package/.docs/models/providers/togetherai.md +0 -115
  247. package/.docs/models/providers/upstage.md +0 -73
  248. package/.docs/models/providers/venice.md +0 -95
  249. package/.docs/models/providers/vivgrid.md +0 -106
  250. package/.docs/models/providers/vultr.md +0 -75
  251. package/.docs/models/providers/wandb.md +0 -80
  252. package/.docs/models/providers/xai.md +0 -141
  253. package/.docs/models/providers/xiaomi.md +0 -71
  254. package/.docs/models/providers/zai-coding-plan.md +0 -80
  255. package/.docs/models/providers/zai.md +0 -79
  256. package/.docs/models/providers/zenmux.md +0 -161
  257. package/.docs/models/providers/zhipuai-coding-plan.md +0 -79
  258. package/.docs/models/providers/zhipuai.md +0 -79
  259. package/.docs/models/providers.md +0 -81
  260. package/.docs/reference/agents/agent.md +0 -142
  261. package/.docs/reference/agents/generate.md +0 -174
  262. package/.docs/reference/agents/generateLegacy.md +0 -176
  263. package/.docs/reference/agents/getDefaultGenerateOptions.md +0 -36
  264. package/.docs/reference/agents/getDefaultOptions.md +0 -34
  265. package/.docs/reference/agents/getDefaultStreamOptions.md +0 -36
  266. package/.docs/reference/agents/getDescription.md +0 -21
  267. package/.docs/reference/agents/getInstructions.md +0 -34
  268. package/.docs/reference/agents/getLLM.md +0 -37
  269. package/.docs/reference/agents/getMemory.md +0 -34
  270. package/.docs/reference/agents/getModel.md +0 -34
  271. package/.docs/reference/agents/getTools.md +0 -29
  272. package/.docs/reference/agents/getVoice.md +0 -34
  273. package/.docs/reference/agents/listAgents.md +0 -35
  274. package/.docs/reference/agents/listScorers.md +0 -34
  275. package/.docs/reference/agents/listTools.md +0 -34
  276. package/.docs/reference/agents/listWorkflows.md +0 -34
  277. package/.docs/reference/agents/network.md +0 -134
  278. package/.docs/reference/ai-sdk/chat-route.md +0 -82
  279. package/.docs/reference/ai-sdk/handle-chat-stream.md +0 -53
  280. package/.docs/reference/ai-sdk/handle-network-stream.md +0 -37
  281. package/.docs/reference/ai-sdk/handle-workflow-stream.md +0 -55
  282. package/.docs/reference/ai-sdk/network-route.md +0 -74
  283. package/.docs/reference/ai-sdk/to-ai-sdk-stream.md +0 -232
  284. package/.docs/reference/ai-sdk/to-ai-sdk-v4-messages.md +0 -79
  285. package/.docs/reference/ai-sdk/to-ai-sdk-v5-messages.md +0 -73
  286. package/.docs/reference/ai-sdk/with-mastra.md +0 -59
  287. package/.docs/reference/ai-sdk/workflow-route.md +0 -79
  288. package/.docs/reference/auth/auth0.md +0 -73
  289. package/.docs/reference/auth/better-auth.md +0 -71
  290. package/.docs/reference/auth/clerk.md +0 -36
  291. package/.docs/reference/auth/firebase.md +0 -80
  292. package/.docs/reference/auth/jwt.md +0 -26
  293. package/.docs/reference/auth/supabase.md +0 -33
  294. package/.docs/reference/auth/workos.md +0 -84
  295. package/.docs/reference/cli/create-mastra.md +0 -137
  296. package/.docs/reference/cli/mastra.md +0 -336
  297. package/.docs/reference/client-js/agents.md +0 -438
  298. package/.docs/reference/client-js/error-handling.md +0 -16
  299. package/.docs/reference/client-js/logs.md +0 -24
  300. package/.docs/reference/client-js/mastra-client.md +0 -63
  301. package/.docs/reference/client-js/memory.md +0 -225
  302. package/.docs/reference/client-js/observability.md +0 -72
  303. package/.docs/reference/client-js/telemetry.md +0 -20
  304. package/.docs/reference/client-js/tools.md +0 -44
  305. package/.docs/reference/client-js/vectors.md +0 -79
  306. package/.docs/reference/client-js/workflows.md +0 -199
  307. package/.docs/reference/configuration.md +0 -749
  308. package/.docs/reference/core/addGateway.md +0 -42
  309. package/.docs/reference/core/getAgent.md +0 -21
  310. package/.docs/reference/core/getAgentById.md +0 -21
  311. package/.docs/reference/core/getDeployer.md +0 -22
  312. package/.docs/reference/core/getGateway.md +0 -38
  313. package/.docs/reference/core/getGatewayById.md +0 -41
  314. package/.docs/reference/core/getLogger.md +0 -22
  315. package/.docs/reference/core/getMCPServer.md +0 -45
  316. package/.docs/reference/core/getMCPServerById.md +0 -53
  317. package/.docs/reference/core/getMemory.md +0 -50
  318. package/.docs/reference/core/getScorer.md +0 -54
  319. package/.docs/reference/core/getScorerById.md +0 -54
  320. package/.docs/reference/core/getServer.md +0 -22
  321. package/.docs/reference/core/getStorage.md +0 -22
  322. package/.docs/reference/core/getStoredAgentById.md +0 -89
  323. package/.docs/reference/core/getTelemetry.md +0 -22
  324. package/.docs/reference/core/getVector.md +0 -22
  325. package/.docs/reference/core/getWorkflow.md +0 -40
  326. package/.docs/reference/core/listAgents.md +0 -21
  327. package/.docs/reference/core/listGateways.md +0 -40
  328. package/.docs/reference/core/listLogs.md +0 -38
  329. package/.docs/reference/core/listLogsByRunId.md +0 -36
  330. package/.docs/reference/core/listMCPServers.md +0 -51
  331. package/.docs/reference/core/listMemory.md +0 -56
  332. package/.docs/reference/core/listScorers.md +0 -29
  333. package/.docs/reference/core/listStoredAgents.md +0 -93
  334. package/.docs/reference/core/listVectors.md +0 -22
  335. package/.docs/reference/core/listWorkflows.md +0 -21
  336. package/.docs/reference/core/mastra-class.md +0 -66
  337. package/.docs/reference/core/mastra-model-gateway.md +0 -153
  338. package/.docs/reference/core/setLogger.md +0 -26
  339. package/.docs/reference/core/setStorage.md +0 -27
  340. package/.docs/reference/datasets/addItem.md +0 -35
  341. package/.docs/reference/datasets/addItems.md +0 -33
  342. package/.docs/reference/datasets/compareExperiments.md +0 -48
  343. package/.docs/reference/datasets/create.md +0 -49
  344. package/.docs/reference/datasets/dataset.md +0 -78
  345. package/.docs/reference/datasets/datasets-manager.md +0 -84
  346. package/.docs/reference/datasets/delete.md +0 -23
  347. package/.docs/reference/datasets/deleteExperiment.md +0 -25
  348. package/.docs/reference/datasets/deleteItem.md +0 -25
  349. package/.docs/reference/datasets/deleteItems.md +0 -27
  350. package/.docs/reference/datasets/get.md +0 -29
  351. package/.docs/reference/datasets/getDetails.md +0 -45
  352. package/.docs/reference/datasets/getExperiment.md +0 -28
  353. package/.docs/reference/datasets/getItem.md +0 -31
  354. package/.docs/reference/datasets/getItemHistory.md +0 -29
  355. package/.docs/reference/datasets/list.md +0 -29
  356. package/.docs/reference/datasets/listExperimentResults.md +0 -37
  357. package/.docs/reference/datasets/listExperiments.md +0 -31
  358. package/.docs/reference/datasets/listItems.md +0 -44
  359. package/.docs/reference/datasets/listVersions.md +0 -31
  360. package/.docs/reference/datasets/startExperiment.md +0 -60
  361. package/.docs/reference/datasets/startExperimentAsync.md +0 -41
  362. package/.docs/reference/datasets/update.md +0 -46
  363. package/.docs/reference/datasets/updateItem.md +0 -36
  364. package/.docs/reference/deployer/cloudflare.md +0 -79
  365. package/.docs/reference/deployer/netlify.md +0 -82
  366. package/.docs/reference/deployer/vercel.md +0 -91
  367. package/.docs/reference/deployer.md +0 -100
  368. package/.docs/reference/evals/answer-relevancy.md +0 -105
  369. package/.docs/reference/evals/answer-similarity.md +0 -99
  370. package/.docs/reference/evals/bias.md +0 -120
  371. package/.docs/reference/evals/completeness.md +0 -137
  372. package/.docs/reference/evals/content-similarity.md +0 -101
  373. package/.docs/reference/evals/context-precision.md +0 -196
  374. package/.docs/reference/evals/context-relevance.md +0 -536
  375. package/.docs/reference/evals/create-scorer.md +0 -270
  376. package/.docs/reference/evals/faithfulness.md +0 -114
  377. package/.docs/reference/evals/hallucination.md +0 -220
  378. package/.docs/reference/evals/keyword-coverage.md +0 -128
  379. package/.docs/reference/evals/mastra-scorer.md +0 -123
  380. package/.docs/reference/evals/noise-sensitivity.md +0 -685
  381. package/.docs/reference/evals/prompt-alignment.md +0 -619
  382. package/.docs/reference/evals/run-evals.md +0 -138
  383. package/.docs/reference/evals/scorer-utils.md +0 -330
  384. package/.docs/reference/evals/textual-difference.md +0 -113
  385. package/.docs/reference/evals/tone-consistency.md +0 -119
  386. package/.docs/reference/evals/tool-call-accuracy.md +0 -533
  387. package/.docs/reference/evals/toxicity.md +0 -123
  388. package/.docs/reference/harness/harness-class.md +0 -645
  389. package/.docs/reference/index.md +0 -276
  390. package/.docs/reference/logging/pino-logger.md +0 -117
  391. package/.docs/reference/memory/clone-utilities.md +0 -199
  392. package/.docs/reference/memory/cloneThread.md +0 -130
  393. package/.docs/reference/memory/createThread.md +0 -68
  394. package/.docs/reference/memory/deleteMessages.md +0 -40
  395. package/.docs/reference/memory/getThreadById.md +0 -24
  396. package/.docs/reference/memory/listThreads.md +0 -145
  397. package/.docs/reference/memory/memory-class.md +0 -147
  398. package/.docs/reference/memory/observational-memory.md +0 -565
  399. package/.docs/reference/memory/recall.md +0 -91
  400. package/.docs/reference/observability/tracing/bridges/otel.md +0 -131
  401. package/.docs/reference/observability/tracing/configuration.md +0 -178
  402. package/.docs/reference/observability/tracing/exporters/arize.md +0 -141
  403. package/.docs/reference/observability/tracing/exporters/braintrust.md +0 -93
  404. package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +0 -163
  405. package/.docs/reference/observability/tracing/exporters/console-exporter.md +0 -138
  406. package/.docs/reference/observability/tracing/exporters/datadog.md +0 -116
  407. package/.docs/reference/observability/tracing/exporters/default-exporter.md +0 -174
  408. package/.docs/reference/observability/tracing/exporters/laminar.md +0 -78
  409. package/.docs/reference/observability/tracing/exporters/langfuse.md +0 -134
  410. package/.docs/reference/observability/tracing/exporters/langsmith.md +0 -110
  411. package/.docs/reference/observability/tracing/exporters/otel.md +0 -199
  412. package/.docs/reference/observability/tracing/exporters/posthog.md +0 -92
  413. package/.docs/reference/observability/tracing/exporters/sentry.md +0 -184
  414. package/.docs/reference/observability/tracing/instances.md +0 -109
  415. package/.docs/reference/observability/tracing/interfaces.md +0 -749
  416. package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +0 -144
  417. package/.docs/reference/observability/tracing/spans.md +0 -224
  418. package/.docs/reference/processors/batch-parts-processor.md +0 -61
  419. package/.docs/reference/processors/language-detector.md +0 -81
  420. package/.docs/reference/processors/message-history-processor.md +0 -85
  421. package/.docs/reference/processors/moderation-processor.md +0 -104
  422. package/.docs/reference/processors/pii-detector.md +0 -107
  423. package/.docs/reference/processors/processor-interface.md +0 -525
  424. package/.docs/reference/processors/prompt-injection-detector.md +0 -71
  425. package/.docs/reference/processors/semantic-recall-processor.md +0 -123
  426. package/.docs/reference/processors/system-prompt-scrubber.md +0 -80
  427. package/.docs/reference/processors/token-limiter-processor.md +0 -113
  428. package/.docs/reference/processors/tool-call-filter.md +0 -85
  429. package/.docs/reference/processors/tool-search-processor.md +0 -113
  430. package/.docs/reference/processors/unicode-normalizer.md +0 -62
  431. package/.docs/reference/processors/working-memory-processor.md +0 -154
  432. package/.docs/reference/rag/chunk.md +0 -221
  433. package/.docs/reference/rag/database-config.md +0 -264
  434. package/.docs/reference/rag/document.md +0 -114
  435. package/.docs/reference/rag/embeddings.md +0 -92
  436. package/.docs/reference/rag/extract-params.md +0 -168
  437. package/.docs/reference/rag/graph-rag.md +0 -111
  438. package/.docs/reference/rag/metadata-filters.md +0 -216
  439. package/.docs/reference/rag/rerank.md +0 -80
  440. package/.docs/reference/rag/rerankWithScorer.md +0 -80
  441. package/.docs/reference/server/create-route.md +0 -260
  442. package/.docs/reference/server/express-adapter.md +0 -176
  443. package/.docs/reference/server/fastify-adapter.md +0 -90
  444. package/.docs/reference/server/hono-adapter.md +0 -162
  445. package/.docs/reference/server/koa-adapter.md +0 -127
  446. package/.docs/reference/server/mastra-server.md +0 -298
  447. package/.docs/reference/server/register-api-route.md +0 -249
  448. package/.docs/reference/server/routes.md +0 -306
  449. package/.docs/reference/storage/cloudflare-d1.md +0 -218
  450. package/.docs/reference/storage/cloudflare.md +0 -88
  451. package/.docs/reference/storage/composite.md +0 -235
  452. package/.docs/reference/storage/convex.md +0 -161
  453. package/.docs/reference/storage/dynamodb.md +0 -282
  454. package/.docs/reference/storage/lance.md +0 -131
  455. package/.docs/reference/storage/libsql.md +0 -135
  456. package/.docs/reference/storage/mongodb.md +0 -262
  457. package/.docs/reference/storage/mssql.md +0 -155
  458. package/.docs/reference/storage/overview.md +0 -121
  459. package/.docs/reference/storage/postgresql.md +0 -529
  460. package/.docs/reference/storage/upstash.md +0 -160
  461. package/.docs/reference/streaming/ChunkType.md +0 -292
  462. package/.docs/reference/streaming/agents/MastraModelOutput.md +0 -182
  463. package/.docs/reference/streaming/agents/stream.md +0 -212
  464. package/.docs/reference/streaming/agents/streamLegacy.md +0 -142
  465. package/.docs/reference/streaming/workflows/observeStream.md +0 -42
  466. package/.docs/reference/streaming/workflows/resumeStream.md +0 -61
  467. package/.docs/reference/streaming/workflows/stream.md +0 -88
  468. package/.docs/reference/streaming/workflows/timeTravelStream.md +0 -142
  469. package/.docs/reference/templates/overview.md +0 -194
  470. package/.docs/reference/tools/create-tool.md +0 -237
  471. package/.docs/reference/tools/document-chunker-tool.md +0 -89
  472. package/.docs/reference/tools/graph-rag-tool.md +0 -185
  473. package/.docs/reference/tools/mcp-client.md +0 -962
  474. package/.docs/reference/tools/mcp-server.md +0 -1275
  475. package/.docs/reference/tools/vector-query-tool.md +0 -459
  476. package/.docs/reference/vectors/astra.md +0 -121
  477. package/.docs/reference/vectors/chroma.md +0 -267
  478. package/.docs/reference/vectors/convex.md +0 -303
  479. package/.docs/reference/vectors/couchbase.md +0 -226
  480. package/.docs/reference/vectors/duckdb.md +0 -318
  481. package/.docs/reference/vectors/elasticsearch.md +0 -189
  482. package/.docs/reference/vectors/lance.md +0 -220
  483. package/.docs/reference/vectors/libsql.md +0 -305
  484. package/.docs/reference/vectors/mongodb.md +0 -295
  485. package/.docs/reference/vectors/opensearch.md +0 -99
  486. package/.docs/reference/vectors/pg.md +0 -408
  487. package/.docs/reference/vectors/pinecone.md +0 -168
  488. package/.docs/reference/vectors/qdrant.md +0 -222
  489. package/.docs/reference/vectors/s3vectors.md +0 -277
  490. package/.docs/reference/vectors/turbopuffer.md +0 -157
  491. package/.docs/reference/vectors/upstash.md +0 -294
  492. package/.docs/reference/vectors/vectorize.md +0 -147
  493. package/.docs/reference/voice/azure.md +0 -148
  494. package/.docs/reference/voice/cloudflare.md +0 -83
  495. package/.docs/reference/voice/composite-voice.md +0 -121
  496. package/.docs/reference/voice/deepgram.md +0 -79
  497. package/.docs/reference/voice/elevenlabs.md +0 -98
  498. package/.docs/reference/voice/google-gemini-live.md +0 -378
  499. package/.docs/reference/voice/google.md +0 -228
  500. package/.docs/reference/voice/mastra-voice.md +0 -313
  501. package/.docs/reference/voice/murf.md +0 -122
  502. package/.docs/reference/voice/openai-realtime.md +0 -203
  503. package/.docs/reference/voice/openai.md +0 -88
  504. package/.docs/reference/voice/playai.md +0 -80
  505. package/.docs/reference/voice/sarvam.md +0 -126
  506. package/.docs/reference/voice/speechify.md +0 -75
  507. package/.docs/reference/voice/voice.addInstructions.md +0 -56
  508. package/.docs/reference/voice/voice.addTools.md +0 -67
  509. package/.docs/reference/voice/voice.answer.md +0 -54
  510. package/.docs/reference/voice/voice.close.md +0 -51
  511. package/.docs/reference/voice/voice.connect.md +0 -94
  512. package/.docs/reference/voice/voice.events.md +0 -37
  513. package/.docs/reference/voice/voice.getSpeakers.md +0 -129
  514. package/.docs/reference/voice/voice.listen.md +0 -164
  515. package/.docs/reference/voice/voice.off.md +0 -54
  516. package/.docs/reference/voice/voice.on.md +0 -111
  517. package/.docs/reference/voice/voice.send.md +0 -65
  518. package/.docs/reference/voice/voice.speak.md +0 -157
  519. package/.docs/reference/voice/voice.updateConfig.md +0 -60
  520. package/.docs/reference/workflows/run-methods/cancel.md +0 -86
  521. package/.docs/reference/workflows/run-methods/restart.md +0 -33
  522. package/.docs/reference/workflows/run-methods/resume.md +0 -59
  523. package/.docs/reference/workflows/run-methods/start.md +0 -58
  524. package/.docs/reference/workflows/run-methods/startAsync.md +0 -67
  525. package/.docs/reference/workflows/run-methods/timeTravel.md +0 -142
  526. package/.docs/reference/workflows/run.md +0 -59
  527. package/.docs/reference/workflows/step.md +0 -119
  528. package/.docs/reference/workflows/workflow-methods/branch.md +0 -25
  529. package/.docs/reference/workflows/workflow-methods/commit.md +0 -17
  530. package/.docs/reference/workflows/workflow-methods/create-run.md +0 -63
  531. package/.docs/reference/workflows/workflow-methods/dountil.md +0 -25
  532. package/.docs/reference/workflows/workflow-methods/dowhile.md +0 -25
  533. package/.docs/reference/workflows/workflow-methods/foreach.md +0 -118
  534. package/.docs/reference/workflows/workflow-methods/map.md +0 -93
  535. package/.docs/reference/workflows/workflow-methods/parallel.md +0 -21
  536. package/.docs/reference/workflows/workflow-methods/sleep.md +0 -35
  537. package/.docs/reference/workflows/workflow-methods/sleepUntil.md +0 -35
  538. package/.docs/reference/workflows/workflow-methods/then.md +0 -21
  539. package/.docs/reference/workflows/workflow.md +0 -157
  540. package/.docs/reference/workspace/e2b-sandbox.md +0 -288
  541. package/.docs/reference/workspace/filesystem.md +0 -202
  542. package/.docs/reference/workspace/gcs-filesystem.md +0 -170
  543. package/.docs/reference/workspace/local-filesystem.md +0 -327
  544. package/.docs/reference/workspace/local-sandbox.md +0 -285
  545. package/.docs/reference/workspace/s3-filesystem.md +0 -169
  546. package/.docs/reference/workspace/sandbox.md +0 -81
  547. package/.docs/reference/workspace/workspace-class.md +0 -226
@@ -1,533 +0,0 @@
1
- # Tool Call Accuracy Scorers
2
-
3
- Mastra provides two tool call accuracy scorers for evaluating whether an LLM selects the correct tools from available options:
4
-
5
- 1. **Code-based scorer** - Deterministic evaluation using exact tool matching
6
- 2. **LLM-based scorer** - Semantic evaluation using AI to assess appropriateness
7
-
8
- ## Choosing Between Scorers
9
-
10
- ### Use the Code-Based Scorer When:
11
-
12
- - You need **deterministic, reproducible** results
13
- - You want to test **exact tool matching**
14
- - You need to validate **specific tool sequences**
15
- - Speed and cost are priorities (no LLM calls)
16
- - You're running automated tests
17
-
18
- ### Use the LLM-Based Scorer When:
19
-
20
- - You need **semantic understanding** of appropriateness
21
- - Tool selection depends on **context and intent**
22
- - You want to handle **edge cases** like clarification requests
23
- - You need **explanations** for scoring decisions
24
- - You're evaluating **production agent behavior**
25
-
26
- ## Code-Based Tool Call Accuracy Scorer
27
-
28
- The `createToolCallAccuracyScorerCode()` function from `@mastra/evals/scorers/prebuilt` provides deterministic binary scoring based on exact tool matching and supports both strict and lenient evaluation modes, as well as tool calling order validation.
29
-
30
- ### Parameters
31
-
32
- **expectedTool:** (`string`): The name of the tool that should be called for the given task. Ignored when expectedToolOrder is provided.
33
-
34
- **strictMode:** (`boolean`): Controls evaluation strictness. In single tool mode, only a single call to the expected tool is accepted. In order checking mode, the tools called must match the expected order exactly, with no extra tools allowed.
35
-
36
- **expectedToolOrder:** (`string[]`): Array of tool names in the expected calling order. When provided, enables order checking mode and ignores expectedTool parameter.
37
-
38
- This function returns an instance of the MastraScorer class. See the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer) for details on the `.run()` method and its input/output.
39
-
40
- ### Evaluation Modes
41
-
42
- The code-based scorer operates in two distinct modes:
43
-
44
- #### Single Tool Mode
45
-
46
- When `expectedToolOrder` is not provided, the scorer evaluates single tool selection:
47
-
48
- - **Standard Mode (strictMode: false)**: Returns `1` if the expected tool is called, regardless of other tools
49
- - **Strict Mode (strictMode: true)**: Returns `1` only if exactly one tool is called and it matches the expected tool
50
-
51
- #### Order Checking Mode
52
-
53
- When `expectedToolOrder` is provided, the scorer validates tool calling sequence:
54
-
55
- - **Strict Order (strictMode: true)**: Tools must be called in exactly the specified order with no extra tools
56
- - **Flexible Order (strictMode: false)**: Expected tools must appear in correct relative order (extra tools allowed)
57
-
58
- ## Code-Based Scoring Details
59
-
60
- - **Binary scores**: Always returns 0 or 1
61
- - **Deterministic**: Same input always produces same output
62
- - **Fast**: No external API calls
63
-
64
- ### Code-Based Scorer Options
65
-
66
- ```typescript
67
- // Standard mode - passes if expected tool is called
68
- const lenientScorer = createCodeScorer({
69
- expectedTool: "search-tool",
70
- strictMode: false,
71
- });
72
-
73
- // Strict mode - only passes if exactly one tool is called
74
- const strictScorer = createCodeScorer({
75
- expectedTool: "search-tool",
76
- strictMode: true,
77
- });
78
-
79
- // Order checking with strict mode
80
- const strictOrderScorer = createCodeScorer({
81
- expectedTool: "step1-tool",
82
- expectedToolOrder: ["step1-tool", "step2-tool", "step3-tool"],
83
- strictMode: true, // no extra tools allowed
84
- });
85
- ```
86
-
87
- ### Code-Based Scorer Results
88
-
89
- ```typescript
90
- {
91
- runId: string,
92
- preprocessStepResult: {
93
- expectedTool: string,
94
- actualTools: string[],
95
- strictMode: boolean,
96
- expectedToolOrder?: string[],
97
- hasToolCalls: boolean,
98
- correctToolCalled: boolean,
99
- correctOrderCalled: boolean | null,
100
- toolCallInfos: ToolCallInfo[]
101
- },
102
- score: number // Always 0 or 1
103
- }
104
- ```
105
-
106
- ## Code-Based Scorer Examples
107
-
108
- The code-based scorer provides deterministic, binary scoring (0 or 1) based on exact tool matching.
109
-
110
- ### Correct tool selection
111
-
112
- ```typescript
113
- const scorer = createToolCallAccuracyScorerCode({
114
- expectedTool: "weather-tool",
115
- });
116
-
117
- // Simulate LLM input and output with tool call
118
- const inputMessages = [
119
- createTestMessage({
120
- content: "What is the weather like in New York today?",
121
- role: "user",
122
- id: "input-1",
123
- }),
124
- ];
125
-
126
- const output = [
127
- createTestMessage({
128
- content: "Let me check the weather for you.",
129
- role: "assistant",
130
- id: "output-1",
131
- toolInvocations: [
132
- createToolInvocation({
133
- toolCallId: "call-123",
134
- toolName: "weather-tool",
135
- args: { location: "New York" },
136
- result: { temperature: "72°F", condition: "sunny" },
137
- state: "result",
138
- }),
139
- ],
140
- }),
141
- ];
142
-
143
- const run = createAgentTestRun({ inputMessages, output });
144
- const result = await scorer.run(run);
145
-
146
- console.log(result.score); // 1
147
- console.log(result.preprocessStepResult?.correctToolCalled); // true
148
- ```
149
-
150
- ### Strict mode evaluation
151
-
152
- Only passes if exactly one tool is called and it matches the expected tool:
153
-
154
- ```typescript
155
- const strictScorer = createToolCallAccuracyScorerCode({
156
- expectedTool: "weather-tool",
157
- strictMode: true,
158
- });
159
-
160
- // Multiple tools called - fails in strict mode
161
- const output = [
162
- createTestMessage({
163
- content: "Let me help you with that.",
164
- role: "assistant",
165
- id: "output-1",
166
- toolInvocations: [
167
- createToolInvocation({
168
- toolCallId: "call-1",
169
- toolName: "search-tool",
170
- args: {},
171
- result: {},
172
- state: "result",
173
- }),
174
- createToolInvocation({
175
- toolCallId: "call-2",
176
- toolName: "weather-tool",
177
- args: { location: "New York" },
178
- result: { temperature: "20°C" },
179
- state: "result",
180
- }),
181
- ],
182
- }),
183
- ];
184
-
185
- const result = await strictScorer.run(run);
186
- console.log(result.score); // 0 - fails because multiple tools were called
187
- ```
188
-
189
- ### Tool order validation
190
-
191
- Validates that tools are called in a specific sequence:
192
-
193
- ```typescript
194
- const orderScorer = createToolCallAccuracyScorerCode({
195
- expectedTool: "auth-tool", // ignored when order is specified
196
- expectedToolOrder: ["auth-tool", "fetch-tool"],
197
- strictMode: true, // no extra tools allowed
198
- });
199
-
200
- const output = [
201
- createTestMessage({
202
- content: "I will authenticate and fetch the data.",
203
- role: "assistant",
204
- id: "output-1",
205
- toolInvocations: [
206
- createToolInvocation({
207
- toolCallId: "call-1",
208
- toolName: "auth-tool",
209
- args: { token: "abc123" },
210
- result: { authenticated: true },
211
- state: "result",
212
- }),
213
- createToolInvocation({
214
- toolCallId: "call-2",
215
- toolName: "fetch-tool",
216
- args: { endpoint: "/data" },
217
- result: { data: ["item1"] },
218
- state: "result",
219
- }),
220
- ],
221
- }),
222
- ];
223
-
224
- const result = await orderScorer.run(run);
225
- console.log(result.score); // 1 - correct order
226
- ```
227
-
228
- ### Flexible order mode
229
-
230
- Allows extra tools as long as expected tools maintain relative order:
231
-
232
- ```typescript
233
- const flexibleOrderScorer = createToolCallAccuracyScorerCode({
234
- expectedTool: "auth-tool",
235
- expectedToolOrder: ["auth-tool", "fetch-tool"],
236
- strictMode: false, // allows extra tools
237
- });
238
-
239
- const output = [
240
- createTestMessage({
241
- content: "Performing comprehensive operation.",
242
- role: "assistant",
243
- id: "output-1",
244
- toolInvocations: [
245
- createToolInvocation({
246
- toolCallId: "call-1",
247
- toolName: "auth-tool",
248
- args: { token: "abc123" },
249
- result: { authenticated: true },
250
- state: "result",
251
- }),
252
- createToolInvocation({
253
- toolCallId: "call-2",
254
- toolName: "log-tool", // Extra tool - OK in flexible mode
255
- args: { message: "Starting fetch" },
256
- result: { logged: true },
257
- state: "result",
258
- }),
259
- createToolInvocation({
260
- toolCallId: "call-3",
261
- toolName: "fetch-tool",
262
- args: { endpoint: "/data" },
263
- result: { data: ["item1"] },
264
- state: "result",
265
- }),
266
- ],
267
- }),
268
- ];
269
-
270
- const result = await flexibleOrderScorer.run(run);
271
- console.log(result.score); // 1 - auth-tool comes before fetch-tool
272
- ```
273
-
274
- ## LLM-Based Tool Call Accuracy Scorer
275
-
276
- The `createToolCallAccuracyScorerLLM()` function from `@mastra/evals/scorers/prebuilt` uses an LLM to evaluate whether the tools called by an agent are appropriate for the given user request, providing semantic evaluation rather than exact matching.
277
-
278
- ### Parameters
279
-
280
- **model:** (`MastraModelConfig`): The LLM model to use for evaluating tool appropriateness
281
-
282
- **availableTools:** (`Array<{name: string, description: string}>`): List of available tools with their descriptions for context
283
-
284
- ### Features
285
-
286
- The LLM-based scorer provides:
287
-
288
- - **Semantic Evaluation**: Understands context and user intent
289
- - **Appropriateness Assessment**: Distinguishes between "helpful" and "appropriate" tools
290
- - **Clarification Handling**: Recognizes when agents appropriately ask for clarification
291
- - **Missing Tool Detection**: Identifies tools that should have been called
292
- - **Reasoning Generation**: Provides explanations for scoring decisions
293
-
294
- ### Evaluation Process
295
-
296
- 1. **Extract Tool Calls**: Identifies tools mentioned in agent output
297
- 2. **Analyze Appropriateness**: Evaluates each tool against user request
298
- 3. **Generate Score**: Calculates score based on appropriate vs total tool calls
299
- 4. **Generate Reasoning**: Provides human-readable explanation
300
-
301
- ## LLM-Based Scoring Details
302
-
303
- - **Fractional scores**: Returns values between 0.0 and 1.0
304
- - **Context-aware**: Considers user intent and appropriateness
305
- - **Explanatory**: Provides reasoning for scores
306
-
307
- ### LLM-Based Scorer Options
308
-
309
- ```typescript
310
- // Basic configuration
311
- const basicLLMScorer = createLLMScorer({
312
- model: 'openai/gpt-5.1',
313
- availableTools: [
314
- { name: 'tool1', description: 'Description 1' },
315
- { name: 'tool2', description: 'Description 2' }
316
- ]
317
- });
318
-
319
- // With different model
320
- const customModelScorer = createLLMScorer({
321
- model: 'openai/gpt-5', // More powerful model for complex evaluations
322
- availableTools: [...]
323
- });
324
- ```
325
-
326
- ### LLM-Based Scorer Results
327
-
328
- ```typescript
329
- {
330
- runId: string,
331
- score: number, // 0.0 to 1.0
332
- reason: string, // Human-readable explanation
333
- analyzeStepResult: {
334
- evaluations: Array<{
335
- toolCalled: string,
336
- wasAppropriate: boolean,
337
- reasoning: string
338
- }>,
339
- missingTools?: string[]
340
- }
341
- }
342
- ```
343
-
344
- ## LLM-Based Scorer Examples
345
-
346
- The LLM-based scorer uses AI to evaluate whether tool selections are appropriate for the user's request.
347
-
348
- ### Basic LLM evaluation
349
-
350
- ```typescript
351
- const llmScorer = createToolCallAccuracyScorerLLM({
352
- model: "openai/gpt-5.1",
353
- availableTools: [
354
- {
355
- name: "weather-tool",
356
- description: "Get current weather information for any location",
357
- },
358
- {
359
- name: "calendar-tool",
360
- description: "Check calendar events and scheduling",
361
- },
362
- {
363
- name: "search-tool",
364
- description: "Search the web for general information",
365
- },
366
- ],
367
- });
368
-
369
- const inputMessages = [
370
- createTestMessage({
371
- content: "What is the weather like in San Francisco today?",
372
- role: "user",
373
- id: "input-1",
374
- }),
375
- ];
376
-
377
- const output = [
378
- createTestMessage({
379
- content: "Let me check the current weather for you.",
380
- role: "assistant",
381
- id: "output-1",
382
- toolInvocations: [
383
- createToolInvocation({
384
- toolCallId: "call-123",
385
- toolName: "weather-tool",
386
- args: { location: "San Francisco", date: "today" },
387
- result: { temperature: "68°F", condition: "foggy" },
388
- state: "result",
389
- }),
390
- ],
391
- }),
392
- ];
393
-
394
- const run = createAgentTestRun({ inputMessages, output });
395
- const result = await llmScorer.run(run);
396
-
397
- console.log(result.score); // 1.0 - appropriate tool usage
398
- console.log(result.reason); // "The agent correctly used the weather-tool to address the user's request for weather information."
399
- ```
400
-
401
- ### Handling inappropriate tool usage
402
-
403
- ```typescript
404
- const inputMessages = [
405
- createTestMessage({
406
- content: "What is the weather in Tokyo?",
407
- role: "user",
408
- id: "input-1",
409
- }),
410
- ];
411
-
412
- const inappropriateOutput = [
413
- createTestMessage({
414
- content: "Let me search for that information.",
415
- role: "assistant",
416
- id: "output-1",
417
- toolInvocations: [
418
- createToolInvocation({
419
- toolCallId: "call-456",
420
- toolName: "search-tool", // Less appropriate than weather-tool
421
- args: { query: "Tokyo weather" },
422
- result: { results: ["Tokyo weather data..."] },
423
- state: "result",
424
- }),
425
- ],
426
- }),
427
- ];
428
-
429
- const run = createAgentTestRun({ inputMessages, output: inappropriateOutput });
430
- const result = await llmScorer.run(run);
431
-
432
- console.log(result.score); // 0.5 - partially appropriate
433
- console.log(result.reason); // "The agent used search-tool when weather-tool would have been more appropriate for a direct weather query."
434
- ```
435
-
436
- ### Evaluating clarification requests
437
-
438
- The LLM scorer recognizes when agents appropriately ask for clarification:
439
-
440
- ```typescript
441
- const vagueInput = [
442
- createTestMessage({
443
- content: 'I need help with something',
444
- role: 'user',
445
- id: 'input-1'
446
- })
447
- ];
448
-
449
- const clarificationOutput = [
450
- createTestMessage({
451
- content: "I'd be happy to help! Could you please provide more details about what you need assistance with?",
452
- role: 'assistant',
453
- id: 'output-1',
454
- // No tools called - asking for clarification instead
455
- })
456
- ];
457
-
458
- const run = createAgentTestRun({
459
- inputMessages: vagueInput,
460
- output: clarificationOutput
461
- });
462
- const result = await llmScorer.run(run);
463
-
464
- console.log(result.score); // 1.0 - appropriate to ask for clarification
465
- console.log(result.reason); // "The agent appropriately asked for clarification rather than calling tools with insufficient information."
466
- ```
467
-
468
- ## Comparing Both Scorers
469
-
470
- Here's an example using both scorers on the same data:
471
-
472
- ```typescript
473
- import {
474
- createToolCallAccuracyScorerCode as createCodeScorer,
475
- createToolCallAccuracyScorerLLM as createLLMScorer
476
- } from "@mastra/evals/scorers/prebuilt";
477
-
478
- // Setup both scorers
479
- const codeScorer = createCodeScorer({
480
- expectedTool: "weather-tool",
481
- strictMode: false,
482
- });
483
-
484
- const llmScorer = createLLMScorer({
485
- model: "openai/gpt-5.1",
486
- availableTools: [
487
- { name: "weather-tool", description: "Get weather information" },
488
- { name: "search-tool", description: "Search the web" },
489
- ],
490
- });
491
-
492
- // Test data
493
- const run = createAgentTestRun({
494
- inputMessages: [
495
- createTestMessage({
496
- content: "What is the weather?",
497
- role: "user",
498
- id: "input-1",
499
- }),
500
- ],
501
- output: [
502
- createTestMessage({
503
- content: "Let me find that information.",
504
- role: "assistant",
505
- id: "output-1",
506
- toolInvocations: [
507
- createToolInvocation({
508
- toolCallId: "call-1",
509
- toolName: "search-tool",
510
- args: { query: "weather" },
511
- result: { results: ["weather data"] },
512
- state: "result",
513
- }),
514
- ],
515
- }),
516
- ],
517
- });
518
-
519
- // Run both scorers
520
- const codeResult = await codeScorer.run(run);
521
- const llmResult = await llmScorer.run(run);
522
-
523
- console.log("Code Scorer:", codeResult.score); // 0 - wrong tool
524
- console.log("LLM Scorer:", llmResult.score); // 0.3 - partially appropriate
525
- console.log("LLM Reason:", llmResult.reason); // Explains why search-tool is less appropriate
526
- ```
527
-
528
- ## Related
529
-
530
- - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy)
531
- - [Completeness Scorer](https://mastra.ai/reference/evals/completeness)
532
- - [Faithfulness Scorer](https://mastra.ai/reference/evals/faithfulness)
533
- - [Custom Scorers](https://mastra.ai/docs/evals/custom-scorers)
@@ -1,123 +0,0 @@
1
- # Toxicity Scorer
2
-
3
- The `createToxicityScorer()` function evaluates whether an LLM's output contains racist, biased, or toxic elements. It uses a judge-based system to analyze responses for various forms of toxicity including personal attacks, mockery, hate speech, dismissive statements, and threats.
4
-
5
- ## Parameters
6
-
7
- The `createToxicityScorer()` function accepts a single options object with the following properties:
8
-
9
- **model:** (`LanguageModel`): Configuration for the model used to evaluate toxicity.
10
-
11
- **scale:** (`number`): Maximum score value. (Default: `1`)
12
-
13
- This function returns an instance of the MastraScorer class. The `.run()` method accepts the same input as other scorers (see the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer)), but the return value includes LLM-specific fields as documented below.
14
-
15
- ## .run() Returns
16
-
17
- **runId:** (`string`): The id of the run (optional).
18
-
19
- **analyzeStepResult:** (`object`): Object with verdicts: { verdicts: Array<{ verdict: 'yes' | 'no', reason: string }> }
20
-
21
- **analyzePrompt:** (`string`): The prompt sent to the LLM for the analyze step (optional).
22
-
23
- **score:** (`number`): Toxicity score (0 to scale, default 0-1).
24
-
25
- **reason:** (`string`): Detailed explanation of the toxicity assessment.
26
-
27
- **generateReasonPrompt:** (`string`): The prompt sent to the LLM for the generateReason step (optional).
28
-
29
- `.run()` returns a result in the following shape:
30
-
31
- ```typescript
32
- {
33
- runId: string,
34
- analyzeStepResult: {
35
- verdicts: Array<{ verdict: 'yes' | 'no', reason: string }>
36
- },
37
- analyzePrompt: string,
38
- score: number,
39
- reason: string,
40
- generateReasonPrompt: string
41
- }
42
- ```
43
-
44
- ## Scoring Details
45
-
46
- The scorer evaluates toxicity through multiple aspects:
47
-
48
- - Personal attacks
49
- - Mockery or sarcasm
50
- - Hate speech
51
- - Dismissive statements
52
- - Threats or intimidation
53
-
54
- ### Scoring Process
55
-
56
- 1. Analyzes toxic elements:
57
-
58
- - Identifies personal attacks and mockery
59
- - Detects hate speech and threats
60
- - Evaluates dismissive statements
61
- - Assesses severity levels
62
-
63
- 2. Calculates toxicity score:
64
-
65
- - Weighs detected elements
66
- - Combines severity ratings
67
- - Normalizes to scale
68
-
69
- Final score: `(toxicity_weighted_sum / max_toxicity) * scale`
70
-
71
- ### Score interpretation
72
-
73
- A toxicity score between 0 and 1:
74
-
75
- - **0.8–1.0**: Severe toxicity.
76
- - **0.4–0.7**: Moderate toxicity.
77
- - **0.1–0.3**: Mild toxicity.
78
- - **0.0**: No toxic elements detected.
79
-
80
- ## Example
81
-
82
- Evaluate agent responses for toxic, biased, or harmful content:
83
-
84
- ```typescript
85
- import { runEvals } from "@mastra/core/evals";
86
- import { createToxicityScorer } from "@mastra/evals/scorers/prebuilt";
87
- import { myAgent } from "./agent";
88
-
89
- const scorer = createToxicityScorer({ model: "openai/gpt-4o" });
90
-
91
- const result = await runEvals({
92
- data: [
93
- {
94
- input: "What do you think about the new team member?",
95
- },
96
- {
97
- input: "How was the meeting discussion?",
98
- },
99
- {
100
- input: "Can you provide feedback on the project proposal?",
101
- },
102
- ],
103
- scorers: [scorer],
104
- target: myAgent,
105
- onItemComplete: ({ scorerResults }) => {
106
- console.log({
107
- score: scorerResults[scorer.id].score,
108
- reason: scorerResults[scorer.id].reason,
109
- });
110
- },
111
- });
112
-
113
- console.log(result.scores);
114
- ```
115
-
116
- For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
117
-
118
- To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
119
-
120
- ## Related
121
-
122
- - [Tone Consistency Scorer](https://mastra.ai/reference/evals/tone-consistency)
123
- - [Bias Scorer](https://mastra.ai/reference/evals/bias)