@mastra/mcp-docs-server 1.1.4 → 1.1.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (547) hide show
  1. package/CHANGELOG.md +14 -0
  2. package/package.json +5 -5
  3. package/.docs/docs/agents/adding-voice.md +0 -353
  4. package/.docs/docs/agents/agent-approval.md +0 -377
  5. package/.docs/docs/agents/agent-memory.md +0 -212
  6. package/.docs/docs/agents/guardrails.md +0 -382
  7. package/.docs/docs/agents/network-approval.md +0 -275
  8. package/.docs/docs/agents/networks.md +0 -290
  9. package/.docs/docs/agents/overview.md +0 -309
  10. package/.docs/docs/agents/processors.md +0 -632
  11. package/.docs/docs/agents/structured-output.md +0 -271
  12. package/.docs/docs/agents/using-tools.md +0 -214
  13. package/.docs/docs/build-with-ai/mcp-docs-server.md +0 -241
  14. package/.docs/docs/build-with-ai/skills.md +0 -35
  15. package/.docs/docs/community/contributing-templates.md +0 -3
  16. package/.docs/docs/community/discord.md +0 -9
  17. package/.docs/docs/community/licensing.md +0 -66
  18. package/.docs/docs/deployment/cloud-providers.md +0 -15
  19. package/.docs/docs/deployment/mastra-server.md +0 -122
  20. package/.docs/docs/deployment/monorepo.md +0 -142
  21. package/.docs/docs/deployment/overview.md +0 -62
  22. package/.docs/docs/deployment/studio.md +0 -234
  23. package/.docs/docs/deployment/web-framework.md +0 -52
  24. package/.docs/docs/deployment/workflow-runners.md +0 -9
  25. package/.docs/docs/evals/built-in-scorers.md +0 -47
  26. package/.docs/docs/evals/custom-scorers.md +0 -519
  27. package/.docs/docs/evals/overview.md +0 -146
  28. package/.docs/docs/evals/running-in-ci.md +0 -106
  29. package/.docs/docs/getting-started/build-with-ai.md +0 -68
  30. package/.docs/docs/getting-started/manual-install.md +0 -226
  31. package/.docs/docs/getting-started/project-structure.md +0 -60
  32. package/.docs/docs/getting-started/start.md +0 -28
  33. package/.docs/docs/getting-started/studio.md +0 -101
  34. package/.docs/docs/index.md +0 -43
  35. package/.docs/docs/mastra-cloud/deployment.md +0 -77
  36. package/.docs/docs/mastra-cloud/observability.md +0 -38
  37. package/.docs/docs/mastra-cloud/overview.md +0 -23
  38. package/.docs/docs/mastra-cloud/setup.md +0 -42
  39. package/.docs/docs/mastra-cloud/studio.md +0 -24
  40. package/.docs/docs/mcp/overview.md +0 -370
  41. package/.docs/docs/mcp/publishing-mcp-server.md +0 -95
  42. package/.docs/docs/memory/memory-processors.md +0 -316
  43. package/.docs/docs/memory/message-history.md +0 -260
  44. package/.docs/docs/memory/observational-memory.md +0 -246
  45. package/.docs/docs/memory/overview.md +0 -45
  46. package/.docs/docs/memory/semantic-recall.md +0 -272
  47. package/.docs/docs/memory/storage.md +0 -261
  48. package/.docs/docs/memory/working-memory.md +0 -400
  49. package/.docs/docs/observability/datasets/overview.md +0 -188
  50. package/.docs/docs/observability/datasets/running-experiments.md +0 -266
  51. package/.docs/docs/observability/logging.md +0 -99
  52. package/.docs/docs/observability/overview.md +0 -70
  53. package/.docs/docs/observability/tracing/bridges/otel.md +0 -209
  54. package/.docs/docs/observability/tracing/exporters/arize.md +0 -274
  55. package/.docs/docs/observability/tracing/exporters/braintrust.md +0 -111
  56. package/.docs/docs/observability/tracing/exporters/cloud.md +0 -129
  57. package/.docs/docs/observability/tracing/exporters/datadog.md +0 -187
  58. package/.docs/docs/observability/tracing/exporters/default.md +0 -211
  59. package/.docs/docs/observability/tracing/exporters/laminar.md +0 -100
  60. package/.docs/docs/observability/tracing/exporters/langfuse.md +0 -217
  61. package/.docs/docs/observability/tracing/exporters/langsmith.md +0 -202
  62. package/.docs/docs/observability/tracing/exporters/otel.md +0 -479
  63. package/.docs/docs/observability/tracing/exporters/posthog.md +0 -148
  64. package/.docs/docs/observability/tracing/exporters/sentry.md +0 -208
  65. package/.docs/docs/observability/tracing/overview.md +0 -1114
  66. package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +0 -303
  67. package/.docs/docs/rag/chunking-and-embedding.md +0 -183
  68. package/.docs/docs/rag/graph-rag.md +0 -215
  69. package/.docs/docs/rag/overview.md +0 -72
  70. package/.docs/docs/rag/retrieval.md +0 -521
  71. package/.docs/docs/rag/vector-databases.md +0 -648
  72. package/.docs/docs/server/auth/auth0.md +0 -222
  73. package/.docs/docs/server/auth/better-auth.md +0 -203
  74. package/.docs/docs/server/auth/clerk.md +0 -132
  75. package/.docs/docs/server/auth/composite-auth.md +0 -234
  76. package/.docs/docs/server/auth/custom-auth-provider.md +0 -513
  77. package/.docs/docs/server/auth/firebase.md +0 -272
  78. package/.docs/docs/server/auth/jwt.md +0 -110
  79. package/.docs/docs/server/auth/simple-auth.md +0 -178
  80. package/.docs/docs/server/auth/supabase.md +0 -117
  81. package/.docs/docs/server/auth/workos.md +0 -190
  82. package/.docs/docs/server/auth.md +0 -38
  83. package/.docs/docs/server/custom-adapters.md +0 -374
  84. package/.docs/docs/server/custom-api-routes.md +0 -267
  85. package/.docs/docs/server/mastra-client.md +0 -243
  86. package/.docs/docs/server/mastra-server.md +0 -71
  87. package/.docs/docs/server/middleware.md +0 -228
  88. package/.docs/docs/server/request-context.md +0 -478
  89. package/.docs/docs/server/server-adapters.md +0 -547
  90. package/.docs/docs/streaming/events.md +0 -247
  91. package/.docs/docs/streaming/overview.md +0 -181
  92. package/.docs/docs/streaming/tool-streaming.md +0 -178
  93. package/.docs/docs/streaming/workflow-streaming.md +0 -109
  94. package/.docs/docs/voice/overview.md +0 -979
  95. package/.docs/docs/voice/speech-to-speech.md +0 -103
  96. package/.docs/docs/voice/speech-to-text.md +0 -80
  97. package/.docs/docs/voice/text-to-speech.md +0 -84
  98. package/.docs/docs/workflows/agents-and-tools.md +0 -170
  99. package/.docs/docs/workflows/control-flow.md +0 -823
  100. package/.docs/docs/workflows/error-handling.md +0 -360
  101. package/.docs/docs/workflows/human-in-the-loop.md +0 -213
  102. package/.docs/docs/workflows/overview.md +0 -372
  103. package/.docs/docs/workflows/snapshots.md +0 -238
  104. package/.docs/docs/workflows/suspend-and-resume.md +0 -205
  105. package/.docs/docs/workflows/time-travel.md +0 -309
  106. package/.docs/docs/workflows/workflow-state.md +0 -181
  107. package/.docs/docs/workspace/filesystem.md +0 -162
  108. package/.docs/docs/workspace/overview.md +0 -239
  109. package/.docs/docs/workspace/sandbox.md +0 -63
  110. package/.docs/docs/workspace/search.md +0 -219
  111. package/.docs/docs/workspace/skills.md +0 -126
  112. package/.docs/guides/agent-frameworks/ai-sdk.md +0 -140
  113. package/.docs/guides/build-your-ui/ai-sdk-ui.md +0 -1463
  114. package/.docs/guides/build-your-ui/assistant-ui.md +0 -156
  115. package/.docs/guides/build-your-ui/copilotkit.md +0 -292
  116. package/.docs/guides/deployment/amazon-ec2.md +0 -130
  117. package/.docs/guides/deployment/aws-lambda.md +0 -248
  118. package/.docs/guides/deployment/azure-app-services.md +0 -114
  119. package/.docs/guides/deployment/cloudflare.md +0 -99
  120. package/.docs/guides/deployment/digital-ocean.md +0 -168
  121. package/.docs/guides/deployment/inngest.md +0 -685
  122. package/.docs/guides/deployment/netlify.md +0 -77
  123. package/.docs/guides/deployment/vercel.md +0 -101
  124. package/.docs/guides/getting-started/astro.md +0 -408
  125. package/.docs/guides/getting-started/electron.md +0 -504
  126. package/.docs/guides/getting-started/express.md +0 -251
  127. package/.docs/guides/getting-started/hono.md +0 -191
  128. package/.docs/guides/getting-started/next-js.md +0 -355
  129. package/.docs/guides/getting-started/nuxt.md +0 -476
  130. package/.docs/guides/getting-started/quickstart.md +0 -67
  131. package/.docs/guides/getting-started/sveltekit.md +0 -300
  132. package/.docs/guides/getting-started/vite-react.md +0 -439
  133. package/.docs/guides/guide/ai-recruiter.md +0 -227
  134. package/.docs/guides/guide/chef-michel.md +0 -215
  135. package/.docs/guides/guide/code-review-bot.md +0 -221
  136. package/.docs/guides/guide/dev-assistant.md +0 -304
  137. package/.docs/guides/guide/docs-manager.md +0 -238
  138. package/.docs/guides/guide/github-actions-pr-description.md +0 -236
  139. package/.docs/guides/guide/notes-mcp-server.md +0 -425
  140. package/.docs/guides/guide/research-assistant.md +0 -349
  141. package/.docs/guides/guide/stock-agent.md +0 -134
  142. package/.docs/guides/guide/web-search.md +0 -326
  143. package/.docs/guides/guide/whatsapp-chat-bot.md +0 -416
  144. package/.docs/guides/index.md +0 -3
  145. package/.docs/guides/migrations/agentnetwork.md +0 -101
  146. package/.docs/guides/migrations/ai-sdk-v4-to-v5.md +0 -112
  147. package/.docs/guides/migrations/upgrade-to-v1/agent.md +0 -404
  148. package/.docs/guides/migrations/upgrade-to-v1/cli.md +0 -57
  149. package/.docs/guides/migrations/upgrade-to-v1/client.md +0 -337
  150. package/.docs/guides/migrations/upgrade-to-v1/deployment.md +0 -37
  151. package/.docs/guides/migrations/upgrade-to-v1/evals.md +0 -239
  152. package/.docs/guides/migrations/upgrade-to-v1/mastra.md +0 -143
  153. package/.docs/guides/migrations/upgrade-to-v1/mcp.md +0 -97
  154. package/.docs/guides/migrations/upgrade-to-v1/memory.md +0 -285
  155. package/.docs/guides/migrations/upgrade-to-v1/overview.md +0 -119
  156. package/.docs/guides/migrations/upgrade-to-v1/processors.md +0 -68
  157. package/.docs/guides/migrations/upgrade-to-v1/rag.md +0 -42
  158. package/.docs/guides/migrations/upgrade-to-v1/storage.md +0 -553
  159. package/.docs/guides/migrations/upgrade-to-v1/tools.md +0 -180
  160. package/.docs/guides/migrations/upgrade-to-v1/tracing.md +0 -417
  161. package/.docs/guides/migrations/upgrade-to-v1/vectors.md +0 -87
  162. package/.docs/guides/migrations/upgrade-to-v1/voice.md +0 -30
  163. package/.docs/guides/migrations/upgrade-to-v1/workflows.md +0 -341
  164. package/.docs/guides/migrations/vnext-to-standard-apis.md +0 -364
  165. package/.docs/models/embeddings.md +0 -161
  166. package/.docs/models/gateways/azure-openai.md +0 -128
  167. package/.docs/models/gateways/custom-gateways.md +0 -545
  168. package/.docs/models/gateways/netlify.md +0 -88
  169. package/.docs/models/gateways/openrouter.md +0 -219
  170. package/.docs/models/gateways/vercel.md +0 -225
  171. package/.docs/models/gateways.md +0 -14
  172. package/.docs/models/index.md +0 -286
  173. package/.docs/models/providers/302ai.md +0 -134
  174. package/.docs/models/providers/abacus.md +0 -125
  175. package/.docs/models/providers/agentrouter.md +0 -90
  176. package/.docs/models/providers/aihubmix.md +0 -107
  177. package/.docs/models/providers/alibaba-cn.md +0 -135
  178. package/.docs/models/providers/alibaba.md +0 -111
  179. package/.docs/models/providers/amazon-bedrock.md +0 -33
  180. package/.docs/models/providers/anthropic.md +0 -153
  181. package/.docs/models/providers/azure.md +0 -33
  182. package/.docs/models/providers/bailing.md +0 -72
  183. package/.docs/models/providers/baseten.md +0 -77
  184. package/.docs/models/providers/berget.md +0 -78
  185. package/.docs/models/providers/cerebras.md +0 -101
  186. package/.docs/models/providers/chutes.md +0 -136
  187. package/.docs/models/providers/cloudflare-ai-gateway.md +0 -33
  188. package/.docs/models/providers/cloudflare-workers-ai.md +0 -109
  189. package/.docs/models/providers/cohere.md +0 -33
  190. package/.docs/models/providers/cortecs.md +0 -91
  191. package/.docs/models/providers/deepinfra.md +0 -112
  192. package/.docs/models/providers/deepseek.md +0 -88
  193. package/.docs/models/providers/fastrouter.md +0 -84
  194. package/.docs/models/providers/fireworks-ai.md +0 -89
  195. package/.docs/models/providers/firmware.md +0 -85
  196. package/.docs/models/providers/friendli.md +0 -78
  197. package/.docs/models/providers/github-models.md +0 -125
  198. package/.docs/models/providers/google-vertex.md +0 -33
  199. package/.docs/models/providers/google.md +0 -159
  200. package/.docs/models/providers/groq.md +0 -107
  201. package/.docs/models/providers/helicone.md +0 -161
  202. package/.docs/models/providers/huggingface.md +0 -90
  203. package/.docs/models/providers/iflowcn.md +0 -84
  204. package/.docs/models/providers/inception.md +0 -72
  205. package/.docs/models/providers/inference.md +0 -79
  206. package/.docs/models/providers/io-intelligence.md +0 -87
  207. package/.docs/models/providers/io-net.md +0 -87
  208. package/.docs/models/providers/jiekou.md +0 -131
  209. package/.docs/models/providers/kilo.md +0 -333
  210. package/.docs/models/providers/kimi-for-coding.md +0 -100
  211. package/.docs/models/providers/kuae-cloud-coding-plan.md +0 -71
  212. package/.docs/models/providers/llama.md +0 -77
  213. package/.docs/models/providers/lmstudio.md +0 -73
  214. package/.docs/models/providers/lucidquery.md +0 -72
  215. package/.docs/models/providers/minimax-cn-coding-plan.md +0 -102
  216. package/.docs/models/providers/minimax-cn.md +0 -102
  217. package/.docs/models/providers/minimax-coding-plan.md +0 -102
  218. package/.docs/models/providers/minimax.md +0 -104
  219. package/.docs/models/providers/mistral.md +0 -124
  220. package/.docs/models/providers/moark.md +0 -72
  221. package/.docs/models/providers/modelscope.md +0 -77
  222. package/.docs/models/providers/moonshotai-cn.md +0 -76
  223. package/.docs/models/providers/moonshotai.md +0 -76
  224. package/.docs/models/providers/morph.md +0 -73
  225. package/.docs/models/providers/nano-gpt.md +0 -103
  226. package/.docs/models/providers/nebius.md +0 -116
  227. package/.docs/models/providers/nova.md +0 -72
  228. package/.docs/models/providers/novita-ai.md +0 -154
  229. package/.docs/models/providers/nvidia.md +0 -141
  230. package/.docs/models/providers/ollama-cloud.md +0 -103
  231. package/.docs/models/providers/ollama.md +0 -33
  232. package/.docs/models/providers/openai.md +0 -193
  233. package/.docs/models/providers/opencode.md +0 -100
  234. package/.docs/models/providers/ovhcloud.md +0 -83
  235. package/.docs/models/providers/perplexity.md +0 -100
  236. package/.docs/models/providers/poe.md +0 -183
  237. package/.docs/models/providers/privatemode-ai.md +0 -75
  238. package/.docs/models/providers/requesty.md +0 -90
  239. package/.docs/models/providers/scaleway.md +0 -84
  240. package/.docs/models/providers/siliconflow-cn.md +0 -138
  241. package/.docs/models/providers/siliconflow.md +0 -140
  242. package/.docs/models/providers/stackit.md +0 -78
  243. package/.docs/models/providers/stepfun.md +0 -73
  244. package/.docs/models/providers/submodel.md +0 -79
  245. package/.docs/models/providers/synthetic.md +0 -96
  246. package/.docs/models/providers/togetherai.md +0 -115
  247. package/.docs/models/providers/upstage.md +0 -73
  248. package/.docs/models/providers/venice.md +0 -95
  249. package/.docs/models/providers/vivgrid.md +0 -106
  250. package/.docs/models/providers/vultr.md +0 -75
  251. package/.docs/models/providers/wandb.md +0 -80
  252. package/.docs/models/providers/xai.md +0 -141
  253. package/.docs/models/providers/xiaomi.md +0 -71
  254. package/.docs/models/providers/zai-coding-plan.md +0 -80
  255. package/.docs/models/providers/zai.md +0 -79
  256. package/.docs/models/providers/zenmux.md +0 -161
  257. package/.docs/models/providers/zhipuai-coding-plan.md +0 -79
  258. package/.docs/models/providers/zhipuai.md +0 -79
  259. package/.docs/models/providers.md +0 -81
  260. package/.docs/reference/agents/agent.md +0 -142
  261. package/.docs/reference/agents/generate.md +0 -174
  262. package/.docs/reference/agents/generateLegacy.md +0 -176
  263. package/.docs/reference/agents/getDefaultGenerateOptions.md +0 -36
  264. package/.docs/reference/agents/getDefaultOptions.md +0 -34
  265. package/.docs/reference/agents/getDefaultStreamOptions.md +0 -36
  266. package/.docs/reference/agents/getDescription.md +0 -21
  267. package/.docs/reference/agents/getInstructions.md +0 -34
  268. package/.docs/reference/agents/getLLM.md +0 -37
  269. package/.docs/reference/agents/getMemory.md +0 -34
  270. package/.docs/reference/agents/getModel.md +0 -34
  271. package/.docs/reference/agents/getTools.md +0 -29
  272. package/.docs/reference/agents/getVoice.md +0 -34
  273. package/.docs/reference/agents/listAgents.md +0 -35
  274. package/.docs/reference/agents/listScorers.md +0 -34
  275. package/.docs/reference/agents/listTools.md +0 -34
  276. package/.docs/reference/agents/listWorkflows.md +0 -34
  277. package/.docs/reference/agents/network.md +0 -134
  278. package/.docs/reference/ai-sdk/chat-route.md +0 -82
  279. package/.docs/reference/ai-sdk/handle-chat-stream.md +0 -53
  280. package/.docs/reference/ai-sdk/handle-network-stream.md +0 -37
  281. package/.docs/reference/ai-sdk/handle-workflow-stream.md +0 -55
  282. package/.docs/reference/ai-sdk/network-route.md +0 -74
  283. package/.docs/reference/ai-sdk/to-ai-sdk-stream.md +0 -232
  284. package/.docs/reference/ai-sdk/to-ai-sdk-v4-messages.md +0 -79
  285. package/.docs/reference/ai-sdk/to-ai-sdk-v5-messages.md +0 -73
  286. package/.docs/reference/ai-sdk/with-mastra.md +0 -59
  287. package/.docs/reference/ai-sdk/workflow-route.md +0 -79
  288. package/.docs/reference/auth/auth0.md +0 -73
  289. package/.docs/reference/auth/better-auth.md +0 -71
  290. package/.docs/reference/auth/clerk.md +0 -36
  291. package/.docs/reference/auth/firebase.md +0 -80
  292. package/.docs/reference/auth/jwt.md +0 -26
  293. package/.docs/reference/auth/supabase.md +0 -33
  294. package/.docs/reference/auth/workos.md +0 -84
  295. package/.docs/reference/cli/create-mastra.md +0 -137
  296. package/.docs/reference/cli/mastra.md +0 -336
  297. package/.docs/reference/client-js/agents.md +0 -438
  298. package/.docs/reference/client-js/error-handling.md +0 -16
  299. package/.docs/reference/client-js/logs.md +0 -24
  300. package/.docs/reference/client-js/mastra-client.md +0 -63
  301. package/.docs/reference/client-js/memory.md +0 -225
  302. package/.docs/reference/client-js/observability.md +0 -72
  303. package/.docs/reference/client-js/telemetry.md +0 -20
  304. package/.docs/reference/client-js/tools.md +0 -44
  305. package/.docs/reference/client-js/vectors.md +0 -79
  306. package/.docs/reference/client-js/workflows.md +0 -199
  307. package/.docs/reference/configuration.md +0 -749
  308. package/.docs/reference/core/addGateway.md +0 -42
  309. package/.docs/reference/core/getAgent.md +0 -21
  310. package/.docs/reference/core/getAgentById.md +0 -21
  311. package/.docs/reference/core/getDeployer.md +0 -22
  312. package/.docs/reference/core/getGateway.md +0 -38
  313. package/.docs/reference/core/getGatewayById.md +0 -41
  314. package/.docs/reference/core/getLogger.md +0 -22
  315. package/.docs/reference/core/getMCPServer.md +0 -45
  316. package/.docs/reference/core/getMCPServerById.md +0 -53
  317. package/.docs/reference/core/getMemory.md +0 -50
  318. package/.docs/reference/core/getScorer.md +0 -54
  319. package/.docs/reference/core/getScorerById.md +0 -54
  320. package/.docs/reference/core/getServer.md +0 -22
  321. package/.docs/reference/core/getStorage.md +0 -22
  322. package/.docs/reference/core/getStoredAgentById.md +0 -89
  323. package/.docs/reference/core/getTelemetry.md +0 -22
  324. package/.docs/reference/core/getVector.md +0 -22
  325. package/.docs/reference/core/getWorkflow.md +0 -40
  326. package/.docs/reference/core/listAgents.md +0 -21
  327. package/.docs/reference/core/listGateways.md +0 -40
  328. package/.docs/reference/core/listLogs.md +0 -38
  329. package/.docs/reference/core/listLogsByRunId.md +0 -36
  330. package/.docs/reference/core/listMCPServers.md +0 -51
  331. package/.docs/reference/core/listMemory.md +0 -56
  332. package/.docs/reference/core/listScorers.md +0 -29
  333. package/.docs/reference/core/listStoredAgents.md +0 -93
  334. package/.docs/reference/core/listVectors.md +0 -22
  335. package/.docs/reference/core/listWorkflows.md +0 -21
  336. package/.docs/reference/core/mastra-class.md +0 -66
  337. package/.docs/reference/core/mastra-model-gateway.md +0 -153
  338. package/.docs/reference/core/setLogger.md +0 -26
  339. package/.docs/reference/core/setStorage.md +0 -27
  340. package/.docs/reference/datasets/addItem.md +0 -35
  341. package/.docs/reference/datasets/addItems.md +0 -33
  342. package/.docs/reference/datasets/compareExperiments.md +0 -48
  343. package/.docs/reference/datasets/create.md +0 -49
  344. package/.docs/reference/datasets/dataset.md +0 -78
  345. package/.docs/reference/datasets/datasets-manager.md +0 -84
  346. package/.docs/reference/datasets/delete.md +0 -23
  347. package/.docs/reference/datasets/deleteExperiment.md +0 -25
  348. package/.docs/reference/datasets/deleteItem.md +0 -25
  349. package/.docs/reference/datasets/deleteItems.md +0 -27
  350. package/.docs/reference/datasets/get.md +0 -29
  351. package/.docs/reference/datasets/getDetails.md +0 -45
  352. package/.docs/reference/datasets/getExperiment.md +0 -28
  353. package/.docs/reference/datasets/getItem.md +0 -31
  354. package/.docs/reference/datasets/getItemHistory.md +0 -29
  355. package/.docs/reference/datasets/list.md +0 -29
  356. package/.docs/reference/datasets/listExperimentResults.md +0 -37
  357. package/.docs/reference/datasets/listExperiments.md +0 -31
  358. package/.docs/reference/datasets/listItems.md +0 -44
  359. package/.docs/reference/datasets/listVersions.md +0 -31
  360. package/.docs/reference/datasets/startExperiment.md +0 -60
  361. package/.docs/reference/datasets/startExperimentAsync.md +0 -41
  362. package/.docs/reference/datasets/update.md +0 -46
  363. package/.docs/reference/datasets/updateItem.md +0 -36
  364. package/.docs/reference/deployer/cloudflare.md +0 -79
  365. package/.docs/reference/deployer/netlify.md +0 -82
  366. package/.docs/reference/deployer/vercel.md +0 -91
  367. package/.docs/reference/deployer.md +0 -100
  368. package/.docs/reference/evals/answer-relevancy.md +0 -105
  369. package/.docs/reference/evals/answer-similarity.md +0 -99
  370. package/.docs/reference/evals/bias.md +0 -120
  371. package/.docs/reference/evals/completeness.md +0 -137
  372. package/.docs/reference/evals/content-similarity.md +0 -101
  373. package/.docs/reference/evals/context-precision.md +0 -196
  374. package/.docs/reference/evals/context-relevance.md +0 -536
  375. package/.docs/reference/evals/create-scorer.md +0 -270
  376. package/.docs/reference/evals/faithfulness.md +0 -114
  377. package/.docs/reference/evals/hallucination.md +0 -220
  378. package/.docs/reference/evals/keyword-coverage.md +0 -128
  379. package/.docs/reference/evals/mastra-scorer.md +0 -123
  380. package/.docs/reference/evals/noise-sensitivity.md +0 -685
  381. package/.docs/reference/evals/prompt-alignment.md +0 -619
  382. package/.docs/reference/evals/run-evals.md +0 -138
  383. package/.docs/reference/evals/scorer-utils.md +0 -330
  384. package/.docs/reference/evals/textual-difference.md +0 -113
  385. package/.docs/reference/evals/tone-consistency.md +0 -119
  386. package/.docs/reference/evals/tool-call-accuracy.md +0 -533
  387. package/.docs/reference/evals/toxicity.md +0 -123
  388. package/.docs/reference/harness/harness-class.md +0 -645
  389. package/.docs/reference/index.md +0 -276
  390. package/.docs/reference/logging/pino-logger.md +0 -117
  391. package/.docs/reference/memory/clone-utilities.md +0 -199
  392. package/.docs/reference/memory/cloneThread.md +0 -130
  393. package/.docs/reference/memory/createThread.md +0 -68
  394. package/.docs/reference/memory/deleteMessages.md +0 -40
  395. package/.docs/reference/memory/getThreadById.md +0 -24
  396. package/.docs/reference/memory/listThreads.md +0 -145
  397. package/.docs/reference/memory/memory-class.md +0 -147
  398. package/.docs/reference/memory/observational-memory.md +0 -565
  399. package/.docs/reference/memory/recall.md +0 -91
  400. package/.docs/reference/observability/tracing/bridges/otel.md +0 -131
  401. package/.docs/reference/observability/tracing/configuration.md +0 -178
  402. package/.docs/reference/observability/tracing/exporters/arize.md +0 -141
  403. package/.docs/reference/observability/tracing/exporters/braintrust.md +0 -93
  404. package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +0 -163
  405. package/.docs/reference/observability/tracing/exporters/console-exporter.md +0 -138
  406. package/.docs/reference/observability/tracing/exporters/datadog.md +0 -116
  407. package/.docs/reference/observability/tracing/exporters/default-exporter.md +0 -174
  408. package/.docs/reference/observability/tracing/exporters/laminar.md +0 -78
  409. package/.docs/reference/observability/tracing/exporters/langfuse.md +0 -134
  410. package/.docs/reference/observability/tracing/exporters/langsmith.md +0 -110
  411. package/.docs/reference/observability/tracing/exporters/otel.md +0 -199
  412. package/.docs/reference/observability/tracing/exporters/posthog.md +0 -92
  413. package/.docs/reference/observability/tracing/exporters/sentry.md +0 -184
  414. package/.docs/reference/observability/tracing/instances.md +0 -109
  415. package/.docs/reference/observability/tracing/interfaces.md +0 -749
  416. package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +0 -144
  417. package/.docs/reference/observability/tracing/spans.md +0 -224
  418. package/.docs/reference/processors/batch-parts-processor.md +0 -61
  419. package/.docs/reference/processors/language-detector.md +0 -81
  420. package/.docs/reference/processors/message-history-processor.md +0 -85
  421. package/.docs/reference/processors/moderation-processor.md +0 -104
  422. package/.docs/reference/processors/pii-detector.md +0 -107
  423. package/.docs/reference/processors/processor-interface.md +0 -525
  424. package/.docs/reference/processors/prompt-injection-detector.md +0 -71
  425. package/.docs/reference/processors/semantic-recall-processor.md +0 -123
  426. package/.docs/reference/processors/system-prompt-scrubber.md +0 -80
  427. package/.docs/reference/processors/token-limiter-processor.md +0 -113
  428. package/.docs/reference/processors/tool-call-filter.md +0 -85
  429. package/.docs/reference/processors/tool-search-processor.md +0 -113
  430. package/.docs/reference/processors/unicode-normalizer.md +0 -62
  431. package/.docs/reference/processors/working-memory-processor.md +0 -154
  432. package/.docs/reference/rag/chunk.md +0 -221
  433. package/.docs/reference/rag/database-config.md +0 -264
  434. package/.docs/reference/rag/document.md +0 -114
  435. package/.docs/reference/rag/embeddings.md +0 -92
  436. package/.docs/reference/rag/extract-params.md +0 -168
  437. package/.docs/reference/rag/graph-rag.md +0 -111
  438. package/.docs/reference/rag/metadata-filters.md +0 -216
  439. package/.docs/reference/rag/rerank.md +0 -80
  440. package/.docs/reference/rag/rerankWithScorer.md +0 -80
  441. package/.docs/reference/server/create-route.md +0 -260
  442. package/.docs/reference/server/express-adapter.md +0 -176
  443. package/.docs/reference/server/fastify-adapter.md +0 -90
  444. package/.docs/reference/server/hono-adapter.md +0 -162
  445. package/.docs/reference/server/koa-adapter.md +0 -127
  446. package/.docs/reference/server/mastra-server.md +0 -298
  447. package/.docs/reference/server/register-api-route.md +0 -249
  448. package/.docs/reference/server/routes.md +0 -306
  449. package/.docs/reference/storage/cloudflare-d1.md +0 -218
  450. package/.docs/reference/storage/cloudflare.md +0 -88
  451. package/.docs/reference/storage/composite.md +0 -235
  452. package/.docs/reference/storage/convex.md +0 -161
  453. package/.docs/reference/storage/dynamodb.md +0 -282
  454. package/.docs/reference/storage/lance.md +0 -131
  455. package/.docs/reference/storage/libsql.md +0 -135
  456. package/.docs/reference/storage/mongodb.md +0 -262
  457. package/.docs/reference/storage/mssql.md +0 -155
  458. package/.docs/reference/storage/overview.md +0 -121
  459. package/.docs/reference/storage/postgresql.md +0 -529
  460. package/.docs/reference/storage/upstash.md +0 -160
  461. package/.docs/reference/streaming/ChunkType.md +0 -292
  462. package/.docs/reference/streaming/agents/MastraModelOutput.md +0 -182
  463. package/.docs/reference/streaming/agents/stream.md +0 -212
  464. package/.docs/reference/streaming/agents/streamLegacy.md +0 -142
  465. package/.docs/reference/streaming/workflows/observeStream.md +0 -42
  466. package/.docs/reference/streaming/workflows/resumeStream.md +0 -61
  467. package/.docs/reference/streaming/workflows/stream.md +0 -88
  468. package/.docs/reference/streaming/workflows/timeTravelStream.md +0 -142
  469. package/.docs/reference/templates/overview.md +0 -194
  470. package/.docs/reference/tools/create-tool.md +0 -237
  471. package/.docs/reference/tools/document-chunker-tool.md +0 -89
  472. package/.docs/reference/tools/graph-rag-tool.md +0 -185
  473. package/.docs/reference/tools/mcp-client.md +0 -962
  474. package/.docs/reference/tools/mcp-server.md +0 -1275
  475. package/.docs/reference/tools/vector-query-tool.md +0 -459
  476. package/.docs/reference/vectors/astra.md +0 -121
  477. package/.docs/reference/vectors/chroma.md +0 -267
  478. package/.docs/reference/vectors/convex.md +0 -303
  479. package/.docs/reference/vectors/couchbase.md +0 -226
  480. package/.docs/reference/vectors/duckdb.md +0 -318
  481. package/.docs/reference/vectors/elasticsearch.md +0 -189
  482. package/.docs/reference/vectors/lance.md +0 -220
  483. package/.docs/reference/vectors/libsql.md +0 -305
  484. package/.docs/reference/vectors/mongodb.md +0 -295
  485. package/.docs/reference/vectors/opensearch.md +0 -99
  486. package/.docs/reference/vectors/pg.md +0 -408
  487. package/.docs/reference/vectors/pinecone.md +0 -168
  488. package/.docs/reference/vectors/qdrant.md +0 -222
  489. package/.docs/reference/vectors/s3vectors.md +0 -277
  490. package/.docs/reference/vectors/turbopuffer.md +0 -157
  491. package/.docs/reference/vectors/upstash.md +0 -294
  492. package/.docs/reference/vectors/vectorize.md +0 -147
  493. package/.docs/reference/voice/azure.md +0 -148
  494. package/.docs/reference/voice/cloudflare.md +0 -83
  495. package/.docs/reference/voice/composite-voice.md +0 -121
  496. package/.docs/reference/voice/deepgram.md +0 -79
  497. package/.docs/reference/voice/elevenlabs.md +0 -98
  498. package/.docs/reference/voice/google-gemini-live.md +0 -378
  499. package/.docs/reference/voice/google.md +0 -228
  500. package/.docs/reference/voice/mastra-voice.md +0 -313
  501. package/.docs/reference/voice/murf.md +0 -122
  502. package/.docs/reference/voice/openai-realtime.md +0 -203
  503. package/.docs/reference/voice/openai.md +0 -88
  504. package/.docs/reference/voice/playai.md +0 -80
  505. package/.docs/reference/voice/sarvam.md +0 -126
  506. package/.docs/reference/voice/speechify.md +0 -75
  507. package/.docs/reference/voice/voice.addInstructions.md +0 -56
  508. package/.docs/reference/voice/voice.addTools.md +0 -67
  509. package/.docs/reference/voice/voice.answer.md +0 -54
  510. package/.docs/reference/voice/voice.close.md +0 -51
  511. package/.docs/reference/voice/voice.connect.md +0 -94
  512. package/.docs/reference/voice/voice.events.md +0 -37
  513. package/.docs/reference/voice/voice.getSpeakers.md +0 -129
  514. package/.docs/reference/voice/voice.listen.md +0 -164
  515. package/.docs/reference/voice/voice.off.md +0 -54
  516. package/.docs/reference/voice/voice.on.md +0 -111
  517. package/.docs/reference/voice/voice.send.md +0 -65
  518. package/.docs/reference/voice/voice.speak.md +0 -157
  519. package/.docs/reference/voice/voice.updateConfig.md +0 -60
  520. package/.docs/reference/workflows/run-methods/cancel.md +0 -86
  521. package/.docs/reference/workflows/run-methods/restart.md +0 -33
  522. package/.docs/reference/workflows/run-methods/resume.md +0 -59
  523. package/.docs/reference/workflows/run-methods/start.md +0 -58
  524. package/.docs/reference/workflows/run-methods/startAsync.md +0 -67
  525. package/.docs/reference/workflows/run-methods/timeTravel.md +0 -142
  526. package/.docs/reference/workflows/run.md +0 -59
  527. package/.docs/reference/workflows/step.md +0 -119
  528. package/.docs/reference/workflows/workflow-methods/branch.md +0 -25
  529. package/.docs/reference/workflows/workflow-methods/commit.md +0 -17
  530. package/.docs/reference/workflows/workflow-methods/create-run.md +0 -63
  531. package/.docs/reference/workflows/workflow-methods/dountil.md +0 -25
  532. package/.docs/reference/workflows/workflow-methods/dowhile.md +0 -25
  533. package/.docs/reference/workflows/workflow-methods/foreach.md +0 -118
  534. package/.docs/reference/workflows/workflow-methods/map.md +0 -93
  535. package/.docs/reference/workflows/workflow-methods/parallel.md +0 -21
  536. package/.docs/reference/workflows/workflow-methods/sleep.md +0 -35
  537. package/.docs/reference/workflows/workflow-methods/sleepUntil.md +0 -35
  538. package/.docs/reference/workflows/workflow-methods/then.md +0 -21
  539. package/.docs/reference/workflows/workflow.md +0 -157
  540. package/.docs/reference/workspace/e2b-sandbox.md +0 -288
  541. package/.docs/reference/workspace/filesystem.md +0 -202
  542. package/.docs/reference/workspace/gcs-filesystem.md +0 -170
  543. package/.docs/reference/workspace/local-filesystem.md +0 -327
  544. package/.docs/reference/workspace/local-sandbox.md +0 -285
  545. package/.docs/reference/workspace/s3-filesystem.md +0 -169
  546. package/.docs/reference/workspace/sandbox.md +0 -81
  547. package/.docs/reference/workspace/workspace-class.md +0 -226
@@ -1,270 +0,0 @@
1
- # createScorer
2
-
3
- Mastra provides a unified `createScorer` factory that allows you to define custom scorers for evaluating input/output pairs. You can use either native JavaScript functions or LLM-based prompt objects for each evaluation step. Custom scorers can be added to Agents and Workflow steps.
4
-
5
- ## How to Create a Custom Scorer
6
-
7
- Use the `createScorer` factory to define your scorer with a name, description, and optional judge configuration. Then chain step methods to build your evaluation pipeline. You must provide at least a `generateScore` step.
8
-
9
- **Prompt object steps** are step configurations expressed as objects with `description` + `createPrompt` (and `outputSchema` for `preprocess`/`analyze`). These steps invoke the judge LLM. **Function steps** are plain functions and never call the judge.
10
-
11
- ```typescript
12
- import { createScorer } from "@mastra/core/evals";
13
-
14
- const scorer = createScorer({
15
- id: "my-custom-scorer",
16
- name: "My Custom Scorer", // Optional, defaults to id
17
- description: "Evaluates responses based on custom criteria",
18
- type: "agent", // Optional: for agent evaluation with automatic typing
19
- judge: {
20
- model: myModel,
21
- instructions: "You are an expert evaluator...",
22
- },
23
- })
24
- .preprocess({
25
- /* step config */
26
- })
27
- .analyze({
28
- /* step config */
29
- })
30
- .generateScore(({ run, results }) => {
31
- // Return a number
32
- })
33
- .generateReason({
34
- /* step config */
35
- });
36
- ```
37
-
38
- ## createScorer Options
39
-
40
- **id:** (`string`): Unique identifier for the scorer. Used as the name if `name` is not provided.
41
-
42
- **name?:** (`string`): Name of the scorer. Defaults to `id` if not provided.
43
-
44
- **description:** (`string`): Description of what the scorer does.
45
-
46
- **judge?:** (`object`): Optional judge configuration for LLM-based steps. See Judge Object section below.
47
-
48
- **type?:** (`string`): Type specification for input/output. Use 'agent' for automatic agent types. For custom types, use the generic approach instead.
49
-
50
- This function returns a scorer builder that you can chain step methods onto. See the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer) for details on the `.run()` method and its input/output.
51
-
52
- ## Judge Object
53
-
54
- **model:** (`LanguageModel`): The LLM model instance to use for evaluation.
55
-
56
- **instructions:** (`string`): System prompt/instructions for the LLM.
57
-
58
- The judge only runs for steps defined as **prompt objects** (`preprocess`, `analyze`, `generateScore`, `generateReason` in prompt mode). If you use function steps only, the judge is never called and there is no LLM output to inspect. In that case, any score/reason must be produced by your functions.
59
-
60
- When a prompt-object step runs, its structured LLM output is stored in the corresponding result field (`preprocessStepResult`, `analyzeStepResult`, or the value consumed by `calculateScore` in `generateScore`).
61
-
62
- ## Type Safety
63
-
64
- You can specify input/output types when creating scorers for better type inference and IntelliSense support:
65
-
66
- ### Agent Type Shortcut
67
-
68
- For evaluating agents, use `type: 'agent'` to automatically get the correct types for agent input/output:
69
-
70
- ```typescript
71
- import { createScorer } from "@mastra/core/evals";
72
-
73
- // Agent scorer with automatic typing
74
- const agentScorer = createScorer({
75
- id: "agent-response-quality",
76
- description: "Evaluates agent responses",
77
- type: "agent", // Automatically provides ScorerRunInputForAgent/ScorerRunOutputForAgent
78
- })
79
- .preprocess(({ run }) => {
80
- // run.input is automatically typed as ScorerRunInputForAgent
81
- const userMessage = run.input.inputMessages[0]?.content;
82
- return { userMessage };
83
- })
84
- .generateScore(({ run, results }) => {
85
- // run.output is automatically typed as ScorerRunOutputForAgent
86
- const response = run.output[0]?.content;
87
- return response.length > 10 ? 1.0 : 0.5;
88
- });
89
- ```
90
-
91
- ### Custom Types with Generics
92
-
93
- For custom input/output types, use the generic approach:
94
-
95
- ```typescript
96
- import { createScorer } from "@mastra/core/evals";
97
-
98
- type CustomInput = { query: string; context: string[] };
99
- type CustomOutput = { answer: string; confidence: number };
100
-
101
- const customScorer = createScorer<CustomInput, CustomOutput>({
102
- id: "custom-scorer",
103
- description: "Evaluates custom data",
104
- }).generateScore(({ run }) => {
105
- // run.input is typed as CustomInput
106
- // run.output is typed as CustomOutput
107
- return run.output.confidence;
108
- });
109
- ```
110
-
111
- ### Built-in Agent Types
112
-
113
- - **`ScorerRunInputForAgent`** - Contains `inputMessages`, `rememberedMessages`, `systemMessages`, and `taggedSystemMessages` for agent evaluation
114
- - **`ScorerRunOutputForAgent`** - Array of agent response messages
115
-
116
- Using these types provides autocomplete, compile-time validation, and better documentation for your scoring logic.
117
-
118
- ## Trace Scoring with Agent Types
119
-
120
- When you use `type: 'agent'`, your scorer can be added directly to agents and can also be used to score traces from agent interactions. The scorer automatically transforms trace data into the proper agent input/output format:
121
-
122
- ```typescript
123
- const agentTraceScorer = createScorer({
124
- id: "agent-trace-length",
125
- description: "Evaluates agent response length",
126
- type: "agent",
127
- }).generateScore(({ run }) => {
128
- // Trace data is automatically transformed to agent format
129
- const userMessages = run.input.inputMessages;
130
- const agentResponse = run.output[0]?.content;
131
-
132
- // Score based on response length
133
- return agentResponse?.length > 50 ? 0 : 1;
134
- });
135
-
136
- // Register with Mastra for trace scoring
137
- const mastra = new Mastra({
138
- scorers: {
139
- agentTraceScorer,
140
- },
141
- });
142
- ```
143
-
144
- ## Step Method Signatures
145
-
146
- ### preprocess
147
-
148
- Optional preprocessing step that can extract or transform data before analysis.
149
-
150
- **Function Mode:** Function: `({ run, results }) => any`
151
-
152
- **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
153
-
154
- **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
155
-
156
- **run.runId:** (`string`): Unique identifier for this scoring run.
157
-
158
- **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
159
-
160
- **results:** (`object`): Empty object (no previous steps).
161
-
162
- Returns: `any`\
163
- The method can return any value. The returned value will be available to subsequent steps as `preprocessStepResult`.
164
-
165
- **Prompt Object Mode:**
166
-
167
- **description:** (`string`): Description of what this preprocessing step does.
168
-
169
- **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the preprocess step.
170
-
171
- **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
172
-
173
- **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
174
-
175
- ### analyze
176
-
177
- Optional analysis step that processes the input/output and any preprocessed data.
178
-
179
- **Function Mode:** Function: `({ run, results }) => any`
180
-
181
- **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
182
-
183
- **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
184
-
185
- **run.runId:** (`string`): Unique identifier for this scoring run.
186
-
187
- **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
188
-
189
- **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
190
-
191
- Returns: `any`\
192
- The method can return any value. The returned value will be available to subsequent steps as `analyzeStepResult`.
193
-
194
- **Prompt Object Mode:**
195
-
196
- **description:** (`string`): Description of what this analysis step does.
197
-
198
- **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the analyze step.
199
-
200
- **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
201
-
202
- **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
203
-
204
- ### generateScore
205
-
206
- **Required** step that computes the final numerical score.
207
-
208
- **Function Mode:** Function: `({ run, results }) => number`
209
-
210
- **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
211
-
212
- **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
213
-
214
- **run.runId:** (`string`): Unique identifier for this scoring run.
215
-
216
- **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
217
-
218
- **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
219
-
220
- **results.analyzeStepResult?:** (`any`): Result from analyze step, if defined (optional).
221
-
222
- Returns: `number`\
223
- The method must return a numerical score.
224
-
225
- **Prompt Object Mode:**
226
-
227
- **description:** (`string`): Description of what this scoring step does.
228
-
229
- **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the generateScore step.
230
-
231
- **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
232
-
233
- **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
234
-
235
- When using prompt object mode, you must also provide a `calculateScore` function to convert the LLM output to a numerical score:
236
-
237
- **calculateScore:** (`function`): Function: ({ run, results, analyzeStepResult }) => number. Converts the LLM's structured output into a numerical score.
238
-
239
- ### generateReason
240
-
241
- Optional step that provides an explanation for the score.
242
-
243
- **Function Mode:** Function: `({ run, results, score }) => string`
244
-
245
- **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
246
-
247
- **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
248
-
249
- **run.runId:** (`string`): Unique identifier for this scoring run.
250
-
251
- **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
252
-
253
- **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
254
-
255
- **results.analyzeStepResult?:** (`any`): Result from analyze step, if defined (optional).
256
-
257
- **score:** (`number`): Score computed by the generateScore step.
258
-
259
- Returns: `string`\
260
- The method must return a string explaining the score.
261
-
262
- **Prompt Object Mode:**
263
-
264
- **description:** (`string`): Description of what this reasoning step does.
265
-
266
- **createPrompt:** (`function`): Function: ({ run, results, score }) => string. Returns the prompt for the LLM.
267
-
268
- **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
269
-
270
- All step functions can be async.
@@ -1,114 +0,0 @@
1
- # Faithfulness Scorer
2
-
3
- The `createFaithfulnessScorer()` function evaluates how factually accurate an LLM's output is compared to the provided context. It extracts claims from the output and verifies them against the context, making it essential for measuring the reliability of RAG pipeline responses.
4
-
5
- ## Parameters
6
-
7
- The `createFaithfulnessScorer()` function accepts a single options object with the following properties:
8
-
9
- **model:** (`LanguageModel`): Configuration for the model used to evaluate faithfulness.
10
-
11
- **context:** (`string[]`): Array of context chunks against which the output's claims will be verified.
12
-
13
- **scale:** (`number`): The maximum score value. The final score will be normalized to this scale. (Default: `1`)
14
-
15
- This function returns an instance of the MastraScorer class. The `.run()` method accepts the same input as other scorers (see the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer)), but the return value includes LLM-specific fields as documented below.
16
-
17
- ## .run() Returns
18
-
19
- **runId:** (`string`): The id of the run (optional).
20
-
21
- **preprocessStepResult:** (`string[]`): Array of extracted claims from the output.
22
-
23
- **preprocessPrompt:** (`string`): The prompt sent to the LLM for the preprocess step (optional).
24
-
25
- **analyzeStepResult:** (`object`): Object with verdicts: { verdicts: Array<{ verdict: 'yes' | 'no' | 'unsure', reason: string }> }
26
-
27
- **analyzePrompt:** (`string`): The prompt sent to the LLM for the analyze step (optional).
28
-
29
- **score:** (`number`): A score between 0 and the configured scale, representing the proportion of claims that are supported by the context.
30
-
31
- **reason:** (`string`): A detailed explanation of the score, including which claims were supported, contradicted, or marked as unsure.
32
-
33
- **generateReasonPrompt:** (`string`): The prompt sent to the LLM for the generateReason step (optional).
34
-
35
- ## Scoring Details
36
-
37
- The scorer evaluates faithfulness through claim verification against provided context.
38
-
39
- ### Scoring Process
40
-
41
- 1. Analyzes claims and context:
42
-
43
- - Extracts all claims (factual and speculative)
44
-
45
- - Verifies each claim against context
46
-
47
- - Assigns one of three verdicts:
48
-
49
- - "yes" - claim supported by context
50
- - "no" - claim contradicts context
51
- - "unsure" - claim unverifiable
52
-
53
- 2. Calculates faithfulness score:
54
-
55
- - Counts supported claims
56
- - Divides by total claims
57
- - Scales to configured range
58
-
59
- Final score: `(supported_claims / total_claims) * scale`
60
-
61
- ### Score interpretation
62
-
63
- A faithfulness score between 0 and 1:
64
-
65
- - **1.0**: All claims are accurate and directly supported by the context.
66
- - **0.7–0.9**: Most claims are correct, with minor additions or omissions.
67
- - **0.4–0.6**: Some claims are supported, but others are unverifiable.
68
- - **0.1–0.3**: Most of the content is inaccurate or unsupported.
69
- - **0.0**: All claims are false or contradict the context.
70
-
71
- ## Example
72
-
73
- Evaluate agent responses for faithfulness to provided context:
74
-
75
- ```typescript
76
- import { runEvals } from "@mastra/core/evals";
77
- import { createFaithfulnessScorer } from "@mastra/evals/scorers/prebuilt";
78
- import { myAgent } from "./agent";
79
-
80
- // Context is typically populated from agent tool calls or RAG retrieval
81
- const scorer = createFaithfulnessScorer({
82
- model: "openai/gpt-4o",
83
- });
84
-
85
- const result = await runEvals({
86
- data: [
87
- {
88
- input: "Tell me about the Tesla Model 3.",
89
- },
90
- {
91
- input: "What are the key features of this electric vehicle?",
92
- },
93
- ],
94
- scorers: [scorer],
95
- target: myAgent,
96
- onItemComplete: ({ scorerResults }) => {
97
- console.log({
98
- score: scorerResults[scorer.id].score,
99
- reason: scorerResults[scorer.id].reason,
100
- });
101
- },
102
- });
103
-
104
- console.log(result.scores);
105
- ```
106
-
107
- For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
108
-
109
- To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
110
-
111
- ## Related
112
-
113
- - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy)
114
- - [Hallucination Scorer](https://mastra.ai/reference/evals/hallucination)
@@ -1,220 +0,0 @@
1
- # Hallucination Scorer
2
-
3
- The `createHallucinationScorer()` function evaluates whether an LLM generates factually correct information by comparing its output against the provided context. This scorer measures hallucination by identifying statements in the output that directly contradict the context or that are not supported by it.
4
-
5
- ## Parameters
6
-
7
- The `createHallucinationScorer()` function accepts a single options object with the following properties:
8
-
9
- **model:** (`LanguageModel`): Configuration for the model used to evaluate hallucination.
10
-
11
- **options.scale:** (`number`): Maximum score value. (Default: `1`)
12
-
13
- **options.context:** (`string[]`): Static context strings to use as ground truth for hallucination detection.
14
-
15
- **options.getContext:** (`(params: GetContextParams) => string[] | Promise<string[]>`): A hook to dynamically resolve context at runtime. Takes priority over static context. Useful for live scoring where context (like tool results) is only available when the scorer runs.
16
-
17
- This function returns an instance of the MastraScorer class. The `.run()` method accepts the same input as other scorers (see the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer)), but the return value includes LLM-specific fields as documented below.
18
-
19
- ### GetContextParams
20
-
21
- The `getContext` hook receives the following parameters:
22
-
23
- **run:** (`GetContextRun`): The scorer run containing input, output, runId, requestContext, and tracingContext.
24
-
25
- **results:** (`Record<string, any>`): Accumulated results from previous steps (e.g., preprocessStepResult with extracted claims).
26
-
27
- **score:** (`number`): The computed score. Only present when called from the generateReason step.
28
-
29
- **step:** (`'analyze' | 'generateReason'`): Which step is calling the hook. Useful for caching context between calls.
30
-
31
- ## .run() Returns
32
-
33
- **runId:** (`string`): The id of the run (optional).
34
-
35
- **preprocessStepResult:** (`object`): Object with extracted claims: { claims: string\[] }
36
-
37
- **preprocessPrompt:** (`string`): The prompt sent to the LLM for the preprocess step (optional).
38
-
39
- **analyzeStepResult:** (`object`): Object with verdicts: { verdicts: Array<{ statement: string, verdict: 'yes' | 'no', reason: string }> }
40
-
41
- **analyzePrompt:** (`string`): The prompt sent to the LLM for the analyze step (optional).
42
-
43
- **score:** (`number`): Hallucination score (0 to scale, default 0-1).
44
-
45
- **reason:** (`string`): Detailed explanation of the score and identified contradictions.
46
-
47
- **generateReasonPrompt:** (`string`): The prompt sent to the LLM for the generateReason step (optional).
48
-
49
- ## Scoring Details
50
-
51
- The scorer evaluates hallucination through contradiction detection and unsupported claim analysis.
52
-
53
- ### Scoring Process
54
-
55
- 1. Analyzes factual content:
56
-
57
- - Extracts statements from context
58
- - Identifies numerical values and dates
59
- - Maps statement relationships
60
-
61
- 2. Analyzes output for hallucinations:
62
-
63
- - Compares against context statements
64
- - Marks direct conflicts as hallucinations
65
- - Identifies unsupported claims as hallucinations
66
- - Evaluates numerical accuracy
67
- - Considers approximation context
68
-
69
- 3. Calculates hallucination score:
70
-
71
- - Counts hallucinated statements (contradictions and unsupported claims)
72
- - Divides by total statements
73
- - Scales to configured range
74
-
75
- Final score: `(hallucinated_statements / total_statements) * scale`
76
-
77
- ### Important Considerations
78
-
79
- - Claims not present in context are treated as hallucinations
80
-
81
- - Subjective claims are hallucinations unless explicitly supported
82
-
83
- - Speculative language ("might", "possibly") about facts IN context is allowed
84
-
85
- - Speculative language about facts NOT in context is treated as hallucination
86
-
87
- - Empty outputs result in zero hallucinations
88
-
89
- - Numerical evaluation considers:
90
-
91
- - Scale-appropriate precision
92
- - Contextual approximations
93
- - Explicit precision indicators
94
-
95
- ### Score interpretation
96
-
97
- A hallucination score between 0 and 1:
98
-
99
- - **0.0**: No hallucination — all claims match the context.
100
- - **0.3–0.4**: Low hallucination — a few contradictions.
101
- - **0.5–0.6**: Mixed hallucination — several contradictions.
102
- - **0.7–0.8**: High hallucination — many contradictions.
103
- - **0.9–1.0**: Complete hallucination — most or all claims contradict the context.
104
-
105
- **Note:** The score represents the degree of hallucination — lower scores indicate better factual alignment with the provided context.
106
-
107
- ## Examples
108
-
109
- ### Static Context
110
-
111
- Use static context when you have known ground truth to compare against:
112
-
113
- ```typescript
114
- import { createHallucinationScorer } from "@mastra/evals/scorers/prebuilt";
115
-
116
- const scorer = createHallucinationScorer({
117
- model: "openai/gpt-4o",
118
- options: {
119
- context: [
120
- "The first iPhone was announced on January 9, 2007.",
121
- "It was released on June 29, 2007.",
122
- "Steve Jobs introduced it at Macworld.",
123
- ],
124
- },
125
- });
126
- ```
127
-
128
- ### Dynamic Context with getContext
129
-
130
- Use `getContext` for live scoring scenarios where context comes from tool results:
131
-
132
- ```typescript
133
- import { createHallucinationScorer } from "@mastra/evals/scorers/prebuilt";
134
- import { extractToolResults } from "@mastra/evals/scorers";
135
-
136
- const scorer = createHallucinationScorer({
137
- model: "openai/gpt-4o",
138
- options: {
139
- getContext: ({ run, step }) => {
140
- // Extract tool results as context
141
- const toolResults = extractToolResults(run.output);
142
- return toolResults.map((t) =>
143
- JSON.stringify({ tool: t.toolName, result: t.result })
144
- );
145
- },
146
- },
147
- });
148
- ```
149
-
150
- ### Live Scoring with Agent
151
-
152
- Attach the scorer to an agent for live evaluation:
153
-
154
- ```typescript
155
- import { Agent } from "@mastra/core/agent";
156
- import { createHallucinationScorer } from "@mastra/evals/scorers/prebuilt";
157
- import { extractToolResults } from "@mastra/evals/scorers";
158
-
159
- const hallucinationScorer = createHallucinationScorer({
160
- model: "openai/gpt-4o",
161
- options: {
162
- getContext: ({ run }) => {
163
- const toolResults = extractToolResults(run.output);
164
- return toolResults.map((t) =>
165
- JSON.stringify({ tool: t.toolName, result: t.result })
166
- );
167
- },
168
- },
169
- });
170
-
171
- const agent = new Agent({
172
- name: "my-agent",
173
- model: "openai/gpt-4o",
174
- instructions: "You are a helpful assistant.",
175
- evals: {
176
- scorers: [hallucinationScorer],
177
- },
178
- });
179
- ```
180
-
181
- ### Batch Evaluation with runEvals
182
-
183
- ```typescript
184
- import { runEvals } from "@mastra/core/evals";
185
- import { createHallucinationScorer } from "@mastra/evals/scorers/prebuilt";
186
- import { myAgent } from "./agent";
187
-
188
- const scorer = createHallucinationScorer({
189
- model: "openai/gpt-4o",
190
- options: {
191
- context: ["Known fact 1", "Known fact 2"],
192
- },
193
- });
194
-
195
- const result = await runEvals({
196
- data: [
197
- { input: "Tell me about topic A" },
198
- { input: "Tell me about topic B" },
199
- ],
200
- scorers: [scorer],
201
- target: myAgent,
202
- onItemComplete: ({ scorerResults }) => {
203
- console.log({
204
- score: scorerResults[scorer.id].score,
205
- reason: scorerResults[scorer.id].reason,
206
- });
207
- },
208
- });
209
-
210
- console.log(result.scores);
211
- ```
212
-
213
- For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
214
-
215
- To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
216
-
217
- ## Related
218
-
219
- - [Faithfulness Scorer](https://mastra.ai/reference/evals/faithfulness)
220
- - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy)