@mastra/core 1.7.0 → 1.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (498)
  1. package/CHANGELOG.md +218 -0
  2. package/dist/agent/agent-legacy.d.ts +15 -0
  3. package/dist/agent/agent-legacy.d.ts.map +1 -1
  4. package/dist/agent/agent.d.ts +7 -0
  5. package/dist/agent/agent.d.ts.map +1 -1
  6. package/dist/agent/agent.types.d.ts +311 -2
  7. package/dist/agent/agent.types.d.ts.map +1 -1
  8. package/dist/agent/index.cjs +13 -13
  9. package/dist/agent/index.d.ts +3 -1
  10. package/dist/agent/index.d.ts.map +1 -1
  11. package/dist/agent/index.js +2 -2
  12. package/dist/agent/message-list/index.cjs +18 -18
  13. package/dist/agent/message-list/index.js +1 -1
  14. package/dist/agent/message-list/merge/MessageMerger.d.ts.map +1 -1
  15. package/dist/agent/message-list/message-list.d.ts.map +1 -1
  16. package/dist/agent/workflows/prepare-stream/map-results-step.d.ts.map +1 -1
  17. package/dist/agent/workflows/prepare-stream/prepare-tools-step.d.ts.map +1 -1
  18. package/dist/{chunk-A72NTLFT.cjs → chunk-2IO5Q7OZ.cjs} +7 -7
  19. package/dist/{chunk-A72NTLFT.cjs.map → chunk-2IO5Q7OZ.cjs.map} +1 -1
  20. package/dist/{chunk-DFCRXDVK.js → chunk-2KHPZJNU.js} +10 -8
  21. package/dist/chunk-2KHPZJNU.js.map +1 -0
  22. package/dist/{chunk-R4N65TLG.js → chunk-2R5MQMSA.js} +35 -16
  23. package/dist/chunk-2R5MQMSA.js.map +1 -0
  24. package/dist/{chunk-ZSBM2SVU.js → chunk-4H5F6AFP.js} +1064 -226
  25. package/dist/chunk-4H5F6AFP.js.map +1 -0
  26. package/dist/{chunk-BQHWJLXU.js → chunk-63G75DJE.js} +9 -3
  27. package/dist/chunk-63G75DJE.js.map +1 -0
  28. package/dist/{chunk-SBOHDNIZ.cjs → chunk-6GSWC5ZA.cjs} +2 -2
  29. package/dist/{chunk-SBOHDNIZ.cjs.map → chunk-6GSWC5ZA.cjs.map} +1 -1
  30. package/dist/{chunk-QTAS3HND.cjs → chunk-6Q2UD3XF.cjs} +21 -14
  31. package/dist/chunk-6Q2UD3XF.cjs.map +1 -0
  32. package/dist/{chunk-GPJGPARM.js → chunk-DTPR3JAM.js} +2 -2
  33. package/dist/{chunk-GPJGPARM.js.map → chunk-DTPR3JAM.js.map} +1 -1
  34. package/dist/{chunk-NN26FSKL.js → chunk-FHJ2KIU5.js} +3 -3
  35. package/dist/{chunk-NN26FSKL.js.map → chunk-FHJ2KIU5.js.map} +1 -1
  36. package/dist/{chunk-RABITNTG.cjs → chunk-HWG7NPJA.cjs} +55 -55
  37. package/dist/{chunk-RABITNTG.cjs.map → chunk-HWG7NPJA.cjs.map} +1 -1
  38. package/dist/{chunk-HB6T4554.cjs → chunk-KH3G65IS.cjs} +10 -8
  39. package/dist/chunk-KH3G65IS.cjs.map +1 -0
  40. package/dist/{chunk-YQG7NBPR.cjs → chunk-KZ4IKNPN.cjs} +25 -23
  41. package/dist/chunk-KZ4IKNPN.cjs.map +1 -0
  42. package/dist/{chunk-6DUTLERJ.js → chunk-MRV5NCPC.js} +3 -3
  43. package/dist/{chunk-6DUTLERJ.js.map → chunk-MRV5NCPC.js.map} +1 -1
  44. package/dist/{chunk-O7PZ4VOO.cjs → chunk-N3ROEJG4.cjs} +12 -10
  45. package/dist/chunk-N3ROEJG4.cjs.map +1 -0
  46. package/dist/{chunk-7EXW4AAG.js → chunk-NXKI2L4X.js} +6 -4
  47. package/dist/chunk-NXKI2L4X.js.map +1 -0
  48. package/dist/{chunk-QWTB53GS.js → chunk-OSEPGSLN.js} +6 -6
  49. package/dist/{chunk-QWTB53GS.js.map → chunk-OSEPGSLN.js.map} +1 -1
  50. package/dist/{chunk-6OXW5E2O.js → chunk-PI7ONENO.js} +4 -4
  51. package/dist/{chunk-6OXW5E2O.js.map → chunk-PI7ONENO.js.map} +1 -1
  52. package/dist/{chunk-KUXNBWN7.js → chunk-Q4MV4XKX.js} +8 -6
  53. package/dist/chunk-Q4MV4XKX.js.map +1 -0
  54. package/dist/{chunk-7UAJ6LMR.cjs → chunk-QKQGKEN7.cjs} +1078 -241
  55. package/dist/chunk-QKQGKEN7.cjs.map +1 -0
  56. package/dist/{chunk-IC5OUWKJ.js → chunk-SP7P6Z4L.js} +19 -2
  57. package/dist/chunk-SP7P6Z4L.js.map +1 -0
  58. package/dist/{chunk-QDH6MVJ7.cjs → chunk-TGUDI64A.cjs} +14 -14
  59. package/dist/{chunk-QDH6MVJ7.cjs.map → chunk-TGUDI64A.cjs.map} +1 -1
  60. package/dist/{chunk-EAZ6YDCQ.cjs → chunk-U3HBG2GU.cjs} +9 -2
  61. package/dist/chunk-U3HBG2GU.cjs.map +1 -0
  62. package/dist/{chunk-6QBN6MZY.cjs → chunk-VAKB5EXJ.cjs} +42 -23
  63. package/dist/chunk-VAKB5EXJ.cjs.map +1 -0
  64. package/dist/{chunk-QSHV7GPT.js → chunk-VBPU6CLZ.js} +3808 -3026
  65. package/dist/chunk-VBPU6CLZ.js.map +1 -0
  66. package/dist/{chunk-2X66GWF5.cjs → chunk-VTVCMIAI.cjs} +3905 -3121
  67. package/dist/chunk-VTVCMIAI.cjs.map +1 -0
  68. package/dist/{chunk-PHHJLGZU.cjs → chunk-XNWF6CYR.cjs} +6 -6
  69. package/dist/{chunk-PHHJLGZU.cjs.map → chunk-XNWF6CYR.cjs.map} +1 -1
  70. package/dist/{chunk-T6GAM3SQ.js → chunk-ZRPTWYWJ.js} +18 -11
  71. package/dist/chunk-ZRPTWYWJ.js.map +1 -0
  72. package/dist/{chunk-DB7U2C5B.cjs → chunk-ZXOWG32X.cjs} +19 -2
  73. package/dist/chunk-ZXOWG32X.cjs.map +1 -0
  74. package/dist/datasets/experiment/index.d.ts.map +1 -1
  75. package/dist/datasets/experiment/scorer.d.ts +1 -1
  76. package/dist/datasets/experiment/scorer.d.ts.map +1 -1
  77. package/dist/datasets/index.cjs +17 -17
  78. package/dist/datasets/index.js +2 -2
  79. package/dist/docs/SKILL.md +300 -0
  80. package/dist/docs/assets/SOURCE_MAP.json +1423 -0
  81. package/dist/docs/references/docs-agents-adding-voice.md +349 -0
  82. package/dist/docs/references/docs-agents-agent-approval.md +558 -0
  83. package/dist/docs/references/docs-agents-agent-memory.md +209 -0
  84. package/dist/docs/references/docs-agents-guardrails.md +374 -0
  85. package/dist/docs/references/docs-agents-network-approval.md +275 -0
  86. package/dist/docs/references/docs-agents-networks.md +299 -0
  87. package/dist/docs/references/docs-agents-overview.md +304 -0
  88. package/dist/docs/references/docs-agents-processors.md +622 -0
  89. package/dist/docs/references/docs-agents-structured-output.md +273 -0
  90. package/dist/docs/references/docs-agents-supervisor-agents.md +304 -0
  91. package/dist/docs/references/docs-agents-using-tools.md +214 -0
  92. package/dist/docs/references/docs-evals-custom-scorers.md +519 -0
  93. package/dist/docs/references/docs-evals-overview.md +141 -0
  94. package/dist/docs/references/docs-evals-running-in-ci.md +124 -0
  95. package/dist/docs/references/docs-memory-memory-processors.md +314 -0
  96. package/dist/docs/references/docs-memory-observational-memory.md +248 -0
  97. package/dist/docs/references/docs-memory-overview.md +45 -0
  98. package/dist/docs/references/docs-memory-semantic-recall.md +272 -0
  99. package/dist/docs/references/docs-memory-storage.md +261 -0
  100. package/dist/docs/references/docs-memory-working-memory.md +400 -0
  101. package/dist/docs/references/docs-observability-datasets-overview.md +198 -0
  102. package/dist/docs/references/docs-observability-datasets-running-experiments.md +274 -0
  103. package/dist/docs/references/docs-observability-logging.md +99 -0
  104. package/dist/docs/references/docs-observability-overview.md +70 -0
  105. package/dist/docs/references/docs-observability-tracing-bridges-otel.md +209 -0
  106. package/dist/docs/references/docs-observability-tracing-exporters-arize.md +272 -0
  107. package/dist/docs/references/docs-observability-tracing-exporters-braintrust.md +111 -0
  108. package/dist/docs/references/docs-observability-tracing-exporters-cloud.md +127 -0
  109. package/dist/docs/references/docs-observability-tracing-exporters-datadog.md +187 -0
  110. package/dist/docs/references/docs-observability-tracing-exporters-default.md +209 -0
  111. package/dist/docs/references/docs-observability-tracing-exporters-laminar.md +100 -0
  112. package/dist/docs/references/docs-observability-tracing-exporters-langfuse.md +213 -0
  113. package/dist/docs/references/docs-observability-tracing-exporters-langsmith.md +198 -0
  114. package/dist/docs/references/docs-observability-tracing-exporters-otel.md +476 -0
  115. package/dist/docs/references/docs-observability-tracing-exporters-posthog.md +148 -0
  116. package/dist/docs/references/docs-observability-tracing-overview.md +1112 -0
  117. package/dist/docs/references/docs-rag-chunking-and-embedding.md +183 -0
  118. package/dist/docs/references/docs-rag-graph-rag.md +215 -0
  119. package/dist/docs/references/docs-rag-overview.md +72 -0
  120. package/dist/docs/references/docs-rag-retrieval.md +515 -0
  121. package/dist/docs/references/docs-rag-vector-databases.md +645 -0
  122. package/dist/docs/references/docs-server-auth-auth0.md +220 -0
  123. package/dist/docs/references/docs-server-auth-clerk.md +132 -0
  124. package/dist/docs/references/docs-server-auth-composite-auth.md +234 -0
  125. package/dist/docs/references/docs-server-auth-custom-auth-provider.md +513 -0
  126. package/dist/docs/references/docs-server-auth-firebase.md +272 -0
  127. package/dist/docs/references/docs-server-auth-jwt.md +110 -0
  128. package/dist/docs/references/docs-server-auth-simple-auth.md +180 -0
  129. package/dist/docs/references/docs-server-auth-supabase.md +117 -0
  130. package/dist/docs/references/docs-server-auth-workos.md +186 -0
  131. package/dist/docs/references/docs-server-custom-adapters.md +378 -0
  132. package/dist/docs/references/docs-server-custom-api-routes.md +267 -0
  133. package/dist/docs/references/docs-server-mastra-client.md +243 -0
  134. package/dist/docs/references/docs-server-mastra-server.md +71 -0
  135. package/dist/docs/references/docs-server-middleware.md +225 -0
  136. package/dist/docs/references/docs-server-request-context.md +471 -0
  137. package/dist/docs/references/docs-streaming-events.md +237 -0
  138. package/dist/docs/references/docs-streaming-tool-streaming.md +175 -0
  139. package/dist/docs/references/docs-streaming-workflow-streaming.md +109 -0
  140. package/dist/docs/references/docs-voice-overview.md +959 -0
  141. package/dist/docs/references/docs-voice-speech-to-speech.md +102 -0
  142. package/dist/docs/references/docs-voice-speech-to-text.md +79 -0
  143. package/dist/docs/references/docs-voice-text-to-speech.md +83 -0
  144. package/dist/docs/references/docs-workflows-agents-and-tools.md +166 -0
  145. package/dist/docs/references/docs-workflows-control-flow.md +822 -0
  146. package/dist/docs/references/docs-workflows-error-handling.md +360 -0
  147. package/dist/docs/references/docs-workflows-human-in-the-loop.md +215 -0
  148. package/dist/docs/references/docs-workflows-overview.md +370 -0
  149. package/dist/docs/references/docs-workflows-snapshots.md +238 -0
  150. package/dist/docs/references/docs-workflows-suspend-and-resume.md +205 -0
  151. package/dist/docs/references/docs-workflows-time-travel.md +309 -0
  152. package/dist/docs/references/docs-workflows-workflow-state.md +181 -0
  153. package/dist/docs/references/docs-workspace-filesystem.md +164 -0
  154. package/dist/docs/references/docs-workspace-overview.md +239 -0
  155. package/dist/docs/references/docs-workspace-sandbox.md +63 -0
  156. package/dist/docs/references/docs-workspace-search.md +243 -0
  157. package/dist/docs/references/docs-workspace-skills.md +169 -0
  158. package/dist/docs/references/guides-agent-frameworks-ai-sdk.md +140 -0
  159. package/dist/docs/references/reference-agents-agent.md +141 -0
  160. package/dist/docs/references/reference-agents-generate.md +186 -0
  161. package/dist/docs/references/reference-agents-generateLegacy.md +173 -0
  162. package/dist/docs/references/reference-agents-getDefaultGenerateOptions.md +36 -0
  163. package/dist/docs/references/reference-agents-getDefaultOptions.md +34 -0
  164. package/dist/docs/references/reference-agents-getDefaultStreamOptions.md +36 -0
  165. package/dist/docs/references/reference-agents-getDescription.md +21 -0
  166. package/dist/docs/references/reference-agents-getInstructions.md +34 -0
  167. package/dist/docs/references/reference-agents-getLLM.md +37 -0
  168. package/dist/docs/references/reference-agents-getMemory.md +34 -0
  169. package/dist/docs/references/reference-agents-getModel.md +34 -0
  170. package/dist/docs/references/reference-agents-getTools.md +29 -0
  171. package/dist/docs/references/reference-agents-getVoice.md +34 -0
  172. package/dist/docs/references/reference-agents-listAgents.md +35 -0
  173. package/dist/docs/references/reference-agents-listScorers.md +34 -0
  174. package/dist/docs/references/reference-agents-listTools.md +34 -0
  175. package/dist/docs/references/reference-agents-listWorkflows.md +34 -0
  176. package/dist/docs/references/reference-agents-network.md +133 -0
  177. package/dist/docs/references/reference-ai-sdk-chat-route.md +82 -0
  178. package/dist/docs/references/reference-ai-sdk-network-route.md +74 -0
  179. package/dist/docs/references/reference-ai-sdk-to-ai-sdk-stream.md +231 -0
  180. package/dist/docs/references/reference-ai-sdk-with-mastra.md +59 -0
  181. package/dist/docs/references/reference-ai-sdk-workflow-route.md +79 -0
  182. package/dist/docs/references/reference-auth-auth0.md +73 -0
  183. package/dist/docs/references/reference-auth-clerk.md +36 -0
  184. package/dist/docs/references/reference-auth-firebase.md +80 -0
  185. package/dist/docs/references/reference-auth-jwt.md +26 -0
  186. package/dist/docs/references/reference-auth-supabase.md +33 -0
  187. package/dist/docs/references/reference-auth-workos.md +84 -0
  188. package/dist/docs/references/reference-client-js-agents.md +437 -0
  189. package/dist/docs/references/reference-configuration.md +752 -0
  190. package/dist/docs/references/reference-core-addGateway.md +42 -0
  191. package/dist/docs/references/reference-core-getAgent.md +21 -0
  192. package/dist/docs/references/reference-core-getAgentById.md +21 -0
  193. package/dist/docs/references/reference-core-getDeployer.md +22 -0
  194. package/dist/docs/references/reference-core-getGateway.md +38 -0
  195. package/dist/docs/references/reference-core-getGatewayById.md +41 -0
  196. package/dist/docs/references/reference-core-getLogger.md +22 -0
  197. package/dist/docs/references/reference-core-getMCPServer.md +47 -0
  198. package/dist/docs/references/reference-core-getMCPServerById.md +55 -0
  199. package/dist/docs/references/reference-core-getMemory.md +50 -0
  200. package/dist/docs/references/reference-core-getScorer.md +54 -0
  201. package/dist/docs/references/reference-core-getScorerById.md +54 -0
  202. package/dist/docs/references/reference-core-getServer.md +22 -0
  203. package/dist/docs/references/reference-core-getStorage.md +22 -0
  204. package/dist/docs/references/reference-core-getStoredAgentById.md +89 -0
  205. package/dist/docs/references/reference-core-getTelemetry.md +22 -0
  206. package/dist/docs/references/reference-core-getVector.md +22 -0
  207. package/dist/docs/references/reference-core-getWorkflow.md +42 -0
  208. package/dist/docs/references/reference-core-listAgents.md +21 -0
  209. package/dist/docs/references/reference-core-listGateways.md +40 -0
  210. package/dist/docs/references/reference-core-listLogs.md +38 -0
  211. package/dist/docs/references/reference-core-listLogsByRunId.md +36 -0
  212. package/dist/docs/references/reference-core-listMCPServers.md +55 -0
  213. package/dist/docs/references/reference-core-listMemory.md +56 -0
  214. package/dist/docs/references/reference-core-listScorers.md +29 -0
  215. package/dist/docs/references/reference-core-listStoredAgents.md +93 -0
  216. package/dist/docs/references/reference-core-listVectors.md +22 -0
  217. package/dist/docs/references/reference-core-listWorkflows.md +21 -0
  218. package/dist/docs/references/reference-core-mastra-class.md +66 -0
  219. package/dist/docs/references/reference-core-mastra-model-gateway.md +153 -0
  220. package/dist/docs/references/reference-core-setLogger.md +26 -0
  221. package/dist/docs/references/reference-core-setStorage.md +27 -0
  222. package/dist/docs/references/reference-datasets-addItem.md +37 -0
  223. package/dist/docs/references/reference-datasets-addItems.md +35 -0
  224. package/dist/docs/references/reference-datasets-compareExperiments.md +52 -0
  225. package/dist/docs/references/reference-datasets-create.md +51 -0
  226. package/dist/docs/references/reference-datasets-dataset.md +82 -0
  227. package/dist/docs/references/reference-datasets-datasets-manager.md +94 -0
  228. package/dist/docs/references/reference-datasets-delete.md +25 -0
  229. package/dist/docs/references/reference-datasets-deleteExperiment.md +27 -0
  230. package/dist/docs/references/reference-datasets-deleteItem.md +27 -0
  231. package/dist/docs/references/reference-datasets-deleteItems.md +29 -0
  232. package/dist/docs/references/reference-datasets-get.md +31 -0
  233. package/dist/docs/references/reference-datasets-getDetails.md +47 -0
  234. package/dist/docs/references/reference-datasets-getExperiment.md +30 -0
  235. package/dist/docs/references/reference-datasets-getItem.md +33 -0
  236. package/dist/docs/references/reference-datasets-getItemHistory.md +31 -0
  237. package/dist/docs/references/reference-datasets-list.md +31 -0
  238. package/dist/docs/references/reference-datasets-listExperimentResults.md +39 -0
  239. package/dist/docs/references/reference-datasets-listExperiments.md +33 -0
  240. package/dist/docs/references/reference-datasets-listItems.md +46 -0
  241. package/dist/docs/references/reference-datasets-listVersions.md +33 -0
  242. package/dist/docs/references/reference-datasets-startExperiment.md +62 -0
  243. package/dist/docs/references/reference-datasets-startExperimentAsync.md +43 -0
  244. package/dist/docs/references/reference-datasets-update.md +48 -0
  245. package/dist/docs/references/reference-datasets-updateItem.md +38 -0
  246. package/dist/docs/references/reference-evals-answer-relevancy.md +105 -0
  247. package/dist/docs/references/reference-evals-answer-similarity.md +99 -0
  248. package/dist/docs/references/reference-evals-bias.md +120 -0
  249. package/dist/docs/references/reference-evals-completeness.md +136 -0
  250. package/dist/docs/references/reference-evals-content-similarity.md +101 -0
  251. package/dist/docs/references/reference-evals-context-precision.md +196 -0
  252. package/dist/docs/references/reference-evals-create-scorer.md +270 -0
  253. package/dist/docs/references/reference-evals-faithfulness.md +114 -0
  254. package/dist/docs/references/reference-evals-hallucination.md +213 -0
  255. package/dist/docs/references/reference-evals-keyword-coverage.md +128 -0
  256. package/dist/docs/references/reference-evals-mastra-scorer.md +123 -0
  257. package/dist/docs/references/reference-evals-run-evals.md +179 -0
  258. package/dist/docs/references/reference-evals-scorer-utils.md +326 -0
  259. package/dist/docs/references/reference-evals-textual-difference.md +113 -0
  260. package/dist/docs/references/reference-evals-tone-consistency.md +119 -0
  261. package/dist/docs/references/reference-evals-toxicity.md +123 -0
  262. package/dist/docs/references/reference-harness-harness-class.md +708 -0
  263. package/dist/docs/references/reference-logging-pino-logger.md +117 -0
  264. package/dist/docs/references/reference-memory-deleteMessages.md +38 -0
  265. package/dist/docs/references/reference-memory-memory-class.md +147 -0
  266. package/dist/docs/references/reference-memory-observational-memory.md +565 -0
  267. package/dist/docs/references/reference-observability-tracing-bridges-otel.md +131 -0
  268. package/dist/docs/references/reference-observability-tracing-configuration.md +178 -0
  269. package/dist/docs/references/reference-observability-tracing-exporters-console-exporter.md +138 -0
  270. package/dist/docs/references/reference-observability-tracing-exporters-datadog.md +116 -0
  271. package/dist/docs/references/reference-observability-tracing-instances.md +107 -0
  272. package/dist/docs/references/reference-observability-tracing-interfaces.md +743 -0
  273. package/dist/docs/references/reference-observability-tracing-processors-sensitive-data-filter.md +144 -0
  274. package/dist/docs/references/reference-observability-tracing-spans.md +224 -0
  275. package/dist/docs/references/reference-processors-batch-parts-processor.md +61 -0
  276. package/dist/docs/references/reference-processors-language-detector.md +82 -0
  277. package/dist/docs/references/reference-processors-message-history-processor.md +85 -0
  278. package/dist/docs/references/reference-processors-moderation-processor.md +104 -0
  279. package/dist/docs/references/reference-processors-pii-detector.md +108 -0
  280. package/dist/docs/references/reference-processors-processor-interface.md +521 -0
  281. package/dist/docs/references/reference-processors-prompt-injection-detector.md +72 -0
  282. package/dist/docs/references/reference-processors-semantic-recall-processor.md +117 -0
  283. package/dist/docs/references/reference-processors-system-prompt-scrubber.md +80 -0
  284. package/dist/docs/references/reference-processors-token-limiter-processor.md +115 -0
  285. package/dist/docs/references/reference-processors-tool-call-filter.md +85 -0
  286. package/dist/docs/references/reference-processors-tool-search-processor.md +111 -0
  287. package/dist/docs/references/reference-processors-unicode-normalizer.md +62 -0
  288. package/dist/docs/references/reference-processors-working-memory-processor.md +152 -0
  289. package/dist/docs/references/reference-rag-database-config.md +261 -0
  290. package/dist/docs/references/reference-rag-embeddings.md +92 -0
  291. package/dist/docs/references/reference-server-mastra-server.md +298 -0
  292. package/dist/docs/references/reference-server-register-api-route.md +249 -0
  293. package/dist/docs/references/reference-storage-cloudflare-d1.md +218 -0
  294. package/dist/docs/references/reference-storage-composite.md +235 -0
  295. package/dist/docs/references/reference-storage-lance.md +131 -0
  296. package/dist/docs/references/reference-storage-libsql.md +135 -0
  297. package/dist/docs/references/reference-storage-mongodb.md +262 -0
  298. package/dist/docs/references/reference-storage-mssql.md +157 -0
  299. package/dist/docs/references/reference-storage-overview.md +121 -0
  300. package/dist/docs/references/reference-storage-postgresql.md +526 -0
  301. package/dist/docs/references/reference-storage-upstash.md +160 -0
  302. package/dist/docs/references/reference-streaming-ChunkType.md +292 -0
  303. package/dist/docs/references/reference-streaming-agents-MastraModelOutput.md +182 -0
  304. package/dist/docs/references/reference-streaming-agents-streamLegacy.md +142 -0
  305. package/dist/docs/references/reference-streaming-workflows-observeStream.md +42 -0
  306. package/dist/docs/references/reference-streaming-workflows-resumeStream.md +61 -0
  307. package/dist/docs/references/reference-streaming-workflows-stream.md +88 -0
  308. package/dist/docs/references/reference-streaming-workflows-timeTravelStream.md +142 -0
  309. package/dist/docs/references/reference-templates-overview.md +194 -0
  310. package/dist/docs/references/reference-tools-create-tool.md +237 -0
  311. package/dist/docs/references/reference-tools-graph-rag-tool.md +182 -0
  312. package/dist/docs/references/reference-tools-mcp-client.md +954 -0
  313. package/dist/docs/references/reference-tools-mcp-server.md +1271 -0
  314. package/dist/docs/references/reference-tools-vector-query-tool.md +459 -0
  315. package/dist/docs/references/reference-vectors-libsql.md +305 -0
  316. package/dist/docs/references/reference-vectors-mongodb.md +295 -0
  317. package/dist/docs/references/reference-vectors-pg.md +408 -0
  318. package/dist/docs/references/reference-vectors-upstash.md +294 -0
  319. package/dist/docs/references/reference-voice-composite-voice.md +121 -0
  320. package/dist/docs/references/reference-voice-mastra-voice.md +311 -0
  321. package/dist/docs/references/reference-voice-voice.addInstructions.md +55 -0
  322. package/dist/docs/references/reference-voice-voice.addTools.md +67 -0
  323. package/dist/docs/references/reference-voice-voice.connect.md +94 -0
  324. package/dist/docs/references/reference-voice-voice.events.md +37 -0
  325. package/dist/docs/references/reference-voice-voice.listen.md +164 -0
  326. package/dist/docs/references/reference-voice-voice.on.md +111 -0
  327. package/dist/docs/references/reference-voice-voice.speak.md +157 -0
  328. package/dist/docs/references/reference-workflows-run-methods-cancel.md +86 -0
  329. package/dist/docs/references/reference-workflows-run-methods-restart.md +33 -0
  330. package/dist/docs/references/reference-workflows-run-methods-resume.md +59 -0
  331. package/dist/docs/references/reference-workflows-run-methods-start.md +58 -0
  332. package/dist/docs/references/reference-workflows-run-methods-startAsync.md +67 -0
  333. package/dist/docs/references/reference-workflows-run-methods-timeTravel.md +142 -0
  334. package/dist/docs/references/reference-workflows-run.md +59 -0
  335. package/dist/docs/references/reference-workflows-step.md +119 -0
  336. package/dist/docs/references/reference-workflows-workflow-methods-branch.md +25 -0
  337. package/dist/docs/references/reference-workflows-workflow-methods-commit.md +17 -0
  338. package/dist/docs/references/reference-workflows-workflow-methods-create-run.md +63 -0
  339. package/dist/docs/references/reference-workflows-workflow-methods-dountil.md +25 -0
  340. package/dist/docs/references/reference-workflows-workflow-methods-dowhile.md +25 -0
  341. package/dist/docs/references/reference-workflows-workflow-methods-foreach.md +118 -0
  342. package/dist/docs/references/reference-workflows-workflow-methods-map.md +93 -0
  343. package/dist/docs/references/reference-workflows-workflow-methods-parallel.md +21 -0
  344. package/dist/docs/references/reference-workflows-workflow-methods-sleep.md +35 -0
  345. package/dist/docs/references/reference-workflows-workflow-methods-sleepUntil.md +35 -0
  346. package/dist/docs/references/reference-workflows-workflow-methods-then.md +21 -0
  347. package/dist/docs/references/reference-workflows-workflow.md +157 -0
  348. package/dist/docs/references/reference-workspace-filesystem.md +255 -0
  349. package/dist/docs/references/reference-workspace-local-filesystem.md +343 -0
  350. package/dist/docs/references/reference-workspace-local-sandbox.md +301 -0
  351. package/dist/docs/references/reference-workspace-sandbox.md +87 -0
  352. package/dist/docs/references/reference-workspace-workspace-class.md +244 -0
  353. package/dist/docs/references/reference.md +277 -0
  354. package/dist/evals/index.cjs +20 -20
  355. package/dist/evals/index.js +3 -3
  356. package/dist/evals/run/index.d.ts +9 -2
  357. package/dist/evals/run/index.d.ts.map +1 -1
  358. package/dist/evals/scoreTraces/index.cjs +5 -5
  359. package/dist/evals/scoreTraces/index.js +2 -2
  360. package/dist/harness/harness.d.ts +6 -0
  361. package/dist/harness/harness.d.ts.map +1 -1
  362. package/dist/harness/index.cjs +28 -13
  363. package/dist/harness/index.cjs.map +1 -1
  364. package/dist/harness/index.js +20 -5
  365. package/dist/harness/index.js.map +1 -1
  366. package/dist/index.cjs +2 -2
  367. package/dist/index.js +1 -1
  368. package/dist/integration/index.cjs +2 -2
  369. package/dist/integration/index.js +1 -1
  370. package/dist/llm/index.cjs +6 -6
  371. package/dist/llm/index.js +1 -1
  372. package/dist/llm/model/embedding-router.d.ts.map +1 -1
  373. package/dist/llm/model/model.loop.d.ts +1 -1
  374. package/dist/llm/model/model.loop.d.ts.map +1 -1
  375. package/dist/loop/index.cjs +20 -12
  376. package/dist/loop/index.js +1 -1
  377. package/dist/loop/network/index.d.ts.map +1 -1
  378. package/dist/loop/network/validation.d.ts +51 -0
  379. package/dist/loop/network/validation.d.ts.map +1 -1
  380. package/dist/loop/test-utils/generateText.d.ts.map +1 -1
  381. package/dist/loop/test-utils/options.d.ts.map +1 -1
  382. package/dist/loop/test-utils/streamObject.d.ts.map +1 -1
  383. package/dist/loop/types.d.ts +15 -0
  384. package/dist/loop/types.d.ts.map +1 -1
  385. package/dist/loop/workflows/agentic-execution/index.d.ts +3 -0
  386. package/dist/loop/workflows/agentic-execution/index.d.ts.map +1 -1
  387. package/dist/loop/workflows/agentic-execution/is-task-complete-step.d.ts +126 -0
  388. package/dist/loop/workflows/agentic-execution/is-task-complete-step.d.ts.map +1 -0
  389. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts +3 -1
  390. package/dist/loop/workflows/agentic-execution/llm-execution-step.d.ts.map +1 -1
  391. package/dist/loop/workflows/agentic-execution/llm-mapping-step.d.ts +1 -0
  392. package/dist/loop/workflows/agentic-execution/llm-mapping-step.d.ts.map +1 -1
  393. package/dist/loop/workflows/agentic-execution/tool-call-step.d.ts.map +1 -1
  394. package/dist/loop/workflows/agentic-loop/index.d.ts +3 -0
  395. package/dist/loop/workflows/agentic-loop/index.d.ts.map +1 -1
  396. package/dist/loop/workflows/schema.d.ts +3 -0
  397. package/dist/loop/workflows/schema.d.ts.map +1 -1
  398. package/dist/mastra/index.cjs +2 -2
  399. package/dist/mastra/index.d.ts +9 -5
  400. package/dist/mastra/index.d.ts.map +1 -1
  401. package/dist/mastra/index.js +1 -1
  402. package/dist/memory/index.cjs +14 -14
  403. package/dist/memory/index.js +1 -1
  404. package/dist/processor-provider/index.cjs +10 -10
  405. package/dist/processor-provider/index.js +1 -1
  406. package/dist/processors/index.cjs +42 -42
  407. package/dist/processors/index.js +1 -1
  408. package/dist/processors/processors/skills.d.ts.map +1 -1
  409. package/dist/relevance/index.cjs +3 -3
  410. package/dist/relevance/index.js +1 -1
  411. package/dist/storage/constants.cjs +56 -56
  412. package/dist/storage/constants.js +1 -1
  413. package/dist/storage/domains/memory/inmemory.d.ts.map +1 -1
  414. package/dist/storage/index.cjs +160 -160
  415. package/dist/storage/index.js +2 -2
  416. package/dist/storage/types.d.ts +2 -3
  417. package/dist/storage/types.d.ts.map +1 -1
  418. package/dist/stream/aisdk/v5/compat/prepare-tools.d.ts.map +1 -1
  419. package/dist/stream/base/output.d.ts +1 -0
  420. package/dist/stream/base/output.d.ts.map +1 -1
  421. package/dist/stream/index.cjs +11 -11
  422. package/dist/stream/index.js +2 -2
  423. package/dist/stream/types.d.ts +27 -1
  424. package/dist/stream/types.d.ts.map +1 -1
  425. package/dist/test-utils/llm-mock.cjs +4 -4
  426. package/dist/test-utils/llm-mock.js +1 -1
  427. package/dist/tool-loop-agent/index.cjs +4 -4
  428. package/dist/tool-loop-agent/index.js +1 -1
  429. package/dist/tools/index.cjs +9 -5
  430. package/dist/tools/index.d.ts +1 -1
  431. package/dist/tools/index.d.ts.map +1 -1
  432. package/dist/tools/index.js +1 -1
  433. package/dist/tools/is-vercel-tool.cjs +2 -2
  434. package/dist/tools/is-vercel-tool.js +1 -1
  435. package/dist/tools/toolchecks.d.ts +10 -0
  436. package/dist/tools/toolchecks.d.ts.map +1 -1
  437. package/dist/utils.cjs +23 -23
  438. package/dist/utils.js +1 -1
  439. package/dist/vector/index.cjs +7 -7
  440. package/dist/vector/index.js +1 -1
  441. package/dist/vector/types.d.ts +9 -1
  442. package/dist/vector/types.d.ts.map +1 -1
  443. package/dist/workflows/evented/index.cjs +10 -10
  444. package/dist/workflows/evented/index.js +1 -1
  445. package/dist/workflows/index.cjs +25 -25
  446. package/dist/workflows/index.js +1 -1
  447. package/dist/workflows/types.d.ts +14 -1
  448. package/dist/workflows/types.d.ts.map +1 -1
  449. package/dist/workflows/workflow.d.ts +3 -17
  450. package/dist/workflows/workflow.d.ts.map +1 -1
  451. package/dist/workspace/filesystem/composite-filesystem.d.ts +5 -0
  452. package/dist/workspace/filesystem/composite-filesystem.d.ts.map +1 -1
  453. package/dist/workspace/filesystem/filesystem.d.ts +12 -0
  454. package/dist/workspace/filesystem/filesystem.d.ts.map +1 -1
  455. package/dist/workspace/filesystem/fs-utils.d.ts +12 -0
  456. package/dist/workspace/filesystem/fs-utils.d.ts.map +1 -1
  457. package/dist/workspace/filesystem/local-filesystem.d.ts +6 -0
  458. package/dist/workspace/filesystem/local-filesystem.d.ts.map +1 -1
  459. package/dist/workspace/index.cjs +66 -66
  460. package/dist/workspace/index.js +1 -1
  461. package/dist/workspace/lsp/client.d.ts +76 -0
  462. package/dist/workspace/lsp/client.d.ts.map +1 -0
  463. package/dist/workspace/lsp/index.d.ts +6 -0
  464. package/dist/workspace/lsp/index.d.ts.map +1 -0
  465. package/dist/workspace/lsp/language.d.ts +16 -0
  466. package/dist/workspace/lsp/language.d.ts.map +1 -0
  467. package/dist/workspace/lsp/manager.d.ts +72 -0
  468. package/dist/workspace/lsp/manager.d.ts.map +1 -0
  469. package/dist/workspace/lsp/servers.d.ts +43 -0
  470. package/dist/workspace/lsp/servers.d.ts.map +1 -0
  471. package/dist/workspace/lsp/types.d.ts +45 -0
  472. package/dist/workspace/lsp/types.d.ts.map +1 -0
  473. package/dist/workspace/tools/ast-edit.d.ts.map +1 -1
  474. package/dist/workspace/tools/edit-file.d.ts.map +1 -1
  475. package/dist/workspace/tools/helpers.d.ts +13 -0
  476. package/dist/workspace/tools/helpers.d.ts.map +1 -1
  477. package/dist/workspace/tools/write-file.d.ts.map +1 -1
  478. package/dist/workspace/workspace.d.ts +33 -0
  479. package/dist/workspace/workspace.d.ts.map +1 -1
  480. package/package.json +10 -8
  481. package/dist/chunk-2X66GWF5.cjs.map +0 -1
  482. package/dist/chunk-6QBN6MZY.cjs.map +0 -1
  483. package/dist/chunk-7EXW4AAG.js.map +0 -1
  484. package/dist/chunk-7UAJ6LMR.cjs.map +0 -1
  485. package/dist/chunk-BQHWJLXU.js.map +0 -1
  486. package/dist/chunk-DB7U2C5B.cjs.map +0 -1
  487. package/dist/chunk-DFCRXDVK.js.map +0 -1
  488. package/dist/chunk-EAZ6YDCQ.cjs.map +0 -1
  489. package/dist/chunk-HB6T4554.cjs.map +0 -1
  490. package/dist/chunk-IC5OUWKJ.js.map +0 -1
  491. package/dist/chunk-KUXNBWN7.js.map +0 -1
  492. package/dist/chunk-O7PZ4VOO.cjs.map +0 -1
  493. package/dist/chunk-QSHV7GPT.js.map +0 -1
  494. package/dist/chunk-QTAS3HND.cjs.map +0 -1
  495. package/dist/chunk-R4N65TLG.js.map +0 -1
  496. package/dist/chunk-T6GAM3SQ.js.map +0 -1
  497. package/dist/chunk-YQG7NBPR.cjs.map +0 -1
  498. package/dist/chunk-ZSBM2SVU.js.map +0 -1
@@ -0,0 +1,270 @@
1
+ # createScorer
2
+
3
+ Mastra provides a unified `createScorer` factory that allows you to define custom scorers for evaluating input/output pairs. You can use either native JavaScript functions or LLM-based prompt objects for each evaluation step. Custom scorers can be added to Agents and Workflow steps.
4
+
5
+ ## How to Create a Custom Scorer
6
+
7
+ Use the `createScorer` factory to define your scorer with a name, description, and optional judge configuration. Then chain step methods to build your evaluation pipeline. You must provide at least a `generateScore` step.
8
+
9
+ **Prompt object steps** are step configurations expressed as objects with `description` + `createPrompt` (and `outputSchema` for `preprocess`/`analyze`/`generateScore`). These steps invoke the judge LLM. **Function steps** are plain functions and never call the judge.
10
+
11
+ ```typescript
12
+ import { createScorer } from '@mastra/core/evals'
13
+
14
+ const scorer = createScorer({
15
+ id: 'my-custom-scorer',
16
+ name: 'My Custom Scorer', // Optional, defaults to id
17
+ description: 'Evaluates responses based on custom criteria',
18
+ type: 'agent', // Optional: for agent evaluation with automatic typing
19
+ judge: {
20
+ model: myModel,
21
+ instructions: 'You are an expert evaluator...',
22
+ },
23
+ })
24
+ .preprocess({
25
+ /* step config */
26
+ })
27
+ .analyze({
28
+ /* step config */
29
+ })
30
+ .generateScore(({ run, results }) => {
31
+ // Return a number
32
+ })
33
+ .generateReason({
34
+ /* step config */
35
+ })
36
+ ```
37
+
38
+ ## createScorer Options
39
+
40
+ **id:** (`string`): Unique identifier for the scorer. Used as the name if `name` is not provided.
41
+
42
+ **name?:** (`string`): Name of the scorer. Defaults to `id` if not provided.
43
+
44
+ **description:** (`string`): Description of what the scorer does.
45
+
46
+ **judge?:** (`object`): Optional judge configuration for LLM-based steps. See Judge Object section below.
47
+
48
+ **type?:** (`string`): Type specification for input/output. Use 'agent' for automatic agent types. For custom types, use the generic approach instead.
49
+
50
+ This function returns a scorer builder that you can chain step methods onto. See the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer) for details on the `.run()` method and its input/output.
51
+
52
+ ## Judge Object
53
+
54
+ **model:** (`LanguageModel`): The LLM model instance to use for evaluation.
55
+
56
+ **instructions:** (`string`): System prompt/instructions for the LLM.
57
+
58
+ The judge only runs for steps defined as **prompt objects** (`preprocess`, `analyze`, `generateScore`, `generateReason` in prompt mode). If you use function steps only, the judge is never called and there is no LLM output to inspect. In that case, any score/reason must be produced by your functions.
59
+
60
+ When a prompt-object step runs, its structured LLM output is stored in the corresponding result field (`preprocessStepResult`, `analyzeStepResult`, or the value consumed by `calculateScore` in `generateScore`).
61
+
62
+ ## Type Safety
63
+
64
+ You can specify input/output types when creating scorers for better type inference and IntelliSense support:
65
+
66
+ ### Agent Type Shortcut
67
+
68
+ For evaluating agents, use `type: 'agent'` to automatically get the correct types for agent input/output:
69
+
70
+ ```typescript
71
+ import { createScorer } from '@mastra/core/evals'
72
+
73
+ // Agent scorer with automatic typing
74
+ const agentScorer = createScorer({
75
+ id: 'agent-response-quality',
76
+ description: 'Evaluates agent responses',
77
+ type: 'agent', // Automatically provides ScorerRunInputForAgent/ScorerRunOutputForAgent
78
+ })
79
+ .preprocess(({ run }) => {
80
+ // run.input is automatically typed as ScorerRunInputForAgent
81
+ const userMessage = run.input.inputMessages[0]?.content
82
+ return { userMessage }
83
+ })
84
+ .generateScore(({ run, results }) => {
85
+ // run.output is automatically typed as ScorerRunOutputForAgent
86
+ const response = run.output[0]?.content
87
+ return response.length > 10 ? 1.0 : 0.5
88
+ })
89
+ ```
90
+
91
+ ### Custom Types with Generics
92
+
93
+ For custom input/output types, use the generic approach:
94
+
95
+ ```typescript
96
+ import { createScorer } from '@mastra/core/evals'
97
+
98
+ type CustomInput = { query: string; context: string[] }
99
+ type CustomOutput = { answer: string; confidence: number }
100
+
101
+ const customScorer = createScorer<CustomInput, CustomOutput>({
102
+ id: 'custom-scorer',
103
+ description: 'Evaluates custom data',
104
+ }).generateScore(({ run }) => {
105
+ // run.input is typed as CustomInput
106
+ // run.output is typed as CustomOutput
107
+ return run.output.confidence
108
+ })
109
+ ```
110
+
111
+ ### Built-in Agent Types
112
+
113
+ - **`ScorerRunInputForAgent`** - Contains `inputMessages`, `rememberedMessages`, `systemMessages`, and `taggedSystemMessages` for agent evaluation
114
+ - **`ScorerRunOutputForAgent`** - Array of agent response messages
115
+
116
+ Using these types provides autocomplete, compile-time validation, and better documentation for your scoring logic.
117
+
118
+ ## Trace Scoring with Agent Types
119
+
120
+ When you use `type: 'agent'`, your scorer can be added directly to agents and can also score traces from agent interactions. The scorer automatically transforms trace data into the proper agent input/output format:
121
+
122
+ ```typescript
123
+ const agentTraceScorer = createScorer({
124
+ id: 'agent-trace-length',
125
+ description: 'Evaluates agent response length',
126
+ type: 'agent',
127
+ }).generateScore(({ run }) => {
128
+ // Trace data is automatically transformed to agent format
129
+ const userMessages = run.input.inputMessages
130
+ const agentResponse = run.output[0]?.content
131
+
132
+ // Score based on response length
133
+ return agentResponse?.length > 50 ? 0 : 1
134
+ })
135
+
136
+ // Register with Mastra for trace scoring
137
+ const mastra = new Mastra({
138
+ scorers: {
139
+ agentTraceScorer,
140
+ },
141
+ })
142
+ ```
143
+
144
+ ## Step Method Signatures
145
+
146
+ ### preprocess
147
+
148
+ Optional preprocessing step that can extract or transform data before analysis.
149
+
150
+ **Function Mode:** Function: `({ run, results }) => any`
151
+
152
+ **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
153
+
154
+ **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
155
+
156
+ **run.runId:** (`string`): Unique identifier for this scoring run.
157
+
158
+ **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
159
+
160
+ **results:** (`object`): Empty object (no previous steps).
161
+
162
+ Returns: `any`\
163
+ The method can return any value. The returned value will be available to subsequent steps as `preprocessStepResult`.
164
+
165
+ **Prompt Object Mode:**
166
+
167
+ **description:** (`string`): Description of what this preprocessing step does.
168
+
169
+ **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the preprocess step.
170
+
171
+ **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
172
+
173
+ **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
174
+
175
+ ### analyze
176
+
177
+ Optional analysis step that processes the input/output and any preprocessed data.
178
+
179
+ **Function Mode:** Function: `({ run, results }) => any`
180
+
181
+ **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
182
+
183
+ **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
184
+
185
+ **run.runId:** (`string`): Unique identifier for this scoring run.
186
+
187
+ **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
188
+
189
+ **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
190
+
191
+ Returns: `any`\
192
+ The method can return any value. The returned value will be available to subsequent steps as `analyzeStepResult`.
193
+
194
+ **Prompt Object Mode:**
195
+
196
+ **description:** (`string`): Description of what this analysis step does.
197
+
198
+ **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the analyze step.
199
+
200
+ **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
201
+
202
+ **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
203
+
204
+ ### generateScore
205
+
206
+ **Required** step that computes the final numerical score.
207
+
208
+ **Function Mode:** Function: `({ run, results }) => number`
209
+
210
+ **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
211
+
212
+ **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
213
+
214
+ **run.runId:** (`string`): Unique identifier for this scoring run.
215
+
216
+ **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
217
+
218
+ **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
219
+
220
+ **results.analyzeStepResult?:** (`any`): Result from analyze step, if defined (optional).
221
+
222
+ Returns: `number`\
223
+ The method must return a numerical score.
224
+
225
+ **Prompt Object Mode:**
226
+
227
+ **description:** (`string`): Description of what this scoring step does.
228
+
229
+ **outputSchema:** (`ZodSchema`): Zod schema for the expected output of the generateScore step.
230
+
231
+ **createPrompt:** (`function`): Function: ({ run, results }) => string. Returns the prompt for the LLM.
232
+
233
+ **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
234
+
235
+ When using prompt object mode, you must also provide a `calculateScore` function to convert the LLM output to a numerical score:
236
+
237
+ **calculateScore:** (`function`): Function: ({ run, results, analyzeStepResult }) => number. Converts the LLM's structured output into a numerical score.
238
+
239
+ ### generateReason
240
+
241
+ Optional step that provides an explanation for the score.
242
+
243
+ **Function Mode:** Function: `({ run, results, score }) => string`
244
+
245
+ **run.input:** (`any`): Input records provided to the scorer. If the scorer is added to an agent, this will be an array of user messages, e.g. `[{ role: 'user', content: 'hello world' }]`. If the scorer is used in a workflow, this will be the input of the workflow.
246
+
247
+ **run.output:** (`any`): Output record provided to the scorer. For agents, this is usually the agent's response. For workflows, this is the workflow's output.
248
+
249
+ **run.runId:** (`string`): Unique identifier for this scoring run.
250
+
251
+ **run.requestContext?:** (`object`): Request Context from the agent or workflow step being evaluated (optional).
252
+
253
+ **results.preprocessStepResult?:** (`any`): Result from preprocess step, if defined (optional).
254
+
255
+ **results.analyzeStepResult?:** (`any`): Result from analyze step, if defined (optional).
256
+
257
+ **score:** (`number`): Score computed by the generateScore step.
258
+
259
+ Returns: `string`\
260
+ The method must return a string explaining the score.
261
+
262
+ **Prompt Object Mode:**
263
+
264
+ **description:** (`string`): Description of what this reasoning step does.
265
+
266
+ **createPrompt:** (`function`): Function: ({ run, results, score }) => string. Returns the prompt for the LLM.
267
+
268
+ **judge?:** (`object`): (Optional) LLM judge for this step (can override main judge). See Judge Object section.
269
+
270
+ All step functions can be async.
@@ -0,0 +1,114 @@
1
+ # Faithfulness Scorer
2
+
3
+ The `createFaithfulnessScorer()` function evaluates how factually accurate an LLM's output is compared to the provided context. It extracts claims from the output and verifies them against the context, which makes it well suited to measuring the reliability of RAG pipeline responses.
4
+
5
+ ## Parameters
6
+
7
+ The `createFaithfulnessScorer()` function accepts a single options object with the following properties:
8
+
9
+ **model:** (`LanguageModel`): Configuration for the model used to evaluate faithfulness.
10
+
11
+ **context:** (`string[]`): Array of context chunks against which the output's claims will be verified.
12
+
13
+ **scale:** (`number`): The maximum score value. The final score will be normalized to this scale. (Default: `1`)
14
+
15
+ This function returns an instance of the MastraScorer class. The `.run()` method accepts the same input as other scorers (see the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer)), but the return value includes LLM-specific fields as documented below.
16
+
17
+ ## .run() Returns
18
+
19
+ **runId:** (`string`): The id of the run (optional).
20
+
21
+ **preprocessStepResult:** (`string[]`): Array of extracted claims from the output.
22
+
23
+ **preprocessPrompt:** (`string`): The prompt sent to the LLM for the preprocess step (optional).
24
+
25
+ **analyzeStepResult:** (`object`): Object with verdicts: { verdicts: Array<{ verdict: 'yes' | 'no' | 'unsure', reason: string }> }
26
+
27
+ **analyzePrompt:** (`string`): The prompt sent to the LLM for the analyze step (optional).
28
+
29
+ **score:** (`number`): A score between 0 and the configured scale, representing the proportion of claims that are supported by the context.
30
+
31
+ **reason:** (`string`): A detailed explanation of the score, including which claims were supported, contradicted, or marked as unsure.
32
+
33
+ **generateReasonPrompt:** (`string`): The prompt sent to the LLM for the generateReason step (optional).
34
+
35
+ ## Scoring Details
36
+
37
+ The scorer evaluates faithfulness through claim verification against provided context.
38
+
39
+ ### Scoring Process
40
+
41
+ 1. Analyzes claims and context:
42
+
43
+ - Extracts all claims (factual and speculative)
44
+
45
+ - Verifies each claim against context
46
+
47
+ - Assigns one of three verdicts:
48
+
49
+ - "yes" - claim supported by context
50
+ - "no" - claim contradicts context
51
+ - "unsure" - claim unverifiable
52
+
53
+ 2. Calculates faithfulness score:
54
+
55
+ - Counts supported claims
56
+ - Divides by total claims
57
+ - Scales to configured range
58
+
59
+ Final score: `(supported_claims / total_claims) * scale`
60
+
61
+ ### Score interpretation
62
+
63
+ A faithfulness score between 0 and 1:
64
+
65
+ - **1.0**: All claims are accurate and directly supported by the context.
66
+ - **0.7–0.9**: Most claims are correct, with minor additions or omissions.
67
+ - **0.4–0.6**: Some claims are supported, but others are unverifiable.
68
+ - **0.1–0.3**: Most of the content is inaccurate or unsupported.
69
+ - **0.0**: All claims are false or contradict the context.
70
+
71
+ ## Example
72
+
73
+ Evaluate agent responses for faithfulness to provided context:
74
+
75
+ ```typescript
76
+ import { runEvals } from '@mastra/core/evals'
77
+ import { createFaithfulnessScorer } from '@mastra/evals/scorers/prebuilt'
78
+ import { myAgent } from './agent'
79
+
80
+ // Context is typically populated from agent tool calls or RAG retrieval
81
+ const scorer = createFaithfulnessScorer({
82
+ model: 'openai/gpt-4o',
83
+ })
84
+
85
+ const result = await runEvals({
86
+ data: [
87
+ {
88
+ input: 'Tell me about the Tesla Model 3.',
89
+ },
90
+ {
91
+ input: 'What are the key features of this electric vehicle?',
92
+ },
93
+ ],
94
+ scorers: [scorer],
95
+ target: myAgent,
96
+ onItemComplete: ({ scorerResults }) => {
97
+ console.log({
98
+ score: scorerResults[scorer.id].score,
99
+ reason: scorerResults[scorer.id].reason,
100
+ })
101
+ },
102
+ })
103
+
104
+ console.log(result.scores)
105
+ ```
106
+
107
+ For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
108
+
109
+ To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
110
+
111
+ ## Related
112
+
113
+ - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy)
114
+ - [Hallucination Scorer](https://mastra.ai/reference/evals/hallucination)
@@ -0,0 +1,213 @@
1
+ # Hallucination Scorer
2
+
3
+ The `createHallucinationScorer()` function evaluates whether an LLM generates factually correct information by comparing its output against the provided context. This scorer measures hallucination by identifying claims in the output that directly contradict the context or are not supported by it.
4
+
5
+ ## Parameters
6
+
7
+ The `createHallucinationScorer()` function accepts a single options object with the following properties:
8
+
9
+ **model:** (`LanguageModel`): Configuration for the model used to evaluate hallucination.
10
+
11
+ **options.scale:** (`number`): Maximum score value. (Default: `1`)
12
+
13
+ **options.context:** (`string[]`): Static context strings to use as ground truth for hallucination detection.
14
+
15
+ **options.getContext:** (`(params: GetContextParams) => string[] | Promise<string[]>`): A hook to dynamically resolve context at runtime. Takes priority over static context. Useful for live scoring where context (like tool results) is only available when the scorer runs.
16
+
17
+ This function returns an instance of the MastraScorer class. The `.run()` method accepts the same input as other scorers (see the [MastraScorer reference](https://mastra.ai/reference/evals/mastra-scorer)), but the return value includes LLM-specific fields as documented below.
18
+
19
+ ### GetContextParams
20
+
21
+ The `getContext` hook receives the following parameters:
22
+
23
+ **run:** (`GetContextRun`): The scorer run containing input, output, runId, requestContext, and tracingContext.
24
+
25
+ **results:** (`Record<string, any>`): Accumulated results from previous steps (e.g., preprocessStepResult with extracted claims).
26
+
27
+ **score:** (`number`): The computed score. Only present when called from the generateReason step.
28
+
29
+ **step:** (`'analyze' | 'generateReason'`): Which step is calling the hook. Useful for caching context between calls.
30
+
31
+ ## .run() Returns
32
+
33
+ **runId:** (`string`): The id of the run (optional).
34
+
35
+ **preprocessStepResult:** (`object`): Object with extracted claims: { claims: string[] }
36
+
37
+ **preprocessPrompt:** (`string`): The prompt sent to the LLM for the preprocess step (optional).
38
+
39
+ **analyzeStepResult:** (`object`): Object with verdicts: { verdicts: Array<{ statement: string, verdict: 'yes' | 'no', reason: string }> }
40
+
41
+ **analyzePrompt:** (`string`): The prompt sent to the LLM for the analyze step (optional).
42
+
43
+ **score:** (`number`): Hallucination score (0 to scale, default 0-1).
44
+
45
+ **reason:** (`string`): Detailed explanation of the score and identified contradictions.
46
+
47
+ **generateReasonPrompt:** (`string`): The prompt sent to the LLM for the generateReason step (optional).
48
+
49
+ ## Scoring Details
50
+
51
+ The scorer evaluates hallucination through contradiction detection and unsupported claim analysis.
52
+
53
+ ### Scoring Process
54
+
55
+ 1. Analyzes factual content:
56
+
57
+ - Extracts statements from context
58
+ - Identifies numerical values and dates
59
+ - Maps statement relationships
60
+
61
+ 2. Analyzes output for hallucinations:
62
+
63
+ - Compares against context statements
64
+ - Marks direct conflicts as hallucinations
65
+ - Identifies unsupported claims as hallucinations
66
+ - Evaluates numerical accuracy
67
+ - Considers approximation context
68
+
69
+ 3. Calculates hallucination score:
70
+
71
+ - Counts hallucinated statements (contradictions and unsupported claims)
72
+ - Divides by total statements
73
+ - Scales to configured range
74
+
75
+ Final score: `(hallucinated_statements / total_statements) * scale`
76
+
77
+ ### Important Considerations
78
+
79
+ - Claims not present in context are treated as hallucinations
80
+
81
+ - Subjective claims are hallucinations unless explicitly supported
82
+
83
+ - Speculative language ("might", "possibly") about facts IN context is allowed
84
+
85
+ - Speculative language about facts NOT in context is treated as hallucination
86
+
87
+ - Empty outputs result in zero hallucinations
88
+
89
+ - Numerical evaluation considers:
90
+
91
+ - Scale-appropriate precision
92
+ - Contextual approximations
93
+ - Explicit precision indicators
94
+
95
+ ### Score interpretation
96
+
97
+ A hallucination score between 0 and 1:
98
+
99
+ - **0.0**: No hallucination — all claims match the context.
100
+ - **0.3–0.4**: Low hallucination — a few contradictions.
101
+ - **0.5–0.6**: Mixed hallucination — several contradictions.
102
+ - **0.7–0.8**: High hallucination — many contradictions.
103
+ - **0.9–1.0**: Complete hallucination — most or all claims contradict the context.
104
+
105
+ **Note:** The score represents the degree of hallucination — lower scores indicate better factual alignment with the provided context.
106
+
107
+ ## Examples
108
+
109
+ ### Static Context
110
+
111
+ Use static context when you have known ground truth to compare against:
112
+
113
+ ```typescript
114
+ import { createHallucinationScorer } from '@mastra/evals/scorers/prebuilt'
115
+
116
+ const scorer = createHallucinationScorer({
117
+ model: 'openai/gpt-4o',
118
+ options: {
119
+ context: [
120
+ 'The first iPhone was announced on January 9, 2007.',
121
+ 'It was released on June 29, 2007.',
122
+ 'Steve Jobs introduced it at Macworld.',
123
+ ],
124
+ },
125
+ })
126
+ ```
127
+
128
+ ### Dynamic Context with getContext
129
+
130
+ Use `getContext` for live scoring scenarios where context comes from tool results:
131
+
132
+ ```typescript
133
+ import { createHallucinationScorer } from '@mastra/evals/scorers/prebuilt'
134
+ import { extractToolResults } from '@mastra/evals/scorers'
135
+
136
+ const scorer = createHallucinationScorer({
137
+ model: 'openai/gpt-4o',
138
+ options: {
139
+ getContext: ({ run, step }) => {
140
+ // Extract tool results as context
141
+ const toolResults = extractToolResults(run.output)
142
+ return toolResults.map(t => JSON.stringify({ tool: t.toolName, result: t.result }))
143
+ },
144
+ },
145
+ })
146
+ ```
147
+
148
+ ### Live Scoring with Agent
149
+
150
+ Attach the scorer to an agent for live evaluation:
151
+
152
+ ```typescript
153
+ import { Agent } from '@mastra/core/agent'
154
+ import { createHallucinationScorer } from '@mastra/evals/scorers/prebuilt'
155
+ import { extractToolResults } from '@mastra/evals/scorers'
156
+
157
+ const hallucinationScorer = createHallucinationScorer({
158
+ model: 'openai/gpt-4o',
159
+ options: {
160
+ getContext: ({ run }) => {
161
+ const toolResults = extractToolResults(run.output)
162
+ return toolResults.map(t => JSON.stringify({ tool: t.toolName, result: t.result }))
163
+ },
164
+ },
165
+ })
166
+
167
+ const agent = new Agent({
168
+ name: 'my-agent',
169
+ model: 'openai/gpt-4o',
170
+ instructions: 'You are a helpful assistant.',
171
+ evals: {
172
+ scorers: [hallucinationScorer],
173
+ },
174
+ })
175
+ ```
176
+
177
+ ### Batch Evaluation with runEvals
178
+
179
+ ```typescript
180
+ import { runEvals } from '@mastra/core/evals'
181
+ import { createHallucinationScorer } from '@mastra/evals/scorers/prebuilt'
182
+ import { myAgent } from './agent'
183
+
184
+ const scorer = createHallucinationScorer({
185
+ model: 'openai/gpt-4o',
186
+ options: {
187
+ context: ['Known fact 1', 'Known fact 2'],
188
+ },
189
+ })
190
+
191
+ const result = await runEvals({
192
+ data: [{ input: 'Tell me about topic A' }, { input: 'Tell me about topic B' }],
193
+ scorers: [scorer],
194
+ target: myAgent,
195
+ onItemComplete: ({ scorerResults }) => {
196
+ console.log({
197
+ score: scorerResults[scorer.id].score,
198
+ reason: scorerResults[scorer.id].reason,
199
+ })
200
+ },
201
+ })
202
+
203
+ console.log(result.scores)
204
+ ```
205
+
206
+ For more details on `runEvals`, see the [runEvals reference](https://mastra.ai/reference/evals/run-evals).
207
+
208
+ To add this scorer to an agent, see the [Scorers overview](https://mastra.ai/docs/evals/overview) guide.
209
+
210
+ ## Related
211
+
212
+ - [Faithfulness Scorer](https://mastra.ai/reference/evals/faithfulness)
213
+ - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy)