@mastra/mcp-docs-server 1.1.4 → 1.1.5-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (547)
  1. package/CHANGELOG.md +7 -0
  2. package/package.json +3 -3
  3. package/.docs/docs/agents/adding-voice.md +0 -353
  4. package/.docs/docs/agents/agent-approval.md +0 -377
  5. package/.docs/docs/agents/agent-memory.md +0 -212
  6. package/.docs/docs/agents/guardrails.md +0 -382
  7. package/.docs/docs/agents/network-approval.md +0 -275
  8. package/.docs/docs/agents/networks.md +0 -290
  9. package/.docs/docs/agents/overview.md +0 -309
  10. package/.docs/docs/agents/processors.md +0 -632
  11. package/.docs/docs/agents/structured-output.md +0 -271
  12. package/.docs/docs/agents/using-tools.md +0 -214
  13. package/.docs/docs/build-with-ai/mcp-docs-server.md +0 -241
  14. package/.docs/docs/build-with-ai/skills.md +0 -35
  15. package/.docs/docs/community/contributing-templates.md +0 -3
  16. package/.docs/docs/community/discord.md +0 -9
  17. package/.docs/docs/community/licensing.md +0 -66
  18. package/.docs/docs/deployment/cloud-providers.md +0 -15
  19. package/.docs/docs/deployment/mastra-server.md +0 -122
  20. package/.docs/docs/deployment/monorepo.md +0 -142
  21. package/.docs/docs/deployment/overview.md +0 -62
  22. package/.docs/docs/deployment/studio.md +0 -234
  23. package/.docs/docs/deployment/web-framework.md +0 -52
  24. package/.docs/docs/deployment/workflow-runners.md +0 -9
  25. package/.docs/docs/evals/built-in-scorers.md +0 -47
  26. package/.docs/docs/evals/custom-scorers.md +0 -519
  27. package/.docs/docs/evals/overview.md +0 -146
  28. package/.docs/docs/evals/running-in-ci.md +0 -106
  29. package/.docs/docs/getting-started/build-with-ai.md +0 -68
  30. package/.docs/docs/getting-started/manual-install.md +0 -226
  31. package/.docs/docs/getting-started/project-structure.md +0 -60
  32. package/.docs/docs/getting-started/start.md +0 -28
  33. package/.docs/docs/getting-started/studio.md +0 -101
  34. package/.docs/docs/index.md +0 -43
  35. package/.docs/docs/mastra-cloud/deployment.md +0 -77
  36. package/.docs/docs/mastra-cloud/observability.md +0 -38
  37. package/.docs/docs/mastra-cloud/overview.md +0 -23
  38. package/.docs/docs/mastra-cloud/setup.md +0 -42
  39. package/.docs/docs/mastra-cloud/studio.md +0 -24
  40. package/.docs/docs/mcp/overview.md +0 -370
  41. package/.docs/docs/mcp/publishing-mcp-server.md +0 -95
  42. package/.docs/docs/memory/memory-processors.md +0 -316
  43. package/.docs/docs/memory/message-history.md +0 -260
  44. package/.docs/docs/memory/observational-memory.md +0 -246
  45. package/.docs/docs/memory/overview.md +0 -45
  46. package/.docs/docs/memory/semantic-recall.md +0 -272
  47. package/.docs/docs/memory/storage.md +0 -261
  48. package/.docs/docs/memory/working-memory.md +0 -400
  49. package/.docs/docs/observability/datasets/overview.md +0 -188
  50. package/.docs/docs/observability/datasets/running-experiments.md +0 -266
  51. package/.docs/docs/observability/logging.md +0 -99
  52. package/.docs/docs/observability/overview.md +0 -70
  53. package/.docs/docs/observability/tracing/bridges/otel.md +0 -209
  54. package/.docs/docs/observability/tracing/exporters/arize.md +0 -274
  55. package/.docs/docs/observability/tracing/exporters/braintrust.md +0 -111
  56. package/.docs/docs/observability/tracing/exporters/cloud.md +0 -129
  57. package/.docs/docs/observability/tracing/exporters/datadog.md +0 -187
  58. package/.docs/docs/observability/tracing/exporters/default.md +0 -211
  59. package/.docs/docs/observability/tracing/exporters/laminar.md +0 -100
  60. package/.docs/docs/observability/tracing/exporters/langfuse.md +0 -217
  61. package/.docs/docs/observability/tracing/exporters/langsmith.md +0 -202
  62. package/.docs/docs/observability/tracing/exporters/otel.md +0 -479
  63. package/.docs/docs/observability/tracing/exporters/posthog.md +0 -148
  64. package/.docs/docs/observability/tracing/exporters/sentry.md +0 -208
  65. package/.docs/docs/observability/tracing/overview.md +0 -1114
  66. package/.docs/docs/observability/tracing/processors/sensitive-data-filter.md +0 -303
  67. package/.docs/docs/rag/chunking-and-embedding.md +0 -183
  68. package/.docs/docs/rag/graph-rag.md +0 -215
  69. package/.docs/docs/rag/overview.md +0 -72
  70. package/.docs/docs/rag/retrieval.md +0 -521
  71. package/.docs/docs/rag/vector-databases.md +0 -648
  72. package/.docs/docs/server/auth/auth0.md +0 -222
  73. package/.docs/docs/server/auth/better-auth.md +0 -203
  74. package/.docs/docs/server/auth/clerk.md +0 -132
  75. package/.docs/docs/server/auth/composite-auth.md +0 -234
  76. package/.docs/docs/server/auth/custom-auth-provider.md +0 -513
  77. package/.docs/docs/server/auth/firebase.md +0 -272
  78. package/.docs/docs/server/auth/jwt.md +0 -110
  79. package/.docs/docs/server/auth/simple-auth.md +0 -178
  80. package/.docs/docs/server/auth/supabase.md +0 -117
  81. package/.docs/docs/server/auth/workos.md +0 -190
  82. package/.docs/docs/server/auth.md +0 -38
  83. package/.docs/docs/server/custom-adapters.md +0 -374
  84. package/.docs/docs/server/custom-api-routes.md +0 -267
  85. package/.docs/docs/server/mastra-client.md +0 -243
  86. package/.docs/docs/server/mastra-server.md +0 -71
  87. package/.docs/docs/server/middleware.md +0 -228
  88. package/.docs/docs/server/request-context.md +0 -478
  89. package/.docs/docs/server/server-adapters.md +0 -547
  90. package/.docs/docs/streaming/events.md +0 -247
  91. package/.docs/docs/streaming/overview.md +0 -181
  92. package/.docs/docs/streaming/tool-streaming.md +0 -178
  93. package/.docs/docs/streaming/workflow-streaming.md +0 -109
  94. package/.docs/docs/voice/overview.md +0 -979
  95. package/.docs/docs/voice/speech-to-speech.md +0 -103
  96. package/.docs/docs/voice/speech-to-text.md +0 -80
  97. package/.docs/docs/voice/text-to-speech.md +0 -84
  98. package/.docs/docs/workflows/agents-and-tools.md +0 -170
  99. package/.docs/docs/workflows/control-flow.md +0 -823
  100. package/.docs/docs/workflows/error-handling.md +0 -360
  101. package/.docs/docs/workflows/human-in-the-loop.md +0 -213
  102. package/.docs/docs/workflows/overview.md +0 -372
  103. package/.docs/docs/workflows/snapshots.md +0 -238
  104. package/.docs/docs/workflows/suspend-and-resume.md +0 -205
  105. package/.docs/docs/workflows/time-travel.md +0 -309
  106. package/.docs/docs/workflows/workflow-state.md +0 -181
  107. package/.docs/docs/workspace/filesystem.md +0 -162
  108. package/.docs/docs/workspace/overview.md +0 -239
  109. package/.docs/docs/workspace/sandbox.md +0 -63
  110. package/.docs/docs/workspace/search.md +0 -219
  111. package/.docs/docs/workspace/skills.md +0 -126
  112. package/.docs/guides/agent-frameworks/ai-sdk.md +0 -140
  113. package/.docs/guides/build-your-ui/ai-sdk-ui.md +0 -1463
  114. package/.docs/guides/build-your-ui/assistant-ui.md +0 -156
  115. package/.docs/guides/build-your-ui/copilotkit.md +0 -292
  116. package/.docs/guides/deployment/amazon-ec2.md +0 -130
  117. package/.docs/guides/deployment/aws-lambda.md +0 -248
  118. package/.docs/guides/deployment/azure-app-services.md +0 -114
  119. package/.docs/guides/deployment/cloudflare.md +0 -99
  120. package/.docs/guides/deployment/digital-ocean.md +0 -168
  121. package/.docs/guides/deployment/inngest.md +0 -685
  122. package/.docs/guides/deployment/netlify.md +0 -77
  123. package/.docs/guides/deployment/vercel.md +0 -101
  124. package/.docs/guides/getting-started/astro.md +0 -408
  125. package/.docs/guides/getting-started/electron.md +0 -504
  126. package/.docs/guides/getting-started/express.md +0 -251
  127. package/.docs/guides/getting-started/hono.md +0 -191
  128. package/.docs/guides/getting-started/next-js.md +0 -355
  129. package/.docs/guides/getting-started/nuxt.md +0 -476
  130. package/.docs/guides/getting-started/quickstart.md +0 -67
  131. package/.docs/guides/getting-started/sveltekit.md +0 -300
  132. package/.docs/guides/getting-started/vite-react.md +0 -439
  133. package/.docs/guides/guide/ai-recruiter.md +0 -227
  134. package/.docs/guides/guide/chef-michel.md +0 -215
  135. package/.docs/guides/guide/code-review-bot.md +0 -221
  136. package/.docs/guides/guide/dev-assistant.md +0 -304
  137. package/.docs/guides/guide/docs-manager.md +0 -238
  138. package/.docs/guides/guide/github-actions-pr-description.md +0 -236
  139. package/.docs/guides/guide/notes-mcp-server.md +0 -425
  140. package/.docs/guides/guide/research-assistant.md +0 -349
  141. package/.docs/guides/guide/stock-agent.md +0 -134
  142. package/.docs/guides/guide/web-search.md +0 -326
  143. package/.docs/guides/guide/whatsapp-chat-bot.md +0 -416
  144. package/.docs/guides/index.md +0 -3
  145. package/.docs/guides/migrations/agentnetwork.md +0 -101
  146. package/.docs/guides/migrations/ai-sdk-v4-to-v5.md +0 -112
  147. package/.docs/guides/migrations/upgrade-to-v1/agent.md +0 -404
  148. package/.docs/guides/migrations/upgrade-to-v1/cli.md +0 -57
  149. package/.docs/guides/migrations/upgrade-to-v1/client.md +0 -337
  150. package/.docs/guides/migrations/upgrade-to-v1/deployment.md +0 -37
  151. package/.docs/guides/migrations/upgrade-to-v1/evals.md +0 -239
  152. package/.docs/guides/migrations/upgrade-to-v1/mastra.md +0 -143
  153. package/.docs/guides/migrations/upgrade-to-v1/mcp.md +0 -97
  154. package/.docs/guides/migrations/upgrade-to-v1/memory.md +0 -285
  155. package/.docs/guides/migrations/upgrade-to-v1/overview.md +0 -119
  156. package/.docs/guides/migrations/upgrade-to-v1/processors.md +0 -68
  157. package/.docs/guides/migrations/upgrade-to-v1/rag.md +0 -42
  158. package/.docs/guides/migrations/upgrade-to-v1/storage.md +0 -553
  159. package/.docs/guides/migrations/upgrade-to-v1/tools.md +0 -180
  160. package/.docs/guides/migrations/upgrade-to-v1/tracing.md +0 -417
  161. package/.docs/guides/migrations/upgrade-to-v1/vectors.md +0 -87
  162. package/.docs/guides/migrations/upgrade-to-v1/voice.md +0 -30
  163. package/.docs/guides/migrations/upgrade-to-v1/workflows.md +0 -341
  164. package/.docs/guides/migrations/vnext-to-standard-apis.md +0 -364
  165. package/.docs/models/embeddings.md +0 -161
  166. package/.docs/models/gateways/azure-openai.md +0 -128
  167. package/.docs/models/gateways/custom-gateways.md +0 -545
  168. package/.docs/models/gateways/netlify.md +0 -88
  169. package/.docs/models/gateways/openrouter.md +0 -219
  170. package/.docs/models/gateways/vercel.md +0 -225
  171. package/.docs/models/gateways.md +0 -14
  172. package/.docs/models/index.md +0 -286
  173. package/.docs/models/providers/302ai.md +0 -134
  174. package/.docs/models/providers/abacus.md +0 -125
  175. package/.docs/models/providers/agentrouter.md +0 -90
  176. package/.docs/models/providers/aihubmix.md +0 -107
  177. package/.docs/models/providers/alibaba-cn.md +0 -135
  178. package/.docs/models/providers/alibaba.md +0 -111
  179. package/.docs/models/providers/amazon-bedrock.md +0 -33
  180. package/.docs/models/providers/anthropic.md +0 -153
  181. package/.docs/models/providers/azure.md +0 -33
  182. package/.docs/models/providers/bailing.md +0 -72
  183. package/.docs/models/providers/baseten.md +0 -77
  184. package/.docs/models/providers/berget.md +0 -78
  185. package/.docs/models/providers/cerebras.md +0 -101
  186. package/.docs/models/providers/chutes.md +0 -136
  187. package/.docs/models/providers/cloudflare-ai-gateway.md +0 -33
  188. package/.docs/models/providers/cloudflare-workers-ai.md +0 -109
  189. package/.docs/models/providers/cohere.md +0 -33
  190. package/.docs/models/providers/cortecs.md +0 -91
  191. package/.docs/models/providers/deepinfra.md +0 -112
  192. package/.docs/models/providers/deepseek.md +0 -88
  193. package/.docs/models/providers/fastrouter.md +0 -84
  194. package/.docs/models/providers/fireworks-ai.md +0 -89
  195. package/.docs/models/providers/firmware.md +0 -85
  196. package/.docs/models/providers/friendli.md +0 -78
  197. package/.docs/models/providers/github-models.md +0 -125
  198. package/.docs/models/providers/google-vertex.md +0 -33
  199. package/.docs/models/providers/google.md +0 -159
  200. package/.docs/models/providers/groq.md +0 -107
  201. package/.docs/models/providers/helicone.md +0 -161
  202. package/.docs/models/providers/huggingface.md +0 -90
  203. package/.docs/models/providers/iflowcn.md +0 -84
  204. package/.docs/models/providers/inception.md +0 -72
  205. package/.docs/models/providers/inference.md +0 -79
  206. package/.docs/models/providers/io-intelligence.md +0 -87
  207. package/.docs/models/providers/io-net.md +0 -87
  208. package/.docs/models/providers/jiekou.md +0 -131
  209. package/.docs/models/providers/kilo.md +0 -333
  210. package/.docs/models/providers/kimi-for-coding.md +0 -100
  211. package/.docs/models/providers/kuae-cloud-coding-plan.md +0 -71
  212. package/.docs/models/providers/llama.md +0 -77
  213. package/.docs/models/providers/lmstudio.md +0 -73
  214. package/.docs/models/providers/lucidquery.md +0 -72
  215. package/.docs/models/providers/minimax-cn-coding-plan.md +0 -102
  216. package/.docs/models/providers/minimax-cn.md +0 -102
  217. package/.docs/models/providers/minimax-coding-plan.md +0 -102
  218. package/.docs/models/providers/minimax.md +0 -104
  219. package/.docs/models/providers/mistral.md +0 -124
  220. package/.docs/models/providers/moark.md +0 -72
  221. package/.docs/models/providers/modelscope.md +0 -77
  222. package/.docs/models/providers/moonshotai-cn.md +0 -76
  223. package/.docs/models/providers/moonshotai.md +0 -76
  224. package/.docs/models/providers/morph.md +0 -73
  225. package/.docs/models/providers/nano-gpt.md +0 -103
  226. package/.docs/models/providers/nebius.md +0 -116
  227. package/.docs/models/providers/nova.md +0 -72
  228. package/.docs/models/providers/novita-ai.md +0 -154
  229. package/.docs/models/providers/nvidia.md +0 -141
  230. package/.docs/models/providers/ollama-cloud.md +0 -103
  231. package/.docs/models/providers/ollama.md +0 -33
  232. package/.docs/models/providers/openai.md +0 -193
  233. package/.docs/models/providers/opencode.md +0 -100
  234. package/.docs/models/providers/ovhcloud.md +0 -83
  235. package/.docs/models/providers/perplexity.md +0 -100
  236. package/.docs/models/providers/poe.md +0 -183
  237. package/.docs/models/providers/privatemode-ai.md +0 -75
  238. package/.docs/models/providers/requesty.md +0 -90
  239. package/.docs/models/providers/scaleway.md +0 -84
  240. package/.docs/models/providers/siliconflow-cn.md +0 -138
  241. package/.docs/models/providers/siliconflow.md +0 -140
  242. package/.docs/models/providers/stackit.md +0 -78
  243. package/.docs/models/providers/stepfun.md +0 -73
  244. package/.docs/models/providers/submodel.md +0 -79
  245. package/.docs/models/providers/synthetic.md +0 -96
  246. package/.docs/models/providers/togetherai.md +0 -115
  247. package/.docs/models/providers/upstage.md +0 -73
  248. package/.docs/models/providers/venice.md +0 -95
  249. package/.docs/models/providers/vivgrid.md +0 -106
  250. package/.docs/models/providers/vultr.md +0 -75
  251. package/.docs/models/providers/wandb.md +0 -80
  252. package/.docs/models/providers/xai.md +0 -141
  253. package/.docs/models/providers/xiaomi.md +0 -71
  254. package/.docs/models/providers/zai-coding-plan.md +0 -80
  255. package/.docs/models/providers/zai.md +0 -79
  256. package/.docs/models/providers/zenmux.md +0 -161
  257. package/.docs/models/providers/zhipuai-coding-plan.md +0 -79
  258. package/.docs/models/providers/zhipuai.md +0 -79
  259. package/.docs/models/providers.md +0 -81
  260. package/.docs/reference/agents/agent.md +0 -142
  261. package/.docs/reference/agents/generate.md +0 -174
  262. package/.docs/reference/agents/generateLegacy.md +0 -176
  263. package/.docs/reference/agents/getDefaultGenerateOptions.md +0 -36
  264. package/.docs/reference/agents/getDefaultOptions.md +0 -34
  265. package/.docs/reference/agents/getDefaultStreamOptions.md +0 -36
  266. package/.docs/reference/agents/getDescription.md +0 -21
  267. package/.docs/reference/agents/getInstructions.md +0 -34
  268. package/.docs/reference/agents/getLLM.md +0 -37
  269. package/.docs/reference/agents/getMemory.md +0 -34
  270. package/.docs/reference/agents/getModel.md +0 -34
  271. package/.docs/reference/agents/getTools.md +0 -29
  272. package/.docs/reference/agents/getVoice.md +0 -34
  273. package/.docs/reference/agents/listAgents.md +0 -35
  274. package/.docs/reference/agents/listScorers.md +0 -34
  275. package/.docs/reference/agents/listTools.md +0 -34
  276. package/.docs/reference/agents/listWorkflows.md +0 -34
  277. package/.docs/reference/agents/network.md +0 -134
  278. package/.docs/reference/ai-sdk/chat-route.md +0 -82
  279. package/.docs/reference/ai-sdk/handle-chat-stream.md +0 -53
  280. package/.docs/reference/ai-sdk/handle-network-stream.md +0 -37
  281. package/.docs/reference/ai-sdk/handle-workflow-stream.md +0 -55
  282. package/.docs/reference/ai-sdk/network-route.md +0 -74
  283. package/.docs/reference/ai-sdk/to-ai-sdk-stream.md +0 -232
  284. package/.docs/reference/ai-sdk/to-ai-sdk-v4-messages.md +0 -79
  285. package/.docs/reference/ai-sdk/to-ai-sdk-v5-messages.md +0 -73
  286. package/.docs/reference/ai-sdk/with-mastra.md +0 -59
  287. package/.docs/reference/ai-sdk/workflow-route.md +0 -79
  288. package/.docs/reference/auth/auth0.md +0 -73
  289. package/.docs/reference/auth/better-auth.md +0 -71
  290. package/.docs/reference/auth/clerk.md +0 -36
  291. package/.docs/reference/auth/firebase.md +0 -80
  292. package/.docs/reference/auth/jwt.md +0 -26
  293. package/.docs/reference/auth/supabase.md +0 -33
  294. package/.docs/reference/auth/workos.md +0 -84
  295. package/.docs/reference/cli/create-mastra.md +0 -137
  296. package/.docs/reference/cli/mastra.md +0 -336
  297. package/.docs/reference/client-js/agents.md +0 -438
  298. package/.docs/reference/client-js/error-handling.md +0 -16
  299. package/.docs/reference/client-js/logs.md +0 -24
  300. package/.docs/reference/client-js/mastra-client.md +0 -63
  301. package/.docs/reference/client-js/memory.md +0 -225
  302. package/.docs/reference/client-js/observability.md +0 -72
  303. package/.docs/reference/client-js/telemetry.md +0 -20
  304. package/.docs/reference/client-js/tools.md +0 -44
  305. package/.docs/reference/client-js/vectors.md +0 -79
  306. package/.docs/reference/client-js/workflows.md +0 -199
  307. package/.docs/reference/configuration.md +0 -749
  308. package/.docs/reference/core/addGateway.md +0 -42
  309. package/.docs/reference/core/getAgent.md +0 -21
  310. package/.docs/reference/core/getAgentById.md +0 -21
  311. package/.docs/reference/core/getDeployer.md +0 -22
  312. package/.docs/reference/core/getGateway.md +0 -38
  313. package/.docs/reference/core/getGatewayById.md +0 -41
  314. package/.docs/reference/core/getLogger.md +0 -22
  315. package/.docs/reference/core/getMCPServer.md +0 -45
  316. package/.docs/reference/core/getMCPServerById.md +0 -53
  317. package/.docs/reference/core/getMemory.md +0 -50
  318. package/.docs/reference/core/getScorer.md +0 -54
  319. package/.docs/reference/core/getScorerById.md +0 -54
  320. package/.docs/reference/core/getServer.md +0 -22
  321. package/.docs/reference/core/getStorage.md +0 -22
  322. package/.docs/reference/core/getStoredAgentById.md +0 -89
  323. package/.docs/reference/core/getTelemetry.md +0 -22
  324. package/.docs/reference/core/getVector.md +0 -22
  325. package/.docs/reference/core/getWorkflow.md +0 -40
  326. package/.docs/reference/core/listAgents.md +0 -21
  327. package/.docs/reference/core/listGateways.md +0 -40
  328. package/.docs/reference/core/listLogs.md +0 -38
  329. package/.docs/reference/core/listLogsByRunId.md +0 -36
  330. package/.docs/reference/core/listMCPServers.md +0 -51
  331. package/.docs/reference/core/listMemory.md +0 -56
  332. package/.docs/reference/core/listScorers.md +0 -29
  333. package/.docs/reference/core/listStoredAgents.md +0 -93
  334. package/.docs/reference/core/listVectors.md +0 -22
  335. package/.docs/reference/core/listWorkflows.md +0 -21
  336. package/.docs/reference/core/mastra-class.md +0 -66
  337. package/.docs/reference/core/mastra-model-gateway.md +0 -153
  338. package/.docs/reference/core/setLogger.md +0 -26
  339. package/.docs/reference/core/setStorage.md +0 -27
  340. package/.docs/reference/datasets/addItem.md +0 -35
  341. package/.docs/reference/datasets/addItems.md +0 -33
  342. package/.docs/reference/datasets/compareExperiments.md +0 -48
  343. package/.docs/reference/datasets/create.md +0 -49
  344. package/.docs/reference/datasets/dataset.md +0 -78
  345. package/.docs/reference/datasets/datasets-manager.md +0 -84
  346. package/.docs/reference/datasets/delete.md +0 -23
  347. package/.docs/reference/datasets/deleteExperiment.md +0 -25
  348. package/.docs/reference/datasets/deleteItem.md +0 -25
  349. package/.docs/reference/datasets/deleteItems.md +0 -27
  350. package/.docs/reference/datasets/get.md +0 -29
  351. package/.docs/reference/datasets/getDetails.md +0 -45
  352. package/.docs/reference/datasets/getExperiment.md +0 -28
  353. package/.docs/reference/datasets/getItem.md +0 -31
  354. package/.docs/reference/datasets/getItemHistory.md +0 -29
  355. package/.docs/reference/datasets/list.md +0 -29
  356. package/.docs/reference/datasets/listExperimentResults.md +0 -37
  357. package/.docs/reference/datasets/listExperiments.md +0 -31
  358. package/.docs/reference/datasets/listItems.md +0 -44
  359. package/.docs/reference/datasets/listVersions.md +0 -31
  360. package/.docs/reference/datasets/startExperiment.md +0 -60
  361. package/.docs/reference/datasets/startExperimentAsync.md +0 -41
  362. package/.docs/reference/datasets/update.md +0 -46
  363. package/.docs/reference/datasets/updateItem.md +0 -36
  364. package/.docs/reference/deployer/cloudflare.md +0 -79
  365. package/.docs/reference/deployer/netlify.md +0 -82
  366. package/.docs/reference/deployer/vercel.md +0 -91
  367. package/.docs/reference/deployer.md +0 -100
  368. package/.docs/reference/evals/answer-relevancy.md +0 -105
  369. package/.docs/reference/evals/answer-similarity.md +0 -99
  370. package/.docs/reference/evals/bias.md +0 -120
  371. package/.docs/reference/evals/completeness.md +0 -137
  372. package/.docs/reference/evals/content-similarity.md +0 -101
  373. package/.docs/reference/evals/context-precision.md +0 -196
  374. package/.docs/reference/evals/context-relevance.md +0 -536
  375. package/.docs/reference/evals/create-scorer.md +0 -270
  376. package/.docs/reference/evals/faithfulness.md +0 -114
  377. package/.docs/reference/evals/hallucination.md +0 -220
  378. package/.docs/reference/evals/keyword-coverage.md +0 -128
  379. package/.docs/reference/evals/mastra-scorer.md +0 -123
  380. package/.docs/reference/evals/noise-sensitivity.md +0 -685
  381. package/.docs/reference/evals/prompt-alignment.md +0 -619
  382. package/.docs/reference/evals/run-evals.md +0 -138
  383. package/.docs/reference/evals/scorer-utils.md +0 -330
  384. package/.docs/reference/evals/textual-difference.md +0 -113
  385. package/.docs/reference/evals/tone-consistency.md +0 -119
  386. package/.docs/reference/evals/tool-call-accuracy.md +0 -533
  387. package/.docs/reference/evals/toxicity.md +0 -123
  388. package/.docs/reference/harness/harness-class.md +0 -645
  389. package/.docs/reference/index.md +0 -276
  390. package/.docs/reference/logging/pino-logger.md +0 -117
  391. package/.docs/reference/memory/clone-utilities.md +0 -199
  392. package/.docs/reference/memory/cloneThread.md +0 -130
  393. package/.docs/reference/memory/createThread.md +0 -68
  394. package/.docs/reference/memory/deleteMessages.md +0 -40
  395. package/.docs/reference/memory/getThreadById.md +0 -24
  396. package/.docs/reference/memory/listThreads.md +0 -145
  397. package/.docs/reference/memory/memory-class.md +0 -147
  398. package/.docs/reference/memory/observational-memory.md +0 -565
  399. package/.docs/reference/memory/recall.md +0 -91
  400. package/.docs/reference/observability/tracing/bridges/otel.md +0 -131
  401. package/.docs/reference/observability/tracing/configuration.md +0 -178
  402. package/.docs/reference/observability/tracing/exporters/arize.md +0 -141
  403. package/.docs/reference/observability/tracing/exporters/braintrust.md +0 -93
  404. package/.docs/reference/observability/tracing/exporters/cloud-exporter.md +0 -163
  405. package/.docs/reference/observability/tracing/exporters/console-exporter.md +0 -138
  406. package/.docs/reference/observability/tracing/exporters/datadog.md +0 -116
  407. package/.docs/reference/observability/tracing/exporters/default-exporter.md +0 -174
  408. package/.docs/reference/observability/tracing/exporters/laminar.md +0 -78
  409. package/.docs/reference/observability/tracing/exporters/langfuse.md +0 -134
  410. package/.docs/reference/observability/tracing/exporters/langsmith.md +0 -110
  411. package/.docs/reference/observability/tracing/exporters/otel.md +0 -199
  412. package/.docs/reference/observability/tracing/exporters/posthog.md +0 -92
  413. package/.docs/reference/observability/tracing/exporters/sentry.md +0 -184
  414. package/.docs/reference/observability/tracing/instances.md +0 -109
  415. package/.docs/reference/observability/tracing/interfaces.md +0 -749
  416. package/.docs/reference/observability/tracing/processors/sensitive-data-filter.md +0 -144
  417. package/.docs/reference/observability/tracing/spans.md +0 -224
  418. package/.docs/reference/processors/batch-parts-processor.md +0 -61
  419. package/.docs/reference/processors/language-detector.md +0 -81
  420. package/.docs/reference/processors/message-history-processor.md +0 -85
  421. package/.docs/reference/processors/moderation-processor.md +0 -104
  422. package/.docs/reference/processors/pii-detector.md +0 -107
  423. package/.docs/reference/processors/processor-interface.md +0 -525
  424. package/.docs/reference/processors/prompt-injection-detector.md +0 -71
  425. package/.docs/reference/processors/semantic-recall-processor.md +0 -123
  426. package/.docs/reference/processors/system-prompt-scrubber.md +0 -80
  427. package/.docs/reference/processors/token-limiter-processor.md +0 -113
  428. package/.docs/reference/processors/tool-call-filter.md +0 -85
  429. package/.docs/reference/processors/tool-search-processor.md +0 -113
  430. package/.docs/reference/processors/unicode-normalizer.md +0 -62
  431. package/.docs/reference/processors/working-memory-processor.md +0 -154
  432. package/.docs/reference/rag/chunk.md +0 -221
  433. package/.docs/reference/rag/database-config.md +0 -264
  434. package/.docs/reference/rag/document.md +0 -114
  435. package/.docs/reference/rag/embeddings.md +0 -92
  436. package/.docs/reference/rag/extract-params.md +0 -168
  437. package/.docs/reference/rag/graph-rag.md +0 -111
  438. package/.docs/reference/rag/metadata-filters.md +0 -216
  439. package/.docs/reference/rag/rerank.md +0 -80
  440. package/.docs/reference/rag/rerankWithScorer.md +0 -80
  441. package/.docs/reference/server/create-route.md +0 -260
  442. package/.docs/reference/server/express-adapter.md +0 -176
  443. package/.docs/reference/server/fastify-adapter.md +0 -90
  444. package/.docs/reference/server/hono-adapter.md +0 -162
  445. package/.docs/reference/server/koa-adapter.md +0 -127
  446. package/.docs/reference/server/mastra-server.md +0 -298
  447. package/.docs/reference/server/register-api-route.md +0 -249
  448. package/.docs/reference/server/routes.md +0 -306
  449. package/.docs/reference/storage/cloudflare-d1.md +0 -218
  450. package/.docs/reference/storage/cloudflare.md +0 -88
  451. package/.docs/reference/storage/composite.md +0 -235
  452. package/.docs/reference/storage/convex.md +0 -161
  453. package/.docs/reference/storage/dynamodb.md +0 -282
  454. package/.docs/reference/storage/lance.md +0 -131
  455. package/.docs/reference/storage/libsql.md +0 -135
  456. package/.docs/reference/storage/mongodb.md +0 -262
  457. package/.docs/reference/storage/mssql.md +0 -155
  458. package/.docs/reference/storage/overview.md +0 -121
  459. package/.docs/reference/storage/postgresql.md +0 -529
  460. package/.docs/reference/storage/upstash.md +0 -160
  461. package/.docs/reference/streaming/ChunkType.md +0 -292
  462. package/.docs/reference/streaming/agents/MastraModelOutput.md +0 -182
  463. package/.docs/reference/streaming/agents/stream.md +0 -212
  464. package/.docs/reference/streaming/agents/streamLegacy.md +0 -142
  465. package/.docs/reference/streaming/workflows/observeStream.md +0 -42
  466. package/.docs/reference/streaming/workflows/resumeStream.md +0 -61
  467. package/.docs/reference/streaming/workflows/stream.md +0 -88
  468. package/.docs/reference/streaming/workflows/timeTravelStream.md +0 -142
  469. package/.docs/reference/templates/overview.md +0 -194
  470. package/.docs/reference/tools/create-tool.md +0 -237
  471. package/.docs/reference/tools/document-chunker-tool.md +0 -89
  472. package/.docs/reference/tools/graph-rag-tool.md +0 -185
  473. package/.docs/reference/tools/mcp-client.md +0 -962
  474. package/.docs/reference/tools/mcp-server.md +0 -1275
  475. package/.docs/reference/tools/vector-query-tool.md +0 -459
  476. package/.docs/reference/vectors/astra.md +0 -121
  477. package/.docs/reference/vectors/chroma.md +0 -267
  478. package/.docs/reference/vectors/convex.md +0 -303
  479. package/.docs/reference/vectors/couchbase.md +0 -226
  480. package/.docs/reference/vectors/duckdb.md +0 -318
  481. package/.docs/reference/vectors/elasticsearch.md +0 -189
  482. package/.docs/reference/vectors/lance.md +0 -220
  483. package/.docs/reference/vectors/libsql.md +0 -305
  484. package/.docs/reference/vectors/mongodb.md +0 -295
  485. package/.docs/reference/vectors/opensearch.md +0 -99
  486. package/.docs/reference/vectors/pg.md +0 -408
  487. package/.docs/reference/vectors/pinecone.md +0 -168
  488. package/.docs/reference/vectors/qdrant.md +0 -222
  489. package/.docs/reference/vectors/s3vectors.md +0 -277
  490. package/.docs/reference/vectors/turbopuffer.md +0 -157
  491. package/.docs/reference/vectors/upstash.md +0 -294
  492. package/.docs/reference/vectors/vectorize.md +0 -147
  493. package/.docs/reference/voice/azure.md +0 -148
  494. package/.docs/reference/voice/cloudflare.md +0 -83
  495. package/.docs/reference/voice/composite-voice.md +0 -121
  496. package/.docs/reference/voice/deepgram.md +0 -79
  497. package/.docs/reference/voice/elevenlabs.md +0 -98
  498. package/.docs/reference/voice/google-gemini-live.md +0 -378
  499. package/.docs/reference/voice/google.md +0 -228
  500. package/.docs/reference/voice/mastra-voice.md +0 -313
  501. package/.docs/reference/voice/murf.md +0 -122
  502. package/.docs/reference/voice/openai-realtime.md +0 -203
  503. package/.docs/reference/voice/openai.md +0 -88
  504. package/.docs/reference/voice/playai.md +0 -80
  505. package/.docs/reference/voice/sarvam.md +0 -126
  506. package/.docs/reference/voice/speechify.md +0 -75
  507. package/.docs/reference/voice/voice.addInstructions.md +0 -56
  508. package/.docs/reference/voice/voice.addTools.md +0 -67
  509. package/.docs/reference/voice/voice.answer.md +0 -54
  510. package/.docs/reference/voice/voice.close.md +0 -51
  511. package/.docs/reference/voice/voice.connect.md +0 -94
  512. package/.docs/reference/voice/voice.events.md +0 -37
  513. package/.docs/reference/voice/voice.getSpeakers.md +0 -129
  514. package/.docs/reference/voice/voice.listen.md +0 -164
  515. package/.docs/reference/voice/voice.off.md +0 -54
  516. package/.docs/reference/voice/voice.on.md +0 -111
  517. package/.docs/reference/voice/voice.send.md +0 -65
  518. package/.docs/reference/voice/voice.speak.md +0 -157
  519. package/.docs/reference/voice/voice.updateConfig.md +0 -60
  520. package/.docs/reference/workflows/run-methods/cancel.md +0 -86
  521. package/.docs/reference/workflows/run-methods/restart.md +0 -33
  522. package/.docs/reference/workflows/run-methods/resume.md +0 -59
  523. package/.docs/reference/workflows/run-methods/start.md +0 -58
  524. package/.docs/reference/workflows/run-methods/startAsync.md +0 -67
  525. package/.docs/reference/workflows/run-methods/timeTravel.md +0 -142
  526. package/.docs/reference/workflows/run.md +0 -59
  527. package/.docs/reference/workflows/step.md +0 -119
  528. package/.docs/reference/workflows/workflow-methods/branch.md +0 -25
  529. package/.docs/reference/workflows/workflow-methods/commit.md +0 -17
  530. package/.docs/reference/workflows/workflow-methods/create-run.md +0 -63
  531. package/.docs/reference/workflows/workflow-methods/dountil.md +0 -25
  532. package/.docs/reference/workflows/workflow-methods/dowhile.md +0 -25
  533. package/.docs/reference/workflows/workflow-methods/foreach.md +0 -118
  534. package/.docs/reference/workflows/workflow-methods/map.md +0 -93
  535. package/.docs/reference/workflows/workflow-methods/parallel.md +0 -21
  536. package/.docs/reference/workflows/workflow-methods/sleep.md +0 -35
  537. package/.docs/reference/workflows/workflow-methods/sleepUntil.md +0 -35
  538. package/.docs/reference/workflows/workflow-methods/then.md +0 -21
  539. package/.docs/reference/workflows/workflow.md +0 -157
  540. package/.docs/reference/workspace/e2b-sandbox.md +0 -288
  541. package/.docs/reference/workspace/filesystem.md +0 -202
  542. package/.docs/reference/workspace/gcs-filesystem.md +0 -170
  543. package/.docs/reference/workspace/local-filesystem.md +0 -327
  544. package/.docs/reference/workspace/local-sandbox.md +0 -285
  545. package/.docs/reference/workspace/s3-filesystem.md +0 -169
  546. package/.docs/reference/workspace/sandbox.md +0 -81
  547. package/.docs/reference/workspace/workspace-class.md +0 -226
@@ -1,619 +0,0 @@
1
- # Prompt Alignment Scorer
2
-
3
- The `createPromptAlignmentScorerLLM()` function creates a scorer that evaluates how well agent responses align with user prompts across multiple dimensions: intent understanding, requirement fulfillment, response completeness, and format appropriateness.
4
-
5
- ## Parameters
6
-
7
- **model:** (`MastraModelConfig`): The language model to use for evaluating prompt-response alignment
8
-
9
- **options:** (`PromptAlignmentOptions`): Configuration options for the scorer
10
-
11
- ## .run() Returns
12
-
13
- **score:** (`number`): Multi-dimensional alignment score between 0 and scale (default 0-1)
14
-
15
- **reason:** (`string`): Human-readable explanation of the prompt alignment evaluation with detailed breakdown
16
-
17
- `.run()` returns a result in the following shape:
18
-
19
- ```typescript
20
- {
21
- runId: string,
22
- score: number,
23
- reason: string,
24
- analyzeStepResult: {
25
- intentAlignment: {
26
- score: number,
27
- primaryIntent: string,
28
- isAddressed: boolean,
29
- reasoning: string
30
- },
31
- requirementsFulfillment: {
32
- requirements: Array<{
33
- requirement: string,
34
- isFulfilled: boolean,
35
- reasoning: string
36
- }>,
37
- overallScore: number
38
- },
39
- completeness: {
40
- score: number,
41
- missingElements: string[],
42
- reasoning: string
43
- },
44
- responseAppropriateness: {
45
- score: number,
46
- formatAlignment: boolean,
47
- toneAlignment: boolean,
48
- reasoning: string
49
- },
50
- overallAssessment: string
51
- }
52
- }
53
- ```
54
-
55
- ## Scoring Details
56
-
57
- ### Scorer configuration
58
-
59
- You can customize the Prompt Alignment Scorer by adjusting the scale parameter and evaluation mode to fit your scoring needs.
60
-
61
- ```typescript
62
- const scorer = createPromptAlignmentScorerLLM({
63
- model: "openai/gpt-5.1",
64
- options: {
65
- scale: 10, // Score from 0-10 instead of 0-1
66
- evaluationMode: "both", // 'user', 'system', or 'both' (default)
67
- },
68
- });
69
- ```
70
-
71
- ### Multi-Dimensional Analysis
72
-
73
- Prompt Alignment evaluates responses across four key dimensions with weighted scoring that adapts based on the evaluation mode:
74
-
75
- #### User Mode ('user')
76
-
77
- Evaluates alignment with user prompts only:
78
-
79
- 1. **Intent Alignment** (40% weight) - Whether the response addresses the user's core request
80
- 2. **Requirements Fulfillment** (30% weight) - If all user requirements are met
81
- 3. **Completeness** (20% weight) - Whether the response is comprehensive for user needs
82
- 4. **Response Appropriateness** (10% weight) - If format and tone match user expectations
83
-
84
- #### System Mode ('system')
85
-
86
- Evaluates compliance with system guidelines only:
87
-
88
- 1. **Intent Alignment** (35% weight) - Whether the response follows system behavioral guidelines
89
- 2. **Requirements Fulfillment** (35% weight) - If all system constraints are respected
90
- 3. **Completeness** (15% weight) - Whether the response adheres to all system rules
91
- 4. **Response Appropriateness** (15% weight) - If format and tone match system specifications
92
-
93
- #### Both Mode ('both' - default)
94
-
95
- Combines evaluation of both user and system alignment:
96
-
97
- - **User alignment**: 70% of final score (using user mode weights)
98
- - **System compliance**: 30% of final score (using system mode weights)
99
- - Provides balanced assessment of user satisfaction and system adherence
100
-
101
- ### Scoring Formula
102
-
103
- **User Mode:**
104
-
105
- ```text
106
- Weighted Score = (intent_score × 0.4) + (requirements_score × 0.3) +
107
- (completeness_score × 0.2) + (appropriateness_score × 0.1)
108
- Final Score = Weighted Score × scale
109
- ```
110
-
111
- **System Mode:**
112
-
113
- ```text
114
- Weighted Score = (intent_score × 0.35) + (requirements_score × 0.35) +
115
- (completeness_score × 0.15) + (appropriateness_score × 0.15)
116
- Final Score = Weighted Score × scale
117
- ```
118
-
119
- **Both Mode (default):**
120
-
121
- ```text
122
- User Score = (user dimensions with user weights)
123
- System Score = (system dimensions with system weights)
124
- Weighted Score = (User Score × 0.7) + (System Score × 0.3)
125
- Final Score = Weighted Score × scale
126
- ```
127
-
128
- **Weight Distribution Rationale**:
129
-
130
- - **User Mode**: Prioritizes intent (40%) and requirements (30%) for user satisfaction
131
- - **System Mode**: Balances behavioral compliance (35%) and constraints (35%) equally
132
- - **Both Mode**: 70/30 split ensures user needs are primary while maintaining system compliance
133
-
134
- ### Score Interpretation
135
-
136
- - **0.9-1.0** = Excellent alignment across all dimensions
137
- - **0.8-0.9** = Very good alignment with minor gaps
138
- - **0.7-0.8** = Good alignment but missing some requirements or completeness
139
- - **0.6-0.7** = Moderate alignment with noticeable gaps
140
- - **0.4-0.6** = Poor alignment with significant issues
141
- - **0.0-0.4** = Very poor alignment, response doesn't address the prompt effectively
142
-
143
- ### When to Use Each Mode
144
-
145
- **User Mode (`'user'`)** - Use when:
146
-
147
- - Evaluating customer service responses for user satisfaction
148
- - Testing content generation quality from user perspective
149
- - Measuring how well responses address user questions
150
- - Focusing purely on request fulfillment without system constraints
151
-
152
- **System Mode (`'system'`)** - Use when:
153
-
154
- - Auditing AI safety and compliance with behavioral guidelines
155
- - Ensuring agents follow brand voice and tone requirements
156
- - Validating adherence to content policies and constraints
157
- - Testing system-level behavioral consistency
158
-
159
- **Both Mode (`'both'`, default and recommended)** - Use when:
160
-
161
- - Comprehensive evaluation of overall AI agent performance
162
- - Balancing user satisfaction with system compliance
163
- - Production monitoring where both user and system requirements matter
164
- - Holistic assessment of prompt-response alignment
165
-
166
- ## Common Use Cases
167
-
168
- ### Code Generation Evaluation
169
-
170
- Ideal for evaluating:
171
-
172
- - Programming task completion
173
- - Code quality and completeness
174
- - Adherence to coding requirements
175
- - Format specifications (functions, classes, etc.)
176
-
177
- ```typescript
178
- // Example: API endpoint creation
179
- const codePrompt =
180
- "Create a REST API endpoint with authentication and rate limiting";
181
- // Scorer evaluates: intent (API creation), requirements (auth + rate limiting),
182
- // completeness (full implementation), format (code structure)
183
- ```
184
-
185
- ### Instruction Following Assessment
186
-
187
- Perfect for:
188
-
189
- - Task completion verification
190
- - Multi-step instruction adherence
191
- - Requirement compliance checking
192
- - Educational content evaluation
193
-
194
- ```typescript
195
- // Example: Multi-requirement task
196
- const taskPrompt =
197
- "Write a Python class with initialization, validation, error handling, and documentation";
198
- // Scorer tracks each requirement individually and provides detailed breakdown
199
- ```
200
-
201
- ### Content Format Validation
202
-
203
- Useful for:
204
-
205
- - Format specification compliance
206
- - Style guide adherence
207
- - Output structure verification
208
- - Response appropriateness checking
209
-
210
- ```typescript
211
- // Example: Structured output
212
- const formatPrompt =
213
- "Explain the differences between let and const in JavaScript using bullet points";
214
- // Scorer evaluates content accuracy AND format compliance
215
- ```
216
-
217
- ### Agent Response Quality
218
-
219
- Measure how well your AI agents follow user instructions:
220
-
221
- ```typescript
222
- const agent = new Agent({
223
- name: "CodingAssistant",
224
- instructions:
225
- "You are a helpful coding assistant. Always provide working code examples.",
226
- model: "openai/gpt-5.1",
227
- });
228
-
229
- // Evaluate comprehensive alignment (default)
230
- const scorer = createPromptAlignmentScorerLLM({
231
- model: "openai/gpt-5.1",
232
- options: { evaluationMode: "both" }, // Evaluates both user intent and system guidelines
233
- });
234
-
235
- // Evaluate just user satisfaction
236
- const userScorer = createPromptAlignmentScorerLLM({
237
- model: "openai/gpt-5.1",
238
- options: { evaluationMode: "user" }, // Focus only on user request fulfillment
239
- });
240
-
241
- // Evaluate system compliance
242
- const systemScorer = createPromptAlignmentScorerLLM({
243
- model: "openai/gpt-5.1",
244
- options: { evaluationMode: "system" }, // Check adherence to system instructions
245
- });
246
-
247
- const result = await scorer.run(agentRun);
248
- ```
249
-
250
- ### Prompt Engineering Optimization
251
-
252
- Test different prompts to improve alignment:
253
-
254
- ```typescript
255
- const prompts = [
256
- "Write a function to calculate factorial",
257
- "Create a Python function that calculates factorial with error handling for negative inputs",
258
- "Implement a factorial calculator in Python with: input validation, error handling, and docstring",
259
- ];
260
-
261
- // Compare alignment scores to find the best prompt
262
- for (const prompt of prompts) {
263
- const result = await scorer.run(createTestRun(prompt, response));
264
- console.log(`Prompt alignment: ${result.score}`);
265
- }
266
- ```
267
-
268
- ### Multi-Agent System Evaluation
269
-
270
- Compare different agents or models:
271
-
272
- ```typescript
273
- const agents = [agent1, agent2, agent3];
274
- const testPrompts = [...]; // Array of test prompts
275
-
276
- for (const agent of agents) {
277
- let totalScore = 0;
278
- for (const prompt of testPrompts) {
279
- const response = await agent.run(prompt);
280
- const evaluation = await scorer.run({ input: prompt, output: response });
281
- totalScore += evaluation.score;
282
- }
283
- console.log(`${agent.name} average alignment: ${totalScore / testPrompts.length}`);
284
- }
285
- ```
286
-
287
- ## Examples
288
-
289
- ### Basic Configuration
290
-
291
- ```typescript
292
- import { createPromptAlignmentScorerLLM } from "@mastra/evals/scorers/prebuilt";
293
-
294
- const scorer = createPromptAlignmentScorerLLM({
295
- model: "openai/gpt-5.1",
296
- });
297
-
298
- // Evaluate a code generation task
299
- const result = await scorer.run({
300
- input: [
301
- {
302
- role: "user",
303
- content:
304
- "Write a Python function to calculate factorial with error handling",
305
- },
306
- ],
307
- output: {
308
- role: "assistant",
309
- text: `def factorial(n):
310
- if n < 0:
311
- raise ValueError("Factorial not defined for negative numbers")
312
- if n == 0:
313
- return 1
314
- return n * factorial(n-1)`,
315
- },
316
- });
317
- // Result: { score: 0.95, reason: "Excellent alignment - function addresses intent, includes error handling..." }
318
- ```
319
-
320
- ### Custom Configuration Examples
321
-
322
- ```typescript
323
- // Configure scale and evaluation mode
324
- const scorer = createPromptAlignmentScorerLLM({
325
- model: "openai/gpt-5.1",
326
- options: {
327
- scale: 10, // Score from 0-10 instead of 0-1
328
- evaluationMode: "both", // 'user', 'system', or 'both' (default)
329
- },
330
- });
331
-
332
- // User-only evaluation - focus on user satisfaction
333
- const userScorer = createPromptAlignmentScorerLLM({
334
- model: "openai/gpt-5.1",
335
- options: { evaluationMode: "user" },
336
- });
337
-
338
- // System-only evaluation - focus on compliance
339
- const systemScorer = createPromptAlignmentScorerLLM({
340
- model: "openai/gpt-5.1",
341
- options: { evaluationMode: "system" },
342
- });
343
-
344
- const result = await scorer.run(testRun);
345
- // Result: { score: 8.5, reason: "Score: 8.5 out of 10 - Good alignment with both user intent and system guidelines..." }
346
- ```
347
-
348
- ### Format-Specific Evaluation
349
-
350
- ```typescript
351
- // Evaluate bullet point formatting
352
- const result = await scorer.run({
353
- input: [
354
- {
355
- role: "user",
356
- content: "List the benefits of TypeScript in bullet points",
357
- },
358
- ],
359
- output: {
360
- role: "assistant",
361
- text: "TypeScript provides static typing, better IDE support, and enhanced code reliability.",
362
- },
363
- });
364
- // Result: Lower appropriateness score due to format mismatch (paragraph vs bullet points)
365
- ```
366
-
367
- ### Excellent alignment example
368
-
369
- In this example, the response fully addresses the user's prompt with all requirements met.
370
-
371
- ```typescript
372
- import { createPromptAlignmentScorerLLM } from "@mastra/evals/scorers/prebuilt";
373
-
374
- const scorer = createPromptAlignmentScorerLLM({
375
- model: "openai/gpt-5.1",
376
- });
377
-
378
- const inputMessages = [
379
- {
380
- role: "user",
381
- content:
382
- "Write a Python function to calculate factorial with error handling for negative numbers",
383
- },
384
- ];
385
-
386
- const outputMessage = {
387
- text: `def factorial(n):
388
- """Calculate factorial of a number."""
389
- if n < 0:
390
- raise ValueError("Factorial not defined for negative numbers")
391
- if n == 0 or n == 1:
392
- return 1
393
- return n * factorial(n - 1)`,
394
- };
395
-
396
- const result = await scorer.run({
397
- input: inputMessages,
398
- output: outputMessage,
399
- });
400
-
401
- console.log(result);
402
- ```
403
-
404
- ### Excellent alignment output
405
-
406
- The output receives a high score because it perfectly addresses the intent, fulfills all requirements, and uses appropriate format.
407
-
408
- ```typescript
409
- {
410
- score: 0.95,
411
- reason: 'The score is 0.95 because the response perfectly addresses the primary intent of creating a factorial function and fulfills all requirements including Python implementation, error handling for negative numbers, and proper documentation. The code format is appropriate and the implementation is complete.'
412
- }
413
- ```
414
-
415
- ### Partial alignment example
416
-
417
- In this example, the response addresses the core intent but misses some requirements or has format issues.
418
-
419
- ```typescript
420
- import { createPromptAlignmentScorerLLM } from "@mastra/evals/scorers/prebuilt";
421
-
422
- const scorer = createPromptAlignmentScorerLLM({
423
- model: "openai/gpt-5.1",
424
- });
425
-
426
- const inputMessages = [
427
- {
428
- role: "user",
429
- content: "List the benefits of TypeScript in bullet points",
430
- },
431
- ];
432
-
433
- const outputMessage = {
434
- text: "TypeScript provides static typing, better IDE support, and enhanced code reliability through compile-time error checking.",
435
- };
436
-
437
- const result = await scorer.run({
438
- input: inputMessages,
439
- output: outputMessage,
440
- });
441
-
442
- console.log(result);
443
- ```
444
-
445
- ### Partial alignment output
446
-
447
- The output receives a lower score because while the content is accurate, it doesn't follow the requested format (bullet points).
448
-
449
- ```typescript
450
- {
451
- score: 0.75,
452
- reason: 'The score is 0.75 because the response addresses the intent of explaining TypeScript benefits and provides accurate information, but fails to use the requested bullet point format, resulting in lower appropriateness scoring.'
453
- }
454
- ```
455
-
456
- ### Poor alignment example
457
-
458
- In this example, the response fails to address the user's specific requirements.
459
-
460
- ```typescript
461
- import { createPromptAlignmentScorerLLM } from "@mastra/evals/scorers/prebuilt";
462
-
463
- const scorer = createPromptAlignmentScorerLLM({
464
- model: "openai/gpt-5.1",
465
- });
466
-
467
- const inputMessages = [
468
- {
469
- role: "user",
470
- content:
471
- "Write a Python class with initialization, validation, error handling, and documentation",
472
- },
473
- ];
474
-
475
- const outputMessage = {
476
- text: `class Example:
477
- def __init__(self, value):
478
- self.value = value`,
479
- };
480
-
481
- const result = await scorer.run({
482
- input: inputMessages,
483
- output: outputMessage,
484
- });
485
-
486
- console.log(result);
487
- ```
488
-
489
- ### Poor alignment output
490
-
491
- The output receives a low score because it only partially fulfills the requirements, missing validation, error handling, and documentation.
492
-
493
- ```typescript
494
- {
495
- score: 0.35,
496
- reason: 'The score is 0.35 because while the response addresses the basic intent of creating a Python class with initialization, it fails to include validation, error handling, and documentation as specifically requested, resulting in incomplete requirement fulfillment.'
497
- }
498
- ```
499
-
500
- ### Evaluation Mode Examples
501
-
502
- #### User Mode - Focus on User Prompt Only
503
-
504
- Evaluates how well the response addresses the user's request, ignoring system instructions:
505
-
506
- ```typescript
507
- const scorer = createPromptAlignmentScorerLLM({
508
- model: "openai/gpt-5.1",
509
- options: { evaluationMode: "user" },
510
- });
511
-
512
- const result = await scorer.run({
513
- input: {
514
- inputMessages: [
515
- {
516
- role: "user",
517
- content: "Explain recursion with an example",
518
- },
519
- ],
520
- systemMessages: [
521
- {
522
- role: "system",
523
- content: "Always provide code examples in Python",
524
- },
525
- ],
526
- },
527
- output: {
528
- text: "Recursion is when a function calls itself. For example: factorial(5) = 5 * factorial(4)",
529
- },
530
- });
531
- // Scores high for addressing user request, even without Python code
532
- ```
533
-
534
- #### System Mode - Focus on System Guidelines Only
535
-
536
- Evaluates compliance with system behavioral guidelines and constraints:
537
-
538
- ```typescript
539
- const scorer = createPromptAlignmentScorerLLM({
540
- model: "openai/gpt-5.1",
541
- options: { evaluationMode: "system" },
542
- });
543
-
544
- const result = await scorer.run({
545
- input: {
546
- systemMessages: [
547
- {
548
- role: "system",
549
- content:
550
- "You are a helpful assistant. Always be polite, concise, and provide examples.",
551
- },
552
- ],
553
- inputMessages: [
554
- {
555
- role: "user",
556
- content: "What is machine learning?",
557
- },
558
- ],
559
- },
560
- output: {
561
- text: "Machine learning is a subset of AI where computers learn from data. For example, spam filters learn to identify unwanted emails by analyzing patterns in previously marked spam.",
562
- },
563
- });
564
- // Evaluates politeness, conciseness, and example provision
565
- ```
566
-
567
- #### Both Mode - Combined Evaluation (Default)
568
-
569
- Evaluates both user intent fulfillment and system compliance with weighted scoring (70% user, 30% system):
570
-
571
- ```typescript
572
- const scorer = createPromptAlignmentScorerLLM({
573
- model: "openai/gpt-5.1",
574
- options: { evaluationMode: "both" }, // This is the default
575
- });
576
-
577
- const result = await scorer.run({
578
- input: {
579
- systemMessages: [
580
- {
581
- role: "system",
582
- content:
583
- "Always provide code examples when explaining programming concepts",
584
- },
585
- ],
586
- inputMessages: [
587
- {
588
- role: "user",
589
- content: "Explain how to reverse a string",
590
- },
591
- ],
592
- },
593
- output: {
594
- text: `To reverse a string, you can iterate through it backwards. Here's an example in Python:
595
-
596
- def reverse_string(s):
597
- return s[::-1]
598
-
599
- # Usage: reverse_string("hello") returns "olleh"`,
600
- },
601
- });
602
- // High score for both addressing the user's request AND following system guidelines
603
- ```
604
-
605
- ## Comparison with Other Scorers
606
-
607
- | Aspect | Prompt Alignment | Answer Relevancy | Faithfulness |
608
- | -------------- | ------------------------------------------ | ---------------------------- | -------------------------------- |
609
- | **Focus** | Multi-dimensional prompt adherence | Query-response relevance | Context groundedness |
610
- | **Evaluation** | Intent, requirements, completeness, format | Semantic similarity to query | Factual consistency with context |
611
- | **Use Case** | General prompt following | Information retrieval | RAG/context-based systems |
612
- | **Dimensions** | 4 weighted dimensions | Single relevance dimension | Single faithfulness dimension |
613
-
614
- ## Related
615
-
616
- - [Answer Relevancy Scorer](https://mastra.ai/reference/evals/answer-relevancy) - Evaluates query-response relevance
617
- - [Faithfulness Scorer](https://mastra.ai/reference/evals/faithfulness) - Measures context groundedness
618
- - [Tool Call Accuracy Scorer](https://mastra.ai/reference/evals/tool-call-accuracy) - Evaluates tool selection
619
- - [Custom Scorers](https://mastra.ai/docs/evals/custom-scorers) - Creating your own evaluation metrics