@mastra/evals 0.13.2 → 0.13.3-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45) hide show
  1. package/dist/{chunk-5CVZXIFW.js → chunk-4LRZVFXR.js} +32 -3
  2. package/dist/chunk-4LRZVFXR.js.map +1 -0
  3. package/dist/{chunk-QVZBKGOE.cjs → chunk-EKSPLMYP.cjs} +32 -2
  4. package/dist/chunk-EKSPLMYP.cjs.map +1 -0
  5. package/dist/{dist-JVIEAZJ6.js → dist-CI72CYZJ.js} +10 -10
  6. package/dist/{dist-JVIEAZJ6.js.map → dist-CI72CYZJ.js.map} +1 -1
  7. package/dist/{dist-JQCAD3AD.cjs → dist-IKJJ2AX4.cjs} +10 -10
  8. package/dist/{dist-JQCAD3AD.cjs.map → dist-IKJJ2AX4.cjs.map} +1 -1
  9. package/dist/index.cjs +1 -1
  10. package/dist/index.js +1 -1
  11. package/dist/{magic-string.es-NBXOXRCK.cjs → magic-string.es-VZN2EYER.cjs} +3 -3
  12. package/dist/{magic-string.es-NBXOXRCK.cjs.map → magic-string.es-VZN2EYER.cjs.map} +1 -1
  13. package/dist/{magic-string.es-6JSI7KY4.js → magic-string.es-WQRLTQPQ.js} +3 -3
  14. package/dist/{magic-string.es-6JSI7KY4.js.map → magic-string.es-WQRLTQPQ.js.map} +1 -1
  15. package/dist/scorers/code/index.cjs +2 -2
  16. package/dist/scorers/code/index.js +1 -1
  17. package/dist/scorers/llm/context-precision/index.d.ts +18 -0
  18. package/dist/scorers/llm/context-precision/index.d.ts.map +1 -0
  19. package/dist/scorers/llm/context-precision/prompts.d.ts +19 -0
  20. package/dist/scorers/llm/context-precision/prompts.d.ts.map +1 -0
  21. package/dist/scorers/llm/context-relevance/index.d.ts +27 -0
  22. package/dist/scorers/llm/context-relevance/index.d.ts.map +1 -0
  23. package/dist/scorers/llm/context-relevance/prompts.d.ts +20 -0
  24. package/dist/scorers/llm/context-relevance/prompts.d.ts.map +1 -0
  25. package/dist/scorers/llm/index.cjs +1163 -25
  26. package/dist/scorers/llm/index.cjs.map +1 -1
  27. package/dist/scorers/llm/index.d.ts +4 -0
  28. package/dist/scorers/llm/index.d.ts.map +1 -1
  29. package/dist/scorers/llm/index.js +1137 -3
  30. package/dist/scorers/llm/index.js.map +1 -1
  31. package/dist/scorers/llm/noise-sensitivity/index.d.ts +36 -0
  32. package/dist/scorers/llm/noise-sensitivity/index.d.ts.map +1 -0
  33. package/dist/scorers/llm/noise-sensitivity/prompts.d.ts +21 -0
  34. package/dist/scorers/llm/noise-sensitivity/prompts.d.ts.map +1 -0
  35. package/dist/scorers/llm/prompt-alignment/index.d.ts +38 -0
  36. package/dist/scorers/llm/prompt-alignment/index.d.ts.map +1 -0
  37. package/dist/scorers/llm/prompt-alignment/prompts.d.ts +44 -0
  38. package/dist/scorers/llm/prompt-alignment/prompts.d.ts.map +1 -0
  39. package/dist/scorers/llm/tool-call-accuracy/index.d.ts +2 -4
  40. package/dist/scorers/llm/tool-call-accuracy/index.d.ts.map +1 -1
  41. package/dist/scorers/utils.d.ts +2 -0
  42. package/dist/scorers/utils.d.ts.map +1 -1
  43. package/package.json +3 -3
  44. package/dist/chunk-5CVZXIFW.js.map +0 -1
  45. package/dist/chunk-QVZBKGOE.cjs.map +0 -1
@@ -0,0 +1,20 @@
1
+ export declare const CONTEXT_RELEVANCE_INSTRUCTIONS = "You are an expert context relevance evaluator. Your job is to analyze whether the provided context information was appropriate and useful for generating the agent's response to the user's query.\n\nKey Evaluation Criteria:\n1. **Relevance**: Does the context directly relate to the user's query?\n2. **Utility**: Did the context help produce a better response?\n3. **Completeness**: Was the context sufficient for the task?\n4. **Quality**: Is the context accurate and trustworthy?\n\nEvaluation Guidelines:\n- Context that directly answers or supports the user's query should be marked as highly relevant\n- Context that provides background information relevant to the query should be considered moderately relevant \n- Context that is tangentially related but doesn't directly help should be marked as low relevance\n- Context that is completely unrelated should be marked as irrelevant\n- Consider whether missing context might have led to a better response\n\nBe thorough and fair in your evaluation, considering both what context was provided and what might have been more useful.";
2
+ export declare function createAnalyzePrompt({ userQuery, agentResponse, providedContext, }: {
3
+ userQuery: string;
4
+ agentResponse: string;
5
+ providedContext: string[];
6
+ }): string;
7
+ export declare function createReasonPrompt({ userQuery, score, evaluations, missingContext, scale, }: {
8
+ userQuery: string;
9
+ score: number;
10
+ evaluations: Array<{
11
+ context_index: number;
12
+ contextPiece: string;
13
+ relevanceLevel: string;
14
+ wasUsed: boolean;
15
+ reasoning: string;
16
+ }>;
17
+ missingContext: string[];
18
+ scale: number;
19
+ }): string;
20
+ //# sourceMappingURL=prompts.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"prompts.d.ts","sourceRoot":"","sources":["../../../../src/scorers/llm/context-relevance/prompts.ts"],"names":[],"mappings":"AAAA,eAAO,MAAM,8BAA8B,mkCAe+E,CAAC;AAE3H,wBAAgB,mBAAmB,CAAC,EAClC,SAAS,EACT,aAAa,EACb,eAAe,GAChB,EAAE;IACD,SAAS,EAAE,MAAM,CAAC;IAClB,aAAa,EAAE,MAAM,CAAC;IACtB,eAAe,EAAE,MAAM,EAAE,CAAC;CAC3B,UAiFA;AAED,wBAAgB,kBAAkB,CAAC,EACjC,SAAS,EACT,KAAK,EACL,WAAW,EACX,cAAc,EACd,KAAK,GACN,EAAE;IACD,SAAS,EAAE,MAAM,CAAC;IAClB,KAAK,EAAE,MAAM,CAAC;IACd,WAAW,EAAE,KAAK,CAAC;QACjB,aAAa,EAAE,MAAM,CAAC;QACtB,YAAY,EAAE,MAAM,CAAC;QACrB,cAAc,EAAE,MAAM,CAAC;QACvB,OAAO,EAAE,OAAO,CAAC;QACjB,SAAS,EAAE,MAAM,CAAC;KACnB,CAAC,CAAC;IACH,cAAc,EAAE,MAAM,EAAE,CAAC;IACzB,KAAK,EAAE,MAAM,CAAC;CACf,UAsCA"}