@mastra/evals 0.0.0-storage-20250225005900
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.turbo/turbo-build.log +30 -0
- package/CHANGELOG.md +736 -0
- package/LICENSE +44 -0
- package/README.md +185 -0
- package/dist/_tsup-dts-rollup.d.ts +764 -0
- package/dist/chunk-4VNS5WPM.js +37 -0
- package/dist/chunk-TXXJUIES.js +15 -0
- package/dist/dist-IPSL6GJH.js +17947 -0
- package/dist/index.d.ts +3 -0
- package/dist/index.js +86 -0
- package/dist/magic-string.es-5UDOWOAZ.js +1296 -0
- package/dist/metrics/judge/index.d.ts +1 -0
- package/dist/metrics/judge/index.js +2 -0
- package/dist/metrics/llm/index.d.ts +11 -0
- package/dist/metrics/llm/index.js +2459 -0
- package/dist/metrics/nlp/index.d.ts +5 -0
- package/dist/metrics/nlp/index.js +189 -0
- package/eslint.config.js +6 -0
- package/package.json +73 -0
- package/src/attachListeners.ts +40 -0
- package/src/constants.ts +1 -0
- package/src/evaluation.test.ts +29 -0
- package/src/evaluation.ts +58 -0
- package/src/index.ts +2 -0
- package/src/metrics/index.ts +3 -0
- package/src/metrics/judge/index.ts +14 -0
- package/src/metrics/llm/answer-relevancy/index.test.ts +156 -0
- package/src/metrics/llm/answer-relevancy/index.ts +58 -0
- package/src/metrics/llm/answer-relevancy/metricJudge.ts +56 -0
- package/src/metrics/llm/answer-relevancy/prompts.ts +214 -0
- package/src/metrics/llm/bias/index.test.ts +152 -0
- package/src/metrics/llm/bias/index.ts +52 -0
- package/src/metrics/llm/bias/metricJudge.ts +53 -0
- package/src/metrics/llm/bias/prompts.ts +109 -0
- package/src/metrics/llm/context-position/index.test.ts +275 -0
- package/src/metrics/llm/context-position/index.ts +69 -0
- package/src/metrics/llm/context-position/metricJudge.ts +55 -0
- package/src/metrics/llm/context-position/prompts.ts +135 -0
- package/src/metrics/llm/context-precision/index.test.ts +213 -0
- package/src/metrics/llm/context-precision/index.ts +68 -0
- package/src/metrics/llm/context-precision/metricJudge.ts +55 -0
- package/src/metrics/llm/context-precision/prompts.ts +139 -0
- package/src/metrics/llm/context-relevancy/index.test.ts +162 -0
- package/src/metrics/llm/context-relevancy/index.ts +59 -0
- package/src/metrics/llm/context-relevancy/metricJudge.ts +51 -0
- package/src/metrics/llm/context-relevancy/prompts.ts +111 -0
- package/src/metrics/llm/contextual-recall/index.test.ts +90 -0
- package/src/metrics/llm/contextual-recall/index.ts +56 -0
- package/src/metrics/llm/contextual-recall/metricJudge.ts +52 -0
- package/src/metrics/llm/contextual-recall/prompts.ts +82 -0
- package/src/metrics/llm/faithfulness/index.test.ts +254 -0
- package/src/metrics/llm/faithfulness/index.ts +59 -0
- package/src/metrics/llm/faithfulness/metricJudge.ts +62 -0
- package/src/metrics/llm/faithfulness/prompts.ts +166 -0
- package/src/metrics/llm/hallucination/index.test.ts +214 -0
- package/src/metrics/llm/hallucination/index.ts +59 -0
- package/src/metrics/llm/hallucination/metricJudge.ts +44 -0
- package/src/metrics/llm/hallucination/prompts.ts +143 -0
- package/src/metrics/llm/index.ts +11 -0
- package/src/metrics/llm/prompt-alignment/index.test.ts +335 -0
- package/src/metrics/llm/prompt-alignment/index.ts +116 -0
- package/src/metrics/llm/prompt-alignment/metricJudge.ts +43 -0
- package/src/metrics/llm/prompt-alignment/prompts.ts +224 -0
- package/src/metrics/llm/summarization/index.test.ts +274 -0
- package/src/metrics/llm/summarization/index.ts +72 -0
- package/src/metrics/llm/summarization/metricJudge.ts +101 -0
- package/src/metrics/llm/summarization/prompts.ts +252 -0
- package/src/metrics/llm/toxicity/index.test.ts +84 -0
- package/src/metrics/llm/toxicity/index.ts +54 -0
- package/src/metrics/llm/toxicity/metricJudge.ts +39 -0
- package/src/metrics/llm/toxicity/prompts.ts +87 -0
- package/src/metrics/llm/types.ts +7 -0
- package/src/metrics/llm/utils.ts +20 -0
- package/src/metrics/nlp/completeness/index.test.ts +98 -0
- package/src/metrics/nlp/completeness/index.ts +121 -0
- package/src/metrics/nlp/content-similarity/index.test.ts +76 -0
- package/src/metrics/nlp/content-similarity/index.ts +49 -0
- package/src/metrics/nlp/index.ts +5 -0
- package/src/metrics/nlp/keyword-coverage/index.test.ts +85 -0
- package/src/metrics/nlp/keyword-coverage/index.ts +49 -0
- package/src/metrics/nlp/textual-difference/index.test.ts +88 -0
- package/src/metrics/nlp/textual-difference/index.ts +38 -0
- package/src/metrics/nlp/tone/index.test.ts +100 -0
- package/src/metrics/nlp/tone/index.ts +55 -0
- package/tsconfig.json +5 -0
- package/vitest.config.ts +12 -0
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
|
|
2
|
+
|
|
3
|
+
> @mastra/evals@0.1.5-alpha.0 build /Users/ward/projects/mastra/mastra/packages/evals
|
|
4
|
+
> pnpm check && tsup src/index.ts src/metrics/judge/index.ts src/metrics/llm/index.ts src/metrics/nlp/index.ts --format esm --experimental-dts --clean --treeshake
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
> @mastra/evals@0.1.5-alpha.0 check /Users/ward/projects/mastra/mastra/packages/evals
|
|
8
|
+
> tsc --noEmit
|
|
9
|
+
|
|
10
|
+
[34mCLI[39m Building entry: src/index.ts, src/metrics/judge/index.ts, src/metrics/llm/index.ts, src/metrics/nlp/index.ts
|
|
11
|
+
[34mCLI[39m Using tsconfig: tsconfig.json
|
|
12
|
+
[34mCLI[39m tsup v8.3.6
|
|
13
|
+
[34mTSC[39m Build start
|
|
14
|
+
[32mTSC[39m ⚡️ Build success in 3520ms
|
|
15
|
+
[34mDTS[39m Build start
|
|
16
|
+
[34mCLI[39m Target: es2022
|
|
17
|
+
Analysis will use the bundled TypeScript version 5.7.3
|
|
18
|
+
[36mWriting package typings: /Users/ward/projects/mastra/mastra/packages/evals/dist/_tsup-dts-rollup.d.ts[39m
|
|
19
|
+
[32mDTS[39m ⚡️ Build success in 2474ms
|
|
20
|
+
[34mCLI[39m Cleaning output folder
|
|
21
|
+
[34mESM[39m Build start
|
|
22
|
+
[32mESM[39m [1mdist/index.js [22m[32m2.63 KB[39m
|
|
23
|
+
[32mESM[39m [1mdist/magic-string.es-5UDOWOAZ.js [22m[32m40.80 KB[39m
|
|
24
|
+
[32mESM[39m [1mdist/chunk-4VNS5WPM.js [22m[32m1.82 KB[39m
|
|
25
|
+
[32mESM[39m [1mdist/metrics/llm/index.js [22m[32m85.32 KB[39m
|
|
26
|
+
[32mESM[39m [1mdist/metrics/judge/index.js [22m[32m94.00 B[39m
|
|
27
|
+
[32mESM[39m [1mdist/metrics/nlp/index.js [22m[32m6.30 KB[39m
|
|
28
|
+
[32mESM[39m [1mdist/chunk-TXXJUIES.js [22m[32m305.00 B[39m
|
|
29
|
+
[32mESM[39m [1mdist/dist-IPSL6GJH.js [22m[32m571.17 KB[39m
|
|
30
|
+
[32mESM[39m ⚡️ Build success in 2292ms
|