@mastra/core 1.18.0-alpha.0 → 1.18.0-alpha.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +31 -0
- package/dist/agent/index.cjs +8 -8
- package/dist/agent/index.js +1 -1
- package/dist/{chunk-YXNO6AHV.js → chunk-45M6KUQZ.js} +7 -7
- package/dist/{chunk-YXNO6AHV.js.map → chunk-45M6KUQZ.js.map} +1 -1
- package/dist/{chunk-AEIPJW4F.cjs → chunk-4KGTZPYF.cjs} +185 -185
- package/dist/{chunk-AEIPJW4F.cjs.map → chunk-4KGTZPYF.cjs.map} +1 -1
- package/dist/{chunk-DL4A7URO.cjs → chunk-5AVTFQEP.cjs} +236 -20
- package/dist/chunk-5AVTFQEP.cjs.map +1 -0
- package/dist/{chunk-DV7FIKOO.cjs → chunk-6WVZQBYQ.cjs} +10 -10
- package/dist/{chunk-DV7FIKOO.cjs.map → chunk-6WVZQBYQ.cjs.map} +1 -1
- package/dist/{chunk-QVQ3PGG2.cjs → chunk-7IDACSBM.cjs} +206 -2
- package/dist/chunk-7IDACSBM.cjs.map +1 -0
- package/dist/{chunk-V54LY5HR.cjs → chunk-DQYOFNZ7.cjs} +6107 -5697
- package/dist/chunk-DQYOFNZ7.cjs.map +1 -0
- package/dist/{chunk-F7YLMJSQ.js → chunk-E6XNM5ES.js} +4 -4
- package/dist/{chunk-F7YLMJSQ.js.map → chunk-E6XNM5ES.js.map} +1 -1
- package/dist/{chunk-CYQ2TNSK.js → chunk-EYM6DWKD.js} +18 -3
- package/dist/{chunk-CYQ2TNSK.js.map → chunk-EYM6DWKD.js.map} +1 -1
- package/dist/{chunk-3ECYXW43.cjs → chunk-H5O522FY.cjs} +16 -16
- package/dist/{chunk-3ECYXW43.cjs.map → chunk-H5O522FY.cjs.map} +1 -1
- package/dist/{chunk-BIB2LCIR.js → chunk-IOCCTQYZ.js} +6106 -5696
- package/dist/chunk-IOCCTQYZ.js.map +1 -0
- package/dist/{chunk-KMVGT2JI.js → chunk-JEWTRDRI.js} +233 -17
- package/dist/chunk-JEWTRDRI.js.map +1 -0
- package/dist/{chunk-AIYWGXK7.js → chunk-L53NRDFU.js} +3 -3
- package/dist/{chunk-AIYWGXK7.js.map → chunk-L53NRDFU.js.map} +1 -1
- package/dist/{chunk-SLG7AUBK.cjs → chunk-LUONHWL6.cjs} +6 -6
- package/dist/{chunk-SLG7AUBK.cjs.map → chunk-LUONHWL6.cjs.map} +1 -1
- package/dist/{chunk-3DDJ33AU.js → chunk-M5CZCWWW.js} +4 -4
- package/dist/{chunk-3DDJ33AU.js.map → chunk-M5CZCWWW.js.map} +1 -1
- package/dist/{chunk-3H34KWBU.cjs → chunk-PK3X5KIF.cjs} +24 -9
- package/dist/{chunk-3H34KWBU.cjs.map → chunk-PK3X5KIF.cjs.map} +1 -1
- package/dist/{chunk-AIEKKCJ7.js → chunk-QR2Z4WQ7.js} +3 -3
- package/dist/{chunk-AIEKKCJ7.js.map → chunk-QR2Z4WQ7.js.map} +1 -1
- package/dist/{chunk-TG4U3K3I.cjs → chunk-T2CILERS.cjs} +50 -50
- package/dist/{chunk-TG4U3K3I.cjs.map → chunk-T2CILERS.cjs.map} +1 -1
- package/dist/{chunk-P2C4NFMY.js → chunk-URN2SKVG.js} +4 -4
- package/dist/{chunk-P2C4NFMY.js.map → chunk-URN2SKVG.js.map} +1 -1
- package/dist/{chunk-BHVF4Z5D.cjs → chunk-VAVK4KJI.cjs} +28 -28
- package/dist/chunk-VAVK4KJI.cjs.map +1 -0
- package/dist/{chunk-ZOPIN73X.js → chunk-VF3CL3JV.js} +19 -19
- package/dist/chunk-VF3CL3JV.js.map +1 -0
- package/dist/{chunk-AGEYVARR.js → chunk-VMKNS3YO.js} +204 -3
- package/dist/chunk-VMKNS3YO.js.map +1 -0
- package/dist/{chunk-A5JHKGFY.cjs → chunk-WPDB2VAM.cjs} +7 -7
- package/dist/{chunk-A5JHKGFY.cjs.map → chunk-WPDB2VAM.cjs.map} +1 -1
- package/dist/{chunk-YFYB3Q5L.js → chunk-WVTVBWOQ.js} +9 -9
- package/dist/{chunk-YFYB3Q5L.js.map → chunk-WVTVBWOQ.js.map} +1 -1
- package/dist/{chunk-3LH5QX5F.cjs → chunk-XRZNAZRP.cjs} +3 -3
- package/dist/{chunk-3LH5QX5F.cjs.map → chunk-XRZNAZRP.cjs.map} +1 -1
- package/dist/{chunk-7CDFI4GW.cjs → chunk-YEKQKMCU.cjs} +76 -76
- package/dist/{chunk-7CDFI4GW.cjs.map → chunk-YEKQKMCU.cjs.map} +1 -1
- package/dist/{chunk-JEEYINIB.js → chunk-YN3FI4AD.js} +4 -4
- package/dist/{chunk-JEEYINIB.js.map → chunk-YN3FI4AD.js.map} +1 -1
- package/dist/datasets/index.cjs +17 -17
- package/dist/datasets/index.js +2 -2
- package/dist/docs/SKILL.md +2 -3
- package/dist/docs/assets/SOURCE_MAP.json +349 -334
- package/dist/docs/references/reference-evals-run-evals.md +78 -3
- package/dist/docs/references/reference-evals-scorer-utils.md +184 -0
- package/dist/docs/references/reference-evals-trajectory-accuracy.md +613 -0
- package/dist/docs/references/reference-logging-pino-logger.md +58 -0
- package/dist/docs/references/reference.md +1 -2
- package/dist/evals/base.d.ts +8 -2
- package/dist/evals/base.d.ts.map +1 -1
- package/dist/evals/index.cjs +32 -20
- package/dist/evals/index.js +3 -3
- package/dist/evals/run/index.d.ts +28 -1
- package/dist/evals/run/index.d.ts.map +1 -1
- package/dist/evals/run/scorerAccumulator.d.ts +4 -1
- package/dist/evals/run/scorerAccumulator.d.ts.map +1 -1
- package/dist/evals/scoreTraces/index.cjs +5 -5
- package/dist/evals/scoreTraces/index.js +2 -2
- package/dist/evals/types.d.ts +305 -10
- package/dist/evals/types.d.ts.map +1 -1
- package/dist/harness/index.cjs +7 -7
- package/dist/harness/index.js +5 -5
- package/dist/index.cjs +2 -2
- package/dist/index.js +1 -1
- package/dist/llm/index.cjs +16 -16
- package/dist/llm/index.js +5 -5
- package/dist/llm/model/provider-types.generated.d.ts +2444 -2243
- package/dist/loop/index.cjs +14 -14
- package/dist/loop/index.js +1 -1
- package/dist/loop/network/index.d.ts +3 -3
- package/dist/loop/types.d.ts +1 -1
- package/dist/mastra/index.cjs +2 -2
- package/dist/mastra/index.js +1 -1
- package/dist/memory/index.cjs +14 -14
- package/dist/memory/index.js +1 -1
- package/dist/models-dev-GLFQVCT4.cjs +12 -0
- package/dist/{models-dev-MU7QGI4O.cjs.map → models-dev-GLFQVCT4.cjs.map} +1 -1
- package/dist/models-dev-WSLKK6FO.js +3 -0
- package/dist/{models-dev-JEMMVJFN.js.map → models-dev-WSLKK6FO.js.map} +1 -1
- package/dist/netlify-SNTN56QS.js +3 -0
- package/dist/{netlify-BROEKRZF.js.map → netlify-SNTN56QS.js.map} +1 -1
- package/dist/netlify-VFRYJYBK.cjs +12 -0
- package/dist/{netlify-GOEIG6IC.cjs.map → netlify-VFRYJYBK.cjs.map} +1 -1
- package/dist/processor-provider/index.cjs +10 -10
- package/dist/processor-provider/index.js +1 -1
- package/dist/processors/index.cjs +44 -44
- package/dist/processors/index.js +1 -1
- package/dist/provider-registry-L6KDLMFM.cjs +40 -0
- package/dist/{provider-registry-CKFMYEBK.cjs.map → provider-registry-L6KDLMFM.cjs.map} +1 -1
- package/dist/provider-registry-LEXW2E53.js +3 -0
- package/dist/{provider-registry-P7EMCVJI.js.map → provider-registry-LEXW2E53.js.map} +1 -1
- package/dist/provider-registry.json +6102 -5692
- package/dist/relevance/index.cjs +3 -3
- package/dist/relevance/index.js +1 -1
- package/dist/storage/constants.cjs +56 -56
- package/dist/storage/constants.d.ts +1 -1
- package/dist/storage/constants.js +1 -1
- package/dist/storage/domains/experiments/base.d.ts +2 -1
- package/dist/storage/domains/experiments/base.d.ts.map +1 -1
- package/dist/storage/domains/experiments/inmemory.d.ts +2 -1
- package/dist/storage/domains/experiments/inmemory.d.ts.map +1 -1
- package/dist/storage/domains/observability/tracing.d.ts +45 -45
- package/dist/storage/index.cjs +160 -160
- package/dist/storage/index.js +2 -2
- package/dist/storage/types.d.ts +12 -0
- package/dist/storage/types.d.ts.map +1 -1
- package/dist/stream/MastraAgentNetworkStream.d.ts +1 -1
- package/dist/stream/MastraWorkflowStream.d.ts +1 -1
- package/dist/stream/index.cjs +8 -8
- package/dist/stream/index.js +1 -1
- package/dist/tool-loop-agent/index.cjs +4 -4
- package/dist/tool-loop-agent/index.js +1 -1
- package/dist/vector/index.cjs +7 -7
- package/dist/vector/index.js +1 -1
- package/dist/workflows/evented/index.cjs +10 -10
- package/dist/workflows/evented/index.js +1 -1
- package/dist/workflows/index.cjs +24 -24
- package/dist/workflows/index.js +1 -1
- package/package.json +5 -5
- package/src/llm/model/provider-types.generated.d.ts +2444 -2243
- package/dist/chunk-AGEYVARR.js.map +0 -1
- package/dist/chunk-BHVF4Z5D.cjs.map +0 -1
- package/dist/chunk-BIB2LCIR.js.map +0 -1
- package/dist/chunk-DL4A7URO.cjs.map +0 -1
- package/dist/chunk-KMVGT2JI.js.map +0 -1
- package/dist/chunk-QVQ3PGG2.cjs.map +0 -1
- package/dist/chunk-V54LY5HR.cjs.map +0 -1
- package/dist/chunk-ZOPIN73X.js.map +0 -1
- package/dist/docs/references/reference-core-getStoredAgentById.md +0 -87
- package/dist/docs/references/reference-core-listStoredAgents.md +0 -91
- package/dist/models-dev-JEMMVJFN.js +0 -3
- package/dist/models-dev-MU7QGI4O.cjs +0 -12
- package/dist/netlify-BROEKRZF.js +0 -3
- package/dist/netlify-GOEIG6IC.cjs +0 -12
- package/dist/provider-registry-CKFMYEBK.cjs +0 -40
- package/dist/provider-registry-P7EMCVJI.js +0 -3
package/dist/evals/base.d.ts
CHANGED
|
@@ -3,7 +3,7 @@ import type { MastraModelConfig } from '../llm/model/shared.types.js';
|
|
|
3
3
|
import type { Mastra } from '../mastra/index.js';
|
|
4
4
|
import type { ObservabilityContext } from '../observability/index.js';
|
|
5
5
|
import type { PublicSchema } from '../schema/index.js';
|
|
6
|
-
import type { ScoringSamplingConfig, ScorerRunInputForAgent, ScorerRunOutputForAgent } from './types.js';
|
|
6
|
+
import type { ScoringSamplingConfig, ScorerRunInputForAgent, ScorerRunOutputForAgent, Trajectory, TrajectoryExpectation } from './types.js';
|
|
7
7
|
interface ScorerStepDefinition {
|
|
8
8
|
name: string;
|
|
9
9
|
definition: any;
|
|
@@ -14,6 +14,10 @@ type ScorerTypeShortcuts = {
|
|
|
14
14
|
input: ScorerRunInputForAgent;
|
|
15
15
|
output: ScorerRunOutputForAgent;
|
|
16
16
|
};
|
|
17
|
+
trajectory: {
|
|
18
|
+
input: ScorerRunInputForAgent;
|
|
19
|
+
output: Trajectory;
|
|
20
|
+
};
|
|
17
21
|
};
|
|
18
22
|
interface ScorerConfig<TID extends string, TInput = any, TRunOutput = any> {
|
|
19
23
|
id: TID;
|
|
@@ -33,6 +37,8 @@ interface ScorerRun<TInput = any, TOutput = any> extends Partial<ObservabilityCo
|
|
|
33
37
|
input?: TInput;
|
|
34
38
|
output: TOutput;
|
|
35
39
|
groundTruth?: any;
|
|
40
|
+
/** Expected trajectory config for trajectory scorers. Flows from dataset items or scorer constructor. */
|
|
41
|
+
expectedTrajectory?: TrajectoryExpectation;
|
|
36
42
|
requestContext?: Record<string, any>;
|
|
37
43
|
}
|
|
38
44
|
interface PromptObject<TOutput, TAccumulated extends Record<string, any>, TStepName extends string = string, TInput = any, TRunOutput = any> {
|
|
@@ -128,7 +134,7 @@ declare class MastraScorer<TID extends string = string, TInput = any, TRunOutput
|
|
|
128
134
|
* @internal
|
|
129
135
|
*/
|
|
130
136
|
__setRawConfig(rawConfig: Record<string, unknown>): void;
|
|
131
|
-
get type():
|
|
137
|
+
get type(): keyof ScorerTypeShortcuts | {
|
|
132
138
|
input: z.ZodType<TInput, unknown, z.core.$ZodTypeInternals<TInput, unknown>>;
|
|
133
139
|
output: z.ZodType<TRunOutput, unknown, z.core.$ZodTypeInternals<TRunOutput, unknown>>;
|
|
134
140
|
} | undefined;
|
package/dist/evals/base.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"base.d.ts","sourceRoot":"","sources":["../../src/evals/base.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,CAAC,EAAE,MAAM,QAAQ,CAAC;AAK3B,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,2BAA2B,CAAC;AAEnE,OAAO,KAAK,EAAE,MAAM,EAAE,MAAM,WAAW,CAAC;AAExC,OAAO,KAAK,EAAE,oBAAoB,EAAE,MAAM,kBAAkB,CAAC;AAC7D,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,WAAW,CAAC;AAG9C,OAAO,KAAK,
|
|
1
|
+
{"version":3,"file":"base.d.ts","sourceRoot":"","sources":["../../src/evals/base.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,CAAC,EAAE,MAAM,QAAQ,CAAC;AAK3B,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,2BAA2B,CAAC;AAEnE,OAAO,KAAK,EAAE,MAAM,EAAE,MAAM,WAAW,CAAC;AAExC,OAAO,KAAK,EAAE,oBAAoB,EAAE,MAAM,kBAAkB,CAAC;AAC7D,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,WAAW,CAAC;AAG9C,OAAO,KAAK,EACV,qBAAqB,EACrB,sBAAsB,EACtB,uBAAuB,EACvB,UAAU,EACV,qBAAqB,EACtB,MAAM,SAAS,CAAC;AAEjB,UAAU,oBAAoB;IAC5B,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,EAAE,GAAG,CAAC;IAChB,cAAc,EAAE,OAAO,CAAC;CACzB;AAGD,KAAK,mBAAmB,GAAG;IACzB,KAAK,EAAE;QACL,KAAK,EAAE,sBAAsB,CAAC;QAC9B,MAAM,EAAE,uBAAuB,CAAC;KACjC,CAAC;IACF,UAAU,EAAE;QACV,KAAK,EAAE,sBAAsB,CAAC;QAC9B,MAAM,EAAE,UAAU,CAAC;KACpB,CAAC;CACH,CAAC;AAKF,UAAU,YAAY,CAAC,GAAG,SAAS,MAAM,EAAE,MAAM,GAAG,GAAG,EAAE,UAAU,GAAG,GAAG;IACvE,EAAE,EAAE,GAAG,CAAC;IACR,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,CAAC,EAAE;QACN,KAAK,EAAE,iBAAiB,CAAC;QACzB,YAAY,EAAE,MAAM,CAAC;KACtB,CAAC;IAEF,IAAI,CAAC,EACD,MAAM,mBAAmB,GACzB;QACE,KAAK,EAAE,CAAC,CAAC,SAAS,CAAC,MAAM,CAAC,CAAC;QAC3B,MAAM,EAAE,CAAC,CAAC,SAAS,CAAC,UAAU,CAAC,CAAC;KACjC,CAAC;CACP;AAGD,UAAU,SAAS,CAAC,MAAM,GAAG,GAAG,EAAE,OAAO,GAAG,GAAG,CAAE,SAAQ,OAAO,CAAC,oBAAoB,CAAC;IACpF,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,MAAM,EAAE,OAAO,CAAC;IAChB,WAAW,CAAC,EAAE,GAAG,CAAC;IAClB,yGAAyG;IACzG,kBAAkB,CAAC,EAAE,qBAAqB,CAAC;IAC3C,cAAc,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;CACtC;AAGD,UAAU,YAAY,CACpB,OAAO,EACP,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EACxC,SAAS,SAAS,MAAM,GAAG,MAAM,EACjC,MAAM,GAAG,GAAG,EACZ,UAAU,GAAG,GAAG;IAEhB,WAAW,EAAE,MAAM,CAAC;IACpB;;;;;;OAMG;IACH,YAAY,EAAE,YAAY,CAAC,OAAO,CAAC,CAAC;IACpC,KAAK,CAAC,EAAE;QACN,KAAK,EAAE,iBAAiB,CAAC;QACzB,YAAY,EAAE,MAAM,CAAC;KACtB,CAAC;IAGF,YAAY,EAAE,CAAC,OAAO,EAAE,mBAAmB,CAAC,YAAY,EAAE,SAAS,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;CACvH;AAGD,KAAK,aAAa,CAAC,CAAC,SAAS,MAAM,IAAI,GAAG,CAAC,YAAY,CAAC;AAGxD,KAAK,OAAO,CAAC,CAAC,IAAI,CAAC,SAAS,OAAO,CAAC,MAAM,CAAC,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;AAGrD,KAAK,WAAW,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IAAI;IAC/E,GAAG,EAAE,SAAS,CAAC,MAAM,EAAE,UAAU,CAAC,CAAC;IACnC,OAAO,EAAE,YAAY,CAAC;CACvB,CAAC;AAGF,KAAK,kBAAkB,CAAC,CAAC,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,CAAC,SAAS,MAAM,EAAE,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,aAAa,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;AAG9G,KAAK,qBAAqB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IAAI,WAAW,CACpG,YAAY,EACZ,MAAM,EACN,UAAU,CACX,GAAG;IACF,KAAK,EAAE,YAAY,SAAS,MAAM,CAAC,yBAAyB,EAAE,MAAM,MAAM,CAAC,GAAG,MAAM,GAAG,KAAK,CAAC;CAC9F,CAAC;AAEF,KAAK,eAAe,CAAC,mBAAmB,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IAAI,OAAO,CACjG,SAAS,CAAC,MAAM,EAAE,UAAU,CAAC,GAAG;IAC9B,KAAK,EAAE,mBAAmB,SAAS,MAAM,CAAC,yBAAyB,EAAE,MAAM,MAAM,CAAC,GAAG,MAAM,GAAG,KAAK,CAAC;IACpG,MAAM,CAAC,EAAE,mBAAmB,SAAS,MAAM,CAAC,0BAA0B,EAAE,MAAM,OAAO,CAAC,GAAG,OAAO,GAAG,SAAS,CAAC;IAG7G,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,mBAAmB,CAAC,EAAE,MAAM,CAAC;IAC7B,oBAAoB,CAAC,EAAE,MAAM,CAAC;IAG9B,oBAAoB,CAAC,EAAE,mBAAmB,SAAS,MAAM,CAAC,sBAAsB,EAAE,MAAM,WAAW,CAAC,GAChG,WAAW,GACX,SAAS,CAAC;IACd,iBAAiB,CAAC,EAAE,mBAAmB,SAAS,MAAM,CAAC,mBAAmB,EAAE,MAAM,QAAQ,CAAC,GAAG,QAAQ,GAAG,SAAS,CAAC;CACpH,GAAG;IAAE,KAAK,EAAE,MAAM,CAAA;CAAE,CACtB,CAAC;AAGF,KAAK,mBAAmB,CACtB,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EACxC,SAAS,SAAS,MAAM,EACxB,MAAM,EACN,UAAU,IACR,SAAS,SAAS,gBAAgB,GAClC,qBAAqB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,GACvD,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,CAAC;AAGlD,KAAK,YAAY,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,EAAE,OAAO,IACnF,CAAC,CAAC,OAAO,EAAE,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,OAAO,CAAC,GACrE,CAAC,CAAC,OAAO,EAAE,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC;AAEnF,KAAK,0BAA0B,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IACxF,CAAC,CAAC,OAAO,EAAE,qBAAqB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,GAAG,CAAC,GAC3E,CAAC,CAAC,OAAO,EAAE,qBAAqB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC;AAEzF,KAAK,yBAAyB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IACvF,CAAC,CAAC,OAAO,EAAE,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,MAAM,CAAC,GACpE,CAAC,CAAC,OAAO,EAAE,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC;AAGlF,UAAU,yBAAyB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU;IAC9F,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,CAAC,EAAE;QACN,KAAK,EAAE,iBAAiB,CAAC;QACzB,YAAY,EAAE,MAAM,CAAC;KACtB,CAAC;IAEF,YAAY,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;CACpG;AAGD,UAAU,0BAA0B,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU;IAC/F,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,CAAC,EAAE;QACN,KAAK,EAAE,iBAAiB,CAAC;QACzB,YAAY,EAAE,MAAM,CAAC;KACtB,CAAC;IAEF,YAAY,EAAE,CAAC,OAAO,EAAE,qBAAqB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,KAAK,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;CAC9G;AAGD,KAAK,iBAAiB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,WAAW,EAAE,MAAM,EAAE,UAAU,IAC5F,YAAY,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,EAAE,WAAW,CAAC,GAC3D,CAAC,YAAY,CAAC,WAAW,EAAE,YAAY,EAAE,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,GAAG;IAC3E,YAAY,EAAE,YAAY,CAAC,WAAW,CAAC,CAAC;CACzC,CAAC,CAAC;AAEP,KAAK,cAAc,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,WAAW,EAAE,MAAM,EAAE,UAAU,IACzF,YAAY,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,EAAE,WAAW,CAAC,GAC3D,CAAC,YAAY,CAAC,WAAW,EAAE,YAAY,EAAE,SAAS,EAAE,MAAM,EAAE,UAAU,CAAC,GAAG;IACxE,YAAY,EAAE,YAAY,CAAC,WAAW,CAAC,CAAC;CACzC,CAAC,CAAC;AAGP,KAAK,oBAAoB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IAClF,yBAAyB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,GAC3D,yBAAyB,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,CAAC;AAGhE,KAAK,qBAAqB,CAAC,YAAY,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,MAAM,EAAE,UAAU,IACnF,0BAA0B,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,GAC5D,0BAA0B,CAAC,YAAY,EAAE,MAAM,EAAE,UAAU,CAAC,CAAC;AAEjE,cAAM,YAAY,CAChB,GAAG,SAAS,MAAM,GAAG,MAAM,EAC3B,MAAM,GAAG,GAAG,EACZ,UAAU,GAAG,GAAG,EAChB,mBAAmB,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,GAAG,EAAE;;IAY3C,MAAM,EAAE,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC;IACpD,OAAO,CAAC,KAAK;IACb,OAAO,CAAC,qBAAqB;IAT/B;;;OAGG;IACI,MAAM,CAAC,EAAE,MAAM,GAAG,QAAQ,CAAC;gBAGzB,MAAM,EAAE,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC,EAC5C,KAAK,GAAE,KAAK,CAAC,oBAAoB,CAAM,EACvC,qBAAqB,GAAE,GAAG,CAChC,MAAM,EACJ,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC,GAC/C,0BAA0B,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC,GACnD,yBAAyB,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC,CACzC,EACb,MAAM,CAAC,EAAE,MAAM;IAajB;;;;OAIG;IACH,gBAAgB,CAAC,MAAM,EAAE,MAAM,GAAG,IAAI;IAItC;;;OAGG;IACH,WAAW,IAAI,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,SAAS;IAIlD;;;OAGG;IACH,cAAc,CAAC,SAAS,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIxD,IAAI,IAAI;;;kBAEP;IAED,IAAI,EAAE,IAAI,GAAG,CAEZ;IAED,IAAI,IAAI,IAAI,MAAM,CAEjB;IAED,IAAI,WAAW,IAAI,MAAM,CAExB;IAED,IAAI,KAAK;eA9OA,iBAAiB;sBACV,MAAM;kBA+OrB;IAED,UAAU,CAAC,iBAAiB,EAC1B,OAAO,EAAE,iBAAiB,CAAC,mBAAmB,EAAE,iBAAiB,EAAE,MAAM,EAAE,UAAU,CAAC,GACrF,YAAY,CACb,GAAG,EACH,MAAM,EACN,UAAU,EACV,kBAAkB,CAAC,mBAAmB,EAAE,YAAY,EAAE,OAAO,CAAC,iBAAiB,CAAC,CAAC,CAClF;IA6BD,OAAO,CAAC,cAAc,EACpB,OAAO,EAAE,cAAc,CAAC,mBAAmB,EAAE,cAAc,EAAE,MAAM,EAAE,UAAU,CAAC,GAC/E,YAAY,CACb,GAAG,EACH,MAAM,EACN,UAAU,EACV,kBAAkB,CAAC,mBAAmB,EAAE,SAAS,EAAE,OAAO,CAAC,cAAc,CAAC,CAAC,CAC5E;IAuBD,aAAa,CAAC,YAAY,SAAS,MAAM,GAAG,MAAM,EAChD,OAAO,EAAE,oBAAoB,CAAC,mBAAmB,EAAE,MAAM,EAAE,UAAU,CAAC,GACrE,YAAY,CACb,GAAG,EACH,MAAM,EACN,UAAU,EACV,kBAAkB,CAAC,mBAAmB,EAAE,eAAe,EAAE,OAAO,CAAC,YAAY,CAAC,CAAC,CAChF;IAuBD,cAAc,CAAC,aAAa,GAAG,MAAM,EACnC,OAAO,EAAE,qBAAqB,CAAC,mBAAmB,EAAE,MAAM,EAAE,UAAU,CAAC,GACtE,YAAY,CACb,GAAG,EACH,MAAM,EACN,UAAU,EACV,kBAAkB,CAAC,mBAAmB,EAAE,gBAAgB,EAAE,OAAO,CAAC,aAAa,CAAC,CAAC,CAClF;IAuBD,OAAO,KAAK,gBAAgB,GAE3B;IAEK,GAAG,CAAC,KAAK,EAAE,SAAS,CAAC,MAAM,EAAE,UAAU,CAAC,GAAG,eAAe,CAAC,mBAAmB,EAAE,MAAM,EAAE,UAAU,CAAC;IAoDzG,OAAO,CAAC,cAAc;IAkBtB,QAAQ,IAAI,KAAK,CAAC;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,IAAI,EAAE,UAAU,GAAG,QAAQ,CAAC;QAAC,WAAW,CAAC,EAAE,MAAM,CAAA;KAAE,CAAC;IAQtF,OAAO,CAAC,gBAAgB;IA+ExB,OAAO,CAAC,mBAAmB;YAab,mBAAmB;YAInB,iBAAiB;IA8F/B,OAAO,CAAC,uBAAuB;CAuBhC;AAGD,wBAAgB,YAAY,CAAC,GAAG,SAAS,MAAM,EAAE,KAAK,SAAS,MAAM,mBAAmB,EACtF,MAAM,EAAE,IAAI,CAAC,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,MAAM,CAAC,GAAG;IAClD,IAAI,EAAE,KAAK,CAAC;CACb,GACA,YAAY,CAAC,GAAG,EAAE,mBAAmB,CAAC,KAAK,CAAC,CAAC,OAAO,CAAC,EAAE,mBAAmB,CAAC,KAAK,CAAC,CAAC,QAAQ,CAAC,EAAE,EAAE,CAAC,CAAC;AAGpG,wBAAgB,YAAY,CAAC,GAAG,SAAS,MAAM,EAAE,YAAY,SAAS,CAAC,CAAC,UAAU,EAAE,aAAa,SAAS,CAAC,CAAC,UAAU,EACpH,MAAM,EAAE,IAAI,CAAC,YAAY,CAAC,GAAG,EAAE,CAAC,CAAC,KAAK,CAAC,YAAY,CAAC,EAAE,CAAC,CAAC,KAAK,CAAC,aAAa,CAAC,CAAC,EAAE,MAAM,CAAC,GAAG;IACvF,IAAI,EAAE;QAAE,KAAK,EAAE,YAAY,CAAC;QAAC,MAAM,EAAE,aAAa,CAAA;KAAE,CAAC;CACtD,GACA,YAAY,CAAC,GAAG,EAAE,CAAC,CAAC,KAAK,CAAC,YAAY,CAAC,EAAE,CAAC,CAAC,KAAK,CAAC,aAAa,CAAC,EAAE,EAAE,CAAC,CAAC;AAGxE,wBAAgB,YAAY,CAAC,MAAM,GAAG,GAAG,EAAE,UAAU,GAAG,GAAG,EAAE,GAAG,SAAS,MAAM,GAAG,MAAM,EACtF,MAAM,EAAE,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,CAAC,GAC5C,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,UAAU,EAAE,EAAE,CAAC,CAAC;AAa7C,MAAM,MAAM,iBAAiB,GAAG;IAC9B,MAAM,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC;IACzC,QAAQ,CAAC,EAAE,qBAAqB,CAAC;CAClC,CAAC;AAEF,MAAM,MAAM,aAAa,GAAG,MAAM,CAAC,MAAM,EAAE,iBAAiB,CAAC,CAAC;AAG9D,YAAY,EAAE,YAAY,EAAE,SAAS,EAAE,YAAY,EAAE,CAAC;AAEtD,OAAO,EAAE,YAAY,EAAE,CAAC"}
|
package/dist/evals/index.cjs
CHANGED
|
@@ -1,78 +1,90 @@
|
|
|
1
1
|
'use strict';
|
|
2
2
|
|
|
3
|
-
var
|
|
4
|
-
var
|
|
5
|
-
var
|
|
3
|
+
var chunk5AVTFQEP_cjs = require('../chunk-5AVTFQEP.cjs');
|
|
4
|
+
var chunkVAVK4KJI_cjs = require('../chunk-VAVK4KJI.cjs');
|
|
5
|
+
var chunk7IDACSBM_cjs = require('../chunk-7IDACSBM.cjs');
|
|
6
6
|
|
|
7
7
|
|
|
8
8
|
|
|
9
9
|
Object.defineProperty(exports, "runEvals", {
|
|
10
10
|
enumerable: true,
|
|
11
|
-
get: function () { return
|
|
11
|
+
get: function () { return chunk5AVTFQEP_cjs.runEvals; }
|
|
12
12
|
});
|
|
13
13
|
Object.defineProperty(exports, "MastraScorer", {
|
|
14
14
|
enumerable: true,
|
|
15
|
-
get: function () { return
|
|
15
|
+
get: function () { return chunkVAVK4KJI_cjs.MastraScorer; }
|
|
16
16
|
});
|
|
17
17
|
Object.defineProperty(exports, "createScorer", {
|
|
18
18
|
enumerable: true,
|
|
19
|
-
get: function () { return
|
|
19
|
+
get: function () { return chunkVAVK4KJI_cjs.createScorer; }
|
|
20
|
+
});
|
|
21
|
+
Object.defineProperty(exports, "extractTrajectory", {
|
|
22
|
+
enumerable: true,
|
|
23
|
+
get: function () { return chunk7IDACSBM_cjs.extractTrajectory; }
|
|
24
|
+
});
|
|
25
|
+
Object.defineProperty(exports, "extractTrajectoryFromTrace", {
|
|
26
|
+
enumerable: true,
|
|
27
|
+
get: function () { return chunk7IDACSBM_cjs.extractTrajectoryFromTrace; }
|
|
28
|
+
});
|
|
29
|
+
Object.defineProperty(exports, "extractWorkflowTrajectory", {
|
|
30
|
+
enumerable: true,
|
|
31
|
+
get: function () { return chunk7IDACSBM_cjs.extractWorkflowTrajectory; }
|
|
20
32
|
});
|
|
21
33
|
Object.defineProperty(exports, "listScoresResponseSchema", {
|
|
22
34
|
enumerable: true,
|
|
23
|
-
get: function () { return
|
|
35
|
+
get: function () { return chunk7IDACSBM_cjs.listScoresResponseSchema; }
|
|
24
36
|
});
|
|
25
37
|
Object.defineProperty(exports, "saveScorePayloadSchema", {
|
|
26
38
|
enumerable: true,
|
|
27
|
-
get: function () { return
|
|
39
|
+
get: function () { return chunk7IDACSBM_cjs.saveScorePayloadSchema; }
|
|
28
40
|
});
|
|
29
41
|
Object.defineProperty(exports, "scoreResultSchema", {
|
|
30
42
|
enumerable: true,
|
|
31
|
-
get: function () { return
|
|
43
|
+
get: function () { return chunk7IDACSBM_cjs.scoreResultSchema; }
|
|
32
44
|
});
|
|
33
45
|
Object.defineProperty(exports, "scoreRowDataSchema", {
|
|
34
46
|
enumerable: true,
|
|
35
|
-
get: function () { return
|
|
47
|
+
get: function () { return chunk7IDACSBM_cjs.scoreRowDataSchema; }
|
|
36
48
|
});
|
|
37
49
|
Object.defineProperty(exports, "scoringEntityTypeSchema", {
|
|
38
50
|
enumerable: true,
|
|
39
|
-
get: function () { return
|
|
51
|
+
get: function () { return chunk7IDACSBM_cjs.scoringEntityTypeSchema; }
|
|
40
52
|
});
|
|
41
53
|
Object.defineProperty(exports, "scoringExtractStepResultSchema", {
|
|
42
54
|
enumerable: true,
|
|
43
|
-
get: function () { return
|
|
55
|
+
get: function () { return chunk7IDACSBM_cjs.scoringExtractStepResultSchema; }
|
|
44
56
|
});
|
|
45
57
|
Object.defineProperty(exports, "scoringHookInputSchema", {
|
|
46
58
|
enumerable: true,
|
|
47
|
-
get: function () { return
|
|
59
|
+
get: function () { return chunk7IDACSBM_cjs.scoringHookInputSchema; }
|
|
48
60
|
});
|
|
49
61
|
Object.defineProperty(exports, "scoringInputSchema", {
|
|
50
62
|
enumerable: true,
|
|
51
|
-
get: function () { return
|
|
63
|
+
get: function () { return chunk7IDACSBM_cjs.scoringInputSchema; }
|
|
52
64
|
});
|
|
53
65
|
Object.defineProperty(exports, "scoringInputWithExtractStepResultAndAnalyzeStepResultSchema", {
|
|
54
66
|
enumerable: true,
|
|
55
|
-
get: function () { return
|
|
67
|
+
get: function () { return chunk7IDACSBM_cjs.scoringInputWithExtractStepResultAndAnalyzeStepResultSchema; }
|
|
56
68
|
});
|
|
57
69
|
Object.defineProperty(exports, "scoringInputWithExtractStepResultAndScoreAndReasonSchema", {
|
|
58
70
|
enumerable: true,
|
|
59
|
-
get: function () { return
|
|
71
|
+
get: function () { return chunk7IDACSBM_cjs.scoringInputWithExtractStepResultAndScoreAndReasonSchema; }
|
|
60
72
|
});
|
|
61
73
|
Object.defineProperty(exports, "scoringInputWithExtractStepResultSchema", {
|
|
62
74
|
enumerable: true,
|
|
63
|
-
get: function () { return
|
|
75
|
+
get: function () { return chunk7IDACSBM_cjs.scoringInputWithExtractStepResultSchema; }
|
|
64
76
|
});
|
|
65
77
|
Object.defineProperty(exports, "scoringPromptsSchema", {
|
|
66
78
|
enumerable: true,
|
|
67
|
-
get: function () { return
|
|
79
|
+
get: function () { return chunk7IDACSBM_cjs.scoringPromptsSchema; }
|
|
68
80
|
});
|
|
69
81
|
Object.defineProperty(exports, "scoringSourceSchema", {
|
|
70
82
|
enumerable: true,
|
|
71
|
-
get: function () { return
|
|
83
|
+
get: function () { return chunk7IDACSBM_cjs.scoringSourceSchema; }
|
|
72
84
|
});
|
|
73
85
|
Object.defineProperty(exports, "scoringValueSchema", {
|
|
74
86
|
enumerable: true,
|
|
75
|
-
get: function () { return
|
|
87
|
+
get: function () { return chunk7IDACSBM_cjs.scoringValueSchema; }
|
|
76
88
|
});
|
|
77
89
|
//# sourceMappingURL=index.cjs.map
|
|
78
90
|
//# sourceMappingURL=index.cjs.map
|
package/dist/evals/index.js
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
export { runEvals } from '../chunk-
|
|
2
|
-
export { MastraScorer, createScorer } from '../chunk-
|
|
3
|
-
export { listScoresResponseSchema, saveScorePayloadSchema, scoreResultSchema, scoreRowDataSchema, scoringEntityTypeSchema, scoringExtractStepResultSchema, scoringHookInputSchema, scoringInputSchema, scoringInputWithExtractStepResultAndAnalyzeStepResultSchema, scoringInputWithExtractStepResultAndScoreAndReasonSchema, scoringInputWithExtractStepResultSchema, scoringPromptsSchema, scoringSourceSchema, scoringValueSchema } from '../chunk-
|
|
1
|
+
export { runEvals } from '../chunk-JEWTRDRI.js';
|
|
2
|
+
export { MastraScorer, createScorer } from '../chunk-VF3CL3JV.js';
|
|
3
|
+
export { extractTrajectory, extractTrajectoryFromTrace, extractWorkflowTrajectory, listScoresResponseSchema, saveScorePayloadSchema, scoreResultSchema, scoreRowDataSchema, scoringEntityTypeSchema, scoringExtractStepResultSchema, scoringHookInputSchema, scoringInputSchema, scoringInputWithExtractStepResultAndAnalyzeStepResultSchema, scoringInputWithExtractStepResultAndScoreAndReasonSchema, scoringInputWithExtractStepResultSchema, scoringPromptsSchema, scoringSourceSchema, scoringValueSchema } from '../chunk-VMKNS3YO.js';
|
|
4
4
|
//# sourceMappingURL=index.js.map
|
|
5
5
|
//# sourceMappingURL=index.js.map
|
|
@@ -11,12 +11,23 @@ type WorkflowRunOptions = WorkflowRunStartOptions & {
|
|
|
11
11
|
type RunEvalsDataItem<TTarget = unknown> = {
|
|
12
12
|
input: TTarget extends Workflow<any, any> ? any : TTarget extends Agent ? string | string[] | CoreMessage[] | AiMessageType[] | UIMessageWithMetadata[] : unknown;
|
|
13
13
|
groundTruth?: any;
|
|
14
|
+
expectedTrajectory?: any;
|
|
14
15
|
requestContext?: RequestContext;
|
|
15
16
|
startOptions?: WorkflowRunOptions;
|
|
16
17
|
} & Partial<ObservabilityContext>;
|
|
17
|
-
type WorkflowScorerConfig = {
|
|
18
|
+
export type WorkflowScorerConfig = {
|
|
19
|
+
/** Scorers that evaluate the overall workflow input/output */
|
|
18
20
|
workflow?: MastraScorer<any, any, any, any>[];
|
|
21
|
+
/** Scorers that evaluate individual workflow steps by step ID */
|
|
19
22
|
steps?: Record<string, MastraScorer<any, any, any, any>[]>;
|
|
23
|
+
/** Scorers that evaluate the workflow's step execution trajectory */
|
|
24
|
+
trajectory?: MastraScorer<any, any, any, any>[];
|
|
25
|
+
};
|
|
26
|
+
export type AgentScorerConfig = {
|
|
27
|
+
/** Scorers that evaluate the full agent input/output */
|
|
28
|
+
agent?: MastraScorer<any, any, any, any>[];
|
|
29
|
+
/** Scorers that evaluate the agent's tool call trajectory */
|
|
30
|
+
trajectory?: MastraScorer<any, any, any, any>[];
|
|
20
31
|
};
|
|
21
32
|
type RunEvalsResult = {
|
|
22
33
|
scores: Record<string, any>;
|
|
@@ -59,6 +70,22 @@ export declare function runEvals<TWorkflow extends AnyWorkflow>(config: {
|
|
|
59
70
|
scorerResults: {
|
|
60
71
|
workflow?: Record<string, any>;
|
|
61
72
|
steps?: Record<string, Record<string, any>>;
|
|
73
|
+
trajectory?: Record<string, any>;
|
|
74
|
+
};
|
|
75
|
+
}) => void | Promise<void>;
|
|
76
|
+
concurrency?: number;
|
|
77
|
+
}): Promise<RunEvalsResult>;
|
|
78
|
+
export declare function runEvals<TAgent extends Agent>(config: {
|
|
79
|
+
data: RunEvalsDataItem<TAgent>[];
|
|
80
|
+
scorers: AgentScorerConfig;
|
|
81
|
+
target: TAgent;
|
|
82
|
+
targetOptions?: Omit<AgentExecutionOptions<any>, 'scorers' | 'returnScorerData' | 'requestContext'>;
|
|
83
|
+
onItemComplete?: (params: {
|
|
84
|
+
item: RunEvalsDataItem<TAgent>;
|
|
85
|
+
targetResult: Awaited<ReturnType<Agent['generate']>>;
|
|
86
|
+
scorerResults: {
|
|
87
|
+
agent?: Record<string, any>;
|
|
88
|
+
trajectory?: Record<string, any>;
|
|
62
89
|
};
|
|
63
90
|
}) => void | Promise<void>;
|
|
64
91
|
concurrency?: number;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/evals/run/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,qBAAqB,CAAC;AACvD,OAAO,KAAK,EAAE,KAAK,EAAE,qBAAqB,EAAE,aAAa,EAAE,qBAAqB,EAAE,MAAM,aAAa,CAAC;AAItG,OAAO,KAAK,EAAE,oBAAoB,EAAE,MAAM,qBAAqB,CAAC;AAEhE,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/evals/run/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,qBAAqB,CAAC;AACvD,OAAO,KAAK,EAAE,KAAK,EAAE,qBAAqB,EAAE,aAAa,EAAE,qBAAqB,EAAE,MAAM,aAAa,CAAC;AAItG,OAAO,KAAK,EAAE,oBAAoB,EAAE,MAAM,qBAAqB,CAAC;AAEhE,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;AAE5D,OAAO,EAAE,QAAQ,EAAE,MAAM,iBAAiB,CAAC;AAC3C,OAAO,KAAK,EAAE,WAAW,EAAE,cAAc,EAAE,uBAAuB,EAAc,MAAM,iBAAiB,CAAC;AACxG,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,SAAS,CAAC;AAI5C,KAAK,kBAAkB,GAAG,uBAAuB,GAAG;IAClD,YAAY,CAAC,EAAE,GAAG,CAAC;CACpB,CAAC;AAEF,KAAK,gBAAgB,CAAC,OAAO,GAAG,OAAO,IAAI;IACzC,KAAK,EAAE,OAAO,SAAS,QAAQ,CAAC,GAAG,EAAE,GAAG,CAAC,GACrC,GAAG,GACH,OAAO,SAAS,KAAK,GACnB,MAAM,GAAG,MAAM,EAAE,GAAG,WAAW,EAAE,GAAG,aAAa,EAAE,GAAG,qBAAqB,EAAE,GAC7E,OAAO,CAAC;IACd,WAAW,CAAC,EAAE,GAAG,CAAC;IAClB,kBAAkB,CAAC,EAAE,GAAG,CAAC;IACzB,cAAc,CAAC,EAAE,cAAc,CAAC;IAChC,YAAY,CAAC,EAAE,kBAAkB,CAAC;CACnC,GAAG,OAAO,CAAC,oBAAoB,CAAC,CAAC;AAElC,MAAM,MAAM,oBAAoB,GAAG;IACjC,8DAA8D;IAC9D,QAAQ,CAAC,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;IAC9C,iEAAiE;IACjE,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC,CAAC;IAC3D,qEAAqE;IACrE,UAAU,CAAC,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;CACjD,CAAC;AAEF,MAAM,MAAM,iBAAiB,GAAG;IAC9B,wDAAwD;IACxD,KAAK,CAAC,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;IAC3C,6DAA6D;IAC7D,UAAU,CAAC,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;CACjD,CAAC;AAEF,KAAK,cAAc,GAAG;IACpB,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAC5B,OAAO,EAAE;QACP,UAAU,EAAE,MAAM,CAAC;KACpB,CAAC;CACH,CAAC;AAGF,wBAAgB,QAAQ,CAAC,MAAM,SAAS,KAAK,EAAE,MAAM,EAAE;IACrD,IAAI,EAAE,gBAAgB,CAAC,MAAM,CAAC,EAAE,CAAC;IACjC,OAAO,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;IAC5C,MAAM,EAAE,MAAM,CAAC;IACf,aAAa,CAAC,EAAE,IAAI,CAAC,qBAAqB,CAAC,GAAG,CAAC,EAAE,SAAS,GAAG,kBAAkB,GAAG,gBAAgB,CAAC,CAAC;IACpG,cAAc,CAAC,EAAE,CAAC,MAAM,EAAE;QACxB,IAAI,EAAE,gBAAgB,CAAC,MAAM,CAAC,CAAC;QAC/B,YAAY,EAAE,OAAO,CAAC,UAAU,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACrD,aAAa,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;KACpC,KAAK,IAAI,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IAC3B,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB,GAAG,OAAO,CAAC,cAAc,CAAC,CAAC;AAG5B,wBAAgB,QAAQ,CAAC,SAAS,SAAS,WAAW,EAAE,MAAM,EAAE;IAC9D,IAAI,EAAE,gBAAgB,CAAC,SAAS,CAAC,EAAE,CAAC;IACpC,OAAO,EAAE,YAAY,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,EAAE,CAAC;IAC5C,MAAM,EAAE,SAAS,CAAC;IAClB,aAAa,CAAC,EAAE,kBAAkB,CAAC;IACnC,cAAc,CAAC,EAAE,CAAC,MAAM,EAAE;QACxB,IAAI,EAAE,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAClC,YAAY,EAAE,cAAc,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC;QACjD,aAAa,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;KACpC,KAAK,IAAI,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IAC3B,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB,GAAG,OAAO,CAAC,cAAc,CAAC,CAAC;AAG5B,wBAAgB,QAAQ,CAAC,SAAS,SAAS,WAAW,EAAE,MAAM,EAAE;IAC9D,IAAI,EAAE,gBAAgB,CAAC,SAAS,CAAC,EAAE,CAAC;IACpC,OAAO,EAAE,oBAAoB,CAAC;IAC9B,MAAM,EAAE,SAAS,CAAC;IAClB,aAAa,CAAC,EAAE,kBAAkB,CAAC;IACnC,cAAc,CAAC,EAAE,CAAC,MAAM,EAAE;QACxB,IAAI,EAAE,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAClC,YAAY,EAAE,cAAc,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC;QACjD,aAAa,EAAE;YACb,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;YAC/B,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,CAAC;YAC5C,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;SAClC,CAAC;KACH,KAAK,IAAI,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IAC3B,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB,GAAG,OAAO,CAAC,cAAc,CAAC,CAAC;AAG5B,wBAAgB,QAAQ,CAAC,MAAM,SAAS,KAAK,EAAE,MAAM,EAAE;IACrD,IAAI,EAAE,gBAAgB,CAAC,MAAM,CAAC,EAAE,CAAC;IACjC,OAAO,EAAE,iBAAiB,CAAC;IAC3B,MAAM,EAAE,MAAM,CAAC;IACf,aAAa,CAAC,EAAE,IAAI,CAAC,qBAAqB,CAAC,GAAG,CAAC,EAAE,SAAS,GAAG,kBAAkB,GAAG,gBAAgB,CAAC,CAAC;IACpG,cAAc,CAAC,EAAE,CAAC,MAAM,EAAE;QACxB,IAAI,EAAE,gBAAgB,CAAC,MAAM,CAAC,CAAC;QAC/B,YAAY,EAAE,OAAO,CAAC,UAAU,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACrD,aAAa,EAAE;YACb,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;YAC5B,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;SAClC,CAAC;KACH,KAAK,IAAI,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC;IAC3B,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB,GAAG,OAAO,CAAC,cAAc,CAAC,CAAC"}
|
|
@@ -2,9 +2,12 @@ export declare class ScoreAccumulator {
|
|
|
2
2
|
private flatScores;
|
|
3
3
|
private workflowScores;
|
|
4
4
|
private stepScores;
|
|
5
|
+
private agentScores;
|
|
6
|
+
private trajectoryScores;
|
|
5
7
|
addScores(scorerResults: Record<string, any>): void;
|
|
6
8
|
private addFlatScores;
|
|
7
|
-
private
|
|
9
|
+
private addWorkflowScores;
|
|
10
|
+
private addAgentScores;
|
|
8
11
|
addStepScores(stepScorerResults: Record<string, Record<string, any>>): void;
|
|
9
12
|
getAverageScores(): Record<string, any>;
|
|
10
13
|
private getAverageScore;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"scorerAccumulator.d.ts","sourceRoot":"","sources":["../../../src/evals/run/scorerAccumulator.ts"],"names":[],"mappings":"AAAA,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,UAAU,CAAgC;IAClD,OAAO,CAAC,cAAc,CAAgC;IACtD,OAAO,CAAC,UAAU,CAAgD;
|
|
1
|
+
{"version":3,"file":"scorerAccumulator.d.ts","sourceRoot":"","sources":["../../../src/evals/run/scorerAccumulator.ts"],"names":[],"mappings":"AAAA,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,UAAU,CAAgC;IAClD,OAAO,CAAC,cAAc,CAAgC;IACtD,OAAO,CAAC,UAAU,CAAgD;IAClE,OAAO,CAAC,WAAW,CAAgC;IACnD,OAAO,CAAC,gBAAgB,CAAgC;IAExD,SAAS,CAAC,aAAa,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC;IAiB5C,OAAO,CAAC,aAAa;IASrB,OAAO,CAAC,iBAAiB;IAmCzB,OAAO,CAAC,cAAc;IAoBtB,aAAa,CAAC,iBAAiB,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAcpE,gBAAgB,IAAI,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC;IA4CvC,OAAO,CAAC,eAAe;CAOxB"}
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
'use strict';
|
|
2
2
|
|
|
3
|
-
var
|
|
4
|
-
var
|
|
3
|
+
var chunkT2CILERS_cjs = require('../../chunk-T2CILERS.cjs');
|
|
4
|
+
var chunk7IDACSBM_cjs = require('../../chunk-7IDACSBM.cjs');
|
|
5
5
|
var chunkG5HKDGNT_cjs = require('../../chunk-G5HKDGNT.cjs');
|
|
6
6
|
var chunk4U7ZLI36_cjs = require('../../chunk-4U7ZLI36.cjs');
|
|
7
7
|
var pMap = require('p-map');
|
|
@@ -235,7 +235,7 @@ function transformTraceToScorerInputAndOutput(trace) {
|
|
|
235
235
|
}
|
|
236
236
|
|
|
237
237
|
// src/evals/scoreTraces/scoreTracesWorkflow.ts
|
|
238
|
-
var getTraceStep =
|
|
238
|
+
var getTraceStep = chunkT2CILERS_cjs.createStep({
|
|
239
239
|
id: "__process-trace-scoring",
|
|
240
240
|
inputSchema: v4.z.object({
|
|
241
241
|
targets: v4.z.array(
|
|
@@ -383,7 +383,7 @@ async function validateAndSaveScore({ storage, scorerResult }) {
|
|
|
383
383
|
text: "Scores storage domain is not available"
|
|
384
384
|
});
|
|
385
385
|
}
|
|
386
|
-
const payloadToSave =
|
|
386
|
+
const payloadToSave = chunk7IDACSBM_cjs.saveScorePayloadSchema.parse(scorerResult);
|
|
387
387
|
const result = await scoresStore.saveScore(payloadToSave);
|
|
388
388
|
return result.score;
|
|
389
389
|
}
|
|
@@ -446,7 +446,7 @@ async function attachScoreToSpan({
|
|
|
446
446
|
} catch {
|
|
447
447
|
}
|
|
448
448
|
}
|
|
449
|
-
var scoreTracesWorkflow =
|
|
449
|
+
var scoreTracesWorkflow = chunkT2CILERS_cjs.createWorkflow({
|
|
450
450
|
id: "__batch-scoring-traces",
|
|
451
451
|
inputSchema: v4.z.object({
|
|
452
452
|
targets: v4.z.array(
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { createStep, createWorkflow } from '../../chunk-
|
|
2
|
-
import { saveScorePayloadSchema } from '../../chunk-
|
|
1
|
+
import { createStep, createWorkflow } from '../../chunk-YN3FI4AD.js';
|
|
2
|
+
import { saveScorePayloadSchema } from '../../chunk-VMKNS3YO.js';
|
|
3
3
|
import { resolveObservabilityContext } from '../../chunk-CT4YYQI3.js';
|
|
4
4
|
import { MastraError } from '../../chunk-FJEVLHJT.js';
|
|
5
5
|
import pMap from 'p-map';
|