agentv 4.12.2 → 4.12.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{chunk-GSVQGON2.js → chunk-LL6TC7UU.js} +20 -16
- package/dist/chunk-LL6TC7UU.js.map +1 -0
- package/dist/{chunk-S3YQYLZN.js → chunk-ZT6ZFMKJ.js} +9 -6
- package/dist/chunk-ZT6ZFMKJ.js.map +1 -0
- package/dist/cli.js +2 -2
- package/dist/index.js +2 -2
- package/dist/{interactive-ZGCO5PVL.js → interactive-VI3QHT7A.js} +2 -2
- package/package.json +1 -1
- package/dist/chunk-GSVQGON2.js.map +0 -1
- package/dist/chunk-S3YQYLZN.js.map +0 -1
- package/dist/{interactive-ZGCO5PVL.js.map → interactive-VI3QHT7A.js.map} +0 -0
|
@@ -46,7 +46,7 @@ import {
|
|
|
46
46
|
// package.json
|
|
47
47
|
var package_default = {
|
|
48
48
|
name: "agentv",
|
|
49
|
-
version: "4.12.2",
|
|
49
|
+
version: "4.12.3",
|
|
50
50
|
description: "CLI entry point for AgentV",
|
|
51
51
|
type: "module",
|
|
52
52
|
repository: {
|
|
@@ -473,19 +473,23 @@ function hydrateManifestRecord(baseDir, record) {
|
|
|
473
473
|
passed: assertion.passed,
|
|
474
474
|
evidence: assertion.evidence
|
|
475
475
|
})),
|
|
476
|
-
scores:
|
|
477
|
-
|
|
478
|
-
|
|
479
|
-
|
|
480
|
-
|
|
481
|
-
|
|
482
|
-
|
|
483
|
-
|
|
484
|
-
|
|
485
|
-
|
|
486
|
-
|
|
487
|
-
|
|
488
|
-
|
|
476
|
+
scores: (
|
|
477
|
+
// `evaluators` was renamed to `graders` in v4.13 — read both for backwards compat with old artifacts.
|
|
478
|
+
// TODO: remove `evaluators` fallback once old run directories are no longer in use.
|
|
479
|
+
(grading?.graders ?? grading?.evaluators)?.map((evaluator) => ({
|
|
480
|
+
name: evaluator.name,
|
|
481
|
+
type: evaluator.type,
|
|
482
|
+
score: evaluator.score,
|
|
483
|
+
assertions: Array.isArray(evaluator.assertions) ? evaluator.assertions.map((assertion) => ({
|
|
484
|
+
text: String(assertion.text ?? ""),
|
|
485
|
+
passed: Boolean(assertion.passed),
|
|
486
|
+
evidence: typeof assertion.evidence === "string" ? String(assertion.evidence) : void 0
|
|
487
|
+
})) : void 0,
|
|
488
|
+
weight: typeof evaluator.weight === "number" ? evaluator.weight : void 0,
|
|
489
|
+
verdict: typeof evaluator.verdict === "string" ? evaluator.verdict : void 0,
|
|
490
|
+
details: evaluator.details
|
|
491
|
+
})) ?? record.scores
|
|
492
|
+
),
|
|
489
493
|
tokenUsage: timing?.token_usage ? {
|
|
490
494
|
input: timing.token_usage.input,
|
|
491
495
|
output: timing.token_usage.output,
|
|
@@ -1264,7 +1268,7 @@ function buildGradingArtifact(result) {
|
|
|
1264
1268
|
total_tool_calls: totalToolCalls,
|
|
1265
1269
|
errors_encountered: errorsEncountered
|
|
1266
1270
|
},
|
|
1267
|
-
|
|
1271
|
+
graders: buildEvaluators(result.scores),
|
|
1268
1272
|
workspace_changes: parseWorkspaceChanges(result.fileChanges),
|
|
1269
1273
|
conversation: result.conversationId ? {
|
|
1270
1274
|
turns: result.trace ? result.trace.steps?.length ?? 0 : 0,
|
|
@@ -5771,4 +5775,4 @@ export {
|
|
|
5771
5775
|
getCategories,
|
|
5772
5776
|
filterByCategory
|
|
5773
5777
|
};
|
|
5774
|
-
//# sourceMappingURL=chunk-GSVQGON2.js.map
|
|
5778
|
+
//# sourceMappingURL=chunk-LL6TC7UU.js.map
|