agentv 4.12.2 → 4.12.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -46,7 +46,7 @@ import {
46
46
  // package.json
47
47
  var package_default = {
48
48
  name: "agentv",
49
- version: "4.12.2",
49
+ version: "4.12.3",
50
50
  description: "CLI entry point for AgentV",
51
51
  type: "module",
52
52
  repository: {
@@ -473,19 +473,23 @@ function hydrateManifestRecord(baseDir, record) {
473
473
  passed: assertion.passed,
474
474
  evidence: assertion.evidence
475
475
  })),
476
- scores: grading?.evaluators?.map((evaluator) => ({
477
- name: evaluator.name,
478
- type: evaluator.type,
479
- score: evaluator.score,
480
- assertions: Array.isArray(evaluator.assertions) ? evaluator.assertions.map((assertion) => ({
481
- text: String(assertion.text ?? ""),
482
- passed: Boolean(assertion.passed),
483
- evidence: typeof assertion.evidence === "string" ? String(assertion.evidence) : void 0
484
- })) : void 0,
485
- weight: typeof evaluator.weight === "number" ? evaluator.weight : void 0,
486
- verdict: typeof evaluator.verdict === "string" ? evaluator.verdict : void 0,
487
- details: evaluator.details
488
- })) ?? record.scores,
476
+ scores: (
477
+ // `evaluators` was renamed to `graders` in v4.12.3 — read both for backwards compat with old artifacts.
478
+ // TODO: remove `evaluators` fallback once old run directories are no longer in use.
479
+ (grading?.graders ?? grading?.evaluators)?.map((evaluator) => ({
480
+ name: evaluator.name,
481
+ type: evaluator.type,
482
+ score: evaluator.score,
483
+ assertions: Array.isArray(evaluator.assertions) ? evaluator.assertions.map((assertion) => ({
484
+ text: String(assertion.text ?? ""),
485
+ passed: Boolean(assertion.passed),
486
+ evidence: typeof assertion.evidence === "string" ? String(assertion.evidence) : void 0
487
+ })) : void 0,
488
+ weight: typeof evaluator.weight === "number" ? evaluator.weight : void 0,
489
+ verdict: typeof evaluator.verdict === "string" ? evaluator.verdict : void 0,
490
+ details: evaluator.details
491
+ })) ?? record.scores
492
+ ),
489
493
  tokenUsage: timing?.token_usage ? {
490
494
  input: timing.token_usage.input,
491
495
  output: timing.token_usage.output,
@@ -1264,7 +1268,7 @@ function buildGradingArtifact(result) {
1264
1268
  total_tool_calls: totalToolCalls,
1265
1269
  errors_encountered: errorsEncountered
1266
1270
  },
1267
- evaluators: buildEvaluators(result.scores),
1271
+ graders: buildEvaluators(result.scores),
1268
1272
  workspace_changes: parseWorkspaceChanges(result.fileChanges),
1269
1273
  conversation: result.conversationId ? {
1270
1274
  turns: result.trace ? result.trace.steps?.length ?? 0 : 0,
@@ -5771,4 +5775,4 @@ export {
5771
5775
  getCategories,
5772
5776
  filterByCategory
5773
5777
  };
5774
- //# sourceMappingURL=chunk-GSVQGON2.js.map
5778
+ //# sourceMappingURL=chunk-LL6TC7UU.js.map