agentv 3.14.6 → 4.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,11 +1,13 @@
1
1
  import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
2
2
  import {
3
3
  CLI_PLACEHOLDERS,
4
+ COMMON_TARGET_SETTINGS,
4
5
  KNOWN_PROVIDERS,
5
6
  PROVIDER_ALIASES,
6
7
  ResponseCache,
7
8
  buildDirectoryChain,
8
9
  buildSearchRoots,
10
+ deriveCategory,
9
11
  ensureVSCodeSubagents,
10
12
  findGitRoot,
11
13
  interpolateEnv,
@@ -27,12 +29,12 @@ import {
27
29
  subscribeToCopilotCliLogEntries,
28
30
  subscribeToCopilotSdkLogEntries,
29
31
  subscribeToPiLogEntries
30
- } from "./chunk-ELQEFMGO.js";
32
+ } from "./chunk-XEAW7OQT.js";
31
33
 
32
34
  // package.json
33
35
  var package_default = {
34
36
  name: "agentv",
35
- version: "3.14.6",
37
+ version: "4.1.0",
36
38
  description: "CLI entry point for AgentV",
37
39
  type: "module",
38
40
  repository: {
@@ -110,6 +112,24 @@ async function resolveEvalPaths(evalPaths, cwd) {
110
112
  results.add(candidatePath);
111
113
  continue;
112
114
  }
115
+ if (stats.isDirectory()) {
116
+ const dirGlob = path.posix.join(candidatePath.replace(/\\/g, "/"), "**/*.eval.{yaml,yml}");
117
+ const dirMatches = await fg(dirGlob, {
118
+ absolute: true,
119
+ onlyFiles: true,
120
+ unique: true,
121
+ dot: true,
122
+ followSymbolicLinks: true
123
+ });
124
+ if (dirMatches.length === 0) {
125
+ unmatched.push(pattern);
126
+ } else {
127
+ for (const filePath of dirMatches) {
128
+ results.add(path.normalize(filePath));
129
+ }
130
+ }
131
+ continue;
132
+ }
113
133
  } catch {
114
134
  }
115
135
  const globPattern = pattern.includes("\\") ? pattern.replace(/\\/g, "/") : pattern;
@@ -562,20 +582,16 @@ function safeArtifactPathSegment(value, fallback) {
562
582
  function safeTestId(testId) {
563
583
  return safeArtifactPathSegment(testId, "unknown");
564
584
  }
565
- function safeTargetId(target) {
566
- return safeArtifactPathSegment(target, "default");
567
- }
568
- function getEvalSet(result) {
569
- const record = result;
570
- return result.eval_set ?? record.evalSet;
585
+ function getDataset(result) {
586
+ return result.dataset;
571
587
  }
572
588
  function buildArtifactSubdir(result) {
573
589
  const segments = [];
574
- const evalSet = getEvalSet(result);
590
+ const evalSet = getDataset(result);
575
591
  if (evalSet) {
576
592
  segments.push(safeArtifactPathSegment(evalSet, "default"));
577
593
  }
578
- segments.push(safeTestId(result.testId), safeTargetId(result.target));
594
+ segments.push(safeTestId(result.testId));
579
595
  return path4.posix.join(...segments);
580
596
  }
581
597
  function formatOutputMarkdown(output) {
@@ -598,7 +614,8 @@ function buildResultIndexArtifact(result) {
598
614
  return {
599
615
  timestamp: result.timestamp,
600
616
  test_id: result.testId ?? "unknown",
601
- eval_set: getEvalSet(result),
617
+ dataset: getDataset(result),
618
+ category: result.category,
602
619
  conversation_id: result.conversationId,
603
620
  score: result.score,
604
621
  target: result.target ?? "unknown",
@@ -1667,7 +1684,7 @@ var JunitWriter = class _JunitWriter {
1667
1684
  this.closed = true;
1668
1685
  const grouped = /* @__PURE__ */ new Map();
1669
1686
  for (const result of this.results) {
1670
- const suite = result.eval_set ?? "default";
1687
+ const suite = result.dataset ?? "default";
1671
1688
  const existing = grouped.get(suite);
1672
1689
  if (existing) {
1673
1690
  existing.push(result);
@@ -1995,7 +2012,8 @@ function hydrateManifestRecord(baseDir, record) {
1995
2012
  return {
1996
2013
  timestamp: record.timestamp,
1997
2014
  testId,
1998
- eval_set: record.eval_set,
2015
+ dataset: record.dataset,
2016
+ category: record.category,
1999
2017
  target: record.target,
2000
2018
  score: record.score,
2001
2019
  executionStatus: record.execution_status,
@@ -2053,6 +2071,7 @@ function loadLightweightResults(sourceFile) {
2053
2071
  return parseResultManifest(content).map((record) => ({
2054
2072
  testId: record.test_id ?? record.eval_id ?? "unknown",
2055
2073
  target: record.target,
2074
+ experiment: record.experiment,
2056
2075
  score: record.score,
2057
2076
  scores: record.scores,
2058
2077
  executionStatus: record.execution_status,
@@ -3020,7 +3039,7 @@ function validateContentForRoleMarkers(content, location, filePath, errors) {
3020
3039
  function isObject2(value) {
3021
3040
  return typeof value === "object" && value !== null && !Array.isArray(value);
3022
3041
  }
3023
- var COMMON_SETTINGS = /* @__PURE__ */ new Set(["provider_batching", "providerBatching"]);
3042
+ var COMMON_SETTINGS = new Set(COMMON_TARGET_SETTINGS);
3024
3043
  var RETRY_SETTINGS = /* @__PURE__ */ new Set([
3025
3044
  "max_retries",
3026
3045
  "maxRetries",
@@ -4140,9 +4159,12 @@ async function prepareFileMetadata(params) {
4140
4159
  repoRoot,
4141
4160
  verbose: options.verbose
4142
4161
  });
4162
+ const relativePath = path15.relative(cwd, testFilePath);
4163
+ const category = deriveCategory(relativePath);
4143
4164
  const suite = await loadTestSuite(testFilePath, repoRoot, {
4144
4165
  verbose: options.verbose,
4145
- filter: options.filter
4166
+ filter: options.filter,
4167
+ category
4146
4168
  });
4147
4169
  const filteredIds = suite.tests.map((value) => value.id);
4148
4170
  const cliTargets = options.cliTargets;
@@ -4421,7 +4443,7 @@ async function runEvalCommand(input) {
4421
4443
  const useFileExport = !!options.otelFile;
4422
4444
  if (options.exportOtel || useFileExport) {
4423
4445
  try {
4424
- const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-5EEXTTC3.js");
4446
+ const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-2JUUJ6PT.js");
4425
4447
  let endpoint = process.env.OTEL_EXPORTER_OTLP_ENDPOINT;
4426
4448
  let headers = {};
4427
4449
  if (options.otelBackend) {
@@ -4794,6 +4816,7 @@ export {
4794
4816
  resolveExistingRunPrimaryPath,
4795
4817
  resolveWorkspaceOrFilePath,
4796
4818
  writeArtifactsFromResults,
4819
+ parseResultManifest,
4797
4820
  resolveResultSourcePath,
4798
4821
  loadManifestResults,
4799
4822
  loadLightweightResults,
@@ -4812,4 +4835,4 @@ export {
4812
4835
  selectTarget,
4813
4836
  runEvalCommand
4814
4837
  };
4815
- //# sourceMappingURL=chunk-Y25VL7PX.js.map
4838
+ //# sourceMappingURL=chunk-4Z326WWF.js.map