agentv 3.14.6 → 4.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +59 -533
- package/dist/{chunk-CQRWNXVG.js → chunk-2W5JKKXC.js} +537 -727
- package/dist/chunk-2W5JKKXC.js.map +1 -0
- package/dist/{chunk-Y25VL7PX.js → chunk-4Z326WWF.js} +40 -17
- package/dist/chunk-4Z326WWF.js.map +1 -0
- package/dist/{chunk-ELQEFMGO.js → chunk-XEAW7OQT.js} +594 -296
- package/dist/chunk-XEAW7OQT.js.map +1 -0
- package/dist/cli.js +3 -3
- package/dist/{dist-5EEXTTC3.js → dist-2JUUJ6PT.js} +18 -2
- package/dist/index.js +3 -3
- package/dist/{interactive-5ESM5DWV.js → interactive-7ZYS6IOC.js} +4 -11
- package/dist/interactive-7ZYS6IOC.js.map +1 -0
- package/dist/studio/assets/index-CDGReinH.js +71 -0
- package/dist/studio/assets/index-DofvSOmX.js +11 -0
- package/dist/studio/assets/index-izxfmBKC.css +1 -0
- package/dist/studio/index.html +13 -0
- package/package.json +1 -1
- package/dist/chunk-CQRWNXVG.js.map +0 -1
- package/dist/chunk-ELQEFMGO.js.map +0 -1
- package/dist/chunk-Y25VL7PX.js.map +0 -1
- package/dist/interactive-5ESM5DWV.js.map +0 -1
- package/dist/{dist-5EEXTTC3.js.map → dist-2JUUJ6PT.js.map} +0 -0
|
@@ -1,11 +1,13 @@
|
|
|
1
1
|
import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
|
|
2
2
|
import {
|
|
3
3
|
CLI_PLACEHOLDERS,
|
|
4
|
+
COMMON_TARGET_SETTINGS,
|
|
4
5
|
KNOWN_PROVIDERS,
|
|
5
6
|
PROVIDER_ALIASES,
|
|
6
7
|
ResponseCache,
|
|
7
8
|
buildDirectoryChain,
|
|
8
9
|
buildSearchRoots,
|
|
10
|
+
deriveCategory,
|
|
9
11
|
ensureVSCodeSubagents,
|
|
10
12
|
findGitRoot,
|
|
11
13
|
interpolateEnv,
|
|
@@ -27,12 +29,12 @@ import {
|
|
|
27
29
|
subscribeToCopilotCliLogEntries,
|
|
28
30
|
subscribeToCopilotSdkLogEntries,
|
|
29
31
|
subscribeToPiLogEntries
|
|
30
|
-
} from "./chunk-ELQEFMGO.js";
|
|
32
|
+
} from "./chunk-XEAW7OQT.js";
|
|
31
33
|
|
|
32
34
|
// package.json
|
|
33
35
|
var package_default = {
|
|
34
36
|
name: "agentv",
|
|
35
|
-
version: "3.14.6",
|
|
37
|
+
version: "4.1.0",
|
|
36
38
|
description: "CLI entry point for AgentV",
|
|
37
39
|
type: "module",
|
|
38
40
|
repository: {
|
|
@@ -110,6 +112,24 @@ async function resolveEvalPaths(evalPaths, cwd) {
|
|
|
110
112
|
results.add(candidatePath);
|
|
111
113
|
continue;
|
|
112
114
|
}
|
|
115
|
+
if (stats.isDirectory()) {
|
|
116
|
+
const dirGlob = path.posix.join(candidatePath.replace(/\\/g, "/"), "**/*.eval.{yaml,yml}");
|
|
117
|
+
const dirMatches = await fg(dirGlob, {
|
|
118
|
+
absolute: true,
|
|
119
|
+
onlyFiles: true,
|
|
120
|
+
unique: true,
|
|
121
|
+
dot: true,
|
|
122
|
+
followSymbolicLinks: true
|
|
123
|
+
});
|
|
124
|
+
if (dirMatches.length === 0) {
|
|
125
|
+
unmatched.push(pattern);
|
|
126
|
+
} else {
|
|
127
|
+
for (const filePath of dirMatches) {
|
|
128
|
+
results.add(path.normalize(filePath));
|
|
129
|
+
}
|
|
130
|
+
}
|
|
131
|
+
continue;
|
|
132
|
+
}
|
|
113
133
|
} catch {
|
|
114
134
|
}
|
|
115
135
|
const globPattern = pattern.includes("\\") ? pattern.replace(/\\/g, "/") : pattern;
|
|
@@ -562,20 +582,16 @@ function safeArtifactPathSegment(value, fallback) {
|
|
|
562
582
|
function safeTestId(testId) {
|
|
563
583
|
return safeArtifactPathSegment(testId, "unknown");
|
|
564
584
|
}
|
|
565
|
-
function
|
|
566
|
-
return
|
|
567
|
-
}
|
|
568
|
-
function getEvalSet(result) {
|
|
569
|
-
const record = result;
|
|
570
|
-
return result.eval_set ?? record.evalSet;
|
|
585
|
+
function getDataset(result) {
|
|
586
|
+
return result.dataset;
|
|
571
587
|
}
|
|
572
588
|
function buildArtifactSubdir(result) {
|
|
573
589
|
const segments = [];
|
|
574
|
-
const evalSet = getEvalSet(result);
|
|
590
|
+
const evalSet = getDataset(result);
|
|
575
591
|
if (evalSet) {
|
|
576
592
|
segments.push(safeArtifactPathSegment(evalSet, "default"));
|
|
577
593
|
}
|
|
578
|
-
segments.push(safeTestId(result.testId)
|
|
594
|
+
segments.push(safeTestId(result.testId));
|
|
579
595
|
return path4.posix.join(...segments);
|
|
580
596
|
}
|
|
581
597
|
function formatOutputMarkdown(output) {
|
|
@@ -598,7 +614,8 @@ function buildResultIndexArtifact(result) {
|
|
|
598
614
|
return {
|
|
599
615
|
timestamp: result.timestamp,
|
|
600
616
|
test_id: result.testId ?? "unknown",
|
|
601
|
-
|
|
617
|
+
dataset: getDataset(result),
|
|
618
|
+
category: result.category,
|
|
602
619
|
conversation_id: result.conversationId,
|
|
603
620
|
score: result.score,
|
|
604
621
|
target: result.target ?? "unknown",
|
|
@@ -1667,7 +1684,7 @@ var JunitWriter = class _JunitWriter {
|
|
|
1667
1684
|
this.closed = true;
|
|
1668
1685
|
const grouped = /* @__PURE__ */ new Map();
|
|
1669
1686
|
for (const result of this.results) {
|
|
1670
|
-
const suite = result.
|
|
1687
|
+
const suite = result.dataset ?? "default";
|
|
1671
1688
|
const existing = grouped.get(suite);
|
|
1672
1689
|
if (existing) {
|
|
1673
1690
|
existing.push(result);
|
|
@@ -1995,7 +2012,8 @@ function hydrateManifestRecord(baseDir, record) {
|
|
|
1995
2012
|
return {
|
|
1996
2013
|
timestamp: record.timestamp,
|
|
1997
2014
|
testId,
|
|
1998
|
-
|
|
2015
|
+
dataset: record.dataset,
|
|
2016
|
+
category: record.category,
|
|
1999
2017
|
target: record.target,
|
|
2000
2018
|
score: record.score,
|
|
2001
2019
|
executionStatus: record.execution_status,
|
|
@@ -2053,6 +2071,7 @@ function loadLightweightResults(sourceFile) {
|
|
|
2053
2071
|
return parseResultManifest(content).map((record) => ({
|
|
2054
2072
|
testId: record.test_id ?? record.eval_id ?? "unknown",
|
|
2055
2073
|
target: record.target,
|
|
2074
|
+
experiment: record.experiment,
|
|
2056
2075
|
score: record.score,
|
|
2057
2076
|
scores: record.scores,
|
|
2058
2077
|
executionStatus: record.execution_status,
|
|
@@ -3020,7 +3039,7 @@ function validateContentForRoleMarkers(content, location, filePath, errors) {
|
|
|
3020
3039
|
function isObject2(value) {
|
|
3021
3040
|
return typeof value === "object" && value !== null && !Array.isArray(value);
|
|
3022
3041
|
}
|
|
3023
|
-
var COMMON_SETTINGS =
|
|
3042
|
+
var COMMON_SETTINGS = new Set(COMMON_TARGET_SETTINGS);
|
|
3024
3043
|
var RETRY_SETTINGS = /* @__PURE__ */ new Set([
|
|
3025
3044
|
"max_retries",
|
|
3026
3045
|
"maxRetries",
|
|
@@ -4140,9 +4159,12 @@ async function prepareFileMetadata(params) {
|
|
|
4140
4159
|
repoRoot,
|
|
4141
4160
|
verbose: options.verbose
|
|
4142
4161
|
});
|
|
4162
|
+
const relativePath = path15.relative(cwd, testFilePath);
|
|
4163
|
+
const category = deriveCategory(relativePath);
|
|
4143
4164
|
const suite = await loadTestSuite(testFilePath, repoRoot, {
|
|
4144
4165
|
verbose: options.verbose,
|
|
4145
|
-
filter: options.filter
|
|
4166
|
+
filter: options.filter,
|
|
4167
|
+
category
|
|
4146
4168
|
});
|
|
4147
4169
|
const filteredIds = suite.tests.map((value) => value.id);
|
|
4148
4170
|
const cliTargets = options.cliTargets;
|
|
@@ -4421,7 +4443,7 @@ async function runEvalCommand(input) {
|
|
|
4421
4443
|
const useFileExport = !!options.otelFile;
|
|
4422
4444
|
if (options.exportOtel || useFileExport) {
|
|
4423
4445
|
try {
|
|
4424
|
-
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-5EEXTTC3.js");
|
|
4446
|
+
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-2JUUJ6PT.js");
|
|
4425
4447
|
let endpoint = process.env.OTEL_EXPORTER_OTLP_ENDPOINT;
|
|
4426
4448
|
let headers = {};
|
|
4427
4449
|
if (options.otelBackend) {
|
|
@@ -4794,6 +4816,7 @@ export {
|
|
|
4794
4816
|
resolveExistingRunPrimaryPath,
|
|
4795
4817
|
resolveWorkspaceOrFilePath,
|
|
4796
4818
|
writeArtifactsFromResults,
|
|
4819
|
+
parseResultManifest,
|
|
4797
4820
|
resolveResultSourcePath,
|
|
4798
4821
|
loadManifestResults,
|
|
4799
4822
|
loadLightweightResults,
|
|
@@ -4812,4 +4835,4 @@ export {
|
|
|
4812
4835
|
selectTarget,
|
|
4813
4836
|
runEvalCommand
|
|
4814
4837
|
};
|
|
4815
|
-
//# sourceMappingURL=chunk-Y25VL7PX.js.map
|
|
4838
|
+
//# sourceMappingURL=chunk-4Z326WWF.js.map
|