agentv 4.31.4-next.1 → 4.32.0-next.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +14 -0
- package/dist/{artifact-writer-OYJ7VYQD.js → artifact-writer-VDF7KRWL.js} +4 -4
- package/dist/{chunk-3Y24WATS.js → chunk-2ZEY3WBH.js} +3 -3
- package/dist/{chunk-PDGEPSPO.js → chunk-5JMFFG36.js} +8 -8
- package/dist/{chunk-PDGEPSPO.js.map → chunk-5JMFFG36.js.map} +1 -1
- package/dist/{chunk-Y35UPYKH.js → chunk-IGTRNQAM.js} +51 -31
- package/dist/{chunk-Y35UPYKH.js.map → chunk-IGTRNQAM.js.map} +1 -1
- package/dist/{chunk-6Y3W7HJP.js → chunk-LX5AK3P7.js} +5 -5
- package/dist/chunk-LX5AK3P7.js.map +1 -0
- package/dist/{chunk-MIEYJ3YP.js → chunk-TAZBCVEZ.js} +66 -62
- package/dist/chunk-TAZBCVEZ.js.map +1 -0
- package/dist/cli.js +5 -5
- package/dist/{studio/assets/index-B_Ga8SID.js → dashboard/assets/index-BdoQWnyM.js} +1 -1
- package/dist/{studio/assets/index-CYUVGyMn.css → dashboard/assets/index-DcPH8PyS.css} +1 -1
- package/dist/dashboard/assets/index-EXkiwqam.js +116 -0
- package/dist/{studio → dashboard}/index.html +3 -3
- package/dist/{dist-KBYJJAXA.js → dist-GICSKMNP.js} +5 -3
- package/dist/index.js +5 -5
- package/dist/{interactive-RCBFUZUL.js → interactive-GIDBBDYZ.js} +5 -5
- package/dist/{ts-eval-loader-FRQF6KHR-PQPW5XQK.js → ts-eval-loader-Z6IUSDNA-YBOE4JIQ.js} +2 -2
- package/package.json +1 -1
- package/dist/chunk-6Y3W7HJP.js.map +0 -1
- package/dist/chunk-MIEYJ3YP.js.map +0 -1
- package/dist/studio/assets/index-Bw-5reb7.js +0 -116
- /package/dist/{artifact-writer-OYJ7VYQD.js.map → artifact-writer-VDF7KRWL.js.map} +0 -0
- /package/dist/{chunk-3Y24WATS.js.map → chunk-2ZEY3WBH.js.map} +0 -0
- /package/dist/{dist-KBYJJAXA.js.map → dist-GICSKMNP.js.map} +0 -0
- /package/dist/{interactive-RCBFUZUL.js.map → interactive-GIDBBDYZ.js.map} +0 -0
- /package/dist/{ts-eval-loader-FRQF6KHR-PQPW5XQK.js.map → ts-eval-loader-Z6IUSDNA-YBOE4JIQ.js.map} +0 -0
package/README.md
CHANGED
|
@@ -124,6 +124,20 @@ bun test
|
|
|
124
124
|
|
|
125
125
|
See [AGENTS.md](AGENTS.md) for development guidelines.
|
|
126
126
|
|
|
127
|
+
## Docker Dashboard Deployment
|
|
128
|
+
|
|
129
|
+
To simulate a one-command production deployment of AgentV Dashboard with the
|
|
130
|
+
AgentV examples project and a remote results repository:
|
|
131
|
+
|
|
132
|
+
```bash
|
|
133
|
+
AGENTV_RESULTS_REPO=EntityProcess/agentv-evalresults \
|
|
134
|
+
scripts/setup-dashboard-deployment.sh
|
|
135
|
+
```
|
|
136
|
+
|
|
137
|
+
The script clones AgentV examples into `~/agentv-dashboard`, clones the results
|
|
138
|
+
repo, writes the Dashboard project registry, builds the Docker image, and starts
|
|
139
|
+
Dashboard at `http://localhost:3117`.
|
|
140
|
+
|
|
127
141
|
## License
|
|
128
142
|
|
|
129
143
|
MIT
|
|
@@ -14,11 +14,11 @@ import {
|
|
|
14
14
|
writeArtifactsFromResults,
|
|
15
15
|
writeInitialBenchmarkArtifact,
|
|
16
16
|
writePerTestArtifacts
|
|
17
|
-
} from "./chunk-3Y24WATS.js";
|
|
18
|
-
import "./chunk-6Y3W7HJP.js";
|
|
17
|
+
} from "./chunk-2ZEY3WBH.js";
|
|
18
|
+
import "./chunk-LX5AK3P7.js";
|
|
19
19
|
import "./chunk-QOBQ5XYF.js";
|
|
20
20
|
import "./chunk-BPGJ4HBU.js";
|
|
21
|
-
import "./chunk-MIEYJ3YP.js";
|
|
21
|
+
import "./chunk-TAZBCVEZ.js";
|
|
22
22
|
import "./chunk-NPVGBFF6.js";
|
|
23
23
|
import "./chunk-M7BUKBAF.js";
|
|
24
24
|
import "./chunk-5H446C7X.js";
|
|
@@ -38,4 +38,4 @@ export {
|
|
|
38
38
|
writeInitialBenchmarkArtifact,
|
|
39
39
|
writePerTestArtifacts
|
|
40
40
|
};
|
|
41
|
-
//# sourceMappingURL=artifact-writer-OYJ7VYQD.js.map
|
|
41
|
+
//# sourceMappingURL=artifact-writer-VDF7KRWL.js.map
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
|
|
2
2
|
import {
|
|
3
3
|
toTranscriptJsonLines
|
|
4
|
-
} from "./chunk-6Y3W7HJP.js";
|
|
4
|
+
} from "./chunk-LX5AK3P7.js";
|
|
5
5
|
import {
|
|
6
6
|
DEFAULT_THRESHOLD
|
|
7
|
-
} from "./chunk-MIEYJ3YP.js";
|
|
7
|
+
} from "./chunk-TAZBCVEZ.js";
|
|
8
8
|
|
|
9
9
|
// src/commands/eval/artifact-writer.ts
|
|
10
10
|
import { mkdir, readFile, writeFile } from "node:fs/promises";
|
|
@@ -726,4 +726,4 @@ export {
|
|
|
726
726
|
writePerTestArtifacts,
|
|
727
727
|
writeArtifactsFromResults
|
|
728
728
|
};
|
|
729
|
-
//# sourceMappingURL=chunk-3Y24WATS.js.map
|
|
729
|
+
//# sourceMappingURL=chunk-2ZEY3WBH.js.map
|
|
@@ -16,7 +16,7 @@ import {
|
|
|
16
16
|
toSnakeCaseDeep,
|
|
17
17
|
writeArtifactsFromResults,
|
|
18
18
|
writeInitialBenchmarkArtifact
|
|
19
|
-
} from "./chunk-3Y24WATS.js";
|
|
19
|
+
} from "./chunk-2ZEY3WBH.js";
|
|
20
20
|
import {
|
|
21
21
|
ResponseCache,
|
|
22
22
|
RunBudgetTracker,
|
|
@@ -32,7 +32,7 @@ import {
|
|
|
32
32
|
shouldEnableCache,
|
|
33
33
|
shouldSkipCacheForTemperature,
|
|
34
34
|
syncResultsRepo
|
|
35
|
-
} from "./chunk-6Y3W7HJP.js";
|
|
35
|
+
} from "./chunk-LX5AK3P7.js";
|
|
36
36
|
import {
|
|
37
37
|
CLI_PLACEHOLDERS,
|
|
38
38
|
COMMON_TARGET_SETTINGS,
|
|
@@ -64,7 +64,7 @@ import {
|
|
|
64
64
|
subscribeToCopilotSdkLogEntries,
|
|
65
65
|
subscribeToPiLogEntries,
|
|
66
66
|
toCamelCaseDeep
|
|
67
|
-
} from "./chunk-MIEYJ3YP.js";
|
|
67
|
+
} from "./chunk-TAZBCVEZ.js";
|
|
68
68
|
|
|
69
69
|
// src/commands/eval/shared.ts
|
|
70
70
|
import { constants } from "node:fs";
|
|
@@ -180,7 +180,7 @@ async function findRepoRoot(start) {
|
|
|
180
180
|
// package.json
|
|
181
181
|
var package_default = {
|
|
182
182
|
name: "agentv",
|
|
183
|
-
version: "4.31.4-next.1",
|
|
183
|
+
version: "4.32.0-next.1",
|
|
184
184
|
description: "CLI entry point for AgentV",
|
|
185
185
|
type: "module",
|
|
186
186
|
repository: {
|
|
@@ -5559,7 +5559,7 @@ async function runEvalCommand(input) {
|
|
|
5559
5559
|
const useFileExport = !!options.otelFile;
|
|
5560
5560
|
if (options.exportOtel || useFileExport) {
|
|
5561
5561
|
try {
|
|
5562
|
-
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-KBYJJAXA.js");
|
|
5562
|
+
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-GICSKMNP.js");
|
|
5563
5563
|
let endpoint = process.env.OTEL_EXPORTER_OTLP_ENDPOINT;
|
|
5564
5564
|
let headers = {};
|
|
5565
5565
|
if (options.otelBackend) {
|
|
@@ -5758,7 +5758,7 @@ async function runEvalCommand(input) {
|
|
|
5758
5758
|
const activeTestFiles = resolvedTestFiles.filter((f) => fileMetadata.has(f));
|
|
5759
5759
|
let transcriptProviderFactory;
|
|
5760
5760
|
if (options.transcript) {
|
|
5761
|
-
const { TranscriptProvider } = await import("./dist-KBYJJAXA.js");
|
|
5761
|
+
const { TranscriptProvider } = await import("./dist-GICSKMNP.js");
|
|
5762
5762
|
const transcriptProvider = await TranscriptProvider.fromFile(options.transcript);
|
|
5763
5763
|
const totalTests = [...fileMetadata.values()].reduce(
|
|
5764
5764
|
(sum, meta) => sum + meta.testCases.length,
|
|
@@ -5935,7 +5935,7 @@ async function runEvalCommand(input) {
|
|
|
5935
5935
|
if (usesDefaultArtifactWorkspace && allResults.length > 0) {
|
|
5936
5936
|
const evalFile = activeTestFiles.length === 1 ? activeTestFiles[0] : "";
|
|
5937
5937
|
if (isResumeAppend) {
|
|
5938
|
-
const { writePerTestArtifacts } = await import("./artifact-writer-OYJ7VYQD.js");
|
|
5938
|
+
const { writePerTestArtifacts } = await import("./artifact-writer-VDF7KRWL.js");
|
|
5939
5939
|
await writePerTestArtifacts(allResults, runDir, {
|
|
5940
5940
|
experiment: normalizeExperimentName(options.experiment)
|
|
5941
5941
|
});
|
|
@@ -6160,4 +6160,4 @@ export {
|
|
|
6160
6160
|
getCategories,
|
|
6161
6161
|
filterByCategory
|
|
6162
6162
|
};
|
|
6163
|
-
//# sourceMappingURL=chunk-PDGEPSPO.js.map
|
|
6163
|
+
//# sourceMappingURL=chunk-5JMFFG36.js.map
|