agentv 4.31.4-next.1 → 4.32.0-next.1

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (29)
  1. package/README.md +14 -0
  2. package/dist/{artifact-writer-OYJ7VYQD.js → artifact-writer-VDF7KRWL.js} +4 -4
  3. package/dist/{chunk-3Y24WATS.js → chunk-2ZEY3WBH.js} +3 -3
  4. package/dist/{chunk-PDGEPSPO.js → chunk-5JMFFG36.js} +8 -8
  5. package/dist/{chunk-PDGEPSPO.js.map → chunk-5JMFFG36.js.map} +1 -1
  6. package/dist/{chunk-Y35UPYKH.js → chunk-IGTRNQAM.js} +51 -31
  7. package/dist/{chunk-Y35UPYKH.js.map → chunk-IGTRNQAM.js.map} +1 -1
  8. package/dist/{chunk-6Y3W7HJP.js → chunk-LX5AK3P7.js} +5 -5
  9. package/dist/chunk-LX5AK3P7.js.map +1 -0
  10. package/dist/{chunk-MIEYJ3YP.js → chunk-TAZBCVEZ.js} +66 -62
  11. package/dist/chunk-TAZBCVEZ.js.map +1 -0
  12. package/dist/cli.js +5 -5
  13. package/dist/{studio/assets/index-B_Ga8SID.js → dashboard/assets/index-BdoQWnyM.js} +1 -1
  14. package/dist/{studio/assets/index-CYUVGyMn.css → dashboard/assets/index-DcPH8PyS.css} +1 -1
  15. package/dist/dashboard/assets/index-EXkiwqam.js +116 -0
  16. package/dist/{studio → dashboard}/index.html +3 -3
  17. package/dist/{dist-KBYJJAXA.js → dist-GICSKMNP.js} +5 -3
  18. package/dist/index.js +5 -5
  19. package/dist/{interactive-RCBFUZUL.js → interactive-GIDBBDYZ.js} +5 -5
  20. package/dist/{ts-eval-loader-FRQF6KHR-PQPW5XQK.js → ts-eval-loader-Z6IUSDNA-YBOE4JIQ.js} +2 -2
  21. package/package.json +1 -1
  22. package/dist/chunk-6Y3W7HJP.js.map +0 -1
  23. package/dist/chunk-MIEYJ3YP.js.map +0 -1
  24. package/dist/studio/assets/index-Bw-5reb7.js +0 -116
  25. /package/dist/{artifact-writer-OYJ7VYQD.js.map → artifact-writer-VDF7KRWL.js.map} +0 -0
  26. /package/dist/{chunk-3Y24WATS.js.map → chunk-2ZEY3WBH.js.map} +0 -0
  27. /package/dist/{dist-KBYJJAXA.js.map → dist-GICSKMNP.js.map} +0 -0
  28. /package/dist/{interactive-RCBFUZUL.js.map → interactive-GIDBBDYZ.js.map} +0 -0
  29. /package/dist/{ts-eval-loader-FRQF6KHR-PQPW5XQK.js.map → ts-eval-loader-Z6IUSDNA-YBOE4JIQ.js.map} +0 -0
package/README.md CHANGED
@@ -124,6 +124,20 @@ bun test
124
124
 
125
125
  See [AGENTS.md](AGENTS.md) for development guidelines.
126
126
 
127
+ ## Docker Dashboard Deployment
128
+
129
+ To simulate a one-command production deployment of AgentV Dashboard with the
130
+ AgentV examples project and a remote results repository:
131
+
132
+ ```bash
133
+ AGENTV_RESULTS_REPO=EntityProcess/agentv-evalresults \
134
+ scripts/setup-dashboard-deployment.sh
135
+ ```
136
+
137
+ The script clones AgentV examples into `~/agentv-dashboard`, clones the results
138
+ repo, writes the Dashboard project registry, builds the Docker image, and starts
139
+ Dashboard at `http://localhost:3117`.
140
+
127
141
  ## License
128
142
 
129
143
  MIT
@@ -14,11 +14,11 @@ import {
14
14
  writeArtifactsFromResults,
15
15
  writeInitialBenchmarkArtifact,
16
16
  writePerTestArtifacts
17
- } from "./chunk-3Y24WATS.js";
18
- import "./chunk-6Y3W7HJP.js";
17
+ } from "./chunk-2ZEY3WBH.js";
18
+ import "./chunk-LX5AK3P7.js";
19
19
  import "./chunk-QOBQ5XYF.js";
20
20
  import "./chunk-BPGJ4HBU.js";
21
- import "./chunk-MIEYJ3YP.js";
21
+ import "./chunk-TAZBCVEZ.js";
22
22
  import "./chunk-NPVGBFF6.js";
23
23
  import "./chunk-M7BUKBAF.js";
24
24
  import "./chunk-5H446C7X.js";
@@ -38,4 +38,4 @@ export {
38
38
  writeInitialBenchmarkArtifact,
39
39
  writePerTestArtifacts
40
40
  };
41
- //# sourceMappingURL=artifact-writer-OYJ7VYQD.js.map
41
+ //# sourceMappingURL=artifact-writer-VDF7KRWL.js.map
@@ -1,10 +1,10 @@
1
1
  import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
2
2
  import {
3
3
  toTranscriptJsonLines
4
- } from "./chunk-6Y3W7HJP.js";
4
+ } from "./chunk-LX5AK3P7.js";
5
5
  import {
6
6
  DEFAULT_THRESHOLD
7
- } from "./chunk-MIEYJ3YP.js";
7
+ } from "./chunk-TAZBCVEZ.js";
8
8
 
9
9
  // src/commands/eval/artifact-writer.ts
10
10
  import { mkdir, readFile, writeFile } from "node:fs/promises";
@@ -726,4 +726,4 @@ export {
726
726
  writePerTestArtifacts,
727
727
  writeArtifactsFromResults
728
728
  };
729
- //# sourceMappingURL=chunk-3Y24WATS.js.map
729
+ //# sourceMappingURL=chunk-2ZEY3WBH.js.map
@@ -16,7 +16,7 @@ import {
16
16
  toSnakeCaseDeep,
17
17
  writeArtifactsFromResults,
18
18
  writeInitialBenchmarkArtifact
19
- } from "./chunk-3Y24WATS.js";
19
+ } from "./chunk-2ZEY3WBH.js";
20
20
  import {
21
21
  ResponseCache,
22
22
  RunBudgetTracker,
@@ -32,7 +32,7 @@ import {
32
32
  shouldEnableCache,
33
33
  shouldSkipCacheForTemperature,
34
34
  syncResultsRepo
35
- } from "./chunk-6Y3W7HJP.js";
35
+ } from "./chunk-LX5AK3P7.js";
36
36
  import {
37
37
  CLI_PLACEHOLDERS,
38
38
  COMMON_TARGET_SETTINGS,
@@ -64,7 +64,7 @@ import {
64
64
  subscribeToCopilotSdkLogEntries,
65
65
  subscribeToPiLogEntries,
66
66
  toCamelCaseDeep
67
- } from "./chunk-MIEYJ3YP.js";
67
+ } from "./chunk-TAZBCVEZ.js";
68
68
 
69
69
  // src/commands/eval/shared.ts
70
70
  import { constants } from "node:fs";
@@ -180,7 +180,7 @@ async function findRepoRoot(start) {
180
180
  // package.json
181
181
  var package_default = {
182
182
  name: "agentv",
183
- version: "4.31.4-next.1",
183
+ version: "4.32.0-next.1",
184
184
  description: "CLI entry point for AgentV",
185
185
  type: "module",
186
186
  repository: {
@@ -5559,7 +5559,7 @@ async function runEvalCommand(input) {
5559
5559
  const useFileExport = !!options.otelFile;
5560
5560
  if (options.exportOtel || useFileExport) {
5561
5561
  try {
5562
- const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-KBYJJAXA.js");
5562
+ const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-GICSKMNP.js");
5563
5563
  let endpoint = process.env.OTEL_EXPORTER_OTLP_ENDPOINT;
5564
5564
  let headers = {};
5565
5565
  if (options.otelBackend) {
@@ -5758,7 +5758,7 @@ async function runEvalCommand(input) {
5758
5758
  const activeTestFiles = resolvedTestFiles.filter((f) => fileMetadata.has(f));
5759
5759
  let transcriptProviderFactory;
5760
5760
  if (options.transcript) {
5761
- const { TranscriptProvider } = await import("./dist-KBYJJAXA.js");
5761
+ const { TranscriptProvider } = await import("./dist-GICSKMNP.js");
5762
5762
  const transcriptProvider = await TranscriptProvider.fromFile(options.transcript);
5763
5763
  const totalTests = [...fileMetadata.values()].reduce(
5764
5764
  (sum, meta) => sum + meta.testCases.length,
@@ -5935,7 +5935,7 @@ async function runEvalCommand(input) {
5935
5935
  if (usesDefaultArtifactWorkspace && allResults.length > 0) {
5936
5936
  const evalFile = activeTestFiles.length === 1 ? activeTestFiles[0] : "";
5937
5937
  if (isResumeAppend) {
5938
- const { writePerTestArtifacts } = await import("./artifact-writer-OYJ7VYQD.js");
5938
+ const { writePerTestArtifacts } = await import("./artifact-writer-VDF7KRWL.js");
5939
5939
  await writePerTestArtifacts(allResults, runDir, {
5940
5940
  experiment: normalizeExperimentName(options.experiment)
5941
5941
  });
@@ -6160,4 +6160,4 @@ export {
6160
6160
  getCategories,
6161
6161
  filterByCategory
6162
6162
  };
6163
- //# sourceMappingURL=chunk-PDGEPSPO.js.map
6163
+ //# sourceMappingURL=chunk-5JMFFG36.js.map