agentv 3.0.0-next.1 → 3.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (71) hide show
  1. package/dist/templates/.agentv/config.yaml +5 -0
  2. package/dist/templates/.agentv/targets.yaml +11 -8
  3. package/package.json +1 -1
  4. package/dist/agentv-provider-5CJVBBGG-2XVZBW7L.js +0 -9
  5. package/dist/agentv-provider-5CJVBBGG-2XVZBW7L.js.map +0 -1
  6. package/dist/chunk-3L2L5GIL.js +0 -51
  7. package/dist/chunk-3L2L5GIL.js.map +0 -1
  8. package/dist/chunk-5H446C7X.js +0 -50
  9. package/dist/chunk-5H446C7X.js.map +0 -1
  10. package/dist/chunk-5WIB7A27.js +0 -6149
  11. package/dist/chunk-5WIB7A27.js.map +0 -1
  12. package/dist/chunk-6GSYTMXD.js +0 -31520
  13. package/dist/chunk-6GSYTMXD.js.map +0 -1
  14. package/dist/chunk-BL4PVUAT.js +0 -261
  15. package/dist/chunk-BL4PVUAT.js.map +0 -1
  16. package/dist/chunk-C5GOHBQM.js +0 -84
  17. package/dist/chunk-C5GOHBQM.js.map +0 -1
  18. package/dist/chunk-DY4ZDTTO.js +0 -4216
  19. package/dist/chunk-DY4ZDTTO.js.map +0 -1
  20. package/dist/chunk-HF4X7ALN.js +0 -24299
  21. package/dist/chunk-HF4X7ALN.js.map +0 -1
  22. package/dist/chunk-JK6V4KVD.js +0 -114
  23. package/dist/chunk-JK6V4KVD.js.map +0 -1
  24. package/dist/chunk-LRULMAAA.js +0 -1711
  25. package/dist/chunk-LRULMAAA.js.map +0 -1
  26. package/dist/chunk-SR4I5KET.js +0 -1238
  27. package/dist/chunk-SR4I5KET.js.map +0 -1
  28. package/dist/chunk-VQ2ZO7XJ.js +0 -2098
  29. package/dist/chunk-VQ2ZO7XJ.js.map +0 -1
  30. package/dist/chunk-XALGXSKB.js +0 -21
  31. package/dist/chunk-XALGXSKB.js.map +0 -1
  32. package/dist/chunk-XOSNETAV.js +0 -565
  33. package/dist/chunk-XOSNETAV.js.map +0 -1
  34. package/dist/cli.js +0 -29
  35. package/dist/cli.js.map +0 -1
  36. package/dist/dist-WN2QIOQR.js +0 -305
  37. package/dist/dist-WN2QIOQR.js.map +0 -1
  38. package/dist/esm-5Q4BZALM-5REQWAUV.js +0 -924
  39. package/dist/esm-5Q4BZALM-5REQWAUV.js.map +0 -1
  40. package/dist/esm-CZAWIY6F.js +0 -32
  41. package/dist/esm-CZAWIY6F.js.map +0 -1
  42. package/dist/esm-QNEMCJPL.js +0 -933
  43. package/dist/esm-QNEMCJPL.js.map +0 -1
  44. package/dist/esm-R77SNOF5.js +0 -65
  45. package/dist/esm-R77SNOF5.js.map +0 -1
  46. package/dist/esm-RVQPUGWH.js +0 -1207
  47. package/dist/esm-RVQPUGWH.js.map +0 -1
  48. package/dist/getMachineId-bsd-HSK5LZMG.js +0 -41
  49. package/dist/getMachineId-bsd-HSK5LZMG.js.map +0 -1
  50. package/dist/getMachineId-darwin-4DP6CCJV.js +0 -41
  51. package/dist/getMachineId-darwin-4DP6CCJV.js.map +0 -1
  52. package/dist/getMachineId-linux-44LJ5UJB.js +0 -33
  53. package/dist/getMachineId-linux-44LJ5UJB.js.map +0 -1
  54. package/dist/getMachineId-unsupported-NVK6IATM.js +0 -24
  55. package/dist/getMachineId-unsupported-NVK6IATM.js.map +0 -1
  56. package/dist/getMachineId-win-YZ36S7VA.js +0 -43
  57. package/dist/getMachineId-win-YZ36S7VA.js.map +0 -1
  58. package/dist/index.js +0 -20
  59. package/dist/index.js.map +0 -1
  60. package/dist/interactive-B432TCRZ.js +0 -334
  61. package/dist/interactive-B432TCRZ.js.map +0 -1
  62. package/dist/otlp-json-file-exporter-77FDBRSY-EZAPHWP6.js +0 -9
  63. package/dist/otlp-json-file-exporter-77FDBRSY-EZAPHWP6.js.map +0 -1
  64. package/dist/simple-trace-file-exporter-S76DMABU-5FCJESD2.js +0 -9
  65. package/dist/simple-trace-file-exporter-S76DMABU-5FCJESD2.js.map +0 -1
  66. package/dist/src-ML4D2MC2.js +0 -1733
  67. package/dist/src-ML4D2MC2.js.map +0 -1
  68. package/dist/token-POXF46NU.js +0 -66
  69. package/dist/token-POXF46NU.js.map +0 -1
  70. package/dist/token-util-6GWYZWGE.js +0 -8
  71. package/dist/token-util-6GWYZWGE.js.map +0 -1
@@ -8,6 +8,11 @@ guideline_patterns:
8
8
  - "**/*.prompt.md"
9
9
  - "**/SKILL.md"
10
10
 
11
+ # Execution defaults (overridden by CLI flags)
12
+ # execution:
13
+ # pool_workspaces: true # Reuse materialized workspaces across eval runs
14
+ # pool_slots: 10 # Max pool slots on disk (1-50, default: 10)
15
+
11
16
  # Notes:
12
17
  # - Patterns use standard glob syntax (via micromatch library)
13
18
  # - Paths are normalized to forward slashes for cross-platform compatibility
@@ -12,11 +12,11 @@ targets:
12
12
 
13
13
  - name: vscode
14
14
  provider: vscode
15
- judge_target: azure-llm
15
+ judge_target: azure-base
16
16
 
17
17
  - name: codex
18
18
  provider: codex
19
- judge_target: azure-llm
19
+ judge_target: azure-base
20
20
  # Uses the Codex CLI (defaults to `codex` on PATH)
21
21
  # executable: ${{ CODEX_CLI_PATH }} # Optional: override executable path
22
22
  # args: # Optional additional CLI arguments
@@ -26,6 +26,7 @@ targets:
26
26
  # - ${{ CODEX_MODEL }}
27
27
  # - --ask-for-approval
28
28
  # - ${{ CODEX_APPROVAL_PRESET }}
29
+ timeout_seconds: 180
29
30
  cwd: ${{ CODEX_WORKSPACE_DIR }} # Where scratch workspaces are created
30
31
  log_dir: ${{ CODEX_LOG_DIR }} # Optional: where Codex CLI stream logs are stored (defaults to ./.agentv/logs/codex)
31
32
  log_format: json # Optional: 'summary' (default) or 'json' for raw event logs
@@ -33,9 +34,10 @@ targets:
33
34
  # Claude - Anthropic's Claude Agent SDK
34
35
  - name: claude
35
36
  provider: claude
36
- judge_target: azure-llm
37
+ judge_target: azure-base
37
38
  # Uses the @anthropic-ai/claude-agent-sdk
38
39
  # model: claude-sonnet-4-20250514 # Optional: override model
40
+ timeout_seconds: 180
39
41
  # cwd: ${{ CLAUDE_WORKSPACE_DIR }} # Optional: working directory (defaults to process.cwd())
40
42
  # max_turns: 50 # Optional: max conversation turns
41
43
  # max_budget_usd: 5.0 # Optional: max cost budget in USD
@@ -47,29 +49,29 @@ targets:
47
49
  provider: vscode
48
50
  workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
49
51
  provider_batching: false
50
- judge_target: azure-llm
52
+ judge_target: azure-base
51
53
 
52
54
  - name: vscode_insiders_projectx
53
55
  provider: vscode-insiders
54
56
  workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
55
57
  provider_batching: false
56
- judge_target: azure-llm
58
+ judge_target: azure-base
57
59
 
58
- - name: azure-llm
60
+ - name: azure-base
59
61
  provider: azure
60
62
  endpoint: ${{ AZURE_OPENAI_ENDPOINT }}
61
63
  api_key: ${{ AZURE_OPENAI_API_KEY }}
62
64
  model: ${{ AZURE_DEPLOYMENT_NAME }}
63
65
  version: ${{ AZURE_OPENAI_API_VERSION }}
64
66
 
65
- - name: gemini-llm
67
+ - name: gemini_base
66
68
  provider: gemini
67
69
  api_key: ${{ GOOGLE_GENERATIVE_AI_API_KEY }}
68
70
  model: ${{ GEMINI_MODEL_NAME }}
69
71
 
70
72
  - name: local_cli
71
73
  provider: cli
72
- judge_target: azure-llm
74
+ judge_target: azure-base
73
75
  # Passes the fully rendered prompt and any attached files to a local Python script
74
76
  # NOTE: Do not add quotes around {PROMPT} or {FILES} - they are already shell-escaped
75
77
  command: uv run ./mock_cli.py --prompt {PROMPT} {FILES} --output {OUTPUT_FILE}
@@ -77,5 +79,6 @@ targets:
77
79
  files_format: --file {path}
78
80
  # Optional working directory resolved from .env
79
81
  cwd: ${{ CLI_EVALS_DIR }}
82
+ timeout_seconds: 30
80
83
  healthcheck:
81
84
  command: uv run ./mock_cli.py --healthcheck
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "agentv",
3
- "version": "3.0.0-next.1",
3
+ "version": "3.1.0",
4
4
  "description": "CLI entry point for AgentV",
5
5
  "type": "module",
6
6
  "repository": {
@@ -1,9 +0,0 @@
1
- import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
2
- import {
3
- AgentvProvider
4
- } from "./chunk-6GSYTMXD.js";
5
- import "./chunk-5H446C7X.js";
6
- export {
7
- AgentvProvider
8
- };
9
- //# sourceMappingURL=agentv-provider-5CJVBBGG-2XVZBW7L.js.map
@@ -1 +0,0 @@
1
- {"version":3,"sources":[],"sourcesContent":[],"mappings":"","names":[]}
@@ -1,51 +0,0 @@
1
- import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
2
- import {
3
- __commonJS
4
- } from "./chunk-5H446C7X.js";
5
-
6
- // ../../node_modules/.bun/@vercel+oidc@3.0.5/node_modules/@vercel/oidc/dist/token-error.js
7
- var require_token_error = __commonJS({
8
- "../../node_modules/.bun/@vercel+oidc@3.0.5/node_modules/@vercel/oidc/dist/token-error.js"(exports, module) {
9
- "use strict";
10
- var __defProp = Object.defineProperty;
11
- var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
12
- var __getOwnPropNames = Object.getOwnPropertyNames;
13
- var __hasOwnProp = Object.prototype.hasOwnProperty;
14
- var __export = (target, all) => {
15
- for (var name in all)
16
- __defProp(target, name, { get: all[name], enumerable: true });
17
- };
18
- var __copyProps = (to, from, except, desc) => {
19
- if (from && typeof from === "object" || typeof from === "function") {
20
- for (let key of __getOwnPropNames(from))
21
- if (!__hasOwnProp.call(to, key) && key !== except)
22
- __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
23
- }
24
- return to;
25
- };
26
- var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
27
- var token_error_exports = {};
28
- __export(token_error_exports, {
29
- VercelOidcTokenError: () => VercelOidcTokenError
30
- });
31
- module.exports = __toCommonJS(token_error_exports);
32
- var VercelOidcTokenError = class extends Error {
33
- constructor(message, cause) {
34
- super(message);
35
- this.name = "VercelOidcTokenError";
36
- this.cause = cause;
37
- }
38
- toString() {
39
- if (this.cause) {
40
- return `${this.name}: ${this.message}: ${this.cause}`;
41
- }
42
- return `${this.name}: ${this.message}`;
43
- }
44
- };
45
- }
46
- });
47
-
48
- export {
49
- require_token_error
50
- };
51
- //# sourceMappingURL=chunk-3L2L5GIL.js.map
@@ -1 +0,0 @@
1
- {"version":3,"sources":["../../../node_modules/.bun/@vercel+oidc@3.0.5/node_modules/@vercel/oidc/dist/token-error.js"],"sourcesContent":["\"use strict\";\nvar __defProp = Object.defineProperty;\nvar __getOwnPropDesc = Object.getOwnPropertyDescriptor;\nvar __getOwnPropNames = Object.getOwnPropertyNames;\nvar __hasOwnProp = Object.prototype.hasOwnProperty;\nvar __export = (target, all) => {\n for (var name in all)\n __defProp(target, name, { get: all[name], enumerable: true });\n};\nvar __copyProps = (to, from, except, desc) => {\n if (from && typeof from === \"object\" || typeof from === \"function\") {\n for (let key of __getOwnPropNames(from))\n if (!__hasOwnProp.call(to, key) && key !== except)\n __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });\n }\n return to;\n};\nvar __toCommonJS = (mod) => __copyProps(__defProp({}, \"__esModule\", { value: true }), mod);\nvar token_error_exports = {};\n__export(token_error_exports, {\n VercelOidcTokenError: () => VercelOidcTokenError\n});\nmodule.exports = __toCommonJS(token_error_exports);\nclass VercelOidcTokenError extends Error {\n constructor(message, cause) {\n super(message);\n this.name = \"VercelOidcTokenError\";\n this.cause = cause;\n }\n toString() {\n if (this.cause) {\n return `${this.name}: ${this.message}: ${this.cause}`;\n }\n return `${this.name}: ${this.message}`;\n }\n}\n// Annotate the CommonJS export names for ESM import in node:\n0 && (module.exports = {\n VercelOidcTokenError\n});\n"],"mappings":";;;;;;AAAA;AAAA;AAAA;AACA,QAAI,YAAY,OAAO;AACvB,QAAI,mBAAmB,OAAO;AAC9B,QAAI,oBAAoB,OAAO;AAC/B,QAAI,eAAe,OAAO,UAAU;AACpC,QAAI,WAAW,CAAC,QAAQ,QAAQ;AAC9B,eAAS,QAAQ;AACf,kBAAU,QAAQ,MAAM,EAAE,KAAK,IAAI,IAAI,GAAG,YAAY,KAAK,CAAC;AAAA,IAChE;AACA,QAAI,cAAc,CAAC,IAAI,MAAM,QAAQ,SAAS;AAC5C,UAAI,QAAQ,OAAO,SAAS,YAAY,OAAO,SAAS,YAAY;AAClE,iBAAS,OAAO,kBAAkB,IAAI;AACpC,cAAI,CAAC,aAAa,KAAK,IAAI,GAAG,KAAK,QAAQ;AACzC,sBAAU,IAAI,KAAK,EAAE,KAAK,MAAM,KAAK,GAAG,GAAG,YAAY,EAAE,OAAO,iBAAiB,MAAM,GAAG,MAAM,KAAK,WAAW,CAAC;AAAA,MACvH;AACA,aAAO;AAAA,IACT;AACA,QAAI,eAAe,CAAC,QAAQ,YAAY,UAAU,CAAC,GAAG,cAAc,EAAE,OAAO,KAAK,CAAC,GAAG,GAAG;AACzF,QAAI,sBAAsB,CAAC;AAC3B,aAAS,qBAAqB;AAAA,MAC5B,sBAAsB,MAAM;AAAA,IAC9B,CAAC;AACD,WAAO,UAAU,aAAa,mBAAmB;AACjD,QAAM,uBAAN,cAAmC,MAAM;AAAA,MACvC,YAAY,SAAS,OAAO;AAC1B,cAAM,OAAO;AACb,aAAK,OAAO;AACZ,aAAK,QAAQ;AAAA,MACf;AAAA,MACA,WAAW;AACT,YAAI,KAAK,OAAO;AACd,iBAAO,GAAG,KAAK,IAAI,KAAK,KAAK,OAAO,KAAK,KAAK,KAAK;AAAA,QACrD;AACA,eAAO,GAAG,KAAK,IAAI,KAAK,KAAK,OAAO;AAAA,MACtC;AAAA,IACF;AAAA;AAAA;","names":[]}
@@ -1,50 +0,0 @@
1
- import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
2
- var __create = Object.create;
3
- var __defProp = Object.defineProperty;
4
- var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
5
- var __getOwnPropNames = Object.getOwnPropertyNames;
6
- var __getProtoOf = Object.getPrototypeOf;
7
- var __hasOwnProp = Object.prototype.hasOwnProperty;
8
- var __require = /* @__PURE__ */ ((x) => typeof require !== "undefined" ? require : typeof Proxy !== "undefined" ? new Proxy(x, {
9
- get: (a, b) => (typeof require !== "undefined" ? require : a)[b]
10
- }) : x)(function(x) {
11
- if (typeof require !== "undefined") return require.apply(this, arguments);
12
- throw Error('Dynamic require of "' + x + '" is not supported');
13
- });
14
- var __esm = (fn, res) => function __init() {
15
- return fn && (res = (0, fn[__getOwnPropNames(fn)[0]])(fn = 0)), res;
16
- };
17
- var __commonJS = (cb, mod) => function __require2() {
18
- return mod || (0, cb[__getOwnPropNames(cb)[0]])((mod = { exports: {} }).exports, mod), mod.exports;
19
- };
20
- var __export = (target, all) => {
21
- for (var name in all)
22
- __defProp(target, name, { get: all[name], enumerable: true });
23
- };
24
- var __copyProps = (to, from, except, desc) => {
25
- if (from && typeof from === "object" || typeof from === "function") {
26
- for (let key of __getOwnPropNames(from))
27
- if (!__hasOwnProp.call(to, key) && key !== except)
28
- __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
29
- }
30
- return to;
31
- };
32
- var __toESM = (mod, isNodeMode, target) => (target = mod != null ? __create(__getProtoOf(mod)) : {}, __copyProps(
33
- // If the importer is in node compatibility mode or this is not an ESM
34
- // file that has been converted to a CommonJS file using a Babel-
35
- // compatible transform (i.e. "__esModule" has not been set), then set
36
- // "default" to the CommonJS "module.exports" for node compatibility.
37
- isNodeMode || !mod || !mod.__esModule ? __defProp(target, "default", { value: mod, enumerable: true }) : target,
38
- mod
39
- ));
40
- var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
41
-
42
- export {
43
- __require,
44
- __esm,
45
- __commonJS,
46
- __export,
47
- __toESM,
48
- __toCommonJS
49
- };
50
- //# sourceMappingURL=chunk-5H446C7X.js.map
@@ -1 +0,0 @@
1
- {"version":3,"sources":[],"sourcesContent":[],"mappings":"","names":[]}