agentv 3.5.0 → 3.7.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
package/dist/cli.js CHANGED
@@ -2,9 +2,9 @@
2
2
  import { createRequire } from 'node:module'; const require = createRequire(import.meta.url);
3
3
  import {
4
4
  runCli
5
- } from "./chunk-5GG6DDP5.js";
6
- import "./chunk-RLL4QGNL.js";
7
- import "./chunk-D6G4N2H2.js";
5
+ } from "./chunk-TR6H437M.js";
6
+ import "./chunk-7YS6YNJZ.js";
7
+ import "./chunk-XGG64VIY.js";
8
8
  import "./chunk-C5GOHBQM.js";
9
9
  import "./chunk-JK6V4KVD.js";
10
10
  import "./chunk-HQDCIXVH.js";
@@ -141,7 +141,7 @@ import {
141
141
  transpileEvalYaml,
142
142
  transpileEvalYamlFile,
143
143
  trimBaselineResult
144
- } from "./chunk-D6G4N2H2.js";
144
+ } from "./chunk-XGG64VIY.js";
145
145
  import {
146
146
  OtlpJsonFileExporter
147
147
  } from "./chunk-C5GOHBQM.js";
@@ -300,4 +300,4 @@ export {
300
300
  transpileEvalYamlFile,
301
301
  trimBaselineResult
302
302
  };
303
- //# sourceMappingURL=dist-MZFXE6B5.js.map
303
+ //# sourceMappingURL=dist-VP6AXX6B.js.map
package/dist/index.js CHANGED
@@ -3,9 +3,9 @@ import {
3
3
  app,
4
4
  preprocessArgv,
5
5
  runCli
6
- } from "./chunk-5GG6DDP5.js";
7
- import "./chunk-RLL4QGNL.js";
8
- import "./chunk-D6G4N2H2.js";
6
+ } from "./chunk-TR6H437M.js";
7
+ import "./chunk-7YS6YNJZ.js";
8
+ import "./chunk-XGG64VIY.js";
9
9
  import "./chunk-C5GOHBQM.js";
10
10
  import "./chunk-JK6V4KVD.js";
11
11
  import "./chunk-HQDCIXVH.js";
@@ -4,14 +4,14 @@ import {
4
4
  fileExists,
5
5
  findRepoRoot,
6
6
  runEvalCommand
7
- } from "./chunk-RLL4QGNL.js";
7
+ } from "./chunk-7YS6YNJZ.js";
8
8
  import {
9
9
  DEFAULT_EVAL_PATTERNS,
10
10
  getAgentvHome,
11
11
  listTargetNames,
12
12
  loadConfig,
13
13
  readTargetDefinitions
14
- } from "./chunk-D6G4N2H2.js";
14
+ } from "./chunk-XGG64VIY.js";
15
15
  import "./chunk-C5GOHBQM.js";
16
16
  import "./chunk-JK6V4KVD.js";
17
17
  import "./chunk-HQDCIXVH.js";
@@ -371,4 +371,4 @@ ${ANSI_DIM}Retrying execution errors...${ANSI_RESET}
371
371
  export {
372
372
  launchInteractiveWizard
373
373
  };
374
- //# sourceMappingURL=interactive-J7SUWZH2.js.map
374
+ //# sourceMappingURL=interactive-F6XECJ33.js.map
@@ -1,25 +1,23 @@
1
1
  # Copy this file to .env and fill in your credentials
2
2
 
3
- # Eval run mode (used by agentv-bench skill)
4
- AGENT_EVAL_MODE=agent # agent | cli
5
-
6
3
  # Azure OpenAI Configuration
7
4
  AZURE_OPENAI_ENDPOINT=https://your-endpoint.openai.azure.com/
8
5
  AZURE_OPENAI_API_KEY=your-openai-api-key-here
9
- AZURE_DEPLOYMENT_NAME=gpt-5-mini
6
+ AZURE_DEPLOYMENT_NAME=gpt-5-chat
10
7
  AZURE_OPENAI_API_VERSION=2024-12-01-preview
11
8
 
12
- # OpenAI
13
- OPENAI_ENDPOINT=https://your-endpoint.openai.azure.com/
14
- OPENAI_API_KEY=your-openai-api-key-here
15
- OPENAI_MODEL=gpt-5-mini
16
-
17
9
  # Google Gemini
18
10
  GOOGLE_GENERATIVE_AI_API_KEY=your-gemini-api-key-here
19
- GEMINI_MODEL_NAME=gemini-3-flash-preview
11
+ GEMINI_MODEL_NAME=gemini-2.5-flash
20
12
 
21
13
  # Anthropic
22
14
  ANTHROPIC_API_KEY=your-anthropic-api-key-here
23
15
 
16
+ # VS Code Workspace Paths for Execution Targets
17
+ # Note: Using forward slashes is recommended for paths in .env files
18
+ # to avoid issues with escape characters.
19
+ PROJECTX_WORKSPACE_PATH=C:/Users/your-username/OneDrive - Company Pty Ltd/sample.code-workspace
20
+
24
21
  # CLI provider sample (used by the local_cli target)
25
- CLI_EVALS_DIR=./docs/examples/simple/evals/local-cli
22
+ CLI_EVALS_DIR=./docs/examples/simple/evals/local-cli
23
+ LOCAL_AGENT_TOKEN=dummytoken
@@ -8,11 +8,6 @@ guideline_patterns:
8
8
  - "**/*.prompt.md"
9
9
  - "**/SKILL.md"
10
10
 
11
- # Execution defaults (overridden by CLI flags)
12
- # execution:
13
- # pool_workspaces: true # Reuse materialized workspaces across eval runs
14
- # pool_slots: 10 # Max pool slots on disk (1-50, default: 10)
15
-
16
11
  # Notes:
17
12
  # - Patterns use standard glob syntax (via micromatch library)
18
13
  # - Paths are normalized to forward slashes for cross-platform compatibility
@@ -10,6 +10,10 @@ targets:
10
10
  model: ${{ AZURE_DEPLOYMENT_NAME }}
11
11
  # version: ${{ AZURE_OPENAI_API_VERSION }} # Optional: uncomment to override default (2024-12-01-preview)
12
12
 
13
+ - name: vscode
14
+ provider: vscode
15
+ judge_target: azure-llm
16
+
13
17
  - name: codex
14
18
  provider: codex
15
19
  judge_target: azure-llm
@@ -39,6 +43,18 @@ targets:
39
43
  log_format: json # Optional: 'summary' (default) or 'json' for raw event logs
40
44
  # system_prompt: optional override (default instructs agent to include code in response)
41
45
 
46
+ - name: vscode_projectx
47
+ provider: vscode
48
+ workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
49
+ provider_batching: false
50
+ judge_target: azure-llm
51
+
52
+ - name: vscode_insiders_projectx
53
+ provider: vscode-insiders
54
+ workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
55
+ provider_batching: false
56
+ judge_target: azure-llm
57
+
42
58
  - name: azure-llm
43
59
  provider: azure
44
60
  endpoint: ${{ AZURE_OPENAI_ENDPOINT }}
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "agentv",
3
- "version": "3.5.0",
3
+ "version": "3.7.0",
4
4
  "description": "CLI entry point for AgentV",
5
5
  "type": "module",
6
6
  "repository": {