agentv 0.7.5 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +82 -37
- package/dist/{chunk-J3LVKRRT.js → chunk-X2VVUCIB.js} +260 -161
- package/dist/chunk-X2VVUCIB.js.map +1 -0
- package/dist/cli.js +1 -1
- package/dist/index.js +1 -1
- package/dist/templates/agentv/targets.yaml +35 -43
- package/package.json +2 -2
- package/dist/chunk-J3LVKRRT.js.map +0 -1
package/dist/cli.js
CHANGED
package/dist/index.js
CHANGED
package/dist/templates/agentv/targets.yaml
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
$schema: agentv-targets-v2
|
|
1
|
+
$schema: agentv-targets-v2.2
|
|
2
2
|
|
|
3
3
|
# A list of all supported evaluation targets for the project.
|
|
4
4
|
# Each target defines a provider and its specific configuration.
|
|
@@ -7,10 +7,9 @@ $schema: agentv-targets-v2
|
|
|
7
7
|
targets:
|
|
8
8
|
- name: default
|
|
9
9
|
provider: azure
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
model: AZURE_DEPLOYMENT_NAME
|
|
10
|
+
endpoint: ${{ AZURE_OPENAI_ENDPOINT }}
|
|
11
|
+
api_key: ${{ AZURE_OPENAI_API_KEY }}
|
|
12
|
+
model: ${{ AZURE_DEPLOYMENT_NAME }}
|
|
14
13
|
|
|
15
14
|
- name: vscode
|
|
16
15
|
provider: vscode
|
|
@@ -19,56 +18,49 @@ targets:
|
|
|
19
18
|
- name: codex
|
|
20
19
|
provider: codex
|
|
21
20
|
judge_target: azure_base
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
log_format: json # Optional: 'summary' (default) or 'json' for raw event logs
|
|
21
|
+
# Uses the Codex CLI (defaults to `codex` on PATH)
|
|
22
|
+
# executable: ${{ CODEX_CLI_PATH }} # Optional: override executable path
|
|
23
|
+
# args: # Optional additional CLI arguments
|
|
24
|
+
# - --profile
|
|
25
|
+
# - ${{ CODEX_PROFILE }}
|
|
26
|
+
# - --model
|
|
27
|
+
# - ${{ CODEX_MODEL }}
|
|
28
|
+
# - --ask-for-approval
|
|
29
|
+
# - ${{ CODEX_APPROVAL_PRESET }}
|
|
30
|
+
timeout_seconds: 180
|
|
31
|
+
cwd: ${{ CODEX_WORKSPACE_DIR }} # Where scratch workspaces are created
|
|
32
|
+
log_dir: ${{ CODEX_LOG_DIR }} # Optional: where Codex CLI stream logs are stored (defaults to ./.agentv/logs/codex)
|
|
33
|
+
log_format: json # Optional: 'summary' (default) or 'json' for raw event logs
|
|
36
34
|
|
|
37
35
|
- name: vscode_projectx
|
|
38
36
|
provider: vscode
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
provider_batching: false
|
|
37
|
+
workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
|
|
38
|
+
provider_batching: false
|
|
42
39
|
judge_target: azure_base
|
|
43
40
|
|
|
44
41
|
- name: vscode_insiders_projectx
|
|
45
42
|
provider: vscode-insiders
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
provider_batching: false
|
|
43
|
+
workspace_template: ${{ PROJECTX_WORKSPACE_PATH }}
|
|
44
|
+
provider_batching: false
|
|
49
45
|
judge_target: azure_base
|
|
50
46
|
|
|
51
47
|
- name: azure_base
|
|
52
48
|
provider: azure
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
model: AZURE_DEPLOYMENT_NAME
|
|
49
|
+
endpoint: ${{ AZURE_OPENAI_ENDPOINT }}
|
|
50
|
+
api_key: ${{ AZURE_OPENAI_API_KEY }}
|
|
51
|
+
model: ${{ AZURE_DEPLOYMENT_NAME }}
|
|
57
52
|
|
|
58
53
|
- name: local_cli
|
|
59
54
|
provider: cli
|
|
60
55
|
judge_target: azure_base
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
healthcheck:
|
|
73
|
-
type: command
|
|
74
|
-
command_template: uv run ./mock_cli.py --healthcheck
|
|
56
|
+
# Passes the fully rendered prompt and any attached files to a local Python script
|
|
57
|
+
# NOTE: Do not add quotes around {PROMPT} or {FILES} - they are already shell-escaped
|
|
58
|
+
command_template: uv run ./mock_cli.py --prompt {PROMPT} {FILES}
|
|
59
|
+
# Format for each file in {FILES}. {path} and {basename} are automatically shell-escaped, so no quotes needed
|
|
60
|
+
files_format: --file {path}
|
|
61
|
+
# Optional working directory resolved from .env
|
|
62
|
+
cwd: ${{ CLI_EVALS_DIR }}
|
|
63
|
+
timeout_seconds: 30
|
|
64
|
+
healthcheck:
|
|
65
|
+
type: command
|
|
66
|
+
command_template: uv run ./mock_cli.py --healthcheck
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "agentv",
|
|
3
|
-
"version": "0.7.5",
|
|
3
|
+
"version": "0.9.0",
|
|
4
4
|
"description": "CLI entry point for AgentV",
|
|
5
5
|
"type": "module",
|
|
6
6
|
"repository": {
|
|
@@ -24,7 +24,7 @@
|
|
|
24
24
|
"dotenv": "^16.4.5",
|
|
25
25
|
"micromatch": "^4.0.8",
|
|
26
26
|
"yaml": "^2.6.1",
|
|
27
|
-
"@agentv/core": "0.7.5"
|
|
27
|
+
"@agentv/core": "0.9.0"
|
|
28
28
|
},
|
|
29
29
|
"devDependencies": {
|
|
30
30
|
"execa": "^9.3.0"
|