agentv 3.9.2 → 3.10.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{chunk-OIVGGWJ3.js → chunk-GWHHM6X2.js} +25 -14
- package/dist/chunk-GWHHM6X2.js.map +1 -0
- package/dist/{chunk-6ZAFWUBT.js → chunk-JLFFYTZA.js} +4 -4
- package/dist/{chunk-JGMJL2LV.js → chunk-TXCVDTEE.js} +8 -7
- package/dist/{chunk-JGMJL2LV.js.map → chunk-TXCVDTEE.js.map} +1 -1
- package/dist/cli.js +3 -3
- package/dist/{dist-PUPHGVKL.js → dist-FPC7J7KQ.js} +2 -2
- package/dist/index.js +3 -3
- package/dist/{interactive-BD56NB23.js → interactive-N463HRIL.js} +3 -3
- package/dist/templates/.agents/skills/agentv-chat-to-eval/README.md +84 -0
- package/dist/templates/.agents/skills/agentv-chat-to-eval/SKILL.md +144 -0
- package/dist/templates/.agents/skills/agentv-chat-to-eval/examples/transcript-json.md +67 -0
- package/dist/templates/.agents/skills/agentv-chat-to-eval/examples/transcript-markdown.md +101 -0
- package/dist/templates/.agents/skills/agentv-eval-builder/SKILL.md +458 -0
- package/dist/templates/.agents/skills/agentv-eval-builder/references/config-schema.json +36 -0
- package/dist/templates/.agents/skills/agentv-eval-builder/references/custom-evaluators.md +118 -0
- package/dist/templates/.agents/skills/agentv-eval-builder/references/eval-schema.json +12753 -0
- package/dist/templates/.agents/skills/agentv-eval-builder/references/rubric-evaluator.md +77 -0
- package/dist/templates/.agents/skills/agentv-eval-orchestrator/SKILL.md +50 -0
- package/dist/templates/.agents/skills/agentv-prompt-optimizer/SKILL.md +78 -0
- package/dist/templates/.agentv/.env.example +25 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/SKILL.md +177 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/batch-cli-evaluator.md +316 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/compare-command.md +137 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/composite-evaluator.md +215 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/config-schema.json +27 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/custom-evaluators.md +115 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/eval-schema.json +278 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/example-evals.md +333 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/rubric-evaluator.md +79 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/structured-data-evaluators.md +121 -0
- package/dist/templates/.claude/skills/agentv-eval-builder/references/tool-trajectory-evaluator.md +298 -0
- package/dist/templates/.claude/skills/agentv-prompt-optimizer/SKILL.md +78 -0
- package/dist/templates/.github/prompts/agentv-eval-build.prompt.md +5 -0
- package/dist/templates/.github/prompts/agentv-optimize.prompt.md +4 -0
- package/package.json +3 -3
- package/dist/chunk-OIVGGWJ3.js.map +0 -1
- /package/dist/{chunk-6ZAFWUBT.js.map → chunk-JLFFYTZA.js.map} +0 -0
- /package/dist/{dist-PUPHGVKL.js.map → dist-FPC7J7KQ.js.map} +0 -0
- /package/dist/{interactive-BD56NB23.js.map → interactive-N463HRIL.js.map} +0 -0
|
@@ -17,7 +17,7 @@ import {
|
|
|
17
17
|
validateEvalFile,
|
|
18
18
|
validateFileReferences,
|
|
19
19
|
validateTargetsFile
|
|
20
|
-
} from "./chunk-JGMJL2LV.js";
|
|
20
|
+
} from "./chunk-TXCVDTEE.js";
|
|
21
21
|
import {
|
|
22
22
|
createBuiltinRegistry,
|
|
23
23
|
createProvider,
|
|
@@ -35,7 +35,7 @@ import {
|
|
|
35
35
|
toSnakeCaseDeep as toSnakeCaseDeep2,
|
|
36
36
|
transpileEvalYamlFile,
|
|
37
37
|
trimBaselineResult
|
|
38
|
-
} from "./chunk-OIVGGWJ3.js";
|
|
38
|
+
} from "./chunk-GWHHM6X2.js";
|
|
39
39
|
import {
|
|
40
40
|
__commonJS,
|
|
41
41
|
__esm,
|
|
@@ -4187,7 +4187,7 @@ var evalRunCommand = command({
|
|
|
4187
4187
|
},
|
|
4188
4188
|
handler: async (args) => {
|
|
4189
4189
|
if (args.evalPaths.length === 0 && process.stdin.isTTY) {
|
|
4190
|
-
const { launchInteractiveWizard } = await import("./interactive-BD56NB23.js");
|
|
4190
|
+
const { launchInteractiveWizard } = await import("./interactive-N463HRIL.js");
|
|
4191
4191
|
await launchInteractiveWizard();
|
|
4192
4192
|
return;
|
|
4193
4193
|
}
|
|
@@ -6287,4 +6287,4 @@ export {
|
|
|
6287
6287
|
preprocessArgv,
|
|
6288
6288
|
runCli
|
|
6289
6289
|
};
|
|
6290
|
-
//# sourceMappingURL=chunk-6ZAFWUBT.js.map
|
|
6290
|
+
//# sourceMappingURL=chunk-JLFFYTZA.js.map
|
|
@@ -27,12 +27,12 @@ import {
|
|
|
27
27
|
subscribeToCopilotCliLogEntries,
|
|
28
28
|
subscribeToCopilotSdkLogEntries,
|
|
29
29
|
subscribeToPiLogEntries
|
|
30
|
-
} from "./chunk-OIVGGWJ3.js";
|
|
30
|
+
} from "./chunk-GWHHM6X2.js";
|
|
31
31
|
|
|
32
32
|
// package.json
|
|
33
33
|
var package_default = {
|
|
34
34
|
name: "agentv",
|
|
35
|
-
version: "3.9.2",
|
|
35
|
+
version: "3.10.1",
|
|
36
36
|
description: "CLI entry point for AgentV",
|
|
37
37
|
type: "module",
|
|
38
38
|
repository: {
|
|
@@ -51,7 +51,7 @@ var package_default = {
|
|
|
51
51
|
dev: "bun src/cli.ts",
|
|
52
52
|
build: "tsup && bun run copy-readme",
|
|
53
53
|
"copy-readme": `bun -e "import { cpSync } from 'fs'; cpSync('../../README.md', 'README.md')"`,
|
|
54
|
-
prepublishOnly: "bun run
|
|
54
|
+
prepublishOnly: `node -e "if(process.env.ALLOW_PUBLISH!=='1'){console.error('ERROR: Use bun run publish:next, then bun run promote:latest');process.exit(1)}"`,
|
|
55
55
|
typecheck: "tsc --noEmit",
|
|
56
56
|
lint: "biome check .",
|
|
57
57
|
format: "biome format --write .",
|
|
@@ -3197,6 +3197,7 @@ async function validateTargetsFile(filePath) {
|
|
|
3197
3197
|
}
|
|
3198
3198
|
const provider = target.provider;
|
|
3199
3199
|
const providerValue = typeof provider === "string" ? provider.trim().toLowerCase() : void 0;
|
|
3200
|
+
const isTemplated = typeof provider === "string" && /^\$\{\{.+\}\}$/.test(provider.trim());
|
|
3200
3201
|
if (typeof provider !== "string" || provider.trim().length === 0) {
|
|
3201
3202
|
errors.push({
|
|
3202
3203
|
severity: "error",
|
|
@@ -3204,7 +3205,7 @@ async function validateTargetsFile(filePath) {
|
|
|
3204
3205
|
location: `${location}.provider`,
|
|
3205
3206
|
message: "Missing or invalid 'provider' field (must be a non-empty string)"
|
|
3206
3207
|
});
|
|
3207
|
-
} else if (!knownProviders.includes(provider)) {
|
|
3208
|
+
} else if (!isTemplated && !knownProviders.includes(provider)) {
|
|
3208
3209
|
errors.push({
|
|
3209
3210
|
severity: "warning",
|
|
3210
3211
|
filePath: absolutePath,
|
|
@@ -3215,7 +3216,7 @@ async function validateTargetsFile(filePath) {
|
|
|
3215
3216
|
if (providerValue === "cli") {
|
|
3216
3217
|
validateCliSettings(target, absolutePath, location, errors);
|
|
3217
3218
|
}
|
|
3218
|
-
if (typeof provider === "string") {
|
|
3219
|
+
if (typeof provider === "string" && !isTemplated) {
|
|
3219
3220
|
validateUnknownSettings(target, provider, absolutePath, location, errors);
|
|
3220
3221
|
}
|
|
3221
3222
|
const graderTarget = target.grader_target ?? target.judge_target;
|
|
@@ -4156,7 +4157,7 @@ async function runEvalCommand(input) {
|
|
|
4156
4157
|
const useFileExport = !!(options.otelFile || options.traceFile);
|
|
4157
4158
|
if (options.exportOtel || useFileExport) {
|
|
4158
4159
|
try {
|
|
4159
|
-
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-PUPHGVKL.js");
|
|
4160
|
+
const { OtelTraceExporter, OTEL_BACKEND_PRESETS } = await import("./dist-FPC7J7KQ.js");
|
|
4160
4161
|
let endpoint = process.env.OTEL_EXPORTER_OTLP_ENDPOINT;
|
|
4161
4162
|
let headers = {};
|
|
4162
4163
|
if (options.otelBackend) {
|
|
@@ -4501,4 +4502,4 @@ export {
|
|
|
4501
4502
|
selectTarget,
|
|
4502
4503
|
runEvalCommand
|
|
4503
4504
|
};
|
|
4504
|
-
//# sourceMappingURL=chunk-JGMJL2LV.js.map
|
|
4505
|
+
//# sourceMappingURL=chunk-TXCVDTEE.js.map
|