npm - agentv - Versions diffs - 4.26.1 → 4.27.0 - Mend

agentv 4.26.1 → 4.27.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42)

package/dist/{chunk-XBUHMRX2.js → chunk-PH5MHKPL.js} RENAMED

@@ -45,7 +45,7 @@ import {
   validateFileReferences,
   validateTargetsFile,
   validateWorkspacePaths
-} from "./chunk-JA4WQNE6.js";
+} from "./chunk-VO3THAOI.js";
 import {
   RESULT_INDEX_FILENAME,
   aggregateRunDir,
@@ -863,7 +863,7 @@ var require_src = __commonJS({
 });
 // src/index.ts
-import path26 from "node:path";
+import path27 from "node:path";
 // ../../node_modules/.bun/chalk@5.6.2/node_modules/chalk/source/vendor/ansi-styles/index.js
 var ANSI_BACKGROUND_OFFSET = 10;
@@ -3997,7 +3997,7 @@ var evalRunCommand = command({
   },
   handler: async (args) => {
     if (args.evalPaths.length === 0 && process.stdin.isTTY) {
-      const { launchInteractiveWizard } = await import("./interactive-YMKWKPD7.js");
+      const { launchInteractiveWizard } = await import("./interactive-UG4YNLYK.js");
       await launchInteractiveWizard();
       return;
     }
@@ -4599,9 +4599,11 @@ function readTemplatesRecursively(dir, relativePath) {
 // src/commands/init/index.ts
 function printSkillFirstInstructions() {
   console.log("\nAI-skills-first setup (recommended):");
+  console.log("  agentv skills get agentv-bench");
+  console.log('  Then ask your agent: "Set up AgentV in this repo."');
+  console.log("\nOr install the agentv-dev plugin for automatic skill discovery:");
   console.log("  npx allagents plugin marketplace add EntityProcess/agentv");
   console.log("  npx allagents plugin install agentv-dev@agentv");
-  console.log('  Then ask your agent: "Set up AgentV in this repo."');
 }
 async function promptYesNo(message) {
   const rl = readline.createInterface({
@@ -6489,9 +6491,34 @@ var evalInputCommand = command({
       test_ids: testIds
     });
     console.log(`Extracted ${testIds.length} test(s) to ${outDir}`);
+    if (targetKind === "agent") {
+      console.log(`
+  Target: ${targetName} (subagent-as-target mode)`);
+      console.log(`  Tests:  ${testIds.join(", ")}`);
+      console.log("");
+      console.log("  Next steps for the orchestrating agent:");
+      console.log("  1. Dispatch executor subagents \u2014 one per test case (all in parallel):");
+      console.log("     - Each reads <run-dir>/<test-id>/input.json");
+      console.log("     - Executes the task, writes <run-dir>/<test-id>/response.md");
+      console.log("  2. Run code graders:  agentv pipeline grade <run-dir>");
+      console.log(
+        "  3. Dispatch grader subagents \u2014 one per (test \xD7 LLM grader) pair (all in parallel):"
+      );
+      console.log(
+        "     - Read agents/grader.md and embed its content as system instructions in each subagent prompt"
+      );
+      console.log("     - Each subagent reads llm_graders/<name>.json + response.md for its test");
+      console.log("     - Each writes llm_grader_results/<name>.json");
+      console.log("  4. Merge scores:     agentv pipeline bench <run-dir>");
+      console.log("");
+      console.log("  For the full procedure:");
+      console.log("    agentv skills get agentv-bench --ref subagent-pipeline");
+      console.log("");
+    }
   }
 });
 async function writeGraderConfigs(testDir, assertions, evalDir) {
+  const counts = { codeGraders: 0, llmGraders: 0, builtinAssertions: 0 };
   const codeGradersDir = join3(testDir, "code_graders");
   const llmGradersDir = join3(testDir, "llm_graders");
   let hasCodeGraders = false;
@@ -6527,9 +6554,19 @@ async function writeGraderConfigs(testDir, assertions, evalDir) {
       } else if (typeof config.prompt === "string") {
         promptContent = config.prompt;
       }
+      const rubrics = config.rubrics;
+      const rubricsData = rubrics?.map((r) => ({
+        id: r.id,
+        outcome: r.outcome,
+        weight: r.weight ?? 1,
+        ...r.score_ranges ? { score_range: r.score_ranges } : {},
+        ...r.required !== void 0 ? { required: r.required } : {},
+        ...r.required_min_score !== void 0 ? { required_min_score: r.required_min_score } : {}
+      }));
       await writeJson(join3(llmGradersDir, `${config.name}.json`), {
         name: config.name,
         prompt_content: promptContent,
+        ...rubricsData && rubricsData.length > 0 ? { rubrics: rubricsData } : {},
         weight: config.weight ?? 1,
         threshold: 0.5,
         config: {}
@@ -6550,6 +6587,7 @@ async function writeGraderConfigs(testDir, assertions, evalDir) {
       });
     }
   }
+  return counts;
 }
 async function writeJson(filePath, data) {
   await writeFile7(filePath, `${JSON.stringify(data, null, 2)}
@@ -6591,7 +6629,7 @@ function loadEnvFile(dir) {
 }
 var evalRunCommand2 = command({
   name: "run",
-  description: "Extract inputs, invoke CLI targets, and run code graders in one step",
+  description: "Extract inputs, invoke CLI targets, and run code graders (for agent targets, use pipeline input + subagents)",
   args: {
     evalPath: positional({
       type: string,
@@ -6823,14 +6861,46 @@ var evalRunCommand2 = command({
       await Promise.all(pending);
       process.stderr.write("\n");
     } else {
-      console.log("Subagent-as-target mode \u2014 skipping CLI invocation.");
+      console.log("Subagent-as-target mode \u2014 the agent IS the target.");
+      console.log("");
+      console.log("  What happened: pipeline extracted inputs but did NOT invoke a CLI target.");
+      console.log(
+        "  The orchestrating agent must dispatch executor subagents to process each test."
+      );
+      console.log("");
+      console.log("  Next steps:");
+      console.log("  1. Dispatch executor subagents \u2014 one per test case (all in parallel):");
+      console.log("     - Each reads <run-dir>/<test-id>/input.json");
+      console.log("     - Executes the task, writes <run-dir>/<test-id>/response.md");
+      console.log("  2. Run code graders:   agentv pipeline grade <run-dir>");
+      console.log(
+        "  3. Dispatch grader subagents \u2014 one per (test x LLM grader) pair (all in parallel):"
+      );
+      console.log(
+        "     - Read agents/grader.md and embed its content as system instructions in each subagent prompt"
+      );
+      console.log("     - Each subagent reads llm_graders/<name>.json + response.md");
+      console.log("     - Each writes llm_grader_results/<name>.json");
+      console.log("  4. Merge scores:       agentv pipeline bench <run-dir>");
+      console.log("");
+      console.log("  For the full procedure:");
+      console.log("    agentv skills get agentv-bench --ref subagent-pipeline");
+      console.log("");
     }
     if (graderType !== "code") {
       console.log(`
 Done. Results in ${outDir}`);
-      console.log(
-        "To run code graders: agentv pipeline grade <run-dir>  (or re-run with --grader-type code)"
-      );
+      console.log("");
+      if (targetKind === "agent") {
+        console.log("  The agent must now:");
+        console.log("  1. Dispatch executor subagents to generate response.md files");
+        console.log("  2. Run code graders:   agentv pipeline grade <run-dir>");
+        console.log("  3. Dispatch grader subagents for llm_graders/ configs");
+        console.log("  4. Merge scores:       agentv pipeline bench <run-dir>");
+      } else {
+        console.log("  To run code graders: agentv pipeline grade <run-dir>");
+        console.log("  Or re-run with --grader-type code to grade inline.");
+      }
       return;
     }
     const graderTasks = [];
@@ -6856,8 +6926,15 @@ Done. Results in ${outDir}`);
     const graderConcurrency = workers ?? 10;
     const { totalGraders, totalPassed } = await runCodeGraders(graderTasks, graderConcurrency);
     console.log(`Graded ${totalGraders} code-grader(s): ${totalPassed} passed`);
-    console.log(`
-Done. Agent can now perform LLM grading on responses in ${outDir}`);
+    console.log("");
+    console.log(`Results in ${outDir}`);
+    console.log("");
+    console.log("  Remaining steps:");
+    console.log("  1. If llm_graders/ configs exist, dispatch grader subagents");
+    console.log(
+      "     - Read agents/grader.md, embed as system instructions in each subagent prompt"
+    );
+    console.log("  2. Merge all scores: agentv pipeline bench <run-dir>");
   }
 });
 async function writeJson2(filePath, data) {
@@ -6899,9 +6976,19 @@ async function writeGraderConfigs2(testDir, assertions, evalDir) {
       } else if (typeof config.prompt === "string") {
         promptContent = config.prompt;
       }
+      const rubrics = config.rubrics;
+      const rubricsData = rubrics?.map((r) => ({
+        id: r.id,
+        outcome: r.outcome,
+        weight: r.weight ?? 1,
+        ...r.score_ranges ? { score_range: r.score_ranges } : {},
+        ...r.required !== void 0 ? { required: r.required } : {},
+        ...r.required_min_score !== void 0 ? { required_min_score: r.required_min_score } : {}
+      }));
       await writeJson2(join4(llmGradersDir, `${config.name}.json`), {
         name: config.name,
         prompt_content: promptContent,
+        ...rubricsData && rubricsData.length > 0 ? { rubrics: rubricsData } : {},
         weight: config.weight ?? 1,
         threshold: 0.5,
         config: {}
@@ -6913,7 +7000,7 @@ async function writeGraderConfigs2(testDir, assertions, evalDir) {
 // src/commands/pipeline/index.ts
 var pipelineCommand = subcommands({
   name: "pipeline",
-  description: "Agent-mode eval pipeline commands (input \u2192 grade \u2192 bench)",
+  description: "Subagent-mode eval pipeline (input \u2192 executor subagents \u2192 grade \u2192 bench) \u2014 use this when the eval target is an AI agent (Claude, Codex, etc.)",
   cmds: {
     input: evalInputCommand,
     grade: evalGradeCommand,
@@ -11007,9 +11094,302 @@ var selfCommand = subcommands({
   }
 });
+// src/commands/skills/index.ts
+import { existsSync as existsSync15, readFileSync as readFileSync13, readdirSync as readdirSync5 } from "node:fs";
+import path20 from "node:path";
+import { fileURLToPath as fileURLToPath4 } from "node:url";
+function isValidSkillsDir(dir) {
+  if (!existsSync15(dir)) return false;
+  try {
+    return readdirSync5(dir, { withFileTypes: true }).some(
+      (e) => e.isDirectory() && existsSync15(path20.join(dir, e.name, "SKILL.md"))
+    );
+  } catch {
+    return false;
+  }
+}
+function findSkillsDir() {
+  const selfFile = fileURLToPath4(import.meta.url);
+  let dir = path20.dirname(selfFile);
+  for (let i = 0; i < 6; i++) {
+    const distCandidate = path20.join(dir, "dist", "skills");
+    if (isValidSkillsDir(distCandidate)) return distCandidate;
+    const repoRootCandidate = path20.join(dir, "skills-data");
+    if (isValidSkillsDir(repoRootCandidate)) return repoRootCandidate;
+    const legacyCandidate = path20.join(dir, "skills");
+    if (isValidSkillsDir(legacyCandidate)) return legacyCandidate;
+    dir = path20.dirname(dir);
+  }
+  return null;
+}
+function requireSkillsDir() {
+  const dir = findSkillsDir();
+  if (!dir) {
+    console.error(
+      "Error: bundled skills directory not found. This is a build issue \u2014 please reinstall agentv."
+    );
+    process.exit(1);
+  }
+  return dir;
+}
+function listSkillNames(skillsDir) {
+  if (!existsSync15(skillsDir)) return [];
+  return readdirSync5(skillsDir, { withFileTypes: true }).filter((e) => e.isDirectory()).map((e) => e.name).sort();
+}
+function readSkillFile(skillDir, relPath) {
+  const full = path20.join(skillDir, relPath);
+  if (!existsSync15(full)) return null;
+  return readFileSync13(full, "utf-8");
+}
+function collectDir(dir, prefix = "") {
+  const result = {};
+  if (!existsSync15(dir)) return result;
+  for (const entry of readdirSync5(dir, { withFileTypes: true })) {
+    const relPath = prefix ? `${prefix}/${entry.name}` : entry.name;
+    if (entry.isDirectory()) {
+      Object.assign(result, collectDir(path20.join(dir, entry.name), relPath));
+    } else {
+      result[relPath] = readFileSync13(path20.join(dir, entry.name), "utf-8");
+    }
+  }
+  return result;
+}
+function listSkillSubdirs(skillDir) {
+  if (!existsSync15(skillDir)) return [];
+  return readdirSync5(skillDir, { withFileTypes: true }).filter((e) => e.isDirectory() && !e.name.startsWith(".")).map((e) => e.name).sort();
+}
+function readSkill(skillsDir, name, full) {
+  const skillDir = path20.join(skillsDir, name);
+  if (!existsSync15(skillDir)) return null;
+  const content = readSkillFile(skillDir, "SKILL.md");
+  if (content === null) return null;
+  if (!full) return { name, content };
+  const files = {};
+  for (const sub of listSkillSubdirs(skillDir)) {
+    const subDir = path20.join(skillDir, sub);
+    const collected = collectDir(subDir, sub);
+    Object.assign(files, collected);
+  }
+  return { name, content, files: Object.keys(files).length > 0 ? files : void 0 };
+}
+function findRefFile(skillDir, refName) {
+  const candidates = refName.endsWith(".md") ? [refName] : [refName, `${refName}.md`];
+  for (const sub of listSkillSubdirs(skillDir)) {
+    for (const candidate of candidates) {
+      const filePath = path20.join(skillDir, sub, candidate);
+      if (existsSync15(filePath)) {
+        return { relPath: `${sub}/${candidate}`, content: readFileSync13(filePath, "utf-8") };
+      }
+    }
+  }
+  for (const candidate of candidates) {
+    const filePath = path20.join(skillDir, candidate);
+    if (existsSync15(filePath)) {
+      return { relPath: candidate, content: readFileSync13(filePath, "utf-8") };
+    }
+  }
+  return null;
+}
+function listRefFiles(skillDir) {
+  const out = [];
+  for (const sub of listSkillSubdirs(skillDir)) {
+    const subDir = path20.join(skillDir, sub);
+    for (const entry of readdirSync5(subDir, { withFileTypes: true })) {
+      if (entry.isFile()) out.push(`${sub}/${entry.name}`);
+    }
+  }
+  return out.sort();
+}
+function printSkill(skill, json) {
+  if (json) {
+    process.stdout.write(`${JSON.stringify({ success: true, data: [skill] })}
+`);
+    return;
+  }
+  process.stdout.write(skill.content);
+  if (!skill.content.endsWith("\n")) process.stdout.write("\n");
+  if (skill.files) {
+    for (const [relPath, content] of Object.entries(skill.files)) {
+      process.stdout.write(`
+--- ${relPath} ---
+`);
+      process.stdout.write(content);
+      if (!content.endsWith("\n")) process.stdout.write("\n");
+    }
+  }
+}
+var skillsListCommand = command({
+  name: "list",
+  description: "List available bundled skills",
+  args: {
+    json: flag({ long: "json", description: "Output as JSON" })
+  },
+  handler: ({ json }) => {
+    const skillsDir = requireSkillsDir();
+    const names = listSkillNames(skillsDir);
+    if (json) {
+      process.stdout.write(`${JSON.stringify({ success: true, data: names })}
+`);
+    } else {
+      for (const name of names) {
+        console.log(name);
+      }
+    }
+  }
+});
+var skillsGetCommand = command({
+  name: "get",
+  description: "Get skill content by name (or --all for all skills)",
+  args: {
+    name: positional({ type: optional(string), displayName: "name", description: "Skill name" }),
+    all: flag({ long: "all", description: "Get all skills" }),
+    full: flag({
+      long: "full",
+      description: "Also include all files under subdirectories (references/, scripts/, agents/, etc.)"
+    }),
+    ref: option({
+      type: optional(string),
+      long: "ref",
+      description: "Load a single file from the skill by relative path (searches all subdirectories). Takes precedence over --full."
+    }),
+    json: flag({ long: "json", description: "Output as JSON" })
+  },
+  handler: ({ name, all, full, ref, json }) => {
+    const skillsDir = requireSkillsDir();
+    if (ref !== void 0 && all) {
+      const msg = "--ref is incompatible with --all";
+      if (json) {
+        process.stdout.write(`${JSON.stringify({ success: false, error: msg })}
+`);
+      } else {
+        console.error(`Error: ${msg}`);
+      }
+      process.exit(1);
+    }
+    if (ref !== void 0) {
+      if (name === void 0) {
+        const msg = "--ref requires a skill name";
+        if (json) {
+          process.stdout.write(`${JSON.stringify({ success: false, error: msg })}
+`);
+        } else {
+          console.error(`Error: ${msg}`);
+        }
+        process.exit(1);
+      }
+      const skillDir = path20.join(skillsDir, name);
+      if (!existsSync15(skillDir)) {
+        const msg = `skill '${name}' not found`;
+        if (json) {
+          process.stdout.write(`${JSON.stringify({ success: false, error: msg })}
+`);
+        } else {
+          console.error(`Error: ${msg}`);
+          const available = listSkillNames(skillsDir);
+          if (available.length > 0) {
+            console.error(`Available skills: ${available.join(", ")}`);
+          }
+        }
+        process.exit(1);
+      }
+      const file = findRefFile(skillDir, ref);
+      if (!file) {
+        const msg = `reference '${ref}' not found in skill '${name}'`;
+        if (json) {
+          process.stdout.write(`${JSON.stringify({ success: false, error: msg })}
+`);
+        } else {
+          console.error(`Error: ${msg}`);
+          const available = listRefFiles(skillDir);
+          if (available.length > 0) {
+            console.error(`Available reference files:
+  ${available.join("\n  ")}`);
+          }
+        }
+        process.exit(1);
+      }
+      if (json) {
+        process.stdout.write(
+          `${JSON.stringify({ success: true, data: [{ name, content: file.content, files: { [file.relPath]: file.content } }] })}
+`
+        );
+        return;
+      }
+      process.stdout.write(file.content);
+      if (!file.content.endsWith("\n")) process.stdout.write("\n");
+      return;
+    }
+    if (all || name === void 0) {
+      const names = listSkillNames(skillsDir);
+      const skills = names.map((n) => readSkill(skillsDir, n, full)).filter((s) => s !== null);
+      if (json) {
+        process.stdout.write(`${JSON.stringify({ success: true, data: skills })}
+`);
+        return;
+      }
+      for (const skill2 of skills) {
+        if (skills.length > 1) {
+          process.stdout.write(`
+=== ${skill2.name} ===
+`);
+        }
+        printSkill(skill2, false);
+      }
+      return;
+    }
+    const skill = readSkill(skillsDir, name, full);
+    if (!skill) {
+      if (json) {
+        process.stdout.write(
+          `${JSON.stringify({ success: false, error: `Skill '${name}' not found` })}
+`
+        );
+      } else {
+        console.error(`Error: skill '${name}' not found`);
+        const available = listSkillNames(skillsDir);
+        if (available.length > 0) {
+          console.error(`Available skills: ${available.join(", ")}`);
+        }
+      }
+      process.exit(1);
+    }
+    printSkill(skill, json);
+  }
+});
+var skillsPathCommand = command({
+  name: "path",
+  description: "Print path to bundled skills directory (or specific skill directory)",
+  args: {
+    name: positional({ type: optional(string), displayName: "name", description: "Skill name" })
+  },
+  handler: ({ name }) => {
+    const skillsDir = requireSkillsDir();
+    if (name) {
+      const skillDir = path20.join(skillsDir, name);
+      if (!existsSync15(skillDir)) {
+        console.error(`Error: skill '${name}' not found`);
+        process.exit(1);
+      }
+      console.log(skillDir);
+    } else {
+      console.log(skillsDir);
+    }
+  }
+});
+var skillsCommand = subcommands({
+  name: "skills",
+  description: "List and retrieve bundled AgentV skills",
+  cmds: {
+    list: skillsListCommand,
+    get: skillsGetCommand,
+    path: skillsPathCommand
+  }
+});
 // src/commands/transpile/index.ts
 import { writeFileSync as writeFileSync7 } from "node:fs";
-import path20 from "node:path";
+import path21 from "node:path";
 var transpileCommand = command({
   name: "transpile",
   description: "Convert an EVAL.yaml file to Agent Skills evals.json format",
@@ -11033,7 +11413,7 @@ var transpileCommand = command({
   handler: async ({ input, outDir, stdout }) => {
     let result;
     try {
-      result = transpileEvalYamlFile(path20.resolve(input));
+      result = transpileEvalYamlFile(path21.resolve(input));
     } catch (error) {
       console.error(`Error: ${error.message}`);
       process.exit(1);
@@ -11057,11 +11437,11 @@ var transpileCommand = command({
       process.stdout.write("\n");
       return;
     }
-    const outputDir = outDir ? path20.resolve(outDir) : path20.dirname(path20.resolve(input));
+    const outputDir = outDir ? path21.resolve(outDir) : path21.dirname(path21.resolve(input));
     const fileNames = getOutputFilenames(result);
     for (const [skill, evalsJson] of result.files) {
       const fileName = fileNames.get(skill) ?? "evals.json";
-      const outputPath = path20.join(outputDir, fileName);
+      const outputPath = path21.join(outputDir, fileName);
       writeFileSync7(outputPath, `${JSON.stringify(evalsJson, null, 2)}
 `);
       console.log(`Transpiled to ${outputPath}`);
@@ -11070,7 +11450,7 @@ var transpileCommand = command({
 });
 // src/commands/trend/index.ts
-import path21 from "node:path";
+import path22 from "node:path";
 var colors2 = {
   reset: "\x1B[0m",
   bold: "\x1B[1m",
@@ -11120,7 +11500,7 @@ function colorizeSlope(value) {
 }
 function ensureTrendIndexPath(source, cwd) {
   const resolved = resolveResultSourcePath(source, cwd);
-  if (path21.basename(resolved) !== RESULT_INDEX_FILENAME) {
+  if (path22.basename(resolved) !== RESULT_INDEX_FILENAME) {
     throw new Error(
       `Unsupported result source for trend: ${source}. Use a run workspace directory or ${RESULT_INDEX_FILENAME} manifest.`
     );
@@ -11140,7 +11520,7 @@ function resolveTrendSources(cwd, sources, last) {
   if (last < 2) {
     throw new Error("--last must be at least 2");
   }
-  const metas = listResultFiles(cwd).filter((meta) => path21.basename(meta.path) === RESULT_INDEX_FILENAME).slice(0, last);
+  const metas = listResultFiles(cwd).filter((meta) => path22.basename(meta.path) === RESULT_INDEX_FILENAME).slice(0, last);
   if (metas.length < 2) {
     throw new Error(
       "Trend analysis requires at least 2 canonical run workspaces in .agentv/results/runs/"
@@ -11155,10 +11535,10 @@ function getRunLabel(sourcePath, timestamp) {
   if (timestamp) {
     return timestamp;
   }
-  return path21.basename(path21.dirname(sourcePath));
+  return path22.basename(path22.dirname(sourcePath));
 }
 function getRunSortKey(sourcePath, timestamp) {
-  return timestamp ?? path21.basename(path21.dirname(sourcePath));
+  return timestamp ?? path22.basename(path22.dirname(sourcePath));
 }
 function mean2(values) {
   return values.reduce((sum, value) => sum + value, 0) / values.length;
@@ -11413,7 +11793,7 @@ var trendCommand = command({
 });
 // src/commands/trim/index.ts
-import { readFileSync as readFileSync13, writeFileSync as writeFileSync8 } from "node:fs";
+import { readFileSync as readFileSync14, writeFileSync as writeFileSync8 } from "node:fs";
 var trimCommand = command({
   name: "trim",
   description: "Trim evaluation results for baseline storage (strips debug/audit fields)",
@@ -11432,7 +11812,7 @@ var trimCommand = command({
   },
   handler: async ({ input, out }) => {
     try {
-      const content = readFileSync13(input, "utf8");
+      const content = readFileSync14(input, "utf8");
       const lines = content.trim().split("\n").filter((line) => line.trim());
       const trimmedLines = lines.map((line) => {
         const record = JSON.parse(line);
@@ -11539,7 +11919,7 @@ function isTTY() {
 // src/commands/validate/validate-files.ts
 import { constants } from "node:fs";
 import { access, readdir as readdir4, stat } from "node:fs/promises";
-import path22 from "node:path";
+import path23 from "node:path";
 import fg2 from "fast-glob";
 async function validateFiles(paths) {
   const filePaths = await expandPaths(paths);
@@ -11554,7 +11934,7 @@ async function validateFiles(paths) {
   };
 }
 async function validateSingleFile(filePath) {
-  const absolutePath = path22.resolve(filePath);
+  const absolutePath = path23.resolve(filePath);
   const fileType = await detectFileType(absolutePath);
   let result;
   if (fileType === "eval") {
@@ -11598,7 +11978,7 @@ async function validateSingleFile(filePath) {
 async function expandPaths(paths) {
   const expanded = /* @__PURE__ */ new Set();
   for (const inputPath of paths) {
-    const absolutePath = path22.resolve(inputPath);
+    const absolutePath = path23.resolve(inputPath);
     try {
       await access(absolutePath, constants.F_OK);
       const stats = await stat(absolutePath);
@@ -11626,7 +12006,7 @@ async function expandPaths(paths) {
     if (yamlMatches.length === 0) {
       console.warn(`Warning: No YAML files matched pattern: ${inputPath}`);
     }
-    for (const f of yamlMatches) expanded.add(path22.normalize(f));
+    for (const f of yamlMatches) expanded.add(path23.normalize(f));
   }
   const sorted = Array.from(expanded);
   sorted.sort();
@@ -11637,7 +12017,7 @@ async function findYamlFiles(dirPath) {
   try {
     const entries2 = await readdir4(dirPath, { withFileTypes: true });
     for (const entry of entries2) {
-      const fullPath = path22.join(dirPath, entry.name);
+      const fullPath = path23.join(dirPath, entry.name);
       if (entry.isDirectory()) {
         if (entry.name === "node_modules" || entry.name.startsWith(".")) {
           continue;
@@ -11654,11 +12034,11 @@ async function findYamlFiles(dirPath) {
   return results;
 }
 function isYamlFile(filePath) {
-  const ext = path22.extname(filePath).toLowerCase();
+  const ext = path23.extname(filePath).toLowerCase();
   return ext === ".yaml" || ext === ".yml";
 }
 function isEvalYamlFile(filePath) {
-  const lower = path22.basename(filePath).toLowerCase();
+  const lower = path23.basename(filePath).toLowerCase();
   return lower.endsWith(".eval.yaml") || lower.endsWith(".eval.yml");
 }
@@ -11713,9 +12093,9 @@ var validateCommand = command({
 });
 // src/commands/workspace/clean.ts
-import { existsSync as existsSync15 } from "node:fs";
+import { existsSync as existsSync16 } from "node:fs";
 import { readFile as readFile6, readdir as readdir5, rm } from "node:fs/promises";
-import path23 from "node:path";
+import path24 from "node:path";
 async function confirm(message) {
   const readline2 = await import("node:readline");
   const rl = readline2.createInterface({ input: process.stdin, output: process.stdout });
@@ -11742,7 +12122,7 @@ var cleanCommand = command({
   },
   handler: async ({ repo, force }) => {
     const poolRoot = getWorkspacePoolRoot();
-    if (!existsSync15(poolRoot)) {
+    if (!existsSync16(poolRoot)) {
       console.log("No workspace pool entries found.");
       return;
     }
@@ -11751,8 +12131,8 @@ var cleanCommand = command({
       const poolDirs = entries2.filter((e) => e.isDirectory());
       const matchingDirs = [];
       for (const dir of poolDirs) {
-        const poolDir = path23.join(poolRoot, dir.name);
-        const metadataPath = path23.join(poolDir, "metadata.json");
+        const poolDir = path24.join(poolRoot, dir.name);
+        const metadataPath = path24.join(poolDir, "metadata.json");
         try {
           const raw = await readFile6(metadataPath, "utf-8");
           const metadata = JSON.parse(raw);
@@ -11783,7 +12163,7 @@ var cleanCommand = command({
       }
       for (const dir of matchingDirs) {
         await rm(dir, { recursive: true, force: true });
-        console.log(`Removed: ${path23.basename(dir).slice(0, 12)}...`);
+        console.log(`Removed: ${path24.basename(dir).slice(0, 12)}...`);
       }
       console.log("Done.");
     } else {
@@ -11801,7 +12181,7 @@ var cleanCommand = command({
 });
 // src/commands/workspace/deps.ts
-import path24 from "node:path";
+import path25 from "node:path";
 var depsCommand = command({
   name: "deps",
   description: "Scan eval files and list git repo dependencies needed by workspaces",
@@ -11825,7 +12205,7 @@ var depsCommand = command({
     const resolvedPaths = await resolveEvalPaths(evalPaths, cwd);
     const result = await scanRepoDeps(resolvedPaths);
     for (const err2 of result.errors) {
-      console.error(`warning: ${path24.relative(cwd, err2.file)}: ${err2.message}`);
+      console.error(`warning: ${path25.relative(cwd, err2.file)}: ${err2.message}`);
     }
     const output = {
       repos: result.repos.map((r) => ({
@@ -11833,7 +12213,7 @@ var depsCommand = command({
         ...r.ref !== void 0 && { ref: r.ref },
         ...r.clone !== void 0 && { clone: r.clone },
         ...r.checkout !== void 0 && { checkout: r.checkout },
-        ...usedBy && { used_by: r.usedBy.map((p) => path24.relative(cwd, p)) }
+        ...usedBy && { used_by: r.usedBy.map((p) => path25.relative(cwd, p)) }
       }))
     };
     console.log(JSON.stringify(output, null, 2));
@@ -11841,15 +12221,15 @@ var depsCommand = command({
 });
 // src/commands/workspace/list.ts
-import { existsSync as existsSync16 } from "node:fs";
+import { existsSync as existsSync17 } from "node:fs";
 import { readFile as readFile7, readdir as readdir6, stat as stat2 } from "node:fs/promises";
-import path25 from "node:path";
+import path26 from "node:path";
 async function getDirectorySize(dirPath) {
   let totalSize = 0;
   try {
     const entries2 = await readdir6(dirPath, { withFileTypes: true });
     for (const entry of entries2) {
-      const fullPath = path25.join(dirPath, entry.name);
+      const fullPath = path26.join(dirPath, entry.name);
       if (entry.isDirectory()) {
         totalSize += await getDirectorySize(fullPath);
       } else {
@@ -11873,7 +12253,7 @@ var listCommand = command({
   args: {},
   handler: async () => {
     const poolRoot = getWorkspacePoolRoot();
-    if (!existsSync16(poolRoot)) {
+    if (!existsSync17(poolRoot)) {
       console.log("No workspace pool entries found.");
       return;
     }
@@ -11884,11 +12264,11 @@ var listCommand = command({
       return;
     }
     for (const dir of poolDirs) {
-      const poolDir = path25.join(poolRoot, dir.name);
+      const poolDir = path26.join(poolRoot, dir.name);
       const fingerprint = dir.name;
       const poolEntries = await readdir6(poolDir, { withFileTypes: true });
       const slots = poolEntries.filter((e) => e.isDirectory() && e.name.startsWith("slot-"));
-      const metadataPath = path25.join(poolDir, "metadata.json");
+      const metadataPath = path26.join(poolDir, "metadata.json");
       let metadata = null;
       try {
         const raw = await readFile7(metadataPath, "utf-8");
@@ -11935,8 +12315,8 @@ var CHECK_INTERVAL_MS = 24 * 60 * 60 * 1e3;
 var CONFIG_DIR = getAgentvConfigDir();
 var CACHE_FILE = "version-check.json";
 var NPM_REGISTRY_BASE = "https://registry.npmjs.org/agentv/";
-async function getCachedUpdateInfo(path27) {
-  const filePath = path27 ?? join5(CONFIG_DIR, CACHE_FILE);
+async function getCachedUpdateInfo(path28) {
+  const filePath = path28 ?? join5(CONFIG_DIR, CACHE_FILE);
   try {
     const raw = await readFile8(filePath, "utf-8");
     const data = JSON.parse(raw);
@@ -12030,6 +12410,7 @@ var app = subcommands({
     pipeline: pipelineCommand,
     results: resultsCommand,
     self: selfCommand,
+    skills: skillsCommand,
     serve: resultsServeCommand,
     studio: resultsServeCommand,
     inspect: inspectCommand,
@@ -12051,6 +12432,7 @@ var TOP_LEVEL_COMMANDS = /* @__PURE__ */ new Set([
   "pipeline",
   "results",
   "self",
+  "skills",
   "serve",
   "studio",
   "trend",
@@ -12095,7 +12477,7 @@ ${updateNotice}
   const processedArgv = preprocessArgv(argv);
   const cwd = process.cwd();
   const repoRoot = await findRepoRoot(cwd);
-  const sessionConfig = await loadConfig(path26.join(cwd, "_"), repoRoot);
+  const sessionConfig = await loadConfig(path27.join(cwd, "_"), repoRoot);
   const beforeSessionCommand = sessionConfig?.hooks?.before_session;
   if (beforeSessionCommand) {
     runBeforeSessionHook(beforeSessionCommand);
@@ -12108,4 +12490,4 @@ export {
   preprocessArgv,
   runCli
 };
-//# sourceMappingURL=chunk-XBUHMRX2.js.map
+//# sourceMappingURL=chunk-PH5MHKPL.js.map