npm - @agentv/core - Versions diffs - 3.8.0 → 3.9.1 - Mend

@agentv/core 3.8.0 → 3.9.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

package/dist/{chunk-3ZS3GCMI.js → chunk-PC5TLJF6.js} +1 -2
package/dist/chunk-PC5TLJF6.js.map +1 -0
package/dist/evaluation/validation/index.cjs +1 -33
package/dist/evaluation/validation/index.cjs.map +1 -1
package/dist/evaluation/validation/index.js +2 -33
package/dist/evaluation/validation/index.js.map +1 -1
package/dist/index.cjs +533 -772
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +16 -21
package/dist/index.d.ts +16 -21
package/dist/index.js +381 -619
package/dist/index.js.map +1 -1
package/package.json +1 -1
package/dist/chunk-3ZS3GCMI.js.map +0 -1

package/dist/index.js CHANGED Viewed

@@ -19,7 +19,7 @@ import {
   readTextFile,
   resolveFileReference,
   resolveTargetDefinition
-} from "./chunk-3ZS3GCMI.js";
+} from "./chunk-PC5TLJF6.js";
 import {
   AgentvProvider
 } from "./chunk-W5YDZWT4.js";
@@ -149,9 +149,9 @@ function mergeExecutionMetrics(computed, metrics) {
 }
 // src/evaluation/yaml-parser.ts
-import { readFile as readFile7 } from "node:fs/promises";
-import path8 from "node:path";
-import micromatch3 from "micromatch";
+import { readFile as readFile6 } from "node:fs/promises";
+import path7 from "node:path";
+import micromatch2 from "micromatch";
 import { parse as parse2 } from "yaml";
 // src/evaluation/loaders/agent-skills-parser.ts
@@ -225,7 +225,6 @@ function parseAgentSkillsEvals(parsed, source = "evals.json", baseDir) {
       input_segments: [{ type: "text", value: prompt }],
       expected_output: evalCase.expected_output ? [{ role: "assistant", content: evalCase.expected_output }] : [],
       reference_answer: evalCase.expected_output,
-      guideline_paths: [],
       file_paths: filePaths,
       criteria: evalCase.expected_output ?? "",
       assertions,
@@ -239,7 +238,6 @@ function parseAgentSkillsEvals(parsed, source = "evals.json", baseDir) {
 // src/evaluation/loaders/config-loader.ts
 import { readFile as readFile2 } from "node:fs/promises";
 import path3 from "node:path";
-import micromatch from "micromatch";
 import { parse } from "yaml";
 // src/evaluation/loaders/file-resolver.ts
@@ -370,15 +368,6 @@ async function loadConfig(evalFilePath, repoRoot) {
         logWarning(`Invalid required_version in ${configPath}, expected string`);
         continue;
       }
-      const guidelinePatterns = config.guideline_patterns;
-      if (guidelinePatterns !== void 0 && !Array.isArray(guidelinePatterns)) {
-        logWarning(`Invalid guideline_patterns in ${configPath}, expected array`);
-        continue;
-      }
-      if (Array.isArray(guidelinePatterns) && !guidelinePatterns.every((p) => typeof p === "string")) {
-        logWarning(`Invalid guideline_patterns in ${configPath}, all entries must be strings`);
-        continue;
-      }
       const evalPatterns = config.eval_patterns;
       if (evalPatterns !== void 0 && !Array.isArray(evalPatterns)) {
         logWarning(`Invalid eval_patterns in ${configPath}, expected array`);
@@ -394,7 +383,6 @@ async function loadConfig(evalFilePath, repoRoot) {
       );
       return {
         required_version: requiredVersion,
-        guideline_patterns: guidelinePatterns,
         eval_patterns: evalPatterns,
         execution: executionDefaults
       };
@@ -406,11 +394,6 @@ async function loadConfig(evalFilePath, repoRoot) {
   }
   return null;
 }
-function isGuidelineFile(filePath, patterns) {
-  const normalized = filePath.split("\\").join("/");
-  const patternsToUse = patterns ?? [];
-  return micromatch.isMatch(normalized, patternsToUse);
-}
 function extractTargetFromSuite(suite) {
   const execution = suite.execution;
   if (execution && typeof execution === "object" && !Array.isArray(execution)) {
@@ -437,6 +420,17 @@ function extractTargetsFromSuite(suite) {
   }
   return void 0;
 }
+function extractWorkersFromSuite(suite) {
+  const execution = suite.execution;
+  if (!execution || typeof execution !== "object" || Array.isArray(execution)) {
+    return void 0;
+  }
+  const workers = execution.workers;
+  if (typeof workers === "number" && Number.isInteger(workers) && workers >= 1 && workers <= 50) {
+    return workers;
+  }
+  return void 0;
+}
 function extractTargetsFromTestCase(testCase) {
   const execution = testCase.execution;
   if (!execution || typeof execution !== "object" || Array.isArray(execution)) {
@@ -1986,7 +1980,7 @@ function parseInlineRubrics(rawRubrics) {
 // src/evaluation/loaders/jsonl-parser.ts
 import { readFile as readFile5 } from "node:fs/promises";
 import path6 from "node:path";
-import micromatch2 from "micromatch";
+import micromatch from "micromatch";
 import { parse as parseYaml } from "yaml";
 // src/evaluation/loaders/message-processor.ts
@@ -2013,10 +2007,6 @@ function formatSegment(segment, mode = "lm") {
   if (type === "text") {
     return asString2(segment.value);
   }
-  if (type === "guideline_ref") {
-    const refPath = asString2(segment.path);
-    return refPath ? `<Attached: ${refPath}>` : void 0;
-  }
   if (type === "file") {
     const filePath = asString2(segment.path);
     if (!filePath) {
@@ -2039,9 +2029,6 @@ function hasVisibleContent(segments) {
       const value = asString2(segment.value);
       return value !== void 0 && value.trim().length > 0;
     }
-    if (type === "guideline_ref") {
-      return false;
-    }
     if (type === "file") {
       const text = asString2(segment.text);
       return text !== void 0 && text.trim().length > 0;
@@ -2057,17 +2044,7 @@ function asString2(value) {
 var ANSI_YELLOW4 = "\x1B[33m";
 var ANSI_RESET5 = "\x1B[0m";
 async function processMessages(options) {
-  const {
-    messages,
-    searchRoots,
-    repoRootPath,
-    guidelinePatterns,
-    guidelinePaths,
-    treatFileSegmentsAsGuidelines,
-    textParts,
-    messageType,
-    verbose
-  } = options;
+  const { messages, searchRoots, repoRootPath, textParts, messageType, verbose } = options;
   const segments = [];
   for (const message of messages) {
     const content = message.content;
@@ -2111,21 +2088,6 @@ async function processMessages(options) {
         }
         try {
           const fileContent = (await readFile4(resolvedPath, "utf8")).replace(/\r\n/g, "\n");
-          const classifyAsGuideline = shouldTreatAsGuideline({
-            messageType,
-            resolvedPath,
-            repoRootPath,
-            guidelinePatterns,
-            treatFileSegmentsAsGuidelines
-          });
-          if (classifyAsGuideline && guidelinePaths) {
-            guidelinePaths.push(path5.resolve(resolvedPath));
-            if (verbose) {
-              console.log(`  [Guideline] Found: ${displayPath}`);
-              console.log(`    Resolved to: ${resolvedPath}`);
-            }
-            continue;
-          }
           segments.push({
             type: "file",
             path: displayPath,
@@ -2153,26 +2115,6 @@ async function processMessages(options) {
   }
   return segments;
 }
-function shouldTreatAsGuideline(options) {
-  const {
-    messageType,
-    resolvedPath,
-    repoRootPath,
-    guidelinePatterns,
-    treatFileSegmentsAsGuidelines
-  } = options;
-  if (messageType !== "input") {
-    return false;
-  }
-  if (treatFileSegmentsAsGuidelines) {
-    return true;
-  }
-  if (!guidelinePatterns || guidelinePatterns.length === 0) {
-    return false;
-  }
-  const relativeToRepo = path5.relative(repoRootPath, resolvedPath);
-  return isGuidelineFile(relativeToRepo, guidelinePatterns);
-}
 function asString3(value) {
   return typeof value === "string" ? value : void 0;
 }
@@ -2373,7 +2315,7 @@ async function loadSidecarMetadata(jsonlPath, verbose) {
     }
     return {
       description: asString4(parsed.description),
-      dataset: asString4(parsed.dataset),
+      name: asString4(parsed.name),
       execution: isJsonObject(parsed.execution) ? parsed.execution : void 0,
       evaluator: parsed.evaluator
     };
@@ -2409,20 +2351,18 @@ async function loadTestsFromJsonl(evalFilePath, repoRoot, options) {
   const absoluteTestPath = path6.resolve(evalFilePath);
   const repoRootPath = resolveToAbsolutePath(repoRoot);
   const searchRoots = buildSearchRoots2(absoluteTestPath, repoRootPath);
-  const config = await loadConfig(absoluteTestPath, repoRootPath);
-  const guidelinePatterns = config?.guideline_patterns;
   const sidecar = await loadSidecarMetadata(absoluteTestPath, verbose);
   const rawFile = await readFile5(absoluteTestPath, "utf8");
   const rawCases = parseJsonlContent(rawFile, evalFilePath);
-  const fallbackDataset = path6.basename(absoluteTestPath, ".jsonl") || "eval";
-  const datasetName = sidecar.dataset && sidecar.dataset.trim().length > 0 ? sidecar.dataset : fallbackDataset;
+  const fallbackEvalSet = path6.basename(absoluteTestPath, ".jsonl") || "eval";
+  const evalSetName = sidecar.name && sidecar.name.trim().length > 0 ? sidecar.name : fallbackEvalSet;
   const globalEvaluator = coerceEvaluator(sidecar.evaluator, "sidecar") ?? "llm-grader";
   const globalExecution = sidecar.execution;
   if (verbose) {
     console.log(`
 [JSONL Dataset: ${evalFilePath}]`);
     console.log(`  Cases: ${rawCases.length}`);
-    console.log(`  Dataset name: ${datasetName}`);
+    console.log(`  Eval set: ${evalSetName}`);
     if (sidecar.description) {
       console.log(`  Description: ${sidecar.description}`);
     }
@@ -2432,7 +2372,7 @@ async function loadTestsFromJsonl(evalFilePath, repoRoot, options) {
     const evalcase = rawCases[lineIndex];
     const lineNumber = lineIndex + 1;
     const id = asString4(evalcase.id);
-    if (filterPattern && (!id || !micromatch2.isMatch(id, filterPattern))) {
+    if (filterPattern && (!id || !micromatch.isMatch(id, filterPattern))) {
       continue;
     }
     const conversationId = asString4(evalcase.conversation_id);
@@ -2455,14 +2395,11 @@ async function loadTestsFromJsonl(evalFilePath, repoRoot, options) {
       continue;
     }
     const hasExpectedMessages = expectedMessages.length > 0;
-    const guidelinePaths = [];
     const inputTextParts = [];
     const inputSegments = await processMessages({
       messages: inputMessages,
       searchRoots,
       repoRootPath,
-      guidelinePatterns,
-      guidelinePaths,
       textParts: inputTextParts,
       messageType: "input",
       verbose
@@ -2512,40 +2449,20 @@ async function loadTestsFromJsonl(evalFilePath, repoRoot, options) {
         userFilePaths.push(segment.resolvedPath);
       }
     }
-    const allFilePaths = [
-      ...guidelinePaths.map((guidelinePath) => path6.resolve(guidelinePath)),
-      ...userFilePaths
-    ];
     const testCase = {
       id,
-      dataset: datasetName,
+      eval_set: evalSetName,
       conversation_id: conversationId,
       question,
       input: inputMessages,
       input_segments: inputSegments,
       expected_output: outputSegments,
       reference_answer: referenceAnswer,
-      guideline_paths: guidelinePaths.map((guidelinePath) => path6.resolve(guidelinePath)),
-      guideline_patterns: guidelinePatterns,
-      file_paths: allFilePaths,
+      file_paths: userFilePaths,
       criteria: outcome ?? "",
       evaluator: evalCaseEvaluatorKind,
       assertions: evaluators
     };
-    if (verbose) {
-      console.log(`
-[Test: ${id}]`);
-      if (testCase.guideline_paths.length > 0) {
-        console.log(`  Guidelines used: ${testCase.guideline_paths.length}`);
-        for (const guidelinePath of testCase.guideline_paths) {
-          console.log(`    - ${guidelinePath}`);
-        }
-      } else if (!guidelinePatterns || guidelinePatterns.length === 0) {
-        console.log("  No guidelines found (guideline_patterns not configured)");
-      } else {
-        console.log("  No guidelines found");
-      }
-    }
     results.push(testCase);
   }
   return results;
@@ -2603,30 +2520,7 @@ function parseMetadata(suite) {
 }
 // src/evaluation/formatting/prompt-builder.ts
-import { readFile as readFile6 } from "node:fs/promises";
-import path7 from "node:path";
-var ANSI_YELLOW6 = "\x1B[33m";
-var ANSI_RESET7 = "\x1B[0m";
 async function buildPromptInputs(testCase, mode = "lm") {
-  const guidelineParts = [];
-  for (const rawPath of testCase.guideline_paths) {
-    const absolutePath = path7.resolve(rawPath);
-    if (!await fileExists2(absolutePath)) {
-      logWarning5(`Could not read guideline file ${absolutePath}: file does not exist`);
-      continue;
-    }
-    try {
-      const content = (await readFile6(absolutePath, "utf8")).replace(/\r\n/g, "\n").trim();
-      guidelineParts.push({
-        content,
-        isFile: true,
-        displayPath: path7.basename(absolutePath)
-      });
-    } catch (error) {
-      logWarning5(`Could not read guideline file ${absolutePath}: ${error.message}`);
-    }
-  }
-  const guidelines = formatFileContents(guidelineParts);
   const segmentsByMessage = [];
   const fileContentsByPath = /* @__PURE__ */ new Map();
   for (const segment of testCase.input_segments) {
@@ -2651,10 +2545,6 @@ async function buildPromptInputs(testCase, mode = "lm") {
           if (type === "file") {
             const value = asString5(segment.value);
             if (!value) continue;
-            if (testCase.guideline_patterns && isGuidelineFile(value, testCase.guideline_patterns)) {
-              messageSegments.push({ type: "guideline_ref", path: value });
-              continue;
-            }
             const fileText = fileContentsByPath.get(value);
             if (fileText !== void 0) {
               messageSegments.push({ type: "file", text: fileText, path: value });
@@ -2703,10 +2593,6 @@ ${messageContent}`);
   } else {
     const questionParts = [];
     for (const segment of testCase.input_segments) {
-      if (segment.type === "file" && typeof segment.path === "string" && testCase.guideline_patterns && isGuidelineFile(segment.path, testCase.guideline_patterns)) {
-        questionParts.push(`<Attached: ${segment.path}>`);
-        continue;
-      }
       const formattedContent = formatSegment(segment, mode);
       if (formattedContent) {
         questionParts.push(formattedContent);
@@ -2717,11 +2603,9 @@ ${messageContent}`);
   const chatPrompt = useRoleMarkers ? buildChatPromptFromSegments({
     messages: testCase.input,
     segmentsByMessage,
-    guidelinePatterns: testCase.guideline_patterns,
-    guidelineContent: guidelines,
     mode
   }) : void 0;
-  return { question, guidelines, chatPrompt };
+  return { question, chatPrompt };
 }
 function needsRoleMarkers(messages, processedSegmentsByMessage) {
   if (messages.some((msg) => msg.role === "assistant" || msg.role === "tool")) {
@@ -2736,14 +2620,7 @@ function needsRoleMarkers(messages, processedSegmentsByMessage) {
   return messagesWithContent > 1;
 }
 function buildChatPromptFromSegments(options) {
-  const {
-    messages,
-    segmentsByMessage,
-    guidelinePatterns,
-    guidelineContent,
-    systemPrompt,
-    mode = "lm"
-  } = options;
+  const { messages, segmentsByMessage, systemPrompt, mode = "lm" } = options;
   if (messages.length === 0) {
     return void 0;
   }
@@ -2751,11 +2628,6 @@ function buildChatPromptFromSegments(options) {
   if (systemPrompt && systemPrompt.trim().length > 0) {
     systemSegments.push(systemPrompt.trim());
   }
-  if (guidelineContent && guidelineContent.trim().length > 0) {
-    systemSegments.push(`[[ ## Guidelines ## ]]
-${guidelineContent.trim()}`);
-  }
   let startIndex = 0;
   while (startIndex < messages.length && messages[startIndex].role === "system") {
     const segments = segmentsByMessage[startIndex];
@@ -2791,15 +2663,8 @@ ${guidelineContent.trim()}`);
       contentParts.push("@[Tool]:");
     }
     for (const segment of segments) {
-      if (segment.type === "guideline_ref") {
-        continue;
-      }
       const formatted = formatSegment(segment, mode);
       if (formatted) {
-        const isGuidelineRef = segment.type === "file" && typeof segment.path === "string" && guidelinePatterns && isGuidelineFile(segment.path, guidelinePatterns);
-        if (isGuidelineRef) {
-          continue;
-        }
         contentParts.push(formatted);
       }
     }
@@ -2817,30 +2682,27 @@ ${guidelineContent.trim()}`);
 function asString5(value) {
   return typeof value === "string" ? value : void 0;
 }
-function logWarning5(message) {
-  console.warn(`${ANSI_YELLOW6}Warning: ${message}${ANSI_RESET7}`);
-}
 // src/evaluation/yaml-parser.ts
-var ANSI_YELLOW7 = "\x1B[33m";
+var ANSI_YELLOW6 = "\x1B[33m";
 var ANSI_RED3 = "\x1B[31m";
-var ANSI_RESET8 = "\x1B[0m";
+var ANSI_RESET7 = "\x1B[0m";
 function resolveTests(suite) {
   if (suite.tests !== void 0) return suite.tests;
   if (suite.eval_cases !== void 0) {
-    logWarning6("'eval_cases' is deprecated. Use 'tests' instead.");
+    logWarning5("'eval_cases' is deprecated. Use 'tests' instead.");
     return suite.eval_cases;
   }
   if (suite.evalcases !== void 0) {
-    logWarning6("'evalcases' is deprecated. Use 'tests' instead.");
+    logWarning5("'evalcases' is deprecated. Use 'tests' instead.");
     return suite.evalcases;
   }
   return void 0;
 }
 async function readTestSuiteMetadata(testFilePath) {
   try {
-    const absolutePath = path8.resolve(testFilePath);
-    const content = await readFile7(absolutePath, "utf8");
+    const absolutePath = path7.resolve(testFilePath);
+    const content = await readFile6(absolutePath, "utf8");
     const parsed = interpolateEnv(parse2(content), process.env);
     if (!isJsonObject(parsed)) {
       return {};
@@ -2869,6 +2731,7 @@ async function loadTestSuite(evalFilePath, repoRoot, options) {
     tests,
     trials: extractTrialsConfig(parsed),
     targets: extractTargetsFromSuite(parsed),
+    workers: extractWorkersFromSuite(parsed),
     cacheConfig: extractCacheConfig(parsed),
     totalBudgetUsd: extractTotalBudgetUsd(parsed),
     ...metadata !== void 0 && { metadata },
@@ -2891,26 +2754,25 @@ var loadEvalCases = loadTests;
 async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
   const verbose = options?.verbose ?? false;
   const filterPattern = options?.filter;
-  const absoluteTestPath = path8.resolve(evalFilePath);
+  const absoluteTestPath = path7.resolve(evalFilePath);
   const repoRootPath = resolveToAbsolutePath(repoRoot);
   const searchRoots = buildSearchRoots2(absoluteTestPath, repoRootPath);
   const config = await loadConfig(absoluteTestPath, repoRootPath);
-  const guidelinePatterns = config?.guideline_patterns;
-  const rawFile = await readFile7(absoluteTestPath, "utf8");
+  const rawFile = await readFile6(absoluteTestPath, "utf8");
   const interpolated = interpolateEnv(parse2(rawFile), process.env);
   if (!isJsonObject(interpolated)) {
     throw new Error(`Invalid test file format: ${evalFilePath}`);
   }
   const suite = interpolated;
-  const datasetNameFromSuite = asString6(suite.dataset)?.trim();
-  const fallbackDataset = path8.basename(absoluteTestPath).replace(/\.ya?ml$/i, "") || "eval";
-  const datasetName = datasetNameFromSuite && datasetNameFromSuite.length > 0 ? datasetNameFromSuite : fallbackDataset;
+  const evalSetNameFromSuite = asString6(suite.name)?.trim();
+  const fallbackEvalSet = path7.basename(absoluteTestPath).replace(/\.ya?ml$/i, "") || "eval";
+  const evalSetName = evalSetNameFromSuite && evalSetNameFromSuite.length > 0 ? evalSetNameFromSuite : fallbackEvalSet;
   const rawTestcases = resolveTests(suite);
   const globalEvaluator = coerceEvaluator(suite.evaluator, "global") ?? "llm-grader";
-  const evalFileDir = path8.dirname(absoluteTestPath);
+  const evalFileDir = path7.dirname(absoluteTestPath);
   let expandedTestcases;
   if (typeof rawTestcases === "string") {
-    const externalPath = path8.resolve(evalFileDir, rawTestcases);
+    const externalPath = path7.resolve(evalFileDir, rawTestcases);
     expandedTestcases = await loadCasesFromFile(externalPath);
   } else if (Array.isArray(rawTestcases)) {
     expandedTestcases = await expandFileReferences(rawTestcases, evalFileDir);
@@ -2924,18 +2786,18 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
   const _globalTarget = asString6(rawGlobalExecution?.target) ?? asString6(suite.target);
   const suiteAssertions = suite.assertions ?? suite.assert;
   if (suite.assert !== void 0 && suite.assertions === void 0) {
-    logWarning6("'assert' is deprecated at the suite level. Use 'assertions' instead.");
+    logWarning5("'assert' is deprecated at the suite level. Use 'assertions' instead.");
   }
   const globalExecution = suiteAssertions !== void 0 ? { ...rawGlobalExecution ?? {}, assertions: suiteAssertions } : rawGlobalExecution;
   const results = [];
   for (const rawEvalcase of expandedTestcases) {
     if (!isJsonObject(rawEvalcase)) {
-      logWarning6("Skipping invalid test entry (expected object)");
+      logWarning5("Skipping invalid test entry (expected object)");
       continue;
     }
     const evalcase = rawEvalcase;
     const id = asString6(evalcase.id);
-    if (filterPattern && (!id || !micromatch3.isMatch(id, filterPattern))) {
+    if (filterPattern && (!id || !micromatch2.isMatch(id, filterPattern))) {
       continue;
     }
     const conversationId = asString6(evalcase.conversation_id);
@@ -2943,7 +2805,7 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
     if (!outcome && evalcase.expected_outcome !== void 0) {
       outcome = asString6(evalcase.expected_outcome);
       if (outcome) {
-        logWarning6(
+        logWarning5(
           `Test '${asString6(evalcase.id) ?? "unknown"}': 'expected_outcome' is deprecated. Use 'criteria' instead.`
         );
       }
@@ -2963,15 +2825,11 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
     const effectiveSuiteInputMessages = suiteInputMessages && !skipDefaults ? suiteInputMessages : void 0;
     const inputMessages = effectiveSuiteInputMessages ? [...effectiveSuiteInputMessages, ...testInputMessages] : testInputMessages;
     const hasExpectedMessages = expectedMessages.length > 0;
-    const guidelinePaths = [];
     const inputTextParts = [];
     const suiteInputSegments = effectiveSuiteInputMessages ? await processMessages({
       messages: effectiveSuiteInputMessages,
       searchRoots,
       repoRootPath,
-      guidelinePatterns,
-      guidelinePaths,
-      treatFileSegmentsAsGuidelines: true,
       textParts: inputTextParts,
       messageType: "input",
       verbose
@@ -2980,8 +2838,6 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
       messages: testInputMessages,
       searchRoots,
       repoRootPath,
-      guidelinePatterns,
-      guidelinePaths,
       textParts: inputTextParts,
       messageType: "input",
       verbose
@@ -3030,26 +2886,20 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
         userFilePaths.push(segment.resolvedPath);
       }
     }
-    const allFilePaths = [
-      ...guidelinePaths.map((guidelinePath) => path8.resolve(guidelinePath)),
-      ...userFilePaths
-    ];
     const caseWorkspace = await resolveWorkspaceConfig(evalcase.workspace, evalFileDir);
     const mergedWorkspace = mergeWorkspaceConfigs(suiteWorkspace, caseWorkspace);
     const metadata = isJsonObject(evalcase.metadata) ? evalcase.metadata : void 0;
     const caseTargets = extractTargetsFromTestCase(evalcase);
     const testCase = {
       id,
-      dataset: datasetName,
+      eval_set: evalSetName,
       conversation_id: conversationId,
       question,
       input: inputMessages,
       input_segments: inputSegments,
       expected_output: outputSegments,
       reference_answer: referenceAnswer,
-      guideline_paths: guidelinePaths.map((guidelinePath) => path8.resolve(guidelinePath)),
-      guideline_patterns: guidelinePatterns,
-      file_paths: allFilePaths,
+      file_paths: userFilePaths,
       criteria: outcome ?? "",
       evaluator: evalCaseEvaluatorKind,
       assertions: evaluators,
@@ -3057,20 +2907,6 @@ async function loadTestsFromYaml(evalFilePath, repoRoot, options) {
       metadata,
       targets: caseTargets
     };
-    if (verbose) {
-      console.log(`
-[Test: ${id}]`);
-      if (testCase.guideline_paths.length > 0) {
-        console.log(`  Guidelines used: ${testCase.guideline_paths.length}`);
-        for (const guidelinePath of testCase.guideline_paths) {
-          console.log(`    - ${guidelinePath}`);
-        }
-      } else if (!guidelinePatterns || guidelinePatterns.length === 0) {
-        console.log("  No guidelines found (guideline_patterns not configured)");
-      } else {
-        console.log("  No guidelines found");
-      }
-    }
     results.push(testCase);
   }
   return { tests: results, parsed: suite };
@@ -3089,7 +2925,7 @@ function parseWorkspaceScriptConfig(raw, evalFileDir) {
   if (!isJsonObject(raw)) return void 0;
   const obj = raw;
   if (obj.script !== void 0 && obj.command === void 0) {
-    logWarning6("'script' is deprecated. Use 'command' instead.");
+    logWarning5("'script' is deprecated. Use 'command' instead.");
   }
   const commandSource = obj.command ?? obj.script;
   if (!Array.isArray(commandSource) || commandSource.length === 0) return void 0;
@@ -3097,8 +2933,8 @@ function parseWorkspaceScriptConfig(raw, evalFileDir) {
   if (commandArr.length === 0) return void 0;
   const timeoutMs = typeof obj.timeout_ms === "number" ? obj.timeout_ms : void 0;
   let cwd = typeof obj.cwd === "string" ? obj.cwd : void 0;
-  if (cwd && !path8.isAbsolute(cwd)) {
-    cwd = path8.resolve(evalFileDir, cwd);
+  if (cwd && !path7.isAbsolute(cwd)) {
+    cwd = path7.resolve(evalFileDir, cwd);
   }
   const config = { command: commandArr };
   if (timeoutMs !== void 0) {
@@ -3188,10 +3024,10 @@ function parseWorkspaceHooksConfig(raw, evalFileDir) {
 }
 async function resolveWorkspaceConfig(raw, evalFileDir) {
   if (typeof raw === "string") {
-    const workspaceFilePath = path8.resolve(evalFileDir, raw);
+    const workspaceFilePath = path7.resolve(evalFileDir, raw);
     let content;
     try {
-      content = await readFile7(workspaceFilePath, "utf8");
+      content = await readFile6(workspaceFilePath, "utf8");
     } catch {
       throw new Error(`Workspace file not found: ${raw} (resolved to ${workspaceFilePath})`);
     }
@@ -3201,7 +3037,7 @@ async function resolveWorkspaceConfig(raw, evalFileDir) {
         `Invalid workspace file format: ${workspaceFilePath} (expected a YAML object)`
       );
     }
-    const workspaceFileDir = path8.dirname(workspaceFilePath);
+    const workspaceFileDir = path7.dirname(workspaceFilePath);
     return parseWorkspaceConfig(parsed, workspaceFileDir);
   }
   return parseWorkspaceConfig(raw, evalFileDir);
@@ -3221,8 +3057,8 @@ function parseWorkspaceConfig(raw, evalFileDir) {
     throw new Error("workspace.static has been removed. Use workspace.mode='static'.");
   }
   let template = typeof obj.template === "string" ? obj.template : void 0;
-  if (template && !path8.isAbsolute(template)) {
-    template = path8.resolve(evalFileDir, template);
+  if (template && !path7.isAbsolute(template)) {
+    template = path7.resolve(evalFileDir, template);
   }
   const isolation = obj.isolation === "shared" || obj.isolation === "per_test" ? obj.isolation : void 0;
   const repos = Array.isArray(obj.repos) ? obj.repos.map(parseRepoConfig).filter(Boolean) : void 0;
@@ -3272,28 +3108,28 @@ function mergeWorkspaceConfigs(suiteLevel, caseLevel) {
 function asString6(value) {
   return typeof value === "string" ? value : void 0;
 }
-function logWarning6(message, details) {
+function logWarning5(message, details) {
   if (details && details.length > 0) {
     const detailBlock = details.join("\n");
-    console.warn(`${ANSI_YELLOW7}Warning: ${message}
-${detailBlock}${ANSI_RESET8}`);
+    console.warn(`${ANSI_YELLOW6}Warning: ${message}
+${detailBlock}${ANSI_RESET7}`);
   } else {
-    console.warn(`${ANSI_YELLOW7}Warning: ${message}${ANSI_RESET8}`);
+    console.warn(`${ANSI_YELLOW6}Warning: ${message}${ANSI_RESET7}`);
   }
 }
 function logError3(message, details) {
   if (details && details.length > 0) {
     const detailBlock = details.join("\n");
     console.error(`${ANSI_RED3}Error: ${message}
-${detailBlock}${ANSI_RESET8}`);
+${detailBlock}${ANSI_RESET7}`);
   } else {
-    console.error(`${ANSI_RED3}Error: ${message}${ANSI_RESET8}`);
+    console.error(`${ANSI_RED3}Error: ${message}${ANSI_RESET7}`);
   }
 }
 // src/evaluation/loaders/eval-yaml-transpiler.ts
 import { readFileSync } from "node:fs";
-import path9 from "node:path";
+import path8 from "node:path";
 import { parse as parse3 } from "yaml";
 function codeGraderInstruction(graderName, description) {
   const desc = description ? ` This grader: ${description}.` : "";
@@ -3538,7 +3374,7 @@ function transpileEvalYaml(suite, source = "EVAL.yaml") {
 function transpileEvalYamlFile(evalYamlPath) {
   const content = readFileSync(evalYamlPath, "utf8");
   const parsed = parse3(content);
-  return transpileEvalYaml(parsed, path9.basename(evalYamlPath));
+  return transpileEvalYaml(parsed, path8.basename(evalYamlPath));
 }
 function getOutputFilenames(result) {
   const names = /* @__PURE__ */ new Map();
@@ -3773,10 +3609,10 @@ function buildChatPrompt(request) {
     if (hasSystemMessage) {
       return provided;
     }
-    const systemContent2 = resolveSystemContent(request, false);
+    const systemContent2 = resolveSystemContent(request);
     return [{ role: "system", content: systemContent2 }, ...provided];
   }
-  const systemContent = resolveSystemContent(request, true);
+  const systemContent = resolveSystemContent(request);
   const userContent = request.question.trim();
   const prompt = [
     { role: "system", content: systemContent },
@@ -3784,18 +3620,13 @@ function buildChatPrompt(request) {
   ];
   return prompt;
 }
-function resolveSystemContent(request, includeGuidelines) {
+function resolveSystemContent(request) {
   const systemSegments = [];
   if (request.systemPrompt && request.systemPrompt.trim().length > 0) {
     systemSegments.push(request.systemPrompt.trim());
   } else {
     systemSegments.push(DEFAULT_SYSTEM_PROMPT);
   }
-  if (includeGuidelines && request.guidelines && request.guidelines.trim().length > 0) {
-    systemSegments.push(`[[ ## Guidelines ## ]]
-${request.guidelines.trim()}`);
-  }
   return systemSegments.join("\n\n");
 }
 function toModelMessages(chatPrompt) {
@@ -3979,7 +3810,7 @@ import { spawn } from "node:child_process";
 import { randomUUID } from "node:crypto";
 import { createWriteStream } from "node:fs";
 import { mkdir } from "node:fs/promises";
-import path11 from "node:path";
+import path10 from "node:path";
 // src/evaluation/providers/claude-log-tracker.ts
 var GLOBAL_LOGS_KEY = Symbol.for("agentv.claudeLogs");
@@ -4035,17 +3866,11 @@ function subscribeToClaudeLogEntries(listener) {
 }
 // src/evaluation/providers/preread.ts
-import path10 from "node:path";
-function buildPromptDocument(request, inputFiles, options) {
+import path9 from "node:path";
+function buildPromptDocument(request, inputFiles) {
   const parts = [];
-  const guidelineFiles = collectGuidelineFiles(
-    inputFiles,
-    options?.guidelinePatterns ?? request.guideline_patterns,
-    options?.guidelineOverrides
-  );
   const inputFilesList = collectInputFiles(inputFiles);
-  const nonGuidelineInputFiles = inputFilesList.filter((file) => !guidelineFiles.includes(file));
-  const prereadBlock = buildMandatoryPrereadBlock(guidelineFiles, nonGuidelineInputFiles);
+  const prereadBlock = buildMandatoryPrereadBlock(inputFilesList);
   if (prereadBlock.length > 0) {
     parts.push("\n", prereadBlock);
   }
@@ -4058,62 +3883,36 @@ function normalizeInputFiles(inputFiles) {
   }
   const deduped = /* @__PURE__ */ new Map();
   for (const inputFile of inputFiles) {
-    const absolutePath = path10.resolve(inputFile);
+    const absolutePath = path9.resolve(inputFile);
     if (!deduped.has(absolutePath)) {
       deduped.set(absolutePath, absolutePath);
     }
   }
   return Array.from(deduped.values());
 }
-function collectGuidelineFiles(inputFiles, guidelinePatterns, overrides) {
-  if (!inputFiles || inputFiles.length === 0) {
-    return [];
-  }
-  const unique = /* @__PURE__ */ new Map();
-  for (const inputFile of inputFiles) {
-    const absolutePath = path10.resolve(inputFile);
-    if (overrides?.has(absolutePath)) {
-      if (!unique.has(absolutePath)) {
-        unique.set(absolutePath, absolutePath);
-      }
-      continue;
-    }
-    const normalized = absolutePath.split(path10.sep).join("/");
-    if (isGuidelineFile(normalized, guidelinePatterns)) {
-      if (!unique.has(absolutePath)) {
-        unique.set(absolutePath, absolutePath);
-      }
-    }
-  }
-  return Array.from(unique.values());
-}
 function collectInputFiles(inputFiles) {
   if (!inputFiles || inputFiles.length === 0) {
     return [];
   }
   const unique = /* @__PURE__ */ new Map();
   for (const inputFile of inputFiles) {
-    const absolutePath = path10.resolve(inputFile);
+    const absolutePath = path9.resolve(inputFile);
     if (!unique.has(absolutePath)) {
       unique.set(absolutePath, absolutePath);
     }
   }
   return Array.from(unique.values());
 }
-function buildMandatoryPrereadBlock(guidelineFiles, inputFiles) {
-  if (guidelineFiles.length === 0 && inputFiles.length === 0) {
+function buildMandatoryPrereadBlock(inputFiles) {
+  if (inputFiles.length === 0) {
     return "";
   }
   const buildList = (files) => files.map((absolutePath) => {
-    const fileName = path10.basename(absolutePath);
+    const fileName = path9.basename(absolutePath);
     const fileUri = pathToFileUri(absolutePath);
     return `* [${fileName}](${fileUri})`;
   });
   const sections = [];
-  if (guidelineFiles.length > 0) {
-    sections.push(`Read all guideline files:
-${buildList(guidelineFiles).join("\n")}.`);
-  }
   if (inputFiles.length > 0) {
     sections.push(`Read all input files:
 ${buildList(inputFiles).join("\n")}.`);
@@ -4125,7 +3924,7 @@ ${buildList(inputFiles).join("\n")}.`);
   return sections.join("\n");
 }
 function pathToFileUri(filePath) {
-  const absolutePath = path10.isAbsolute(filePath) ? filePath : path10.resolve(filePath);
+  const absolutePath = path9.isAbsolute(filePath) ? filePath : path9.resolve(filePath);
   const normalizedPath = absolutePath.replace(/\\/g, "/");
   if (/^[a-zA-Z]:\//.test(normalizedPath)) {
     return `file:///${normalizedPath}`;
@@ -4272,10 +4071,10 @@ var ClaudeCliProvider = class {
   }
   resolveCwd(cwdOverride) {
     if (cwdOverride) {
-      return path11.resolve(cwdOverride);
+      return path10.resolve(cwdOverride);
     }
     if (this.config.cwd) {
-      return path11.resolve(this.config.cwd);
+      return path10.resolve(this.config.cwd);
     }
     return void 0;
   }
@@ -4285,9 +4084,9 @@ var ClaudeCliProvider = class {
       return void 0;
     }
     if (this.config.logDir) {
-      return path11.resolve(this.config.logDir);
+      return path10.resolve(this.config.logDir);
     }
-    return path11.join(process.cwd(), ".agentv", "logs", "claude-cli");
+    return path10.join(process.cwd(), ".agentv", "logs", "claude-cli");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -4301,7 +4100,7 @@ var ClaudeCliProvider = class {
       console.warn(`Skipping Claude CLI stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path11.join(logDir, buildLogFilename(request, this.targetName));
+    const filePath = path10.join(logDir, buildLogFilename(request, this.targetName));
     try {
       const logger = await ClaudeCliStreamLogger.create({
         filePath,
@@ -4622,7 +4421,7 @@ function tryParseJson(line) {
 import { randomUUID as randomUUID2 } from "node:crypto";
 import { createWriteStream as createWriteStream2 } from "node:fs";
 import { mkdir as mkdir2 } from "node:fs/promises";
-import path12 from "node:path";
+import path11 from "node:path";
 var claudeSdkModule = null;
 async function loadClaudeSdk() {
   if (!claudeSdkModule) {
@@ -4782,10 +4581,10 @@ var ClaudeSdkProvider = class {
   }
   resolveCwd(cwdOverride) {
     if (cwdOverride) {
-      return path12.resolve(cwdOverride);
+      return path11.resolve(cwdOverride);
     }
     if (this.config.cwd) {
-      return path12.resolve(this.config.cwd);
+      return path11.resolve(this.config.cwd);
     }
     return void 0;
   }
@@ -4795,9 +4594,9 @@ var ClaudeSdkProvider = class {
       return void 0;
     }
     if (this.config.logDir) {
-      return path12.resolve(this.config.logDir);
+      return path11.resolve(this.config.logDir);
     }
-    return path12.join(process.cwd(), ".agentv", "logs", "claude");
+    return path11.join(process.cwd(), ".agentv", "logs", "claude");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -4811,7 +4610,7 @@ var ClaudeSdkProvider = class {
       console.warn(`Skipping Claude stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path12.join(logDir, buildLogFilename2(request, this.targetName));
+    const filePath = path11.join(logDir, buildLogFilename2(request, this.targetName));
     try {
       const logger = await ClaudeStreamLogger.create({
         filePath,
@@ -5018,7 +4817,7 @@ function formatElapsed2(startedAt) {
 import { exec as execWithCallback } from "node:child_process";
 import fs from "node:fs/promises";
 import os from "node:os";
-import path13 from "node:path";
+import path12 from "node:path";
 import { promisify } from "node:util";
 import { z as z2 } from "zod";
 var ToolCallSchema = z2.object({
@@ -5227,7 +5026,6 @@ var CliProvider = class {
     const { values: templateValues, promptFilePath } = await buildTemplateValues(
       {
         question: "",
-        guidelines: "",
         inputFiles: batchInputFiles,
         evalCaseId: "batch",
         attempt: 0
@@ -5460,7 +5258,6 @@ var CliProvider = class {
     const { values: templateValues, promptFilePath } = await buildTemplateValues(
       {
         question: "",
-        guidelines: "",
         inputFiles: [],
         evalCaseId: "healthcheck",
         attempt: 0
@@ -5501,7 +5298,6 @@ async function buildTemplateValues(request, config, outputFilePath) {
     values: {
       PROMPT: shellEscape(request.question ?? ""),
       PROMPT_FILE: shellEscape(promptFilePath),
-      GUIDELINES: shellEscape(request.guidelines ?? ""),
       EVAL_ID: shellEscape(request.evalCaseId ?? ""),
       ATTEMPT: shellEscape(String(request.attempt ?? 0)),
       FILES: formatFileList(inputFiles, config.filesFormat),
@@ -5523,7 +5319,7 @@ function normalizeInputFiles2(inputFiles) {
   }
   const unique = /* @__PURE__ */ new Map();
   for (const inputFile of inputFiles) {
-    const absolutePath = path13.resolve(inputFile);
+    const absolutePath = path12.resolve(inputFile);
     if (!unique.has(absolutePath)) {
       unique.set(absolutePath, absolutePath);
     }
@@ -5537,7 +5333,7 @@ function formatFileList(files, template) {
   const formatter = template ?? "{path}";
   return files.map((filePath) => {
     const escapedPath = shellEscape(filePath);
-    const escapedName = shellEscape(path13.basename(filePath));
+    const escapedName = shellEscape(path12.basename(filePath));
     return formatter.replaceAll("{path}", escapedPath).replaceAll("{basename}", escapedName);
   }).join(" ");
 }
@@ -5561,7 +5357,7 @@ function generateOutputFilePath(evalCaseId, extension = ".json") {
   const safeEvalId = evalCaseId || "unknown";
   const timestamp = Date.now();
   const random = Math.random().toString(36).substring(2, 9);
-  return path13.join(os.tmpdir(), `agentv-${safeEvalId}-${timestamp}-${random}${extension}`);
+  return path12.join(os.tmpdir(), `agentv-${safeEvalId}-${timestamp}-${random}${extension}`);
 }
 function formatTimeoutSuffix2(timeoutMs) {
   if (!timeoutMs || timeoutMs <= 0) {
@@ -5575,7 +5371,7 @@ function formatTimeoutSuffix2(timeoutMs) {
 import { randomUUID as randomUUID3 } from "node:crypto";
 import { createWriteStream as createWriteStream3 } from "node:fs";
 import { mkdir as mkdir3 } from "node:fs/promises";
-import path14 from "node:path";
+import path13 from "node:path";
 // src/evaluation/providers/codex-log-tracker.ts
 var GLOBAL_LOGS_KEY2 = Symbol.for("agentv.codexLogs");
@@ -5810,10 +5606,10 @@ ${basePrompt}` : basePrompt;
   }
   resolveCwd(cwdOverride) {
     if (cwdOverride) {
-      return path14.resolve(cwdOverride);
+      return path13.resolve(cwdOverride);
     }
     if (this.config.cwd) {
-      return path14.resolve(this.config.cwd);
+      return path13.resolve(this.config.cwd);
     }
     return void 0;
   }
@@ -5823,9 +5619,9 @@ ${basePrompt}` : basePrompt;
       return void 0;
     }
     if (this.config.logDir) {
-      return path14.resolve(this.config.logDir);
+      return path13.resolve(this.config.logDir);
     }
-    return path14.join(process.cwd(), ".agentv", "logs", "codex");
+    return path13.join(process.cwd(), ".agentv", "logs", "codex");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -5839,7 +5635,7 @@ ${basePrompt}` : basePrompt;
       console.warn(`Skipping Codex SDK stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path14.join(logDir, buildLogFilename3(request, this.targetName));
+    const filePath = path13.join(logDir, buildLogFilename3(request, this.targetName));
     try {
       const logger = await CodexSdkStreamLogger.create({
         filePath,
@@ -5983,7 +5779,7 @@ function formatElapsed3(startedAt) {
 // src/evaluation/providers/copilot-cli.ts
 import { randomUUID as randomUUID5 } from "node:crypto";
 import { mkdir as mkdir4 } from "node:fs/promises";
-import path16 from "node:path";
+import path15 from "node:path";
 import { Readable, Writable } from "node:stream";
 import { spawn as spawn2 } from "node:child_process";
 import * as acp from "@agentclientprotocol/sdk";
@@ -6045,7 +5841,7 @@ function subscribeToCopilotCliLogEntries(listener) {
 import { randomUUID as randomUUID4 } from "node:crypto";
 import { createWriteStream as createWriteStream4, existsSync, readdirSync } from "node:fs";
 import { arch, platform } from "node:os";
-import path15 from "node:path";
+import path14 from "node:path";
 import { fileURLToPath as fileURLToPath2 } from "node:url";
 function resolvePlatformCliPath() {
   const os3 = platform();
@@ -6069,7 +5865,7 @@ function resolvePlatformCliPath() {
   try {
     const resolved = import.meta.resolve(`${packageName}/package.json`);
     const packageJsonPath = resolved.startsWith("file:") ? fileURLToPath2(resolved) : resolved;
-    const binaryPath = path15.join(path15.dirname(packageJsonPath), binaryName);
+    const binaryPath = path14.join(path14.dirname(packageJsonPath), binaryName);
     if (existsSync(binaryPath)) {
       return binaryPath;
     }
@@ -6077,7 +5873,7 @@ function resolvePlatformCliPath() {
   }
   let searchDir = process.cwd();
   for (let i = 0; i < 10; i++) {
-    const standardPath = path15.join(
+    const standardPath = path14.join(
       searchDir,
       "node_modules",
       ...packageName.split("/"),
@@ -6086,13 +5882,13 @@ function resolvePlatformCliPath() {
     if (existsSync(standardPath)) {
       return standardPath;
     }
-    const bunDir = path15.join(searchDir, "node_modules", ".bun");
+    const bunDir = path14.join(searchDir, "node_modules", ".bun");
     const prefix = `@github+copilot-${osPart}-${archPart}@`;
     try {
       const entries = readdirSync(bunDir);
       for (const entry of entries) {
         if (entry.startsWith(prefix)) {
-          const candidate = path15.join(
+          const candidate = path14.join(
             bunDir,
             entry,
             "node_modules",
@@ -6107,7 +5903,7 @@ function resolvePlatformCliPath() {
       }
     } catch {
     }
-    const parent = path15.dirname(searchDir);
+    const parent = path14.dirname(searchDir);
     if (parent === searchDir) break;
     searchDir = parent;
   }
@@ -6445,10 +6241,10 @@ var CopilotCliProvider = class {
   }
   resolveCwd(cwdOverride) {
     if (cwdOverride) {
-      return path16.resolve(cwdOverride);
+      return path15.resolve(cwdOverride);
     }
     if (this.config.cwd) {
-      return path16.resolve(this.config.cwd);
+      return path15.resolve(this.config.cwd);
     }
     return void 0;
   }
@@ -6467,9 +6263,9 @@ var CopilotCliProvider = class {
       return void 0;
     }
     if (this.config.logDir) {
-      return path16.resolve(this.config.logDir);
+      return path15.resolve(this.config.logDir);
     }
-    return path16.join(process.cwd(), ".agentv", "logs", "copilot-cli");
+    return path15.join(process.cwd(), ".agentv", "logs", "copilot-cli");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -6483,7 +6279,7 @@ var CopilotCliProvider = class {
       console.warn(`Skipping Copilot CLI stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path16.join(logDir, buildLogFilename4(request, this.targetName, "copilot-cli"));
+    const filePath = path15.join(logDir, buildLogFilename4(request, this.targetName, "copilot-cli"));
     try {
       const logger = await CopilotStreamLogger.create(
         {
@@ -6578,7 +6374,7 @@ function summarizeAcpEvent(eventType, data) {
 // src/evaluation/providers/copilot-sdk.ts
 import { randomUUID as randomUUID6 } from "node:crypto";
 import { mkdir as mkdir5 } from "node:fs/promises";
-import path17 from "node:path";
+import path16 from "node:path";
 // src/evaluation/providers/copilot-sdk-log-tracker.ts
 var GLOBAL_LOGS_KEY4 = Symbol.for("agentv.copilotSdkLogs");
@@ -6857,10 +6653,10 @@ var CopilotSdkProvider = class {
   }
   resolveCwd(cwdOverride) {
     if (cwdOverride) {
-      return path17.resolve(cwdOverride);
+      return path16.resolve(cwdOverride);
     }
     if (this.config.cwd) {
-      return path17.resolve(this.config.cwd);
+      return path16.resolve(this.config.cwd);
     }
     return void 0;
   }
@@ -6869,9 +6665,9 @@ var CopilotSdkProvider = class {
       return void 0;
     }
     if (this.config.logDir) {
-      return path17.resolve(this.config.logDir);
+      return path16.resolve(this.config.logDir);
     }
-    return path17.join(process.cwd(), ".agentv", "logs", "copilot-sdk");
+    return path16.join(process.cwd(), ".agentv", "logs", "copilot-sdk");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -6885,7 +6681,7 @@ var CopilotSdkProvider = class {
       console.warn(`Skipping Copilot SDK stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path17.join(logDir, buildLogFilename4(request, this.targetName, "copilot-sdk"));
+    const filePath = path16.join(logDir, buildLogFilename4(request, this.targetName, "copilot-sdk"));
     try {
       const logger = await CopilotStreamLogger.create(
         {
@@ -6962,8 +6758,7 @@ var MockProvider = class {
     return {
       output: [{ role: "assistant", content: this.cannedResponse }],
       raw: {
-        question: request.question,
-        guidelines: request.guidelines
+        question: request.question
       }
     };
   }
@@ -7241,7 +7036,7 @@ import { randomUUID as randomUUID7 } from "node:crypto";
 import { createWriteStream as createWriteStream5 } from "node:fs";
 import { mkdir as mkdir6, mkdtemp, rm, writeFile } from "node:fs/promises";
 import { tmpdir } from "node:os";
-import path18 from "node:path";
+import path17 from "node:path";
 // src/evaluation/providers/pi-log-tracker.ts
 var GLOBAL_LOGS_KEY5 = Symbol.for("agentv.piLogs");
@@ -7322,7 +7117,7 @@ var PiCodingAgentProvider = class {
     const workspaceRoot = await this.createWorkspace();
     const logger = await this.createStreamLogger(request).catch(() => void 0);
     try {
-      const promptFile = path18.join(workspaceRoot, PROMPT_FILENAME);
+      const promptFile = path17.join(workspaceRoot, PROMPT_FILENAME);
       await writeFile(promptFile, request.question, "utf8");
       const args = this.buildPiArgs(request.question, inputFiles, request.captureFileChanges);
       const cwd = this.resolveCwd(workspaceRoot, request.cwd);
@@ -7384,12 +7179,12 @@ var PiCodingAgentProvider = class {
   }
   resolveCwd(workspaceRoot, cwdOverride) {
     if (cwdOverride) {
-      return path18.resolve(cwdOverride);
+      return path17.resolve(cwdOverride);
     }
     if (!this.config.cwd) {
       return workspaceRoot;
     }
-    return path18.resolve(this.config.cwd);
+    return path17.resolve(this.config.cwd);
   }
   buildPiArgs(prompt, inputFiles, _captureFileChanges) {
     const args = [];
@@ -7478,7 +7273,7 @@ ${prompt}` : prompt;
     return env;
   }
   async createWorkspace() {
-    return await mkdtemp(path18.join(tmpdir(), WORKSPACE_PREFIX));
+    return await mkdtemp(path17.join(tmpdir(), WORKSPACE_PREFIX));
   }
   async cleanupWorkspace(workspaceRoot) {
     try {
@@ -7488,9 +7283,9 @@ ${prompt}` : prompt;
   }
   resolveLogDirectory() {
     if (this.config.logDir) {
-      return path18.resolve(this.config.logDir);
+      return path17.resolve(this.config.logDir);
     }
-    return path18.join(process.cwd(), ".agentv", "logs", "pi-coding-agent");
+    return path17.join(process.cwd(), ".agentv", "logs", "pi-coding-agent");
   }
   async createStreamLogger(request) {
     const logDir = this.resolveLogDirectory();
@@ -7504,7 +7299,7 @@ ${prompt}` : prompt;
       console.warn(`Skipping Pi stream logging (could not create ${logDir}): ${message}`);
       return void 0;
     }
-    const filePath = path18.join(logDir, buildLogFilename5(request, this.targetName));
+    const filePath = path17.join(logDir, buildLogFilename5(request, this.targetName));
     try {
       const logger = await PiStreamLogger.create({
         filePath,
@@ -8005,17 +7800,17 @@ var ProviderRegistry = class {
 // src/evaluation/providers/vscode-provider.ts
 import { exec as exec2 } from "node:child_process";
 import { constants as constants3, access as access3, stat as stat4 } from "node:fs/promises";
-import path30 from "node:path";
+import path29 from "node:path";
 import { promisify as promisify3 } from "node:util";
 // src/evaluation/providers/vscode/dispatch/agentDispatch.ts
 import { stat as stat3, writeFile as writeFile4 } from "node:fs/promises";
-import path28 from "node:path";
+import path27 from "node:path";
 // src/evaluation/providers/vscode/utils/fs.ts
 import { constants as constants2 } from "node:fs";
 import { access as access2, mkdir as mkdir7, readdir, rm as rm2, stat } from "node:fs/promises";
-import path19 from "node:path";
+import path18 from "node:path";
 async function pathExists(target) {
   try {
     await access2(target, constants2.F_OK);
@@ -8031,7 +7826,7 @@ async function readDirEntries(target) {
   const entries = await readdir(target, { withFileTypes: true });
   return entries.map((entry) => ({
     name: entry.name,
-    absolutePath: path19.join(target, entry.name),
+    absolutePath: path18.join(target, entry.name),
     isDirectory: entry.isDirectory()
   }));
 }
@@ -8046,9 +7841,9 @@ async function removeIfExists(target) {
 }
 // src/evaluation/providers/vscode/utils/path.ts
-import path20 from "node:path";
+import path19 from "node:path";
 function pathToFileUri2(filePath) {
-  const absolutePath = path20.isAbsolute(filePath) ? filePath : path20.resolve(filePath);
+  const absolutePath = path19.isAbsolute(filePath) ? filePath : path19.resolve(filePath);
   const normalizedPath = absolutePath.replace(/\\/g, "/");
   if (/^[a-zA-Z]:\//.test(normalizedPath)) {
     return `file:///${normalizedPath}`;
@@ -8057,7 +7852,7 @@ function pathToFileUri2(filePath) {
 }
 // src/evaluation/providers/vscode/dispatch/promptBuilder.ts
-import path21 from "node:path";
+import path20 from "node:path";
 // src/evaluation/providers/vscode/utils/template.ts
 function renderTemplate2(content, variables) {
@@ -8149,8 +7944,8 @@ function createBatchRequestPrompt(userQuery, responseFileTmp, responseFileFinal,
   });
 }
 function createBatchOrchestratorPrompt(requestFiles, responseFiles, templateContent) {
-  const requestLines = requestFiles.map((file, index) => `${index + 1}. messages/${path21.basename(file)}`).join("\n");
-  const responseList = responseFiles.map((file) => `"${path21.basename(file)}"`).join(", ");
+  const requestLines = requestFiles.map((file, index) => `${index + 1}. messages/${path20.basename(file)}`).join("\n");
+  const responseList = responseFiles.map((file) => `"${path20.basename(file)}"`).join(", ");
   return renderTemplate2(templateContent, {
     requestFiles: requestLines,
     responseList
@@ -8158,8 +7953,8 @@ function createBatchOrchestratorPrompt(requestFiles, responseFiles, templateCont
 }
 // src/evaluation/providers/vscode/dispatch/responseWaiter.ts
-import { readFile as readFile8 } from "node:fs/promises";
-import path22 from "node:path";
+import { readFile as readFile7 } from "node:fs/promises";
+import path21 from "node:path";
 // src/evaluation/providers/vscode/utils/time.ts
 function sleep2(ms) {
@@ -8197,7 +7992,7 @@ async function waitForResponseOutput(responseFileFinal, pollInterval = 1e3, sile
   const maxAttempts = 10;
   while (attempts < maxAttempts) {
     try {
-      const content = await readFile8(responseFileFinal, { encoding: "utf8" });
+      const content = await readFile7(responseFileFinal, { encoding: "utf8" });
       if (!silent) {
         process.stdout.write(`${content}
 `);
@@ -8218,7 +8013,7 @@ async function waitForResponseOutput(responseFileFinal, pollInterval = 1e3, sile
 }
 async function waitForBatchResponses(responseFilesFinal, pollInterval = 1e3, silent = false, timeoutMs = DEFAULT_TIMEOUT_MS) {
   if (!silent) {
-    const fileList = responseFilesFinal.map((file) => path22.basename(file)).join(", ");
+    const fileList = responseFilesFinal.map((file) => path21.basename(file)).join(", ");
     console.error(`waiting for ${responseFilesFinal.length} batch response(s): ${fileList}`);
   }
   const deadline = Date.now() + timeoutMs;
@@ -8227,7 +8022,7 @@ async function waitForBatchResponses(responseFilesFinal, pollInterval = 1e3, sil
     while (pending.size > 0) {
       if (Date.now() >= deadline) {
         if (!silent) {
-          const remaining = [...pending].map((f) => path22.basename(f)).join(", ");
+          const remaining = [...pending].map((f) => path21.basename(f)).join(", ");
           console.error(
             `error: timed out after ${Math.round(timeoutMs / 1e3)}s waiting for batch responses. Still pending: ${remaining}`
           );
@@ -8254,7 +8049,7 @@ async function waitForBatchResponses(responseFilesFinal, pollInterval = 1e3, sil
     const maxAttempts = 10;
     while (attempts < maxAttempts) {
       try {
-        const content = await readFile8(file, { encoding: "utf8" });
+        const content = await readFile7(file, { encoding: "utf8" });
         if (!silent) {
           process.stdout.write(`${content}
 `);
@@ -8278,15 +8073,15 @@ async function waitForBatchResponses(responseFilesFinal, pollInterval = 1e3, sil
 // src/evaluation/providers/vscode/dispatch/vscodeProcess.ts
 import { exec, spawn as spawn4 } from "node:child_process";
 import { mkdir as mkdir8, writeFile as writeFile2 } from "node:fs/promises";
-import path25 from "node:path";
+import path24 from "node:path";
 import { promisify as promisify2 } from "node:util";
 // src/evaluation/providers/vscode/dispatch/constants.ts
-import path24 from "node:path";
+import path23 from "node:path";
 // src/paths.ts
 import os2 from "node:os";
-import path23 from "node:path";
+import path22 from "node:path";
 var logged = false;
 function getAgentvHome() {
   const envHome = process.env.AGENTV_HOME;
@@ -8297,19 +8092,19 @@ function getAgentvHome() {
     }
     return envHome;
   }
-  return path23.join(os2.homedir(), ".agentv");
+  return path22.join(os2.homedir(), ".agentv");
 }
 function getWorkspacesRoot() {
-  return path23.join(getAgentvHome(), "workspaces");
+  return path22.join(getAgentvHome(), "workspaces");
 }
 function getSubagentsRoot() {
-  return path23.join(getAgentvHome(), "subagents");
+  return path22.join(getAgentvHome(), "subagents");
 }
 function getTraceStateRoot() {
-  return path23.join(getAgentvHome(), "trace-state");
+  return path22.join(getAgentvHome(), "trace-state");
 }
 function getWorkspacePoolRoot() {
-  return path23.join(getAgentvHome(), "workspace-pool");
+  return path22.join(getAgentvHome(), "workspace-pool");
 }
 // src/evaluation/providers/vscode/dispatch/constants.ts
@@ -8317,7 +8112,7 @@ var DEFAULT_LOCK_NAME = "subagent.lock";
 var DEFAULT_ALIVE_FILENAME = ".alive";
 function getDefaultSubagentRoot(vscodeCmd = "code") {
   const folder = vscodeCmd === "code-insiders" ? "vscode-insiders-agents" : "vscode-agents";
-  return path24.join(getSubagentsRoot(), folder);
+  return path23.join(getSubagentsRoot(), folder);
 }
 var DEFAULT_SUBAGENT_ROOT = getDefaultSubagentRoot();
@@ -8384,11 +8179,11 @@ async function ensureWorkspaceFocused(workspacePath, workspaceName, subagentDir,
     await raceSpawnError(child);
     return true;
   }
-  const aliveFile = path25.join(subagentDir, DEFAULT_ALIVE_FILENAME);
+  const aliveFile = path24.join(subagentDir, DEFAULT_ALIVE_FILENAME);
   await removeIfExists(aliveFile);
-  const githubAgentsDir = path25.join(subagentDir, ".github", "agents");
+  const githubAgentsDir = path24.join(subagentDir, ".github", "agents");
   await mkdir8(githubAgentsDir, { recursive: true });
-  const wakeupDst = path25.join(githubAgentsDir, "wakeup.md");
+  const wakeupDst = path24.join(githubAgentsDir, "wakeup.md");
   await writeFile2(wakeupDst, DEFAULT_WAKEUP_CONTENT, "utf8");
   const workspaceChild = spawnVsCode(vscodeCmd, [workspacePath], {
     label: "open-workspace"
@@ -8401,7 +8196,7 @@ async function ensureWorkspaceFocused(workspacePath, workspaceName, subagentDir,
     "chat",
     "-m",
     wakeupChatId,
-    `create a file named .alive in the ${path25.basename(subagentDir)} folder`
+    `create a file named .alive in the ${path24.basename(subagentDir)} folder`
   ];
   const wakeupChild = spawnVsCode(vscodeCmd, chatArgs, { label: "send-wakeup-chat" });
   await raceSpawnError(wakeupChild);
@@ -8416,10 +8211,10 @@ async function ensureWorkspaceFocused(workspacePath, workspaceName, subagentDir,
   return true;
 }
 async function launchVsCodeWithChat(subagentDir, chatId, attachmentPaths, requestInstructions, timestamp, vscodeCmd) {
-  const workspacePath = path25.join(subagentDir, `${path25.basename(subagentDir)}.code-workspace`);
-  const messagesDir = path25.join(subagentDir, "messages");
+  const workspacePath = path24.join(subagentDir, `${path24.basename(subagentDir)}.code-workspace`);
+  const messagesDir = path24.join(subagentDir, "messages");
   await mkdir8(messagesDir, { recursive: true });
-  const reqFile = path25.join(messagesDir, `${timestamp}_req.md`);
+  const reqFile = path24.join(messagesDir, `${timestamp}_req.md`);
   await writeFile2(reqFile, requestInstructions, { encoding: "utf8" });
   const reqUri = pathToFileUri2(reqFile);
   const chatArgs = ["-r", "chat", "-m", chatId];
@@ -8427,16 +8222,16 @@ async function launchVsCodeWithChat(subagentDir, chatId, attachmentPaths, reques
     chatArgs.push("-a", attachment);
   }
   chatArgs.push("-a", reqFile);
-  chatArgs.push(`Follow instructions in [${path25.basename(reqFile)}](${reqUri})`);
+  chatArgs.push(`Follow instructions in [${path24.basename(reqFile)}](${reqUri})`);
   const workspaceReady = await ensureWorkspaceFocused(
     workspacePath,
-    path25.basename(subagentDir),
+    path24.basename(subagentDir),
     subagentDir,
     vscodeCmd
   );
   if (!workspaceReady) {
     throw new Error(
-      `VS Code workspace '${path25.basename(subagentDir)}' failed to become ready within the timeout. Check that '${vscodeCmd}' can open workspaces.`
+      `VS Code workspace '${path24.basename(subagentDir)}' failed to become ready within the timeout. Check that '${vscodeCmd}' can open workspaces.`
     );
   }
   await sleep2(500);
@@ -8444,8 +8239,8 @@ async function launchVsCodeWithChat(subagentDir, chatId, attachmentPaths, reques
   await raceSpawnError(child);
 }
 async function launchVsCodeWithBatchChat(subagentDir, chatId, attachmentPaths, chatInstruction, vscodeCmd) {
-  const workspacePath = path25.join(subagentDir, `${path25.basename(subagentDir)}.code-workspace`);
-  const messagesDir = path25.join(subagentDir, "messages");
+  const workspacePath = path24.join(subagentDir, `${path24.basename(subagentDir)}.code-workspace`);
+  const messagesDir = path24.join(subagentDir, "messages");
   await mkdir8(messagesDir, { recursive: true });
   const chatArgs = ["-r", "chat", "-m", chatId];
   for (const attachment of attachmentPaths) {
@@ -8454,13 +8249,13 @@ async function launchVsCodeWithBatchChat(subagentDir, chatId, attachmentPaths, c
   chatArgs.push(chatInstruction);
   const workspaceReady = await ensureWorkspaceFocused(
     workspacePath,
-    path25.basename(subagentDir),
+    path24.basename(subagentDir),
     subagentDir,
     vscodeCmd
   );
   if (!workspaceReady) {
     throw new Error(
-      `VS Code workspace '${path25.basename(subagentDir)}' failed to become ready within the timeout. Check that '${vscodeCmd}' can open workspaces.`
+      `VS Code workspace '${path24.basename(subagentDir)}' failed to become ready within the timeout. Check that '${vscodeCmd}' can open workspaces.`
     );
   }
   await sleep2(500);
@@ -8469,11 +8264,11 @@ async function launchVsCodeWithBatchChat(subagentDir, chatId, attachmentPaths, c
 }
 // src/evaluation/providers/vscode/dispatch/workspaceManager.ts
-import { copyFile, mkdir as mkdir9, readFile as readFile9, readdir as readdir2, stat as stat2, writeFile as writeFile3 } from "node:fs/promises";
-import path27 from "node:path";
+import { copyFile, mkdir as mkdir9, readFile as readFile8, readdir as readdir2, stat as stat2, writeFile as writeFile3 } from "node:fs/promises";
+import path26 from "node:path";
 // src/evaluation/providers/vscode/utils/workspace.ts
-import path26 from "node:path";
+import path25 from "node:path";
 import JSON5 from "json5";
 function transformWorkspacePaths(workspaceContent, templateDir) {
   let workspace;
@@ -8490,10 +8285,10 @@ function transformWorkspacePaths(workspaceContent, templateDir) {
   }
   const transformedFolders = workspace.folders.map((folder) => {
     const folderPath = folder.path;
-    if (path26.isAbsolute(folderPath)) {
+    if (path25.isAbsolute(folderPath)) {
       return folder;
     }
-    const absolutePath = path26.resolve(templateDir, folderPath);
+    const absolutePath = path25.resolve(templateDir, folderPath);
     return {
       ...folder,
       path: absolutePath
@@ -8515,19 +8310,19 @@ function transformWorkspacePaths(workspaceContent, templateDir) {
       if (locationMap && typeof locationMap === "object") {
         const transformedMap = {};
         for (const [locationPath, value] of Object.entries(locationMap)) {
-          const isAbsolute = path26.isAbsolute(locationPath);
+          const isAbsolute = path25.isAbsolute(locationPath);
           if (isAbsolute) {
             transformedMap[locationPath] = value;
           } else {
             const firstGlobIndex = locationPath.search(/[*]/);
             if (firstGlobIndex === -1) {
-              const resolvedPath = path26.resolve(templateDir, locationPath).replace(/\\/g, "/");
+              const resolvedPath = path25.resolve(templateDir, locationPath).replace(/\\/g, "/");
               transformedMap[resolvedPath] = value;
             } else {
               const basePathEnd = locationPath.lastIndexOf("/", firstGlobIndex);
               const basePath = basePathEnd !== -1 ? locationPath.substring(0, basePathEnd) : ".";
               const patternPath = locationPath.substring(basePathEnd !== -1 ? basePathEnd : 0);
-              const resolvedPath = (path26.resolve(templateDir, basePath) + patternPath).replace(
+              const resolvedPath = (path25.resolve(templateDir, basePath) + patternPath).replace(
                 /\\/g,
                 "/"
               );
@@ -8568,7 +8363,7 @@ async function findUnlockedSubagent(subagentRoot) {
     number: Number.parseInt(entry.name.split("-")[1] ?? "", 10)
   })).filter((entry) => Number.isInteger(entry.number)).sort((a, b) => a.number - b.number);
   for (const subagent of subagents) {
-    const lockFile = path27.join(subagent.absolutePath, DEFAULT_LOCK_NAME);
+    const lockFile = path26.join(subagent.absolutePath, DEFAULT_LOCK_NAME);
     if (!await pathExists(lockFile)) {
       return subagent.absolutePath;
     }
@@ -8578,7 +8373,7 @@ async function findUnlockedSubagent(subagentRoot) {
 async function copyAgentConfig(subagentDir, workspaceTemplate, cwd) {
   let workspaceContent;
   if (workspaceTemplate) {
-    const workspaceSrc = path27.resolve(workspaceTemplate);
+    const workspaceSrc = path26.resolve(workspaceTemplate);
     if (!await pathExists(workspaceSrc)) {
       throw new Error(`workspace template not found: ${workspaceSrc}`);
     }
@@ -8586,18 +8381,18 @@ async function copyAgentConfig(subagentDir, workspaceTemplate, cwd) {
     if (!stats.isFile()) {
       throw new Error(`workspace template must be a file, not a directory: ${workspaceSrc}`);
     }
-    const templateText = await readFile9(workspaceSrc, "utf8");
+    const templateText = await readFile8(workspaceSrc, "utf8");
     workspaceContent = JSON.parse(templateText);
   } else {
     workspaceContent = DEFAULT_WORKSPACE_TEMPLATE;
   }
-  const workspaceName = `${path27.basename(subagentDir)}.code-workspace`;
-  const workspaceDst = path27.join(subagentDir, workspaceName);
-  const templateDir = workspaceTemplate ? path27.dirname(path27.resolve(workspaceTemplate)) : subagentDir;
+  const workspaceName = `${path26.basename(subagentDir)}.code-workspace`;
+  const workspaceDst = path26.join(subagentDir, workspaceName);
+  const templateDir = workspaceTemplate ? path26.dirname(path26.resolve(workspaceTemplate)) : subagentDir;
   const workspaceJson = JSON.stringify(workspaceContent, null, 2);
   let transformedContent = transformWorkspacePaths(workspaceJson, templateDir);
   if (cwd) {
-    const absCwd = path27.resolve(cwd);
+    const absCwd = path26.resolve(cwd);
     const parsed = JSON.parse(transformedContent);
     const alreadyPresent = parsed.folders.some((f) => f.path === absCwd);
     if (!alreadyPresent) {
@@ -8606,35 +8401,35 @@ async function copyAgentConfig(subagentDir, workspaceTemplate, cwd) {
     }
   }
   await writeFile3(workspaceDst, transformedContent, "utf8");
-  const messagesDir = path27.join(subagentDir, "messages");
+  const messagesDir = path26.join(subagentDir, "messages");
   await mkdir9(messagesDir, { recursive: true });
   return { workspace: workspaceDst, messagesDir };
 }
 async function createSubagentLock(subagentDir) {
-  const messagesDir = path27.join(subagentDir, "messages");
+  const messagesDir = path26.join(subagentDir, "messages");
   if (await pathExists(messagesDir)) {
     const files = await readdir2(messagesDir);
     await Promise.all(
       files.map(async (file) => {
-        const target = path27.join(messagesDir, file);
+        const target = path26.join(messagesDir, file);
         await removeIfExists(target);
       })
     );
   }
-  const githubAgentsDir = path27.join(subagentDir, ".github", "agents");
+  const githubAgentsDir = path26.join(subagentDir, ".github", "agents");
   if (await pathExists(githubAgentsDir)) {
     const agentFiles = await readdir2(githubAgentsDir);
     const preservedFiles = /* @__PURE__ */ new Set(["wakeup.md", "subagent.md"]);
     await Promise.all(
-      agentFiles.filter((file) => file.endsWith(".md") && !preservedFiles.has(file)).map((file) => removeIfExists(path27.join(githubAgentsDir, file)))
+      agentFiles.filter((file) => file.endsWith(".md") && !preservedFiles.has(file)).map((file) => removeIfExists(path26.join(githubAgentsDir, file)))
     );
   }
-  const lockFile = path27.join(subagentDir, DEFAULT_LOCK_NAME);
+  const lockFile = path26.join(subagentDir, DEFAULT_LOCK_NAME);
   await writeFile3(lockFile, "", { encoding: "utf8" });
   return lockFile;
 }
 async function removeSubagentLock(subagentDir) {
-  const lockFile = path27.join(subagentDir, DEFAULT_LOCK_NAME);
+  const lockFile = path26.join(subagentDir, DEFAULT_LOCK_NAME);
   await removeIfExists(lockFile);
 }
 async function prepareSubagentDirectory(subagentDir, promptFile, chatId, workspaceTemplate, dryRun, cwd) {
@@ -8654,9 +8449,9 @@ async function prepareSubagentDirectory(subagentDir, promptFile, chatId, workspa
     return 1;
   }
   if (promptFile) {
-    const githubAgentsDir = path27.join(subagentDir, ".github", "agents");
+    const githubAgentsDir = path26.join(subagentDir, ".github", "agents");
     await mkdir9(githubAgentsDir, { recursive: true });
-    const agentFile = path27.join(githubAgentsDir, `${chatId}.md`);
+    const agentFile = path26.join(githubAgentsDir, `${chatId}.md`);
     try {
       await copyFile(promptFile, agentFile);
     } catch (error) {
@@ -8675,7 +8470,7 @@ async function resolvePromptFile(promptFile) {
   if (!promptFile) {
     return void 0;
   }
-  const resolvedPrompt = path28.resolve(promptFile);
+  const resolvedPrompt = path27.resolve(promptFile);
   if (!await pathExists(resolvedPrompt)) {
     throw new Error(`Prompt file not found: ${resolvedPrompt}`);
   }
@@ -8691,7 +8486,7 @@ async function resolveAttachments(extraAttachments) {
   }
   const resolved = [];
   for (const attachment of extraAttachments) {
-    const resolvedPath = path28.resolve(attachment);
+    const resolvedPath = path27.resolve(attachment);
     if (!await pathExists(resolvedPath)) {
       throw new Error(`Attachment not found: ${resolvedPath}`);
     }
@@ -8733,7 +8528,7 @@ async function dispatchAgentSession(options) {
         error: "No unlocked subagents available. Provision additional subagents with: subagent code provision --subagents <desired_total>"
       };
     }
-    const subagentName = path28.basename(subagentDir);
+    const subagentName = path27.basename(subagentDir);
     const chatId = Math.random().toString(16).slice(2, 10);
     const preparationResult = await prepareSubagentDirectory(
       subagentDir,
@@ -8761,9 +8556,9 @@ async function dispatchAgentSession(options) {
       };
     }
     const timestamp = generateTimestamp();
-    const messagesDir = path28.join(subagentDir, "messages");
-    const responseFileTmp = path28.join(messagesDir, `${timestamp}_res.tmp.md`);
-    const responseFileFinal = path28.join(messagesDir, `${timestamp}_res.md`);
+    const messagesDir = path27.join(subagentDir, "messages");
+    const responseFileTmp = path27.join(messagesDir, `${timestamp}_res.tmp.md`);
+    const responseFileFinal = path27.join(messagesDir, `${timestamp}_res.md`);
     const requestInstructions = createRequestPrompt(
       userQuery,
       responseFileTmp,
@@ -8868,7 +8663,7 @@ async function dispatchBatchAgent(options) {
         error: "No unlocked subagents available. Provision additional subagents with: subagent code provision --subagents <desired_total>"
       };
     }
-    subagentName = path28.basename(subagentDir);
+    subagentName = path27.basename(subagentDir);
     const chatId = Math.random().toString(16).slice(2, 10);
     const preparationResult = await prepareSubagentDirectory(
       subagentDir,
@@ -8899,17 +8694,17 @@ async function dispatchBatchAgent(options) {
       };
     }
     const timestamp = generateTimestamp();
-    const messagesDir = path28.join(subagentDir, "messages");
+    const messagesDir = path27.join(subagentDir, "messages");
     requestFiles = userQueries.map(
-      (_, index) => path28.join(messagesDir, `${timestamp}_${index}_req.md`)
+      (_, index) => path27.join(messagesDir, `${timestamp}_${index}_req.md`)
     );
     const responseTmpFiles = userQueries.map(
-      (_, index) => path28.join(messagesDir, `${timestamp}_${index}_res.tmp.md`)
+      (_, index) => path27.join(messagesDir, `${timestamp}_${index}_res.tmp.md`)
     );
     responseFilesFinal = userQueries.map(
-      (_, index) => path28.join(messagesDir, `${timestamp}_${index}_res.md`)
+      (_, index) => path27.join(messagesDir, `${timestamp}_${index}_res.md`)
     );
-    const orchestratorFile = path28.join(messagesDir, `${timestamp}_orchestrator.md`);
+    const orchestratorFile = path27.join(messagesDir, `${timestamp}_orchestrator.md`);
     if (!dryRun) {
       await Promise.all(
         userQueries.map((query, index) => {
@@ -8995,7 +8790,7 @@ async function dispatchBatchAgent(options) {
 // src/evaluation/providers/vscode/dispatch/provision.ts
 import { writeFile as writeFile5 } from "node:fs/promises";
-import path29 from "node:path";
+import path28 from "node:path";
 var DEFAULT_WORKSPACE_TEMPLATE2 = {
   folders: [
     {
@@ -9026,7 +8821,7 @@ async function provisionSubagents(options) {
   if (!Number.isInteger(subagents) || subagents < 1) {
     throw new Error("subagents must be a positive integer");
   }
-  const targetPath = path29.resolve(targetRoot);
+  const targetPath = path28.resolve(targetRoot);
   if (!dryRun) {
     await ensureDir(targetPath);
   }
@@ -9046,7 +8841,7 @@ async function provisionSubagents(options) {
         continue;
       }
       highestNumber = Math.max(highestNumber, parsed);
-      const lockFile = path29.join(entry.absolutePath, lockName);
+      const lockFile = path28.join(entry.absolutePath, lockName);
       const locked = await pathExists(lockFile);
       if (locked) {
         lockedSubagents.add(entry.absolutePath);
@@ -9063,10 +8858,10 @@ async function provisionSubagents(options) {
       break;
     }
     const subagentDir = subagent.absolutePath;
-    const githubAgentsDir = path29.join(subagentDir, ".github", "agents");
-    const lockFile = path29.join(subagentDir, lockName);
-    const workspaceDst = path29.join(subagentDir, `${path29.basename(subagentDir)}.code-workspace`);
-    const wakeupDst = path29.join(githubAgentsDir, "wakeup.md");
+    const githubAgentsDir = path28.join(subagentDir, ".github", "agents");
+    const lockFile = path28.join(subagentDir, lockName);
+    const workspaceDst = path28.join(subagentDir, `${path28.basename(subagentDir)}.code-workspace`);
+    const wakeupDst = path28.join(githubAgentsDir, "wakeup.md");
     const isLocked = await pathExists(lockFile);
     if (isLocked && !force) {
       continue;
@@ -9104,10 +8899,10 @@ async function provisionSubagents(options) {
   let nextIndex = highestNumber;
   while (subagentsProvisioned < subagents) {
     nextIndex += 1;
-    const subagentDir = path29.join(targetPath, `subagent-${nextIndex}`);
-    const githubAgentsDir = path29.join(subagentDir, ".github", "agents");
-    const workspaceDst = path29.join(subagentDir, `${path29.basename(subagentDir)}.code-workspace`);
-    const wakeupDst = path29.join(githubAgentsDir, "wakeup.md");
+    const subagentDir = path28.join(targetPath, `subagent-${nextIndex}`);
+    const githubAgentsDir = path28.join(subagentDir, ".github", "agents");
+    const workspaceDst = path28.join(subagentDir, `${path28.basename(subagentDir)}.code-workspace`);
+    const wakeupDst = path28.join(githubAgentsDir, "wakeup.md");
     if (!dryRun) {
       await ensureDir(subagentDir);
       await ensureDir(githubAgentsDir);
@@ -9174,7 +8969,7 @@ var VSCodeProvider = class {
     }
     await this.ensureEnvironmentReady();
     const inputFiles = normalizeAttachments(request.inputFiles);
-    const promptContent = buildPromptDocument2(request, inputFiles, request.guideline_patterns);
+    const promptContent = buildPromptDocument2(request, inputFiles);
     const workspaceTemplate = request.workspaceFile ?? await resolveWorkspaceTemplateFile(this.config.workspaceTemplate);
     const startTime = Date.now();
     const session = await dispatchAgentSession({
@@ -9228,7 +9023,7 @@ var VSCodeProvider = class {
       normalizedRequests.map(({ inputFiles }) => inputFiles)
     );
     const userQueries = normalizedRequests.map(
-      ({ request, inputFiles }) => buildPromptDocument2(request, inputFiles, request.guideline_patterns)
+      ({ request, inputFiles }) => buildPromptDocument2(request, inputFiles)
     );
     const batchWorkspaceTemplate = await resolveWorkspaceTemplateFile(
       this.config.workspaceTemplate
@@ -9297,7 +9092,7 @@ var VSCodeProvider = class {
 async function locateVSCodeExecutable(candidate) {
   const includesPathSeparator = candidate.includes("/") || candidate.includes("\\");
   if (includesPathSeparator) {
-    const resolved = path30.isAbsolute(candidate) ? candidate : path30.resolve(candidate);
+    const resolved = path29.isAbsolute(candidate) ? candidate : path29.resolve(candidate);
     try {
       await access3(resolved, constants3.F_OK);
       return resolved;
@@ -9326,41 +9121,35 @@ async function resolveWorkspaceTemplateFile(template) {
     return void 0;
   }
   try {
-    const stats = await stat4(path30.resolve(template));
+    const stats = await stat4(path29.resolve(template));
     return stats.isFile() ? template : void 0;
   } catch {
     return template;
   }
 }
-function buildPromptDocument2(request, attachments, guidelinePatterns) {
+function buildPromptDocument2(request, attachments) {
   const parts = [];
   if (request.systemPrompt && request.systemPrompt.trim().length > 0) {
     parts.push(request.systemPrompt.trim());
   }
-  const guidelineFiles = collectGuidelineFiles2(attachments, guidelinePatterns);
   const attachmentFiles = collectAttachmentFiles(attachments);
-  const nonGuidelineAttachments = attachmentFiles.filter((file) => !guidelineFiles.includes(file));
-  const prereadBlock = buildMandatoryPrereadBlock2(guidelineFiles, nonGuidelineAttachments);
+  const prereadBlock = buildMandatoryPrereadBlock2(attachmentFiles);
   if (prereadBlock.length > 0) {
     parts.push("\n", prereadBlock);
   }
   parts.push("\n[[ ## user_query ## ]]\n", request.question.trim());
   return parts.join("\n").trim();
 }
-function buildMandatoryPrereadBlock2(guidelineFiles, attachmentFiles) {
-  if (guidelineFiles.length === 0 && attachmentFiles.length === 0) {
+function buildMandatoryPrereadBlock2(attachmentFiles) {
+  if (attachmentFiles.length === 0) {
     return "";
   }
   const buildList = (files) => files.map((absolutePath) => {
-    const fileName = path30.basename(absolutePath);
+    const fileName = path29.basename(absolutePath);
     const fileUri = pathToFileUri3(absolutePath);
     return `* [${fileName}](${fileUri})`;
   });
   const sections = [];
-  if (guidelineFiles.length > 0) {
-    sections.push(`Read all guideline files:
-${buildList(guidelineFiles).join("\n")}.`);
-  }
   if (attachmentFiles.length > 0) {
     sections.push(`Read all attachment files:
 ${buildList(attachmentFiles).join("\n")}.`);
@@ -9371,29 +9160,13 @@ ${buildList(attachmentFiles).join("\n")}.`);
   );
   return sections.join("\n");
 }
-function collectGuidelineFiles2(attachments, guidelinePatterns) {
-  if (!attachments || attachments.length === 0) {
-    return [];
-  }
-  const unique = /* @__PURE__ */ new Map();
-  for (const attachment of attachments) {
-    const absolutePath = path30.resolve(attachment);
-    const normalized = absolutePath.split(path30.sep).join("/");
-    if (isGuidelineFile(normalized, guidelinePatterns)) {
-      if (!unique.has(absolutePath)) {
-        unique.set(absolutePath, absolutePath);
-      }
-    }
-  }
-  return Array.from(unique.values());
-}
 function collectAttachmentFiles(attachments) {
   if (!attachments || attachments.length === 0) {
     return [];
   }
   const unique = /* @__PURE__ */ new Map();
   for (const attachment of attachments) {
-    const absolutePath = path30.resolve(attachment);
+    const absolutePath = path29.resolve(attachment);
     if (!unique.has(absolutePath)) {
       unique.set(absolutePath, absolutePath);
     }
@@ -9401,7 +9174,7 @@ function collectAttachmentFiles(attachments) {
   return Array.from(unique.values());
 }
 function pathToFileUri3(filePath) {
-  const absolutePath = path30.isAbsolute(filePath) ? filePath : path30.resolve(filePath);
+  const absolutePath = path29.isAbsolute(filePath) ? filePath : path29.resolve(filePath);
   const normalizedPath = absolutePath.replace(/\\/g, "/");
   if (/^[a-zA-Z]:\//.test(normalizedPath)) {
     return `file:///${normalizedPath}`;
@@ -9414,7 +9187,7 @@ function normalizeAttachments(attachments) {
   }
   const deduped = /* @__PURE__ */ new Set();
   for (const attachment of attachments) {
-    deduped.add(path30.resolve(attachment));
+    deduped.add(path29.resolve(attachment));
   }
   return Array.from(deduped);
 }
@@ -9423,7 +9196,7 @@ function mergeAttachments(all) {
   for (const list of all) {
     if (!list) continue;
     for (const inputFile of list) {
-      deduped.add(path30.resolve(inputFile));
+      deduped.add(path29.resolve(inputFile));
     }
   }
   return deduped.size > 0 ? Array.from(deduped) : void 0;
@@ -9471,8 +9244,8 @@ total unlocked subagents available: ${result.created.length + result.skippedExis
 // src/evaluation/providers/targets-file.ts
 import { constants as constants4 } from "node:fs";
-import { access as access4, readFile as readFile10 } from "node:fs/promises";
-import path31 from "node:path";
+import { access as access4, readFile as readFile9 } from "node:fs/promises";
+import path30 from "node:path";
 import { parse as parse4 } from "yaml";
 function isRecord(value) {
   return typeof value === "object" && value !== null && !Array.isArray(value);
@@ -9509,11 +9282,11 @@ async function fileExists3(filePath) {
   }
 }
 async function readTargetDefinitions(filePath) {
-  const absolutePath = path31.resolve(filePath);
+  const absolutePath = path30.resolve(filePath);
   if (!await fileExists3(absolutePath)) {
     throw new Error(`targets.yaml not found at ${absolutePath}`);
   }
-  const raw = await readFile10(absolutePath, "utf8");
+  const raw = await readFile9(absolutePath, "utf8");
   const parsed = parse4(raw);
   if (!isRecord(parsed)) {
     throw new Error(`targets.yaml at ${absolutePath} must be a YAML object with a 'targets' field`);
@@ -9529,16 +9302,16 @@ function listTargetNames(definitions) {
 }
 // src/evaluation/providers/provider-discovery.ts
-import path32 from "node:path";
+import path31 from "node:path";
 import fg from "fast-glob";
 async function discoverProviders(registry, baseDir) {
   const patterns = ["*.ts", "*.js", "*.mts", "*.mjs"];
   const candidateDirs = [];
-  let dir = path32.resolve(baseDir);
-  const root = path32.parse(dir).root;
+  let dir = path31.resolve(baseDir);
+  const root = path31.parse(dir).root;
   while (dir !== root) {
-    candidateDirs.push(path32.join(dir, ".agentv", "providers"));
-    dir = path32.dirname(dir);
+    candidateDirs.push(path31.join(dir, ".agentv", "providers"));
+    dir = path31.dirname(dir);
   }
   let files = [];
   for (const providersDir of candidateDirs) {
@@ -9554,7 +9327,7 @@ async function discoverProviders(registry, baseDir) {
   }
   const discoveredKinds = [];
   for (const filePath of files) {
-    const basename = path32.basename(filePath);
+    const basename = path31.basename(filePath);
     const kindName = basename.replace(/\.(ts|js|mts|mjs)$/, "");
     if (registry.has(kindName)) {
       continue;
@@ -9763,15 +9536,15 @@ async function execFileWithStdinNode(argv, stdinPayload, options) {
   });
 }
 async function execShellWithStdin(command, stdinPayload, options = {}) {
-  const { mkdir: mkdir15, readFile: readFile13, rm: rm6, writeFile: writeFile9 } = await import("node:fs/promises");
+  const { mkdir: mkdir15, readFile: readFile12, rm: rm6, writeFile: writeFile9 } = await import("node:fs/promises");
   const { tmpdir: tmpdir3 } = await import("node:os");
-  const path45 = await import("node:path");
+  const path44 = await import("node:path");
   const { randomUUID: randomUUID9 } = await import("node:crypto");
-  const dir = path45.join(tmpdir3(), `agentv-exec-${randomUUID9()}`);
+  const dir = path44.join(tmpdir3(), `agentv-exec-${randomUUID9()}`);
   await mkdir15(dir, { recursive: true });
-  const stdinPath = path45.join(dir, "stdin.txt");
-  const stdoutPath = path45.join(dir, "stdout.txt");
-  const stderrPath = path45.join(dir, "stderr.txt");
+  const stdinPath = path44.join(dir, "stdin.txt");
+  const stdoutPath = path44.join(dir, "stdout.txt");
+  const stderrPath = path44.join(dir, "stderr.txt");
   await writeFile9(stdinPath, stdinPayload, "utf8");
   const wrappedCommand = process.platform === "win32" ? `(${command}) < ${shellEscapePath(stdinPath)} > ${shellEscapePath(stdoutPath)} 2> ${shellEscapePath(stderrPath)}` : `(${command}) < ${shellEscapePath(stdinPath)} > ${shellEscapePath(stdoutPath)} 2> ${shellEscapePath(stderrPath)}`;
   const { spawn: spawn5 } = await import("node:child_process");
@@ -9801,8 +9574,8 @@ async function execShellWithStdin(command, stdinPayload, options = {}) {
         resolve(code ?? 0);
       });
     });
-    const stdout = (await readFile13(stdoutPath, "utf8")).replace(/\r\n/g, "\n");
-    const stderr = (await readFile13(stderrPath, "utf8")).replace(/\r\n/g, "\n");
+    const stdout = (await readFile12(stdoutPath, "utf8")).replace(/\r\n/g, "\n");
+    const stderr = (await readFile12(stderrPath, "utf8")).replace(/\r\n/g, "\n");
     return { stdout, stderr, exitCode };
   } finally {
     await rm6(dir, { recursive: true, force: true });
@@ -10119,10 +9892,7 @@ var CodeEvaluator = class {
       outputText: context.candidate,
       output: outputForPayload,
       outputPath,
-      guidelineFiles: context.evalCase.guideline_paths,
-      inputFiles: context.evalCase.file_paths.filter(
-        (path45) => !context.evalCase.guideline_paths.includes(path45)
-      ),
+      inputFiles: context.evalCase.file_paths,
       input: context.evalCase.input,
       trace: context.trace ?? null,
       tokenUsage: context.tokenUsage ?? null,
@@ -10253,7 +10023,7 @@ import { generateText as generateText3 } from "ai";
 // src/evaluation/evaluators/llm-grader.ts
 import fs2 from "node:fs/promises";
-import path33 from "node:path";
+import path32 from "node:path";
 import { generateText as generateText2, stepCountIs, tool } from "ai";
 import { z as z3 } from "zod";
 var DEFAULT_MAX_STEPS = 10;
@@ -11085,8 +10855,8 @@ function calculateScoreRangeResult(result, rubrics) {
   };
 }
 function resolveSandboxed(basePath, relativePath) {
-  const resolved = path33.resolve(basePath, relativePath);
-  if (!resolved.startsWith(basePath + path33.sep) && resolved !== basePath) {
+  const resolved = path32.resolve(basePath, relativePath);
+  if (!resolved.startsWith(basePath + path32.sep) && resolved !== basePath) {
     throw new Error(`Path '${relativePath}' is outside the workspace`);
   }
   return resolved;
@@ -11176,11 +10946,11 @@ async function searchDirectory(dirPath, workspacePath, regex, matches) {
   for (const entry of entries) {
     if (matches.length >= MAX_SEARCH_MATCHES) return;
     if (SEARCH_SKIP_DIRS.has(entry.name)) continue;
-    const fullPath = path33.join(dirPath, entry.name);
+    const fullPath = path32.join(dirPath, entry.name);
     if (entry.isDirectory()) {
       await searchDirectory(fullPath, workspacePath, regex, matches);
     } else if (entry.isFile()) {
-      const ext = path33.extname(entry.name).toLowerCase();
+      const ext = path32.extname(entry.name).toLowerCase();
       if (BINARY_EXTENSIONS.has(ext)) continue;
       try {
         const stat8 = await fs2.stat(fullPath);
@@ -11192,7 +10962,7 @@ async function searchDirectory(dirPath, workspacePath, regex, matches) {
           regex.lastIndex = 0;
           if (regex.test(lines[i])) {
             matches.push({
-              file: path33.relative(workspacePath, fullPath),
+              file: path32.relative(workspacePath, fullPath),
               line: i + 1,
               text: lines[i].substring(0, 200)
             });
@@ -11827,115 +11597,115 @@ var FieldAccuracyEvaluator = class {
    * Evaluate a single field against the expected value.
    */
   evaluateField(fieldConfig, candidateData, expectedData) {
-    const { path: path45, match, required = true, weight = 1 } = fieldConfig;
-    const candidateValue = resolvePath(candidateData, path45);
-    const expectedValue = resolvePath(expectedData, path45);
+    const { path: path44, match, required = true, weight = 1 } = fieldConfig;
+    const candidateValue = resolvePath(candidateData, path44);
+    const expectedValue = resolvePath(expectedData, path44);
     if (expectedValue === void 0) {
       return {
-        path: path45,
+        path: path44,
         score: 1,
         // No expected value means no comparison needed
         weight,
         hit: true,
-        message: `${path45}: no expected value`
+        message: `${path44}: no expected value`
       };
     }
     if (candidateValue === void 0) {
       if (required) {
         return {
-          path: path45,
+          path: path44,
           score: 0,
           weight,
           hit: false,
-          message: `${path45} (required, missing)`
+          message: `${path44} (required, missing)`
         };
       }
       return {
-        path: path45,
+        path: path44,
         score: 1,
         // Don't penalize missing optional fields
         weight: 0,
         // Zero weight means it won't affect the score
         hit: true,
-        message: `${path45}: optional field missing`
+        message: `${path44}: optional field missing`
       };
     }
     switch (match) {
       case "exact":
-        return this.compareExact(path45, candidateValue, expectedValue, weight);
+        return this.compareExact(path44, candidateValue, expectedValue, weight);
       case "numeric_tolerance":
         return this.compareNumericTolerance(
-          path45,
+          path44,
           candidateValue,
           expectedValue,
           fieldConfig,
           weight
         );
       case "date":
-        return this.compareDate(path45, candidateValue, expectedValue, fieldConfig, weight);
+        return this.compareDate(path44, candidateValue, expectedValue, fieldConfig, weight);
       default:
         return {
-          path: path45,
+          path: path44,
           score: 0,
           weight,
           hit: false,
-          message: `${path45}: unknown match type "${match}"`
+          message: `${path44}: unknown match type "${match}"`
         };
     }
   }
   /**
    * Exact equality comparison.
    */
-  compareExact(path45, candidateValue, expectedValue, weight) {
+  compareExact(path44, candidateValue, expectedValue, weight) {
     if (deepEqual(candidateValue, expectedValue)) {
       return {
-        path: path45,
+        path: path44,
         score: 1,
         weight,
         hit: true,
-        message: path45
+        message: path44
       };
     }
     if (typeof candidateValue !== typeof expectedValue) {
       return {
-        path: path45,
+        path: path44,
         score: 0,
         weight,
         hit: false,
-        message: `${path45} (type mismatch: got ${typeof candidateValue}, expected ${typeof expectedValue})`
+        message: `${path44} (type mismatch: got ${typeof candidateValue}, expected ${typeof expectedValue})`
       };
     }
     return {
-      path: path45,
+      path: path44,
       score: 0,
       weight,
       hit: false,
-      message: `${path45} (value mismatch)`
+      message: `${path44} (value mismatch)`
     };
   }
   /**
    * Numeric comparison with absolute or relative tolerance.
    */
-  compareNumericTolerance(path45, candidateValue, expectedValue, fieldConfig, weight) {
+  compareNumericTolerance(path44, candidateValue, expectedValue, fieldConfig, weight) {
     const { tolerance = 0, relative = false } = fieldConfig;
     const candidateNum = toNumber(candidateValue);
     const expectedNum = toNumber(expectedValue);
     if (candidateNum === null || expectedNum === null) {
       return {
-        path: path45,
+        path: path44,
         score: 0,
         weight,
         hit: false,
-        message: `${path45} (non-numeric value)`
+        message: `${path44} (non-numeric value)`
       };
     }
     if (!Number.isFinite(candidateNum) || !Number.isFinite(expectedNum)) {
       return {
-        path: path45,
+        path: path44,
         score: 0,
         weight,
         hit: false,
-        message: `${path45} (invalid numeric value)`
+        message: `${path44} (invalid numeric value)`
       };
     }
     const diff = Math.abs(candidateNum - expectedNum);
@@ -11948,61 +11718,61 @@ var FieldAccuracyEvaluator = class {
     }
     if (withinTolerance) {
       return {
-        path: path45,
+        path: path44,
         score: 1,
         weight,
         hit: true,
-        message: `${path45} (within tolerance: diff=${diff.toFixed(2)})`
+        message: `${path44} (within tolerance: diff=${diff.toFixed(2)})`
       };
     }
     return {
-      path: path45,
+      path: path44,
       score: 0,
       weight,
       hit: false,
-      message: `${path45} (outside tolerance: diff=${diff.toFixed(2)}, tolerance=${tolerance})`
+      message: `${path44} (outside tolerance: diff=${diff.toFixed(2)}, tolerance=${tolerance})`
     };
   }
   /**
    * Date comparison with format normalization.
    */
-  compareDate(path45, candidateValue, expectedValue, fieldConfig, weight) {
+  compareDate(path44, candidateValue, expectedValue, fieldConfig, weight) {
     const formats = fieldConfig.formats ?? DEFAULT_DATE_FORMATS;
     const candidateDate = parseDate(String(candidateValue), formats);
     const expectedDate = parseDate(String(expectedValue), formats);
     if (candidateDate === null) {
       return {
-        path: path45,
+        path: path44,
         score: 0,
         weight,
         hit: false,
-        message: `${path45} (unparseable candidate date)`
+        message: `${path44} (unparseable candidate date)`
       };
     }
     if (expectedDate === null) {
       return {
-        path: path45,
+        path: path44,
         score: 0,
         weight,
         hit: false,
-        message: `${path45} (unparseable expected date)`
+        message: `${path44} (unparseable expected date)`
       };
     }
     if (candidateDate.getFullYear() === expectedDate.getFullYear() && candidateDate.getMonth() === expectedDate.getMonth() && candidateDate.getDate() === expectedDate.getDate()) {
       return {
-        path: path45,
+        path: path44,
         score: 1,
         weight,
         hit: true,
-        message: path45
+        message: path44
       };
     }
     return {
-      path: path45,
+      path: path44,
       score: 0,
       weight,
       hit: false,
-      message: `${path45} (date mismatch: got ${formatDateISO(candidateDate)}, expected ${formatDateISO(expectedDate)})`
+      message: `${path44} (date mismatch: got ${formatDateISO(candidateDate)}, expected ${formatDateISO(expectedDate)})`
     };
   }
   /**
@@ -12035,11 +11805,11 @@ var FieldAccuracyEvaluator = class {
     };
   }
 };
-function resolvePath(obj, path45) {
-  if (!path45 || !obj) {
+function resolvePath(obj, path44) {
+  if (!path44 || !obj) {
     return void 0;
   }
-  const parts = path45.split(/\.|\[|\]/).filter((p) => p.length > 0);
+  const parts = path44.split(/\.|\[|\]/).filter((p) => p.length > 0);
   let current = obj;
   for (const part of parts) {
     if (current === null || current === void 0) {
@@ -12499,8 +12269,8 @@ var TokenUsageEvaluator = class {
 };
 // src/evaluation/evaluators/tool-trajectory.ts
-function getNestedValue(obj, path45) {
-  const parts = path45.split(".");
+function getNestedValue(obj, path44) {
+  const parts = path44.split(".");
   let current = obj;
   for (const part of parts) {
     if (current === null || current === void 0 || typeof current !== "object") {
@@ -13122,8 +12892,8 @@ function runEqualsAssertion(output, value) {
 // src/evaluation/orchestrator.ts
 import { createHash as createHash2, randomUUID as randomUUID8 } from "node:crypto";
 import { copyFile as copyFile2, mkdir as mkdir13, readdir as readdir6, stat as stat7 } from "node:fs/promises";
-import path42 from "node:path";
-import micromatch4 from "micromatch";
+import path41 from "node:path";
+import micromatch3 from "micromatch";
 // ../../node_modules/.bun/yocto-queue@1.2.2/node_modules/yocto-queue/index.js
 var Node = class {
@@ -13336,7 +13106,7 @@ var InlineAssertEvaluator = class {
 };
 // src/evaluation/evaluators/prompt-resolution.ts
-import path34 from "node:path";
+import path33 from "node:path";
 async function resolveCustomPrompt(promptConfig, context, timeoutMs) {
   if (promptConfig.resolvedPromptScript && promptConfig.resolvedPromptScript.length > 0) {
     if (!context) {
@@ -13371,10 +13141,7 @@ async function executePromptTemplate(script, context, config, timeoutMs) {
     expectedOutput: context.evalCase.expected_output,
     outputText: context.candidate,
     output: context.output ?? null,
-    guidelineFiles: context.evalCase.guideline_paths,
-    inputFiles: context.evalCase.file_paths.filter(
-      (p) => !context.evalCase.guideline_paths.includes(p)
-    ),
+    inputFiles: context.evalCase.file_paths,
     input: context.evalCase.input,
     trace: context.trace ?? null,
     fileChanges: context.fileChanges ?? null,
@@ -13385,7 +13152,7 @@ async function executePromptTemplate(script, context, config, timeoutMs) {
   };
   const inputJson = JSON.stringify(toSnakeCaseDeep(payload), null, 2);
   const scriptPath = script[script.length - 1];
-  const cwd = path34.dirname(scriptPath);
+  const cwd = path33.dirname(scriptPath);
   try {
     const stdout = await executeScript(script, inputJson, timeoutMs, cwd);
     const prompt = stdout.trim();
@@ -13657,16 +13424,16 @@ function createBuiltinRegistry() {
 }
 // src/evaluation/registry/assertion-discovery.ts
-import path35 from "node:path";
+import path34 from "node:path";
 import fg2 from "fast-glob";
 async function discoverAssertions(registry, baseDir) {
   const patterns = ["*.ts", "*.js", "*.mts", "*.mjs"];
   const candidateDirs = [];
-  let dir = path35.resolve(baseDir);
-  const root = path35.parse(dir).root;
+  let dir = path34.resolve(baseDir);
+  const root = path34.parse(dir).root;
   while (dir !== root) {
-    candidateDirs.push(path35.join(dir, ".agentv", "assertions"));
-    dir = path35.dirname(dir);
+    candidateDirs.push(path34.join(dir, ".agentv", "assertions"));
+    dir = path34.dirname(dir);
   }
   let files = [];
   for (const assertionsDir of candidateDirs) {
@@ -13682,7 +13449,7 @@ async function discoverAssertions(registry, baseDir) {
   }
   const discoveredTypes = [];
   for (const filePath of files) {
-    const basename = path35.basename(filePath);
+    const basename = path34.basename(filePath);
     const typeName = basename.replace(/\.(ts|js|mts|mjs)$/, "");
     if (registry.has(typeName)) {
       continue;
@@ -13700,17 +13467,17 @@ async function discoverAssertions(registry, baseDir) {
 }
 // src/evaluation/registry/grader-discovery.ts
-import path36 from "node:path";
+import path35 from "node:path";
 import fg3 from "fast-glob";
 async function discoverGraders(registry, baseDir) {
   const patterns = ["*.ts", "*.js", "*.mts", "*.mjs"];
   const candidateDirs = [];
-  let dir = path36.resolve(baseDir);
-  const root = path36.parse(dir).root;
+  let dir = path35.resolve(baseDir);
+  const root = path35.parse(dir).root;
   while (dir !== root) {
-    candidateDirs.push(path36.join(dir, ".agentv", "graders"));
-    candidateDirs.push(path36.join(dir, ".agentv", "judges"));
-    dir = path36.dirname(dir);
+    candidateDirs.push(path35.join(dir, ".agentv", "graders"));
+    candidateDirs.push(path35.join(dir, ".agentv", "judges"));
+    dir = path35.dirname(dir);
   }
   let files = [];
   for (const gradersDir of candidateDirs) {
@@ -13726,7 +13493,7 @@ async function discoverGraders(registry, baseDir) {
   }
   const discoveredTypes = [];
   for (const filePath of files) {
-    const basename = path36.basename(filePath);
+    const basename = path35.basename(filePath);
     const typeName = basename.replace(/\.(ts|js|mts|mjs)$/, "");
     if (registry.has(typeName)) {
       continue;
@@ -13886,7 +13653,7 @@ function getTCritical(df) {
 // src/evaluation/workspace/file-changes.ts
 import { exec as execCallback } from "node:child_process";
 import { readdirSync as readdirSync2, statSync } from "node:fs";
-import path37 from "node:path";
+import path36 from "node:path";
 import { promisify as promisify4 } from "node:util";
 var execAsync4 = promisify4(execCallback);
 function gitExecOpts(workspacePath) {
@@ -13920,10 +13687,10 @@ async function stageNestedRepoChanges(workspacePath) {
   }
   for (const entry of entries) {
     if (entry === ".git" || entry === "node_modules") continue;
-    const childPath = path37.join(workspacePath, entry);
+    const childPath = path36.join(workspacePath, entry);
     try {
       if (!statSync(childPath).isDirectory()) continue;
-      if (!statSync(path37.join(childPath, ".git")).isDirectory()) continue;
+      if (!statSync(path36.join(childPath, ".git")).isDirectory()) continue;
     } catch {
       continue;
     }
@@ -13934,7 +13701,7 @@ async function stageNestedRepoChanges(workspacePath) {
 // src/evaluation/workspace/manager.ts
 import { cp, mkdir as mkdir11, readdir as readdir3, rm as rm4, stat as stat5 } from "node:fs/promises";
-import path38 from "node:path";
+import path37 from "node:path";
 var TemplateNotFoundError = class extends Error {
   constructor(templatePath) {
     super(`Workspace template not found: ${templatePath}`);
@@ -13964,14 +13731,14 @@ async function isDirectory(filePath) {
 }
 function getWorkspacePath(evalRunId, caseId, workspaceRoot) {
   const root = workspaceRoot ?? getWorkspacesRoot();
-  return path38.join(root, evalRunId, caseId);
+  return path37.join(root, evalRunId, caseId);
 }
 async function copyDirectoryRecursive(src, dest) {
   await mkdir11(dest, { recursive: true });
   const entries = await readdir3(src, { withFileTypes: true });
   for (const entry of entries) {
-    const srcPath = path38.join(src, entry.name);
-    const destPath = path38.join(dest, entry.name);
+    const srcPath = path37.join(src, entry.name);
+    const destPath = path37.join(dest, entry.name);
     if (entry.name === ".git") {
       continue;
     }
@@ -13983,7 +13750,7 @@ async function copyDirectoryRecursive(src, dest) {
   }
 }
 async function createTempWorkspace(templatePath, evalRunId, caseId, workspaceRoot) {
-  const resolvedTemplatePath = path38.resolve(templatePath);
+  const resolvedTemplatePath = path37.resolve(templatePath);
   if (!await fileExists(resolvedTemplatePath)) {
     throw new TemplateNotFoundError(resolvedTemplatePath);
   }
@@ -14032,7 +13799,7 @@ async function cleanupWorkspace(workspacePath) {
 }
 async function cleanupEvalWorkspaces(evalRunId, workspaceRoot) {
   const root = workspaceRoot ?? getWorkspacesRoot();
-  const evalDir = path38.join(root, evalRunId);
+  const evalDir = path37.join(root, evalRunId);
   if (await fileExists(evalDir)) {
     await rm4(evalDir, { recursive: true, force: true });
   }
@@ -14042,8 +13809,8 @@ async function cleanupEvalWorkspaces(evalRunId, workspaceRoot) {
 import { execFile } from "node:child_process";
 import { createHash } from "node:crypto";
 import { existsSync as existsSync2 } from "node:fs";
-import { cp as cp2, mkdir as mkdir12, readFile as readFile11, readdir as readdir4, rm as rm5, unlink, writeFile as writeFile7 } from "node:fs/promises";
-import path39 from "node:path";
+import { cp as cp2, mkdir as mkdir12, readFile as readFile10, readdir as readdir4, rm as rm5, unlink, writeFile as writeFile7 } from "node:fs/promises";
+import path38 from "node:path";
 import { promisify as promisify5 } from "node:util";
 var execFileAsync = promisify5(execFile);
 function gitEnv() {
@@ -14097,8 +13864,8 @@ async function copyDirectoryRecursive2(src, dest, skipDirs) {
   await mkdir12(dest, { recursive: true });
   const entries = await readdir4(src, { withFileTypes: true });
   for (const entry of entries) {
-    const srcPath = path39.join(src, entry.name);
-    const destPath = path39.join(dest, entry.name);
+    const srcPath = path38.join(src, entry.name);
+    const destPath = path38.join(dest, entry.name);
     if (entry.name === ".git") {
       continue;
     }
@@ -14131,7 +13898,7 @@ var WorkspacePoolManager = class {
   async acquireWorkspace(options) {
     const { templatePath, repos, maxSlots, repoManager, poolReset } = options;
     const fingerprint = computeWorkspaceFingerprint(repos);
-    const poolDir = path39.join(this.poolRoot, fingerprint);
+    const poolDir = path38.join(this.poolRoot, fingerprint);
     await mkdir12(poolDir, { recursive: true });
     const drifted = await this.checkDrift(poolDir, fingerprint);
     if (drifted) {
@@ -14141,7 +13908,7 @@ var WorkspacePoolManager = class {
       await this.removeAllSlots(poolDir);
     }
     for (let i = 0; i < maxSlots; i++) {
-      const slotPath = path39.join(poolDir, `slot-${i}`);
+      const slotPath = path38.join(poolDir, `slot-${i}`);
       const lockPath = `${slotPath}.lock`;
       const locked = await this.tryLock(lockPath);
       if (!locked) {
@@ -14203,7 +13970,7 @@ var WorkspacePoolManager = class {
           throw err;
         }
         try {
-          const pidStr = await readFile11(lockPath, "utf-8");
+          const pidStr = await readFile10(lockPath, "utf-8");
           const pid = Number.parseInt(pidStr.trim(), 10);
           if (!Number.isNaN(pid)) {
             try {
@@ -14228,9 +13995,9 @@ var WorkspacePoolManager = class {
    * Returns false (no drift) if metadata.json doesn't exist (first use).
    */
   async checkDrift(poolDir, fingerprint) {
-    const metadataPath = path39.join(poolDir, "metadata.json");
+    const metadataPath = path38.join(poolDir, "metadata.json");
     try {
-      const raw = await readFile11(metadataPath, "utf-8");
+      const raw = await readFile10(metadataPath, "utf-8");
       const metadata = JSON.parse(raw);
       return metadata.fingerprint !== fingerprint;
     } catch {
@@ -14245,17 +14012,17 @@ var WorkspacePoolManager = class {
       repos,
       createdAt: (/* @__PURE__ */ new Date()).toISOString()
     };
-    await writeFile7(path39.join(poolDir, "metadata.json"), JSON.stringify(metadata, null, 2));
+    await writeFile7(path38.join(poolDir, "metadata.json"), JSON.stringify(metadata, null, 2));
   }
   /** Remove all slot directories and their lock files from a pool directory. */
   async removeAllSlots(poolDir) {
     const entries = await readdir4(poolDir);
     for (const entry of entries) {
       if (entry.startsWith("slot-") && !entry.endsWith(".lock")) {
-        const lockPath = path39.join(poolDir, `${entry}.lock`);
+        const lockPath = path38.join(poolDir, `${entry}.lock`);
         if (existsSync2(lockPath)) {
           try {
-            const pidStr = await readFile11(lockPath, "utf-8");
+            const pidStr = await readFile10(lockPath, "utf-8");
             const pid = Number.parseInt(pidStr.trim(), 10);
             if (!Number.isNaN(pid)) {
               try {
@@ -14268,12 +14035,12 @@ var WorkspacePoolManager = class {
           } catch {
           }
         }
-        await rm5(path39.join(poolDir, entry), { recursive: true, force: true });
+        await rm5(path38.join(poolDir, entry), { recursive: true, force: true });
         await rm5(lockPath, { force: true }).catch(() => {
         });
       }
     }
-    await rm5(path39.join(poolDir, "metadata.json"), { force: true }).catch(() => {
+    await rm5(path38.join(poolDir, "metadata.json"), { force: true }).catch(() => {
     });
   }
   /**
@@ -14283,7 +14050,7 @@ var WorkspacePoolManager = class {
    */
   async resetSlot(slotPath, templatePath, repos, poolReset = "fast") {
     for (const repo of repos) {
-      const repoDir = path39.join(slotPath, repo.path);
+      const repoDir = path38.join(slotPath, repo.path);
       if (!existsSync2(repoDir)) {
         continue;
       }
@@ -14310,7 +14077,7 @@ var WorkspacePoolManager = class {
 // src/evaluation/workspace/repo-manager.ts
 import { execFile as execFile2 } from "node:child_process";
 import { existsSync as existsSync3 } from "node:fs";
-import path40 from "node:path";
+import path39 from "node:path";
 import { promisify as promisify6 } from "node:util";
 var execFileAsync2 = promisify6(execFile2);
 var DEFAULT_TIMEOUT_MS2 = 3e5;
@@ -14410,7 +14177,7 @@ ${lines.join("\n")}`;
    * Handles checkout, ref resolution, ancestor walking, shallow clone, sparse checkout.
    */
   async materialize(repo, workspacePath) {
-    const targetDir = path40.join(workspacePath, repo.path);
+    const targetDir = path39.join(workspacePath, repo.path);
     const sourceUrl = getSourceUrl(repo.source);
     const startedAt = Date.now();
     if (this.verbose) {
@@ -14501,7 +14268,7 @@ ${lines.join("\n")}`;
   async reset(repos, workspacePath, reset) {
     const cleanFlag = reset === "strict" ? "-fdx" : "-fd";
     for (const repo of repos) {
-      const targetDir = path40.join(workspacePath, repo.path);
+      const targetDir = path39.join(workspacePath, repo.path);
       await this.runGit(["reset", "--hard", "HEAD"], { cwd: targetDir });
       await this.runGit(["clean", cleanFlag], { cwd: targetDir });
     }
@@ -14510,16 +14277,16 @@ ${lines.join("\n")}`;
 // src/evaluation/workspace/resolve.ts
 import { readdir as readdir5, stat as stat6 } from "node:fs/promises";
-import path41 from "node:path";
+import path40 from "node:path";
 async function resolveWorkspaceTemplate(templatePath) {
   if (!templatePath) {
     return void 0;
   }
-  const resolved = path41.resolve(templatePath);
+  const resolved = path40.resolve(templatePath);
   const stats = await stat6(resolved);
   if (stats.isFile()) {
     return {
-      dir: path41.dirname(resolved),
+      dir: path40.dirname(resolved),
       workspaceFile: resolved
     };
   }
@@ -14531,14 +14298,14 @@ async function resolveWorkspaceTemplate(templatePath) {
   if (workspaceFiles.length === 1) {
     return {
       dir: resolved,
-      workspaceFile: path41.join(resolved, workspaceFiles[0])
+      workspaceFile: path40.join(resolved, workspaceFiles[0])
     };
   }
   if (workspaceFiles.length > 1) {
     const conventionFile = workspaceFiles.find((f) => f === "template.code-workspace");
     return {
       dir: resolved,
-      workspaceFile: conventionFile ? path41.join(resolved, conventionFile) : void 0
+      workspaceFile: conventionFile ? path40.join(resolved, conventionFile) : void 0
     };
   }
   return { dir: resolved };
@@ -14742,7 +14509,7 @@ async function runEvaluation(options) {
   ];
   const evaluatorRegistry = buildEvaluatorRegistry(evaluators, resolveGraderProvider);
   const typeRegistry = createBuiltinRegistry();
-  const discoveryBaseDir = evalFilePath ? path42.dirname(path42.resolve(evalFilePath)) : process.cwd();
+  const discoveryBaseDir = evalFilePath ? path41.dirname(path41.resolve(evalFilePath)) : process.cwd();
   const evalDir = discoveryBaseDir;
   await discoverAssertions(typeRegistry, discoveryBaseDir);
   await discoverGraders(typeRegistry, discoveryBaseDir);
@@ -14851,14 +14618,22 @@ async function runEvaluation(options) {
   const usePool = poolEnabled !== false && !!suiteWorkspace?.repos?.length && !isPerTestIsolation && !useStaticWorkspace;
   const resolvedRetainOnSuccess = retainOnSuccess ?? (keepWorkspaces ? "keep" : "cleanup");
   const resolvedRetainOnFailure = retainOnFailure ?? (cleanupWorkspaces ? "cleanup" : "keep");
-  const requestedWorkers = options.maxConcurrency ?? target.workers ?? 1;
-  const workers = hasSharedWorkspace && !usePool ? 1 : requestedWorkers;
+  const workers = options.maxConcurrency ?? target.workers ?? 1;
   setupLog(
-    `sharedWorkspace=${hasSharedWorkspace} perTestIsolation=${isPerTestIsolation} usePool=${usePool} requestedWorkers=${requestedWorkers} effectiveWorkers=${workers}`
+    `sharedWorkspace=${hasSharedWorkspace} perTestIsolation=${isPerTestIsolation} usePool=${usePool} workers=${workers}`
   );
-  if (hasSharedWorkspace && !usePool && requestedWorkers > 1) {
+  if (hasSharedWorkspace && !usePool && workers > 1) {
     console.warn(
-      `Warning: Shared workspace requires sequential execution. Overriding workers from ${requestedWorkers} to 1.`
+      [
+        `Warning: This eval uses a shared workspace with ${workers} workers.`,
+        "If the agent under test makes file edits, concurrent runs may corrupt each other.",
+        "To limit concurrency, add this to your eval YAML:",
+        "",
+        "  execution:",
+        "    workers: 1",
+        "",
+        "Or pass --workers 1 on the command line."
+      ].join("\n")
     );
   }
   const limit = pLimit(workers);
@@ -14931,7 +14706,7 @@ async function runEvaluation(options) {
   }
   try {
     if (suiteWorkspaceFile && sharedWorkspacePath) {
-      const copiedWorkspaceFile = path42.join(sharedWorkspacePath, path42.basename(suiteWorkspaceFile));
+      const copiedWorkspaceFile = path41.join(sharedWorkspacePath, path41.basename(suiteWorkspaceFile));
       try {
         await stat7(copiedWorkspaceFile);
         suiteWorkspaceFile = copiedWorkspaceFile;
@@ -15041,7 +14816,7 @@ async function runEvaluation(options) {
           const budgetResult = {
             timestamp: (now ?? (() => /* @__PURE__ */ new Date()))().toISOString(),
             testId: evalCase.id,
-            dataset: evalCase.dataset,
+            eval_set: evalCase.eval_set,
             score: 0,
             assertions: [],
             output: [],
@@ -15077,7 +14852,7 @@ async function runEvaluation(options) {
           const haltResult = {
             timestamp: (now ?? (() => /* @__PURE__ */ new Date()))().toISOString(),
             testId: evalCase.id,
-            dataset: evalCase.dataset,
+            eval_set: evalCase.eval_set,
             score: 0,
             assertions: [],
             output: [],
@@ -15309,8 +15084,6 @@ async function runBatchEvaluation(options) {
     const promptInputs = promptInputsList[index];
     return {
       question: promptInputs.question,
-      guidelines: promptInputs.guidelines,
-      guideline_patterns: evalCase.guideline_patterns,
       inputFiles: evalCase.file_paths,
       evalCaseId: evalCase.id,
       metadata: {
@@ -15508,7 +15281,7 @@ async function runEvalCase(options) {
         );
       }
       if (caseWorkspaceFile && workspacePath) {
-        const copiedFile = path42.join(workspacePath, path42.basename(caseWorkspaceFile));
+        const copiedFile = path41.join(workspacePath, path41.basename(caseWorkspaceFile));
         try {
           await stat7(copiedFile);
           caseWorkspaceFile = copiedFile;
@@ -15568,10 +15341,10 @@ async function runEvalCase(options) {
       const files = evalCase.metadata.agent_skills_files;
       if (baseDir && files.length > 0) {
         for (const relPath of files) {
-          const srcPath = path42.resolve(baseDir, relPath);
-          const destPath = path42.resolve(workspacePath, relPath);
+          const srcPath = path41.resolve(baseDir, relPath);
+          const destPath = path41.resolve(workspacePath, relPath);
           try {
-            await mkdir13(path42.dirname(destPath), { recursive: true });
+            await mkdir13(path41.dirname(destPath), { recursive: true });
             await copyFile2(srcPath, destPath);
           } catch (error) {
             const message = error instanceof Error ? error.message : String(error);
@@ -16018,8 +15791,7 @@ async function evaluateCandidate(options) {
   let lmRequest;
   if (isAgentProvider(provider)) {
     agentRequest = {
-      question: promptInputs.question,
-      guideline_paths: evalCase.guideline_paths
+      question: promptInputs.question
     };
   } else {
     if (promptInputs.chatPrompt) {
@@ -16028,8 +15800,7 @@ async function evaluateCandidate(options) {
       };
     } else {
       lmRequest = {
-        question: promptInputs.question,
-        guidelines: promptInputs.guidelines
+        question: promptInputs.question
       };
     }
   }
@@ -16043,7 +15814,7 @@ async function evaluateCandidate(options) {
   return {
     timestamp: completedAt.toISOString(),
     testId: evalCase.id,
-    dataset: evalCase.dataset,
+    eval_set: evalCase.eval_set,
     conversationId: evalCase.conversation_id,
     score: score.score,
     assertions: score.assertions,
@@ -16191,7 +15962,7 @@ async function runEvaluatorList(options) {
     fileChanges,
     workspacePath
   };
-  const evalFileDir = evalCase.guideline_paths[0] ? path42.dirname(evalCase.guideline_paths[0]) : process.cwd();
+  const evalFileDir = evalCase.file_paths[0] ? path41.dirname(evalCase.file_paths[0]) : process.cwd();
   const dispatchContext = {
     graderProvider,
     targetResolver,
@@ -16305,7 +16076,7 @@ function filterEvalCases(evalCases, filter) {
   if (!filter) {
     return evalCases;
   }
-  return evalCases.filter((evalCase) => micromatch4.isMatch(evalCase.id, filter));
+  return evalCases.filter((evalCase) => micromatch3.isMatch(evalCase.id, filter));
 }
 function buildEvaluatorRegistry(overrides, resolveGraderProvider) {
   const llmGrader = overrides?.["llm-grader"] ?? overrides?.["llm-judge"] ?? new LlmGraderEvaluator({
@@ -16342,8 +16113,6 @@ async function invokeProvider(provider, options) {
     const braintrustSpanIds = streamCallbacks?.getActiveSpanIds?.() ?? void 0;
     return await provider.invoke({
       question: promptInputs.question,
-      guidelines: promptInputs.guidelines,
-      guideline_patterns: evalCase.guideline_patterns,
       chatPrompt: promptInputs.chatPrompt,
       inputFiles: evalCase.file_paths,
       evalCaseId: evalCase.id,
@@ -16371,21 +16140,17 @@ function buildErrorResult(evalCase, targetName, timestamp, error, promptInputs,
   if (isAgentProvider(provider)) {
     agentRequest = {
       question: promptInputs.question,
-      guideline_paths: evalCase.guideline_paths,
       error: message
     };
   } else {
     if (promptInputs.chatPrompt) {
       lmRequest = {
         chat_prompt: promptInputs.chatPrompt,
-        guideline_paths: evalCase.guideline_paths,
         error: message
       };
     } else {
       lmRequest = {
         question: promptInputs.question,
-        guidelines: promptInputs.guidelines,
-        guideline_paths: evalCase.guideline_paths,
         error: message
       };
     }
@@ -16398,7 +16163,7 @@ function buildErrorResult(evalCase, targetName, timestamp, error, promptInputs,
   return {
     timestamp: timestamp.toISOString(),
     testId: evalCase.id,
-    dataset: evalCase.dataset,
+    eval_set: evalCase.eval_set,
     conversationId: evalCase.conversation_id,
     score: 0,
     assertions: [{ text: `Error: ${message}`, passed: false }],
@@ -16431,7 +16196,6 @@ function createCacheKey(provider, target, evalCase, promptInputs) {
   hash.update(target.name);
   hash.update(evalCase.id);
   hash.update(promptInputs.question);
-  hash.update(promptInputs.guidelines);
   hash.update(promptInputs.systemMessage ?? "");
   if (promptInputs.chatPrompt) {
     hash.update(JSON.stringify(promptInputs.chatPrompt));
@@ -16531,7 +16295,7 @@ function computeWeightedMean(entries) {
 // src/evaluation/evaluate.ts
 import { existsSync as existsSync4 } from "node:fs";
-import path43 from "node:path";
+import path42 from "node:path";
 // src/evaluation/providers/function-provider.ts
 function createFunctionProvider(taskFn) {
@@ -16568,7 +16332,7 @@ async function evaluate(config) {
   }
   const gitRoot = await findGitRoot(process.cwd());
   const repoRoot = gitRoot ?? process.cwd();
-  const testFilePath = config.specFile ? path43.resolve(config.specFile) : path43.join(process.cwd(), "__programmatic__.yaml");
+  const testFilePath = config.specFile ? path42.resolve(config.specFile) : path42.join(process.cwd(), "__programmatic__.yaml");
   await loadEnvHierarchy(repoRoot, testFilePath);
   let resolvedTarget;
   let taskProvider;
@@ -16634,8 +16398,6 @@ async function evaluate(config) {
         input_segments: inputSegments,
         expected_output: expectedOutput,
         reference_answer: expectedOutputValue,
-        guideline_paths: [],
-        guideline_patterns: [],
         file_paths: [],
         assertions: assertConfigs.length > 0 ? assertConfigs : void 0,
         metadata: test.metadata
@@ -16697,10 +16459,10 @@ function computeSummary(results, durationMs) {
 var TARGET_FILE_CANDIDATES = [".agentv/targets.yaml", ".agentv/targets.yml"];
 async function discoverDefaultTarget(repoRoot) {
   const cwd = process.cwd();
-  const chain = buildDirectoryChain(path43.join(cwd, "_placeholder"), repoRoot);
+  const chain = buildDirectoryChain(path42.join(cwd, "_placeholder"), repoRoot);
   for (const dir of chain) {
     for (const candidate of TARGET_FILE_CANDIDATES) {
-      const targetsPath = path43.join(dir, candidate);
+      const targetsPath = path42.join(dir, candidate);
       if (!existsSync4(targetsPath)) continue;
       try {
         const definitions = await readTargetDefinitions(targetsPath);
@@ -16717,7 +16479,7 @@ async function loadEnvHierarchy(repoRoot, startPath) {
   const chain = buildDirectoryChain(startPath, repoRoot);
   const envFiles = [];
   for (const dir of chain) {
-    const envPath = path43.join(dir, ".env");
+    const envPath = path42.join(dir, ".env");
     if (existsSync4(envPath)) envFiles.push(envPath);
   }
   for (let i = 0; i < envFiles.length; i++) {
@@ -16898,8 +16660,8 @@ function buildPrompt(criteria, question, referenceAnswer) {
 }
 // src/evaluation/cache/response-cache.ts
-import { mkdir as mkdir14, readFile as readFile12, writeFile as writeFile8 } from "node:fs/promises";
-import path44 from "node:path";
+import { mkdir as mkdir14, readFile as readFile11, writeFile as writeFile8 } from "node:fs/promises";
+import path43 from "node:path";
 var DEFAULT_CACHE_PATH = ".agentv/cache";
 var ResponseCache = class {
   cachePath;
@@ -16909,7 +16671,7 @@ var ResponseCache = class {
   async get(key) {
     const filePath = this.keyToPath(key);
     try {
-      const data = await readFile12(filePath, "utf8");
+      const data = await readFile11(filePath, "utf8");
       return JSON.parse(data);
     } catch {
       return void 0;
@@ -16917,13 +16679,13 @@ var ResponseCache = class {
   }
   async set(key, value) {
     const filePath = this.keyToPath(key);
-    const dir = path44.dirname(filePath);
+    const dir = path43.dirname(filePath);
     await mkdir14(dir, { recursive: true });
     await writeFile8(filePath, JSON.stringify(value, null, 2), "utf8");
   }
   keyToPath(key) {
     const prefix = key.slice(0, 2);
-    return path44.join(this.cachePath, prefix, `${key}.json`);
+    return path43.join(this.cachePath, prefix, `${key}.json`);
   }
 };
 function shouldEnableCache(params) {
@@ -17111,7 +16873,7 @@ var OtelTraceExporter = class {
         rootSpan.setAttribute("gen_ai.system", "agentv");
         rootSpan.setAttribute("agentv.test_id", result.testId);
         rootSpan.setAttribute("agentv.target", result.target);
-        if (result.dataset) rootSpan.setAttribute("agentv.dataset", result.dataset);
+        if (result.eval_set) rootSpan.setAttribute("agentv.eval_set", result.eval_set);
         rootSpan.setAttribute("agentv.score", result.score);
         if (captureContent && result.output.length > 0) {
           const lastMsg = result.output[result.output.length - 1];
@@ -17296,14 +17058,14 @@ var OtelStreamingObserver = class {
   // biome-ignore lint/suspicious/noExplicitAny: OTel context loaded dynamically
   rootCtx = null;
   /** Create root eval span immediately (visible in backend right away) */
-  startEvalCase(testId, target, dataset) {
+  startEvalCase(testId, target, evalSet) {
     const ctx = this.parentCtx ?? this.api.context.active();
     this.rootSpan = this.tracer.startSpan("agentv.eval", void 0, ctx);
     this.rootSpan.setAttribute("gen_ai.operation.name", "evaluate");
     this.rootSpan.setAttribute("gen_ai.system", "agentv");
     this.rootSpan.setAttribute("agentv.test_id", testId);
     this.rootSpan.setAttribute("agentv.target", target);
-    if (dataset) this.rootSpan.setAttribute("agentv.dataset", dataset);
+    if (evalSet) this.rootSpan.setAttribute("agentv.eval_set", evalSet);
     this.rootCtx = this.api.trace.setSpan(this.api.context.active(), this.rootSpan);
   }
   /** Create and immediately export a tool span */
@@ -17477,6 +17239,7 @@ export {
   extractTargetsFromSuite,
   extractTargetsFromTestCase,
   extractTrialsConfig,
+  extractWorkersFromSuite,
   fileExists,
   findGitRoot,
   freeformEvaluationSchema,
@@ -17491,7 +17254,6 @@ export {
   initializeBaseline,
   isAgentSkillsFormat,
   isEvaluatorKind,
-  isGuidelineFile,
   isJsonObject,
   isJsonValue,
   isNonEmptyString,