npm - @xn-intenton-z2a/agentic-lib - Versions diffs - 7.4.32 → 7.4.33 - Mend

@xn-intenton-z2a/agentic-lib 7.4.32 → 7.4.33

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17)

package/.github/workflows/agentic-lib-init.yml +12 -10
package/.github/workflows/agentic-lib-schedule.yml +122 -56
package/.github/workflows/agentic-lib-test.yml +1 -1
package/.github/workflows/agentic-lib-workflow.yml +30 -2
package/agentic-lib.toml +22 -2
package/bin/agentic-lib.js +166 -19
package/package.json +1 -1
package/src/actions/agentic-step/tasks/direct.js +17 -9
package/src/actions/agentic-step/tasks/implementation-review.js +66 -15
package/src/actions/agentic-step/tasks/maintain-features.js +5 -0
package/src/actions/agentic-step/tasks/review-issue.js +13 -2
package/src/actions/agentic-step/tasks/transform.js +18 -0
package/src/copilot/config.js +17 -3
package/src/copilot/telemetry.js +18 -1
package/src/seeds/zero-MISSION.md +14 -14
package/src/seeds/zero-README.md +106 -65
package/src/seeds/zero-package.json +1 -1

package/bin/agentic-lib.js CHANGED Viewed

@@ -110,7 +110,7 @@ const target = resolve(targetPath);
 const modelIdx = flags.indexOf("--model");
 const model = modelIdx >= 0 ? flags[modelIdx + 1] : "claude-sonnet-4";
 const missionIdx = flags.indexOf("--mission");
-const mission = missionIdx >= 0 ? flags[missionIdx + 1] : "6-kyu-understand-hamming-distance";
+const mission = missionIdx >= 0 ? flags[missionIdx + 1] : "7-kyu-understand-fizz-buzz";
 const cyclesIdx = flags.indexOf("--cycles");
 const cycles = cyclesIdx >= 0 ? parseInt(flags[cyclesIdx + 1], 10) : 0;
 const stepsIdx = flags.indexOf("--steps");
@@ -734,7 +734,7 @@ function clearAndRecreateDir(dirPath, label) {
   if (!dryRun) mkdirSync(fullPath, { recursive: true });
 }
-function initPurge(seedsDir, missionName, initTimestamp) {
+async function initPurge(seedsDir, missionName, initTimestamp) {
   console.log("\n--- Purge: Reset Source Files to Seed State ---");
   const { sourcePath, testsPath, behaviourPath, examplesPath, webPath } = readTomlPaths();
@@ -779,12 +779,52 @@ function initPurge(seedsDir, missionName, initTimestamp) {
     console.log("  CREATE: docs/.nojekyll");
   }
+  // W10: Preserve TOML values through purge
+  const tomlTarget = resolve(target, "agentic-lib.toml");
+  let preservedTomlValues = {};
+  if (existsSync(tomlTarget)) {
+    const existingToml = readFileSync(tomlTarget, "utf8");
+    const readTomlValue = (key) => {
+      const m = existingToml.match(new RegExp(`^\\s*${key.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")}\\s*=\\s*"([^"]*)"`, "m"));
+      return m ? m[1] : null;
+    };
+    const readTomlNum = (key) => {
+      const m = existingToml.match(new RegExp(`^\\s*${key.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")}\\s*=\\s*(\\d+)`, "m"));
+      return m ? parseInt(m[1], 10) : null;
+    };
+    preservedTomlValues = {
+      supervisor: readTomlValue("supervisor"),
+      focus: readTomlValue("focus"),
+      model: readTomlValue("model"),
+      profile: readTomlValue("profile"),
+      "acceptance-criteria-threshold": readTomlNum("acceptance-criteria-threshold"),
+      "min-resolved-issues": readTomlNum("min-resolved-issues"),
+      "mission-type": readTomlValue("mission-type"),
+    };
+    console.log("  PRESERVE: saved TOML values for restoration after purge");
+  }
   // Force-overwrite agentic-lib.toml during purge (transformed from root)
   const tomlSource = resolve(pkgRoot, "agentic-lib.toml");
   if (existsSync(tomlSource)) {
     initTransformFile(tomlSource, resolve(target, "agentic-lib.toml"), "SEED: agentic-lib.toml (transformed)");
   }
+  // Restore preserved values into the new TOML
+  if (existsSync(tomlTarget) && Object.values(preservedTomlValues).some(v => v !== null)) {
+    let toml = readFileSync(tomlTarget, "utf8");
+    for (const [key, value] of Object.entries(preservedTomlValues)) {
+      if (value === null) continue;
+      const isNum = typeof value === "number";
+      const regex = new RegExp(`^(\\s*${key.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")}\\s*=\\s*)${isNum ? "\\d+" : '"[^"]*"'}`, "m");
+      if (regex.test(toml)) {
+        toml = toml.replace(regex, `$1${isNum ? value : `"${value}"`}`);
+        console.log(`  RESTORE: ${key} = ${value}`);
+      }
+    }
+    if (!dryRun) writeFileSync(tomlTarget, toml);
+  }
   // Clear agent log files (written by implementation-review and other tasks)
   try {
     const agentLogs = readdirSync(target).filter((f) => f.startsWith("agent-log-") && f.endsWith(".md"));
@@ -798,27 +838,133 @@ function initPurge(seedsDir, missionName, initTimestamp) {
     if (agentLogs.length > 0) console.log(`  Cleared ${agentLogs.length} agent log file(s)`);
   } catch { /* ignore — directory may not have agent logs */ }
-  // Copy mission seed file as MISSION.md
+  // Copy mission seed file as MISSION.md (with random/generate support)
   const missionsDir = resolve(seedsDir, "missions");
-  const missionFile = resolve(missionsDir, `${missionName}.md`);
-  if (existsSync(missionFile)) {
-    initCopyFile(missionFile, resolve(target, "MISSION.md"), `MISSION: missions/${missionName}.md → MISSION.md`);
-  } else {
-    // List available missions and error
+  let resolvedMission = missionName;
+  let missionType = missionName; // "random", "generate", or the specific seed name
+  if (missionName === "random") {
+    // W11: Pick a random mission from available seeds
     const available = existsSync(missionsDir)
-      ? readdirSync(missionsDir)
-          .filter((f) => f.endsWith(".md"))
-          .map((f) => f.replace(/\.md$/, ""))
+      ? readdirSync(missionsDir).filter((f) => f.endsWith(".md")).map((f) => f.replace(/\.md$/, ""))
       : [];
-    console.error(`\nERROR: Unknown mission "${missionName}".`);
-    if (available.length > 0) {
-      console.error(`Available missions: ${available.join(", ")}`);
+    if (available.length === 0) {
+      console.error("\nERROR: No missions available for random selection.");
+      process.exit(1);
+    }
+    resolvedMission = available[Math.floor(Math.random() * available.length)];
+    console.log(`  RANDOM: selected mission "${resolvedMission}" from ${available.length} available`);
+  } else if (missionName === "generate") {
+    // W12: Generate a mission using LLM
+    console.log("  GENERATE: Creating LLM-generated mission...");
+    try {
+      const { runCopilotSession } = await import("../src/copilot/copilot-session.js");
+      const available = existsSync(missionsDir)
+        ? readdirSync(missionsDir).filter((f) => f.endsWith(".md")).map((f) => f.replace(/\.md$/, ""))
+        : [];
+      const sampleMission = existsSync(resolve(missionsDir, "7-kyu-understand-fizz-buzz.md"))
+        ? readFileSync(resolve(missionsDir, "7-kyu-understand-fizz-buzz.md"), "utf8")
+        : "";
+      const prompt = [
+        "Generate a novel JavaScript library mission for an autonomous coding pipeline.",
+        "The mission should follow this exact structure (use the example as a template):",
+        "",
+        sampleMission,
+        "",
+        "Requirements:",
+        "- Be distinct from all existing missions: " + available.join(", "),
+        "- Difficulty should be between 8-kyu (trivial) and 2-kyu (expert)",
+        "- Include 5-10 acceptance criteria as markdown checkboxes (- [ ] ...)",
+        "- The library must be implementable in a single src/lib/main.js file",
+        "- Include edge cases and error handling in the requirements",
+        "",
+        "Write the mission to MISSION.md using the write_file tool.",
+      ].join("\n");
+      await runCopilotSession({
+        task: "generate-mission",
+        model,
+        target,
+        prompt,
+        timeoutMs: 120000,
+        dryRun,
+      });
+      resolvedMission = "generated";
+      console.log("  GENERATE: Mission written to MISSION.md");
+    } catch (err) {
+      console.error(`  GENERATE: LLM generation failed (${err.message}), falling back to fizz-buzz`);
+      resolvedMission = "7-kyu-understand-fizz-buzz";
+      missionType = "generate-fallback";
+    }
+  }
+  if (missionName !== "generate" || resolvedMission !== "generated") {
+    const selectedMissionFile = resolve(missionsDir, `${resolvedMission}.md`);
+    if (existsSync(selectedMissionFile)) {
+      initCopyFile(selectedMissionFile, resolve(target, "MISSION.md"), `MISSION: missions/${resolvedMission}.md → MISSION.md`);
+    } else {
+      const available = existsSync(missionsDir)
+        ? readdirSync(missionsDir).filter((f) => f.endsWith(".md")).map((f) => f.replace(/\.md$/, ""))
+        : [];
+      console.error(`\nERROR: Unknown mission "${resolvedMission}".`);
+      if (available.length > 0) {
+        console.error(`Available missions: ${available.join(", ")}`);
+      }
+      process.exit(1);
+    }
+  }
+  // W17: Generate structured acceptance criteria in TOML
+  const missionTargetPath = resolve(target, "MISSION.md");
+  if (existsSync(missionTargetPath)) {
+    const missionContent = readFileSync(missionTargetPath, "utf8");
+    const checkboxes = missionContent.match(/- \[ \] (.+)/g) || [];
+    if (checkboxes.length > 0) {
+      const criteriaEntries = checkboxes.map((line, i) => {
+        const text = line.replace(/^- \[ \] /, "").trim();
+        return `${i + 1} = { text = ${JSON.stringify(text)}, met = false }`;
+      });
+      const criteriaSection = [
+        "",
+        "[acceptance-criteria]",
+        `# Auto-generated from MISSION.md on init. Updated by implementation-review.`,
+        `total = ${checkboxes.length}`,
+        ...criteriaEntries,
+      ].join("\n");
+      const tomlFile = resolve(target, "agentic-lib.toml");
+      if (existsSync(tomlFile)) {
+        let toml = readFileSync(tomlFile, "utf8");
+        if (/^\[acceptance-criteria\]/m.test(toml)) {
+          toml = toml.replace(/\n?\[acceptance-criteria\][^\[]*/, criteriaSection);
+        } else {
+          toml = toml.trimEnd() + "\n" + criteriaSection + "\n";
+        }
+        if (!dryRun) writeFileSync(tomlFile, toml);
+        console.log(`  WRITE: [acceptance-criteria] section (${checkboxes.length} criteria)`);
+        initChanges++;
+      }
+    }
+  }
+  // Set acceptance criteria threshold based on mission difficulty
+  const difficultyMatch = resolvedMission.match(/^(\d+)-(?:kyu|dan)/);
+  if (difficultyMatch) {
+    const level = parseInt(difficultyMatch[1], 10);
+    const isDan = resolvedMission.includes("-dan-");
+    const THRESHOLD_MAP = { 8: 100, 7: 75, 6: 60, 5: 50, 4: 50, 3: 40, 2: isDan ? 30 : 35, 1: 30 };
+    const threshold = THRESHOLD_MAP[level] || 50;
+    const tomlFile = resolve(target, "agentic-lib.toml");
+    if (existsSync(tomlFile)) {
+      let toml = readFileSync(tomlFile, "utf8");
+      const regex = /^(\s*acceptance-criteria-threshold\s*=\s*)\d+/m;
+      if (regex.test(toml)) {
+        toml = toml.replace(regex, `$1${threshold}`);
+        if (!dryRun) writeFileSync(tomlFile, toml);
+        console.log(`  SET: acceptance-criteria-threshold = ${threshold} (${resolvedMission})`);
+      }
     }
-    process.exit(1);
   }
   // Write init metadata to agentic-lib.toml
-  const tomlTarget = resolve(target, "agentic-lib.toml");
   if (existsSync(tomlTarget)) {
     let toml = readFileSync(tomlTarget, "utf8");
     const pkg = JSON.parse(readFileSync(resolve(pkgRoot, "package.json"), "utf8"));
@@ -827,7 +973,8 @@ function initPurge(seedsDir, missionName, initTimestamp) {
       "[init]",
       `timestamp = "${initTimestamp}"`,
       `mode = "purge"`,
-      `mission = "${missionName}"`,
+      `mission = "${resolvedMission}"`,
+      `mission-type = "${missionType}"`,
       `version = "${pkg.version}"`,
     ].join("\n");
     // Replace existing [init] section or append
@@ -1260,7 +1407,7 @@ function initPurgeGitHub() {
   }
 }
-function runInit() {
+async function runInit() {
   if (!existsSync(target)) {
     console.error(`Target directory does not exist: ${target}`);
     process.exit(1);
@@ -1316,7 +1463,7 @@ function runInit() {
   initScripts(agenticDir);
   initConfig(seedsDir);
   if (reseed) initReseed(initTimestamp);
-  if (purge) initPurge(seedsDir, mission, initTimestamp);
+  if (purge) await initPurge(seedsDir, mission, initTimestamp);
   if (purge) initPurgeGitHub();
   console.log(`\n${initChanges} change(s)${dryRun ? " (dry run)" : ""}`);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@xn-intenton-z2a/agentic-lib",
-  "version": "7.4.32",
+  "version": "7.4.33",
   "description": "Agentic-lib Agentic Coding Systems SDK powering automated GitHub workflows.",
   "type": "module",
   "scripts": {

package/src/actions/agentic-step/tasks/direct.js CHANGED Viewed

@@ -67,8 +67,13 @@ function detectDedicatedTests() {
  */
 async function buildMetricAssessment(ctx, config) {
   const thresholds = config.missionCompleteThresholds || {};
-  const minResolved = thresholds.minResolvedIssues ?? 3;
+  const minResolved = thresholds.minResolvedIssues ?? 1;
   const maxTodos = thresholds.maxSourceTodos ?? 0;
+  const minCumulativeTransforms = thresholds.minCumulativeTransforms ?? 1;
+  const acceptanceThreshold = thresholds.acceptanceCriteriaThreshold ?? 50;
+  const requireNoOpenIssues = thresholds.requireNoOpenIssues ?? true;
+  const requireNoOpenPrs = thresholds.requireNoOpenPrs ?? true;
+  const requireNoCriticalGaps = thresholds.requireNoCriticalGaps ?? true;
   // Implementation review gaps (passed from workflow via env)
   let reviewGaps = [];
@@ -78,22 +83,23 @@ async function buildMetricAssessment(ctx, config) {
   } catch { /* ignore parse errors */ }
   const criticalGaps = reviewGaps.filter((g) => g.severity === "critical");
-  // Acceptance criteria from MISSION.md checkboxes
+  // Acceptance criteria from MISSION.md checkboxes (or structured TOML if available)
   const { countAcceptanceCriteria } = await import("../../../copilot/telemetry.js");
   const missionPath = config.paths?.mission?.path || "MISSION.md";
   const acceptance = countAcceptanceCriteria(missionPath);
-  const acceptanceMet = acceptance.total > 0 && acceptance.met > acceptance.total / 2;
+  const acceptancePct = acceptance.total > 0 ? (acceptance.met / acceptance.total) * 100 : 0;
+  const acceptanceMet = acceptance.total > 0 && acceptancePct >= acceptanceThreshold;
   // C6: Removed "Dedicated tests" metric; using cumulative transforms instead
   const metrics = [
-    { metric: "Open issues", value: ctx.issuesSummary.length, target: 0, met: ctx.issuesSummary.length === 0 },
-    { metric: "Open PRs", value: ctx.prsSummary.length, target: 0, met: ctx.prsSummary.length === 0 },
+    { metric: "Open issues", value: ctx.issuesSummary.length, target: 0, met: requireNoOpenIssues ? ctx.issuesSummary.length === 0 : true },
+    { metric: "Open PRs", value: ctx.prsSummary.length, target: 0, met: requireNoOpenPrs ? ctx.prsSummary.length === 0 : true },
     { metric: "Issues resolved", value: ctx.resolvedCount, target: minResolved, met: ctx.resolvedCount >= minResolved },
     { metric: "Source TODOs", value: ctx.sourceTodoCount, target: maxTodos, met: ctx.sourceTodoCount <= maxTodos },
-    { metric: "Cumulative transforms", value: ctx.cumulativeTransformationCost, target: 1, met: ctx.cumulativeTransformationCost >= 1 },
+    { metric: "Cumulative transforms", value: ctx.cumulativeTransformationCost, target: minCumulativeTransforms, met: ctx.cumulativeTransformationCost >= minCumulativeTransforms },
     { metric: "Budget", value: ctx.cumulativeTransformationCost, target: ctx.transformationBudget || "unlimited", met: !(ctx.transformationBudget > 0 && ctx.cumulativeTransformationCost >= ctx.transformationBudget) },
-    { metric: "Implementation review", value: criticalGaps.length === 0 ? "No critical gaps" : `${criticalGaps.length} critical gap(s)`, target: "No critical gaps", met: criticalGaps.length === 0 },
-    { metric: "Acceptance criteria", value: acceptance.total > 0 ? `${acceptance.met}/${acceptance.total}` : "N/A", target: "> 50%", met: acceptanceMet },
+    { metric: "Implementation review", value: criticalGaps.length === 0 ? "No critical gaps" : `${criticalGaps.length} critical gap(s)`, target: "No critical gaps", met: requireNoCriticalGaps ? criticalGaps.length === 0 : true },
+    { metric: "Acceptance criteria", value: acceptance.total > 0 ? `${acceptance.met}/${acceptance.total} (${Math.round(acceptancePct)}%)` : "N/A", target: `>= ${acceptanceThreshold}%`, met: acceptanceMet },
   ];
   const allMet = metrics.every((m) => m.met);
@@ -166,7 +172,9 @@ function buildPrompt(ctx, agentInstructions, metricAssessment) {
     "Check the acceptance criteria in the Mission section above. If all criteria are clearly satisfied by the current source code and tests (verified via read_file), you SHOULD declare mission-complete even if not all mechanical metrics are MET.",
     "For simple missions (few functions, clear acceptance criteria), do not require elaborate test coverage or documentation beyond what the acceptance criteria specify.",
     "",
-    "**Post-merge evaluation context:** This director runs AFTER a dev transformation has been merged. The source code, tests, README, and website you see are the result of that merge. The acceptance criteria checkboxes in MISSION.md reflect the implementation review's findings. If the metrics show all conditions MET and the acceptance criteria are > 50% checked, you should declare mission-complete unless you find a critical implementation gap via read_file. Do not defer to a future run — the pipeline has a structural 2-run minimum, and this is your chance to complete in 1 run.",
+    `**Focus mode:** ${config.focus === "maintenance" ? "MAINTENANCE — The mission is substantially complete. Focus on adding value: improve test coverage, refactor for clarity, improve documentation, optimise performance. Do NOT declare mission-complete or mission-failed. Dispatch maintenance work instead." : "MISSION — Work toward mission completion. Declare mission-complete when criteria are met."}`,
+    "",
+    `**Post-merge evaluation context:** This director runs AFTER a dev transformation has been merged. The source code, tests, README, and website you see are the result of that merge. The acceptance criteria checkboxes in MISSION.md reflect the implementation review's findings. If the metrics show all conditions MET and the acceptance criteria meet the ${metricAssessment.metrics.find(m => m.metric === "Acceptance criteria")?.target || ">= 50%"} threshold, you should declare mission-complete unless you find a critical implementation gap via read_file. Do not defer to a future run — the pipeline has a structural 2-run minimum, and this is your chance to complete in 1 run.`,
     "",
     "Then call report_director_decision with your determination.",
     "",

package/src/actions/agentic-step/tasks/implementation-review.js CHANGED Viewed

@@ -48,9 +48,11 @@ function buildReviewPrompt(mission, config, agentInstructions, agentLogsSummary)
     "   - Tests that don't assert anything meaningful (empty/trivial)",
     "   - Features listed as done in docs but missing from code",
     "   - PRs merged without test coverage for the claimed feature",
-    "4. Check the MISSION.md Acceptance Criteria checkboxes (`- [ ]`). For each criterion,",
-    "   if you verified it is implemented AND unit-tested, include its exact text in the",
-    "   `acceptanceCriteriaMet` array. Copy the criterion text exactly as it appears after `- [ ]`.",
+    "4. Check the MISSION.md Acceptance Criteria. For each criterion that you verified is",
+    "   implemented AND unit-tested, include its **index number** (1-based) in the",
+    "   `acceptanceCriteriaMetIndices` array. Also include the text in `acceptanceCriteriaMet`",
+    "   for backwards compatibility. The indexed criteria are listed in agentic-lib.toml",
+    "   under [acceptance-criteria] if available.",
     "5. Call report_implementation_review with your findings.",
     "",
     "**You MUST call report_implementation_review exactly once.**",
@@ -172,34 +174,83 @@ export async function implementationReview(context) {
           acceptanceCriteriaMet: {
             type: "array",
             items: { type: "string" },
-            description: "Exact text of each acceptance criterion from MISSION.md that is verified as implemented AND unit-tested. Copy the text after '- [ ]' exactly.",
+            description: "Text of each acceptance criterion verified as implemented AND unit-tested (for backwards compatibility).",
+          },
+          acceptanceCriteriaMetIndices: {
+            type: "array",
+            items: { type: "integer" },
+            description: "1-based indices of acceptance criteria verified as met (preferred over text matching). See [acceptance-criteria] in agentic-lib.toml.",
           },
         },
         required: ["elements", "gaps", "advice"],
       },
-      handler: async ({ elements, gaps, advice, misleadingMetrics, acceptanceCriteriaMet }) => {
+      handler: async ({ elements, gaps, advice, misleadingMetrics, acceptanceCriteriaMet, acceptanceCriteriaMetIndices }) => {
         reviewResult.elements = elements || [];
         reviewResult.gaps = gaps || [];
         reviewResult.advice = advice || "";
         reviewResult.misleadingMetrics = misleadingMetrics || [];
-        // Update MISSION.md checkboxes based on verified acceptance criteria
+        const metIndices = acceptanceCriteriaMetIndices || [];
         const metCriteria = acceptanceCriteriaMet || [];
-        if (metCriteria.length > 0) {
+        const totalUpdated = metIndices.length || metCriteria.length;
+        // W17: Update structured TOML acceptance criteria by index (primary)
+        if (metIndices.length > 0) {
+          try {
+            const { readFileSync, writeFileSync } = await import("fs");
+            const tomlPath = config.configToml ? "agentic-lib.toml" : null;
+            if (tomlPath && readFileSync(tomlPath, "utf8").includes("[acceptance-criteria]")) {
+              let toml = readFileSync(tomlPath, "utf8");
+              for (const idx of metIndices) {
+                const regex = new RegExp(`^(${idx}\\s*=\\s*\\{[^}]*met\\s*=\\s*)false`, "m");
+                if (regex.test(toml)) {
+                  toml = toml.replace(regex, "$1true");
+                }
+              }
+              writeFileSync(tomlPath, toml, "utf8");
+              core.info(`Updated ${metIndices.length} acceptance criteria by index in TOML`);
+            }
+          } catch (err) {
+            core.warning(`Could not update TOML acceptance criteria: ${err.message}`);
+          }
+        }
+        // Also update MISSION.md checkboxes (best-effort, not critical)
+        if (metCriteria.length > 0 || metIndices.length > 0) {
           try {
             const missionPath = config.paths?.mission?.path || "MISSION.md";
             const { readFileSync, writeFileSync } = await import("fs");
             let missionContent = readFileSync(missionPath, "utf8");
             let checkedCount = 0;
-            for (const criterionText of metCriteria) {
-              // Match the checkbox line containing this criterion text (fuzzy: trim whitespace)
-              const escaped = criterionText.replace(/[.*+?^${}()|[\]\\]/g, "\\$&").trim();
-              const re = new RegExp(`- \\[ \\] ${escaped}`);
-              if (re.test(missionContent)) {
-                missionContent = missionContent.replace(re, `- [x] ${criterionText.trim()}`);
-                checkedCount++;
+            // Index-based update: find the Nth checkbox and check it
+            if (metIndices.length > 0) {
+              const lines = missionContent.split("\n");
+              let checkboxIdx = 0;
+              for (let i = 0; i < lines.length; i++) {
+                if (/^- \[ \] /.test(lines[i])) {
+                  checkboxIdx++;
+                  if (metIndices.includes(checkboxIdx)) {
+                    lines[i] = lines[i].replace(/^- \[ \] /, "- [x] ");
+                    checkedCount++;
+                  }
+                }
               }
+              missionContent = lines.join("\n");
             }
+            // Text-based update (fallback for backwards compatibility)
+            if (checkedCount === 0 && metCriteria.length > 0) {
+              for (const criterionText of metCriteria) {
+                const escaped = criterionText.replace(/[.*+?^${}()|[\]\\]/g, "\\$&").trim();
+                const re = new RegExp(`- \\[ \\] ${escaped}`);
+                if (re.test(missionContent)) {
+                  missionContent = missionContent.replace(re, `- [x] ${criterionText.trim()}`);
+                  checkedCount++;
+                }
+              }
+            }
             if (checkedCount > 0) {
               writeFileSync(missionPath, missionContent, "utf8");
               core.info(`Updated ${checkedCount} acceptance criteria checkboxes in ${missionPath}`);
@@ -209,7 +260,7 @@ export async function implementationReview(context) {
           }
         }
-        return { textResultForLlm: `Review recorded: ${elements?.length || 0} elements traced, ${gaps?.length || 0} gaps found, ${metCriteria.length} criteria checked` };
+        return { textResultForLlm: `Review recorded: ${elements?.length || 0} elements traced, ${gaps?.length || 0} gaps found, ${totalUpdated} criteria checked` };
       },
     });

package/src/actions/agentic-step/tasks/maintain-features.js CHANGED Viewed

@@ -87,6 +87,11 @@ export async function maintainFeatures(context) {
     `2. If there are fewer than ${featureLimit} features, create new features aligned with the mission.`,
     "3. Ensure each feature has clear, testable acceptance criteria.",
     "",
+    `## Focus Mode: ${config.focus === "maintenance" ? "MAINTENANCE" : "MISSION"}`,
+    config.focus === "maintenance"
+      ? "The mission is substantially complete. Generate maintenance-oriented features: refactoring, test coverage improvement, documentation, performance optimisation. Do not create mission-gap features."
+      : "Create features that advance the mission toward completion. Focus on unimplemented capabilities and gaps.",
+    "",
     formatPathsSection(writablePaths, config.readOnlyPaths, config),
     "",
     "## Constraints",

package/src/actions/agentic-step/tasks/review-issue.js CHANGED Viewed

@@ -237,8 +237,9 @@ export async function reviewIssue(context) {
     return reviewSingleIssue({ octokit, repo, config, targetIssueNumber: issueNumber, instructions, model, tuning: t, logFilePath, screenshotFilePath });
   }
-  // Batch mode: find up to 3 unreviewed issues
-  const issueNumbers = await findUnreviewedIssues(octokit, repo, 3);
+  // Batch mode: find unreviewed issues (cap from config, default 3)
+  const reviewCap = config.reviewIssuesCap ?? 3;
+  const issueNumbers = await findUnreviewedIssues(octokit, repo, reviewCap);
   if (issueNumbers.length === 0) {
     return { outcome: "nop", details: "No open automated issues to review" };
   }
@@ -248,7 +249,17 @@ export async function reviewIssue(context) {
   let totalInputTokens = 0;
   let totalOutputTokens = 0;
+  // W19: Remaining-time guard — work within the 10-minute step timeout
+  const STEP_TIMEOUT_MS = 10 * 60 * 1000;
+  const MIN_REMAINING_MS = 4 * 60 * 1000; // need at least 4 min for a review
+  const batchStart = Date.now();
   for (const num of issueNumbers) {
+    const elapsed = Date.now() - batchStart;
+    if (elapsed + MIN_REMAINING_MS > STEP_TIMEOUT_MS) {
+      core.warning(`Skipping issue #${num} — only ${Math.round((STEP_TIMEOUT_MS - elapsed) / 1000)}s remaining (need ${MIN_REMAINING_MS / 1000}s). Reviewed ${results.length}/${issueNumbers.length} issues.`);
+      break;
+    }
     core.info(`Batch reviewing issue #${num} (${results.length + 1}/${issueNumbers.length})`);
     const result = await reviewSingleIssue({
       octokit, repo, config, targetIssueNumber: num, instructions, model, tuning: t, logFilePath, screenshotFilePath,

package/src/actions/agentic-step/tasks/transform.js CHANGED Viewed

@@ -215,6 +215,11 @@ export async function transform(context) {
       })()),
     ] : []),
     "",
+    `## Focus Mode: ${config.focus === "maintenance" ? "MAINTENANCE" : "MISSION"}`,
+    config.focus === "maintenance"
+      ? "The mission is substantially complete. Focus on adding value to the existing codebase: improve test coverage, refactor for clarity, improve documentation, optimise performance. Do not create new feature issues or push for mission-complete."
+      : "Work toward completing the mission. Implement missing capabilities, resolve gaps, and advance toward mission completion.",
+    "",
     "## Your Task",
     "Analyze the mission and open issues (use list_issues tool).",
     "Read the source files you need (use read_file tool).",
@@ -332,6 +337,19 @@ export async function transform(context) {
   const sessionDurationMs = Date.now() - sessionStartTime;
   core.info(`Transform session completed in ${Math.round(sessionDurationMs / 1000)}s (${result.tokensIn + result.tokensOut} tokens, maxToolCalls=${maxToolCalls})`);
+  // W15: Post-transform lockfile sync — if package.json was modified, regenerate lockfile
+  try {
+    const { execSync } = await import("child_process");
+    const gitDiff = execSync("git diff --name-only HEAD", { encoding: "utf8", timeout: 10000 }).trim();
+    if (gitDiff.split("\n").some(f => f.endsWith("package.json"))) {
+      core.info("package.json changed during transform — syncing lockfile");
+      execSync("npm install --package-lock-only", { encoding: "utf8", timeout: 60000, stdio: "pipe" });
+      core.info("Lockfile synced successfully");
+    }
+  } catch (err) {
+    core.warning(`Post-transform lockfile sync failed: ${err.message}`);
+  }
   // Detect mission-complete hint
   const lowerResult = (result.agentMessage || "").toLowerCase();
   if (lowerResult.includes("mission is satisfied") || lowerResult.includes("mission is complete") || lowerResult.includes("no changes needed")) {

package/src/copilot/config.js CHANGED Viewed

@@ -260,16 +260,29 @@ export function loadConfig(configPath) {
     minBranchCoverage: goals["min-branch-coverage"] ?? 30,
   };
-  // Mission-complete thresholds (with safe defaults)
+  // Mission-complete thresholds (with safe defaults from profile)
   // C6: Removed minDedicatedTests and requireDedicatedTests
   const mc = toml["mission-complete"] || {};
+  const activeProfile = profilesSection[tuning.profileName] || {};
   const missionCompleteThresholds = {
-    minResolvedIssues: mc["min-resolved-issues"] ?? 3,
-    maxSourceTodos: mc["max-source-todos"] ?? 0,
+    minResolvedIssues: mc["min-resolved-issues"] ?? activeProfile["min-resolved-issues"] ?? 1,
+    maxSourceTodos: mc["max-source-todos"] ?? activeProfile["max-source-todos"] ?? 0,
+    acceptanceCriteriaThreshold: mc["acceptance-criteria-threshold"] ?? activeProfile["acceptance-criteria-threshold"] ?? 50,
+    minCumulativeTransforms: mc["min-cumulative-transforms"] ?? activeProfile["min-cumulative-transforms"] ?? 1,
+    requireNoOpenIssues: mc["require-no-open-issues"] ?? true,
+    requireNoOpenPrs: mc["require-no-open-prs"] ?? true,
+    requireNoCriticalGaps: mc["require-no-critical-gaps"] ?? true,
   };
+  // Review issues cap (from limits, with profile fallback)
+  const reviewIssuesCap = limitsSection["review-issues-cap"] ?? activeProfile["review-issues-cap"] ?? 3;
+  // Schedule focus
+  const focus = toml.schedule?.focus || "mission";
   return {
     supervisor: toml.schedule?.supervisor || "daily",
+    focus,
     model: toml.tuning?.model || toml.schedule?.model || "gpt-5-mini",
     tuning,
     paths,
@@ -288,6 +301,7 @@ export function loadConfig(configPath) {
     init: toml.init || null,
     tdd: toml.tdd === true,
     missionCompleteThresholds,
+    reviewIssuesCap,
     coverageGoals,
     maxTokensPerMaintain: resolvedLimits.maxTokensPerMaintain || 200000,
     writablePaths,

package/src/copilot/telemetry.js CHANGED Viewed

@@ -70,6 +70,23 @@ export function countSourceLines(dir) {
  * @returns {{ met: number, total: number }}
  */
 export function countAcceptanceCriteria(missionPath) {
+  // W17: Try structured TOML first (primary source)
+  try {
+    const tomlPath = "agentic-lib.toml";
+    if (existsSync(tomlPath)) {
+      const toml = readFileSync(tomlPath, "utf8");
+      if (toml.includes("[acceptance-criteria]")) {
+        const totalMatch = toml.match(/^\s*total\s*=\s*(\d+)/m);
+        if (totalMatch) {
+          const total = parseInt(totalMatch[1], 10);
+          const metMatches = toml.match(/met\s*=\s*true/g) || [];
+          return { met: metMatches.length, total };
+        }
+      }
+    }
+  } catch { /* fall through to MISSION.md */ }
+  // Fallback: count checkboxes in MISSION.md
   if (!missionPath || !existsSync(missionPath)) return { met: 0, total: 0 };
   try {
     const content = readFileSync(missionPath, "utf8");
@@ -112,7 +129,7 @@ export function buildMissionMetrics(config, result, _limitsStatus, cumulativeCos
   const todoCount = countSourceTodos(srcRoot);
   const thresholds = config.missionCompleteThresholds || {};
-  const minResolved = thresholds.minResolvedIssues ?? 3;
+  const minResolved = thresholds.minResolvedIssues ?? 1;
   const maxTodos = thresholds.maxSourceTodos ?? 0;
   // C6: Dynamic metrics

package/src/seeds/zero-MISSION.md CHANGED Viewed

@@ -1,26 +1,26 @@
 # Mission
-A JavaScript library for computing Hamming distances — between equal-length strings (character positions that differ) and between non-negative integers (differing bits).
+A JavaScript library exporting FizzBuzz functions. This is the simplest possible mission — if the pipeline can't complete this and stop, something is fundamentally broken.
-## Required Capabilities
+## Core Functions
-- Compute the Hamming distance between two strings of equal length.
-- Compute the Hamming distance between two non-negative integers by counting differing bits.
-- Handle Unicode strings correctly (compare code points, not UTF-16 code units).
-- Validate inputs: throw `TypeError` for non-string/non-integer arguments, `RangeError` for unequal-length strings or negative integers.
+- `fizzBuzz(n)` — return an array of strings from 1 to n, replacing multiples of 3 with "Fizz", multiples of 5 with "Buzz", and multiples of both with "FizzBuzz".
+- `fizzBuzzSingle(n)` — return the FizzBuzz string for a single positive integer.
 ## Requirements
-- Export all public API as named exports from `src/lib/main.js`.
-- Comprehensive unit tests covering normal cases, edge cases (empty strings, zero, large integers), and error cases.
-- README with usage examples and API documentation.
+- Handle edge cases: `n = 0` returns an empty array, negative numbers throw `RangeError`, non-integers throw `TypeError`.
+- Export both functions as named exports from `src/lib/main.js`.
+- Comprehensive unit tests covering normal operation and all edge cases.
+- README with usage examples.
 ## Acceptance Criteria
-- [ ] Hamming distance between `"karolin"` and `"kathrin"` is `3`
-- [ ] Hamming distance between `""` and `""` is `0`
-- [ ] Hamming distance between strings of different lengths throws `RangeError`
-- [ ] Bit-level Hamming distance between `1` and `4` is `2` (binary: 001 vs 100)
-- [ ] Bit-level Hamming distance between `0` and `0` is `0`
+- [ ] `fizzBuzz(15)` returns the correct 15-element array ending with "FizzBuzz"
+- [ ] `fizzBuzzSingle(3)` returns "Fizz"
+- [ ] `fizzBuzzSingle(5)` returns "Buzz"
+- [ ] `fizzBuzzSingle(15)` returns "FizzBuzz"
+- [ ] `fizzBuzzSingle(7)` returns "7"
+- [ ] `fizzBuzz(0)` returns `[]`
 - [ ] All unit tests pass
 - [ ] README documents usage with examples