npm - wogiflow - Versions diffs - 2.32.0 → 2.34.1 - Mend

wogiflow 2.32.0 → 2.34.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

package/.claude/docs/claude-code-compatibility.md +51 -0
package/.claude/docs/scheduled-mode.md +213 -0
package/.claude/docs/skill-portability.md +190 -0
package/.claude/rules/alternative-hook-args-exec-form.md +6 -0
package/.claude/settings.json +2 -1
package/.claude/skills/_template/skill.md +1 -0
package/.claude/skills/conventional-commit/knowledge/examples.md +65 -0
package/.claude/skills/conventional-commit/skill.md +76 -0
package/bin/flow +16 -0
package/lib/scheduled-mode.js +374 -0
package/lib/skill-export-agentskills.js +211 -0
package/lib/skill-export-claude-plugin.js +183 -0
package/lib/skill-portability.js +342 -0
package/lib/skill-registry.js +32 -2
package/lib/workspace-channel-server.js +106 -3
package/lib/workspace-channel-tracking.js +102 -1
package/lib/workspace-dispatch-tracking.js +28 -0
package/lib/workspace-messages.js +32 -4
package/lib/workspace-subtask-state.js +215 -0
package/lib/workspace.js +81 -0
package/package.json +2 -2
package/scripts/flow +25 -0
package/scripts/flow-config-defaults.js +20 -0
package/scripts/flow-constants.js +3 -1
package/scripts/flow-schedule.js +486 -0
package/scripts/flow-scheduled-runner.js +659 -0
package/scripts/flow-skill-export.js +334 -0
package/scripts/flow-standards-checker.js +37 -0
package/scripts/hooks/adapters/claude-code.js +18 -3
package/scripts/hooks/core/git-safety-gate.js +118 -27
package/scripts/hooks/core/long-input-enforcement.js +139 -4
package/scripts/hooks/core/overdue-dispatches.js +28 -6
package/scripts/hooks/core/session-start-worker.js +52 -0
package/scripts/hooks/core/stop-orchestrator.js +17 -2
package/scripts/hooks/core/validation.js +8 -0
package/scripts/hooks/core/worker-continuation-gate.js +326 -0
package/scripts/hooks/core/workspace-stop-gates.js +21 -0
package/scripts/hooks/core/workspace-stop-notify.js +174 -59
package/scripts/hooks/entry/claude-code/post-tool-use.js +26 -0

package/scripts/hooks/core/long-input-enforcement.js CHANGED Viewed

@@ -71,6 +71,83 @@ const SOURCE_LINK_PATTERNS = [
   /\bwf-[a-f0-9]{8}\b/i  // bare wf-ID reference
 ];
+/**
+ * Strip quoted/pasted content from a prompt so item + line counts reflect
+ * what the USER is actually requesting, not what they're illustrating.
+ *
+ * Removes:
+ *   - Fenced code blocks (``` … ```) — pasted code or transcript output
+ *   - Lines starting with `⏺` — pasted Claude Code transcript bullet
+ *   - Lines starting with `  ⎿ ` — pasted Claude Code tool-result indent
+ *   - Lines starting with `>` (markdown blockquote, indented or not) — quoted source
+ *   - Indented blocks of 4+ leading spaces directly after a fence-less line
+ *     (informal code-block convention — git diff output, REPL traces, etc.)
+ *
+ * Conservative: only strips when stripping changes the count classification —
+ * downstream callers compare strip vs. raw and use the lower count if it crosses
+ * the threshold. (Tested directly via the helper export; the classifier wires
+ * it into both detectLongFormPrompt and hasTaskSignals.)
+ *
+ * Why this matters: the current turn's user prompt was a short narrative + a
+ * ~70-line PASTED transcript inside a fenced block. The raw line count crossed
+ * the threshold, the imperatives inside the transcript ("fix", "add", "rm")
+ * crossed the task-signal threshold, and the gate fired — even though the user
+ * pasted the transcript to ILLUSTRATE a bug, not to deliver work items.
+ *
+ * @param {string} text
+ * @returns {string} stripped text (always a string; '' if input wasn't)
+ */
+function stripQuotedContent(text) {
+  if (typeof text !== 'string') return '';
+  // 1. Strip fenced code blocks (greedy, but match per-block so unclosed
+  //    fences don't eat the rest of the prompt).
+  let stripped = text.replace(/^```[^\n]*\n[\s\S]*?\n```\s*$/gm, '');
+  // 2. Strip pasted-transcript / blockquote lines.
+  const lines = stripped.split('\n');
+  const kept = [];
+  for (const line of lines) {
+    // ⏺ — Claude Code transcript bullet
+    if (/^\s*⏺/.test(line)) continue;
+    // ⎿ — Claude Code tool-result continuation marker
+    if (/^\s*⎿/.test(line)) continue;
+    // > — markdown blockquote (any indent level)
+    if (/^\s*>/.test(line)) continue;
+    // 4+ leading-space "code-by-indentation" lines that don't look like
+    // a markdown list item (those start with `- ` / `* ` / `N. ` AFTER spaces).
+    if (/^ {4,}\S/.test(line) && !/^\s*(?:[-*]|\d+[.)])\s+/.test(line)) continue;
+    kept.push(line);
+  }
+  return kept.join('\n');
+}
+/**
+ * Detect a Claude Code skill-body echo. When the AI calls `Skill(...)`, the
+ * harness surfaces the full skill prompt + args back as a "user message" via
+ * UserPromptSubmit. These are AI-composed, not user-typed; firing the gate
+ * on them creates a deadlock (the AI can't dismiss its own skill args, and
+ * extract-review needs Bash which is also gated).
+ *
+ * Detection: the prompt contains ≥2 structural markers that only appear in
+ * Claude Code skill bodies (heading hierarchies, "ARGUMENTS: {args}" template,
+ * etc.). These are exceedingly unlikely to appear in user-typed prose.
+ *
+ * @param {string} text
+ * @returns {boolean}
+ */
+function isSkillBodyEcho(text) {
+  if (typeof text !== 'string' || text.length < 500) return false;
+  let hits = 0;
+  for (const marker of SKILL_BODY_MARKERS) {
+    if (text.includes(marker)) {
+      hits++;
+      if (hits >= 2) return true;
+    }
+  }
+  return false;
+}
 function countDiscreteItems(text) {
   if (typeof text !== 'string') return 0;
   let count = 0;
@@ -83,9 +160,12 @@ function countDiscreteItems(text) {
 function detectLongFormPrompt(text) {
   if (typeof text !== 'string' || !text.trim()) return false;
-  const lineCount = text.split('\n').filter(l => l.trim()).length;
+  // Strip quoted/pasted content before counting — only the USER's own words
+  // contribute to thresholds (otherwise the gate fires on illustrative pastes).
+  const stripped = stripQuotedContent(text);
+  const lineCount = stripped.split('\n').filter(l => l.trim()).length;
   if (lineCount > LONG_LINE_THRESHOLD) return true;
-  if (countDiscreteItems(text) >= LONG_ITEM_THRESHOLD) return true;
+  if (countDiscreteItems(stripped) >= LONG_ITEM_THRESHOLD) return true;
   return false;
 }
@@ -116,6 +196,27 @@ const SYSTEM_CONTENT_PREFIXES = [
   '<bash-stderr>'
 ];
+// Skill-body markers that indicate the prompt is a Claude Code skill body
+// being echoed back to the model after an AI Skill(...) invocation. When
+// the AI calls `Skill(skill="wogi-start", args="...long...")`, Claude Code
+// surfaces the full skill prompt + args as the next "user message" — going
+// through UserPromptSubmit. The args are AI-composed, not user-typed, so
+// the gate must NOT fire on them. We detect this by the structural markers
+// that only ever appear in skill body bodies (not in regular user prose).
+// Treating it as a user prompt was the deadlock shape from the wogiflow-cli
+// 2026-05-13 incident — see the bug report transcript in this commit's body.
+const SKILL_BODY_MARKERS = [
+  '**UNIVERSAL ENTRY POINT**',
+  '## Request Triage (AI-Driven Routing',
+  '### Command Catalog',
+  '### Pre-Routing Checks (Automatic)',
+  'Routing order: Task ID',
+  '## Phase Execution (MANDATORY)',
+  '## Mandatory Rules',
+  'ARGUMENTS: {args}',
+  '## How It Works (MANDATORY',
+];
 /**
  * Detect content that originates from the system (tool results, sub-agent
  * notifications, slash-command framings) rather than user typing. These
@@ -137,9 +238,14 @@ function isSystemOriginatedContent(text) {
 function hasTaskSignals(text) {
   if (typeof text !== 'string') return false;
+  // Imperatives inside pasted code/transcript/blockquotes are illustrative,
+  // not the user's own work-creating instructions. Count only on the USER's
+  // own words. (Without this, pasted error logs containing "fix" / "add"
+  // / "remove" trip the gate as if the user were ordering 5 tasks.)
+  const stripped = stripQuotedContent(text);
   let imperativeHits = 0;
   for (const re of TASK_IMPERATIVES) {
-    const m = text.match(new RegExp(re.source, 'gi'));
+    const m = stripped.match(new RegExp(re.source, 'gi'));
     if (m) imperativeHits += m.length;
   }
   return imperativeHits >= 2;
@@ -176,6 +282,13 @@ function shouldForceExtractReview({ text, source, env = process.env } = {}) {
   if (isSystemOriginatedContent(text)) {
     return { forced: false, level: 'pass', reason: 'system-originated-content' };
   }
+  // Deadlock fix (2026-05-13): AI-composed Skill args get surfaced back as
+  // a "user message" by the harness. Detect the skill-body echo signature
+  // and skip the gate — the args are AI-decomposed, not user-typed, so
+  // item-reconciliation has no source to reconcile against.
+  if (isSkillBodyEcho(text)) {
+    return { forced: false, level: 'pass', reason: 'skill-body-echo' };
+  }
   if (!detectLongFormPrompt(text)) {
     return { forced: false, level: 'pass', reason: 'below-long-input-threshold' };
   }
@@ -308,6 +421,20 @@ function checkLongInputPendingGate(toolName, toolInput) {
     if (/flow\s+extract-zero-loss/.test(cmd)) return { blocked: false };
     if (/flow\s+long-input/.test(cmd)) return { blocked: false };
     if (/flow-source-fidelity\.js/.test(cmd)) return { blocked: false };
+    // EMERGENCY ESCAPE (2026-05-13 deadlock fix): when the `flow` CLI is
+    // unavailable (e.g., target project has no node_modules/wogiflow on PATH,
+    // or the CLI itself is broken), allow the user to manually clear the
+    // marker file via `rm`. Scoped narrowly to the exact marker path so it
+    // can't be used as a general-purpose Bash escape.
+    if (/^\s*rm\s+(?:-[a-zA-Z]+\s+)?(?:["']?)\.workflow\/state\/long-input-pending\.json(?:["']?)\s*$/.test(cmd)) {
+      return { blocked: false };
+    }
+    // Also allow the node-script equivalent (for sessions where `rm` is
+    // unavailable, e.g. some Windows shells). Matches both `fs.unlinkSync(...)`
+    // and `require('fs').unlinkSync(...)` forms.
+    if (/unlinkSync\s*\(\s*['"]\.workflow\/state\/long-input-pending\.json['"]\s*\)/.test(cmd)) {
+      return { blocked: false };
+    }
     // Falls through to block for everything else
   }
@@ -334,6 +461,11 @@ function checkLongInputPendingGate(toolName, toolInput) {
       '  2. (ESCAPE HATCH) If this prompt genuinely does NOT create work',
       '     (e.g., it\'s a log dump or pure question), dismiss with:',
       '     `flow long-input-pending dismiss --reason="<concrete reason>"`',
+      '  3. (EMERGENCY) If both paths above fail (e.g., `flow` CLI missing',
+      '     or broken), manually clear the marker file:',
+      '     `rm .workflow/state/long-input-pending.json`',
+      '     (This Bash command is explicitly allowed by the gate as a',
+      '     deadlock escape.)',
       '',
       'Read/Glob/Grep tools remain available for investigation.'
     ].join('\n')
@@ -345,10 +477,12 @@ module.exports = {
   LONG_LINE_THRESHOLD,
   LONG_ITEM_THRESHOLD,
   SYSTEM_CONTENT_PREFIXES,
+  SKILL_BODY_MARKERS,
   detectLongFormPrompt,
   hasSourceLink,
   hasTaskSignals,
   isSystemOriginatedContent,
+  isSkillBodyEcho,
   isChannelDispatchInWorker,
   shouldForceExtractReview,
   buildEnforcementMessage,
@@ -357,5 +491,6 @@ module.exports = {
   isLongInputPending,
   readLongInputPending,
   checkLongInputPendingGate,
-  countDiscreteItems
+  countDiscreteItems,
+  stripQuotedContent
 };

package/scripts/hooks/core/overdue-dispatches.js CHANGED Viewed

@@ -53,7 +53,7 @@ function formatLine(record, now) {
  */
 function sweepAndReconcile(workspaceRoot) {
   let reconciled = 0;
-  let readMessages, reconcileDispatch, readDispatches;
+  let readMessages, reconcileDispatch, readDispatches, refreshDispatchDeadline;
   try {
     const libMessages = path.resolve(__dirname, '..', '..', '..', 'lib', 'workspace-messages.js');
     const libTracking = path.resolve(__dirname, '..', '..', '..', 'lib', 'workspace-dispatch-tracking.js');
@@ -61,6 +61,7 @@ function sweepAndReconcile(workspaceRoot) {
     const tracking = require(libTracking);
     reconcileDispatch = tracking.reconcileDispatch;
     readDispatches = tracking.readDispatches;
+    refreshDispatchDeadline = tracking.refreshDispatchDeadline;
   } catch (_err) {
     return 0; // Fail-open
   }
@@ -78,13 +79,32 @@ function sweepAndReconcile(workspaceRoot) {
     if (r.taskId && !byTaskId.has(r.taskId)) byTaskId.set(r.taskId, r);
   }
-  // Pull both message types. readMessages throws on missing dir internally
-  // but guards with existsSync, so it's safe.
+  // S3 (wf-d3ae1717): heartbeats refresh the deadline (work ongoing, NOT a
+  // silent halt); terminal types resolve the dispatch. worker-progress is
+  // applied FIRST so a heartbeat that arrived before a terminal doesn't keep a
+  // since-resolved dispatch alive.
+  try {
+    const heartbeats = readMessages(workspaceRoot, { type: 'worker-progress' });
+    if (refreshDispatchDeadline) {
+      for (const hb of heartbeats) {
+        const taskId = hb.taskId;
+        if (!taskId || !byTaskId.has(taskId)) continue;
+        try { refreshDispatchDeadline(workspaceRoot, taskId); } catch (_err) { /* per-record */ }
+      }
+    }
+  } catch (_err) { /* heartbeats are best-effort */ }
+  // Pull terminal message types. readMessages throws on missing dir internally
+  // but guards with existsSync, so it's safe. worker-blocked / worker-idle /
+  // worker-awaiting-approval are terminal stops alongside the legacy pair.
   let messages = [];
   try {
     const completes = readMessages(workspaceRoot, { type: 'task-complete' });
     const stops = readMessages(workspaceRoot, { type: 'worker-stopped' });
-    messages = completes.concat(stops);
+    const blocked = readMessages(workspaceRoot, { type: 'worker-blocked' });
+    const idle = readMessages(workspaceRoot, { type: 'worker-idle' });
+    const awaiting = readMessages(workspaceRoot, { type: 'worker-awaiting-approval' });
+    messages = completes.concat(stops, blocked, idle, awaiting);
   } catch (_err) {
     return 0;
   }
@@ -93,8 +113,10 @@ function sweepAndReconcile(workspaceRoot) {
     const taskId = msg.taskId || (msg.type === 'task-complete' ? msg.subject : null);
     if (!taskId || !byTaskId.has(taskId)) continue;
     try {
-      const status = msg.type === 'worker-stopped' ? 'graceful-stop' : 'completed';
-      const reason = msg.type === 'worker-stopped' ? (msg.reason || 'graceful') : null;
+      // task-complete → completed; everything else is a non-overdue graceful
+      // stop (the reason field distinguishes blocked / awaiting / idle / graceful).
+      const status = msg.type === 'task-complete' ? 'completed' : 'graceful-stop';
+      const reason = msg.type === 'task-complete' ? null : (msg.reason || msg.type);
       const result = reconcileDispatch(workspaceRoot, taskId, status, reason);
       if (result) {
         reconciled++;

package/scripts/hooks/core/session-start-worker.js CHANGED Viewed

@@ -40,6 +40,58 @@ function handleWorkerSessionStart() {
     const { isWorker, shouldAnnounceReady, announceWorkerReady } = require(WORKER_READY_LIB);
     if (!isWorker()) return { branch: 'skip', reason: 'not-worker' };
+    // S5 (wf-ee87a24e): RESUME-IN-PROGRESS. If this restarted session has a task
+    // still in `inProgress` with sub-tasks remaining (durable S1 ledger), resume
+    // THAT task — do NOT fall through to "announce idle" (which would orphan it)
+    // or pick a different next task. The durable ledger means completed sub-tasks
+    // are NOT redone. Also post a worker-ready ack so the manager actively
+    // re-triggers if the resume wake-up was missed.
+    try {
+      const { PATHS, safeJsonParse } = require('../../flow-utils');
+      const ready = safeJsonParse(path.join(PATHS.state, 'ready.json'), { inProgress: [] });
+      const inProgress = (ready.inProgress || [])[0] || null;
+      if (inProgress && inProgress.id) {
+        let remaining = null, total = null;
+        try {
+          const subtaskState = require(path.join(__dirname, '..', '..', '..', 'lib', 'workspace-subtask-state.js'));
+          const summary = subtaskState.summary(inProgress.id);
+          remaining = summary.remaining; total = summary.total;
+        } catch (_err) { /* ledger optional */ }
+        // Only treat as resumable if there is remaining decomposed work, OR no
+        // ledger exists at all (single-step task interrupted mid-flight).
+        if (remaining === null || remaining > 0) {
+          // Best-effort ack so the manager knows the worker is back on this task.
+          // Bypass shouldAnnounceReady's empty-queue gating (it returns
+          // 'in-progress-not-empty' here by design) — for a resume we WANT the
+          // manager pinged. announceWorkerReady dedups via hasPendingAnnounce.
+          try {
+            const wr = require(WORKER_READY_LIB);
+            const wsRoot = process.env.WOGI_WORKSPACE_ROOT;
+            const repoName = process.env.WOGI_REPO_NAME;
+            if (wsRoot && repoName && repoName !== 'manager') {
+              wr.announceWorkerReady(wsRoot, repoName);
+            }
+          } catch (_err) { /* ack is best-effort */ }
+          const ctx = [
+            `⚡ WORKSPACE SESSION START — RESUMING IN-PROGRESS TASK`,
+            '',
+            `This worker restarted with task ${inProgress.id} still in progress${total != null ? ` (${remaining} of ${total} sub-task(s) remaining)` : ''}.`,
+            `Durable sub-task state is on disk — completed sub-tasks are recorded and must NOT be redone.`,
+            '',
+            'AUTONOMOUS MODE CONTRACT (workspace worker):',
+            '  • Resume the SAME task — do not pick a different one, do not go idle.',
+            '  • Read .workflow/state/subtask-state.json to see which sub-tasks remain.',
+            '  • Grind to completion; only stop when done (flow done) or genuinely blocked.',
+            '',
+            `ACT NOW: Invoke Skill(skill="wogi-start", args="${inProgress.id}")`
+          ].join('\n');
+          return { branch: 'resume-in-progress', context: ctx, taskId: inProgress.id, remaining, total };
+        }
+      }
+    } catch (err) {
+      if (process.env.DEBUG) console.error(`[session-start-worker] resume-in-progress check failed (fail-open): ${err.message}`);
+    }
     // Check for queued work first — if any, tell the model to pick it up
     // instead of announcing idle readiness.
     let pickup;

package/scripts/hooks/core/stop-orchestrator.js CHANGED Viewed

@@ -87,8 +87,12 @@ async function orchestrateStop({ parsedInput }) {
     };
   }
+  // S3 (wf-d3ae1717): the worker-stopped emission used to fire HERE,
+  // unconditionally, before any gate decided to continue — so the manager saw
+  // "stopped mid-work" on every turn boundary. It now fires only at a genuine
+  // stop (end of this function) with a precise terminal type, and a
+  // worker-progress heartbeat fires from the continuation gate instead.
   const workspaceNotify = require('./workspace-stop-notify');
-  await workspaceNotify.notifyWorkerStopped();
   const restartCoordinator = require('./task-boundary-restart-coordinator');
   const restartResult = await restartCoordinator.handleTaskBoundaryRestart({ parsedInput });
@@ -120,7 +124,18 @@ async function orchestrateStop({ parsedInput }) {
   const wsResult = await workspaceGates.checkWorkspaceStopGates({ parsedInput });
   if (wsResult?.shouldReturn) return wsResult.result;
-  return await checkLoopExit();
+  // Genuine stop path: no gate forced continuation. Emit a precise terminal
+  // worker signal ONLY when we're actually allowing the turn to end (canExit).
+  // continueToNext / blocked-continue are not terminal stops.
+  const loopResult = await checkLoopExit();
+  try {
+    if (loopResult?.canExit === true) {
+      await workspaceNotify.notifyWorkerTerminal();
+    }
+  } catch (err) {
+    if (process.env.DEBUG) console.error(`[Stop] terminal notify error (fail-open): ${err.message}`);
+  }
+  return loopResult;
 }
 module.exports = { orchestrateStop };

package/scripts/hooks/core/validation.js CHANGED Viewed

@@ -222,6 +222,14 @@ async function runValidation(options = {}) {
   return {
     passed: allPassed,
+    // F6 (R-379): signal `blocked` so the adapter's `decision: 'block'` path
+    // actually fires when validation fails. Without this, the `continueOnBlock`
+    // wiring in transformPostToolUse is inert (decision is always undefined).
+    // With it, lint/typecheck failure after Edit/Write feeds back to Claude
+    // and (per the continueOnBlock setting) the turn continues so Claude can
+    // fix the error in-loop — which is what CLAUDE.md's "validate after every
+    // file edit" rule needs.
+    blocked: !allPassed,
     skipped: false,
     results,
     summary: generateValidationSummary(results, filePath)