npm - wogiflow - Versions diffs - 2.32.0 → 2.33.0 - Mend

wogiflow 2.32.0 → 2.33.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

package/.claude/docs/claude-code-compatibility.md +51 -0
package/.claude/docs/scheduled-mode.md +213 -0
package/.claude/docs/skill-portability.md +190 -0
package/.claude/rules/alternative-hook-args-exec-form.md +6 -0
package/.claude/settings.json +2 -1
package/.claude/skills/_template/skill.md +1 -0
package/.claude/skills/conventional-commit/knowledge/examples.md +65 -0
package/.claude/skills/conventional-commit/skill.md +76 -0
package/bin/flow +16 -0
package/lib/scheduled-mode.js +377 -0
package/lib/skill-export-agentskills.js +211 -0
package/lib/skill-export-claude-plugin.js +143 -0
package/lib/skill-portability.js +324 -0
package/lib/skill-registry.js +32 -2
package/package.json +2 -2
package/scripts/flow +8 -0
package/scripts/flow-config-defaults.js +20 -0
package/scripts/flow-schedule.js +469 -0
package/scripts/flow-scheduled-runner.js +614 -0
package/scripts/flow-skill-export.js +334 -0
package/scripts/hooks/adapters/claude-code.js +12 -1
package/scripts/hooks/core/git-safety-gate.js +92 -20
package/scripts/hooks/core/long-input-enforcement.js +139 -4

package/scripts/hooks/core/long-input-enforcement.js CHANGED Viewed

@@ -71,6 +71,83 @@ const SOURCE_LINK_PATTERNS = [
   /\bwf-[a-f0-9]{8}\b/i  // bare wf-ID reference
 ];
+/**
+ * Strip quoted/pasted content from a prompt so item + line counts reflect
+ * what the USER is actually requesting, not what they're illustrating.
+ *
+ * Removes:
+ *   - Fenced code blocks (``` … ```) — pasted code or transcript output
+ *   - Lines starting with `⏺` (any indent) — pasted Claude Code transcript bullet
+ *   - Lines starting with `⎿` (any indent) — pasted Claude Code tool-result marker
+ *   - Lines starting with `>` (markdown blockquote, indented or not) — quoted source
+ *   - Lines indented by 4+ spaces, unless they look like a markdown list item
+ *     (informal code-block convention — git diff output, REPL traces, etc.)
+ *
+ * Stripping is unconditional: the helper always returns the stripped text and
+ * never compares it against the raw prompt. detectLongFormPrompt and
+ * hasTaskSignals both run their counts on the stripped result. (The helper is
+ * also exported from this module so it can be exercised directly.)
+ *
+ * Why this matters: the prompt that motivated this change was a short
+ * narrative + a ~70-line PASTED transcript inside a fenced block. The raw line
+ * count crossed the threshold, the imperatives inside the transcript ("fix",
+ * "add", "rm") crossed the task-signal threshold, and the gate fired — even
+ * though the transcript was pasted to ILLUSTRATE a bug, not to deliver work.
+ *
+ * @param {string} text
+ * @returns {string} stripped text (always a string; '' if the input wasn't one)
+ */
+function stripQuotedContent(text) {
+  if (typeof text !== 'string') return '';
+  // 1. Strip fenced code blocks (non-greedy, so each block is matched on its
+  //    own; an opening fence with no closing fence after it is left in place).
+  let stripped = text.replace(/^```[^\n]*\n[\s\S]*?\n```\s*$/gm, '');
+  // 2. Drop pasted-transcript / blockquote / indented-code lines one by one.
+  const lines = stripped.split('\n');
+  const kept = [];
+  for (const line of lines) {
+    // ⏺ — Claude Code transcript bullet (optionally indented)
+    if (/^\s*⏺/.test(line)) continue;
+    // ⎿ — Claude Code tool-result continuation marker (optionally indented)
+    if (/^\s*⎿/.test(line)) continue;
+    // > — markdown blockquote (any indent level)
+    if (/^\s*>/.test(line)) continue;
+    // 4+ leading-space "code-by-indentation" lines that don't look like a
+    // markdown list item (`- ` / `* ` / `N. ` / `N) ` after the indent).
+    if (/^ {4,}\S/.test(line) && !/^\s*(?:[-*]|\d+[.)])\s+/.test(line)) continue;
+    kept.push(line);
+  }
+  return kept.join('\n');
+}
+/**
+ * Detect a Claude Code skill-body echo. When the AI calls `Skill(...)`, the
+ * harness surfaces the full skill prompt + args back as a "user message" via
+ * UserPromptSubmit. These are AI-composed, not user-typed; firing the gate
+ * on them creates a deadlock (the AI can't dismiss its own skill args, and
+ * extract-review needs Bash which is also gated).
+ *
+ * Detection: the prompt is at least 500 characters long AND contains ≥2
+ * distinct entries from SKILL_BODY_MARKERS (section headings, the
+ * "ARGUMENTS: {args}" template, etc.) — unlikely in user-typed prose.
+ *
+ * @param {string} text
+ * @returns {boolean} true when the text looks like an echoed skill body
+ */
+function isSkillBodyEcho(text) {
+  if (typeof text !== 'string' || text.length < 500) return false; // short or non-string input never qualifies
+  let hits = 0;
+  for (const marker of SKILL_BODY_MARKERS) {
+    if (text.includes(marker)) { // plain substring check; each marker counts at most once
+      hits++;
+      if (hits >= 2) return true; // two different markers are enough — stop scanning
+    }
+  }
+  return false;
+}
 function countDiscreteItems(text) {
   if (typeof text !== 'string') return 0;
   let count = 0;
@@ -83,9 +160,12 @@ function countDiscreteItems(text) {
 function detectLongFormPrompt(text) {
   if (typeof text !== 'string' || !text.trim()) return false;
-  const lineCount = text.split('\n').filter(l => l.trim()).length;
+  // Strip quoted/pasted content before counting, so only the USER's own words
+  // feed the line and item thresholds (else the gate fires on illustrative pastes).
+  const stripped = stripQuotedContent(text);
+  const lineCount = stripped.split('\n').filter(l => l.trim()).length; // non-blank lines only
   if (lineCount > LONG_LINE_THRESHOLD) return true;
-  if (countDiscreteItems(text) >= LONG_ITEM_THRESHOLD) return true;
+  if (countDiscreteItems(stripped) >= LONG_ITEM_THRESHOLD) return true;
   return false;
 }
@@ -116,6 +196,27 @@ const SYSTEM_CONTENT_PREFIXES = [
   '<bash-stderr>'
 ];
+// Skill-body markers that indicate the prompt is a Claude Code skill body
+// being echoed back to the model after an AI Skill(...) invocation. When
+// the AI calls `Skill(skill="wogi-start", args="...long...")`, Claude Code
+// surfaces the full skill prompt + args as the next "user message", which
+// then goes through UserPromptSubmit. The args are AI-composed, not
+// user-typed, so the gate must NOT fire on them. We detect this by structural
+// markers that are expected only in skill bodies (not in regular user prose).
+// Treating it as a user prompt was the deadlock shape from the wogiflow-cli
+// 2026-05-13 incident — see the bug report transcript in this commit's body.
+const SKILL_BODY_MARKERS = [
+  '**UNIVERSAL ENTRY POINT**',
+  '## Request Triage (AI-Driven Routing',
+  '### Command Catalog',
+  '### Pre-Routing Checks (Automatic)',
+  'Routing order: Task ID',
+  '## Phase Execution (MANDATORY)',
+  '## Mandatory Rules',
+  'ARGUMENTS: {args}',
+  '## How It Works (MANDATORY',
+];
 /**
  * Detect content that originates from the system (tool results, sub-agent
  * notifications, slash-command framings) rather than user typing. These
@@ -137,9 +238,14 @@ function isSystemOriginatedContent(text) {
 function hasTaskSignals(text) {
   if (typeof text !== 'string') return false;
+  // Imperatives inside pasted code/transcript/blockquotes are illustrative,
+  // not the user's own work-creating instructions. Count only on the USER's
+  // own words. (Without this, pasted error logs containing "fix" / "add"
+  // / "remove" trip the gate as if the user were ordering 5 tasks.)
+  const stripped = stripQuotedContent(text);
   let imperativeHits = 0;
   for (const re of TASK_IMPERATIVES) {
-    const m = text.match(new RegExp(re.source, 'gi'));
+    const m = stripped.match(new RegExp(re.source, 'gi'));
     if (m) imperativeHits += m.length;
   }
   return imperativeHits >= 2;
@@ -176,6 +282,13 @@ function shouldForceExtractReview({ text, source, env = process.env } = {}) {
   if (isSystemOriginatedContent(text)) {
     return { forced: false, level: 'pass', reason: 'system-originated-content' };
   }
+  // Deadlock fix (2026-05-13): AI-composed Skill args get surfaced back as
+  // a "user message" by the harness. Detect the skill-body echo signature
+  // and skip the gate — the args are AI-decomposed, not user-typed, so
+  // item-reconciliation has no source to reconcile against.
+  if (isSkillBodyEcho(text)) {
+    return { forced: false, level: 'pass', reason: 'skill-body-echo' };
+  }
   if (!detectLongFormPrompt(text)) {
     return { forced: false, level: 'pass', reason: 'below-long-input-threshold' };
   }
@@ -308,6 +421,20 @@ function checkLongInputPendingGate(toolName, toolInput) {
     if (/flow\s+extract-zero-loss/.test(cmd)) return { blocked: false };
     if (/flow\s+long-input/.test(cmd)) return { blocked: false };
     if (/flow-source-fidelity\.js/.test(cmd)) return { blocked: false };
+    // EMERGENCY ESCAPE (2026-05-13 deadlock fix): when the `flow` CLI is
+    // unavailable (e.g., target project has no node_modules/wogiflow on PATH,
+    // or the CLI itself is broken), allow the user to manually clear the
+    // marker file via `rm`. Scoped narrowly to the exact marker path so it
+    // can't be used as a general-purpose Bash escape.
+    if (/^\s*rm\s+(?:-[a-zA-Z]+\s+)?(?:["']?)\.workflow\/state\/long-input-pending\.json(?:["']?)\s*$/.test(cmd)) {
+      return { blocked: false };
+    }
+    // Also allow the node-script equivalent (for sessions where `rm` is
+    // unavailable, e.g. some Windows shells). Matches both `fs.unlinkSync(...)`
+    // and `require('fs').unlinkSync(...)` forms.
+    if (/unlinkSync\s*\(\s*['"]\.workflow\/state\/long-input-pending\.json['"]\s*\)/.test(cmd)) {
+      return { blocked: false };
+    }
     // Falls through to block for everything else
   }
@@ -334,6 +461,11 @@ function checkLongInputPendingGate(toolName, toolInput) {
       '  2. (ESCAPE HATCH) If this prompt genuinely does NOT create work',
       '     (e.g., it\'s a log dump or pure question), dismiss with:',
       '     `flow long-input-pending dismiss --reason="<concrete reason>"`',
+      '  3. (EMERGENCY) If both paths above fail (e.g., `flow` CLI missing',
+      '     or broken), manually clear the marker file:',
+      '     `rm .workflow/state/long-input-pending.json`',
+      '     (This Bash command is explicitly allowed by the gate as a',
+      '     deadlock escape.)',
       '',
       'Read/Glob/Grep tools remain available for investigation.'
     ].join('\n')
@@ -345,10 +477,12 @@ module.exports = {
   LONG_LINE_THRESHOLD,
   LONG_ITEM_THRESHOLD,
   SYSTEM_CONTENT_PREFIXES,
+  SKILL_BODY_MARKERS,
   detectLongFormPrompt,
   hasSourceLink,
   hasTaskSignals,
   isSystemOriginatedContent,
+  isSkillBodyEcho,
   isChannelDispatchInWorker,
   shouldForceExtractReview,
   buildEnforcementMessage,
@@ -357,5 +491,6 @@ module.exports = {
   isLongInputPending,
   readLongInputPending,
   checkLongInputPendingGate,
-  countDiscreteItems
+  countDiscreteItems,
+  stripQuotedContent
 };