npm - cclaw-cli - Versions diffs - 0.51.8 → 0.51.10 - Mend

cclaw-cli 0.51.8 → 0.51.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

package/dist/artifact-linter.js +142 -7
package/dist/content/examples.js +3 -1
package/dist/content/stages/brainstorm.js +19 -8
package/dist/content/stages/scope.js +14 -13
package/dist/content/start-command.js +3 -2
package/dist/content/templates.js +43 -8
package/dist/internal/advance-stage.js +25 -2
package/package.json +1 -1

package/dist/artifact-linter.js CHANGED Viewed

@@ -252,7 +252,7 @@ function meaningfulLineCount(sectionBody) {
         .filter((line) => line.length > 0)
         .filter((line) => !line.startsWith("<!--"))
         .filter((line) => !/^[-:| ]+$/u.test(line))
-        .filter((line) => /[A-Za-z0-9]/u.test(line))
+        .filter((line) => /[\p{L}\p{N}]/u.test(line))
         .length;
 }
 function lineHasToken(line, token) {
@@ -304,17 +304,21 @@ function tokensFromRule(rule) {
     return [];
 }
 /**
- * Extract required keywords from validation rules that contain comma-separated
- * concept lists. Activates only for rules with structured enumerations like
- * "failure modes, error surface, data-flow paths" — not for short rules.
+ * Extract required keywords from validation rules that contain *backticked*
+ * stable tokens after a colon. We only fire on machine-surface enumerations
+ * (e.g., `` Must contain: `Status:`, `WAIT_FOR_CONFIRM`, `Approved:` ``);
+ * descriptive English prose with bare comma lists is intentionally ignored so
+ * authors can write rationale freely without triggering hardcoded keyword
+ * matches. Sections that need richer structural enforcement use a dedicated
+ * `validateSectionBody` dispatch (see `validateScopeSummary`, etc.).
  */
 function extractRequiredKeywords(rule) {
     const colonMatch = /:\s*(.+)$/u.exec(rule);
     if (!colonMatch)
         return [];
     const tail = colonMatch[1];
-    const parts = tail.split(/,\s*(?:and\s+)?/u).map((p) => p.trim().replace(/\.$/u, ""));
-    const phrases = parts.filter((p) => p.length >= 4 && !/^(must|should|at least|if |or )/iu.test(p));
+    const backtickedTokens = Array.from(tail.matchAll(/`([^`]+)`/gu)).map((m) => m[1].trim());
+    const phrases = backtickedTokens.filter((p) => p.length >= 2);
     if (phrases.length < 3)
         return [];
     return phrases;
@@ -366,11 +370,16 @@ function getMarkdownTableRows(sectionBody) {
 }
 function getApproachRows(sectionBody) {
     const tableRows = getMarkdownTableRows(sectionBody).map((row) => row.join(" "));
+    const headingRows = sectionBody
+        .split(/\r?\n/u)
+        .map((line) => line.trim())
+        .filter((line) => /^#{3,6}\s+\S/u.test(line))
+        .map((line) => line.replace(/^#{3,6}\s+/u, ""));
     const bulletRows = sectionBody
         .split(/\r?\n/u)
         .map((line) => line.trim())
         .filter((line) => /^(?:[-*]|\d+\.)\s+\S/u.test(line));
-    return [...tableRows, ...bulletRows];
+    return [...tableRows, ...headingRows, ...bulletRows];
 }
 function hasSemanticChallenger(row) {
     const normalized = row
@@ -487,6 +496,126 @@ function validateFailureModeTable(sectionBody) {
         details: "Failure Mode Table header and critical-risk checks passed."
     };
 }
+// Canonical scope mode tokens (gstack CEO review). The four mode names live in
+// the scope skill, the artifact template, and downstream traces. Requiring one
+// of them in Scope Summary is **structural** — not free-form English keyword
+// matching on user prose. Authors may also use the canonical short form on a
+// `Mode:` / `Selected mode:` line (e.g. `Selected mode: hold`) as a courtesy.
+const SCOPE_MODE_FULL_TOKENS = [
+    "SCOPE EXPANSION",
+    "SELECTIVE EXPANSION",
+    "HOLD SCOPE",
+    "SCOPE REDUCTION"
+];
+const SCOPE_MODE_FULL_REGEX = new RegExp("\\b(?:" +
+    SCOPE_MODE_FULL_TOKENS
+        .map((token) => token.replace(/[.*+?^${}()|[\]\\]/g, "\\$&").replace(/\s+/g, "[\\s_-]+"))
+        .join("|") +
+    ")\\b", "iu");
+// Short-form synonyms accepted only when stamped on an explicit `Mode:` /
+// `Selected mode:` / `Scope mode:` line. Plain prose with the same word does
+// not count, so `strict` / `broad` / `narrow` / similar non-mode adjectives
+// remain rejected.
+const SCOPE_MODE_LINE_REGEX = /(?:^|\n)\s*[-*]?\s*\**\s*(?:Selected\s+|Scope\s+)?Mode\**\s*:\s*\**\s*([^\n]+)/iu;
+const SCOPE_MODE_SHORT_TOKEN_REGEX = /\b(?:hold(?:[\s_-]?scope)?|selective(?:[\s_-]?expansion)?|scope[\s_-]?expansion|expansion|scope[\s_-]?reduction|reduction|expand|reduce)\b/iu;
+// Next-stage handoff token. We only enforce the canonical machine-surface stage
+// IDs (`design`, `spec`) plus stable handoff phrases. The surrounding prose may
+// be written in any language — this guards the downstream cross-stage trace,
+// not the wording of the rationale.
+const NEXT_STAGE_HANDOFF_REGEX = /(?:`(?:design|spec)`|\bdesign\b|\bspec\b|next[-\s_]stage|next stage|handoff|hand[-\s]off)/iu;
+function hasCanonicalScopeMode(body) {
+    if (SCOPE_MODE_FULL_REGEX.test(body))
+        return true;
+    for (const match of body.matchAll(new RegExp(SCOPE_MODE_LINE_REGEX, "giu"))) {
+        const value = match[1] ?? "";
+        if (SCOPE_MODE_SHORT_TOKEN_REGEX.test(value))
+            return true;
+    }
+    return false;
+}
+function validatePremiseChallenge(sectionBody) {
+    // gstack-style premise challenge requires a real Q/A structure (table or
+    // list), not free-form prose. The validation is *structural* only — we do
+    // NOT keyword-grep for English phrases like "right problem"; authors may
+    // write the questions in any language, and the answers carry the meaning.
+    // The template ships with canonical question labels as scaffolding, but
+    // the linter only enforces that the section actually compares premise
+    // questions to answers.
+    const tableRows = getMarkdownTableRows(sectionBody);
+    const bulletRows = sectionBody
+        .split(/\r?\n/u)
+        .map((line) => line.trim())
+        .filter((line) => /^(?:[-*]|\d+\.)\s+\S/u.test(line));
+    const rowCount = Math.max(tableRows.length, bulletRows.length);
+    if (rowCount < 3) {
+        return {
+            ok: false,
+            details: `Premise Challenge needs at least 3 question/answer rows in a table or bullet list (right problem? / direct path? / what if nothing? are the gstack default trio). Found ${rowCount}.`
+        };
+    }
+    // For tables, each data row must have at least 2 non-empty cells so the
+    // section is genuinely a Q/A comparison, not a list of headlines. For
+    // bullet lists, each line must be substantive (>= 8 characters of letters
+    // or digits) so we don't accept three-letter placeholders like `- a`.
+    if (tableRows.length >= 3) {
+        const sparseRows = tableRows.filter((row) => {
+            const filledCells = row.filter((cell) => cell.replace(/[\s|]/gu, "").length >= 2);
+            return filledCells.length < 2;
+        });
+        if (sparseRows.length > 0) {
+            return {
+                ok: false,
+                details: "Premise Challenge table rows must populate at least the question and answer columns (no empty answers)."
+            };
+        }
+    }
+    else if (bulletRows.length >= 3) {
+        const sparseBullets = bulletRows.filter((line) => {
+            const cleaned = line.replace(/^[-*\d.\s]+/u, "").replace(/[`*_]/gu, "").trim();
+            const hasQuestionMark = /\?/u.test(cleaned);
+            const meaningful = cleaned.match(/[\p{L}\p{N}]/gu)?.length ?? 0;
+            return !hasQuestionMark && meaningful < 12;
+        });
+        if (sparseBullets.length > bulletRows.length - 3) {
+            return {
+                ok: false,
+                details: "Premise Challenge bullet list must include at least 3 substantive Q/A lines (a question mark plus the answer, or a labelled `Question: answer` pair)."
+            };
+        }
+    }
+    return {
+        ok: true,
+        details: `Premise Challenge structures ${rowCount} Q/A rows.`
+    };
+}
+function validateScopeSummary(sectionBody) {
+    const meaningfulLines = sectionBody
+        .split(/\r?\n/)
+        .map((line) => line.trim())
+        .filter((line) => line.length > 0 && /[\p{L}\p{N}]/u.test(line));
+    if (meaningfulLines.length < 2) {
+        return {
+            ok: false,
+            details: "Scope Summary must list at least 2 substantive lines covering the selected mode and the next-stage handoff."
+        };
+    }
+    if (!hasCanonicalScopeMode(sectionBody)) {
+        return {
+            ok: false,
+            details: "Scope Summary must name the selected mode using a canonical token (SCOPE EXPANSION, SELECTIVE EXPANSION, HOLD SCOPE, SCOPE REDUCTION) or a short form on a `Mode:` line (hold, selective, expansion, reduction)."
+        };
+    }
+    if (!NEXT_STAGE_HANDOFF_REGEX.test(sectionBody)) {
+        return {
+            ok: false,
+            details: "Scope Summary must record the track-aware next-stage handoff (mention `design` for standard, `spec` for medium, or include a `Next-stage handoff:` line)."
+        };
+    }
+    return {
+        ok: true,
+        details: "Scope Summary names the selected mode and the next-stage handoff."
+    };
+}
 const INTERACTION_EDGE_CASE_REQUIREMENTS = [
     { label: "double-click", pattern: /\bdouble[\s-]?click\b/iu },
     {
@@ -1207,6 +1336,12 @@ function validateSectionBody(sectionBody, rule, sectionName) {
     if (sectionNameNormalized === "pre-scope system audit") {
         return validatePreScopeSystemAudit(sectionBody);
     }
+    if (sectionNameNormalized === "scope summary") {
+        return validateScopeSummary(sectionBody);
+    }
+    if (sectionNameNormalized === "premise challenge") {
+        return validatePremiseChallenge(sectionBody);
+    }
     if (sectionNameNormalized === "data flow") {
         return validateInteractionEdgeCaseMatrix(sectionBody);
     }

package/dist/content/examples.js CHANGED Viewed

@@ -142,9 +142,11 @@ The original premise (“add notifications”) was reframed to **“ensure users
 ## Scope Summary
+- Selected mode: SELECTIVE EXPANSION (cherry-pick durable feed on hold-scope baseline).
 - Accepted scope: durable feed + SSE + explicit degraded UX.
 - Deferred: WebSocket channel and rich-media/search enhancements.
-- Explicitly excluded: outbound channels and marketing workflows for v1.`,
+- Explicitly excluded: outbound channels and marketing workflows for v1.
+- Next-stage handoff: design — carry the durable-feed contract, SSE failover paths, and degraded-UX expectations into architecture lock-in.`,
     design: `## Codebase Investigation (blast-radius files)
 | File | Current responsibility | Patterns discovered |

package/dist/content/stages/brainstorm.js CHANGED Viewed

@@ -36,23 +36,29 @@ export const BRAINSTORM = {
     },
     executionModel: {
         checklist: [
-            "**Explore project context** — inspect existing files/docs/recent activity before asking what to build.",
+            "**Explore project context** — inspect existing files/docs/recent activity before asking what to build; capture matching files/patterns/seeds in `Context > Discovered context` so downstream stages don't redo discovery.",
             "**Classify depth and scope** — pick Lightweight / Standard / Deep; decompose independent subsystems before deeper work.",
+            "**Premise check (one pass)** — answer the three gstack-style questions in the artifact body: *Right problem? Direct path? What if we do nothing?* Take a position; do not hedge.",
+            "**Reframe with How Might We** — write a single `How Might We …?` line that names the user, the desired outcome, and the constraint. This is the altitude check before approaches.",
+            "**Sharpening questions (3-5)** — capture decision-changing question/answer pairs in the `Sharpening Questions` table with the actual decision impact; if a question would not change architecture/scope/UX, state the assumption and skip it.",
             "**Use compact discovery for simple apps** — for concrete low-risk asks (todo app, landing page, local widget), do one context pass, compare one baseline and one challenger, then ask for one explicit approval; do not drag the user through a full workshop.",
             "**Short-circuit concrete asks** — for unambiguous implementation-only requests, write a compact brainstorm stub (context, problem, approved intent, constraints, assumptions) and ask for one explicit approval.",
             "**Ask only decision-changing questions** — one at a time; if answers would not change approach, state the assumption and continue.",
-            "**Compare 2-3 distinct approaches** — include real trade-offs, withhold recommendation, and include one higher-upside challenger.",
+            "**Compare 2-3 distinct approaches with stable Role/Upside columns** — Role values are `baseline` | `challenger` | `wild-card`; Upside is `low` | `modest` | `high` | `higher`; include real trade-offs and reuse notes; include exactly one challenger with explicit `high` or `higher` upside.",
             "**Collect reaction before recommending** — ask which option feels closest and what concern remains, then recommend based on that reaction.",
-            "**Write and tighten the artifact** — scale sections to complexity, optionally add a compact diagram, then patch contradictions, weak trade-offs, placeholders, ambiguity, and weak handoff language.",
+            "**Write the `Not Doing` list** — name 3-5 things this brainstorm explicitly is not committing to (vs. deferred). This protects scope from silent enlargement and the next stage from rework.",
+            "**Self-review before user approval** — re-read the artifact and patch contradictions, weak trade-offs, placeholders, ambiguity, and weak handoff language; record the patch list in `Self-Review Notes` (or `- None.`).",
             "**Request explicit approval** — state exactly what direction is being approved; do not advance without approval and artifact review.",
             "**Handoff** — only after approval, complete the stage and point to `/cc-next`."
         ],
         interactionProtocol: [
-            "Start from observed project context; if the idea is vague, first narrow the project type.",
+            "Start from observed project context; if the idea is vague, first narrow the project type with **one** structured question, then keep going.",
+            "Lead with the premise check (right problem / direct path / what if nothing) and the `How Might We` reframing before approaches; both go in the artifact, not just the chat.",
             "Ask at most one question per turn, only when decision-changing; if using a structured question tool, send exactly one question object, not a multi-question form.",
-            "If likely answers do not change architecture or scope boundaries, choose the default and state the assumption.",
-            "For simple greenfield web apps, present a compact A/B choice with one recommended path and one higher-upside challenger; keep the artifact concise but structurally complete.",
+            "If likely answers do not change architecture or scope boundaries, choose the default and state the assumption inline.",
+            "For simple greenfield web apps, present a compact A/B choice with one recommended path and one higher-upside challenger; keep the artifact concise but structurally complete (Context, Premise, How Might We, Sharpening Questions, Approaches, Reaction, Selected Direction, Not Doing).",
             "Show approaches before the recommendation; include a higher-upside challenger and gather reaction first.",
+            "Self-review before approval: re-read the artifact, fix contradictions/placeholders/weak trade-offs, then ask for approval. Do not ask for approval on a draft you have not re-read.",
             "State exactly what is being approved, then **STOP** until the user explicitly approves the artifact."
         ],
         process: [
@@ -117,16 +123,21 @@ export const BRAINSTORM = {
             traceabilityRule: "Scope and design decisions must trace back to explored context and approved brainstorm direction."
         },
         artifactValidation: [
-            { section: "Context", required: true, validationRule: "Must reference project state and relevant existing code or patterns." },
+            { section: "Context", required: true, validationRule: "Must reference project state and relevant existing code or patterns. A `Discovered context` subsection (or list) is recommended for downstream traceability." },
             { section: "Problem", required: true, validationRule: "Must define what we're solving, success criteria, and constraints." },
+            { section: "Premise Check", required: false, validationRule: "Recommended: explicit answers to `Right problem?`, `Direct path?`, `What if we do nothing?` — take a position, do not hedge." },
+            { section: "How Might We", required: false, validationRule: "Recommended: a single `How Might We …?` line naming the user, the outcome, and the binding constraint." },
+            { section: "Sharpening Questions", required: false, validationRule: "Recommended: 3-5 question/answer pairs with explicit `Decision impact` so downstream stages see what each answer changed." },
             { section: "Clarifying Questions", required: false, validationRule: "Must capture question, answer, and decision impact for each clarifying question." },
             { section: "Approach Tier", required: true, validationRule: "Must classify depth as Lightweight/Standard/Deep and explain why." },
             { section: "Short-Circuit Decision", required: false, validationRule: "Must include Status/Why/Scope handoff lines when short-circuit is discussed; compact stubs are valid for concrete asks." },
-            { section: "Approaches", required: true, validationRule: "Must compare 2-3 distinct options with real trade-offs; include one option marked as a challenger with explicit high/higher upside." },
+            { section: "Approaches", required: true, validationRule: "Must compare 2-3 distinct options with real trade-offs. Use the canonical `Role` column with `baseline` | `challenger` | `wild-card` and the `Upside` column with `low` | `modest` | `high` | `higher`; include exactly one challenger row with `high` or `higher` upside." },
             { section: "Approach Reaction", required: true, validationRule: "Must appear before Selected Direction and summarize user reaction before recommendation, including `Closest option`, `Concerns`, and what changed after reaction." },
             { section: "Selected Direction", required: true, validationRule: "Must include the selected approach, an explicit approval marker, rationale traceable to the prior Approach Reaction, and a track-aware next-stage handoff." },
+            { section: "Not Doing", required: false, validationRule: "Recommended: 3-5 explicitly non-committed items (distinct from deferred). Protects scope from silent enlargement and the next stage from rework." },
             { section: "Design", required: false, validationRule: "Must cover architecture, key components, and data flow scaled to complexity." },
             { section: "Visual Companion", required: false, validationRule: "If architecture/data-flow complexity is medium+, include compact ASCII/Mermaid diagram or explicitly justify omission." },
+            { section: "Self-Review Notes", required: false, validationRule: "Recommended: list of patches applied during self-review (or `- None.`) — done before requesting user approval." },
             { section: "Assumptions and Open Questions", required: false, validationRule: "Must capture unresolved assumptions/open questions, or explicitly state none." }
         ],
         trivialOverrideSections: [

package/dist/content/stages/scope.js CHANGED Viewed

@@ -46,31 +46,32 @@ export const SCOPE = {
     executionModel: {
         checklist: [
             "**Compact CEO pass first** — read brainstorm, name the job-to-be-done, challenge whether this is the right product slice, and propose the highest-leverage scope in one pass. For simple apps, keep this to a tight scope contract instead of a full strategy workshop.",
-            "**Pick one of four gstack modes** — SCOPE EXPANSION, SELECTIVE EXPANSION, HOLD SCOPE, or SCOPE REDUCTION. State why and what user signal would change the mode.",
+            "**Premise and leverage check** — answer in the artifact: *Right problem? Direct path? What if nothing? Where can we leverage existing code? What is the reversibility cost?* Take a position; do not hedge.",
             "**Draft the 10-star vs current-slice boundary** — show what would make the product meaningfully better, then explicitly choose what ships now, what is deferred, and what is excluded without using vague `later/for now` placeholders.",
-            "**Premise and leverage check** — test right problem, direct path, no-action outcome, existing-code leverage, and reversibility before asking the user anything.",
-            "**Compare implementation alternatives** — include minimum viable, product-grade, and ideal architecture options with effort/risk/reuse, then recommend one.",
-            "**Run outside voice before final approval** — for simple/low-risk scope, record one concise adversarial self-check row; for complex/high-risk/configured scope, iterate until threshold. Record the loop summary in `## Spec Review Loop` before asking approval.",
+            "**Pick one of four gstack modes with the user** — SCOPE EXPANSION, SELECTIVE EXPANSION, HOLD SCOPE, or SCOPE REDUCTION. Recommend one, state why and what signal would change it, then STOP for the user's mode/scope approval before writing the final artifact.",
+            "**Run mode-specific analysis** — match the analysis to the chosen mode: SCOPE EXPANSION enumerates 10x opportunities + delight features; SELECTIVE EXPANSION lists baseline + cherry-picked additions with leverage rationale; HOLD SCOPE proves rigor on the current slice; SCOPE REDUCTION names the smallest useful wedge and what is cut, with follow-up split.",
+            "**Compare implementation alternatives** — include minimum viable, product-grade, and ideal architecture options with effort (S/M/L/XL), risk (Low/Med/High), pros, cons, and reuses. Recommend one and tie it to mode.",
+            "**Run outside voice before final approval** — for simple/low-risk scope, record one concise adversarial self-check row; for complex/high-risk/configured scope, iterate until threshold. Record the loop summary in `## Spec Review Loop`, but do not treat it as user approval.",
             "**Ask only one decision-changing question** — if the user rejects the contract but is unsure, offer 3-4 concrete scope moves instead of open-ended interrogation.",
-            "**Write the scope contract** — include in-scope/out-of-scope, discretion areas, deferred items, locked decisions, error/rescue notes, completion dashboard, scope summary, next-stage handoff, and explicit approval."
+            "**Write the scope contract after approval** — include in-scope/out-of-scope, discretion areas, deferred items, locked decisions, error/rescue notes, completion dashboard, scope summary (with canonical mode token + next-stage handoff), and explicit approval evidence."
         ],
         interactionProtocol: [
             decisionProtocolInstruction("scope mode selection", "present expand/selective/hold/reduce as labeled options with trade-offs and mark one as (recommended)", "recommend the option that best covers the prime-directive failure modes, four data-flow paths, observability, and deferred handling for the in-scope set with the smallest blast radius. Base your recommendation on default heuristics: greenfield -> expand, enhancement -> selective, bugfix/hotfix/refactor -> hold, broad blast radius -> reduce"),
-            "Do not walk the full checklist by default. Lead with an opinionated scope contract and the one decision that matters most.",
-            "For simple web-app flows, default to HOLD SCOPE or SELECTIVE EXPANSION, show the exact in/out/deferred contract, and ask for one approval.",
+            "Do not walk the full checklist by default. Lead with a proposed scope contract and the one decision that matters most; label the mode as recommended, not selected, until the user answers.",
+            "For simple web-app flows, default to HOLD SCOPE or SELECTIVE EXPANSION, show the exact in/out/deferred contract as a proposal, and STOP for one explicit approval before writing the final scope artifact or completing the stage.",
             "Challenge premise first, take a firm position, and name one concrete condition that would change it.",
             "Push back on weak framing: vague scope needs a specific user/problem, platform vision needs a narrow wedge, social proof needs behavioral evidence.",
             "Resolve one structural scope issue at a time; otherwise state the assumption and move on.",
             "If the user says no but cannot name the change, offer concrete moves: keep scope, add one obvious adjacent capability, reduce to wedge, or re-open stack/product direction.",
             `Before final approval, record outside-voice findings and a \`## Spec Review Loop\` table using ${reviewLoopPolicySummary("scope")}`,
-            "**STOP.** Wait for explicit approval of the scope contract before advancing.",
-            "**STOP BEFORE ADVANCE.** Mandatory delegation `planner` must be completed or explicitly waived. If no isolated planner is available, use `--waive-delegation=planner --waiver-reason=\"role-switch scope self-review completed\"`. Then close with `node .cclaw/hooks/stage-complete.mjs scope --passed=scope_mode_selected,scope_contract_written,scope_user_approved --evidence-json '{\"scope_mode_selected\":\"<mode + rationale>\",\"scope_contract_written\":\"<artifact path + sections>\"}'`. Do not include `scope_user_approved` manually; stage-complete auto-hydrates its review-loop envelope from `## Spec Review Loop`."
+            "**STOP.** Wait for explicit user approval of the scope mode and scope contract before writing final approval language or advancing.",
+            "**STOP BEFORE ADVANCE.** Mandatory delegation `planner` must be completed or explicitly waived. If no isolated planner is available, use `--waive-delegation=planner --waiver-reason=\"role-switch scope self-review completed\"`. Then close with `node .cclaw/hooks/stage-complete.mjs scope --passed=scope_mode_selected,scope_contract_written,scope_user_approved --evidence-json '{\"scope_mode_selected\":\"<user-approved mode + rationale>\",\"scope_contract_written\":\"<artifact path + sections>\",\"scope_user_approved\":\"<explicit user approval quote or summary>\"}'`. `scope_user_approved` must cite the user's approval; review-loop evidence alone is not approval."
         ],
         process: [
             "Run configured pre-scope audit only when enabled.",
             "Run the gstack-style CEO scope pass scaled to risk: job-to-be-done, premise challenge, 10-star upside, smallest useful wedge, and what would change the recommendation.",
             "Compare minimum viable, product-grade, and ideal architecture scope alternatives with explicit reuse/effort/risk.",
-            "Select scope mode with explicit rationale; ask for user opt-in only when changing or expanding scope.",
+            "Recommend a scope mode with explicit rationale, then ask for user opt-in before treating it as selected.",
             "Run outside voice / adversarial self-check before final approval and record a valid `## Spec Review Loop` table.",
             "Write explicit scope contract, discretion areas, deferred items, error/rescue registry, and D-XX locked decisions.",
             "Produce scope summary, completion dashboard, and exact next-stage handoff before asking final approval."
@@ -89,7 +90,7 @@ export const SCOPE = {
             "Locked Decisions section lists stable D-XX IDs for non-negotiable boundaries.",
             "Premise challenge findings documented.",
             "Outside Voice findings and dispositions are recorded (accept/reject/defer with rationale) before final approval.",
-            `Spec review loop summary includes a table with columns Iteration, Quality Score, Findings, plus Stop reason, Target score, and Max iterations. stage-complete auto-hydrates scope_user_approved evidence from this section. ${reviewLoopPolicySummary("scope")}`,
+            `Spec review loop summary includes a table with columns Iteration, Quality Score, Findings, plus Stop reason, Target score, and Max iterations. This is outside-voice evidence only; it does not satisfy user approval. ${reviewLoopPolicySummary("scope")}`,
             reviewLoopSecondOpinionSummary("scope"),
             "Deferred items list with one-line rationale for each.",
             "When an upside deferred idea is parked, a seed file is created under `.cclaw/seeds/` and referenced in the artifact.",
@@ -138,7 +139,7 @@ export const SCOPE = {
             { section: "Upstream Handoff", required: false, validationRule: "Summarizes brainstorm/idea decisions, constraints, open questions, and explicit drift before scope decisions." },
             { section: "Pre-Scope System Audit", required: false, validationRule: "When `.cclaw/config.yaml::optInAudits.scopePreAudit` is true: must capture git log -30, git diff --stat, git stash list, and debt-marker scan (TODO/FIXME/XXX/HACK) before premise challenge." },
             { section: "Prime Directives", required: false, validationRule: "For each scoped capability: named failure modes, explicit error surface, four data-flow paths, interaction edge cases, observability expectations, and deferred-item handling." },
-            { section: "Premise Challenge", required: false, validationRule: "Must contain explicit answers to: right problem? direct path? what if nothing?" },
+            { section: "Premise Challenge", required: false, validationRule: "Must list at least 3 question/answer rows in a markdown table or bullet list (gstack default trio: right problem? direct path? what if we do nothing? — extend with leverage and reversibility for richer scope). The linter enforces structure, not English wording — answers may be in any language." },
             { section: "Landscape Check", required: false, validationRule: "When mode is EXPAND/SELECTIVE, include at least one external reference insight and its impact on scope." },
             { section: "Taste Calibration", required: false, validationRule: "Must reference 2-3 strong in-repo modules/files that define the quality bar or explicitly justify omission." },
             { section: "Requirements", required: false, validationRule: "Table of stable requirement IDs (R1, R2, R3…) one per row with observable outcome, priority, and source. IDs are assigned once and never renumbered across scope/design/spec/plan/review; dropped requirements stay with Priority `DROPPED`." },
@@ -153,7 +154,7 @@ export const SCOPE = {
             { section: "Outside Voice Findings", required: false, validationRule: "Must list external/adversarial findings and disposition (accept/reject/defer) with rationale." },
             { section: "Spec Review Loop", required: false, validationRule: `Must record iterations, quality score per iteration, stop reason, and unresolved concerns. Enforce ${reviewLoopPolicySummary("scope")}` },
             { section: "Completion Dashboard", required: true, validationRule: "Lists per-review-section status, count of critical/open gaps, resolved decisions, and unresolved decisions (or 'None')." },
-            { section: "Scope Summary", required: true, validationRule: "Clean summary: mode, strongest challenges, recommended path, accepted scope, deferred, excluded, and track-aware next-stage handoff." },
+            { section: "Scope Summary", required: true, validationRule: "Compact recap of the locked scope. Must name the selected mode using one of the canonical tokens (`SCOPE EXPANSION`, `SELECTIVE EXPANSION`, `HOLD SCOPE`, `SCOPE REDUCTION`) and record the track-aware next-stage handoff (`design` for standard, `spec` for medium); the linter checks structure, not English wording." },
             { section: "Dream State Mapping", required: false, validationRule: "If present (complex projects): CURRENT STATE, THIS PLAN, 12-MONTH IDEAL, and alignment verdict." },
             { section: "Temporal Interrogation", required: false, validationRule: "If present (complex projects): timeline simulation table with decision pressures and lock-now vs defer verdicts." }
         ]

package/dist/content/start-command.js CHANGED Viewed

@@ -70,7 +70,7 @@ ${conversationLanguagePolicyMarkdown()}
    Skip detection quietly if no markers are found — do NOT invent a stack.
 5. Read \`${flowPath}\`.
-6. If flow already has completed stages, warn the user that starting a new tracked flow will reset progress. Ask for confirmation before proceeding.
+6. If flow already has completed stages, warn the user that starting a new tracked flow will reset progress. Ask for confirmation before proceeding. A fresh init placeholder state with \`completedStages: []\`, no passed gates, and no \`00-idea.md\` is **not** an active flow; do not ask the user to resume it.
 7. **Track heuristic** — classify the idea text and **recommend** a track (the user can override before any state mutation):
    - First, load \`${RUNTIME_ROOT}/config.yaml\`. If \`trackHeuristics\` is defined, apply those per-track vocabulary hints (\`fallback\`, \`tracks.<id>.{triggers,veto}\`) on top of the built-in defaults. Evaluation order is always \`standard -> medium -> quick\` (narrow-to-broad).
    - **quick** (\`spec → tdd → review → ship\`) — single-purpose work where the spec is essentially already known.
@@ -152,7 +152,7 @@ description: "Unified entry point for the cclaw flow. No args = resume/next. Wit
 ## HARD-GATE
-Do **not** silently discard an existing flow when the user provides a prompt. If completed stages exist, inform and confirm before resetting.
+Do **not** silently discard an existing flow when the user provides a prompt. If completed stages exist, inform and confirm before resetting. A freshly initialized placeholder state with \`completedStages: []\`, no passed gates, and no \`${RUNTIME_ROOT}/artifacts/00-idea.md\` is not an active flow; classify the prompt and start normally.
 ${conversationLanguagePolicyMarkdown()}
 ## Protocol
@@ -168,6 +168,7 @@ ${conversationLanguagePolicyMarkdown()}
    - Inform: "You have an active flow at stage **{currentStage}** with {N} completed stages. Starting a new tracked flow will reset progress."
    - Ask: "Continue with reset? (A) Yes, start fresh (B) No, resume current flow"
    - If (B) → switch to Path B behavior.
+   If \`completedStages\` is empty, all gate \`passed\` arrays are empty, and \`${RUNTIME_ROOT}/artifacts/00-idea.md\` is missing, treat it as a fresh init placeholder — do **not** ask whether to continue the current flow.
 7. **Classify the idea** using the heuristic below and present one compact Start framing summary (class, track, stack, origin docs, seed recalls, next action). Wait for explicit confirmation or override before mutating any state only when reset/conflict/ambiguity makes it necessary.
    - If \`${RUNTIME_ROOT}/config.yaml\` defines \`trackHeuristics\`, apply those vocabulary hints (\`fallback\`, \`tracks.<id>.{triggers,veto}\`) on top of built-in defaults. Evaluation order is fixed: \`standard -> medium -> quick\`. (Honest note: this is advisory prose; the LLM applies it, not a Node-level router.)

package/dist/content/templates.js CHANGED Viewed

@@ -26,11 +26,29 @@ export const ARTIFACT_TEMPLATES = {
 - **Project state:**
 - **Relevant existing code/patterns:**
+### Discovered context
+- (paths, prior artifacts, seeds, prompt fragments — referenced by downstream stages, or \`- None.\`)
 ## Problem
 - **What we're solving:**
 - **Success criteria:**
 - **Constraints:**
+## Premise Check
+- **Right problem?** (yes/no + one-line justification — take a position)
+- **Direct path?** (yes/no + one-line justification)
+- **What if we do nothing?** (concrete consequence, not "nothing happens")
+## How Might We
+- *How might we …?* — one line naming the user, the desired outcome, and the binding constraint.
+## Sharpening Questions
+| # | Question | Answer / Assumption | Decision impact |
+|---|---|---|---|
+| 1 |  |  |  |
+| 2 |  |  |  |
+| 3 |  |  |  |
 ## Clarifying Questions
 | # | Question | Answer | Decision impact |
 |---|---|---|---|
@@ -46,10 +64,12 @@ export const ARTIFACT_TEMPLATES = {
 - Scope handoff:
 ## Approaches
-| Approach | Role | Upside | Architecture | Trade-offs | Recommendation |
-|---|---|---|---|---|---|
-| A | baseline | modest |  |  |  |
-| B | challenger | high |  |  |  |
+| Approach | Role | Upside | Architecture | Trade-offs | Reuses | Recommendation |
+|---|---|---|---|---|---|---|
+| A | baseline | modest |  |  |  |  |
+| B | challenger | high |  |  |  |  |
+> Role values: \`baseline\` | \`challenger\` | \`wild-card\`. Upside values: \`low\` | \`modest\` | \`high\` | \`higher\`. Exactly one row must be a \`challenger\` with \`high\` or \`higher\` upside.
 ## Approach Reaction
 - Closest option:
@@ -62,6 +82,9 @@ export const ARTIFACT_TEMPLATES = {
 - **Approval:** pending
 - **Next-stage handoff:** On standard track, hand this to \`scope\`; on medium track, hand this directly to \`spec\` with explicit requirements/constraints.
+## Not Doing
+- (3-5 things this brainstorm is *not* committing to — distinct from \`Deferred\`. These will not appear in scope unless the user explicitly opts in.)
 ${SEED_SHELF_SECTION}
 ## Design
@@ -69,6 +92,12 @@ ${SEED_SHELF_SECTION}
 - **Key components:**
 - **Data flow:**
+## Visual Companion
+- (compact ASCII/Mermaid diagram for medium+ complexity, or one-line justification for omission.)
+## Self-Review Notes
+- (list patches applied to this artifact during self-review, or \`- None.\`)
 ## Assumptions and Open Questions
 - **Assumptions:**
 - **Open questions (or "None"):**
@@ -101,9 +130,13 @@ ${SEED_SHELF_SECTION}
 - Four paths per data flow:
 ## Premise Challenge
-- Is this the right problem?
-- Why this path?
-- What if we do nothing?
+| Question | Answer (take a position) | Evidence / leverage |
+|---|---|---|
+| Right problem? |  |  |
+| Direct path? |  |  |
+| What if we do nothing? |  |  |
+| Existing-code leverage? |  |  |
+| Reversibility cost? |  |  |
 ## Dream State Mapping
 - CURRENT STATE:
@@ -198,7 +231,9 @@ ${SEED_SHELF_SECTION}
 - Unresolved decisions (or \`None\`):
 ## Scope Summary
-- Selected mode:
+- Selected mode: (one of \`SCOPE EXPANSION\` | \`SELECTIVE EXPANSION\` | \`HOLD SCOPE\` | \`SCOPE REDUCTION\`)
+- Strongest challenges resolved:
+- Recommended path:
 - Accepted scope:
 - Deferred:
 - Explicitly excluded:

package/dist/internal/advance-stage.js CHANGED Viewed

@@ -19,7 +19,6 @@ import { runTddLoopStatusCommand } from "./tdd-loop-status.js";
 import { runTddRedEvidenceCommand } from "./tdd-red-evidence.js";
 import { extractReviewLoopEnvelopeFromArtifact } from "../content/review-loop.js";
 const AUTO_REVIEW_LOOP_GATE_BY_STAGE = {
-    scope: "scope_user_approved",
     design: "design_architecture_locked"
 };
 function unique(values) {
@@ -163,6 +162,30 @@ function validateReviewLoopGateEvidence(stage, evidence) {
     }
     return null;
 }
/**
 * Validate the evidence string attached to a user-approval gate.
 *
 * The evidence passes when it contains an explicit approval word in English
 * or Russian. It is rejected when it is blank, when it parses as JSON that
 * `pickReviewLoopEnvelope` recognizes (review-loop output is outside-voice
 * evidence, not user approval), or when no approval word is present.
 *
 * @param {string} evidence - Raw evidence text supplied for the gate.
 * @returns {string | null} `null` when the evidence is acceptable, otherwise
 *   a human-readable reason describing why it was rejected.
 */
function validateUserApprovalEvidence(evidence) {
    const normalized = evidence.trim();
    if (normalized.length === 0) {
        return "must cite explicit user approval.";
    }
    const reviewLoopEnvelope = (() => {
        try {
            // NOTE(review): presumably returns a truthy envelope only for
            // review-loop JSON payloads — confirm against the helper.
            return pickReviewLoopEnvelope(JSON.parse(normalized));
        }
        catch {
            // Free-form (non-JSON) evidence is the expected case here, so a
            // parse failure simply means "not a review-loop envelope".
            return null;
        }
    })();
    if (reviewLoopEnvelope) {
        return "must cite explicit user approval; review-loop evidence is outside-voice evidence, not user approval.";
    }
    const englishApproval = /\b(?:approved|approval|user approved|confirmed|accepted|yes|ok)\b/iu;
    if (englishApproval.test(normalized)) {
        return null;
    }
    // `\b` is defined in terms of `\w`, which stays ASCII-only even under the
    // `u` flag, so it never matches next to a Cyrillic letter. Use explicit
    // Unicode-aware lookarounds as word boundaries instead. The past-tense
    // forms (`утвердил`, `подтвердил`) are included so the example quoted in
    // the rejection message below is itself accepted.
    const russianApproval = /(?<![\p{L}\p{N}_])(?:утвержд(?:аю|ено|ен|ена)|утвердил(?:а|и)?|подтвержд(?:аю|ено|ен|ена)|подтвердил(?:а|и)?|соглас(?:ен|на|овано)|да|ок|принято)(?![\p{L}\p{N}_])/iu;
    if (russianApproval.test(normalized)) {
        return null;
    }
    return "must cite explicit user approval (for example `user approved the scope contract` or `пользователь утвердил scope`).";
}
 // Per-gate validators keyed by `${stage}:${gateId}`. Returning a non-null
 // string surfaces the reason as an `advance-stage` failure so evidence is
 // guaranteed to carry the structural breadcrumbs downstream tooling
@@ -186,7 +209,7 @@ const GATE_EVIDENCE_VALIDATORS = {
         }
         return null;
     },
-    "scope:scope_user_approved": (evidence) => validateReviewLoopGateEvidence("scope", evidence),
+    "scope:scope_user_approved": (evidence) => validateUserApprovalEvidence(evidence),
     "design:design_architecture_locked": (evidence) => validateReviewLoopGateEvidence("design", evidence)
 };
 function validateGateEvidenceShape(stage, gateId, evidence) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "cclaw-cli",
-  "version": "0.51.8",
+  "version": "0.51.10",
   "description": "Installer-first flow toolkit for coding agents",
   "type": "module",
   "bin": {