npm - cclaw-cli - Versions diffs - 0.49.0 → 0.51.1 - Mend

cclaw-cli 0.49.0 → 0.51.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (183)

package/README.md +57 -84
package/dist/artifact-linter.d.ts +4 -0
package/dist/artifact-linter.js +24 -3
package/dist/cli.d.ts +1 -19
package/dist/cli.js +49 -491
package/dist/constants.d.ts +2 -13
package/dist/constants.js +1 -43
package/dist/content/closeout-guidance.d.ts +14 -0
package/dist/content/closeout-guidance.js +42 -0
package/dist/content/core-agents.js +55 -17
package/dist/content/decision-protocol.d.ts +12 -0
package/dist/content/decision-protocol.js +20 -0
package/dist/content/diff-command.d.ts +1 -2
package/dist/content/diff-command.js +8 -94
package/dist/content/examples.d.ts +4 -10
package/dist/content/examples.js +10 -20
package/dist/content/hook-events.js +2 -2
package/dist/content/hook-inline-snippets.d.ts +5 -2
package/dist/content/hook-inline-snippets.js +33 -1
package/dist/content/hook-manifest.d.ts +3 -4
package/dist/content/hook-manifest.js +11 -12
package/dist/content/hooks.js +44 -21
package/dist/content/ideate-command.d.ts +2 -0
package/dist/content/ideate-command.js +34 -25
package/dist/content/iron-laws.d.ts +5 -5
package/dist/content/iron-laws.js +5 -5
package/dist/content/language-policy.d.ts +2 -0
package/dist/content/language-policy.js +13 -0
package/dist/content/learnings.d.ts +3 -4
package/dist/content/learnings.js +26 -50
package/dist/content/meta-skill.js +33 -22
package/dist/content/next-command.js +41 -38
package/dist/content/node-hooks.js +17 -345
package/dist/content/opencode-plugin.js +5 -103
package/dist/content/research-playbooks.js +14 -14
package/dist/content/review-loop.d.ts +2 -0
package/dist/content/review-loop.js +8 -0
package/dist/content/session-hooks.js +15 -47
package/dist/content/skills.d.ts +0 -5
package/dist/content/skills.js +55 -128
package/dist/content/stage-common-guidance.d.ts +0 -1
package/dist/content/stage-common-guidance.js +17 -14
package/dist/content/stage-schema.d.ts +26 -1
package/dist/content/stage-schema.js +121 -40
package/dist/content/stages/_lint-metadata/index.js +9 -15
package/dist/content/stages/brainstorm.js +22 -43
package/dist/content/stages/design.js +37 -57
package/dist/content/stages/plan.js +22 -13
package/dist/content/stages/review.js +24 -27
package/dist/content/stages/scope.js +34 -46
package/dist/content/stages/ship.js +7 -4
package/dist/content/stages/spec.js +20 -9
package/dist/content/stages/tdd.js +64 -44
package/dist/content/start-command.js +13 -12
package/dist/content/status-command.d.ts +2 -7
package/dist/content/status-command.js +19 -146
package/dist/content/subagents.d.ts +0 -5
package/dist/content/subagents.js +51 -28
package/dist/content/templates.d.ts +1 -1
package/dist/content/templates.js +126 -135
package/dist/content/track-render-context.d.ts +17 -0
package/dist/content/track-render-context.js +44 -0
package/dist/content/tree-command.d.ts +1 -2
package/dist/content/tree-command.js +4 -87
package/dist/content/utility-skills.d.ts +2 -29
package/dist/content/utility-skills.js +2 -1534
package/dist/content/view-command.js +31 -11
package/dist/delegation.d.ts +1 -1
package/dist/delegation.js +5 -15
package/dist/doctor-registry.js +20 -21
package/dist/doctor.js +88 -344
package/dist/flow-state.d.ts +3 -0
package/dist/flow-state.js +2 -0
package/dist/harness-adapters.d.ts +1 -1
package/dist/harness-adapters.js +51 -58
package/dist/install.js +128 -358
package/dist/internal/advance-stage.js +3 -9
package/dist/internal/compound-readiness.d.ts +1 -1
package/dist/internal/compound-readiness.js +1 -1
package/dist/internal/tdd-loop-status.d.ts +1 -1
package/dist/internal/tdd-loop-status.js +1 -1
package/dist/knowledge-store.d.ts +16 -10
package/dist/knowledge-store.js +51 -15
package/dist/policy.js +16 -105
package/dist/run-archive.d.ts +4 -6
package/dist/run-archive.js +15 -20
package/dist/run-persistence.d.ts +2 -2
package/dist/run-persistence.js +3 -9
package/package.json +1 -2
package/dist/content/archive-command.d.ts +0 -2
package/dist/content/archive-command.js +0 -124
package/dist/content/compound-command.d.ts +0 -5
package/dist/content/compound-command.js +0 -193
package/dist/content/contexts.d.ts +0 -18
package/dist/content/contexts.js +0 -24
package/dist/content/contracts.d.ts +0 -2
package/dist/content/contracts.js +0 -51
package/dist/content/doctor-references.d.ts +0 -2
package/dist/content/doctor-references.js +0 -150
package/dist/content/eval-scaffold.d.ts +0 -15
package/dist/content/eval-scaffold.js +0 -370
package/dist/content/feature-command.d.ts +0 -2
package/dist/content/feature-command.js +0 -123
package/dist/content/flow-map.d.ts +0 -23
package/dist/content/flow-map.js +0 -134
package/dist/content/harness-doc.d.ts +0 -2
package/dist/content/harness-doc.js +0 -202
package/dist/content/harness-playbooks.d.ts +0 -24
package/dist/content/harness-playbooks.js +0 -393
package/dist/content/harness-tool-refs.d.ts +0 -20
package/dist/content/harness-tool-refs.js +0 -268
package/dist/content/ops-command.d.ts +0 -2
package/dist/content/ops-command.js +0 -71
package/dist/content/protocols.d.ts +0 -7
package/dist/content/protocols.js +0 -215
package/dist/content/retro-command.d.ts +0 -2
package/dist/content/retro-command.js +0 -165
package/dist/content/rewind-command.d.ts +0 -2
package/dist/content/rewind-command.js +0 -106
package/dist/content/tdd-log-command.d.ts +0 -2
package/dist/content/tdd-log-command.js +0 -85
package/dist/eval/agents/single-shot.d.ts +0 -27
package/dist/eval/agents/single-shot.js +0 -79
package/dist/eval/agents/with-tools.d.ts +0 -44
package/dist/eval/agents/with-tools.js +0 -261
package/dist/eval/agents/workflow.d.ts +0 -31
package/dist/eval/agents/workflow.js +0 -155
package/dist/eval/baseline.d.ts +0 -38
package/dist/eval/baseline.js +0 -282
package/dist/eval/config-loader.d.ts +0 -14
package/dist/eval/config-loader.js +0 -395
package/dist/eval/corpus.d.ts +0 -30
package/dist/eval/corpus.js +0 -330
package/dist/eval/cost-guard.d.ts +0 -102
package/dist/eval/cost-guard.js +0 -190
package/dist/eval/diff.d.ts +0 -64
package/dist/eval/diff.js +0 -323
package/dist/eval/llm-client.d.ts +0 -176
package/dist/eval/llm-client.js +0 -267
package/dist/eval/mode.d.ts +0 -28
package/dist/eval/mode.js +0 -61
package/dist/eval/progress.d.ts +0 -83
package/dist/eval/progress.js +0 -59
package/dist/eval/report.d.ts +0 -11
package/dist/eval/report.js +0 -181
package/dist/eval/rubric-loader.d.ts +0 -20
package/dist/eval/rubric-loader.js +0 -143
package/dist/eval/runner.d.ts +0 -81
package/dist/eval/runner.js +0 -746
package/dist/eval/runs.d.ts +0 -41
package/dist/eval/runs.js +0 -114
package/dist/eval/sandbox.d.ts +0 -38
package/dist/eval/sandbox.js +0 -137
package/dist/eval/tools/glob.d.ts +0 -2
package/dist/eval/tools/glob.js +0 -163
package/dist/eval/tools/grep.d.ts +0 -2
package/dist/eval/tools/grep.js +0 -152
package/dist/eval/tools/index.d.ts +0 -7
package/dist/eval/tools/index.js +0 -35
package/dist/eval/tools/read.d.ts +0 -2
package/dist/eval/tools/read.js +0 -122
package/dist/eval/tools/types.d.ts +0 -49
package/dist/eval/tools/types.js +0 -41
package/dist/eval/tools/write.d.ts +0 -2
package/dist/eval/tools/write.js +0 -92
package/dist/eval/types.d.ts +0 -561
package/dist/eval/types.js +0 -47
package/dist/eval/verifiers/judge.d.ts +0 -40
package/dist/eval/verifiers/judge.js +0 -256
package/dist/eval/verifiers/rules.d.ts +0 -24
package/dist/eval/verifiers/rules.js +0 -218
package/dist/eval/verifiers/structural.d.ts +0 -14
package/dist/eval/verifiers/structural.js +0 -171
package/dist/eval/verifiers/traceability.d.ts +0 -23
package/dist/eval/verifiers/traceability.js +0 -84
package/dist/eval/verifiers/workflow-consistency.d.ts +0 -21
package/dist/eval/verifiers/workflow-consistency.js +0 -225
package/dist/eval/workflow-corpus.d.ts +0 -7
package/dist/eval/workflow-corpus.js +0 -207
package/dist/feature-system.d.ts +0 -42
package/dist/feature-system.js +0 -432
package/dist/internal/knowledge-digest.d.ts +0 -7
package/dist/internal/knowledge-digest.js +0 -93

package/README.md CHANGED Viewed

@@ -25,8 +25,7 @@ operational knobs to memorise.
   changes across multiple harnesses and languages.
 - Staff engineers and tech leads who want **enforceable discipline**:
   locked-in decisions, no placeholders, mandatory TDD, traceable plans.
-- Maintainers of AI agents/skills who want **measurable prompt engineering**
-  via the built-in eval harness.
+- Maintainers who want a compact, file-backed flow their harness agents can actually follow.
 ---
@@ -76,7 +75,7 @@ You ──► /cc <idea>
    cclaw reads state + knowledge, guides execution
         │
         ▼
-   artifacts written, checkpoint saved
+   artifacts written, handoff captured
         │
         ▼
    next stage is explicit in flow-state.json
@@ -86,7 +85,14 @@ You ──► /cc <idea>
 ## 30-second install
+Requirements:
+- Node.js **20+** (matches the package `engines` field).
+- Run from the **git project root** you want cclaw to manage, not from `~`
+  or a nested package directory.
 ```bash
+cd /path/to/your/repo
 npx cclaw-cli
 ```
@@ -102,26 +108,23 @@ Everything day-to-day happens inside your harness (Claude Code, Cursor,
 OpenCode, or Codex); optional maintenance commands are listed in the
 CLI reference.
+If cclaw says it is not installed, either run `npx cclaw-cli init` in the
+repo root or `cd` to the project that already contains `.cclaw/`.
 ### What gets generated
 ```text
 .cclaw/
-├── commands/           # stage + utility command contracts (markdown)
-├── skills/             # stage + utility skills loaded by the harness
-├── contexts/           # cross-cutting context modes (research, debugging, …)
+├── commands/           # four entrypoints: /cc, /cc-next, /cc-ideate, /cc-view
+├── skills/             # flow-critical skills loaded by the harness
 ├── templates/          # artifact skeletons for each stage
-├── rules/              # lint-style rules surfaced to the agent
-├── adapters/           # per-harness translation notes
-├── agents/             # subagent definitions (planner, reviewer, …)
-├── hooks/              # harness-agnostic hook scripts
-├── worktrees/          # isolated feature worktrees (power-user, via /cc-ops)
-├── artifacts/          # active feature artifacts (00-idea.md → 09-retro.md)
-├── runs/               # archived feature snapshots: YYYY-MM-DD-slug/
-├── references/         # (optional) pinned copies of reference frameworks
-├── evals/              # eval corpus, rubrics, baselines, reports
-├── custom-skills/      # user-authored skills (never overwritten)
-├── state/              # flow-state.json + delegation-log.json + activity
-└── knowledge.jsonl     # append-only, strict-schema lessons + patterns
+├── rules/              # opt-in language rule packs
+├── agents/             # subagent definitions
+├── hooks/              # harness-agnostic hook runtime
+├── artifacts/          # active run artifacts (00-idea.md -> 09-retro.md)
+├── runs/               # archived run snapshots: YYYY-MM-DD-slug/
+├── state/              # flow-state.json + stage activity log
+└── knowledge.jsonl     # append-only lessons + patterns
 ```
 Plus harness-specific shims:
@@ -133,9 +136,10 @@ Plus harness-specific shims:
   activated via `/use cc` or description-based auto-matching. Hooks
   require Codex CLI ≥ v0.114 and `[features] codex_hooks = true` in
   `~/.codex/config.toml`; `cclaw init --codex` offers to patch that flag
-  for you. `.codex/commands/` and the legacy `.agents/skills/cclaw-cc*/`
-  folders are auto-cleaned on sync.)
+  for you. `cclaw doctor` reports stale legacy Codex layouts.)
 - `AGENTS.md` with a managed routing block (includes a Codex-specific note)
+  — see [`docs/agents-block.example.md`](./docs/agents-block.example.md)
+  for a static example of what the harness reads.
 ### `.cclaw/config.yaml` — the minimal surface
@@ -172,21 +176,22 @@ Full key-by-key reference: [`docs/config.md`](./docs/config.md).
 ## The four commands you actually use
 All four appear as slash commands in every supported harness. This is the
-top-level user surface — everything else is either automatic or happens
-inside `/cc-ops` subcommands.
+top-level user surface: `/cc`, `/cc-next`, `/cc-ideate`, and `/cc-view status`
+cover the happy path. Operator/support tools stay separate so the harness
+does not feel like a command framework.
 | Command | What it does |
 |---|---|
 | **`/cc <idea>`** | Classify the task, discover origin docs (`docs/prd/**`, ADRs, root `PRD.md`, …), sniff the stack, recommend a track, then start the first stage of that track. `/cc` without arguments resumes the current flow. |
 | **`/cc-next`** | The one progression primitive. Reads `flow-state.json`, checks gates + mandatory subagent delegations, and either resumes the current stage or advances to the next. `/cc-next` in a new session is how you **resume**. |
 | **`/cc-ideate`** | Repository improvement ideate mode. Scans for TODOs, flaky tests, oversized modules, docs drift, and recurring knowledge-store lessons, **persists the ranked backlog** to `.cclaw/artifacts/ideate-<date>-<slug>.md`, and ends with a concrete handoff: launch `/cc` on the selected candidate in the same session, save-and-close, or discard. Resume check on next run reuses any ideate artifact younger than 30 days. Never mutates `flow-state.json`. |
-| **`/cc-view`** | Read-only flow visibility. `/cc-view status` (default) shows stage progress, mandatory delegations with their fulfillment mode (isolated / generic-dispatch / role-switch), the ship closeout substate (retro → compound → archive), and the active harness parity row. `/cc-view tree` renders the same picture as a tree with a closeout sub-branch under ship and a per-harness playbook summary. `/cc-view diff` shows stage/gate/closeout/delegation deltas since the last run. Never mutates state (except diff's snapshot baseline). |
+| **`/cc-view`** | Read-only flow visibility. `/cc-view status` (default) shows stage progress, mandatory delegations with their fulfillment mode (isolated / generic-dispatch / role-switch), the ship closeout substate (retro → compound → archive), and the active harness parity row. `/cc-view tree` renders the same picture as a tree with a closeout sub-branch under ship and harness capability status from `cclaw doctor --explain`. `/cc-view diff` shows stage/gate/closeout/delegation changes from visible state and git evidence. Never mutates state. |
-> Power-user surface: `/cc-ops` is an operational router for manual
-> overrides (rewind a stale stage, manage parallel features, re-run a
-> compound pass). `/cc-learn` is the strict-schema knowledge writer —
-> agents call it automatically from completion protocols; you rarely
-> invoke it by hand.
+Operational extras stay off the main surface: `/cc-next` handles progression
+and closeout, `cclaw archive` handles explicit archival/reset, and
+`cclaw doctor` verifies install/runtime wiring. Doctor is not a replacement
+for a real harness smoke test; it catches broken files, stale hooks, and
+schema drift before the user loses a run.
 ### Example first-run
@@ -260,7 +265,7 @@ Each critical-path stage produces a dated artifact under
 `02a-research.md` (design research fleet synthesis), `03-design.md` through
 `08-ship.md`. Closeout adds `09-retro.md`; archive then rolls the whole
 bundle into `.cclaw/runs/<YYYY-MM-DD-slug>/` and resets the active flow for
-the next feature.
+the next run.
 ### Track heuristics are configurable (advisory)
@@ -312,9 +317,7 @@ it into ceremony:
 - **Mandatory subagent delegation** at TDD, with per-harness waivers.
 - **Turn Announce Discipline.** Every stage entry/exit emits a visible
   line so users can see what the agent is doing, not just what it says.
-- **Extracted protocols.** Decision, Completion, and Ethos protocols live
-  in a single place (`.cclaw/contexts/`), so every skill speaks the same
-  dialect.
+- **Inline protocols.** Decision, Completion, and Ethos discipline is embedded in the active stage skill so users do not need to chase generated reference files.
 - **Knowledge capture throughout the flow.** Every stage completion
   protocol emits typed entries (`rule` / `pattern` / `lesson`) to
   `.cclaw/knowledge.jsonl` as the flow progresses — not only at retro.
@@ -334,7 +337,7 @@ it into ceremony:
 The `tdd` stage is not prose guidance. It requires:
-- an explicit **RED** test run (logged to `.cclaw/state/stage-activity.jsonl`)
+- an explicit **RED** test run (captured in `.cclaw/artifacts/06-tdd.md`)
 - a mandatory **`test-author`** subagent dispatch (logged to
   `.cclaw/state/delegation-log.json`)
 - a **GREEN** full-suite run before exit
@@ -349,7 +352,7 @@ subagent as `completed` (or, on Codex / OpenCode, role-switched with
 ## Ship and closeout — automatic, resumable
 Shipping writes `08-ship.md`. `/cc-next` then automatically walks the
-feature through a deterministic three-step closeout without extra
+run through a deterministic three-step closeout without extra
 commands from you:
 1. **Retro (`09-retro.md`).** cclaw drafts a retrospective from your
@@ -375,9 +378,7 @@ If your session dies mid-closeout, a new `/cc-next` resumes at the
 exact step — retro drafts are not regenerated and no structured ask is
 repeated silently.
-You can still invoke each step manually (`/cc-ops retro`, `/cc-ops
-compound`, `/cc-ops archive`), but for the default path you do not need
-to: `/cc-next` is the only command.
+For the default path, `/cc-next` is the only command; explicit archival/reset remains available through `cclaw archive`.
 ---
@@ -386,12 +387,12 @@ to: `/cc-next` is the only command.
 cclaw is honest about what each harness can and cannot do, and it
 closes every real gap with a documented fallback — not a silent waiver.
-| Harness | Dispatch | Fallback | Hook surface | Structured ask | Playbook |
-|---|---|---|---|---|---|
-| Claude Code | full (named subagents) | `native` | full | `AskUserQuestion` | [`claude-playbook.md`](./src/content/harness-playbooks.ts) |
-| Cursor | generic Task dispatcher | `generic-dispatch` | full | `AskQuestion` | `cursor-playbook.md` |
-| OpenCode | plugin / in-session | `role-switch` | plugin | `question` (permission-gated; `permission.question: "allow"`) | `opencode-playbook.md` |
-| OpenAI Codex | in-session only | `role-switch` (evidenceRefs required) | limited (Bash-only `PreToolUse`/`PostToolUse`; requires `codex_hooks` feature flag) | `request_user_input` (experimental; Plan / Collaboration mode) | `codex-playbook.md` |
+| Harness | Dispatch | Fallback | Hook surface | Structured ask |
+|---|---|---|---|---|
+| Claude Code | full (named subagents) | `native` | full | `AskUserQuestion` |
+| Cursor | generic Task dispatcher | `generic-dispatch` | full | `AskQuestion` |
+| OpenCode | plugin / in-session | `role-switch` | plugin | `question` (permission-gated; `permission.question: "allow"`) |
+| OpenAI Codex | in-session only | `role-switch` (evidenceRefs required) | limited (Bash-only `PreToolUse`/`PostToolUse`; requires `codex_hooks` feature flag) | `request_user_input` (experimental; Plan / Collaboration mode) |
 What the fallbacks mean:
@@ -401,8 +402,7 @@ What the fallbacks mean:
   vocabulary of `subagent_type`s (`explore`, `generalPurpose`, …).
   cclaw maps each named agent (planner / reviewer / test-author /
   security-reviewer / doc-updater) onto the generic dispatcher with a
-  structured role prompt. Per-agent mapping lives in the Cursor
-  playbook.
+  structured role prompt.
 - `role-switch` — OpenCode and Codex lack an isolated worker primitive.
   The agent announces the role in-session, performs the work, and
   records a delegation row with `fulfillmentMode: "role-switch"` and at
@@ -418,10 +418,10 @@ What the fallbacks mean:
 > (Jan 2026), but Codex ≥ v0.114 (Mar 2026) grew an experimental
 > lifecycle hooks API. cclaw installs Codex entry points as native
 > **skills** under `.agents/skills/cc*/SKILL.md` (invoke with `/use cc`,
-> `/use cc-next`, `/use cc-view`, `/use cc-ops`, `/use cc-ideate`, or
+> `/use cc-next`, `/use cc-view`, `/use cc-ideate`, or
 > by typing `/cc …` in plain text — Codex auto-matches from the skill
 > description) **and** writes `.codex/hooks.json` so session-start
-> rehydration, stop-checkpoint, prompt-guard, workflow-guard, and
+> rehydration, stop-handoff, prompt-guard, workflow-guard, and
 > context-monitor fire automatically — as long as you enable the
 > `codex_hooks` feature flag in `~/.codex/config.toml`. `cclaw init
 > --codex` asks for consent before patching that file. Codex's
@@ -431,59 +431,32 @@ What the fallbacks mean:
 > and any legacy layout to clean up.
 The full capability matrix lives in
-[`docs/harnesses.md`](./docs/harnesses.md). Per-harness playbooks are
-generated into `.cclaw/references/harnesses/` on every install and
-upgrade; stage skills cite them by path.
-Runtime state:
-- `.cclaw/state/harness-gaps.json` (schema v2) — per-harness list of
-  missing capabilities, missing hook events, the declared fallback, the
-  playbook path, and a `remediation[]` list you can act on.
-- `cclaw doctor` — asserts every installed harness has its playbook on
-  disk and surfaces the expected fulfillment mode inside the
-  `delegation:mandatory:current_stage` check.
----
+[`docs/harnesses.md`](./docs/harnesses.md). Harness capability gaps are
+reported by `cclaw doctor` instead of generating reference files into the
+user project.
-## Eval-driven prompt engineering
-cclaw ships with `cclaw-cli eval` — a three-tier regression harness for
-the skills and contracts the runtime generates. Use it when you change a
-stage skill, tweak a prompt, or swap a model.
-Works with any OpenAI-compatible endpoint — Zhipu AI GLM, OpenAI, Together,
-self-hosted vLLM — via three environment variables:
-```bash
-CCLAW_EVAL_API_KEY=...
-CCLAW_EVAL_BASE_URL=https://api.z.ai/api/coding/paas/v4   # default
-CCLAW_EVAL_MODEL=glm-5.1                                  # default
-```
-Full details, corpus format, and the eval contract live in
-[`docs/evals.md`](./docs/evals.md).
-Mutation-testing setup lives in `stryker.config.mjs` and
-`.github/workflows/mutation.yml` (manual + weekly run).
+Runtime state stays small: `flow-state.json` is the source of truth, while
+stage activity is an append-only trace for what happened during the run.
+Derived diagnostics are produced on demand by `cclaw doctor`.
 ---
 ## CLI reference
-The CLI is deliberately small. Everything operational happens inside
-your harness.
+`cclaw-cli` is deliberately small: it installs, syncs, upgrades, diagnoses, and removes the generated harness runtime. Day-to-day flow work happens inside your harness via `/cc*` commands and Node hooks.
 ```bash
 npx cclaw-cli                   # launches interactive setup (or prints
                                 # a one-line status hint if already installed)
 npx cclaw-cli sync              # re-materialize generated runtime from config.yaml
 npx cclaw-cli upgrade           # refresh generated files; preserves .cclaw/config.yaml
-npx cclaw-cli archive           # archive current run and reset flow-state
+npx cclaw-cli archive           # explicit/manual archive; normal post-ship closeout uses /cc-next
 npx cclaw-cli uninstall         # remove .cclaw + generated harness shims
-npx cclaw-cli eval …            # maintainer surface (see docs/evals.md)
 npx cclaw-cli --version
 ```
+The generated `node .cclaw/hooks/stage-complete.mjs <stage>` helper is the canonical stage-closeout path and must not require a runtime `cclaw` binary in `PATH`.
 For CI or scripted installs, `cclaw-cli init --harnesses=<list>
 --no-interactive` is the non-interactive form. All other tunables
 (prompt-guard strictness, TDD enforcement, language rule packs, track

package/dist/artifact-linter.d.ts CHANGED Viewed

@@ -28,6 +28,8 @@ export interface LearningSeedEntry {
     domain?: string | null;
     stage?: FlowStage | null;
     origin_stage?: FlowStage | null;
+    origin_run?: string | null;
+    /** @deprecated Use `origin_run`. Accepted only for legacy learning bullets. */
     origin_feature?: string | null;
     frequency?: number;
     universality?: LearningUniversality;
@@ -37,6 +39,8 @@ export interface LearningSeedEntry {
     last_seen_ts?: string;
     project?: string | null;
     source?: LearningSource | null;
+    supersedes?: string[];
+    superseded_by?: string;
 }
 export interface LearningsParseResult {
     ok: boolean;

package/dist/artifact-linter.js CHANGED Viewed

@@ -780,6 +780,7 @@ const LEARNING_ALLOWED_KEYS = new Set([
     "domain",
     "stage",
     "origin_stage",
+    "origin_run",
     "origin_feature",
     "frequency",
     "universality",
@@ -788,7 +789,9 @@ const LEARNING_ALLOWED_KEYS = new Set([
     "first_seen_ts",
     "last_seen_ts",
     "project",
-    "source"
+    "source",
+    "supersedes",
+    "superseded_by"
 ]);
 function isIsoUtcTimestamp(value) {
     return /^\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}Z$/u.test(value);
@@ -862,6 +865,9 @@ function parseLearningSeedEntry(raw, index) {
             error: `Learnings bullet #${index} field "origin_stage" must be one of ${FLOW_STAGES.join(", ")} or null.`
         };
     }
+    if (obj.origin_run !== undefined && !isNullableString(obj.origin_run)) {
+        return { ok: false, error: `Learnings bullet #${index} field "origin_run" must be string or null.` };
+    }
     if (obj.origin_feature !== undefined && !isNullableString(obj.origin_feature)) {
         return { ok: false, error: `Learnings bullet #${index} field "origin_feature" must be string or null.` };
     }
@@ -906,6 +912,17 @@ function parseLearningSeedEntry(raw, index) {
             };
         }
     }
+    if (obj.supersedes !== undefined) {
+        if (!Array.isArray(obj.supersedes) ||
+            obj.supersedes.length === 0 ||
+            obj.supersedes.some((value) => typeof value !== "string" || value.trim().length === 0)) {
+            return { ok: false, error: `Learnings bullet #${index} field "supersedes" must be a non-empty array of strings.` };
+        }
+    }
+    if (obj.superseded_by !== undefined &&
+        (typeof obj.superseded_by !== "string" || obj.superseded_by.trim().length === 0)) {
+        return { ok: false, error: `Learnings bullet #${index} field "superseded_by" must be a non-empty string.` };
+    }
     return {
         ok: true,
         entry: {
@@ -1002,7 +1019,6 @@ const FRONTMATTER_REQUIRED_KEYS = [
     "stage",
     "schema_version",
     "version",
-    "feature",
     "locked_decisions",
     "inputs_hash"
 ];
@@ -1271,6 +1287,11 @@ export async function lintArtifact(projectRoot, stage, track = "standard") {
         const value = parsedFrontmatter.values[key];
         return typeof value !== "string" || value.trim().length === 0;
     });
+    if (parsedFrontmatter.hasFrontmatter &&
+        typeof parsedFrontmatter.values.run !== "string" &&
+        typeof parsedFrontmatter.values.feature !== "string") {
+        frontmatterMissingKeys.push("run");
+    }
     const frontmatterStage = parsedFrontmatter.values.stage?.replace(/^['"]|['"]$/gu, "");
     const frontmatterSchemaVersion = parsedFrontmatter.values.schema_version?.replace(/^['"]|['"]$/gu, "");
     const frontmatterInputsHash = parsedFrontmatter.values.inputs_hash?.replace(/^['"]|['"]$/gu, "");
@@ -1283,7 +1304,7 @@ export async function lintArtifact(projectRoot, stage, track = "standard") {
     findings.push({
         section: "Frontmatter",
         required: requireFrontmatter,
-        rule: "Artifact must include frontmatter keys (stage, schema_version=1, version, feature, locked_decisions, inputs_hash=sha256:pending|sha256:<64hex>).",
+        rule: "Artifact must include frontmatter keys (stage, schema_version=1, version, run, locked_decisions, inputs_hash=sha256:pending|sha256:<64hex>). Legacy feature is accepted during migration.",
         found: parsedFrontmatter.hasFrontmatter ? frontmatterValid : true,
         details: !parsedFrontmatter.hasFrontmatter
             ? "Legacy artifact without YAML frontmatter (allowed for backward compatibility)."

package/dist/cli.d.ts CHANGED Viewed

@@ -1,7 +1,6 @@
 #!/usr/bin/env node
 import type { FlowTrack, HarnessId } from "./types.js";
-import type { EvalMode } from "./eval/types.js";
-type CommandName = "init" | "sync" | "doctor" | "upgrade" | "uninstall" | "archive" | "eval" | "internal";
+type CommandName = "init" | "sync" | "doctor" | "upgrade" | "uninstall" | "archive" | "internal";
 interface ParsedArgs {
     command?: CommandName;
     harnesses?: HarnessId[];
@@ -16,23 +15,6 @@ interface ParsedArgs {
     archiveName?: string;
     archiveSkipRetro?: boolean;
     archiveSkipRetroReason?: string;
-    evalStage?: string;
-    evalMode?: EvalMode;
-    evalSchemaOnly?: boolean;
-    evalRules?: boolean;
-    evalJudge?: boolean;
-    evalJson?: boolean;
-    evalNoWrite?: boolean;
-    evalUpdateBaseline?: boolean;
-    evalConfirm?: boolean;
-    evalQuiet?: boolean;
-    evalMaxCostUsd?: number;
-    /** Optional subcommand after `eval`. */
-    evalSubcommand?: "diff" | "runs";
-    /** Positional arguments for eval subcommands (e.g. `diff <old> <new>`). */
-    evalArgs?: string[];
-    evalBackground?: boolean;
-    evalCompareModel?: string;
     /** Hidden plumbing command (`cclaw internal ...`) arguments. */
     internalArgs?: string[];
     showHelp?: boolean;