npm - valent-pipeline - Versions diffs - 0.7.0 → 0.17.1 - Mend

valent-pipeline 0.7.0 → 0.17.1

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (187) hide show

package/README.md +65 -54
package/bin/cli.js +502 -40
package/package.json +2 -3
package/pipeline/docs/agent-reference.md +6 -5
package/pipeline/docs/communication-standard.md +1 -1
package/pipeline/docs/index.md +1 -1
package/pipeline/docs/knowledge-system.md +12 -12
package/pipeline/docs/npx-implementation-plan.md +5 -7
package/pipeline/docs/npx-packaging.md +10 -13
package/pipeline/docs/pipeline-overview.md +11 -11
package/pipeline/docs/task-graph.md +2 -2
package/pipeline/docs/template-skeleton.md +1 -1
package/pipeline/orchestrators/claude-code/README.md +21 -23
package/pipeline/orchestrators/claude-code/plan.workflow.js +177 -60
package/pipeline/orchestrators/claude-code/retro.workflow.js +31 -14
package/pipeline/orchestrators/claude-code/sprint.workflow.js +1721 -257
package/pipeline/prompts/bend.md +10 -21
package/pipeline/prompts/critic.md +12 -23
package/pipeline/prompts/data.md +8 -9
package/pipeline/prompts/docgen.md +8 -9
package/pipeline/prompts/fend.md +10 -21
package/pipeline/prompts/iac.md +10 -11
package/pipeline/prompts/judge.md +10 -22
package/pipeline/prompts/libdev.md +8 -9
package/pipeline/prompts/mcp-dev.md +8 -9
package/pipeline/prompts/mobile.md +10 -11
package/pipeline/prompts/pmcp.md +1 -1
package/pipeline/prompts/qa-a.md +22 -15
package/pipeline/prompts/qa-b.md +13 -23
package/pipeline/prompts/reqs.md +10 -11
package/pipeline/prompts/retrospective.md +8 -8
package/pipeline/prompts/uxa.md +9 -10
package/pipeline/schemas/atdd-proof.schema.json +62 -0
package/pipeline/schemas/atdd-red-baseline.schema.json +78 -0
package/pipeline/schemas/bugs-block.schema.json +30 -0
package/pipeline/schemas/evidence-assert.schema.json +63 -0
package/pipeline/schemas/evidence-baseline.schema.json +38 -0
package/pipeline/schemas/evidence-run.schema.json +118 -0
package/pipeline/schemas/gate-pin.schema.json +20 -0
package/pipeline/schemas/qa-spec-manifest.schema.json +53 -0
package/pipeline/schemas/reqs-manifest.schema.json +28 -0
package/pipeline/schemas/verdict.schema.json +5 -0
package/pipeline/steps/bend/estimate.md +1 -1
package/pipeline/steps/bend/handoff.md +2 -2
package/pipeline/steps/bend/read-inputs.md +2 -2
package/pipeline/steps/bend/write-tests.md +8 -5
package/pipeline/steps/common/agent-protocol.md +13 -31
package/pipeline/steps/common/distilled-handoff-format.md +2 -2
package/pipeline/steps/common/no-api-passthrough.md +1 -1
package/pipeline/steps/common/no-ui-passthrough.md +1 -1
package/pipeline/steps/critic/acceptance-audit.md +8 -6
package/pipeline/steps/critic/write-verdict.md +6 -12
package/pipeline/steps/data/estimate.md +1 -1
package/pipeline/steps/data/handoff.md +2 -2
package/pipeline/steps/data/read-inputs.md +2 -2
package/pipeline/steps/data/write-tests.md +5 -0
package/pipeline/steps/docgen/estimate.md +1 -1
package/pipeline/steps/docgen/handoff.md +2 -2
package/pipeline/steps/docgen/read-inputs.md +2 -2
package/pipeline/steps/docgen/write-tests.md +5 -0
package/pipeline/steps/fend/estimate.md +1 -1
package/pipeline/steps/fend/handoff.md +3 -3
package/pipeline/steps/fend/read-inputs.md +2 -2
package/pipeline/steps/fend/write-tests.md +8 -5
package/pipeline/steps/iac/estimate.md +1 -1
package/pipeline/steps/iac/handoff.md +2 -2
package/pipeline/steps/iac/implement.md +1 -1
package/pipeline/steps/iac/read-inputs.md +2 -2
package/pipeline/steps/iac/write-tests.md +7 -4
package/pipeline/steps/judge/bug-review.md +1 -1
package/pipeline/steps/judge/evidence-review.md +31 -17
package/pipeline/steps/judge/ship-decision.md +3 -6
package/pipeline/steps/libdev/estimate.md +1 -1
package/pipeline/steps/libdev/handoff.md +2 -2
package/pipeline/steps/libdev/read-inputs.md +2 -2
package/pipeline/steps/libdev/write-tests.md +5 -0
package/pipeline/steps/mcp-dev/estimate.md +1 -1
package/pipeline/steps/mcp-dev/handoff.md +2 -2
package/pipeline/steps/mcp-dev/read-inputs.md +2 -2
package/pipeline/steps/mcp-dev/write-tests.md +5 -0
package/pipeline/steps/mobile/emulator-lifecycle.md +2 -2
package/pipeline/steps/mobile/estimate.md +1 -1
package/pipeline/steps/mobile/handoff.md +3 -6
package/pipeline/steps/mobile/read-inputs.md +2 -2
package/pipeline/steps/mobile/write-tests.md +8 -5
package/pipeline/steps/orchestration/bug-intake.md +4 -1
package/pipeline/steps/orchestration/git-flow.md +99 -0
package/pipeline/steps/orchestration/pm-autonomy.md +109 -0
package/pipeline/steps/orchestration/resolve-next-work-item.md +52 -27
package/pipeline/steps/orchestration/update-backlog-status.md +84 -69
package/pipeline/steps/orchestration/validate-story-inputs.md +3 -1
package/pipeline/steps/qa-a/read-inputs.md +4 -4
package/pipeline/steps/qa-a/self-attack.md +14 -0
package/pipeline/steps/qa-a/write-acceptance-tests.md +45 -0
package/pipeline/steps/qa-a/write-spec.md +8 -4
package/pipeline/steps/qa-b/api.md +10 -3
package/pipeline/steps/qa-b/execute-tests.md +20 -1
package/pipeline/steps/qa-b/file-bugs.md +12 -1
package/pipeline/steps/qa-b/write-report.md +18 -10
package/pipeline/steps/reqs/pre-mortem.md +1 -1
package/pipeline/steps/reqs/read-inputs.md +3 -3
package/pipeline/steps/reqs/write-output.md +16 -1
package/pipeline/steps/retrospective/directives.md +10 -4
package/pipeline/steps/retrospective/embed-instructions.md +1 -2
package/pipeline/steps/retrospective/report.md +5 -2
package/pipeline/steps/uxa/read-inputs.md +2 -2
package/pipeline/steps/uxa/write-output.md +0 -1
package/pipeline/task-graphs/backend-api.yaml +3 -84
package/pipeline/task-graphs/data-pipeline.yaml +3 -84
package/pipeline/task-graphs/document-generation.yaml +3 -84
package/pipeline/task-graphs/frontend-only.yaml +3 -92
package/pipeline/task-graphs/fullstack-web.yaml +4 -102
package/pipeline/task-graphs/library.yaml +3 -84
package/pipeline/task-graphs/mcp-server.yaml +3 -84
package/pipeline/task-graphs/mobile-app.yaml +3 -92
package/pipeline/templates/bugs.template.md +12 -0
package/pipeline/templates/embed-instructions.template.md +1 -1
package/pipeline/templates/qa-test-spec.template.md +6 -2
package/pipeline/templates/reqs-brief.template.md +2 -1
package/pipeline/templates/retrospective.template.md +1 -1
package/pipeline/templates/story-report.template.md +1 -1
package/pipeline/templates/uxa-spec.template.md +1 -1
package/pipeline/templates/visual-validation-checklist.template.md +1 -1
package/skills/valent-configure/SKILL.md +37 -7
package/skills/valent-debug-export/SKILL.md +1 -2
package/skills/valent-help/SKILL.md +5 -5
package/skills/valent-knowledge/SKILL.md +3 -7
package/skills/valent-resume/SKILL.md +3 -3
package/skills/valent-review-cost/SKILL.md +2 -2
package/skills/valent-run-deferred-tests/SKILL.md +17 -8
package/skills/valent-run-epic-workflow/SKILL.md +60 -15
package/skills/valent-run-project-workflow/SKILL.md +39 -14
package/skills/valent-run-spike/SKILL.md +96 -0
package/skills/valent-run-story-workflow/SKILL.md +7 -7
package/skills/valent-setup-backlog/SKILL.md +43 -2
package/src/commands/analyze.js +204 -0
package/src/commands/audit.js +13 -1
package/src/commands/backlog.js +376 -0
package/src/commands/check-spec-conformance.js +21 -1
package/src/commands/crosscheck.js +113 -0
package/src/commands/db-directives.js +0 -0
package/src/commands/db-index.js +3 -70
package/src/commands/db-query.js +14 -1
package/src/commands/db-rebuild.js +10 -10
package/src/commands/detect-project.js +36 -0
package/src/commands/evidence.js +609 -0
package/src/commands/git-flow.js +143 -0
package/src/commands/init.js +89 -10
package/src/commands/rejection-cap.js +20 -15
package/src/commands/resolve-eligible.js +16 -2
package/src/commands/spec-check.js +72 -0
package/src/commands/sprint-pack.js +15 -2
package/src/commands/trace.js +99 -0
package/src/commands/upgrade.js +8 -1
package/src/commands/validate.js +7 -0
package/src/lib/analyze.js +173 -0
package/src/lib/audit.js +1 -0
package/src/lib/backlog-lint.js +160 -0
package/src/lib/backlog.js +559 -0
package/src/lib/config-schema.js +227 -9
package/src/lib/crosscheck.js +141 -0
package/src/lib/db.js +21 -28
package/src/lib/detect.js +387 -0
package/src/lib/evidence.js +0 -0
package/src/lib/git-flow.js +701 -0
package/src/lib/graph.js +25 -4
package/src/lib/handoff.js +16 -6
package/src/lib/junit.js +231 -0
package/src/lib/locked-file.js +61 -0
package/src/lib/obsolete-manifest.js +11 -0
package/src/lib/spec-check.js +98 -0
package/src/lib/spec-conformance.js +39 -3
package/src/lib/sprint.js +150 -23
package/src/lib/trace.js +199 -0
package/pipeline/prompts/readiness.md +0 -73
package/pipeline/providers/claude-code/runtime.md +0 -148
package/pipeline/providers/claude-code/spawn.template.md +0 -16
package/pipeline/scripts/db-bootstrap.ts +0 -153
package/pipeline/scripts/embed-sqlite.ts +0 -288
package/pipeline/scripts/embed.ts +0 -425
package/pipeline/scripts/query-kb.ts +0 -183
package/pipeline/spawn-templates/agent-spawn.template.md +0 -16
package/pipeline/spawn-templates/pipeline-context.template.md +0 -47
package/pipeline/steps/orchestration/load-pipeline-config.md +0 -39
package/pipeline/steps/readiness/sprint-review.md +0 -45
package/pipeline/steps/readiness/standalone-review.md +0 -131
package/pipeline/templates/readiness-review.template.md +0 -147

package/README.md CHANGED Viewed

@@ -29,23 +29,24 @@ npx valent-pipeline init
 ## How It Works
-A persistent **Lead** agent reads your story, assembles a team of specialist agents, and orchestrates them through a dependency-driven pipeline:
+A deterministic **Workflow orchestrator** (`sprint.workflow.js`) reads your story, spawns specialist agents per task, and drives them through a dependency-driven pipeline:
 ```
-REQS -> UXA -> QA-A -> READINESS -> BEND + FEND -> CRITIC -> QA-B -> JUDGE -> SHIP
+REQS -> UXA -> QA-A -> SPECCHECK -> RED -> BEND + FEND -> STATIC -> CRITIC -> GREEN -> QA-B -> EVIDENCE -> JUDGE -> SHIP
 ```
-1. **REQS** translates acceptance criteria into an implementation brief
+1. **REQS** translates acceptance criteria into an implementation brief (+ a machine-readable AC manifest)
 2. **UXA** converts UX specs into component specifications (frontend projects)
-3. **QA-A** writes behavioral test specifications *before any code exists*
-4. **READINESS** gate validates the spec chain -- stops on first failure
+3. **QA-A** writes behavioral test specifications *before any code exists* (+ a spec manifest mapping every case to its AC)
+4. **SPECCHECK** gate validates the spec chain mechanically (`valent spec check` + `trace check`); **RED** gate proves the acceptance suite fails pre-implementation (ATDD)
 5. **BEND + FEND** implement production code and tests in parallel
-6. **CRITIC** runs a 3-pass adversarial code review (blind hunt, edge cases, acceptance audit)
-7. **QA-B** executes tests against real infrastructure, files bugs, builds traceability matrix
-8. **JUDGE** makes an evidence-based SHIP or REJECT decision
-9. **Lead** commits code, writes the story report, and picks the next story
+6. **STATIC** gate runs deterministic checks at mechanical cost: lint/type commands, spec-conformance (no dropped assertion targets or un-waived skips), trace check (every AC has a covering case)
+7. **CRITIC** runs a 3-pass adversarial code review (blind hunt, edge cases, acceptance audit), pinning the git SHA it reviewed
+8. **QA-B** executes tests against real infrastructure **through `evidence run`** — exit codes, full logs, junit reports (frozen + SHA-256-hashed), and the git SHA are captured by the CLI, never transcribed by a model — then files bugs and builds the traceability matrix
+9. **EVIDENCE** gate deterministically re-verifies the machine record: report hashes intact, junit green (with the brownfield carve-out for pre-existing failures), every spec'd case executed, CRITIC's pin matches the tested SHA
+10. **JUDGE** makes the SHIP or REJECT decision from the machine verdicts (its self-reported numbers are recounted from the artifacts afterward — a mismatch stops the run)
-Two quality gates (**READINESS** and **JUDGE**) enforce pass/fail checkpoints. Rejection loops send work back to the responsible agent with specific corrections, with a circuit breaker to prevent infinite cycles.
+Quality gates (**SPECCHECK**, **RED**, **STATIC**, **CRITIC**, **GREEN**, **EVIDENCE**, **JUDGE**) enforce pass/fail checkpoints. Rejection loops send work back to the responsible agent with specific corrections, with a code-owned circuit breaker to prevent infinite cycles. The trust property throughout: **facts are captured by code, not transcribed by models** — test results live in `stories/<id>/evidence/` as hashed, machine-written records that gates re-verify.
 ## Project Types
@@ -62,7 +63,7 @@ The pipeline supports 7 project types, each with a tailored task graph and speci
 | `library` | LIBDEV | UXA, FEND, PMCP |
 | `mobile-app` | MOBILE | *(conditional)* |
-The Lead selects which agents to spawn based on `project.type` in your `pipeline-config.yaml` and the story's `testing_profiles`.
+The workflow selects which agents to spawn based on `project.type` in your `pipeline-config.yaml` and the story's `testing_profiles` (resolved deterministically by `resolve-graph`).
 ## Agent Roster
@@ -75,13 +76,14 @@ Spawned fresh per story, torn down after ship or cancel.
 | REQS | Sonnet | Requirements analyst | `reqs-brief.md` |
 | UXA | Sonnet | UX specification | `uxa-spec.md` |
 | QA-A | Sonnet | Test specification | `qa-test-spec.md`, `visual-validation-checklist.md` |
-| READINESS | Sonnet | Spec quality gate | `readiness-review.md` |
+| SPECCHECK | Haiku | Mechanical spec gate (artifact matrix + AC coverage CLIs) | gate transcript |
 | BEND | Sonnet | Backend developer | `bend-handoff.md` |
 | FEND | Sonnet | Frontend developer | `fend-handoff.md` |
 | CRITIC | Opus | Adversarial code reviewer | `critic-review.md` |
 | QA-B | Sonnet | Test executor | `execution-report.md`, `bugs.md`, `traceability-matrix.md` |
-| JUDGE | Sonnet | Final quality gate | `judge-review.md`, `judge-decision.md` |
-| Knowledge | Haiku | Knowledge retrieval | *(inbox only)* |
+| JUDGE | Sonnet/Opus | Final quality gate (evidence pass / binding decision) | `judge-review.md`, `judge-decision.md` |
+Knowledge retrieval has no dedicated agent — every agent self-serves from curated files and the SQLite knowledge base via the `db` CLI commands.
 ### Domain Developer Agents
@@ -96,15 +98,13 @@ Specialized agents that replace BEND for non-API project types:
 | IAC | Sonnet | Cross-cutting (any type) | `iac-handoff.md` |
 | MOBILE | Sonnet | `mobile-app` | `mobile-handoff.md` |
-### Persistent & Ephemeral Agents
+### Cross-Story Stages
-| Agent | Model | Lifecycle | Trigger |
-|---|---|---|---|
-| Lead | Opus | Persistent across stories | Always running |
-| PMCP | Sonnet | Ephemeral | QA-B requests visual validation |
-| Embed | Haiku | Ephemeral | After Retrospective curates |
-| Retrospective | Sonnet | Ephemeral | Every N stories (configurable) |
-| Help | Haiku | Ephemeral | User request |
+| Stage | Model | Trigger |
+|---|---|---|
+| PMCP (visual evidence) | Haiku | Orchestrator stage after QA-B on `ui` stories |
+| Retrospective | Sonnet | Retro workflow after a sprint |
+| Knowledge persist | Haiku | `db index-curated` CLI step driven by the retro workflow |
 ## Installation
@@ -177,13 +177,19 @@ models:
   haiku: [Knowledge, Embed, Help]  # Retrieval, indexing, lookups
 quality:
-  max_rejection_cycles: 5          # Circuit breaker for rejection loops
+  max_rejection_cycles: 3          # Circuit breaker for rejection loops
   retrospective_every_n_stories: 5 # Retrospective trigger frequency
   stall_threshold_minutes: 15      # Agent stall detection timeout
-git:
-  target_branch: ""                # Base branch for story branches
-  story_branch_prefix: story/      # Branch naming convention
+git:                               # Story git flow (valent git start-story|commit-phase|ship-story|leave-story)
+  enabled: true                    # Branch-per-story + typed commit trail + merge --no-ff on ship
+  target_branch: ""                # Base/merge-back branch ("" = the branch the sprint starts on)
+  story_branch_prefix: story/      # Branch naming convention (story/<id>)
+  parallelism:                     # Concurrent stories in git worktrees (merges stay serialized)
+    enabled: false                 # OFF = strictly sequential sprint (the default)
+    max_stories: 2                 # Concurrency cap when enabled
+    worktree_dir: .valent-worktrees  # Worktrees at <dir>/<story-id> (ignored via .git/info/exclude)
+    setup_commands: []             # Run in each fresh worktree (env files, per-story ports, installs)
 knowledge:
   mode: sqlite                     # none | sqlite | local-docker | connect-to-existing
@@ -212,10 +218,17 @@ sprint:                            # Only used in epic/project mode
 | Command | Description |
 |---|---|
 | `valent-pipeline db init` | Initialize SQLite knowledge database |
-| `valent-pipeline db rebuild` | Drop and recreate all tables |
-| `valent-pipeline db index <story-dir>` | Index a story's artifacts |
-| `valent-pipeline db query <text>` | Full-text search across artifacts |
-| `valent-pipeline db embed <file>` | Generate and store embeddings |
+| `valent-pipeline db rebuild` | Rebuild the database from story artifacts |
+| `valent-pipeline db index-handoff --file <path>` | Index a single handoff artifact |
+| `valent-pipeline db search --query <text>` | Full-text search across all artifacts |
+| `valent-pipeline db query-artifact --story <id> --type <type>` | Fetch a specific artifact |
+| `valent-pipeline db query-directives [--agent <role>]` | Get active correction directives |
+| `valent-pipeline db add-directive --json-file <path> --batch <n>` | Persist correction directives (canonical YAML + queryable index, one call) |
+| `valent-pipeline db retire-directive --id <id> [--status expired\|superseded]` | Expire/supersede a directive (status change only — audit trail kept) |
+| `valent-pipeline db sync-directives` | Re-derive the directives index from knowledge/correction-directives.yaml |
+| `valent-pipeline db index-curated --file <path>` | Process embed-instructions.md from a retrospective |
+Calibration/query helpers: `db record-calibration`, `db query-velocity`, `db query-list`, `db query-stories`, `db query-bugs-since` (see `valent-pipeline db --help`).
 ### Claude Code Skills
@@ -228,6 +241,7 @@ Invoked as slash commands inside Claude Code:
 | `/valent-run-story-workflow STORY-ID` | Execute a single story via the Claude Code **Workflow** orchestrator |
 | `/valent-run-epic-workflow EPIC-ID` | Execute an epic (sprint planning + execution) via the **Workflow** orchestrator |
 | `/valent-run-project-workflow` | Execute a full project across all epics via the **Workflow** orchestrator |
+| `/valent-run-spike SPIKE-ID` | Run a time-boxed de-risking spike to a recorded GO/STEP-DOWN/HALT decision |
 | `/valent-run-deferred-tests` | Run deferred iOS tests on Mac |
 | `/valent-debug-export` | Export diagnostic dump |
 | `/valent-help` | Pipeline documentation and FAQ |
@@ -263,7 +277,7 @@ For each story, the pipeline produces 15+ artifacts in `stories/{story-id}/outpu
 | `execution-report.md` | QA-B | Test execution results |
 | `bugs.md` | QA-B | Filed bugs with priorities |
 | `traceability-matrix.md` | QA-B | AC-to-test coverage map |
-| `readiness-review.md` | READINESS | Spec gate results |
+| `evidence/atdd-red.json`, `evidence/proof.json` | RED/GREEN gates (CLI-written) | ATDD red baseline + the red/green/diff proof object |
 | `judge-review.md` | JUDGE | Bug review findings |
 | `judge-decision.md` | JUDGE | Ship/reject decision with evidence |
 | `story-report.md` | orchestrator | Story completion summary |
@@ -274,10 +288,10 @@ Plus committed, tested production code in your project source tree.
 All inter-agent communication follows the [Distilled Communication Standard](pipeline/docs/communication-standard.md):
-- **Handoff documents** -- structured artifacts with YAML frontmatter, orchestrator summary, and facts-only content. Every handoff follows a [template skeleton](pipeline/docs/template-skeleton.md).
-- **Inbox messages** -- terse coordination messages (~500 tokens max) with file pointers. Types include `[HANDOFF]`, `[BLOCKER]`, `[REVISION]`, `[CRITIC-REJECTION]`, `[BUG]`, `[DESIGN-COUNCIL]`, `[ESCALATION]`.
+- **Handoff documents** -- structured artifacts with YAML frontmatter, orchestrator summary, and facts-only content. Every handoff follows a [template skeleton](pipeline/docs/template-skeleton.md). The handoff file IS the completion signal -- the orchestrator sequences agents from it.
+- **Structured returns** -- each agent returns a terse, schema-validated machine block with file pointers; the orchestrator routes all coordination (rejections, bugs, escalations) from these.
 - **Design Council** -- structured deliberation protocol for contested design decisions with position statements, synthesis, and escalation to user if consensus fails.
-- **Human Escalation** -- when agent deliberation is insufficient, the Lead surfaces the issue to the user with full context.
+- **Human Escalation** -- when agent deliberation is insufficient, the orchestrator surfaces the issue to the user with full context.
 ## Knowledge System
@@ -287,9 +301,9 @@ The pipeline learns from its own output through a [knowledge system](pipeline/do
 |---|---|---|
 | Correction directives | `knowledge/correction-directives.yaml` | Behavioral changes for agents from past patterns |
 | Curated knowledge | `knowledge/curated/` | Conventions, validated patterns, known pitfalls |
-| SQLite / ChromaDB | `.valent-pipeline/pipeline.db` | Embedding-based retrieval (optional) |
+| SQLite (FTS5) | `.valent-pipeline/pipeline.db` | Full-text retrieval over indexed artifacts and curated lessons |
-The **Retrospective** agent (triggered every N stories) is the sole gatekeeper for what enters persistent knowledge. It analyzes batch outputs, writes correction directives, and produces indexing instructions for the **Embed** agent. The **Knowledge** agent reads all sources and responds to teammate queries during story execution.
+The retrospective workflow (`retro.workflow.js`, triggered every N stories) is the sole gatekeeper for what enters persistent knowledge: it analyzes batch outputs, synthesizes gated correction directives, and emits indexing instructions executed by its EMBED stage. During story execution, agents self-serve from the knowledge sources via the `valent-knowledge` skill.
 ### Knowledge Modes
@@ -302,7 +316,7 @@ The **Retrospective** agent (triggered every N stories) is the sole gatekeeper f
 ## Execution Modes
-The pipeline runs on a single orchestration path: the **Claude Code Workflow** path. A deterministic Workflow script (`pipeline/orchestrators/claude-code/{plan,sprint,retro}.workflow.js`) drives the pipeline with schema-validated gates, a code-owned rejection cap, parallel CRITIC passes, and journal-based resume (`resumeFromRunId`). Control flow lives in JavaScript and the journal — not in a model interpreting prose. Validated by `scripts/test-workflow.js` but not yet exercised end-to-end against a live story — validate against a fixture before relying on it. See `pipeline/orchestrators/claude-code/README.md`.
+The pipeline runs on a single orchestration path: the **Claude Code Workflow** path. A deterministic Workflow script (`pipeline/orchestrators/claude-code/{plan,sprint,retro}.workflow.js`) drives the pipeline with schema-validated gates, a code-owned rejection cap, parallel CRITIC passes, and journal-based resume (`resumeFromRunId`). Control flow lives in JavaScript and the journal — not in a model interpreting prose. It is validated by `scripts/test-workflow.js`, and the orchestrator has been exercised end-to-end against live stories (findings from those live runs have driven the changes between versions). See `pipeline/orchestrators/claude-code/README.md`.
 > Requires Claude Code (the Workflow tool). `runtime.provider` must be `claude-code`.
@@ -340,14 +354,20 @@ Converts your epics and stories documents into a prioritized `pipeline-backlog.y
 ## Quality Gates
-### READINESS Gate
+### SPECCHECK Gate (mechanical)
+Validates the spec chain before any code is written — as CLIs, not LLM judgment:
+- `valent spec check`: artifact-existence matrix per testing profile, acceptance-file existence, and the acceptance-tier mock ban
+- `valent trace check`: every unwaived AC covered by at least one spec'd case
+Rework routes to the CLI-named owner (REQS/UXA/QA-A) with downstream specs re-derived automatically.
-Validates the spec chain before any code is written:
-- REQS brief completeness and accuracy
-- UXA spec consistency (frontend projects)
-- QA test spec coverage and depth
+### RED / GREEN Gates (ATDD)
-Stops on first failure. The responsible upstream agent must rework before the pipeline proceeds.
+When `atdd.command` is configured, QA-A authors **executable acceptance tests** before any implementation exists:
+- **RED** (pre-dev): the suite runs via `valent evidence run` and every required acceptance case must FAIL — a pre-passing test is a spec bug. A passing RED gate writes `evidence/atdd-red.json`, which records a hash snapshot of the acceptance sources.
+- The acceptance tests are **read-only for dev agents** — any edit is hash-detected and auto-REJECTed to QA-A arbitration (restore, or amend with an audited `evidence rebaseline`).
+- **GREEN** (post-CRITIC): the suite re-runs and must pass with the sources byte-identical since red. `valent evidence proof` then assembles `proof.json`: the failing run before AI wrote code, the passing run after, the exact diff between, and the hashes.
 ### JUDGE Gate
@@ -358,14 +378,14 @@ Makes the final ship decision based on evidence:
 - PMCP visual evidence (UI projects)
 - Applies "evidence over assertion" -- independently verifies every upstream claim
-Verdicts: **SHIP** (commit and close), **SHIP-PARTIAL** (mobile: ship Android, defer iOS), **REJECT** (send back with corrections).
+Verdicts: **SHIP** (the story branch merges `--no-ff` into the target branch and the backlog flips to shipped), **SHIP-PARTIAL** (mobile: ship Android, defer iOS), **REJECT** (the work is sent back with corrections; the story branch is left unmerged for the fix/retry).
 ### Rejection Loops
 When CRITIC or JUDGE rejects work:
 1. The orchestrator re-queues the responsible agent with the specific rejection findings
 2. Agent reworks and resubmits
-3. Circuit breaker (`max_rejection_cycles`, default 5) prevents infinite loops
+3. Circuit breaker (`max_rejection_cycles`, default 3) prevents infinite loops
 4. After max cycles, the orchestrator escalates to the user
 ## Crash Recovery
@@ -397,7 +417,6 @@ After initialization, the pipeline installs to `.valent-pipeline/` in your proje
     qa-a/                     #   Test spec steps (domain-specific)
     qa-b/                     #   Test execution steps (domain-specific)
     reqs/                     #   Requirements analysis steps
-    readiness/                #   Readiness gate steps
     judge/                    #   Judge gate steps
     orchestration/            #   Shared orchestration steps (config, story resolution, status)
     retrospective/            #   Retrospective analysis steps
@@ -410,7 +429,6 @@ After initialization, the pipeline installs to `.valent-pipeline/` in your proje
     mcp-dev/                  #   MCP server developer steps
     mobile/                   #   Mobile developer steps
     uxa/                      #   UX specification steps
-  spawn-templates/            # Agent spawn configuration
   scripts/                    # Pipeline utility scripts
   docs/                       # Pipeline reference documentation
   knowledge/
@@ -428,19 +446,12 @@ Full reference documentation lives in `pipeline/docs/`:
 | [Pipeline Overview](pipeline/docs/pipeline-overview.md) | Architecture, flow, artifact map |
 | [Agent Reference](pipeline/docs/agent-reference.md) | All agents, models, inputs/outputs |
 | [Communication Standard](pipeline/docs/communication-standard.md) | Handoff format, inbox protocol, Design Council |
-| [Lead Lifecycle](pipeline/docs/lead-lifecycle.md) | Kick-off, monitoring, ship, crash recovery |
 | [Task Graph Specification](pipeline/docs/task-graph.md) | Dependencies, task states, claiming |
 | [Pipeline State Schema](pipeline/docs/pipeline-state-schema.md) | JSON schema for pipeline-state.json |
 | [Knowledge System](pipeline/docs/knowledge-system.md) | RAG assessment, correction directives, curation |
 | [Template Skeleton](pipeline/docs/template-skeleton.md) | Universal handoff document structure |
 | [NPX Packaging](pipeline/docs/npx-packaging.md) | Package distribution and init workflow |
-### Reference
-| Document | Description |
-|---|---|
-| [Refactor Checklist](pipeline/docs/design/refactor-checklist.md) | Every location to update when changing agents, config, tables, or phases |
 ## License
 MIT