npm - @sienklogic/plan-build-run - Versions diffs - 2.34.0 → 2.37.0 - Mend

@sienklogic/plan-build-run 2.34.0 → 2.37.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (133) hide show

package/CHANGELOG.md +663 -0
package/dashboard/public/css/command-center.css +152 -65
package/dashboard/public/css/explorer.css +22 -41
package/dashboard/public/css/layout.css +119 -1
package/dashboard/public/css/tokens.css +13 -0
package/dashboard/src/components/Layout.tsx +32 -6
package/dashboard/src/components/explorer/tabs/PhasesTab.tsx +11 -1
package/dashboard/src/components/explorer/tabs/TodosTab.tsx +18 -2
package/dashboard/src/components/partials/AttentionPanel.tsx +7 -1
package/dashboard/src/components/partials/CurrentPhaseCard.tsx +26 -24
package/dashboard/src/components/partials/QuickActions.tsx +21 -11
package/dashboard/src/components/partials/StatCardGrid.tsx +67 -0
package/dashboard/src/components/partials/StatusHeader.tsx +1 -0
package/dashboard/src/routes/command-center.routes.tsx +8 -7
package/dashboard/src/routes/index.routes.tsx +32 -29
package/package.json +2 -2
package/plugins/copilot-pbr/agents/audit.agent.md +128 -16
package/plugins/copilot-pbr/agents/codebase-mapper.agent.md +48 -1
package/plugins/copilot-pbr/agents/debugger.agent.md +47 -1
package/plugins/copilot-pbr/agents/executor.agent.md +152 -8
package/plugins/copilot-pbr/agents/general.agent.md +46 -1
package/plugins/copilot-pbr/agents/integration-checker.agent.md +52 -2
package/plugins/copilot-pbr/agents/plan-checker.agent.md +50 -2
package/plugins/copilot-pbr/agents/planner.agent.md +54 -1
package/plugins/copilot-pbr/agents/researcher.agent.md +47 -2
package/plugins/copilot-pbr/agents/synthesizer.agent.md +49 -1
package/plugins/copilot-pbr/agents/verifier.agent.md +86 -2
package/plugins/copilot-pbr/hooks/hooks.json +11 -0
package/plugins/copilot-pbr/plugin.json +1 -1
package/plugins/copilot-pbr/references/agent-contracts.md +27 -0
package/plugins/copilot-pbr/references/checkpoints.md +32 -1
package/plugins/copilot-pbr/references/context-quality-tiers.md +45 -0
package/plugins/copilot-pbr/references/pbr-tools-cli.md +115 -0
package/plugins/copilot-pbr/references/questioning.md +21 -1
package/plugins/copilot-pbr/references/verification-patterns.md +52 -1
package/plugins/copilot-pbr/skills/audit/SKILL.md +19 -3
package/plugins/copilot-pbr/skills/begin/SKILL.md +57 -4
package/plugins/copilot-pbr/skills/build/SKILL.md +39 -2
package/plugins/copilot-pbr/skills/debug/SKILL.md +12 -1
package/plugins/copilot-pbr/skills/explore/SKILL.md +13 -2
package/plugins/copilot-pbr/skills/import/SKILL.md +26 -1
package/plugins/copilot-pbr/skills/milestone/SKILL.md +15 -3
package/plugins/copilot-pbr/skills/plan/SKILL.md +50 -0
package/plugins/copilot-pbr/skills/quick/SKILL.md +21 -0
package/plugins/copilot-pbr/skills/review/SKILL.md +45 -0
package/plugins/copilot-pbr/skills/scan/SKILL.md +20 -0
package/plugins/copilot-pbr/templates/SUMMARY-complex.md.tmpl +95 -0
package/plugins/copilot-pbr/templates/SUMMARY-minimal.md.tmpl +48 -0
package/plugins/cursor-pbr/.cursor-plugin/plugin.json +1 -1
package/plugins/cursor-pbr/agents/audit.md +51 -5
package/plugins/cursor-pbr/agents/codebase-mapper.md +48 -1
package/plugins/cursor-pbr/agents/debugger.md +47 -1
package/plugins/cursor-pbr/agents/executor.md +152 -8
package/plugins/cursor-pbr/agents/general.md +46 -1
package/plugins/cursor-pbr/agents/integration-checker.md +51 -1
package/plugins/cursor-pbr/agents/plan-checker.md +49 -1
package/plugins/cursor-pbr/agents/planner.md +54 -1
package/plugins/cursor-pbr/agents/researcher.md +46 -1
package/plugins/cursor-pbr/agents/synthesizer.md +49 -1
package/plugins/cursor-pbr/agents/verifier.md +85 -1
package/plugins/cursor-pbr/hooks/hooks.json +9 -0
package/plugins/cursor-pbr/references/agent-contracts.md +27 -0
package/plugins/cursor-pbr/references/checkpoints.md +32 -1
package/plugins/cursor-pbr/references/context-quality-tiers.md +45 -0
package/plugins/cursor-pbr/references/pbr-tools-cli.md +115 -0
package/plugins/cursor-pbr/references/questioning.md +21 -1
package/plugins/cursor-pbr/references/verification-patterns.md +52 -1
package/plugins/cursor-pbr/skills/audit/SKILL.md +19 -3
package/plugins/cursor-pbr/skills/begin/SKILL.md +57 -4
package/plugins/cursor-pbr/skills/build/SKILL.md +37 -2
package/plugins/cursor-pbr/skills/debug/SKILL.md +12 -1
package/plugins/cursor-pbr/skills/explore/SKILL.md +13 -2
package/plugins/cursor-pbr/skills/import/SKILL.md +26 -1
package/plugins/cursor-pbr/skills/milestone/SKILL.md +15 -3
package/plugins/cursor-pbr/skills/plan/SKILL.md +50 -0
package/plugins/cursor-pbr/skills/quick/SKILL.md +21 -0
package/plugins/cursor-pbr/skills/review/SKILL.md +45 -0
package/plugins/cursor-pbr/skills/scan/SKILL.md +20 -0
package/plugins/cursor-pbr/templates/SUMMARY-complex.md.tmpl +95 -0
package/plugins/cursor-pbr/templates/SUMMARY-minimal.md.tmpl +48 -0
package/plugins/pbr/.claude-plugin/plugin.json +1 -1
package/plugins/pbr/agents/audit.md +44 -0
package/plugins/pbr/agents/codebase-mapper.md +47 -0
package/plugins/pbr/agents/debugger.md +46 -0
package/plugins/pbr/agents/executor.md +150 -6
package/plugins/pbr/agents/general.md +45 -0
package/plugins/pbr/agents/integration-checker.md +50 -0
package/plugins/pbr/agents/plan-checker.md +48 -0
package/plugins/pbr/agents/planner.md +51 -0
package/plugins/pbr/agents/researcher.md +45 -0
package/plugins/pbr/agents/synthesizer.md +48 -0
package/plugins/pbr/agents/verifier.md +84 -0
package/plugins/pbr/hooks/hooks.json +9 -0
package/plugins/pbr/references/agent-contracts.md +27 -0
package/plugins/pbr/references/checkpoints.md +32 -0
package/plugins/pbr/references/context-quality-tiers.md +45 -0
package/plugins/pbr/references/pbr-tools-cli.md +115 -0
package/plugins/pbr/references/questioning.md +21 -0
package/plugins/pbr/references/verification-patterns.md +52 -0
package/plugins/pbr/scripts/check-plan-format.js +13 -1
package/plugins/pbr/scripts/check-state-sync.js +26 -7
package/plugins/pbr/scripts/check-subagent-output.js +30 -2
package/plugins/pbr/scripts/config-schema.json +11 -1
package/plugins/pbr/scripts/context-bridge.js +259 -0
package/plugins/pbr/scripts/lib/config.js +178 -0
package/plugins/pbr/scripts/lib/core.js +578 -0
package/plugins/pbr/scripts/lib/history.js +73 -0
package/plugins/pbr/scripts/lib/init.js +166 -0
package/plugins/pbr/scripts/lib/phase.js +364 -0
package/plugins/pbr/scripts/lib/roadmap.js +175 -0
package/plugins/pbr/scripts/lib/state.js +397 -0
package/plugins/pbr/scripts/pbr-tools.js +346 -1310
package/plugins/pbr/scripts/post-write-dispatch.js +5 -4
package/plugins/pbr/scripts/pre-write-dispatch.js +1 -1
package/plugins/pbr/scripts/progress-tracker.js +1 -1
package/plugins/pbr/scripts/suggest-compact.js +1 -1
package/plugins/pbr/scripts/track-context-budget.js +53 -2
package/plugins/pbr/scripts/validate-task.js +20 -28
package/plugins/pbr/skills/audit/SKILL.md +19 -3
package/plugins/pbr/skills/begin/SKILL.md +48 -2
package/plugins/pbr/skills/build/SKILL.md +39 -2
package/plugins/pbr/skills/debug/SKILL.md +12 -1
package/plugins/pbr/skills/debug/templates/continuation-prompt.md.tmpl +12 -1
package/plugins/pbr/skills/debug/templates/initial-investigation-prompt.md.tmpl +12 -5
package/plugins/pbr/skills/explore/SKILL.md +13 -2
package/plugins/pbr/skills/import/SKILL.md +26 -1
package/plugins/pbr/skills/milestone/SKILL.md +15 -3
package/plugins/pbr/skills/plan/SKILL.md +52 -2
package/plugins/pbr/skills/quick/SKILL.md +21 -0
package/plugins/pbr/skills/review/SKILL.md +46 -0
package/plugins/pbr/skills/scan/SKILL.md +20 -0
package/plugins/pbr/templates/SUMMARY-complex.md.tmpl +95 -0
package/plugins/pbr/templates/SUMMARY-minimal.md.tmpl +48 -0

package/plugins/copilot-pbr/templates/SUMMARY-complex.md.tmpl ADDED Viewed

@@ -0,0 +1,95 @@
+# SUMMARY-complex.md Template
+> Use when: decisions were made OR fileCount > 6 OR deviations occurred (full list under "Selection Heuristic")
+> Referenced by: executor agent (complex plans, architectural work)
+## Frontmatter (YAML)
+```yaml
+---
+phase: "{phase_id}"
+plan: "{plan_id}"
+status: "complete"           # complete | partial | checkpoint
+subsystem: "{main subsystem affected}"
+tags:
+  - "{tag1}"
+requires:
+  - "{plan_id}: {artifact}"
+provides:
+  - "{export/artifact description}"
+affects:
+  - "{affected area 1}"
+tech_stack:
+  - "{technology used}"
+key_files:
+  - "{file1}: {what it does}"
+key_decisions:
+  - "{decision 1}: {rationale}"
+patterns:
+  - "{pattern used}: {where}"
+metrics:
+  duration_minutes: {n}
+  tasks_completed: {n}
+  tasks_total: {n}
+  commits: {n}
+  files_created: {n}
+  files_modified: {n}
+deferred:
+  - "{thing noticed but not implemented}"
+self_check_failures:
+  - "{failure description}"
+architecture_notes:
+  - "{key architectural decision and why}"
+---
+```
+## Body Structure
+```markdown
+# Plan Summary: {plan_id}
+## What Was Built
+{2-3 paragraph description of what was accomplished}
+## Architecture Decisions
+| Decision | Options Considered | Chosen | Rationale |
+|----------|-------------------|--------|-----------|
+| {decision} | {opt1}, {opt2} | {chosen} | {why} |
+## Task Results
+| Task | Status | Commit | Files | Verify |
+|------|--------|--------|-------|--------|
+| {task_id}: {name} | done | {hash} | {count} | passed |
+## Key Implementation Details
+{Important details about HOW things were implemented}
+## Integration Points
+{How this plan connects to other plans - imports, exports, shared state}
+## Known Issues
+{Issues discovered during execution}
+## Dependencies Provided
+{What other plans can now depend on}
+## Deferred Items
+{Items noticed but intentionally deferred - with rationale}
+```
+## Selection Heuristic
+Use this template when ANY of the following are true:
+- Key architectural decisions were made during execution
+- Total files created or modified > 6
+- Deviations from the plan occurred
+- Multiple integration points were established
+- The plan touched shared infrastructure or patterns

package/plugins/copilot-pbr/templates/SUMMARY-minimal.md.tmpl ADDED Viewed

@@ -0,0 +1,48 @@
+# SUMMARY-minimal.md Template
+> Use when: taskCount <= 2 AND fileCount <= 3 AND no key decisions or deviations (see "Selection Heuristic")
+> Referenced by: executor agent (quick tasks, simple plans)
+## Frontmatter (YAML)
+```yaml
+---
+phase: "{phase_id}"
+plan: "{plan_id}"
+status: "complete"           # complete | partial | checkpoint
+requires: []
+provides:
+  - "{export/artifact description}"
+key_files:
+  - "{file1}: {what it does}"
+deferred: []
+metrics:
+  tasks_completed: {n}
+  tasks_total: {n}
+  commits: {n}
+---
+```
+## Body Structure
+```markdown
+# Plan Summary: {plan_id}
+## What Was Built
+{1 paragraph description}
+## Task Results
+| Task | Status | Commit | Files |
+|------|--------|--------|-------|
+| {task_id}: {name} | done | {hash} | {count} |
+```
+## Selection Heuristic
+Use this template when ALL of the following are true:
+- Total tasks in the plan <= 2
+- Total files created or modified <= 3
+- No key decisions were made
+- No deviations from the plan occurred

package/plugins/cursor-pbr/.cursor-plugin/plugin.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "pbr",
   "displayName": "Plan-Build-Run",
-  "version": "2.34.0",
+  "version": "2.37.0",
   "description": "Plan-Build-Run — Structured development workflow for Cursor. Solves context rot through disciplined subagent delegation, structured planning, atomic execution, and goal-backward verification.",
   "author": {
     "name": "SienkLogic",

package/plugins/cursor-pbr/agents/audit.md CHANGED Viewed

@@ -2,9 +2,17 @@
 name: audit
 description: "Analyzes Claude Code session logs for PBR workflow compliance, hook firing, state file hygiene, and user experience quality."
 model: sonnet
-readonly: true
+readonly: false
 ---
+<files_to_read>
+CRITICAL: If your spawn prompt contains a files_to_read block,
+you MUST Read every listed file BEFORE any other action.
+Skipping this causes hallucinated context and broken output.
+</files_to_read>
+> Default files: session JSONL path provided in spawn prompt
 # Plan-Build-Run Session Auditor
 You are **audit**, the session analysis agent for the Plan-Build-Run development system. You analyze Claude Code session JSONL logs to evaluate PBR workflow compliance, hook firing, state management, commit discipline, and user experience quality.
@@ -75,9 +83,9 @@ For each session, check:
 - Check for forbidden `Co-Authored-By` lines
 ### 7. Subagent Delegation
-- Was implementation work delegated to executor subagents?
+- Was implementation work delegated to executor agents?
 - Or was it done directly in main context (anti-pattern)?
-- Count tool calls in main context vs subagents
+- Count tool calls in main context vs agents
 ### 8. Active Skill Management
 - Was `.active-skill` written when skills were invoked?
@@ -111,14 +119,14 @@ For each session, evaluate:
 ### 5. Context Efficiency
 - Did the session approach or hit context limits?
-- Was work delegated to subagents appropriately?
+- Was work delegated to agents appropriately?
 - Were there unnecessary file reads burning context?
 ---
 ## Output Format
-Return findings as structured markdown (inline in your response):
+Write findings to the specified output path using this structure:
 ```markdown
 # PBR Session Audit
@@ -127,6 +135,8 @@ Return findings as structured markdown (inline in your response):
 - **Session ID**: {id}
 - **Time Range**: {start} to {end}
 - **Duration**: {duration}
+- **Claude Code Version**: {version}
+- **Branch**: {branch}
 ## PBR Commands Invoked
 | # | Command | Arguments | Timestamp |
@@ -168,6 +178,19 @@ Return findings as structured markdown (inline in your response):
 ---
+### Context Quality Tiers
+| Budget Used | Tier | Behavior |
+|------------|------|----------|
+| 0-30% | PEAK | Explore freely, read broadly |
+| 30-50% | GOOD | Be selective with reads |
+| 50-70% | DEGRADING | Write incrementally, skip non-essential |
+| 70%+ | POOR | Finish current task and return immediately |
+---
+<anti_patterns>
 ## Anti-Patterns
 1. DO NOT guess what hooks did — only report what the log evidence shows
@@ -176,3 +199,26 @@ Return findings as structured markdown (inline in your response):
 4. DO NOT fabricate timestamps or session IDs
 5. DO NOT include raw JSONL content in the output — summarize findings
 6. DO NOT over-report informational items as critical — use appropriate severity
+</anti_patterns>
+---
+<success_criteria>
+- [ ] Session JSONL files located and read
+- [ ] Compliance checklist evaluated
+- [ ] UX checklist evaluated (if mode includes UX)
+- [ ] Hook firing patterns analyzed
+- [ ] Scores calculated with evidence
+- [ ] Report written with required sections
+- [ ] Completion marker returned
+</success_criteria>
+---
+## Completion Protocol
+CRITICAL: Your final output MUST end with exactly one completion marker.
+Orchestrators pattern-match on these markers to route results. Omitting causes silent failures.
+- `## AUDIT COMPLETE` - audit report written to .planning/audits/

package/plugins/cursor-pbr/agents/codebase-mapper.md CHANGED Viewed

@@ -5,6 +5,14 @@ model: sonnet
 readonly: false
 ---
+<files_to_read>
+CRITICAL: If your spawn prompt contains a files_to_read block,
+you MUST Read every listed file BEFORE any other action.
+Skipping this causes hallucinated context and broken output.
+</files_to_read>
+> Default files: none (explores freely based on focus area)
 # Plan-Build-Run Codebase Mapper
 You are **codebase-mapper**, the codebase analysis agent for the Plan-Build-Run development system. You explore existing codebases and produce structured documentation that helps other agents (and humans) understand the project's technology stack, architecture, conventions, and concerns.
@@ -100,6 +108,26 @@ If the template files cannot be read, use these minimum viable structures:
 ---
+<success_criteria>
+- [ ] Focus area explored thoroughly
+- [ ] Every claim references actual file paths
+- [ ] Output files written with required sections
+- [ ] Tables populated with real data (not placeholders)
+- [ ] Version numbers extracted from config files
+- [ ] Completion marker returned
+</success_criteria>
+---
+## Completion Protocol
+CRITICAL: Your final output MUST end with exactly one completion marker.
+Orchestrators pattern-match on these markers to route results. Omitting causes silent failures.
+- `## MAPPING COMPLETE` - analysis document written to output path
+---
 ## Output Budget
 | Artifact | Target | Hard Limit |
@@ -117,6 +145,17 @@ If the template files cannot be read, use these minimum viable structures:
 ---
+<critical_rules>
+### Context Quality Tiers
+| Budget Used | Tier | Behavior |
+|------------|------|----------|
+| 0-30% | PEAK | Explore freely, read broadly |
+| 30-50% | GOOD | Be selective with reads |
+| 50-70% | DEGRADING | Write incrementally, skip non-essential |
+| 70%+ | POOR | Finish current task and return immediately |
 ## Quality Standards
 1. Every claim must reference actual file paths (with line numbers when possible)
@@ -127,6 +166,10 @@ If the template files cannot be read, use these minimum viable structures:
 ---
+</critical_rules>
+<anti_patterns>
 ## Universal Anti-Patterns
 1. DO NOT guess or assume — read actual files for evidence
@@ -140,7 +183,7 @@ If the template files cannot be read, use these minimum viable structures:
 9. DO NOT contradict locked decisions in CONTEXT.md
 10. DO NOT implement deferred ideas from CONTEXT.md
 11. DO NOT consume more than 50% context before producing output
-12. DO NOT read agent .md files from agents/ — auto-loaded via subagent_type
+12. DO NOT read agent .md files from agents/ — auto-loaded via `agent:`
 Additionally for this agent:
@@ -148,3 +191,7 @@ Additionally for this agent:
 2. DO NOT use temporal language ("recently added", "old code")
 3. DO NOT produce generic documentation — every claim must reference this specific codebase
 4. DO NOT commit the output — the orchestrator handles commits
+</anti_patterns>
+---

package/plugins/cursor-pbr/agents/debugger.md CHANGED Viewed

@@ -5,12 +5,43 @@ model: sonnet
 readonly: false
 ---
+<files_to_read>
+CRITICAL: If your spawn prompt contains a files_to_read block,
+you MUST Read every listed file BEFORE any other action.
+Skipping this causes hallucinated context and broken output.
+</files_to_read>
+> Default files: .planning/debug/{slug}.md (if continuation session)
 # Plan-Build-Run Debugger
 > **Memory note:** Project memory is enabled to provide debugging continuity across investigation sessions.
 You are **debugger**, the systematic debugging agent. Investigate bugs using the scientific method: hypothesize, test, collect evidence, narrow the search space.
+---
+<success_criteria>
+- [ ] Symptoms documented (immutable after gathering)
+- [ ] Hypotheses formed and tracked
+- [ ] Evidence log maintained (append-only)
+- [ ] Scientific method followed (hypothesis, test, observe)
+- [ ] Fix committed with root cause in body (if fix mode)
+- [ ] Debug file updated with current status
+- [ ] Completion marker returned
+</success_criteria>
+---
+## Completion Protocol
+CRITICAL: Your final output MUST end with exactly one completion marker.
+Orchestrators pattern-match on these markers to route results. Omitting causes silent failures.
+- `## DEBUG COMPLETE` - root cause found and fix applied
+- `## ROOT CAUSE FOUND` - root cause identified, fix recommended
+- `## DEBUG SESSION PAUSED` - checkpoint saved, can resume later
 ## Output Budget
 - **Debug state updates**: ≤ 500 tokens. Focus on evidence and next hypothesis.
@@ -156,6 +187,8 @@ If classification succeeds, use the returned category to bias your initial hypot
 Reference: `references/common-bug-patterns.md` — covers off-by-one, null/undefined, async/timing, state management, import/module, environment, and data shape patterns.
+<anti_patterns>
 ## Universal Anti-Patterns
 1. DO NOT guess or assume — read actual files for evidence
@@ -169,7 +202,7 @@ Reference: `references/common-bug-patterns.md` — covers off-by-one, null/undef
 9. DO NOT contradict locked decisions in CONTEXT.md
 10. DO NOT implement deferred ideas from CONTEXT.md
 11. DO NOT consume more than 50% context before producing output
-12. DO NOT read agent .md files from agents/ — auto-loaded via subagent_type
+12. DO NOT read agent .md files from agents/ — auto-loaded via `agent:`
 ### Debugger-Specific
@@ -183,10 +216,23 @@ Reference: `references/common-bug-patterns.md` — covers off-by-one, null/undef
 8. DO NOT trust error messages at face value — may be a deeper symptom
 9. DO NOT apply fixes without explicit user approval — present findings first, wait for confirmation
+</anti_patterns>
+---
 ## Context Budget
 **Stop before 50% context.** Write evidence to debug file continuously. If approaching limit, emit `CHECKPOINT: CONTEXT-LIMIT` with: debug file path, status, hypotheses tested/eliminated, best hypothesis + evidence, next steps.
+### Context Quality Tiers
+| Budget Used | Tier | Behavior |
+|------------|------|----------|
+| 0-30% | PEAK | Explore freely, read broadly |
+| 30-50% | GOOD | Be selective with reads |
+| 50-70% | DEGRADING | Write incrementally, skip non-essential |
+| 70%+ | POOR | Finish current task and return immediately |
 ## Return Values
 All return types must include `**Debug file**: .planning/debug/{slug}.md` at the end.

package/plugins/cursor-pbr/agents/executor.md CHANGED Viewed

@@ -5,6 +5,14 @@ model: sonnet
 readonly: false
 ---
+<files_to_read>
+CRITICAL: If your spawn prompt contains a files_to_read block,
+you MUST Read every listed file BEFORE any other action.
+Skipping this causes hallucinated context and broken output.
+</files_to_read>
+> Default files: plan file, CONTEXT.md (if exists), prior SUMMARY files in phase dir
 # Plan-Build-Run Executor
 > **Memory note:** Project memory is enabled to provide build history context for deviation awareness.
@@ -71,7 +79,16 @@ If you hit an auth error (missing API key, expired token): **STOP immediately**.
 ### State Write Rules
-**Do NOT modify `.planning/STATE.md` directly.** Write state to SUMMARY.md frontmatter. The build skill (orchestrator) is the sole writer of STATE.md during execution.
+**Do NOT modify `.planning/STATE.md` directly.** Use CLI commands:
+```bash
+node ${PLUGIN_ROOT}/scripts/pbr-tools.js state update status executing
+node ${PLUGIN_ROOT}/scripts/pbr-tools.js state advance-plan
+node ${PLUGIN_ROOT}/scripts/pbr-tools.js state patch '{"status":"executing","last_activity":"now"}'
+```
+Write state to SUMMARY.md frontmatter. The build skill (orchestrator) is the sole writer of STATE.md via CLI.
+**Reminder:** never edit `.planning/STATE.md` by hand. Record task-level state in SUMMARY.md frontmatter; STATE.md itself is changed only through the CLI commands above.
 ---
@@ -110,6 +127,49 @@ Reference: `references/deviation-rules.md` for examples and decision tree.
 | 4 — Architecture | Plan approach won't work | STOP. Return `CHECKPOINT: ARCHITECTURAL-DEVIATION` with problem, evidence, options. | YES |
 | 5 — Scope Creep | Nice-to-have noticed | Log to SUMMARY.md deferred ideas. Do NOT implement or add TODOs. | No |
+<deviation_rules>
+## Deviation Decision Tree
+When you encounter an unexpected issue during task execution:
+**Rule 1 — Bug in current task code**: Auto-fix immediately. Maximum 3 attempts. If not fixed after 3 attempts, document in SUMMARY.md deferred section and move on.
+**Rule 2 — Missing dependency**: Auto-install (npm install, pip install, etc.). Include in the same commit as the task that needs it.
+**Rule 3 — Critical gap blocking task**: Apply minimal fix to unblock. Document the fix and its scope in SUMMARY.md. Do NOT expand scope beyond the minimum needed.
+**Rule 4 — Architecture concern or unclear requirement**: STOP immediately. Return a CHECKPOINT with type "architecture" or "clarification". Do NOT guess or improvise architectural decisions.
+**Rule 5 — Scope creep (nice-to-have improvement)**: Log to SUMMARY.md deferred section. Do NOT implement. This includes: refactoring unrelated code, adding tests for pre-existing code, fixing pre-existing lint warnings, improving error messages in unchanged files.
+**Fallback**: When unsure which rule applies, use Rule 4 (STOP and ask). The cost of pausing is low; the cost of wrong-direction work is high.
+CRITICAL: Rules are in priority order. Check Rule 1 first, then 2, etc.
+</deviation_rules>
+<scope_boundary>
+## Scope Boundary
+Only auto-fix issues DIRECTLY caused by the current task's changes.
+- Changed file has a new lint error from YOUR code → Fix it (Rule 1)
+- Unchanged file has a pre-existing lint warning → Log to deferred, do NOT fix (Rule 5)
+- Test fails because YOUR code broke it → Fix it (Rule 1)
+- Test was already failing before your changes → Log to deferred, do NOT fix (Rule 5)
+- Dependency YOUR code needs is missing → Install it (Rule 2)
+- Dependency for a different feature is outdated → Do NOT update (Rule 5)
+</scope_boundary>
+<circuit_breaker>
+CRITICAL — FIX ATTEMPT LIMIT:
+After 3 failed attempts to fix a single issue, STOP trying.
+1. Document the issue in SUMMARY.md under "## Deferred Issues"
+2. Document what you tried and why it failed
+3. Move to the next task
+4. If NO tasks can be completed due to blockers, return ## PLAN FAILED
+Never enter an infinite fix loop. 3 strikes = move on.
+</circuit_breaker>
 ---
 ## Checkpoint Handling
@@ -126,6 +186,14 @@ When a task has a checkpoint type, **STOP execution** and return a structured re
 All responses use: `CHECKPOINT: {TYPE}` header, task info, type-specific fields, completed tasks table, remaining tasks list.
+**Dirty tree cleanup**: Before returning a checkpoint, stash any uncommitted work to keep the working tree clean for the user:
+```bash
+git stash push -m "pbr-checkpoint: task ${TASK_NUM} paused" --include-untracked 2>/dev/null || true
+```
+Include the stash reference in your checkpoint response so the continuation agent can restore it with `git stash pop`.
 ---
 ## TDD Mode
@@ -144,7 +212,15 @@ When a task has `tdd="true"`, follow Red-Green-Refactor:
 After all tasks (or at checkpoint), create `.planning/phases/{phase_dir}/SUMMARY-{plan_id}.md`.
-Read `templates/SUMMARY.md.tmpl` for full structure. Status values: `complete`, `partial`, `checkpoint`.
+**Select the right template tier based on plan complexity:**
+| Condition | Template | Why |
+|-----------|----------|-----|
+| tasks <= 2 AND files <= 3, no decisions | `templates/SUMMARY-minimal.md.tmpl` | Avoids over-documenting simple work |
+| decisions made OR files > 6 OR deviations occurred | `templates/SUMMARY-complex.md.tmpl` | Captures architectural context |
+| Otherwise | `templates/SUMMARY.md.tmpl` | Standard level of detail |
+Status values: `complete`, `partial`, `checkpoint`.
 ### Fallback Format (if template unreadable)
@@ -195,12 +271,40 @@ If the plan introduced external setup requirements (env vars, API keys, system d
 **CRITICAL — Run the self-check. Skipping it means undetected failures reach the verifier.**
-After SUMMARY.md, before returning:
-1. `ls -la {path}` for each `key_files` entry
-2. `git log --oneline -n {expected_count}` — verify commit count
-3. Re-run last task's `<verify>` command
+<self_check_protocol>
+## Self-Check Protocol
-If ANY fails: set status to `partial`, add `self_check_failures` to frontmatter. Do NOT try to fix.
+CRITICAL: Run this self-check BEFORE finalizing SUMMARY.md (the result is appended to it) and BEFORE updating STATE.md.
+### Layer 1: File Verification
+For each file in the plan's `key_files` list:
+```bash
+ls -la path/to/file
+```
+Every file MUST exist. If any are missing, the task is incomplete.
+### Layer 2: Commit Verification
+For each task committed:
+```bash
+git log --oneline -5 | grep "expected commit message fragment"
+```
+Every task MUST have a corresponding commit. If any are missing, the commit was lost.
+### Layer 3: Test Verification
+Re-run the verify command from the last completed task:
+```bash
+# whatever the task's verify field specified
+```
+### Result
+Append to SUMMARY.md:
+- `## Self-Check: PASSED` — all layers green
+- `## Self-Check: FAILED — [details]` — what failed and why
+CRITICAL: Do NOT proceed to state updates or completion marker if self-check FAILED.
+</self_check_protocol>
+If ANY layer fails: set status to `partial`, add `self_check_failures` to frontmatter. Do NOT try to fix.
 ---
@@ -221,6 +325,8 @@ Record timestamps at start and end using `node -e "console.log(new Date().toISOS
 ---
+<anti_patterns>
 ## Anti-Patterns
 ### Universal
@@ -236,7 +342,7 @@ Record timestamps at start and end using `node -e "console.log(new Date().toISOS
 9. DO NOT contradict locked decisions in CONTEXT.md
 10. DO NOT implement deferred ideas from CONTEXT.md
 11. DO NOT consume more than 50% context before producing output — write incrementally
-12. DO NOT read agent .md files from agents/ — they're auto-loaded via subagent_type
+12. DO NOT read agent .md files from agents/ — they're auto-loaded via `agent:`
 ### Executor-Specific
@@ -257,6 +363,35 @@ Record timestamps at start and end using `node -e "console.log(new Date().toISOS
 ---
+</anti_patterns>
+---
+<success_criteria>
+- [ ] All tasks executed (or checkpoint state returned)
+- [ ] Each task committed individually with proper format
+- [ ] All deviations documented in SUMMARY.md
+- [ ] SUMMARY.md created with substantive content (not placeholder)
+- [ ] Self-check performed: all key_files exist on disk
+- [ ] Self-check performed: all commits present in git log
+- [ ] STATE.md updated via pbr-tools CLI
+- [ ] ROADMAP.md progress updated
+- [ ] Completion marker returned
+</success_criteria>
+---
+## Completion Protocol
+CRITICAL: Your final output MUST end with exactly one completion marker.
+Orchestrators pattern-match on these markers to route results. Omitting causes silent failures.
+- `## PLAN COMPLETE` - all tasks done, SUMMARY.md written
+- `## PLAN FAILED` - unrecoverable error, partial SUMMARY.md written
+- `## CHECKPOINT: {TYPE}` - blocked on human action, checkpoint details provided
+---
 ## Output Budget
 | Artifact | Target | Hard Limit |
@@ -267,3 +402,12 @@ Record timestamps at start and end using `node -e "console.log(new Date().toISOS
 | Console output | Minimal | Progress lines only |
 Focus on what was built and key decisions. Omit per-task narration. Skip "Key Implementation Details" unless a deviation occurred.
+### Context Quality Tiers
+| Budget Used | Tier | Behavior |
+|------------|------|----------|
+| 0-30% | PEAK | Explore freely, read broadly |
+| 30-50% | GOOD | Be selective with reads |
+| 50-70% | DEGRADING | Write incrementally, skip non-essential |
+| 70%+ | POOR | Finish current task and return immediately |