npm - @zigrivers/scaffold - Versions diffs - 2.28.1 → 2.38.0 - Mend

@zigrivers/scaffold 2.28.1 → 2.38.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (375)

package/README.md +309 -136
package/dist/cli/commands/build.d.ts.map +1 -1
package/dist/cli/commands/build.js +94 -14
package/dist/cli/commands/build.js.map +1 -1
package/dist/cli/commands/build.test.js +30 -5
package/dist/cli/commands/build.test.js.map +1 -1
package/dist/cli/commands/check.d.ts +12 -0
package/dist/cli/commands/check.d.ts.map +1 -0
package/dist/cli/commands/check.js +311 -0
package/dist/cli/commands/check.js.map +1 -0
package/dist/cli/commands/check.test.d.ts +2 -0
package/dist/cli/commands/check.test.d.ts.map +1 -0
package/dist/cli/commands/check.test.js +412 -0
package/dist/cli/commands/check.test.js.map +1 -0
package/dist/cli/commands/complete.d.ts +12 -0
package/dist/cli/commands/complete.d.ts.map +1 -0
package/dist/cli/commands/complete.js +101 -0
package/dist/cli/commands/complete.js.map +1 -0
package/dist/cli/commands/complete.test.d.ts +2 -0
package/dist/cli/commands/complete.test.d.ts.map +1 -0
package/dist/cli/commands/complete.test.js +133 -0
package/dist/cli/commands/complete.test.js.map +1 -0
package/dist/cli/commands/dashboard.d.ts.map +1 -1
package/dist/cli/commands/dashboard.js +12 -8
package/dist/cli/commands/dashboard.js.map +1 -1
package/dist/cli/commands/info.d.ts.map +1 -1
package/dist/cli/commands/info.js +4 -0
package/dist/cli/commands/info.js.map +1 -1
package/dist/cli/commands/knowledge.d.ts.map +1 -1
package/dist/cli/commands/knowledge.js +6 -2
package/dist/cli/commands/knowledge.js.map +1 -1
package/dist/cli/commands/knowledge.test.js +16 -11
package/dist/cli/commands/knowledge.test.js.map +1 -1
package/dist/cli/commands/next.d.ts.map +1 -1
package/dist/cli/commands/next.js +41 -13
package/dist/cli/commands/next.js.map +1 -1
package/dist/cli/commands/next.test.js +3 -0
package/dist/cli/commands/next.test.js.map +1 -1
package/dist/cli/commands/reset.d.ts +1 -0
package/dist/cli/commands/reset.d.ts.map +1 -1
package/dist/cli/commands/reset.js +179 -67
package/dist/cli/commands/reset.js.map +1 -1
package/dist/cli/commands/reset.test.js +360 -0
package/dist/cli/commands/reset.test.js.map +1 -1
package/dist/cli/commands/rework.d.ts +20 -0
package/dist/cli/commands/rework.d.ts.map +1 -0
package/dist/cli/commands/rework.js +332 -0
package/dist/cli/commands/rework.js.map +1 -0
package/dist/cli/commands/rework.test.d.ts +2 -0
package/dist/cli/commands/rework.test.d.ts.map +1 -0
package/dist/cli/commands/rework.test.js +297 -0
package/dist/cli/commands/rework.test.js.map +1 -0
package/dist/cli/commands/run.d.ts.map +1 -1
package/dist/cli/commands/run.js +59 -31
package/dist/cli/commands/run.js.map +1 -1
package/dist/cli/commands/run.test.js +288 -6
package/dist/cli/commands/run.test.js.map +1 -1
package/dist/cli/commands/skill.d.ts +12 -0
package/dist/cli/commands/skill.d.ts.map +1 -0
package/dist/cli/commands/skill.js +123 -0
package/dist/cli/commands/skill.js.map +1 -0
package/dist/cli/commands/skill.test.d.ts +2 -0
package/dist/cli/commands/skill.test.d.ts.map +1 -0
package/dist/cli/commands/skill.test.js +297 -0
package/dist/cli/commands/skill.test.js.map +1 -0
package/dist/cli/commands/skip.d.ts +1 -1
package/dist/cli/commands/skip.d.ts.map +1 -1
package/dist/cli/commands/skip.js +123 -57
package/dist/cli/commands/skip.js.map +1 -1
package/dist/cli/commands/skip.test.js +91 -0
package/dist/cli/commands/skip.test.js.map +1 -1
package/dist/cli/commands/status.d.ts +1 -0
package/dist/cli/commands/status.d.ts.map +1 -1
package/dist/cli/commands/status.js +57 -10
package/dist/cli/commands/status.js.map +1 -1
package/dist/cli/commands/status.test.js +81 -0
package/dist/cli/commands/status.test.js.map +1 -1
package/dist/cli/commands/update.test.js +252 -0
package/dist/cli/commands/update.test.js.map +1 -1
package/dist/cli/commands/version.test.js +171 -1
package/dist/cli/commands/version.test.js.map +1 -1
package/dist/cli/index.d.ts.map +1 -1
package/dist/cli/index.js +8 -0
package/dist/cli/index.js.map +1 -1
package/dist/core/adapters/adapter.d.ts +14 -0
package/dist/core/adapters/adapter.d.ts.map +1 -1
package/dist/core/adapters/adapter.js.map +1 -1
package/dist/core/adapters/adapter.test.js +10 -0
package/dist/core/adapters/adapter.test.js.map +1 -1
package/dist/core/adapters/claude-code.d.ts.map +1 -1
package/dist/core/adapters/claude-code.js +47 -10
package/dist/core/adapters/claude-code.js.map +1 -1
package/dist/core/adapters/claude-code.test.js +41 -20
package/dist/core/adapters/claude-code.test.js.map +1 -1
package/dist/core/adapters/codex.d.ts.map +1 -1
package/dist/core/adapters/codex.js +5 -1
package/dist/core/adapters/codex.js.map +1 -1
package/dist/core/adapters/codex.test.js +5 -0
package/dist/core/adapters/codex.test.js.map +1 -1
package/dist/core/adapters/universal.d.ts.map +1 -1
package/dist/core/adapters/universal.js +0 -1
package/dist/core/adapters/universal.js.map +1 -1
package/dist/core/adapters/universal.test.js +5 -0
package/dist/core/adapters/universal.test.js.map +1 -1
package/dist/core/assembly/context-gatherer.d.ts.map +1 -1
package/dist/core/assembly/context-gatherer.js +5 -2
package/dist/core/assembly/context-gatherer.js.map +1 -1
package/dist/core/assembly/engine.d.ts.map +1 -1
package/dist/core/assembly/engine.js +10 -2
package/dist/core/assembly/engine.js.map +1 -1
package/dist/core/assembly/engine.test.js +19 -0
package/dist/core/assembly/engine.test.js.map +1 -1
package/dist/core/assembly/knowledge-loader.d.ts +25 -0
package/dist/core/assembly/knowledge-loader.d.ts.map +1 -1
package/dist/core/assembly/knowledge-loader.js +75 -2
package/dist/core/assembly/knowledge-loader.js.map +1 -1
package/dist/core/assembly/knowledge-loader.test.js +388 -1
package/dist/core/assembly/knowledge-loader.test.js.map +1 -1
package/dist/core/assembly/meta-prompt-loader.d.ts +6 -0
package/dist/core/assembly/meta-prompt-loader.d.ts.map +1 -1
package/dist/core/assembly/meta-prompt-loader.js +41 -25
package/dist/core/assembly/meta-prompt-loader.js.map +1 -1
package/dist/core/assembly/preset-loader.d.ts +10 -0
package/dist/core/assembly/preset-loader.d.ts.map +1 -1
package/dist/core/assembly/preset-loader.js +26 -1
package/dist/core/assembly/preset-loader.js.map +1 -1
package/dist/core/assembly/preset-loader.test.js +65 -1
package/dist/core/assembly/preset-loader.test.js.map +1 -1
package/dist/core/assembly/update-mode.d.ts.map +1 -1
package/dist/core/assembly/update-mode.js +10 -4
package/dist/core/assembly/update-mode.js.map +1 -1
package/dist/core/assembly/update-mode.test.js +47 -0
package/dist/core/assembly/update-mode.test.js.map +1 -1
package/dist/core/dependency/dependency.d.ts.map +1 -1
package/dist/core/dependency/dependency.js +3 -2
package/dist/core/dependency/dependency.js.map +1 -1
package/dist/core/dependency/dependency.test.js +2 -0
package/dist/core/dependency/dependency.test.js.map +1 -1
package/dist/core/dependency/eligibility.js +3 -3
package/dist/core/dependency/eligibility.js.map +1 -1
package/dist/core/dependency/eligibility.test.js +2 -0
package/dist/core/dependency/eligibility.test.js.map +1 -1
package/dist/core/dependency/graph.d.ts.map +1 -1
package/dist/core/dependency/graph.js +4 -0
package/dist/core/dependency/graph.js.map +1 -1
package/dist/core/dependency/graph.test.d.ts +2 -0
package/dist/core/dependency/graph.test.d.ts.map +1 -0
package/dist/core/dependency/graph.test.js +262 -0
package/dist/core/dependency/graph.test.js.map +1 -0
package/dist/core/rework/phase-selector.d.ts +24 -0
package/dist/core/rework/phase-selector.d.ts.map +1 -0
package/dist/core/rework/phase-selector.js +98 -0
package/dist/core/rework/phase-selector.js.map +1 -0
package/dist/core/rework/phase-selector.test.d.ts +2 -0
package/dist/core/rework/phase-selector.test.d.ts.map +1 -0
package/dist/core/rework/phase-selector.test.js +138 -0
package/dist/core/rework/phase-selector.test.js.map +1 -0
package/dist/dashboard/generator.d.ts +48 -17
package/dist/dashboard/generator.d.ts.map +1 -1
package/dist/dashboard/generator.js +75 -5
package/dist/dashboard/generator.js.map +1 -1
package/dist/dashboard/generator.test.js +213 -5
package/dist/dashboard/generator.test.js.map +1 -1
package/dist/dashboard/template.d.ts +1 -1
package/dist/dashboard/template.d.ts.map +1 -1
package/dist/dashboard/template.js +755 -114
package/dist/dashboard/template.js.map +1 -1
package/dist/e2e/knowledge.test.js +4 -3
package/dist/e2e/knowledge.test.js.map +1 -1
package/dist/e2e/pipeline.test.js +2 -0
package/dist/e2e/pipeline.test.js.map +1 -1
package/dist/e2e/rework.test.d.ts +6 -0
package/dist/e2e/rework.test.d.ts.map +1 -0
package/dist/e2e/rework.test.js +226 -0
package/dist/e2e/rework.test.js.map +1 -0
package/dist/index.js +0 -0
package/dist/project/adopt.test.js +2 -0
package/dist/project/adopt.test.js.map +1 -1
package/dist/project/claude-md.js +2 -2
package/dist/project/claude-md.js.map +1 -1
package/dist/project/claude-md.test.js +4 -4
package/dist/project/claude-md.test.js.map +1 -1
package/dist/project/detector.d.ts.map +1 -1
package/dist/project/detector.js +4 -1
package/dist/project/detector.js.map +1 -1
package/dist/project/frontmatter.d.ts.map +1 -1
package/dist/project/frontmatter.js +54 -15
package/dist/project/frontmatter.js.map +1 -1
package/dist/project/frontmatter.test.js +2 -2
package/dist/project/frontmatter.test.js.map +1 -1
package/dist/state/rework-manager.d.ts +16 -0
package/dist/state/rework-manager.d.ts.map +1 -0
package/dist/state/rework-manager.js +126 -0
package/dist/state/rework-manager.js.map +1 -0
package/dist/state/rework-manager.test.d.ts +2 -0
package/dist/state/rework-manager.test.d.ts.map +1 -0
package/dist/state/rework-manager.test.js +191 -0
package/dist/state/rework-manager.test.js.map +1 -0
package/dist/state/state-manager.d.ts +13 -0
package/dist/state/state-manager.d.ts.map +1 -1
package/dist/state/state-manager.js +39 -2
package/dist/state/state-manager.js.map +1 -1
package/dist/state/state-manager.test.js +74 -1
package/dist/state/state-manager.test.js.map +1 -1
package/dist/state/state-migration.d.ts +23 -0
package/dist/state/state-migration.d.ts.map +1 -0
package/dist/state/state-migration.js +144 -0
package/dist/state/state-migration.js.map +1 -0
package/dist/state/state-migration.test.d.ts +2 -0
package/dist/state/state-migration.test.d.ts.map +1 -0
package/dist/state/state-migration.test.js +451 -0
package/dist/state/state-migration.test.js.map +1 -0
package/dist/types/assembly.d.ts +2 -0
package/dist/types/assembly.d.ts.map +1 -1
package/dist/types/dependency.d.ts +2 -2
package/dist/types/dependency.d.ts.map +1 -1
package/dist/types/frontmatter.d.ts +100 -7
package/dist/types/frontmatter.d.ts.map +1 -1
package/dist/types/frontmatter.js +89 -1
package/dist/types/frontmatter.js.map +1 -1
package/dist/types/index.d.ts +1 -0
package/dist/types/index.d.ts.map +1 -1
package/dist/types/index.js +1 -0
package/dist/types/index.js.map +1 -1
package/dist/types/lock.d.ts +1 -1
package/dist/types/lock.d.ts.map +1 -1
package/dist/types/rework.d.ts +36 -0
package/dist/types/rework.d.ts.map +1 -0
package/dist/types/rework.js +2 -0
package/dist/types/rework.js.map +1 -0
package/dist/utils/errors.d.ts +1 -0
package/dist/utils/errors.d.ts.map +1 -1
package/dist/utils/errors.js +8 -0
package/dist/utils/errors.js.map +1 -1
package/dist/utils/fs.d.ts +6 -0
package/dist/utils/fs.d.ts.map +1 -1
package/dist/utils/fs.js +13 -0
package/dist/utils/fs.js.map +1 -1
package/dist/validation/config-validator.test.d.ts +2 -0
package/dist/validation/config-validator.test.d.ts.map +1 -0
package/dist/validation/config-validator.test.js +210 -0
package/dist/validation/config-validator.test.js.map +1 -0
package/dist/validation/dependency-validator.test.d.ts +2 -0
package/dist/validation/dependency-validator.test.d.ts.map +1 -0
package/dist/validation/dependency-validator.test.js +215 -0
package/dist/validation/dependency-validator.test.js.map +1 -0
package/dist/validation/frontmatter-validator.test.d.ts +2 -0
package/dist/validation/frontmatter-validator.test.d.ts.map +1 -0
package/dist/validation/frontmatter-validator.test.js +371 -0
package/dist/validation/frontmatter-validator.test.js.map +1 -0
package/dist/validation/state-validator.test.d.ts +2 -0
package/dist/validation/state-validator.test.d.ts.map +1 -0
package/dist/validation/state-validator.test.js +325 -0
package/dist/validation/state-validator.test.js.map +1 -0
package/dist/wizard/suggestion.test.d.ts +2 -0
package/dist/wizard/suggestion.test.d.ts.map +1 -0
package/dist/wizard/suggestion.test.js +115 -0
package/dist/wizard/suggestion.test.js.map +1 -0
package/dist/wizard/wizard.d.ts.map +1 -1
package/dist/wizard/wizard.js +34 -1
package/dist/wizard/wizard.js.map +1 -1
package/knowledge/core/adr-craft.md +4 -0
package/knowledge/core/api-design.md +4 -0
package/knowledge/core/automated-review-tooling.md +203 -0
package/knowledge/core/coding-conventions.md +1 -1
package/knowledge/core/database-design.md +4 -0
package/knowledge/core/design-system-tokens.md +4 -0
package/knowledge/core/domain-modeling.md +4 -0
package/knowledge/core/git-workflow-patterns.md +200 -0
package/knowledge/core/operations-runbook.md +5 -1
package/knowledge/core/security-best-practices.md +4 -0
package/knowledge/core/system-architecture.md +5 -1
package/knowledge/core/task-decomposition.md +118 -3
package/knowledge/core/user-story-innovation.md +13 -0
package/knowledge/core/ux-specification.md +13 -0
package/knowledge/execution/enhancement-workflow.md +201 -0
package/knowledge/execution/task-claiming-strategy.md +130 -0
package/knowledge/execution/tdd-execution-loop.md +172 -0
package/knowledge/execution/worktree-management.md +205 -0
package/knowledge/finalization/apply-fixes-and-freeze.md +12 -0
package/knowledge/finalization/developer-onboarding.md +4 -0
package/knowledge/finalization/implementation-playbook.md +83 -5
package/knowledge/product/gap-analysis.md +5 -1
package/knowledge/product/prd-innovation.md +12 -0
package/knowledge/product/vision-craft.md +213 -0
package/knowledge/review/review-adr.md +12 -0
package/knowledge/review/review-api-design.md +13 -0
package/knowledge/review/review-database-design.md +13 -0
package/knowledge/review/review-domain-modeling.md +5 -1
package/knowledge/review/review-implementation-tasks.md +58 -1
package/knowledge/review/review-methodology.md +11 -0
package/knowledge/review/review-operations.md +12 -0
package/knowledge/review/review-prd.md +13 -0
package/knowledge/review/review-security.md +12 -0
package/knowledge/review/review-system-architecture.md +4 -2
package/knowledge/review/review-testing-strategy.md +11 -0
package/knowledge/review/review-user-stories.md +11 -0
package/knowledge/review/review-ux-specification.md +13 -1
package/knowledge/review/review-vision.md +255 -0
package/knowledge/tools/release-management.md +222 -0
package/knowledge/tools/session-analysis.md +215 -0
package/knowledge/tools/version-strategy.md +200 -0
package/knowledge/validation/critical-path-analysis.md +1 -1
package/knowledge/validation/cross-phase-consistency.md +12 -0
package/knowledge/validation/decision-completeness.md +13 -1
package/knowledge/validation/dependency-validation.md +12 -0
package/knowledge/validation/scope-management.md +12 -0
package/knowledge/validation/traceability.md +12 -0
package/methodology/README.md +37 -0
package/methodology/custom-defaults.yml +12 -1
package/methodology/deep.yml +11 -0
package/methodology/mvp.yml +11 -0
package/package.json +3 -3
package/pipeline/architecture/review-architecture.md +18 -7
package/pipeline/architecture/system-architecture.md +11 -8
package/pipeline/build/multi-agent-resume.md +245 -0
package/pipeline/build/multi-agent-start.md +236 -0
package/pipeline/build/new-enhancement.md +456 -0
package/pipeline/build/quick-task.md +381 -0
package/pipeline/build/single-agent-resume.md +210 -0
package/pipeline/build/single-agent-start.md +207 -0
package/pipeline/consolidation/claude-md-optimization.md +11 -8
package/pipeline/consolidation/workflow-audit.md +15 -11
package/pipeline/decisions/adrs.md +7 -5
package/pipeline/decisions/review-adrs.md +14 -6
package/pipeline/environment/ai-memory-setup.md +18 -12
package/pipeline/environment/automated-pr-review.md +10 -4
package/pipeline/environment/design-system.md +9 -7
package/pipeline/environment/dev-env-setup.md +8 -5
package/pipeline/environment/git-workflow.md +3 -1
package/pipeline/finalization/apply-fixes-and-freeze.md +16 -5
package/pipeline/finalization/developer-onboarding-guide.md +22 -8
package/pipeline/finalization/implementation-playbook.md +40 -11
package/pipeline/foundation/beads.md +10 -7
package/pipeline/foundation/coding-standards.md +6 -3
package/pipeline/foundation/project-structure.md +5 -1
package/pipeline/foundation/tdd.md +10 -6
package/pipeline/foundation/tech-stack.md +9 -9
package/pipeline/integration/add-e2e-testing.md +21 -6
package/pipeline/modeling/domain-modeling.md +10 -7
package/pipeline/modeling/review-domain-modeling.md +17 -6
package/pipeline/parity/platform-parity-review.md +31 -11
package/pipeline/planning/implementation-plan-review.md +21 -10
package/pipeline/planning/implementation-plan.md +52 -19
package/pipeline/pre/create-prd.md +22 -7
package/pipeline/pre/innovate-prd.md +10 -8
package/pipeline/pre/innovate-user-stories.md +9 -7
package/pipeline/pre/review-prd.md +11 -2
package/pipeline/pre/review-user-stories.md +12 -3
package/pipeline/pre/user-stories.md +12 -7
package/pipeline/quality/create-evals.md +10 -6
package/pipeline/quality/operations.md +16 -12
package/pipeline/quality/review-operations.md +19 -10
package/pipeline/quality/review-security.md +21 -11
package/pipeline/quality/review-testing.md +23 -12
package/pipeline/quality/security.md +17 -13
package/pipeline/quality/story-tests.md +6 -4
package/pipeline/specification/api-contracts.md +11 -6
package/pipeline/specification/database-schema.md +12 -6
package/pipeline/specification/review-api.md +18 -9
package/pipeline/specification/review-database.md +18 -9
package/pipeline/specification/review-ux.md +20 -10
package/pipeline/specification/ux-spec.md +8 -5
package/pipeline/validation/critical-path-walkthrough.md +14 -7
package/pipeline/validation/cross-phase-consistency.md +14 -7
package/pipeline/validation/decision-completeness.md +14 -7
package/pipeline/validation/dependency-graph-validation.md +15 -7
package/pipeline/validation/implementability-dry-run.md +15 -7
package/pipeline/validation/scope-creep-check.md +15 -7
package/pipeline/validation/traceability-matrix.md +20 -7
package/pipeline/vision/create-vision.md +267 -0
package/pipeline/vision/innovate-vision.md +157 -0
package/pipeline/vision/review-vision.md +149 -0
package/skills/scaffold-pipeline/SKILL.md +33 -18
package/skills/scaffold-runner/SKILL.md +172 -18

package/knowledge/core/automated-review-tooling.md ADDED Viewed

@@ -0,0 +1,203 @@
+---
+name: automated-review-tooling
+description: Patterns for setting up automated PR code review using AI models (Codex, Gemini) via local CLI, including dual-model review, reconciliation, and CI integration
+topics: [code-review, automation, codex, gemini, pull-requests, ci-cd, review-tooling]
+---
+# Automated Review Tooling
+Automated PR review leverages AI models to provide consistent, thorough code review without manual reviewer bottlenecks. This knowledge covers the local CLI approach (no GitHub Actions), dual-model review patterns, and integration with the PR workflow.
+## Summary
+### Architecture: Local CLI Review
+The scaffold approach uses local CLI review rather than GitHub Actions:
+- **No CI secrets required** — models run locally via CLI tools
+- **Dual-model review** — run Codex and Gemini (when available) for independent perspectives
+- **Agent-managed loop** — Claude orchestrates the review-fix cycle locally
+Components:
+- `AGENTS.md` — reviewer instructions with project-specific rules
+- `docs/review-standards.md` — severity definitions (P0-P3) and criteria
+- `scripts/cli-pr-review.sh` — dual-model review script
+- `scripts/await-pr-review.sh` — polling script for external bot mode
+### Review Severity Levels
+Consistent with the pipeline's review step severity:
+- **P0 (blocking)** — must fix before merge (security, data loss, broken functionality)
+- **P1 (important)** — should fix before merge (bugs, missing tests, performance)
+- **P2 (suggestion)** — consider fixing (style, naming, documentation)
+- **P3 (nit)** — optional (personal preference, minor optimization)
+### Dual-Model Review Pattern
+When both Codex CLI and Gemini CLI are available:
+1. Run both reviewers independently on the PR diff
+2. Collect findings from each
+3. Reconcile: consensus findings get higher confidence
+4. Disagreements are flagged for the implementing agent to resolve
+### Integration with PR Workflow
+The review step integrates into the standard PR flow:
+1. Agent creates PR
+2. Agent runs `scripts/cli-pr-review.sh` (or review runs automatically)
+3. Review findings are posted as PR comments or written to a local file
+4. Agent addresses P0/P1 findings, pushes fixes
+5. Re-review until no P0/P1 findings remain
+6. PR is ready for merge
+## Deep Guidance
+### AGENTS.md Structure
+The `AGENTS.md` file provides reviewer instructions:
+```markdown
+# Code Review Instructions
+## Project Context
+[Brief description of what this project does]
+## Review Focus Areas
+- Security: [project-specific security concerns]
+- Performance: [known hot paths or constraints]
+- Testing: [coverage requirements, test patterns]
+## Coding Standards Reference
+See docs/coding-standards.md for:
+- Naming conventions
+- Error handling patterns
+- Logging standards
+## Known Patterns
+[Project-specific patterns reviewers should enforce]
+## Out of Scope
+[Things reviewers should NOT flag]
+```
+### CLI Review Script Pattern
+The `cli-pr-review.sh` script follows this structure:
+```bash
+#!/usr/bin/env bash
+set -euo pipefail
+# 1. Get the PR diff
+diff=$(gh pr diff "$PR_NUMBER")
+# 2. Run Codex review (if available)
+if command -v codex &>/dev/null; then
+  codex_findings=$(echo "$diff" | codex review --context AGENTS.md)
+fi
+# 3. Run Gemini review (if available)
+if command -v gemini &>/dev/null; then
+  gemini_findings=$(echo "$diff" | gemini review --context AGENTS.md)
+fi
+# 4. Reconcile findings
+# - Findings from both models: HIGH confidence
+# - Findings from one model: MEDIUM confidence
+# - Contradictions: flagged for the implementing agent to resolve
+```
+### Review Standards Document
+`docs/review-standards.md` should define:
+- Severity levels with concrete examples per project
+- What constitutes a blocking review (P0/P1 threshold)
+- Auto-approve criteria (when review can be skipped)
+- Review SLA (how long before auto-approve kicks in)
+### Fallback When Models Unavailable
+If neither Codex nor Gemini CLI is available:
+1. Claude performs an enhanced self-review of the diff
+2. Focus on the AGENTS.md review criteria
+3. Apply the same severity classification
+4. Document that the review was single-model
+### Updating Review Standards Over Time
+As the project evolves:
+- Add new review focus areas when new patterns emerge
+- Remove rules that linters now enforce automatically
+- Update AGENTS.md when architecture changes
+- Track false-positive rates and adjust thresholds
+### Review Finding Reconciliation
+When running dual-model review, reconcile findings systematically:
+```
+Finding Classification:
+┌─────────────────┬──────────┬──────────┬───────────────────┐
+│                 │ Codex    │ Gemini   │ Action            │
+├─────────────────┼──────────┼──────────┼───────────────────┤
+│ Same issue      │ Found    │ Found    │ HIGH confidence   │
+│ Unique finding  │ Found    │ -        │ MEDIUM confidence │
+│ Unique finding  │ -        │ Found    │ MEDIUM confidence │
+│ Contradiction   │ Fix X    │ Keep X   │ Flag for agent    │
+└─────────────────┴──────────┴──────────┴───────────────────┘
+```
+HIGH confidence findings are always addressed. MEDIUM confidence findings are addressed if P0/P1. Contradictions require the implementing agent to make a judgment call and document the reasoning.
+### Security-Focused Review Checklist
+Every automated review should check:
+- No secrets or credentials in the diff (API keys, passwords, tokens)
+- No `eval()` or equivalent unsafe operations introduced
+- SQL queries use parameterized queries (no string concatenation)
+- User input is validated before use
+- Authentication/authorization checks are present on new endpoints
+- Dependencies added are from trusted sources with known versions
+### Performance Review Patterns
+Look for these performance anti-patterns:
+- N+1 queries (loop with individual DB calls)
+- Missing pagination on list endpoints
+- Synchronous operations that should be async
+- Large objects passed by value instead of by reference
+- Missing caching for expensive computations
+- Unbounded growth in arrays or maps
+### Integration with CLAUDE.md
+The workflow-audit step should add review commands to CLAUDE.md:
+```markdown
+## Code Review
+| Command | Purpose |
+|---------|---------|
+| `scripts/cli-pr-review.sh <PR#>` | Run dual-model review |
+| `scripts/await-pr-review.sh <PR#>` | Poll for external review |
+```
+This ensures agents always know how to trigger reviews without consulting separate docs.
+### Common False Positives
+Track and suppress recurring false positives:
+- Test files flagged for "hardcoded values" (test fixtures are intentional)
+- Migration files flagged for "raw SQL" (migrations must use raw SQL)
+- Generated files flagged for style issues (generated code has its own conventions)
+Add suppressions to AGENTS.md under "Out of Scope" to prevent repeated false findings.
+### Review Metrics and Continuous Improvement
+Track these metrics over time to improve review quality:
+- **False positive rate** — findings that are dismissed without action
+- **Escape rate** — bugs that reach production despite review
+- **Time to resolve** — average time between finding and fix
+- **Coverage** — percentage of PRs that receive automated review
+- **Model agreement rate** — how often Codex and Gemini agree
+Use these metrics to calibrate severity thresholds and update AGENTS.md focus areas.

package/knowledge/core/coding-conventions.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 name: coding-conventions
 description: Universal coding standards patterns across languages and linter/formatter configuration
-topics: [coding-standards, linting, formatting, naming-conventions, error-handling, code-style]
+topics: [coding-standards, linting, formatting, naming, error-handling, code-style]
 ---
 # Coding Conventions

package/knowledge/core/database-design.md CHANGED Viewed

@@ -4,6 +4,8 @@ description: Database schema design, normalization, indexing, and migration patt
 topics: [database, schema, sql, nosql, migrations, indexing, data-modeling]
 ---
+## Summary
 ## From Domain Models to Schema
 The domain model defines what the business cares about. The database schema defines how that information is stored. The mapping between them is deliberate, not automatic.
@@ -77,6 +79,8 @@ metadata JSONB NOT NULL DEFAULT '{}'
 **Lookup table** — Store value objects with limited valid values in a reference table. Best for enums with associated data (status codes with descriptions, country codes with names).
+## Deep Guidance
 ### Modeling Relationships
 **One-to-one:** Use a foreign key in either table (typically the dependent side). Consider: could this be columns in the same table instead?

package/knowledge/core/design-system-tokens.md CHANGED Viewed

@@ -4,6 +4,8 @@ description: Design token definitions, base component visual specs, dark mode pa
 topics: [design-system, tokens, colors, typography, spacing, components, dark-mode, pattern-library]
 ---
+## Summary
 ## Design Tokens
 Design tokens are the atomic values that define the visual language. They are variables, not hard-coded values. Every visual property in the application references a token.
@@ -66,6 +68,8 @@ Design tokens are the atomic values that define the visual language. They are va
 --color-focus-ring: rgba(37,99,235,0.5)  // Focus indicator
 ```
+## Deep Guidance
 ### Typography Tokens
 **Font families:**

package/knowledge/core/domain-modeling.md CHANGED Viewed

@@ -4,6 +4,8 @@ description: Domain-driven design patterns for identifying and modeling project
 topics: [ddd, domain-modeling, entities, aggregates, bounded-contexts, domain-events, value-objects]
 ---
+## Summary
 ## Strategic DDD Patterns
 Strategic DDD operates at the system level, answering where domain boundaries fall and how domains communicate.
@@ -54,6 +56,8 @@ Not all parts of a system are equally important or complex. Classify domains by
 **Classification decisions matter because they drive resource allocation.** Over-investing in a generic domain (building a custom auth system when Auth0 exists) wastes effort. Under-investing in a core domain (using a generic CRUD framework for your competitive advantage) produces mediocre software.
+## Deep Guidance
 ## Tactical DDD Patterns
 Tactical DDD patterns structure the code within a bounded context.

package/knowledge/core/git-workflow-patterns.md ADDED Viewed

@@ -0,0 +1,200 @@
+---
+name: git-workflow-patterns
+description: Git branching strategies, commit conventions, PR workflows, merge policies, and CI integration patterns for AI-agent-driven development
+topics: [git, branching, commits, pull-requests, ci-cd, merge-strategy, worktrees]
+---
+# Git Workflow Patterns
+Structured git workflows for AI-agent-driven projects ensure consistent branching, meaningful commit history, automated quality gates, and smooth multi-agent collaboration via worktrees.
+## Summary
+### Branching Strategy
+The trunk-based development model works best for AI-agent workflows:
+- **Main branch** (`main`) — always deployable, protected by CI
+- **Feature branches** — short-lived, created per task or story (`feat/US-xxx-slug`, `fix/bug-description`)
+- **Worktree branches** — parallel agent execution using git worktrees (`agent/<name>/<task>`)
+Branch naming conventions:
+```
+feat/US-001-user-registration    # Feature work tied to a story
+fix/login-timeout-handling       # Bug fix
+chore/update-dependencies        # Maintenance
+docs/api-contract-updates        # Documentation only
+```
+### Commit Conventions
+Use Conventional Commits format for machine-parseable history:
+```
+<type>(<scope>): <description>
+
+[optional body]
+
+[optional footer(s)]
+```
+Types: `feat`, `fix`, `docs`, `style`, `refactor`, `test`, `chore`, `ci`
+AI agent commits should include the Co-Authored-By trailer for attribution and auditability.
+### Pull Request Workflow
+Standard PR lifecycle:
+1. Create branch from `main`
+2. Implement changes with passing tests
+3. Push branch, create PR with structured description
+4. CI runs all quality gates (`make check` or equivalent)
+5. Review (automated or manual)
+6. Squash-merge to maintain clean history
+7. Delete branch after merge
+## Deep Guidance
+### Merge Policies
+- **Squash merge** for feature branches — keeps main history clean
+- **Merge commit** for release branches — preserves the merge point
+- **Never force-push** to main or shared branches
+- **Delete branches** after merge to prevent clutter
+### CI Integration
+Minimum CI pipeline for scaffold projects:
+1. **Lint** — ShellCheck, ESLint, or language-appropriate linter
+2. **Test** — Full test suite including evals
+3. **Build** — Verify compilation/bundling succeeds
+4. **Type check** — For typed languages (TypeScript, etc.)
+### Worktree Patterns for Multi-Agent Work
+Git worktrees enable parallel agent execution on the same repository:
+```bash
+# Create a worktree for an agent
+scripts/setup-agent-worktree.sh agent-name
+# Each worktree gets its own branch and working directory
+# Agents can work simultaneously without conflicts
+```
+Key rules:
+- Each agent works in its own worktree with its own branch
+- Agents coordinate via the implementation plan task assignments
+- Merge conflicts are resolved by the agent whose branch is behind
+- The main worktree is the coordination point
+### Branch Protection Rules
+Configure branch protection for `main`:
+- Require status checks to pass before merge
+- Require branches to be up to date before merge
+- Do not allow direct pushes
+- Require squash merging for feature branches
+### Commit Message Quality
+Good commit messages for AI agents:
+```
+feat(auth): add JWT token refresh endpoint
+
+Implements automatic token refresh when the access token expires
+within 5 minutes. Refresh tokens are rotated on each use.
+
+Closes US-015
+```
+Bad commit messages to avoid:
+- `fix stuff` — no context
+- `WIP` — should never be pushed
+- `update` — what was updated?
+### PR Description Template
+```
+### What changed
+- [1-3 bullet points describing the change]
+### Files modified
+- [Specific files/components modified]
+### How to test
+- [How to verify the changes work]
+### Related
+- [Story ID, issue link, or ADR reference]
+```
+### Conflict Resolution Strategy
+When multiple agents work in parallel:
+1. Agent finishing first merges normally
+2. Agent finishing second rebases onto updated main
+3. If conflicts arise, the second agent resolves them
+4. Never force-push over another agent's work
+Conflict resolution checklist:
+- Pull latest main before starting any task
+- Rebase frequently on long-running branches (every few commits)
+- If a rebase produces conflicts in files you didn't modify, investigate — another agent may have refactored the same area
+- After resolving conflicts, re-run the full test suite before pushing
+- Document unusual conflict resolutions in the commit message body
+### Release Workflow
+For version-tagged releases:
+1. Ensure all PRs are merged to main
+2. Run full quality gates on main
+3. Create a version tag (`v1.2.3`)
+4. Generate changelog from conventional commits
+5. Push tag to trigger release pipeline
+### Semantic Versioning
+Follow semver for version tags:
+- **MAJOR** (`X.0.0`) — breaking API changes, incompatible migrations
+- **MINOR** (`0.X.0`) — new features, backward-compatible additions
+- **PATCH** (`0.0.X`) — bug fixes, documentation, internal refactors
+Pre-release versions for staging: `v1.2.3-rc.1`, `v1.2.3-beta.1`
+### Git Hooks
+Pre-commit hooks for quality enforcement:
+```bash
+#!/usr/bin/env bash
+# .husky/pre-commit or .git/hooks/pre-commit
+set -euo pipefail
+# Run linter on staged files
+make lint
+# Validate frontmatter on changed command files
+./scripts/validate-frontmatter.sh $(git diff --cached --name-only -- 'commands/*.md')
+```
+Pre-push hooks for broader validation:
+```bash
+#!/usr/bin/env bash
+# .husky/pre-push or .git/hooks/pre-push
+set -euo pipefail
+# Run full test suite before pushing
+make test
+```
+### Common Anti-Patterns
+Patterns to avoid in AI-agent git workflows:
+1. **Long-lived branches** — branches older than 1 day risk merge conflicts. Keep branches short-lived.
+2. **Giant PRs** — PRs with 500+ lines changed are hard to review. Split into smaller, focused PRs.
+3. **Skipping hooks** — `--no-verify` hides real issues. Fix the root cause instead.
+4. **Rebasing shared branches** — rebase only branches that you alone use. Shared branches should be integrated with merge commits instead.
+5. **Committing generated files** — lock files yes, build output no. Use `.gitignore` aggressively.
+6. **Force-pushing to main** — this is never acceptable. Even if CI is broken, create a fix branch.
+7. **Mixing concerns in one commit** — each commit should be atomic and focused on one change.

package/knowledge/core/operations-runbook.md CHANGED Viewed

@@ -1,9 +1,11 @@
 ---
 name: operations-runbook
 description: Deployment pipeline, deployment strategies, monitoring, alerting, and incident response
-topics: [operations, cicd, deployment, monitoring, incident-response, alerting, rollback]
+topics: [operations, ci-cd, deployment, monitoring, incident-response, alerting, rollback]
 ---
+## Summary
 ## Dev Environment Reference
 Local development setup (prerequisites, env vars, one-command setup, database, hot reload, common commands, troubleshooting) is defined in `docs/dev-setup.md`, created by the Dev Setup prompt. The operations runbook should reference it rather than redefine it.
@@ -73,6 +75,8 @@ Operations adds (main branch only):
 - Tag artifacts with the git SHA for traceability
 - Set retention policies (keep last 30 days, keep releases forever)
+## Deep Guidance
 ## Deployment Strategies
 ### Blue-Green Deployment

package/knowledge/core/security-best-practices.md CHANGED Viewed

@@ -4,6 +4,8 @@ description: OWASP Top 10, authentication, authorization, data protection, and t
 topics: [security, owasp, authentication, authorization, threat-modeling, secrets-management, dependency-auditing]
 ---
+## Summary
 ## OWASP Top 10
 The OWASP Top 10 represents the most critical security risks to web applications. Every project should evaluate each risk and implement appropriate mitigations.
@@ -55,6 +57,8 @@ Sensitive data exposed due to weak or missing encryption.
 - Hash passwords with bcrypt, scrypt, or Argon2 (NEVER MD5 or SHA-256 for passwords)
 - Don't store sensitive data you don't need — the safest data is data you don't have
+## Deep Guidance
 ### A03: Injection
 Untrusted data sent to an interpreter as part of a command or query, causing unintended execution.

package/knowledge/core/system-architecture.md CHANGED Viewed

@@ -1,9 +1,11 @@
 ---
 name: system-architecture
 description: Architecture patterns, component design, and project structure
-topics: [architecture, components, modules, data-flows, project-structure, state-management]
+topics: [architecture, components, modules, data-flow, project-structure, state-management]
 ---
+## Summary
 ## Architecture Patterns
 ### Layered Architecture
@@ -81,6 +83,8 @@ For most scaffold pipeline projects:
 4. Use **microservices** only if you have multiple teams that need independent deployment, or specific services with dramatically different scaling needs.
 5. Avoid **layered** unless the application is genuinely simple (CRUD with minimal business logic).
+## Deep Guidance
 ## Component Design
 ### Identifying Components from Domain Models

package/knowledge/core/task-decomposition.md CHANGED Viewed

@@ -16,7 +16,14 @@ User stories bridge PRD features and implementation tasks. Each story decomposes
 ### Task Sizing
-Each task should be completable in a single AI agent session (30-90 minutes of agent time). A well-sized task has a clear title (usable as commit message), touches 1-5 files, produces a testable result, and has no ambiguity about "done."
+Each task should be completable in a single AI agent session (30-90 minutes of agent time). A well-sized task has a clear title (usable as a commit message), touches 1-3 application files (hard limit; justify exceptions), produces at most ~150 lines of net-new application code (excluding tests and generated files), and has no ambiguity about "done."
+Five rules govern agent-friendly task sizing:
+1. **Three-File Rule** — Max 3 application files modified (test files excluded)
+2. **150-Line Budget** — Max ~150 lines of net-new application code per task
+3. **Single-Concern Rule** — One task does one thing (no "and" connecting unrelated work)
+4. **Decision-Free Execution** — All design decisions resolved in the task description; agents implement — they don't architect
+5. **Test Co-location** — Tests live in the same task as the code they test; no deferred testing
 Split large tasks by layer (API, UI, DB, tests), by feature slice (happy path, validation, edge cases), or by entity. Combine tiny tasks that touch the same file and have no independent value.
@@ -157,8 +164,11 @@ Each task should be completable in a single AI agent session (typically 30-90 mi
 **A well-sized task:**
 - Has a clear, specific title that could be a commit message
-- Touches 1-5 files (not counting test files)
-- Produces a testable, verifiable result
+- Touches 1-3 application files (hard limit; test files excluded from count)
+- Produces at most ~150 lines of net-new application code (excluding tests and generated files)
+- Does exactly one thing (passes the single-concern test: describable without "and")
+- Requires no design decisions from the agent (all choices resolved in the description)
+- Includes co-located tests (the task isn't done until tests pass)
 - Has no ambiguity about what "done" means
 - Can be code-reviewed independently
@@ -376,6 +386,111 @@ Does NOT assume:
 - Any auth endpoints exist (this is the first)
 ```
+### Agent Executability Heuristics
+Five formalized rules for ensuring tasks are the right size for AI agent execution. These are hard rules with an escape hatch — tasks exceeding limits must be split unless the author provides explicit justification via `<!-- agent-size-exception: reason -->`.
+#### Rule 1: Three-File Rule
+A task modifies at most 3 application files (test files don't count toward this limit). If it would touch more, split by layer or concern.
+**Why 3:** Reading 3 files plus their context (imports, types, interfaces) consumes roughly 40-60% of a standard agent context window, leaving room for the task description, test code, and reasoning. At 5+ files, context pressure causes agents to lose track of cross-file consistency.
+**Splitting when exceeded:**
+- 4 files across 2 layers → split into one task per layer
+- 5 files in the same layer → split by entity or concern within the layer
+- Config files touched alongside application files → separate config task if non-trivial
+#### Rule 2: 150-Line Budget
+A task produces at most ~150 lines of net-new application code (excluding tests, generated files, and config). This keeps the entire change reviewable in one screen and within agent context budgets.
+**Why 150:** Agent output quality degrades measurably after ~200 lines of new code in a single session. At 150 lines, the agent can hold the entire change in context while writing tests and verifying correctness.
+**Estimating line count from task descriptions:**
+- A CRUD endpoint with validation: ~80-120 lines
+- A UI component with state management: ~100-150 lines
+- A database migration with seed data: ~50-80 lines
+- A full feature slice (API + UI + tests): ~300+ lines — MUST split
+#### Rule 3: Single-Concern Rule
+A task does exactly one thing. The test: can you describe what this task does in one sentence without using "and" to join unrelated pieces of work?
+**Passes the test:**
+- "Implement the user registration endpoint with input validation" (validation is part of the endpoint)
+- "Create the order model with database migration" (migration is part of model creation)
+**Fails the test:**
+- "Add the API endpoint AND update the dashboard" — two tasks
+- "Implement authentication AND set up the database" — two tasks
+- "Build the payment form AND integrate with Stripe AND add webhook handling" — three tasks
+**Splitting signals:**
+- Task description contains "and" connecting unrelated work
+- Task spans multiple architectural layers (API + frontend + database in one task)
+- Task affects multiple bounded contexts or feature domains
+- Task has acceptance criteria for two distinct user-facing behaviors
+#### Rule 4: Decision-Free Execution
+The task description must resolve all design decisions upfront. The agent implements; it doesn't architect. No task should require the agent to:
+- Choose between patterns (repository vs active record, REST vs GraphQL)
+- Select libraries or tools
+- Decide module structure or file organization
+- Determine API contract shapes (these come from upstream specs)
+**Red flags in task descriptions:**
+- "Choose the best approach for..."
+- "Determine whether to use X or Y"
+- "Decide how to structure..."
+- "Evaluate options for..."
+- "Select the most appropriate..."
+- "Figure out the best way to..."
+If a task contains any of these, the decision belongs in the task description — resolved by the plan author — not left to agent judgment. Local implementation choices (variable names, loop style, internal helper structure) are fine.
+#### Rule 5: Test Co-location
+Tests live in the same task as the code they test. The task follows TDD: write the failing test, then the implementation, then verify. The task isn't done until tests pass.
+**Anti-pattern:** "Tasks 1-8: implement features. Task 9: write tests for everything." This produces untestable code, violates TDD, and creates a single massive testing task that exceeds all size limits.
+**What co-location looks like:**
+```
+Task: Implement user registration endpoint
+  1. Write failing integration test (POST /register with valid data → 201)
+  2. Implement endpoint to make test pass
+  3. Write failing validation test (invalid email → 400)
+  4. Add validation to make test pass
+  5. Commit
+```
+#### Escape Hatch
+If a task genuinely can't be split further without creating tasks that have no independent value, add an explicit annotation in the task description: `<!-- agent-size-exception: [reason] -->`. The review pass flags unjustified exceptions but accepts reasoned ones.
+**Valid exception reasons:**
+- "Migration task touches 4 files but they're all trivial one-line renames"
+- "Config file changes across 4 files are mechanical and identical in structure"
+- "Test setup file is large but generated from a template"
+**Invalid exception reasons:**
+- "It's easier to do it all at once" (convenience is not a justification)
+- "The files are related" (related files can still be separate tasks)
+- "It would create too many tasks" (many small tasks are preferable to a few large ones)
+#### Concrete "Too Big" Examples
+| Task (Too Big) | Violations | Split Into |
+|---------------|-----------|------------|
+| "Implement user authentication" (8+ files, registration + login + reset + middleware) | Three-File, Single-Concern | 4 tasks: registration endpoint, login endpoint, password reset flow, auth middleware |
+| "Build the settings page with all preferences" (6 files, multiple forms + APIs) | Three-File, 150-Line, Single-Concern | Per-group: profile settings, notification settings, security settings |
+| "Set up database with all migrations and seed data" (10+ files, every entity) | Three-File, 150-Line | Per-entity: users table, orders table, products table, then seed data task |
+| "Create API client with retry, caching, and auth" (4 concerns in one module) | Single-Concern, Decision-Free | 3 tasks: base client with auth, retry middleware, cache layer |
+| "Implement the dashboard with charts, filters, and real-time updates" (5+ files, 300+ lines) | All five rules | 4 tasks: dashboard layout + routing, chart components, filter system, WebSocket integration |
 ### Common Pitfalls
 **Tasks too vague.** "Implement backend" or "Set up auth" with no acceptance criteria, no file paths, and no test requirements. An agent receiving this task will guess wrong about scope, structure, and conventions. Fix: every task must specify exact files to create/modify, acceptance criteria, and test requirements.