prizmkit 1.1.0 → 1.1.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bundled/VERSION.json +3 -3
- package/bundled/adapters/claude/agent-adapter.js +18 -0
- package/bundled/adapters/claude/command-adapter.js +1 -27
- package/bundled/agents/prizm-dev-team-critic.md +2 -0
- package/bundled/agents/prizm-dev-team-dev.md +2 -0
- package/bundled/agents/prizm-dev-team-reviewer.md +2 -0
- package/bundled/dev-pipeline/README.md +63 -63
- package/bundled/dev-pipeline/assets/feature-list-example.json +1 -1
- package/bundled/dev-pipeline/assets/prizm-dev-team-integration.md +1 -1
- package/bundled/dev-pipeline/{launch-daemon.sh → launch-feature-daemon.sh} +33 -33
- package/bundled/dev-pipeline/launch-refactor-daemon.sh +454 -0
- package/bundled/dev-pipeline/lib/branch.sh +1 -1
- package/bundled/dev-pipeline/reset-feature.sh +3 -3
- package/bundled/dev-pipeline/reset-refactor.sh +312 -0
- package/bundled/dev-pipeline/{retry-bug.sh → retry-bugfix.sh} +47 -59
- package/bundled/dev-pipeline/retry-feature.sh +41 -54
- package/bundled/dev-pipeline/retry-refactor.sh +358 -0
- package/bundled/dev-pipeline/run-bugfix.sh +6 -0
- package/bundled/dev-pipeline/{run.sh → run-feature.sh} +31 -31
- package/bundled/dev-pipeline/run-refactor.sh +787 -0
- package/bundled/dev-pipeline/scripts/generate-bootstrap-prompt.py +177 -10
- package/bundled/dev-pipeline/scripts/generate-refactor-prompt.py +419 -0
- package/bundled/dev-pipeline/scripts/init-refactor-pipeline.py +393 -0
- package/bundled/dev-pipeline/scripts/update-refactor-status.py +726 -0
- package/bundled/dev-pipeline/templates/agent-prompts/critic-code-challenge.md +13 -0
- package/bundled/dev-pipeline/templates/agent-prompts/critic-plan-challenge.md +7 -0
- package/bundled/dev-pipeline/templates/agent-prompts/dev-fix.md +7 -0
- package/bundled/dev-pipeline/templates/agent-prompts/dev-implement.md +26 -0
- package/bundled/dev-pipeline/templates/agent-prompts/dev-resume.md +5 -0
- package/bundled/dev-pipeline/templates/agent-prompts/reviewer-analyze.md +5 -0
- package/bundled/dev-pipeline/templates/agent-prompts/reviewer-review.md +12 -0
- package/bundled/dev-pipeline/templates/bootstrap-tier1.md +29 -2
- package/bundled/dev-pipeline/templates/bootstrap-tier2.md +8 -7
- package/bundled/dev-pipeline/templates/bootstrap-tier3.md +11 -10
- package/bundled/dev-pipeline/templates/bugfix-bootstrap-prompt.md +2 -3
- package/bundled/dev-pipeline/templates/feature-list-schema.json +1 -1
- package/bundled/dev-pipeline/templates/refactor-list-schema.json +159 -0
- package/bundled/dev-pipeline/templates/sections/ac-verification-checklist.md +13 -0
- package/bundled/dev-pipeline/templates/sections/feature-context.md +1 -1
- package/bundled/dev-pipeline/templates/sections/phase-analyze-agent.md +9 -8
- package/bundled/dev-pipeline/templates/sections/phase-analyze-full.md +9 -8
- package/bundled/dev-pipeline/templates/sections/phase-browser-verification.md +2 -1
- package/bundled/dev-pipeline/templates/sections/phase-critic-code.md +8 -10
- package/bundled/dev-pipeline/templates/sections/phase-critic-plan-full.md +9 -10
- package/bundled/dev-pipeline/templates/sections/phase-critic-plan.md +8 -9
- package/bundled/dev-pipeline/templates/sections/phase-implement-agent.md +7 -10
- package/bundled/dev-pipeline/templates/sections/phase-implement-full.md +8 -15
- package/bundled/dev-pipeline/templates/sections/phase-review-agent.md +7 -12
- package/bundled/dev-pipeline/templates/sections/phase-review-full.md +8 -19
- package/bundled/dev-pipeline/templates/sections/test-failure-recovery.md +75 -0
- package/bundled/skills/_metadata.json +33 -6
- package/bundled/skills/app-planner/SKILL.md +105 -320
- package/bundled/skills/app-planner/assets/app-design-guide.md +101 -0
- package/bundled/skills/app-planner/references/frontend-design-guide.md +1 -1
- package/bundled/skills/app-planner/references/project-brief-guide.md +49 -80
- package/bundled/skills/bug-fix-workflow/SKILL.md +2 -2
- package/bundled/skills/bug-planner/SKILL.md +68 -5
- package/bundled/skills/bug-planner/scripts/validate-bug-list.py +3 -2
- package/bundled/skills/bugfix-pipeline-launcher/SKILL.md +19 -5
- package/bundled/skills/{dev-pipeline-launcher → feature-pipeline-launcher}/SKILL.md +32 -32
- package/bundled/skills/feature-planner/SKILL.md +337 -0
- package/bundled/skills/{app-planner → feature-planner}/assets/evaluation-guide.md +4 -4
- package/bundled/skills/{app-planner → feature-planner}/assets/planning-guide.md +3 -171
- package/bundled/skills/{app-planner → feature-planner}/references/browser-interaction.md +6 -5
- package/bundled/skills/feature-planner/references/decomposition-patterns.md +75 -0
- package/bundled/skills/{app-planner → feature-planner}/references/error-recovery.md +8 -8
- package/bundled/skills/{app-planner → feature-planner}/references/incremental-feature-planning.md +1 -1
- package/bundled/skills/{app-planner/references/new-app-planning.md → feature-planner/references/new-project-planning.md} +1 -1
- package/bundled/skills/{app-planner → feature-planner}/scripts/validate-and-generate.py +4 -4
- package/bundled/skills/feature-workflow/SKILL.md +23 -23
- package/bundled/skills/prizm-kit/SKILL.md +1 -3
- package/bundled/skills/prizmkit-analyze/SKILL.md +2 -5
- package/bundled/skills/prizmkit-code-review/SKILL.md +2 -2
- package/bundled/skills/prizmkit-committer/SKILL.md +4 -8
- package/bundled/skills/prizmkit-deploy/SKILL.md +1 -5
- package/bundled/skills/prizmkit-implement/SKILL.md +3 -50
- package/bundled/skills/prizmkit-init/SKILL.md +5 -77
- package/bundled/skills/prizmkit-plan/SKILL.md +1 -12
- package/bundled/skills/prizmkit-prizm-docs/SKILL.md +6 -24
- package/bundled/skills/prizmkit-prizm-docs/assets/PRIZM-SPEC.md +21 -0
- package/bundled/skills/prizmkit-retrospective/SKILL.md +12 -117
- package/bundled/skills/recovery-workflow/SKILL.md +166 -316
- package/bundled/skills/recovery-workflow/evals/evals.json +29 -13
- package/bundled/skills/recovery-workflow/scripts/detect-recovery-state.py +232 -274
- package/bundled/skills/refactor-pipeline-launcher/SKILL.md +352 -0
- package/bundled/skills/refactor-planner/SKILL.md +436 -0
- package/bundled/skills/refactor-planner/assets/planning-guide.md +292 -0
- package/bundled/skills/refactor-planner/references/behavior-preservation.md +301 -0
- package/bundled/skills/refactor-planner/references/refactor-scoping-guide.md +221 -0
- package/bundled/skills/refactor-planner/scripts/validate-and-generate-refactor.py +786 -0
- package/bundled/skills/refactor-workflow/SKILL.md +299 -319
- package/package.json +1 -1
- package/src/clean.js +3 -3
- package/src/scaffold.js +6 -6
- /package/bundled/skills/{dev-pipeline-launcher → feature-pipeline-launcher}/scripts/preflight-check.py +0 -0
|
@@ -10,20 +10,19 @@ If CRITIC:MISSING — skip this phase entirely and proceed. Log: "Critic agent n
|
|
|
10
10
|
|
|
11
11
|
**If {{CRITIC_COUNT}} = 1 → Single Critic** (skip to CP-2.5 after this):
|
|
12
12
|
|
|
13
|
-
Spawn
|
|
13
|
+
**Spawn Agent**:
|
|
14
|
+
| Parameter | Value |
|
|
15
|
+
|-----------|-------|
|
|
16
|
+
| subagent_type | prizm-dev-team-critic |
|
|
17
|
+
| mode | plan |
|
|
18
|
+
| run_in_background | false |
|
|
14
19
|
|
|
15
|
-
Prompt
|
|
16
|
-
>
|
|
17
|
-
> **MODE: Plan Challenge**
|
|
18
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST — Section 3 has project context, Section 4 has file manifest.
|
|
19
|
-
> 2. Read `.prizm-docs/root.prizm` and relevant L1/L2 docs for affected modules.
|
|
20
|
-
> 3. Read existing source files in the modules this plan touches.
|
|
21
|
-
> 4. Challenge plan.md against the project's existing architecture, patterns, and style.
|
|
22
|
-
> Write `.prizmkit/specs/{{FEATURE_SLUG}}/challenge-report.md` with findings (or 'No significant challenges')."
|
|
20
|
+
**Prompt**:
|
|
21
|
+
> {{AGENT_PROMPT_CRITIC_PLAN_CHALLENGE}}
|
|
23
22
|
|
|
24
23
|
**If {{CRITIC_COUNT}} = 3 → Multi-Critic Voting** (skip Single Critic above):
|
|
25
24
|
|
|
26
|
-
Spawn 3 Critic agents sequentially (each with run_in_background=false), each with a different focus lens:
|
|
25
|
+
Spawn 3 Critic agents sequentially (each with mode="plan", run_in_background=false), each with a different focus lens:
|
|
27
26
|
|
|
28
27
|
Critic-A prompt (append to base prompt above):
|
|
29
28
|
> "**Focus Lens: Architecture & Scalability.** Prioritize: architectural pattern fit, scalability implications, over-engineering risks, component boundary design.
|
|
@@ -6,16 +6,15 @@ ls {{CRITIC_SUBAGENT_PATH}} 2>/dev/null && echo "CRITIC:READY" || echo "CRITIC:M
|
|
|
6
6
|
```
|
|
7
7
|
If CRITIC:MISSING — skip this phase entirely and proceed. Log: "Critic agent not installed — skipping Plan Challenge."
|
|
8
8
|
|
|
9
|
-
Spawn
|
|
9
|
+
**Spawn Agent**:
|
|
10
|
+
| Parameter | Value |
|
|
11
|
+
|-----------|-------|
|
|
12
|
+
| subagent_type | prizm-dev-team-critic |
|
|
13
|
+
| mode | plan |
|
|
14
|
+
| run_in_background | false |
|
|
10
15
|
|
|
11
|
-
Prompt
|
|
12
|
-
>
|
|
13
|
-
> **MODE: Plan Challenge**
|
|
14
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST — Section 3 has project context, Section 4 has file manifest.
|
|
15
|
-
> 2. Read `.prizm-docs/root.prizm` and relevant L1/L2 docs for affected modules.
|
|
16
|
-
> 3. Read existing source files in the modules this plan touches.
|
|
17
|
-
> 4. Challenge plan.md against the project's existing architecture, patterns, and style.
|
|
18
|
-
> Write `.prizmkit/specs/{{FEATURE_SLUG}}/challenge-report.md` with findings (or 'No significant challenges')."
|
|
16
|
+
**Prompt**:
|
|
17
|
+
> {{AGENT_PROMPT_CRITIC_PLAN_CHALLENGE}}
|
|
19
18
|
|
|
20
19
|
Wait for Critic to return.
|
|
21
20
|
- Read challenge-report.md. For items marked CRITICAL/HIGH: decide whether to adjust plan.md or document why the plan stands.
|
|
@@ -2,17 +2,14 @@
|
|
|
2
2
|
|
|
3
3
|
**Build artifacts rule** (passed to Dev): After any build/compile command (`go build`, `npm run build`, `tsc`, etc.), ensure the output binary or build directory is in `.gitignore`. Never commit compiled binaries, build output, or generated artifacts.
|
|
4
4
|
|
|
5
|
-
Spawn
|
|
5
|
+
**Spawn Agent**:
|
|
6
|
+
| Parameter | Value |
|
|
7
|
+
|-----------|-------|
|
|
8
|
+
| subagent_type | prizm-dev-team-dev |
|
|
9
|
+
| run_in_background | false |
|
|
6
10
|
|
|
7
|
-
Prompt
|
|
8
|
-
>
|
|
9
|
-
> **IMPORTANT**: Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST — Section 3 has Prizm Context (TRAPS/RULES), Section 4 has File Manifest with paths and interfaces.
|
|
10
|
-
> ⚠️ DO NOT re-read source files already listed in Section 4 File Manifest unless you need implementation detail beyond the interface summary.
|
|
11
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` for full context.
|
|
12
|
-
> 2. Run `/prizmkit-implement` to execute the tasks in plan.md. Use `TEST_CMD=<TEST_CMD>` for testing. Baseline failures: `BASELINE_FAILURES=<BASELINE_FAILURES>`.
|
|
13
|
-
> 3. After implement completes, verify the '## Implementation Log' section was written to context-snapshot.md.
|
|
14
|
-
> 4. Do NOT execute any git commands (no git add/commit/reset/push).
|
|
15
|
-
> Do NOT exit until all tasks are [x] and the '## Implementation Log' section is written in context-snapshot.md."
|
|
11
|
+
**Prompt**:
|
|
12
|
+
> {{AGENT_PROMPT_DEV_IMPLEMENT}}
|
|
16
13
|
|
|
17
14
|
Wait for Dev to return. All tasks must be `[x]`, tests pass.
|
|
18
15
|
|
|
@@ -9,17 +9,14 @@ grep -c '^\- \[ \]' .prizmkit/specs/{{FEATURE_SLUG}}/plan.md 2>/dev/null || true
|
|
|
9
9
|
- If result is `0` (all tasks already `[x]`) → **SKIP this phase**, go directly to Review. Do NOT spawn Dev.
|
|
10
10
|
- If result is non-zero → spawn Dev agent below.
|
|
11
11
|
|
|
12
|
-
Spawn
|
|
12
|
+
**Spawn Agent**:
|
|
13
|
+
| Parameter | Value |
|
|
14
|
+
|-----------|-------|
|
|
15
|
+
| subagent_type | prizm-dev-team-dev |
|
|
16
|
+
| run_in_background | false |
|
|
13
17
|
|
|
14
|
-
Prompt
|
|
15
|
-
>
|
|
16
|
-
> **IMPORTANT**: Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST — Section 3 has Prizm Context (TRAPS/RULES), Section 4 has File Manifest with paths and interfaces.
|
|
17
|
-
> ⚠️ DO NOT re-read source files already listed in Section 4 File Manifest unless you need implementation detail beyond the interface summary.
|
|
18
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` for full context.
|
|
19
|
-
> 2. Run `/prizmkit-implement` to execute the tasks in plan.md. Use `TEST_CMD=<TEST_CMD>` for testing. Baseline failures: `BASELINE_FAILURES=<BASELINE_FAILURES>`.
|
|
20
|
-
> 3. After implement completes, verify the '## Implementation Log' section was written to context-snapshot.md.
|
|
21
|
-
> 4. Do NOT execute any git commands (no git add/commit/reset/push).
|
|
22
|
-
> Do NOT exit until all tasks are [x] and the '## Implementation Log' section is written in context-snapshot.md."
|
|
18
|
+
**Prompt**:
|
|
19
|
+
> {{AGENT_PROMPT_DEV_IMPLEMENT}}
|
|
23
20
|
|
|
24
21
|
**Gate Check — Implementation Log**:
|
|
25
22
|
After Dev agent returns, verify the Implementation Log was written:
|
|
@@ -31,11 +28,7 @@ If GATE:MISSING — send message to Dev (re-spawn if needed): "Write the '## Imp
|
|
|
31
28
|
Wait for Dev to return. **If Dev times out before all tasks are `[x]`**:
|
|
32
29
|
1. Check progress: `grep -c '^\- \[ \]' .prizmkit/specs/{{FEATURE_SLUG}}/plan.md`
|
|
33
30
|
2. If any tasks remain: re-spawn Dev with this recovery prompt:
|
|
34
|
-
>
|
|
35
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` — Section 4 has File Manifest, 'Implementation Log' (if present) shows what was already done.
|
|
36
|
-
> 2. Run `git diff HEAD` to see actual code changes already made.
|
|
37
|
-
> 3. Run `/prizmkit-implement` to complete the remaining `[ ]` tasks. Use `TEST_CMD=<TEST_CMD>` for testing.
|
|
38
|
-
> 4. Do NOT execute any git commands."
|
|
31
|
+
> {{AGENT_PROMPT_DEV_RESUME}}
|
|
39
32
|
3. Max 2 recovery retries. After 2 failures, orchestrator implements remaining tasks directly.
|
|
40
33
|
|
|
41
34
|
All tasks `[x]`, tests pass.
|
|
@@ -1,18 +1,13 @@
|
|
|
1
1
|
### Review + Test — Reviewer Subagent
|
|
2
2
|
|
|
3
|
-
Spawn
|
|
3
|
+
**Spawn Agent**:
|
|
4
|
+
| Parameter | Value |
|
|
5
|
+
|-----------|-------|
|
|
6
|
+
| subagent_type | prizm-dev-team-reviewer |
|
|
7
|
+
| run_in_background | false |
|
|
4
8
|
|
|
5
|
-
Prompt
|
|
6
|
-
>
|
|
7
|
-
> **IMPORTANT**: Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST.
|
|
8
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md`:
|
|
9
|
-
> - Section 3: Prizm Context (RULES, PATTERNS to check against)
|
|
10
|
-
> - Section 4: File Manifest (original file structure)
|
|
11
|
-
> - '## Implementation Log': what Dev changed, key decisions, discoveries
|
|
12
|
-
> 2. Run prizmkit-code-review (both phases): Phase 1 diagnostic review (spec compliance, code quality, correctness), then Phase 2 fix strategy formulation for any findings. Read ONLY files listed in Implementation Log for diagnosis; MAY read additional files for impact analysis.
|
|
13
|
-
> 3. Run the full test suite — **ONLY if the Implementation Log does not already confirm all tests passing**. If the log states tests passed, trust it and skip the re-run. When running: `$TEST_CMD 2>&1 | tee /tmp/review-test-out.txt | tail -20`, then grep the file for details — do NOT re-run the suite multiple times. Write and execute integration tests covering all user stories.
|
|
14
|
-
> 4. Write structured '## Review Notes' to context-snapshot.md with Fix Instructions (Root Cause, Impact, Fix Strategy, Code Guidance, Verification for each finding) and Re-Review Expectations.
|
|
15
|
-
> Report verdict: PASS, PASS_WITH_WARNINGS, or NEEDS_FIXES."
|
|
9
|
+
**Prompt**:
|
|
10
|
+
> {{AGENT_PROMPT_REVIEWER_REVIEW}}
|
|
16
11
|
|
|
17
12
|
Wait for Reviewer to return.
|
|
18
13
|
|
|
@@ -1,18 +1,13 @@
|
|
|
1
1
|
### Review + Test — Reviewer Agent
|
|
2
2
|
|
|
3
|
-
Spawn
|
|
3
|
+
**Spawn Agent**:
|
|
4
|
+
| Parameter | Value |
|
|
5
|
+
|-----------|-------|
|
|
6
|
+
| subagent_type | prizm-dev-team-reviewer |
|
|
7
|
+
| run_in_background | false |
|
|
4
8
|
|
|
5
|
-
Prompt
|
|
6
|
-
>
|
|
7
|
-
> **IMPORTANT**: Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` FIRST.
|
|
8
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md`:
|
|
9
|
-
> - Section 3: Prizm Context (RULES, PATTERNS to check against)
|
|
10
|
-
> - Section 4: File Manifest (original file structure)
|
|
11
|
-
> - '## Implementation Log': what Dev changed, key decisions, discoveries
|
|
12
|
-
> 2. Run prizmkit-code-review (both phases): Phase 1 diagnostic review (spec compliance, code quality, correctness), then Phase 2 fix strategy formulation for any findings. Read ONLY files listed in Implementation Log for diagnosis; MAY read additional files for impact analysis.
|
|
13
|
-
> 3. Run the full test suite using `TEST_CMD=<TEST_CMD>` — **ONLY if the Implementation Log does not already confirm all tests passing**. If Implementation Log states tests passed, trust it and skip the re-run. When running tests: `$TEST_CMD 2>&1 | tee /tmp/review-test-out.txt | tail -20`, then grep `/tmp/review-test-out.txt` for details — do NOT re-run the suite multiple times. Write and execute integration tests covering all user stories from spec.md.
|
|
14
|
-
> 4. Write structured '## Review Notes' to context-snapshot.md with Fix Instructions (Root Cause, Impact, Fix Strategy, Code Guidance, Verification for each finding) and Re-Review Expectations.
|
|
15
|
-
> Report verdict: PASS, PASS_WITH_WARNINGS, or NEEDS_FIXES."
|
|
9
|
+
**Prompt**:
|
|
10
|
+
> {{AGENT_PROMPT_REVIEWER_REVIEW}}
|
|
16
11
|
|
|
17
12
|
Wait for Reviewer to return.
|
|
18
13
|
|
|
@@ -24,13 +19,7 @@ grep -q "## Review Notes" .prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md &
|
|
|
24
19
|
If GATE:MISSING — send message to Reviewer (re-spawn if needed): "Write the '## Review Notes' section to context-snapshot.md with structured Fix Instructions. Include: verdict, findings with Root Cause/Impact/Fix Strategy/Code Guidance/Verification, and Re-Review Expectations."
|
|
25
20
|
|
|
26
21
|
- If NEEDS_FIXES: spawn Dev to fix with this prompt:
|
|
27
|
-
>
|
|
28
|
-
> 1. Read `.prizmkit/specs/{{FEATURE_SLUG}}/context-snapshot.md` — '## Review Notes' section contains structured Fix Instructions with exact steps.
|
|
29
|
-
> 2. Follow Fix Instructions in order (respect Depends On / Blocks dependencies). Each FIX-N has: Root Cause, Fix Strategy, Code Guidance, and Verification criteria.
|
|
30
|
-
> 3. After each fix, run the Verification command listed in that FIX-N to confirm it works.
|
|
31
|
-
> 4. Use `TEST_CMD=<TEST_CMD>` to verify no regressions.
|
|
32
|
-
> 5. Append fix summary to '## Implementation Log' in context-snapshot.md.
|
|
33
|
-
> 6. Do NOT execute any git commands."
|
|
22
|
+
> {{AGENT_PROMPT_DEV_FIX}}
|
|
34
23
|
Then re-run Review (max 3 rounds).
|
|
35
24
|
|
|
36
25
|
**CP-3**: Integration tests pass, verdict is not NEEDS_FIXES.
|
|
@@ -0,0 +1,75 @@
|
|
|
1
|
+
## Test Failure Recovery Protocol
|
|
2
|
+
|
|
3
|
+
When tests fail during implementation (Phase 3 / Phase 4):
|
|
4
|
+
|
|
5
|
+
### Immediate Action — Recovery Attempt (Max 2 Rounds)
|
|
6
|
+
|
|
7
|
+
1. **Analyze failure output**:
|
|
8
|
+
- Read the test failure message carefully
|
|
9
|
+
- Identify: root cause (code bug vs. test brittleness vs. environment issue)
|
|
10
|
+
- Check if baseline already recorded this failure (in BASELINE_FAILURES)
|
|
11
|
+
|
|
12
|
+
2. **Categorize failure**:
|
|
13
|
+
- **Pre-existing baseline failure** (expected): Record as acceptable, do NOT fix
|
|
14
|
+
- **New regression**: Code introduced a bug, fix the code
|
|
15
|
+
- **Brittle test**: Test passes/fails inconsistently, fix the test or environment
|
|
16
|
+
- **Environment issue**: Missing dependency, wrong config, fix setup
|
|
17
|
+
|
|
18
|
+
3. **Fix and re-run** (first round):
|
|
19
|
+
- Apply fix (code or test, not environment)
|
|
20
|
+
- Re-run `$TEST_CMD` to verify
|
|
21
|
+
- If now passing → continue to next task
|
|
22
|
+
- If still failing → **proceed to Round 2**
|
|
23
|
+
|
|
24
|
+
4. **Second fix attempt** (second round only):
|
|
25
|
+
- Re-analyze the failure with fresh perspective
|
|
26
|
+
- Try alternate fix approach
|
|
27
|
+
- Re-run `$TEST_CMD`
|
|
28
|
+
- If still failing after Round 2 → **escalate** (see below)
|
|
29
|
+
|
|
30
|
+
### Escalation Paths
|
|
31
|
+
|
|
32
|
+
**Tier 1 (Single Agent)**:
|
|
33
|
+
- After max 2 fix rounds with tests still failing
|
|
34
|
+
- Document failure in Implementation Log with root cause analysis
|
|
35
|
+
- Attempt one manual fix by re-reading related source code
|
|
36
|
+
- If unable to resolve: record PARTIAL status with known failure list
|
|
37
|
+
- **Do NOT block commit**; tests can fail during development (recovery may be deferred to next session)
|
|
38
|
+
|
|
39
|
+
**Tier 2/3 (Dev + Reviewer)**:
|
|
40
|
+
- After Dev completes max 2 fix rounds with tests still failing
|
|
41
|
+
- Dev appends failure details to Implementation Log
|
|
42
|
+
- Reviewer agent runs full test suite in Phase 5
|
|
43
|
+
- If Reviewer confirms NEW regressions (not in baseline): mark verdict as `NEEDS_FIXES`
|
|
44
|
+
- If Reviewer confirms only baseline failures remain: proceed with `PASS_WITH_WARNINGS`
|
|
45
|
+
|
|
46
|
+
### Context-Aware Test Re-run (Performance Optimization)
|
|
47
|
+
|
|
48
|
+
**Skip redundant re-runs**:
|
|
49
|
+
- If Implementation Log section in context-snapshot.md already confirms "all tests passing"
|
|
50
|
+
- → Skip Phase 5 test suite re-run (Reviewer will verify baseline log instead)
|
|
51
|
+
- This avoids rebuilding/re-running tests when already verified
|
|
52
|
+
|
|
53
|
+
**When to re-run**:
|
|
54
|
+
- If Implementation Log is missing or incomplete
|
|
55
|
+
- If any new code was added after the last test run
|
|
56
|
+
- If Reviewer suspects brittleness or environment drift
|
|
57
|
+
|
|
58
|
+
### Failure Capture Rules
|
|
59
|
+
|
|
60
|
+
If tests remain broken after recovery:
|
|
61
|
+
|
|
62
|
+
```
|
|
63
|
+
## Test Failures Encountered
|
|
64
|
+
|
|
65
|
+
- **Test**: [test name/path]
|
|
66
|
+
- Root Cause: [explanation]
|
|
67
|
+
- Category: [pre-existing baseline | new regression | brittle test | environment]
|
|
68
|
+
- Fix Attempted: [describe what was tried]
|
|
69
|
+
- Status: [still failing | requires next session | known limitation]
|
|
70
|
+
|
|
71
|
+
- **Impact on Feature**: [can AC be verified despite failure | blocks AC verification]
|
|
72
|
+
```
|
|
73
|
+
|
|
74
|
+
**Rule**: If any AC cannot be verified due to test failure, the feature is incomplete. Document in failure-log.md for next session.
|
|
75
|
+
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
{
|
|
2
|
-
"version": "1.1.0",
|
|
2
|
+
"version": "1.1.3",
|
|
3
3
|
"skills": {
|
|
4
4
|
"prizm-kit": {
|
|
5
5
|
"description": "Full-lifecycle dev toolkit. Covers spec-driven development, Prizm context docs, code quality, debugging, deployment, and knowledge management.",
|
|
@@ -72,7 +72,7 @@
|
|
|
72
72
|
"hasScripts": false
|
|
73
73
|
},
|
|
74
74
|
"feature-workflow": {
|
|
75
|
-
"description": "One-stop entry point for feature development. Orchestrates
|
|
75
|
+
"description": "One-stop entry point for feature development. Orchestrates feature-planner → feature-pipeline-launcher → background execution. Handles multi-feature batch development from a single request.",
|
|
76
76
|
"tier": "companion",
|
|
77
77
|
"category": "orchestration-skill",
|
|
78
78
|
"subcategory": "workflows",
|
|
@@ -80,8 +80,8 @@
|
|
|
80
80
|
"hasScripts": false
|
|
81
81
|
},
|
|
82
82
|
"refactor-workflow": {
|
|
83
|
-
"description": "
|
|
84
|
-
"tier": "
|
|
83
|
+
"description": "One-stop entry point for code refactoring. Orchestrates refactor-planner → refactor-pipeline-launcher → execution.",
|
|
84
|
+
"tier": "companion",
|
|
85
85
|
"category": "orchestration-skill",
|
|
86
86
|
"subcategory": "workflows",
|
|
87
87
|
"hasAssets": false,
|
|
@@ -96,6 +96,14 @@
|
|
|
96
96
|
"hasScripts": false
|
|
97
97
|
},
|
|
98
98
|
"app-planner": {
|
|
99
|
+
"description": "Plan a new application from scratch — vision, tech stack, feature decomposition, and validated feature-list.json.",
|
|
100
|
+
"tier": "companion",
|
|
101
|
+
"category": "orchestration-skill",
|
|
102
|
+
"subcategory": "pipelines",
|
|
103
|
+
"hasAssets": true,
|
|
104
|
+
"hasScripts": true
|
|
105
|
+
},
|
|
106
|
+
"feature-planner": {
|
|
99
107
|
"description": "Interactive planning for new apps and incremental features; outputs validated feature-list.json for dev-pipeline.",
|
|
100
108
|
"tier": "companion",
|
|
101
109
|
"category": "orchestration-skill",
|
|
@@ -103,7 +111,7 @@
|
|
|
103
111
|
"hasAssets": true,
|
|
104
112
|
"hasScripts": true
|
|
105
113
|
},
|
|
106
|
-
"dev-pipeline-launcher": {
|
|
114
|
+
"feature-pipeline-launcher": {
|
|
107
115
|
"description": "Launch and manage the dev-pipeline from within an AI CLI session. Start pipeline in background, monitor logs, check status, stop pipeline.",
|
|
108
116
|
"tier": "companion",
|
|
109
117
|
"category": "orchestration-skill",
|
|
@@ -119,6 +127,22 @@
|
|
|
119
127
|
"hasAssets": false,
|
|
120
128
|
"hasScripts": false
|
|
121
129
|
},
|
|
130
|
+
"refactor-planner": {
|
|
131
|
+
"description": "Interactive refactoring planner. Analyzes code structure and produces validated refactor-list.json for dev-pipeline execution.",
|
|
132
|
+
"tier": "companion",
|
|
133
|
+
"category": "orchestration-skill",
|
|
134
|
+
"subcategory": "pipelines",
|
|
135
|
+
"hasAssets": true,
|
|
136
|
+
"hasScripts": true
|
|
137
|
+
},
|
|
138
|
+
"refactor-pipeline-launcher": {
|
|
139
|
+
"description": "Launch and manage the refactor pipeline from within an AI CLI session.",
|
|
140
|
+
"tier": "companion",
|
|
141
|
+
"category": "orchestration-skill",
|
|
142
|
+
"subcategory": "pipelines",
|
|
143
|
+
"hasAssets": false,
|
|
144
|
+
"hasScripts": false
|
|
145
|
+
},
|
|
122
146
|
"bug-fix-workflow": {
|
|
123
147
|
"description": "Interactive single-bug fix in current session. Guides triage → reproduce → fix → review → commit without background pipeline.",
|
|
124
148
|
"tier": "companion",
|
|
@@ -153,9 +177,12 @@
|
|
|
153
177
|
"feature-workflow",
|
|
154
178
|
"refactor-workflow",
|
|
155
179
|
"app-planner",
|
|
180
|
+
"feature-planner",
|
|
156
181
|
"bug-planner",
|
|
157
|
-
"dev-pipeline-launcher",
|
|
182
|
+
"feature-pipeline-launcher",
|
|
158
183
|
"bugfix-pipeline-launcher",
|
|
184
|
+
"refactor-planner",
|
|
185
|
+
"refactor-pipeline-launcher",
|
|
159
186
|
"bug-fix-workflow",
|
|
160
187
|
"recovery-workflow"
|
|
161
188
|
]
|