maestro-flow 0.5.3 → 0.5.31

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (259) hide show
  1. package/.agents/skills/learn-follow/SKILL.md +114 -114
  2. package/.agents/skills/learn-investigate/SKILL.md +138 -139
  3. package/.agents/skills/learn-second-opinion/SKILL.md +105 -109
  4. package/.agents/skills/maestro/SKILL.md +2 -10
  5. package/.agents/skills/maestro-amend/SKILL.md +152 -152
  6. package/.agents/skills/maestro-analyze/SKILL.md +201 -252
  7. package/.agents/skills/maestro-blueprint/SKILL.md +175 -190
  8. package/.agents/skills/maestro-brainstorm/SKILL.md +196 -200
  9. package/.agents/skills/maestro-collab/SKILL.md +159 -159
  10. package/.agents/skills/maestro-companion/SKILL.md +517 -517
  11. package/.agents/skills/maestro-composer/SKILL.md +173 -164
  12. package/.agents/skills/maestro-execute/SKILL.md +169 -170
  13. package/.agents/skills/maestro-fork/SKILL.md +97 -96
  14. package/.agents/skills/maestro-grill/SKILL.md +161 -162
  15. package/.agents/skills/maestro-guard/SKILL.md +93 -92
  16. package/.agents/skills/maestro-impeccable/SKILL.md +296 -253
  17. package/.agents/skills/maestro-init/SKILL.md +117 -118
  18. package/.agents/skills/maestro-merge/SKILL.md +73 -66
  19. package/.agents/skills/maestro-milestone-audit/SKILL.md +4 -10
  20. package/.agents/skills/maestro-milestone-complete/SKILL.md +6 -7
  21. package/.agents/skills/maestro-milestone-release/SKILL.md +122 -131
  22. package/.agents/skills/maestro-next/SKILL.md +241 -245
  23. package/.agents/skills/maestro-overlay/SKILL.md +176 -166
  24. package/.agents/skills/maestro-plan/SKILL.md +211 -197
  25. package/.agents/skills/maestro-player/SKILL.md +167 -167
  26. package/.agents/skills/maestro-quick/SKILL.md +69 -63
  27. package/.agents/skills/maestro-ralph/SKILL.md +2 -36
  28. package/.agents/skills/maestro-ralph-beta/SKILL.md +861 -872
  29. package/.agents/skills/maestro-ralph-execute/SKILL.md +234 -234
  30. package/.agents/skills/maestro-roadmap/SKILL.md +159 -172
  31. package/.agents/skills/maestro-swarm-workflow/SKILL.md +229 -250
  32. package/.agents/skills/maestro-tools-execute/SKILL.md +108 -103
  33. package/.agents/skills/maestro-tools-register/SKILL.md +148 -143
  34. package/.agents/skills/maestro-ui-codify/SKILL.md +103 -86
  35. package/.agents/skills/maestro-universal-workflow/SKILL.md +534 -547
  36. package/.agents/skills/maestro-update/SKILL.md +109 -106
  37. package/.agents/skills/manage-codebase-rebuild/SKILL.md +73 -71
  38. package/.agents/skills/manage-harvest/SKILL.md +83 -81
  39. package/.agents/skills/manage-issue/SKILL.md +59 -60
  40. package/.agents/skills/manage-issue-discover/SKILL.md +70 -68
  41. package/.agents/skills/manage-kg-extractors/SKILL.md +130 -0
  42. package/.agents/skills/manage-knowhow/SKILL.md +70 -66
  43. package/.agents/skills/manage-knowhow-capture/SKILL.md +79 -69
  44. package/.agents/skills/manage-knowledge-audit/SKILL.md +91 -74
  45. package/.agents/skills/manage-status/SKILL.md +52 -42
  46. package/.agents/skills/manage-wiki/SKILL.md +69 -58
  47. package/.agents/skills/odyssey-debug/SKILL.md +445 -459
  48. package/.agents/skills/odyssey-improve/SKILL.md +477 -491
  49. package/.agents/skills/odyssey-planex/SKILL.md +576 -587
  50. package/.agents/skills/odyssey-review-test-fix/SKILL.md +400 -413
  51. package/.agents/skills/odyssey-ui/SKILL.md +431 -448
  52. package/.agents/skills/quality-auto-test/SKILL.md +140 -123
  53. package/.agents/skills/quality-debug/SKILL.md +145 -106
  54. package/.agents/skills/quality-refactor/SKILL.md +91 -53
  55. package/.agents/skills/quality-retrospective/SKILL.md +109 -63
  56. package/.agents/skills/quality-review/SKILL.md +141 -114
  57. package/.agents/skills/quality-sync/SKILL.md +74 -38
  58. package/.agents/skills/quality-test/SKILL.md +133 -103
  59. package/.agents/skills/security-audit/SKILL.md +217 -166
  60. package/.agents/skills/spec-add/SKILL.md +66 -59
  61. package/.agents/skills/spec-load/SKILL.md +68 -68
  62. package/.agents/skills/spec-remove/SKILL.md +42 -42
  63. package/.agents/skills/spec-setup/SKILL.md +38 -41
  64. package/.agy/skills/learn-follow/SKILL.md +114 -114
  65. package/.agy/skills/learn-investigate/SKILL.md +138 -139
  66. package/.agy/skills/learn-second-opinion/SKILL.md +105 -109
  67. package/.agy/skills/maestro/SKILL.md +2 -10
  68. package/.agy/skills/maestro-amend/SKILL.md +152 -152
  69. package/.agy/skills/maestro-analyze/SKILL.md +201 -252
  70. package/.agy/skills/maestro-blueprint/SKILL.md +175 -190
  71. package/.agy/skills/maestro-brainstorm/SKILL.md +196 -200
  72. package/.agy/skills/maestro-collab/SKILL.md +159 -159
  73. package/.agy/skills/maestro-companion/SKILL.md +517 -517
  74. package/.agy/skills/maestro-composer/SKILL.md +173 -164
  75. package/.agy/skills/maestro-execute/SKILL.md +169 -170
  76. package/.agy/skills/maestro-fork/SKILL.md +97 -96
  77. package/.agy/skills/maestro-grill/SKILL.md +161 -162
  78. package/.agy/skills/maestro-guard/SKILL.md +93 -92
  79. package/.agy/skills/maestro-impeccable/SKILL.md +296 -253
  80. package/.agy/skills/maestro-init/SKILL.md +117 -118
  81. package/.agy/skills/maestro-merge/SKILL.md +73 -66
  82. package/.agy/skills/maestro-milestone-audit/SKILL.md +4 -10
  83. package/.agy/skills/maestro-milestone-complete/SKILL.md +6 -7
  84. package/.agy/skills/maestro-milestone-release/SKILL.md +122 -131
  85. package/.agy/skills/maestro-next/SKILL.md +241 -245
  86. package/.agy/skills/maestro-overlay/SKILL.md +176 -166
  87. package/.agy/skills/maestro-plan/SKILL.md +211 -197
  88. package/.agy/skills/maestro-player/SKILL.md +167 -167
  89. package/.agy/skills/maestro-quick/SKILL.md +69 -63
  90. package/.agy/skills/maestro-ralph/SKILL.md +2 -36
  91. package/.agy/skills/maestro-ralph-beta/SKILL.md +861 -872
  92. package/.agy/skills/maestro-ralph-execute/SKILL.md +234 -234
  93. package/.agy/skills/maestro-roadmap/SKILL.md +159 -172
  94. package/.agy/skills/maestro-swarm-workflow/SKILL.md +229 -250
  95. package/.agy/skills/maestro-tools-execute/SKILL.md +108 -103
  96. package/.agy/skills/maestro-tools-register/SKILL.md +148 -143
  97. package/.agy/skills/maestro-ui-codify/SKILL.md +103 -86
  98. package/.agy/skills/maestro-universal-workflow/SKILL.md +534 -547
  99. package/.agy/skills/maestro-update/SKILL.md +109 -106
  100. package/.agy/skills/manage-codebase-rebuild/SKILL.md +73 -71
  101. package/.agy/skills/manage-harvest/SKILL.md +83 -81
  102. package/.agy/skills/manage-issue/SKILL.md +59 -60
  103. package/.agy/skills/manage-issue-discover/SKILL.md +70 -68
  104. package/.agy/skills/manage-kg-extractors/SKILL.md +130 -0
  105. package/.agy/skills/manage-knowhow/SKILL.md +70 -66
  106. package/.agy/skills/manage-knowhow-capture/SKILL.md +79 -69
  107. package/.agy/skills/manage-knowledge-audit/SKILL.md +91 -74
  108. package/.agy/skills/manage-status/SKILL.md +52 -42
  109. package/.agy/skills/manage-wiki/SKILL.md +69 -58
  110. package/.agy/skills/odyssey-debug/SKILL.md +445 -459
  111. package/.agy/skills/odyssey-improve/SKILL.md +477 -491
  112. package/.agy/skills/odyssey-planex/SKILL.md +576 -587
  113. package/.agy/skills/odyssey-review-test-fix/SKILL.md +400 -413
  114. package/.agy/skills/odyssey-ui/SKILL.md +431 -448
  115. package/.agy/skills/quality-auto-test/SKILL.md +140 -123
  116. package/.agy/skills/quality-debug/SKILL.md +145 -106
  117. package/.agy/skills/quality-refactor/SKILL.md +91 -53
  118. package/.agy/skills/quality-retrospective/SKILL.md +109 -63
  119. package/.agy/skills/quality-review/SKILL.md +141 -114
  120. package/.agy/skills/quality-sync/SKILL.md +74 -38
  121. package/.agy/skills/quality-test/SKILL.md +133 -103
  122. package/.agy/skills/security-audit/SKILL.md +217 -166
  123. package/.agy/skills/spec-add/SKILL.md +66 -59
  124. package/.agy/skills/spec-load/SKILL.md +68 -68
  125. package/.agy/skills/spec-remove/SKILL.md +42 -42
  126. package/.agy/skills/spec-setup/SKILL.md +38 -41
  127. package/.claude/commands/learn-follow.md +127 -127
  128. package/.claude/commands/learn-investigate.md +151 -152
  129. package/.claude/commands/learn-second-opinion.md +118 -122
  130. package/.claude/commands/maestro-amend.md +164 -164
  131. package/.claude/commands/maestro-analyze.md +215 -266
  132. package/.claude/commands/maestro-blueprint.md +189 -204
  133. package/.claude/commands/maestro-brainstorm.md +209 -213
  134. package/.claude/commands/maestro-collab.md +172 -172
  135. package/.claude/commands/maestro-companion.md +531 -531
  136. package/.claude/commands/maestro-composer.md +188 -179
  137. package/.claude/commands/maestro-execute.md +183 -184
  138. package/.claude/commands/maestro-fork.md +111 -110
  139. package/.claude/commands/maestro-grill.md +175 -176
  140. package/.claude/commands/maestro-guard.md +103 -102
  141. package/.claude/commands/maestro-impeccable.md +311 -268
  142. package/.claude/commands/maestro-init.md +130 -131
  143. package/.claude/commands/maestro-merge.md +87 -80
  144. package/.claude/commands/maestro-milestone-audit.md +4 -10
  145. package/.claude/commands/maestro-milestone-complete.md +6 -7
  146. package/.claude/commands/maestro-milestone-release.md +136 -145
  147. package/.claude/commands/maestro-next.md +253 -257
  148. package/.claude/commands/maestro-overlay.md +188 -178
  149. package/.claude/commands/maestro-plan.md +225 -211
  150. package/.claude/commands/maestro-player.md +182 -182
  151. package/.claude/commands/maestro-quick.md +83 -77
  152. package/.claude/commands/maestro-ralph-beta.md +875 -886
  153. package/.claude/commands/maestro-ralph-execute.md +247 -247
  154. package/.claude/commands/maestro-ralph.md +2 -36
  155. package/.claude/commands/maestro-roadmap.md +173 -186
  156. package/.claude/commands/maestro-swarm-workflow.md +243 -264
  157. package/.claude/commands/maestro-tools-execute.md +122 -117
  158. package/.claude/commands/maestro-tools-register.md +162 -157
  159. package/.claude/commands/maestro-ui-codify.md +117 -100
  160. package/.claude/commands/maestro-universal-workflow.md +548 -561
  161. package/.claude/commands/maestro-update.md +122 -119
  162. package/.claude/commands/maestro.md +2 -10
  163. package/.claude/commands/manage-codebase-rebuild.md +87 -85
  164. package/.claude/commands/manage-harvest.md +97 -95
  165. package/.claude/commands/manage-issue-discover.md +83 -81
  166. package/.claude/commands/manage-issue.md +72 -73
  167. package/.claude/commands/manage-kg-extractors.md +128 -0
  168. package/.claude/commands/manage-knowhow-capture.md +92 -82
  169. package/.claude/commands/manage-knowhow.md +83 -79
  170. package/.claude/commands/manage-knowledge-audit.md +105 -88
  171. package/.claude/commands/manage-status.md +62 -52
  172. package/.claude/commands/manage-wiki.md +82 -71
  173. package/.claude/commands/odyssey-debug.md +459 -473
  174. package/.claude/commands/odyssey-improve.md +491 -505
  175. package/.claude/commands/odyssey-planex.md +590 -601
  176. package/.claude/commands/odyssey-review-test-fix.md +414 -427
  177. package/.claude/commands/odyssey-ui.md +445 -462
  178. package/.claude/commands/quality-auto-test.md +153 -136
  179. package/.claude/commands/quality-debug.md +159 -120
  180. package/.claude/commands/quality-refactor.md +105 -67
  181. package/.claude/commands/quality-retrospective.md +123 -77
  182. package/.claude/commands/quality-review.md +155 -128
  183. package/.claude/commands/quality-sync.md +88 -52
  184. package/.claude/commands/quality-test.md +147 -117
  185. package/.claude/commands/security-audit.md +230 -179
  186. package/.claude/commands/spec-add.md +77 -70
  187. package/.claude/commands/spec-load.md +78 -78
  188. package/.claude/commands/spec-remove.md +55 -55
  189. package/.claude/commands/spec-setup.md +49 -52
  190. package/dist/src/cli.js +1 -1
  191. package/dist/src/cli.js.map +1 -1
  192. package/dist/src/commands/kg.d.ts.map +1 -1
  193. package/dist/src/commands/kg.js +11 -5
  194. package/dist/src/commands/kg.js.map +1 -1
  195. package/dist/src/graph/kg/extraction/code/code-extractor.d.ts +2 -0
  196. package/dist/src/graph/kg/extraction/code/code-extractor.d.ts.map +1 -1
  197. package/dist/src/graph/kg/extraction/code/code-extractor.js +32 -3
  198. package/dist/src/graph/kg/extraction/code/code-extractor.js.map +1 -1
  199. package/dist/src/graph/kg/extraction/code/plugin-engine.d.ts +35 -0
  200. package/dist/src/graph/kg/extraction/code/plugin-engine.d.ts.map +1 -0
  201. package/dist/src/graph/kg/extraction/code/plugin-engine.js +573 -0
  202. package/dist/src/graph/kg/extraction/code/plugin-engine.js.map +1 -0
  203. package/dist/src/graph/kg/extraction/code/plugin-types.d.ts +95 -0
  204. package/dist/src/graph/kg/extraction/code/plugin-types.d.ts.map +1 -0
  205. package/dist/src/graph/kg/extraction/code/plugin-types.js +5 -0
  206. package/dist/src/graph/kg/extraction/code/plugin-types.js.map +1 -0
  207. package/dist/src/graph/kg/extraction/orchestrator.d.ts.map +1 -1
  208. package/dist/src/graph/kg/extraction/orchestrator.js +17 -5
  209. package/dist/src/graph/kg/extraction/orchestrator.js.map +1 -1
  210. package/dist/src/graph/kg/schema.sql +16 -11
  211. package/dist/src/graph/kg/surface/cli.d.ts.map +1 -1
  212. package/dist/src/graph/kg/surface/cli.js +153 -56
  213. package/dist/src/graph/kg/surface/cli.js.map +1 -1
  214. package/dist/src/hooks/workspace.d.ts +4 -2
  215. package/dist/src/hooks/workspace.d.ts.map +1 -1
  216. package/dist/src/hooks/workspace.js +6 -2
  217. package/dist/src/hooks/workspace.js.map +1 -1
  218. package/package.json +91 -91
  219. package/workflows/analyze.md +25 -49
  220. package/workflows/auto-test.md +699 -699
  221. package/workflows/blueprint.md +403 -431
  222. package/workflows/brainstorm.md +54 -195
  223. package/workflows/business-test.md +570 -570
  224. package/workflows/claude-instructions.md +23 -51
  225. package/workflows/codex-instructions.md +27 -77
  226. package/workflows/coding-philosophy.md +69 -69
  227. package/workflows/command-authoring.md +823 -823
  228. package/workflows/debug.md +43 -98
  229. package/workflows/delegate-usage.md +39 -241
  230. package/workflows/execute.md +4 -53
  231. package/workflows/grill.md +12 -56
  232. package/workflows/harvest.md +22 -68
  233. package/workflows/init.md +148 -148
  234. package/workflows/instruction-authoring-guide.md +97 -0
  235. package/workflows/issue-execute.md +110 -110
  236. package/workflows/issue-gaps-analyze.codex.md +260 -260
  237. package/workflows/issue-gaps-analyze.md +216 -216
  238. package/workflows/issue-plan.md +110 -110
  239. package/workflows/issue.md +338 -346
  240. package/workflows/knowhow.md +0 -32
  241. package/workflows/learn.md +277 -277
  242. package/workflows/maestro-chain-execute.md +20 -20
  243. package/workflows/refactor.md +22 -44
  244. package/workflows/retrospective.md +16 -65
  245. package/workflows/review.md +446 -486
  246. package/workflows/roadmap.md +35 -132
  247. package/workflows/skill-authoring.md +265 -265
  248. package/workflows/spec-generate.md +470 -470
  249. package/workflows/specs-remove.md +104 -104
  250. package/workflows/sync.md +11 -41
  251. package/workflows/test-gen.md +226 -226
  252. package/workflows/test.md +385 -475
  253. package/workflows/ui-design.md +391 -391
  254. package/workflows/ui-style.md +199 -199
  255. package/workflows/wiki-connect.md +151 -151
  256. package/workflows/wiki-digest.md +178 -178
  257. package/workflows/wiki-manage.md +109 -109
  258. package/workflows/cli-tools-usage.md +0 -252
  259. package/workflows/delegate-protocol.codex.md +0 -65
@@ -13,126 +13,143 @@ allowed-tools:
13
13
  ---
14
14
  <!-- Open-standard mirror generated by scripts/build-agents-standard.mjs — do not edit; re-run after editing .claude/ source. -->
15
15
 
16
- <purpose>
17
- Run unified automated testing via CSV layer pipeline. Reads project state to auto-select the optimal scenario source — PRD specs (when spec package exists), coverage gaps (when Nyquist audit found gaps), or code exploration (default). All sources converge into a CSV pipeline: discover infrastructure → plan → build scenarios.csv → write tests per layer (spawn_agents_on_csv parallel) → execute → diagnose failures (spawn_agents_on_csv parallel) → iterate → report.
18
-
19
- Key mechanisms:
20
- - **Intelligent routing**: Reads `.tests/`, `.workflow/blueprint/`, `verification.json` to auto-select source — no mode flag needed
21
- - **CSV parallel test writing**: Per-layer `spawn_agents_on_csv` — each agent writes one test file independently
22
- - **CSV parallel failure diagnosis**: Failed scenarios dispatched via `spawn_agents_on_csv` for classification + fix
23
- - **Unified iteration engine**: Nested inner loop (fix test_defects via diagnosis CSV, max 3/layer) + outer loop (adaptive strategy, max N iterations)
24
- - **Layers as waves**: L0→L1→L2→L3 sequential (fail-fast on critical), scenarios within layer parallel
25
- - **Discovery board**: `discoveries.ndjson` shared across all agents/iterations (append-only)
26
- - **Degenerate modes**: `--max-iter 1` = single-pass generation; default = full iterative cycle
27
- - **Session persistence**: CSV state + state.json survive context resets, resume from any point
28
- </purpose>
29
-
30
- <required_reading>
31
- @~/.maestro/workflows/auto-test.md
32
- </required_reading>
33
-
34
- <context>
35
- Phase or task: $ARGUMENTS (required phase number)
36
-
37
- **Flags:**
38
- - `--max-iter N` — Maximum outer iterations (default: 5). Set to 1 for single-pass generation only.
39
- - `--layer L` — Start from or restrict to specific layer (L0|L1|L2|L3)
40
- - `--dry-run` — Generate test plan only, do not execute
41
- - `--re-run` — Re-run only previously failed/blocked scenarios
42
-
43
- **Intelligent routing** (auto-detected from project state):
44
-
45
- | Priority | Condition | Route | Reference skill |
46
- |----------|-----------|-------|-----------------|
47
- | 1 | Active session exists (state.json status=running) | Resume | — |
48
- | 2 | --re-run flag + previous failures | Re-run | — |
49
- | 3 | Spec package exists (REQ-*.md) | spec | quality-business-test (separate skill) |
50
- | 4 | Nyquist gaps exist (verification.json) | gap | quality-test-gen (separate skill) |
51
- | 5 | Default | code | quality-integration-test (separate skill) |
52
-
53
- Flags, artifact context resolution, and output formats defined in workflow auto-test.md.
54
-
55
- ### Pre-load context (before test generation)
56
-
57
- 1. **Test specs + tools**: Run `maestro spec load --category test` to load test conventions (framework, patterns, naming). Apply to all generated tests.
58
- 2. **Coding specs**: Run `maestro spec load --category coding` to understand coding patterns for accurate test targeting.
59
- 3. **Role Knowledge**:
60
- - Browse: `maestro search --category test`
61
- - Load task-relevant entries: `maestro wiki load <id1> [id2...]`
62
- 4. All are optional — proceed without if unavailable.
63
- </context>
64
-
65
- <execution>
66
- Follow '~/.maestro/workflows/auto-test.md' completely.
67
-
68
- **Command-specific extensions (not in workflow):**
69
-
70
- **Review findings integration** (from related review artifacts):
71
- - Extract critical/high findings as additional test scenarios, marked `source: "review_finding"`
72
- - When review verdict is "BLOCK" and review-finding tests fail, suggest quality-debug
73
-
74
- **Debug root cause integration** (from related debug artifacts):
75
- - Generate regression test scenarios from confirmed root causes, marked `source: "debug_root_cause"`
76
-
77
- **Register artifact on completion:**
78
- ```
79
- Append to state.json.artifacts[]:
80
- {
81
- id: nextArtifactId(artifacts, "test"), // TST-001
82
- type: "test",
83
- milestone: current_milestone,
84
- phase: target_phase,
85
- scope: "phase",
86
- path: "scratch/{YYYYMMDD}-auto-test-P{N}-{slug}",
87
- status: issues == 0 ? "completed" : "failed",
88
- depends_on: exec_art.id,
89
- harvested: false,
90
- created_at: start_time,
91
- completed_at: now()
92
- }
93
- ```
94
-
95
- **Next-step routing on completion:**
96
- - Converged (>=95%) → `/quality-review {phase}`
97
- - All requirements verified (spec source) → `/maestro-milestone-audit`
98
- - Bugs discovered → `/quality-debug --from-uat {phase}`
99
- - Max iter, >80% → `/quality-test {phase}` for manual UAT
100
- - Max iter, <80% → `/quality-debug {phase}`
101
- - Coverage still low → `/quality-auto-test {phase} --layer {missing}`
102
- - Re-run all pass → `/quality-review {phase}`
103
- - Single pass, all pass → `/quality-test {phase}`
104
- </execution>
105
-
106
- <error_codes>
107
- | Code | Severity | Condition | Recovery |
108
- |------|----------|-----------|----------|
109
- | E001 | error | Phase argument required (no active sessions) | Prompt user for phase number |
110
- | E002 | error | Phase not found in artifact registry | Check state.json artifacts |
111
- | E003 | error | No test framework detected | Install test framework or configure test runner |
112
- | W001 | warning | One or more test scenarios failed | Auto-iterate or suggest fix options |
113
- | W002 | warning | Max iterations reached without convergence | Review reflection-log.md, suggest debug |
114
- | W003 | warning | Degraded spec mode (no full spec package) | Consider running maestro-roadmap --mode full |
115
- </error_codes>
116
-
117
- <success_criteria>
118
- - [ ] Phase resolved from artifact registry
119
- - [ ] Route auto-selected from project state (spec/gap/code)
120
- - [ ] Active sessions checked, resume offered if applicable
121
- - [ ] Scenarios extracted and normalized to unified format
122
- - [ ] Test infrastructure discovered (framework, patterns, conventions)
123
- - [ ] test-plan.json generated with layer distribution
124
- - [ ] User confirmed plan (or --dry-run stopped here)
125
- - [ ] Tests written following RED-GREEN methodology and existing patterns
126
- - [ ] Tests executed progressively (L0→L3) with fail-fast on critical
127
- - [ ] Iteration engine ran (inner: test_defect fix, outer: strategy adjust)
128
- - [ ] state.json, report.json, reflection-log.md written
129
- - [ ] Test confidence scored per iteration (Step 7.5) with 5-dimension factor model
130
- - [ ] Convergence check includes confidence >= 60% alongside pass_rate threshold
131
- - [ ] Pressure pass completed on highest-pass-rate layer before completion
132
- - [ ] report.json includes confidence section
133
- - [ ] index.json updated with auto_test section
134
- - [ ] If spec source: traceability matrix built, traceability.md written
135
- - [ ] If failures: issues auto-created in issues.jsonl
136
- - [ ] If gap source: validation.json gaps updated (MISSING→COVERED)
137
- - [ ] Next step routed based on convergence status
138
- </success_criteria>
16
+ <purpose>
17
+ Unified automated testing via CSV layer pipeline. Auto-selects scenario source from project state (specs / coverage gaps / code exploration), then: discover → plan → build CSV → write tests (parallel) → execute → diagnose failures (parallel) → iterate → report.
18
+
19
+ Layers L0→L3 sequential (fail-fast), scenarios within layer parallel. `--max-iter 1` = single-pass; default = full iterative cycle.
20
+ </purpose>
21
+
22
+ <required_reading>
23
+ @~/.maestro/workflows/auto-test.md
24
+ </required_reading>
25
+
26
+ <context>
27
+ Phase or task: $ARGUMENTS (required phase number)
28
+
29
+ **Flags:**
30
+ - `--max-iter N` — Maximum outer iterations (default: 5). Set to 1 for single-pass generation only.
31
+ - `--layer L` — Start from or restrict to specific layer (L0|L1|L2|L3)
32
+ - `--dry-run` — Generate test plan only, do not execute
33
+ - `--re-run` — Re-run only previously failed/blocked scenarios
34
+
35
+ **Intelligent routing** (auto-detected from project state):
36
+
37
+ | Priority | Condition | Route | Reference skill |
38
+ |----------|-----------|-------|-----------------|
39
+ | 1 | Active session exists (state.json status=running) | Resume | — |
40
+ | 2 | --re-run flag + previous failures | Re-run | — |
41
+ | 3 | Spec package exists (REQ-*.md) | spec | quality-business-test (separate skill) |
42
+ | 4 | Nyquist gaps exist (verification.json) | gap | quality-test-gen (separate skill) |
43
+ | 5 | Default | code | quality-integration-test (separate skill) |
44
+
45
+ Flags, artifact context resolution, and output formats defined in workflow auto-test.md.
46
+
47
+ ### Pre-load context (before test generation)
48
+
49
+ 1. **Test specs + tools**: Run `maestro spec load --category test` to load test conventions (framework, patterns, naming). Apply to all generated tests.
50
+ 2. **Coding specs**: Run `maestro spec load --category coding` to understand coding patterns for accurate test targeting.
51
+ 3. **Role Knowledge**:
52
+ - Browse: `maestro search --category test`
53
+ - Load task-relevant entries: `maestro wiki load <id1> [id2...]`
54
+ 4. All are optional — proceed without if unavailable.
55
+ </context>
56
+
57
+ <execution>
58
+ Follow '~/.maestro/workflows/auto-test.md' completely.
59
+
60
+ ### Phase Gates (MANDATORY, BLOCKING)
61
+
62
+ **GATE 1: Setup → Plan** (Route Selection → CSV Generation)
63
+ - REQUIRED: Phase resolved from artifact registry. E001/E002 if missing.
64
+ - REQUIRED: Route auto-selected (spec/gap/code) from project state.
65
+ - REQUIRED: Test infrastructure discovered (framework, patterns, conventions).
66
+ - BLOCKED if missing: cannot generate test plan without route and framework.
67
+
68
+ **GATE 2: Plan → Write** (CSV → Test Generation)
69
+ - REQUIRED: test-plan.json generated with layer distribution (L0→L3).
70
+ - REQUIRED: User confirmed plan (unless `--dry-run` stops here).
71
+ - BLOCKED if plan missing or rejected: do not write tests.
72
+
73
+ **GATE 3: Write → Execute** (Test Generation → Execution)
74
+ - REQUIRED: All planned test files written following existing patterns.
75
+ - REQUIRED: Tests follow RED-GREEN methodology.
76
+ - BLOCKED if tests incomplete: finish writing before execution.
77
+
78
+ **GATE 4: Execute → Report** (Iteration → Completion)
79
+ - REQUIRED: Progressive execution completed (L0→L3, fail-fast on critical).
80
+ - REQUIRED: Iteration engine ran (inner: test_defect fix, outer: strategy adjust).
81
+ - REQUIRED: Confidence scored with 5-dimension factor model (>= 60%).
82
+ - REQUIRED: Pressure pass completed on highest-pass-rate layer.
83
+ - BLOCKED if iteration incomplete: continue iterating before reporting.
84
+
85
+ **Command-specific extensions (not in workflow):**
86
+
87
+ **Review findings integration** (from related review artifacts):
88
+ - Extract critical/high findings as additional test scenarios, marked `source: "review_finding"`
89
+ - When review verdict is "BLOCK" and review-finding tests fail, suggest quality-debug
90
+
91
+ **Debug root cause integration** (from related debug artifacts):
92
+ - Generate regression test scenarios from confirmed root causes, marked `source: "debug_root_cause"`
93
+
94
+ **Register artifact on completion:**
95
+ ```
96
+ Append to state.json.artifacts[]:
97
+ {
98
+ id: nextArtifactId(artifacts, "test"), // TST-001
99
+ type: "test",
100
+ milestone: current_milestone,
101
+ phase: target_phase,
102
+ scope: "phase",
103
+ path: "scratch/{YYYYMMDD}-auto-test-P{N}-{slug}",
104
+ status: issues == 0 ? "completed" : "failed",
105
+ depends_on: exec_art.id,
106
+ harvested: false,
107
+ created_at: start_time,
108
+ completed_at: now()
109
+ }
110
+ ```
111
+
112
+ **Next-step routing on completion:**
113
+ - Converged (>=95%) → `/quality-review {phase}`
114
+ - All requirements verified (spec source) → `/maestro-milestone-audit`
115
+ - Bugs discovered → `/quality-debug --from-uat {phase}`
116
+ - Max iter, >80% → `/quality-test {phase}` for manual UAT
117
+ - Max iter, <80% → `/quality-debug {phase}`
118
+ - Coverage still low → `/quality-auto-test {phase} --layer {missing}`
119
+ - Re-run all pass → `/quality-review {phase}`
120
+ - Single pass, all pass → `/quality-test {phase}`
121
+ </execution>
122
+
123
+ <error_codes>
124
+ | Code | Severity | Condition | Recovery |
125
+ |------|----------|-----------|----------|
126
+ | E001 | error | Phase argument required (no active sessions) | Prompt user for phase number |
127
+ | E002 | error | Phase not found in artifact registry | Check state.json artifacts |
128
+ | E003 | error | No test framework detected | Install test framework or configure test runner |
129
+ | W001 | warning | One or more test scenarios failed | Auto-iterate or suggest fix options |
130
+ | W002 | warning | Max iterations reached without convergence | Review reflection-log.md, suggest debug |
131
+ | W003 | warning | Degraded spec mode (no full spec package) | Consider running maestro-roadmap --mode full |
132
+ </error_codes>
133
+
134
+ <success_criteria>
135
+ - [ ] Phase resolved from artifact registry
136
+ - [ ] Route auto-selected from project state (spec/gap/code)
137
+ - [ ] Active sessions checked, resume offered if applicable
138
+ - [ ] Scenarios extracted and normalized to unified format
139
+ - [ ] Test infrastructure discovered (framework, patterns, conventions)
140
+ - [ ] test-plan.json generated with layer distribution
141
+ - [ ] User confirmed plan (or --dry-run stopped here)
142
+ - [ ] Tests written following RED-GREEN methodology and existing patterns
143
+ - [ ] Tests executed progressively (L0→L3) with fail-fast on critical
144
+ - [ ] Iteration engine ran (inner: test_defect fix, outer: strategy adjust)
145
+ - [ ] state.json, report.json, reflection-log.md written
146
+ - [ ] Test confidence scored per iteration (Step 7.5) with 5-dimension factor model
147
+ - [ ] Convergence check includes confidence >= 60% alongside pass_rate threshold
148
+ - [ ] Pressure pass completed on highest-pass-rate layer before completion
149
+ - [ ] report.json includes confidence section
150
+ - [ ] index.json updated with auto_test section
151
+ - [ ] If spec source: traceability matrix built, traceability.md written
152
+ - [ ] If failures: issues auto-created in issues.jsonl
153
+ - [ ] If gap source: validation.json gaps updated (MISSING→COVERED)
154
+ - [ ] Next step routed based on convergence status
155
+ </success_criteria>
@@ -14,109 +14,148 @@ allowed-tools:
14
14
  ---
15
15
  <!-- Open-standard mirror generated by scripts/build-agents-standard.mjs — do not edit; re-run after editing .claude/ source. -->
16
16
 
17
- <purpose>
18
- Debug issues using scientific method with subagent isolation and persistent debug state. Three entry modes (standalone, from-UAT, parallel) and structured root cause collection with UAT feedback loop. Full algorithm defined in workflow debug.md.
19
- </purpose>
20
-
21
- <required_reading>
22
- @~/.maestro/workflows/debug.md
23
- </required_reading>
24
-
25
- <context>
26
- User's issue: $ARGUMENTS
27
-
28
- **Flags:**
29
- - `--from-uat <phase>` -- Read gaps from phase's uat.md as pre-filled symptoms
30
- - `--parallel` -- Spawn parallel debug agents (one per gap cluster)
31
-
32
- **All context via state.json.artifacts[]:**
33
-
34
- ```
35
- related = artifacts.filter(a =>
36
- a.phase === target_phase && a.milestone === current_milestone
37
- ).sort_by(completed_at asc)
38
- ```
39
-
40
- Each artifact's type determines its outputs at `.workflow/{a.path}/`:
41
- - **execute** → .summaries/, .task/ (source of code changes)
42
- - **review** → review.json (findings guide hypothesis formation)
43
- - **debug** → understanding.md, evidence.ndjson (prior investigations, avoid re-investigation)
44
- - **test** → uat.md (--from-uat gap source), .tests/
45
-
46
- Extract conclusions from related artifacts that may affect this debug session — review findings guide investigation direction, prior debug avoids redundant work.
47
-
48
- ### Pre-load (optional, proceed without)
49
- - Codebase docs: `.workflow/codebase/ARCHITECTURE.md` → module boundaries
50
- - Wiki: `maestro search "<symptom keywords>" --json` → prior investigations
51
- - Specs: `maestro spec load --category debug --keyword "<symptom>"` → known issues/workarounds
52
- - Role knowledge: `maestro search --category debug` select relevant `maestro wiki load`
53
-
54
- **Output**: `DEBUG_DIR = .workflow/scratch/{YYYYMMDD}-debug-P{N}-{slug}/` (P{N} = phase number when phase-scoped; omit for standalone). Output directory rules defined in workflow debug.md Step 4.
55
- </context>
56
-
57
- <execution>
58
- Follow '~/.maestro/workflows/debug.md' completely.
59
-
60
- **Register artifact on completion (phase-scoped only):**
61
- ```
62
- Append to state.json.artifacts[]:
63
- {
64
- id: nextArtifactId(artifacts, "debug"), // DBG-001
65
- type: "debug",
66
- milestone: current_milestone,
67
- phase: target_phase,
68
- scope: "phase",
69
- path: "scratch/{YYYYMMDD}-debug-P{N}-{slug}",
70
- status: all_diagnosed ? "completed" : "failed",
71
- depends_on: triggering_review_id || exec_art.id,
72
- harvested: false,
73
- created_at: start_time,
74
- completed_at: now()
75
- }
76
- ```
77
-
78
- ### Post-debug Knowledge Inquiry
79
-
80
- | Condition | Ask | Route |
81
- |-----------|-----|-------|
82
- | Recurring root cause pattern (seen in prior debug) | "Document in debug-notes.md?" | spec-add debug |
83
- | Non-obvious fix / workaround | "Record as learning?" | spec-add learning |
84
- | Root cause = architectural boundary violation | "Update architecture-constraints.md?" | spec-add arch |
85
-
86
- On confirm → `invoke_skill("spec-add", "<category> <content> --description \"<summary>\"")`.
87
-
88
- **Next-step routing on completion:**
89
- - Root cause found, fix needed → `/maestro-plan {phase} --gaps`
90
- - Root cause found (from UAT), auto-fix → `/quality-test {phase} --auto-fix`
91
- - Inconclusive, need more info → `/quality-debug {issue} -c` (resume session)
92
- - Standalone fix already applied → `/maestro-execute {phase}`
93
- </execution>
94
-
95
- <error_codes>
96
- | Code | Severity | Condition | Recovery |
97
- |------|----------|-----------|----------|
98
- | E001 | error | Issue description required (no arguments, no active sessions) | Check arguments format, re-run with correct input |
99
- | E002 | error | UAT file not found for --from-uat phase | Verify UAT file exists for specified phase |
100
- | W001 | warning | Existing debug session found, offer resume | Review existing sessions, choose resume or new |
101
- | W002 | warning | Checkpoint reached, user input needed | Provide requested input to continue |
102
- | W003 | warning | Some gaps inconclusive, partial diagnosis | Review partial results, retry inconclusive gaps |
103
- </error_codes>
104
-
105
- <success_criteria>
106
- - [ ] Input parsed: standalone, --from-uat, or --parallel mode determined
107
- - [ ] Active sessions checked and resume offered if applicable
108
- - [ ] Symptoms gathered (interactive) or loaded from UAT (pre-filled)
109
- - [ ] Debug output directory created (phase .debug/ or scratch/)
110
- - [ ] Debug agent(s) spawned with full symptom context
111
- - [ ] If --parallel: one agent per gap cluster, all concurrent
112
- - [ ] evidence.ndjson written with structured NDJSON entries
113
- - [ ] understanding.md tracks evolving understanding per cluster
114
- - [ ] Root causes collected with fix_direction and affected_files
115
- - [ ] Multi-factor confidence scored per gap (Step 7.0) replacing simple high/medium/low
116
- - [ ] Readiness gate checked before ROOT CAUSE declaration
117
- - [ ] Pressure pass completed on confirmed hypothesis
118
- - [ ] Confidence table appended to understanding.md
119
- - [ ] If --from-uat: uat.md gaps updated with diagnosis artifacts
120
- - [ ] Results unified into diagnosis summary with confidence section
121
- - [ ] Next step routed (plan --gaps + execute if fix needed, verify if fix applied, resume if inconclusive)
122
- </success_criteria>
17
+ <purpose>
18
+ Debug issues using scientific method with subagent isolation and persistent debug state. Three entry modes (standalone, from-UAT, parallel) and structured root cause collection with UAT feedback loop. Full algorithm defined in workflow debug.md.
19
+ </purpose>
20
+
21
+ <required_reading>
22
+ @~/.maestro/workflows/debug.md
23
+ </required_reading>
24
+
25
+ <context>
26
+ User's issue: $ARGUMENTS
27
+
28
+ **Flags:**
29
+ - `--from-uat <phase>` -- Read gaps from phase's uat.md as pre-filled symptoms
30
+ - `--parallel` -- Spawn parallel debug agents (one per gap cluster)
31
+
32
+ **All context via state.json.artifacts[]:**
33
+
34
+ ```
35
+ related = artifacts.filter(a =>
36
+ a.phase === target_phase && a.milestone === current_milestone
37
+ ).sort_by(completed_at asc)
38
+ ```
39
+
40
+ Each artifact's type determines its outputs at `.workflow/{a.path}/`:
41
+ - **execute** → .summaries/, .task/ (source of code changes)
42
+ - **review** → review.json (findings guide hypothesis formation)
43
+ - **debug** → understanding.md, evidence.ndjson (prior investigations, avoid re-investigation)
44
+ - **test** → uat.md (--from-uat gap source), .tests/
45
+
46
+ ### Pre-load (optional, proceed without)
47
+ - Codebase docs: `.workflow/codebase/ARCHITECTURE.md` → module boundaries
48
+ - Wiki: `maestro search "<symptom keywords>" --json` → prior investigations
49
+ - Specs: `maestro spec load --category debug --keyword "<symptom>"` → known issues/workarounds
50
+ - Role knowledge: `maestro search --category debug` → select relevant → `maestro wiki load`
51
+
52
+ **Output**: `DEBUG_DIR = .workflow/scratch/{YYYYMMDD}-debug-P{N}-{slug}/` (P{N} = phase number when phase-scoped; omit for standalone). Output directory rules defined in workflow debug.md Step 4.
53
+ </context>
54
+
55
+ <execution>
56
+ Follow '~/.maestro/workflows/debug.md' completely.
57
+
58
+ ### Phase Gates (MANDATORY, BLOCKING)
59
+
60
+ **GATE 1: Input → Investigation**
61
+ - REQUIRED: Symptoms gathered (interactive) or loaded from UAT (--from-uat).
62
+ - REQUIRED: Debug output directory created.
63
+ - BLOCKED if missing: cannot investigate without symptom baseline.
64
+
65
+ **GATE 2: Investigation → Diagnosis**
66
+ - REQUIRED: Debug agent(s) spawned with full symptom context.
67
+ - REQUIRED: evidence.ndjson written with structured entries.
68
+ - REQUIRED: understanding.md tracks evolving understanding.
69
+ - BLOCKED if incomplete: continue investigation before declaring root cause.
70
+
71
+ **GATE 3: Diagnosis → Completion**
72
+ - REQUIRED: Root causes collected with fix_direction and affected_files.
73
+ - REQUIRED: Multi-factor confidence scored per gap.
74
+ - REQUIRED: Readiness gate checked and pressure pass completed.
75
+ - BLOCKED if inconclusive: resume session or escalate.
76
+
77
+ **Register artifact on completion (phase-scoped only):**
78
+ ```
79
+ Append to state.json.artifacts[]:
80
+ {
81
+ id: nextArtifactId(artifacts, "debug"), // DBG-001
82
+ type: "debug",
83
+ milestone: current_milestone,
84
+ phase: target_phase,
85
+ scope: "phase",
86
+ path: "scratch/{YYYYMMDD}-debug-P{N}-{slug}",
87
+ status: all_diagnosed ? "completed" : "failed",
88
+ depends_on: triggering_review_id || exec_art.id,
89
+ harvested: false,
90
+ created_at: start_time,
91
+ completed_at: now()
92
+ }
93
+ ```
94
+
95
+ ### Post-debug Knowledge Inquiry
96
+
97
+ | Condition | Ask | Route |
98
+ |-----------|-----|-------|
99
+ | Recurring root cause pattern (seen in prior debug) | "Document in debug-notes.md?" | spec-add debug |
100
+ | Non-obvious fix / workaround | "Record as learning?" | spec-add learning |
101
+ | Root cause = architectural boundary violation | "Update architecture-constraints.md?" | spec-add arch |
102
+
103
+ On confirm → `invoke_skill("spec-add", "<category> <content> --description \"<summary>\"")`.
104
+
105
+ </execution>
106
+
107
+ <completion>
108
+ ### Standalone report
109
+
110
+ ```
111
+ --- COMPLETION STATUS ---
112
+ STATUS: DONE|DONE_WITH_CONCERNS|NEEDS_RETRY
113
+ CONCERNS: {description if applicable}
114
+ --- END STATUS ---
115
+ ```
116
+
117
+ ### Ralph-invoked completion
118
+
119
+ End the step by calling the CLI (no text block output):
120
+ ```
121
+ maestro ralph complete <idx> --status {STATUS} [--evidence {path}]
122
+ ```
123
+
124
+ ### Next-step routing
125
+
126
+ | Condition | Suggestion |
127
+ |-----------|-----------|
128
+ | Root cause found, fix needed | `/maestro-plan {phase} --gaps` |
129
+ | Root cause found (from UAT), auto-fix | `/quality-test {phase} --auto-fix` |
130
+ | Inconclusive, need more info | `/quality-debug {issue} -c` (resume) |
131
+ | Standalone fix already applied | `/maestro-execute {phase}` |
132
+ </completion>
133
+
134
+ <error_codes>
135
+ | Code | Severity | Condition | Recovery |
136
+ |------|----------|-----------|----------|
137
+ | E001 | error | Issue description required (no arguments, no active sessions) | Check arguments format, re-run with correct input |
138
+ | E002 | error | UAT file not found for --from-uat phase | Verify UAT file exists for specified phase |
139
+ | W001 | warning | Existing debug session found, offer resume | Review existing sessions, choose resume or new |
140
+ | W002 | warning | Checkpoint reached, user input needed | Provide requested input to continue |
141
+ | W003 | warning | Some gaps inconclusive, partial diagnosis | Review partial results, retry inconclusive gaps |
142
+ </error_codes>
143
+
144
+ <success_criteria>
145
+ - [ ] Input parsed: standalone, --from-uat, or --parallel mode determined
146
+ - [ ] Active sessions checked and resume offered if applicable
147
+ - [ ] Symptoms gathered (interactive) or loaded from UAT (pre-filled)
148
+ - [ ] Debug output directory created (phase .debug/ or scratch/)
149
+ - [ ] Debug agent(s) spawned with full symptom context
150
+ - [ ] If --parallel: one agent per gap cluster, all concurrent
151
+ - [ ] evidence.ndjson written with structured NDJSON entries
152
+ - [ ] understanding.md tracks evolving understanding per cluster
153
+ - [ ] Root causes collected with fix_direction and affected_files
154
+ - [ ] Multi-factor confidence scored per gap (Step 7.0) replacing simple high/medium/low
155
+ - [ ] Readiness gate checked before ROOT CAUSE declaration
156
+ - [ ] Pressure pass completed on confirmed hypothesis
157
+ - [ ] Confidence table appended to understanding.md
158
+ - [ ] If --from-uat: uat.md gaps updated with diagnosis artifacts
159
+ - [ ] Results unified into diagnosis summary with confidence section
160
+ - [ ] Next step routed (plan --gaps + execute if fix needed, verify if fix applied, resume if inconclusive)
161
+ </success_criteria>