maestro-flow 0.5.3 → 0.5.31

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (259) hide show
  1. package/.agents/skills/learn-follow/SKILL.md +114 -114
  2. package/.agents/skills/learn-investigate/SKILL.md +138 -139
  3. package/.agents/skills/learn-second-opinion/SKILL.md +105 -109
  4. package/.agents/skills/maestro/SKILL.md +2 -10
  5. package/.agents/skills/maestro-amend/SKILL.md +152 -152
  6. package/.agents/skills/maestro-analyze/SKILL.md +201 -252
  7. package/.agents/skills/maestro-blueprint/SKILL.md +175 -190
  8. package/.agents/skills/maestro-brainstorm/SKILL.md +196 -200
  9. package/.agents/skills/maestro-collab/SKILL.md +159 -159
  10. package/.agents/skills/maestro-companion/SKILL.md +517 -517
  11. package/.agents/skills/maestro-composer/SKILL.md +173 -164
  12. package/.agents/skills/maestro-execute/SKILL.md +169 -170
  13. package/.agents/skills/maestro-fork/SKILL.md +97 -96
  14. package/.agents/skills/maestro-grill/SKILL.md +161 -162
  15. package/.agents/skills/maestro-guard/SKILL.md +93 -92
  16. package/.agents/skills/maestro-impeccable/SKILL.md +296 -253
  17. package/.agents/skills/maestro-init/SKILL.md +117 -118
  18. package/.agents/skills/maestro-merge/SKILL.md +73 -66
  19. package/.agents/skills/maestro-milestone-audit/SKILL.md +4 -10
  20. package/.agents/skills/maestro-milestone-complete/SKILL.md +6 -7
  21. package/.agents/skills/maestro-milestone-release/SKILL.md +122 -131
  22. package/.agents/skills/maestro-next/SKILL.md +241 -245
  23. package/.agents/skills/maestro-overlay/SKILL.md +176 -166
  24. package/.agents/skills/maestro-plan/SKILL.md +211 -197
  25. package/.agents/skills/maestro-player/SKILL.md +167 -167
  26. package/.agents/skills/maestro-quick/SKILL.md +69 -63
  27. package/.agents/skills/maestro-ralph/SKILL.md +2 -36
  28. package/.agents/skills/maestro-ralph-beta/SKILL.md +861 -872
  29. package/.agents/skills/maestro-ralph-execute/SKILL.md +234 -234
  30. package/.agents/skills/maestro-roadmap/SKILL.md +159 -172
  31. package/.agents/skills/maestro-swarm-workflow/SKILL.md +229 -250
  32. package/.agents/skills/maestro-tools-execute/SKILL.md +108 -103
  33. package/.agents/skills/maestro-tools-register/SKILL.md +148 -143
  34. package/.agents/skills/maestro-ui-codify/SKILL.md +103 -86
  35. package/.agents/skills/maestro-universal-workflow/SKILL.md +534 -547
  36. package/.agents/skills/maestro-update/SKILL.md +109 -106
  37. package/.agents/skills/manage-codebase-rebuild/SKILL.md +73 -71
  38. package/.agents/skills/manage-harvest/SKILL.md +83 -81
  39. package/.agents/skills/manage-issue/SKILL.md +59 -60
  40. package/.agents/skills/manage-issue-discover/SKILL.md +70 -68
  41. package/.agents/skills/manage-kg-extractors/SKILL.md +130 -0
  42. package/.agents/skills/manage-knowhow/SKILL.md +70 -66
  43. package/.agents/skills/manage-knowhow-capture/SKILL.md +79 -69
  44. package/.agents/skills/manage-knowledge-audit/SKILL.md +91 -74
  45. package/.agents/skills/manage-status/SKILL.md +52 -42
  46. package/.agents/skills/manage-wiki/SKILL.md +69 -58
  47. package/.agents/skills/odyssey-debug/SKILL.md +445 -459
  48. package/.agents/skills/odyssey-improve/SKILL.md +477 -491
  49. package/.agents/skills/odyssey-planex/SKILL.md +576 -587
  50. package/.agents/skills/odyssey-review-test-fix/SKILL.md +400 -413
  51. package/.agents/skills/odyssey-ui/SKILL.md +431 -448
  52. package/.agents/skills/quality-auto-test/SKILL.md +140 -123
  53. package/.agents/skills/quality-debug/SKILL.md +145 -106
  54. package/.agents/skills/quality-refactor/SKILL.md +91 -53
  55. package/.agents/skills/quality-retrospective/SKILL.md +109 -63
  56. package/.agents/skills/quality-review/SKILL.md +141 -114
  57. package/.agents/skills/quality-sync/SKILL.md +74 -38
  58. package/.agents/skills/quality-test/SKILL.md +133 -103
  59. package/.agents/skills/security-audit/SKILL.md +217 -166
  60. package/.agents/skills/spec-add/SKILL.md +66 -59
  61. package/.agents/skills/spec-load/SKILL.md +68 -68
  62. package/.agents/skills/spec-remove/SKILL.md +42 -42
  63. package/.agents/skills/spec-setup/SKILL.md +38 -41
  64. package/.agy/skills/learn-follow/SKILL.md +114 -114
  65. package/.agy/skills/learn-investigate/SKILL.md +138 -139
  66. package/.agy/skills/learn-second-opinion/SKILL.md +105 -109
  67. package/.agy/skills/maestro/SKILL.md +2 -10
  68. package/.agy/skills/maestro-amend/SKILL.md +152 -152
  69. package/.agy/skills/maestro-analyze/SKILL.md +201 -252
  70. package/.agy/skills/maestro-blueprint/SKILL.md +175 -190
  71. package/.agy/skills/maestro-brainstorm/SKILL.md +196 -200
  72. package/.agy/skills/maestro-collab/SKILL.md +159 -159
  73. package/.agy/skills/maestro-companion/SKILL.md +517 -517
  74. package/.agy/skills/maestro-composer/SKILL.md +173 -164
  75. package/.agy/skills/maestro-execute/SKILL.md +169 -170
  76. package/.agy/skills/maestro-fork/SKILL.md +97 -96
  77. package/.agy/skills/maestro-grill/SKILL.md +161 -162
  78. package/.agy/skills/maestro-guard/SKILL.md +93 -92
  79. package/.agy/skills/maestro-impeccable/SKILL.md +296 -253
  80. package/.agy/skills/maestro-init/SKILL.md +117 -118
  81. package/.agy/skills/maestro-merge/SKILL.md +73 -66
  82. package/.agy/skills/maestro-milestone-audit/SKILL.md +4 -10
  83. package/.agy/skills/maestro-milestone-complete/SKILL.md +6 -7
  84. package/.agy/skills/maestro-milestone-release/SKILL.md +122 -131
  85. package/.agy/skills/maestro-next/SKILL.md +241 -245
  86. package/.agy/skills/maestro-overlay/SKILL.md +176 -166
  87. package/.agy/skills/maestro-plan/SKILL.md +211 -197
  88. package/.agy/skills/maestro-player/SKILL.md +167 -167
  89. package/.agy/skills/maestro-quick/SKILL.md +69 -63
  90. package/.agy/skills/maestro-ralph/SKILL.md +2 -36
  91. package/.agy/skills/maestro-ralph-beta/SKILL.md +861 -872
  92. package/.agy/skills/maestro-ralph-execute/SKILL.md +234 -234
  93. package/.agy/skills/maestro-roadmap/SKILL.md +159 -172
  94. package/.agy/skills/maestro-swarm-workflow/SKILL.md +229 -250
  95. package/.agy/skills/maestro-tools-execute/SKILL.md +108 -103
  96. package/.agy/skills/maestro-tools-register/SKILL.md +148 -143
  97. package/.agy/skills/maestro-ui-codify/SKILL.md +103 -86
  98. package/.agy/skills/maestro-universal-workflow/SKILL.md +534 -547
  99. package/.agy/skills/maestro-update/SKILL.md +109 -106
  100. package/.agy/skills/manage-codebase-rebuild/SKILL.md +73 -71
  101. package/.agy/skills/manage-harvest/SKILL.md +83 -81
  102. package/.agy/skills/manage-issue/SKILL.md +59 -60
  103. package/.agy/skills/manage-issue-discover/SKILL.md +70 -68
  104. package/.agy/skills/manage-kg-extractors/SKILL.md +130 -0
  105. package/.agy/skills/manage-knowhow/SKILL.md +70 -66
  106. package/.agy/skills/manage-knowhow-capture/SKILL.md +79 -69
  107. package/.agy/skills/manage-knowledge-audit/SKILL.md +91 -74
  108. package/.agy/skills/manage-status/SKILL.md +52 -42
  109. package/.agy/skills/manage-wiki/SKILL.md +69 -58
  110. package/.agy/skills/odyssey-debug/SKILL.md +445 -459
  111. package/.agy/skills/odyssey-improve/SKILL.md +477 -491
  112. package/.agy/skills/odyssey-planex/SKILL.md +576 -587
  113. package/.agy/skills/odyssey-review-test-fix/SKILL.md +400 -413
  114. package/.agy/skills/odyssey-ui/SKILL.md +431 -448
  115. package/.agy/skills/quality-auto-test/SKILL.md +140 -123
  116. package/.agy/skills/quality-debug/SKILL.md +145 -106
  117. package/.agy/skills/quality-refactor/SKILL.md +91 -53
  118. package/.agy/skills/quality-retrospective/SKILL.md +109 -63
  119. package/.agy/skills/quality-review/SKILL.md +141 -114
  120. package/.agy/skills/quality-sync/SKILL.md +74 -38
  121. package/.agy/skills/quality-test/SKILL.md +133 -103
  122. package/.agy/skills/security-audit/SKILL.md +217 -166
  123. package/.agy/skills/spec-add/SKILL.md +66 -59
  124. package/.agy/skills/spec-load/SKILL.md +68 -68
  125. package/.agy/skills/spec-remove/SKILL.md +42 -42
  126. package/.agy/skills/spec-setup/SKILL.md +38 -41
  127. package/.claude/commands/learn-follow.md +127 -127
  128. package/.claude/commands/learn-investigate.md +151 -152
  129. package/.claude/commands/learn-second-opinion.md +118 -122
  130. package/.claude/commands/maestro-amend.md +164 -164
  131. package/.claude/commands/maestro-analyze.md +215 -266
  132. package/.claude/commands/maestro-blueprint.md +189 -204
  133. package/.claude/commands/maestro-brainstorm.md +209 -213
  134. package/.claude/commands/maestro-collab.md +172 -172
  135. package/.claude/commands/maestro-companion.md +531 -531
  136. package/.claude/commands/maestro-composer.md +188 -179
  137. package/.claude/commands/maestro-execute.md +183 -184
  138. package/.claude/commands/maestro-fork.md +111 -110
  139. package/.claude/commands/maestro-grill.md +175 -176
  140. package/.claude/commands/maestro-guard.md +103 -102
  141. package/.claude/commands/maestro-impeccable.md +311 -268
  142. package/.claude/commands/maestro-init.md +130 -131
  143. package/.claude/commands/maestro-merge.md +87 -80
  144. package/.claude/commands/maestro-milestone-audit.md +4 -10
  145. package/.claude/commands/maestro-milestone-complete.md +6 -7
  146. package/.claude/commands/maestro-milestone-release.md +136 -145
  147. package/.claude/commands/maestro-next.md +253 -257
  148. package/.claude/commands/maestro-overlay.md +188 -178
  149. package/.claude/commands/maestro-plan.md +225 -211
  150. package/.claude/commands/maestro-player.md +182 -182
  151. package/.claude/commands/maestro-quick.md +83 -77
  152. package/.claude/commands/maestro-ralph-beta.md +875 -886
  153. package/.claude/commands/maestro-ralph-execute.md +247 -247
  154. package/.claude/commands/maestro-ralph.md +2 -36
  155. package/.claude/commands/maestro-roadmap.md +173 -186
  156. package/.claude/commands/maestro-swarm-workflow.md +243 -264
  157. package/.claude/commands/maestro-tools-execute.md +122 -117
  158. package/.claude/commands/maestro-tools-register.md +162 -157
  159. package/.claude/commands/maestro-ui-codify.md +117 -100
  160. package/.claude/commands/maestro-universal-workflow.md +548 -561
  161. package/.claude/commands/maestro-update.md +122 -119
  162. package/.claude/commands/maestro.md +2 -10
  163. package/.claude/commands/manage-codebase-rebuild.md +87 -85
  164. package/.claude/commands/manage-harvest.md +97 -95
  165. package/.claude/commands/manage-issue-discover.md +83 -81
  166. package/.claude/commands/manage-issue.md +72 -73
  167. package/.claude/commands/manage-kg-extractors.md +128 -0
  168. package/.claude/commands/manage-knowhow-capture.md +92 -82
  169. package/.claude/commands/manage-knowhow.md +83 -79
  170. package/.claude/commands/manage-knowledge-audit.md +105 -88
  171. package/.claude/commands/manage-status.md +62 -52
  172. package/.claude/commands/manage-wiki.md +82 -71
  173. package/.claude/commands/odyssey-debug.md +459 -473
  174. package/.claude/commands/odyssey-improve.md +491 -505
  175. package/.claude/commands/odyssey-planex.md +590 -601
  176. package/.claude/commands/odyssey-review-test-fix.md +414 -427
  177. package/.claude/commands/odyssey-ui.md +445 -462
  178. package/.claude/commands/quality-auto-test.md +153 -136
  179. package/.claude/commands/quality-debug.md +159 -120
  180. package/.claude/commands/quality-refactor.md +105 -67
  181. package/.claude/commands/quality-retrospective.md +123 -77
  182. package/.claude/commands/quality-review.md +155 -128
  183. package/.claude/commands/quality-sync.md +88 -52
  184. package/.claude/commands/quality-test.md +147 -117
  185. package/.claude/commands/security-audit.md +230 -179
  186. package/.claude/commands/spec-add.md +77 -70
  187. package/.claude/commands/spec-load.md +78 -78
  188. package/.claude/commands/spec-remove.md +55 -55
  189. package/.claude/commands/spec-setup.md +49 -52
  190. package/dist/src/cli.js +1 -1
  191. package/dist/src/cli.js.map +1 -1
  192. package/dist/src/commands/kg.d.ts.map +1 -1
  193. package/dist/src/commands/kg.js +11 -5
  194. package/dist/src/commands/kg.js.map +1 -1
  195. package/dist/src/graph/kg/extraction/code/code-extractor.d.ts +2 -0
  196. package/dist/src/graph/kg/extraction/code/code-extractor.d.ts.map +1 -1
  197. package/dist/src/graph/kg/extraction/code/code-extractor.js +32 -3
  198. package/dist/src/graph/kg/extraction/code/code-extractor.js.map +1 -1
  199. package/dist/src/graph/kg/extraction/code/plugin-engine.d.ts +35 -0
  200. package/dist/src/graph/kg/extraction/code/plugin-engine.d.ts.map +1 -0
  201. package/dist/src/graph/kg/extraction/code/plugin-engine.js +573 -0
  202. package/dist/src/graph/kg/extraction/code/plugin-engine.js.map +1 -0
  203. package/dist/src/graph/kg/extraction/code/plugin-types.d.ts +95 -0
  204. package/dist/src/graph/kg/extraction/code/plugin-types.d.ts.map +1 -0
  205. package/dist/src/graph/kg/extraction/code/plugin-types.js +5 -0
  206. package/dist/src/graph/kg/extraction/code/plugin-types.js.map +1 -0
  207. package/dist/src/graph/kg/extraction/orchestrator.d.ts.map +1 -1
  208. package/dist/src/graph/kg/extraction/orchestrator.js +17 -5
  209. package/dist/src/graph/kg/extraction/orchestrator.js.map +1 -1
  210. package/dist/src/graph/kg/schema.sql +16 -11
  211. package/dist/src/graph/kg/surface/cli.d.ts.map +1 -1
  212. package/dist/src/graph/kg/surface/cli.js +153 -56
  213. package/dist/src/graph/kg/surface/cli.js.map +1 -1
  214. package/dist/src/hooks/workspace.d.ts +4 -2
  215. package/dist/src/hooks/workspace.d.ts.map +1 -1
  216. package/dist/src/hooks/workspace.js +6 -2
  217. package/dist/src/hooks/workspace.js.map +1 -1
  218. package/package.json +91 -91
  219. package/workflows/analyze.md +25 -49
  220. package/workflows/auto-test.md +699 -699
  221. package/workflows/blueprint.md +403 -431
  222. package/workflows/brainstorm.md +54 -195
  223. package/workflows/business-test.md +570 -570
  224. package/workflows/claude-instructions.md +23 -51
  225. package/workflows/codex-instructions.md +27 -77
  226. package/workflows/coding-philosophy.md +69 -69
  227. package/workflows/command-authoring.md +823 -823
  228. package/workflows/debug.md +43 -98
  229. package/workflows/delegate-usage.md +39 -241
  230. package/workflows/execute.md +4 -53
  231. package/workflows/grill.md +12 -56
  232. package/workflows/harvest.md +22 -68
  233. package/workflows/init.md +148 -148
  234. package/workflows/instruction-authoring-guide.md +97 -0
  235. package/workflows/issue-execute.md +110 -110
  236. package/workflows/issue-gaps-analyze.codex.md +260 -260
  237. package/workflows/issue-gaps-analyze.md +216 -216
  238. package/workflows/issue-plan.md +110 -110
  239. package/workflows/issue.md +338 -346
  240. package/workflows/knowhow.md +0 -32
  241. package/workflows/learn.md +277 -277
  242. package/workflows/maestro-chain-execute.md +20 -20
  243. package/workflows/refactor.md +22 -44
  244. package/workflows/retrospective.md +16 -65
  245. package/workflows/review.md +446 -486
  246. package/workflows/roadmap.md +35 -132
  247. package/workflows/skill-authoring.md +265 -265
  248. package/workflows/spec-generate.md +470 -470
  249. package/workflows/specs-remove.md +104 -104
  250. package/workflows/sync.md +11 -41
  251. package/workflows/test-gen.md +226 -226
  252. package/workflows/test.md +385 -475
  253. package/workflows/ui-design.md +391 -391
  254. package/workflows/ui-style.md +199 -199
  255. package/workflows/wiki-connect.md +151 -151
  256. package/workflows/wiki-digest.md +178 -178
  257. package/workflows/wiki-manage.md +109 -109
  258. package/workflows/cli-tools-usage.md +0 -252
  259. package/workflows/delegate-protocol.codex.md +0 -65
@@ -1,136 +1,153 @@
1
- ---
2
- name: quality-auto-test
3
- description: Use when test coverage needs automated expansion or existing tests need iterative convergence
4
- argument-hint: "<phase> [-y] [-c N] [--max-iter N] [--layer L0|L1|L2|L3] [--dry-run] [--re-run]"
5
- allowed-tools:
6
- - Read
7
- - Write
8
- - Edit
9
- - Bash
10
- - Glob
11
- - Grep
12
- - AskUserQuestion
13
- ---
14
- <purpose>
15
- Run unified automated testing via CSV layer pipeline. Reads project state to auto-select the optimal scenario source — PRD specs (when spec package exists), coverage gaps (when Nyquist audit found gaps), or code exploration (default). All sources converge into a CSV pipeline: discover infrastructure → plan → build scenarios.csv → write tests per layer (spawn_agents_on_csv parallel) → execute → diagnose failures (spawn_agents_on_csv parallel) → iterate → report.
16
-
17
- Key mechanisms:
18
- - **Intelligent routing**: Reads `.tests/`, `.workflow/blueprint/`, `verification.json` to auto-select source — no mode flag needed
19
- - **CSV parallel test writing**: Per-layer `spawn_agents_on_csv` — each agent writes one test file independently
20
- - **CSV parallel failure diagnosis**: Failed scenarios dispatched via `spawn_agents_on_csv` for classification + fix
21
- - **Unified iteration engine**: Nested inner loop (fix test_defects via diagnosis CSV, max 3/layer) + outer loop (adaptive strategy, max N iterations)
22
- - **Layers as waves**: L0→L1→L2→L3 sequential (fail-fast on critical), scenarios within layer parallel
23
- - **Discovery board**: `discoveries.ndjson` shared across all agents/iterations (append-only)
24
- - **Degenerate modes**: `--max-iter 1` = single-pass generation; default = full iterative cycle
25
- - **Session persistence**: CSV state + state.json survive context resets, resume from any point
26
- </purpose>
27
-
28
- <required_reading>
29
- @~/.maestro/workflows/auto-test.md
30
- </required_reading>
31
-
32
- <context>
33
- Phase or task: $ARGUMENTS (required phase number)
34
-
35
- **Flags:**
36
- - `--max-iter N` — Maximum outer iterations (default: 5). Set to 1 for single-pass generation only.
37
- - `--layer L` — Start from or restrict to specific layer (L0|L1|L2|L3)
38
- - `--dry-run` — Generate test plan only, do not execute
39
- - `--re-run` — Re-run only previously failed/blocked scenarios
40
-
41
- **Intelligent routing** (auto-detected from project state):
42
-
43
- | Priority | Condition | Route | Reference skill |
44
- |----------|-----------|-------|-----------------|
45
- | 1 | Active session exists (state.json status=running) | Resume | — |
46
- | 2 | --re-run flag + previous failures | Re-run | — |
47
- | 3 | Spec package exists (REQ-*.md) | spec | quality-business-test (separate skill) |
48
- | 4 | Nyquist gaps exist (verification.json) | gap | quality-test-gen (separate skill) |
49
- | 5 | Default | code | quality-integration-test (separate skill) |
50
-
51
- Flags, artifact context resolution, and output formats defined in workflow auto-test.md.
52
-
53
- ### Pre-load context (before test generation)
54
-
55
- 1. **Test specs + tools**: Run `maestro spec load --category test` to load test conventions (framework, patterns, naming). Apply to all generated tests.
56
- 2. **Coding specs**: Run `maestro spec load --category coding` to understand coding patterns for accurate test targeting.
57
- 3. **Role Knowledge**:
58
- - Browse: `maestro search --category test`
59
- - Load task-relevant entries: `maestro wiki load <id1> [id2...]`
60
- 4. All are optional — proceed without if unavailable.
61
- </context>
62
-
63
- <execution>
64
- Follow '~/.maestro/workflows/auto-test.md' completely.
65
-
66
- **Command-specific extensions (not in workflow):**
67
-
68
- **Review findings integration** (from related review artifacts):
69
- - Extract critical/high findings as additional test scenarios, marked `source: "review_finding"`
70
- - When review verdict is "BLOCK" and review-finding tests fail, suggest quality-debug
71
-
72
- **Debug root cause integration** (from related debug artifacts):
73
- - Generate regression test scenarios from confirmed root causes, marked `source: "debug_root_cause"`
74
-
75
- **Register artifact on completion:**
76
- ```
77
- Append to state.json.artifacts[]:
78
- {
79
- id: nextArtifactId(artifacts, "test"), // TST-001
80
- type: "test",
81
- milestone: current_milestone,
82
- phase: target_phase,
83
- scope: "phase",
84
- path: "scratch/{YYYYMMDD}-auto-test-P{N}-{slug}",
85
- status: issues == 0 ? "completed" : "failed",
86
- depends_on: exec_art.id,
87
- harvested: false,
88
- created_at: start_time,
89
- completed_at: now()
90
- }
91
- ```
92
-
93
- **Next-step routing on completion:**
94
- - Converged (>=95%) → `/quality-review {phase}`
95
- - All requirements verified (spec source) → `/maestro-milestone-audit`
96
- - Bugs discovered → `/quality-debug --from-uat {phase}`
97
- - Max iter, >80% → `/quality-test {phase}` for manual UAT
98
- - Max iter, <80% → `/quality-debug {phase}`
99
- - Coverage still low → `/quality-auto-test {phase} --layer {missing}`
100
- - Re-run all pass → `/quality-review {phase}`
101
- - Single pass, all pass → `/quality-test {phase}`
102
- </execution>
103
-
104
- <error_codes>
105
- | Code | Severity | Condition | Recovery |
106
- |------|----------|-----------|----------|
107
- | E001 | error | Phase argument required (no active sessions) | Prompt user for phase number |
108
- | E002 | error | Phase not found in artifact registry | Check state.json artifacts |
109
- | E003 | error | No test framework detected | Install test framework or configure test runner |
110
- | W001 | warning | One or more test scenarios failed | Auto-iterate or suggest fix options |
111
- | W002 | warning | Max iterations reached without convergence | Review reflection-log.md, suggest debug |
112
- | W003 | warning | Degraded spec mode (no full spec package) | Consider running maestro-roadmap --mode full |
113
- </error_codes>
114
-
115
- <success_criteria>
116
- - [ ] Phase resolved from artifact registry
117
- - [ ] Route auto-selected from project state (spec/gap/code)
118
- - [ ] Active sessions checked, resume offered if applicable
119
- - [ ] Scenarios extracted and normalized to unified format
120
- - [ ] Test infrastructure discovered (framework, patterns, conventions)
121
- - [ ] test-plan.json generated with layer distribution
122
- - [ ] User confirmed plan (or --dry-run stopped here)
123
- - [ ] Tests written following RED-GREEN methodology and existing patterns
124
- - [ ] Tests executed progressively (L0→L3) with fail-fast on critical
125
- - [ ] Iteration engine ran (inner: test_defect fix, outer: strategy adjust)
126
- - [ ] state.json, report.json, reflection-log.md written
127
- - [ ] Test confidence scored per iteration (Step 7.5) with 5-dimension factor model
128
- - [ ] Convergence check includes confidence >= 60% alongside pass_rate threshold
129
- - [ ] Pressure pass completed on highest-pass-rate layer before completion
130
- - [ ] report.json includes confidence section
131
- - [ ] index.json updated with auto_test section
132
- - [ ] If spec source: traceability matrix built, traceability.md written
133
- - [ ] If failures: issues auto-created in issues.jsonl
134
- - [ ] If gap source: validation.json gaps updated (MISSING→COVERED)
135
- - [ ] Next step routed based on convergence status
136
- </success_criteria>
1
+ ---
2
+ name: quality-auto-test
3
+ description: Use when test coverage needs automated expansion or existing tests need iterative convergence
4
+ argument-hint: "<phase> [-y] [-c N] [--max-iter N] [--layer L0|L1|L2|L3] [--dry-run] [--re-run]"
5
+ allowed-tools:
6
+ - Read
7
+ - Write
8
+ - Edit
9
+ - Bash
10
+ - Glob
11
+ - Grep
12
+ - AskUserQuestion
13
+ ---
14
+ <purpose>
15
+ Unified automated testing via CSV layer pipeline. Auto-selects scenario source from project state (specs / coverage gaps / code exploration), then: discover → plan → build CSV → write tests (parallel) → execute → diagnose failures (parallel) → iterate → report.
16
+
17
+ Layers L0→L3 sequential (fail-fast), scenarios within layer parallel. `--max-iter 1` = single-pass; default = full iterative cycle.
18
+ </purpose>
19
+
20
+ <required_reading>
21
+ @~/.maestro/workflows/auto-test.md
22
+ </required_reading>
23
+
24
+ <context>
25
+ Phase or task: $ARGUMENTS (required phase number)
26
+
27
+ **Flags:**
28
+ - `--max-iter N` — Maximum outer iterations (default: 5). Set to 1 for single-pass generation only.
29
+ - `--layer L` — Start from or restrict to specific layer (L0|L1|L2|L3)
30
+ - `--dry-run` — Generate test plan only, do not execute
31
+ - `--re-run` — Re-run only previously failed/blocked scenarios
32
+
33
+ **Intelligent routing** (auto-detected from project state):
34
+
35
+ | Priority | Condition | Route | Reference skill |
36
+ |----------|-----------|-------|-----------------|
37
+ | 1 | Active session exists (state.json status=running) | Resume | — |
38
+ | 2 | --re-run flag + previous failures | Re-run | — |
39
+ | 3 | Spec package exists (REQ-*.md) | spec | quality-business-test (separate skill) |
40
+ | 4 | Nyquist gaps exist (verification.json) | gap | quality-test-gen (separate skill) |
41
+ | 5 | Default | code | quality-integration-test (separate skill) |
42
+
43
+ Flags, artifact context resolution, and output formats defined in workflow auto-test.md.
44
+
45
+ ### Pre-load context (before test generation)
46
+
47
+ 1. **Test specs + tools**: Run `maestro spec load --category test` to load test conventions (framework, patterns, naming). Apply to all generated tests.
48
+ 2. **Coding specs**: Run `maestro spec load --category coding` to understand coding patterns for accurate test targeting.
49
+ 3. **Role Knowledge**:
50
+ - Browse: `maestro search --category test`
51
+ - Load task-relevant entries: `maestro wiki load <id1> [id2...]`
52
+ 4. All are optional — proceed without if unavailable.
53
+ </context>
54
+
55
+ <execution>
56
+ Follow '~/.maestro/workflows/auto-test.md' completely.
57
+
58
+ ### Phase Gates (MANDATORY, BLOCKING)
59
+
60
+ **GATE 1: Setup → Plan** (Route Selection → CSV Generation)
61
+ - REQUIRED: Phase resolved from artifact registry. E001/E002 if missing.
62
+ - REQUIRED: Route auto-selected (spec/gap/code) from project state.
63
+ - REQUIRED: Test infrastructure discovered (framework, patterns, conventions).
64
+ - BLOCKED if missing: cannot generate test plan without route and framework.
65
+
66
+ **GATE 2: Plan → Write** (CSV → Test Generation)
67
+ - REQUIRED: test-plan.json generated with layer distribution (L0→L3).
68
+ - REQUIRED: User confirmed plan (unless `--dry-run` stops here).
69
+ - BLOCKED if plan missing or rejected: do not write tests.
70
+
71
+ **GATE 3: Write → Execute** (Test Generation → Execution)
72
+ - REQUIRED: All planned test files written following existing patterns.
73
+ - REQUIRED: Tests follow RED-GREEN methodology.
74
+ - BLOCKED if tests incomplete: finish writing before execution.
75
+
76
+ **GATE 4: Execute → Report** (Iteration → Completion)
77
+ - REQUIRED: Progressive execution completed (L0→L3, fail-fast on critical).
78
+ - REQUIRED: Iteration engine ran (inner: test_defect fix, outer: strategy adjust).
79
+ - REQUIRED: Confidence scored with 5-dimension factor model (>= 60%).
80
+ - REQUIRED: Pressure pass completed on highest-pass-rate layer.
81
+ - BLOCKED if iteration incomplete: continue iterating before reporting.
82
+
83
+ **Command-specific extensions (not in workflow):**
84
+
85
+ **Review findings integration** (from related review artifacts):
86
+ - Extract critical/high findings as additional test scenarios, marked `source: "review_finding"`
87
+ - When review verdict is "BLOCK" and review-finding tests fail, suggest quality-debug
88
+
89
+ **Debug root cause integration** (from related debug artifacts):
90
+ - Generate regression test scenarios from confirmed root causes, marked `source: "debug_root_cause"`
91
+
92
+ **Register artifact on completion:**
93
+ ```
94
+ Append to state.json.artifacts[]:
95
+ {
96
+ id: nextArtifactId(artifacts, "test"), // TST-001
97
+ type: "test",
98
+ milestone: current_milestone,
99
+ phase: target_phase,
100
+ scope: "phase",
101
+ path: "scratch/{YYYYMMDD}-auto-test-P{N}-{slug}",
102
+ status: issues == 0 ? "completed" : "failed",
103
+ depends_on: exec_art.id,
104
+ harvested: false,
105
+ created_at: start_time,
106
+ completed_at: now()
107
+ }
108
+ ```
109
+
110
+ **Next-step routing on completion:**
111
+ - Converged (>=95%) → `/quality-review {phase}`
112
+ - All requirements verified (spec source) → `/maestro-milestone-audit`
113
+ - Bugs discovered → `/quality-debug --from-uat {phase}`
114
+ - Max iter, >80% → `/quality-test {phase}` for manual UAT
115
+ - Max iter, <80% → `/quality-debug {phase}`
116
+ - Coverage still low → `/quality-auto-test {phase} --layer {missing}`
117
+ - Re-run all pass → `/quality-review {phase}`
118
+ - Single pass, all pass → `/quality-test {phase}`
119
+ </execution>
120
+
121
+ <error_codes>
122
+ | Code | Severity | Condition | Recovery |
123
+ |------|----------|-----------|----------|
124
+ | E001 | error | Phase argument required (no active sessions) | Prompt user for phase number |
125
+ | E002 | error | Phase not found in artifact registry | Check state.json artifacts |
126
+ | E003 | error | No test framework detected | Install test framework or configure test runner |
127
+ | W001 | warning | One or more test scenarios failed | Auto-iterate or suggest fix options |
128
+ | W002 | warning | Max iterations reached without convergence | Review reflection-log.md, suggest debug |
129
+ | W003 | warning | Degraded spec mode (no full spec package) | Consider running maestro-roadmap --mode full |
130
+ </error_codes>
131
+
132
+ <success_criteria>
133
+ - [ ] Phase resolved from artifact registry
134
+ - [ ] Route auto-selected from project state (spec/gap/code)
135
+ - [ ] Active sessions checked, resume offered if applicable
136
+ - [ ] Scenarios extracted and normalized to unified format
137
+ - [ ] Test infrastructure discovered (framework, patterns, conventions)
138
+ - [ ] test-plan.json generated with layer distribution
139
+ - [ ] User confirmed plan (or --dry-run stopped here)
140
+ - [ ] Tests written following RED-GREEN methodology and existing patterns
141
+ - [ ] Tests executed progressively (L0→L3) with fail-fast on critical
142
+ - [ ] Iteration engine ran (inner: test_defect fix, outer: strategy adjust)
143
+ - [ ] state.json, report.json, reflection-log.md written
144
+ - [ ] Test confidence scored per iteration (Step 7.5) with 5-dimension factor model
145
+ - [ ] Convergence check includes confidence >= 60% alongside pass_rate threshold
146
+ - [ ] Pressure pass completed on highest-pass-rate layer before completion
147
+ - [ ] report.json includes confidence section
148
+ - [ ] index.json updated with auto_test section
149
+ - [ ] If spec source: traceability matrix built, traceability.md written
150
+ - [ ] If failures: issues auto-created in issues.jsonl
151
+ - [ ] If gap source: validation.json gaps updated (MISSING→COVERED)
152
+ - [ ] Next step routed based on convergence status
153
+ </success_criteria>
@@ -1,120 +1,159 @@
1
- ---
2
- name: quality-debug
3
- description: Use when bugs, test failures, or unexpected behavior need systematic root cause investigation
4
- argument-hint: "[issue description] [--from-uat <phase>] [--parallel]"
5
- allowed-tools:
6
- - Read
7
- - Write
8
- - Edit
9
- - Bash
10
- - Glob
11
- - Grep
12
- - Agent
13
- - AskUserQuestion
14
- ---
15
- <purpose>
16
- Debug issues using scientific method with subagent isolation and persistent debug state. Three entry modes (standalone, from-UAT, parallel) and structured root cause collection with UAT feedback loop. Full algorithm defined in workflow debug.md.
17
- </purpose>
18
-
19
- <required_reading>
20
- @~/.maestro/workflows/debug.md
21
- </required_reading>
22
-
23
- <context>
24
- User's issue: $ARGUMENTS
25
-
26
- **Flags:**
27
- - `--from-uat <phase>` -- Read gaps from phase's uat.md as pre-filled symptoms
28
- - `--parallel` -- Spawn parallel debug agents (one per gap cluster)
29
-
30
- **All context via state.json.artifacts[]:**
31
-
32
- ```
33
- related = artifacts.filter(a =>
34
- a.phase === target_phase && a.milestone === current_milestone
35
- ).sort_by(completed_at asc)
36
- ```
37
-
38
- Each artifact's type determines its outputs at `.workflow/{a.path}/`:
39
- - **execute** → .summaries/, .task/ (source of code changes)
40
- - **review** → review.json (findings guide hypothesis formation)
41
- - **debug** → understanding.md, evidence.ndjson (prior investigations, avoid re-investigation)
42
- - **test** → uat.md (--from-uat gap source), .tests/
43
-
44
- Extract conclusions from related artifacts that may affect this debug session — review findings guide investigation direction, prior debug avoids redundant work.
45
-
46
- ### Pre-load (optional, proceed without)
47
- - Codebase docs: `.workflow/codebase/ARCHITECTURE.md` → module boundaries
48
- - Wiki: `maestro search "<symptom keywords>" --json` → prior investigations
49
- - Specs: `maestro spec load --category debug --keyword "<symptom>"` → known issues/workarounds
50
- - Role knowledge: `maestro search --category debug` select relevant `maestro wiki load`
51
-
52
- **Output**: `DEBUG_DIR = .workflow/scratch/{YYYYMMDD}-debug-P{N}-{slug}/` (P{N} = phase number when phase-scoped; omit for standalone). Output directory rules defined in workflow debug.md Step 4.
53
- </context>
54
-
55
- <execution>
56
- Follow '~/.maestro/workflows/debug.md' completely.
57
-
58
- **Register artifact on completion (phase-scoped only):**
59
- ```
60
- Append to state.json.artifacts[]:
61
- {
62
- id: nextArtifactId(artifacts, "debug"), // DBG-001
63
- type: "debug",
64
- milestone: current_milestone,
65
- phase: target_phase,
66
- scope: "phase",
67
- path: "scratch/{YYYYMMDD}-debug-P{N}-{slug}",
68
- status: all_diagnosed ? "completed" : "failed",
69
- depends_on: triggering_review_id || exec_art.id,
70
- harvested: false,
71
- created_at: start_time,
72
- completed_at: now()
73
- }
74
- ```
75
-
76
- ### Post-debug Knowledge Inquiry
77
-
78
- | Condition | Ask | Route |
79
- |-----------|-----|-------|
80
- | Recurring root cause pattern (seen in prior debug) | "Document in debug-notes.md?" | spec-add debug |
81
- | Non-obvious fix / workaround | "Record as learning?" | spec-add learning |
82
- | Root cause = architectural boundary violation | "Update architecture-constraints.md?" | spec-add arch |
83
-
84
- On confirm → `Skill("spec-add", "<category> <content> --description \"<summary>\"")`.
85
-
86
- **Next-step routing on completion:**
87
- - Root cause found, fix needed → `/maestro-plan {phase} --gaps`
88
- - Root cause found (from UAT), auto-fix → `/quality-test {phase} --auto-fix`
89
- - Inconclusive, need more info → `/quality-debug {issue} -c` (resume session)
90
- - Standalone fix already applied → `/maestro-execute {phase}`
91
- </execution>
92
-
93
- <error_codes>
94
- | Code | Severity | Condition | Recovery |
95
- |------|----------|-----------|----------|
96
- | E001 | error | Issue description required (no arguments, no active sessions) | Check arguments format, re-run with correct input |
97
- | E002 | error | UAT file not found for --from-uat phase | Verify UAT file exists for specified phase |
98
- | W001 | warning | Existing debug session found, offer resume | Review existing sessions, choose resume or new |
99
- | W002 | warning | Checkpoint reached, user input needed | Provide requested input to continue |
100
- | W003 | warning | Some gaps inconclusive, partial diagnosis | Review partial results, retry inconclusive gaps |
101
- </error_codes>
102
-
103
- <success_criteria>
104
- - [ ] Input parsed: standalone, --from-uat, or --parallel mode determined
105
- - [ ] Active sessions checked and resume offered if applicable
106
- - [ ] Symptoms gathered (interactive) or loaded from UAT (pre-filled)
107
- - [ ] Debug output directory created (phase .debug/ or scratch/)
108
- - [ ] Debug agent(s) spawned with full symptom context
109
- - [ ] If --parallel: one agent per gap cluster, all concurrent
110
- - [ ] evidence.ndjson written with structured NDJSON entries
111
- - [ ] understanding.md tracks evolving understanding per cluster
112
- - [ ] Root causes collected with fix_direction and affected_files
113
- - [ ] Multi-factor confidence scored per gap (Step 7.0) replacing simple high/medium/low
114
- - [ ] Readiness gate checked before ROOT CAUSE declaration
115
- - [ ] Pressure pass completed on confirmed hypothesis
116
- - [ ] Confidence table appended to understanding.md
117
- - [ ] If --from-uat: uat.md gaps updated with diagnosis artifacts
118
- - [ ] Results unified into diagnosis summary with confidence section
119
- - [ ] Next step routed (plan --gaps + execute if fix needed, verify if fix applied, resume if inconclusive)
120
- </success_criteria>
1
+ ---
2
+ name: quality-debug
3
+ description: Use when bugs, test failures, or unexpected behavior need systematic root cause investigation
4
+ argument-hint: "[issue description] [--from-uat <phase>] [--parallel]"
5
+ allowed-tools:
6
+ - Read
7
+ - Write
8
+ - Edit
9
+ - Bash
10
+ - Glob
11
+ - Grep
12
+ - Agent
13
+ - AskUserQuestion
14
+ ---
15
+ <purpose>
16
+ Debug issues using scientific method with subagent isolation and persistent debug state. Three entry modes (standalone, from-UAT, parallel) and structured root cause collection with UAT feedback loop. Full algorithm defined in workflow debug.md.
17
+ </purpose>
18
+
19
+ <required_reading>
20
+ @~/.maestro/workflows/debug.md
21
+ </required_reading>
22
+
23
+ <context>
24
+ User's issue: $ARGUMENTS
25
+
26
+ **Flags:**
27
+ - `--from-uat <phase>` -- Read gaps from phase's uat.md as pre-filled symptoms
28
+ - `--parallel` -- Spawn parallel debug agents (one per gap cluster)
29
+
30
+ **All context via state.json.artifacts[]:**
31
+
32
+ ```
33
+ related = artifacts.filter(a =>
34
+ a.phase === target_phase && a.milestone === current_milestone
35
+ ).sort_by(completed_at asc)
36
+ ```
37
+
38
+ Each artifact's type determines its outputs at `.workflow/{a.path}/`:
39
+ - **execute** → .summaries/, .task/ (source of code changes)
40
+ - **review** → review.json (findings guide hypothesis formation)
41
+ - **debug** → understanding.md, evidence.ndjson (prior investigations, avoid re-investigation)
42
+ - **test** → uat.md (--from-uat gap source), .tests/
43
+
44
+ ### Pre-load (optional, proceed without)
45
+ - Codebase docs: `.workflow/codebase/ARCHITECTURE.md` → module boundaries
46
+ - Wiki: `maestro search "<symptom keywords>" --json` → prior investigations
47
+ - Specs: `maestro spec load --category debug --keyword "<symptom>"` → known issues/workarounds
48
+ - Role knowledge: `maestro search --category debug` → select relevant → `maestro wiki load`
49
+
50
+ **Output**: `DEBUG_DIR = .workflow/scratch/{YYYYMMDD}-debug-P{N}-{slug}/` (P{N} = phase number when phase-scoped; omit for standalone). Output directory rules defined in workflow debug.md Step 4.
51
+ </context>
52
+
53
+ <execution>
54
+ Follow '~/.maestro/workflows/debug.md' completely.
55
+
56
+ ### Phase Gates (MANDATORY, BLOCKING)
57
+
58
+ **GATE 1: Input → Investigation**
59
+ - REQUIRED: Symptoms gathered (interactive) or loaded from UAT (--from-uat).
60
+ - REQUIRED: Debug output directory created.
61
+ - BLOCKED if missing: cannot investigate without symptom baseline.
62
+
63
+ **GATE 2: Investigation → Diagnosis**
64
+ - REQUIRED: Debug agent(s) spawned with full symptom context.
65
+ - REQUIRED: evidence.ndjson written with structured entries.
66
+ - REQUIRED: understanding.md tracks evolving understanding.
67
+ - BLOCKED if incomplete: continue investigation before declaring root cause.
68
+
69
+ **GATE 3: Diagnosis → Completion**
70
+ - REQUIRED: Root causes collected with fix_direction and affected_files.
71
+ - REQUIRED: Multi-factor confidence scored per gap.
72
+ - REQUIRED: Readiness gate checked and pressure pass completed.
73
+ - BLOCKED if inconclusive: resume session or escalate.
74
+
75
+ **Register artifact on completion (phase-scoped only):**
76
+ ```
77
+ Append to state.json.artifacts[]:
78
+ {
79
+ id: nextArtifactId(artifacts, "debug"), // DBG-001
80
+ type: "debug",
81
+ milestone: current_milestone,
82
+ phase: target_phase,
83
+ scope: "phase",
84
+ path: "scratch/{YYYYMMDD}-debug-P{N}-{slug}",
85
+ status: all_diagnosed ? "completed" : "failed",
86
+ depends_on: triggering_review_id || exec_art.id,
87
+ harvested: false,
88
+ created_at: start_time,
89
+ completed_at: now()
90
+ }
91
+ ```
92
+
93
+ ### Post-debug Knowledge Inquiry
94
+
95
+ | Condition | Ask | Route |
96
+ |-----------|-----|-------|
97
+ | Recurring root cause pattern (seen in prior debug) | "Document in debug-notes.md?" | spec-add debug |
98
+ | Non-obvious fix / workaround | "Record as learning?" | spec-add learning |
99
+ | Root cause = architectural boundary violation | "Update architecture-constraints.md?" | spec-add arch |
100
+
101
+ On confirm → `Skill("spec-add", "<category> <content> --description \"<summary>\"")`.
102
+
103
+ </execution>
104
+
105
+ <completion>
106
+ ### Standalone report
107
+
108
+ ```
109
+ --- COMPLETION STATUS ---
110
+ STATUS: DONE|DONE_WITH_CONCERNS|NEEDS_RETRY
111
+ CONCERNS: {description if applicable}
112
+ --- END STATUS ---
113
+ ```
114
+
115
+ ### Ralph-invoked completion
116
+
117
+ End the step by calling the CLI (no text block output):
118
+ ```
119
+ maestro ralph complete <idx> --status {STATUS} [--evidence {path}]
120
+ ```
121
+
122
+ ### Next-step routing
123
+
124
+ | Condition | Suggestion |
125
+ |-----------|-----------|
126
+ | Root cause found, fix needed | `/maestro-plan {phase} --gaps` |
127
+ | Root cause found (from UAT), auto-fix | `/quality-test {phase} --auto-fix` |
128
+ | Inconclusive, need more info | `/quality-debug {issue} -c` (resume) |
129
+ | Standalone fix already applied | `/maestro-execute {phase}` |
130
+ </completion>
131
+
132
+ <error_codes>
133
+ | Code | Severity | Condition | Recovery |
134
+ |------|----------|-----------|----------|
135
+ | E001 | error | Issue description required (no arguments, no active sessions) | Check arguments format, re-run with correct input |
136
+ | E002 | error | UAT file not found for --from-uat phase | Verify UAT file exists for specified phase |
137
+ | W001 | warning | Existing debug session found, offer resume | Review existing sessions, choose resume or new |
138
+ | W002 | warning | Checkpoint reached, user input needed | Provide requested input to continue |
139
+ | W003 | warning | Some gaps inconclusive, partial diagnosis | Review partial results, retry inconclusive gaps |
140
+ </error_codes>
141
+
142
+ <success_criteria>
143
+ - [ ] Input parsed: standalone, --from-uat, or --parallel mode determined
144
+ - [ ] Active sessions checked and resume offered if applicable
145
+ - [ ] Symptoms gathered (interactive) or loaded from UAT (pre-filled)
146
+ - [ ] Debug output directory created (phase .debug/ or scratch/)
147
+ - [ ] Debug agent(s) spawned with full symptom context
148
+ - [ ] If --parallel: one agent per gap cluster, all concurrent
149
+ - [ ] evidence.ndjson written with structured NDJSON entries
150
+ - [ ] understanding.md tracks evolving understanding per cluster
151
+ - [ ] Root causes collected with fix_direction and affected_files
152
+ - [ ] Multi-factor confidence scored per gap (Step 7.0) replacing simple high/medium/low
153
+ - [ ] Readiness gate checked before ROOT CAUSE declaration
154
+ - [ ] Pressure pass completed on confirmed hypothesis
155
+ - [ ] Confidence table appended to understanding.md
156
+ - [ ] If --from-uat: uat.md gaps updated with diagnosis artifacts
157
+ - [ ] Results unified into diagnosis summary with confidence section
158
+ - [ ] Next step routed (plan --gaps + execute if fix needed, verify if fix applied, resume if inconclusive)
159
+ </success_criteria>