@howlil/ez-agents 2.0.0 → 2.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (106) hide show
  1. package/LICENSE +21 -21
  2. package/README.md +93 -93
  3. package/agents/ez-plan-checker.md +2 -2
  4. package/agents/ez-research-synthesizer.md +1 -1
  5. package/agents/ez-ui-researcher.md +1 -1
  6. package/agents/ez-verifier.md +1 -1
  7. package/bin/install.js +132 -132
  8. package/get-shit-done/bin/lib/assistant-adapter.cjs +205 -205
  9. package/get-shit-done/bin/lib/audit-exec.cjs +150 -150
  10. package/get-shit-done/bin/lib/auth.cjs +175 -175
  11. package/get-shit-done/bin/lib/circuit-breaker.cjs +118 -118
  12. package/get-shit-done/bin/lib/commands.cjs +666 -666
  13. package/get-shit-done/bin/lib/config.cjs +183 -183
  14. package/get-shit-done/bin/lib/core.cjs +495 -495
  15. package/get-shit-done/bin/lib/file-lock.cjs +236 -236
  16. package/get-shit-done/bin/lib/frontmatter.cjs +299 -299
  17. package/get-shit-done/bin/lib/fs-utils.cjs +153 -153
  18. package/get-shit-done/bin/lib/git-utils.cjs +203 -203
  19. package/get-shit-done/bin/lib/health-check.cjs +163 -163
  20. package/get-shit-done/bin/lib/index.cjs +113 -113
  21. package/get-shit-done/bin/lib/init.cjs +710 -710
  22. package/get-shit-done/bin/lib/logger.cjs +117 -117
  23. package/get-shit-done/bin/lib/milestone.cjs +241 -241
  24. package/get-shit-done/bin/lib/model-provider.cjs +146 -146
  25. package/get-shit-done/bin/lib/phase.cjs +908 -908
  26. package/get-shit-done/bin/lib/retry.cjs +119 -119
  27. package/get-shit-done/bin/lib/roadmap.cjs +305 -305
  28. package/get-shit-done/bin/lib/safe-exec.cjs +128 -128
  29. package/get-shit-done/bin/lib/safe-path.cjs +130 -130
  30. package/get-shit-done/bin/lib/state.cjs +721 -721
  31. package/get-shit-done/bin/lib/temp-file.cjs +239 -239
  32. package/get-shit-done/bin/lib/template.cjs +222 -222
  33. package/get-shit-done/bin/lib/test-file-lock.cjs +112 -112
  34. package/get-shit-done/bin/lib/test-graceful.cjs +93 -93
  35. package/get-shit-done/bin/lib/test-logger.cjs +60 -60
  36. package/get-shit-done/bin/lib/test-safe-exec.cjs +38 -38
  37. package/get-shit-done/bin/lib/test-safe-path.cjs +33 -33
  38. package/get-shit-done/bin/lib/test-temp-file.cjs +125 -125
  39. package/get-shit-done/bin/lib/timeout-exec.cjs +62 -62
  40. package/get-shit-done/bin/lib/verify.cjs +820 -820
  41. package/get-shit-done/references/checkpoints.md +776 -776
  42. package/get-shit-done/references/questioning.md +162 -162
  43. package/get-shit-done/references/tdd.md +263 -263
  44. package/get-shit-done/templates/codebase/concerns.md +310 -310
  45. package/get-shit-done/templates/codebase/conventions.md +307 -307
  46. package/get-shit-done/templates/codebase/integrations.md +280 -280
  47. package/get-shit-done/templates/codebase/stack.md +186 -186
  48. package/get-shit-done/templates/codebase/testing.md +480 -480
  49. package/get-shit-done/templates/config.json +37 -37
  50. package/get-shit-done/templates/continue-here.md +78 -78
  51. package/get-shit-done/templates/milestone-archive.md +123 -123
  52. package/get-shit-done/templates/milestone.md +115 -115
  53. package/get-shit-done/templates/requirements.md +231 -231
  54. package/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -204
  55. package/get-shit-done/templates/research-project/FEATURES.md +147 -147
  56. package/get-shit-done/templates/research-project/PITFALLS.md +200 -200
  57. package/get-shit-done/templates/research-project/STACK.md +120 -120
  58. package/get-shit-done/templates/research-project/SUMMARY.md +170 -170
  59. package/get-shit-done/templates/retrospective.md +54 -54
  60. package/get-shit-done/templates/roadmap.md +202 -202
  61. package/get-shit-done/templates/summary-minimal.md +41 -41
  62. package/get-shit-done/templates/summary-standard.md +48 -48
  63. package/get-shit-done/templates/summary.md +248 -248
  64. package/get-shit-done/templates/user-setup.md +311 -311
  65. package/get-shit-done/templates/verification-report.md +322 -322
  66. package/get-shit-done/workflows/add-phase.md +112 -112
  67. package/get-shit-done/workflows/add-tests.md +351 -351
  68. package/get-shit-done/workflows/add-todo.md +158 -158
  69. package/get-shit-done/workflows/audit-milestone.md +332 -332
  70. package/get-shit-done/workflows/autonomous.md +743 -743
  71. package/get-shit-done/workflows/check-todos.md +177 -177
  72. package/get-shit-done/workflows/cleanup.md +152 -152
  73. package/get-shit-done/workflows/complete-milestone.md +766 -766
  74. package/get-shit-done/workflows/diagnose-issues.md +219 -219
  75. package/get-shit-done/workflows/discovery-phase.md +289 -289
  76. package/get-shit-done/workflows/discuss-phase.md +762 -762
  77. package/get-shit-done/workflows/execute-phase.md +468 -468
  78. package/get-shit-done/workflows/execute-plan.md +483 -483
  79. package/get-shit-done/workflows/health.md +159 -159
  80. package/get-shit-done/workflows/help.md +492 -492
  81. package/get-shit-done/workflows/insert-phase.md +130 -130
  82. package/get-shit-done/workflows/list-phase-assumptions.md +178 -178
  83. package/get-shit-done/workflows/map-codebase.md +316 -316
  84. package/get-shit-done/workflows/new-milestone.md +384 -384
  85. package/get-shit-done/workflows/new-project.md +1111 -1111
  86. package/get-shit-done/workflows/node-repair.md +92 -92
  87. package/get-shit-done/workflows/pause-work.md +122 -122
  88. package/get-shit-done/workflows/plan-milestone-gaps.md +274 -274
  89. package/get-shit-done/workflows/plan-phase.md +651 -651
  90. package/get-shit-done/workflows/progress.md +382 -382
  91. package/get-shit-done/workflows/quick.md +610 -610
  92. package/get-shit-done/workflows/remove-phase.md +155 -155
  93. package/get-shit-done/workflows/research-phase.md +74 -74
  94. package/get-shit-done/workflows/resume-project.md +307 -307
  95. package/get-shit-done/workflows/set-profile.md +81 -81
  96. package/get-shit-done/workflows/settings.md +242 -242
  97. package/get-shit-done/workflows/stats.md +57 -57
  98. package/get-shit-done/workflows/transition.md +544 -544
  99. package/get-shit-done/workflows/ui-phase.md +290 -290
  100. package/get-shit-done/workflows/ui-review.md +157 -157
  101. package/get-shit-done/workflows/update.md +320 -320
  102. package/get-shit-done/workflows/validate-phase.md +167 -167
  103. package/get-shit-done/workflows/verify-phase.md +243 -243
  104. package/package.json +1 -1
  105. package/scripts/build-hooks.js +43 -43
  106. package/scripts/run-tests.cjs +29 -29
@@ -1,351 +1,351 @@
1
- <purpose>
2
- Generate unit and E2E tests for a completed phase based on its SUMMARY.md, CONTEXT.md, and implementation. Classifies each changed file into TDD (unit), E2E (browser), or Skip categories, presents a test plan for user approval, then generates tests following RED-GREEN conventions.
3
-
4
- Users currently hand-craft `/ez:quick` prompts for test generation after each phase. This workflow standardizes the process with proper classification, quality gates, and gap reporting.
5
- </purpose>
6
-
7
- <required_reading>
8
- Read all files referenced by the invoking prompt's execution_context before starting.
9
- </required_reading>
10
-
11
- <process>
12
-
13
- <step name="parse_arguments">
14
- Parse `$ARGUMENTS` for:
15
- - Phase number (integer, decimal, or letter-suffix) → store as `$PHASE_ARG`
16
- - Remaining text after phase number → store as `$EXTRA_INSTRUCTIONS` (optional)
17
-
18
- Example: `/ez:add-tests 12 focus on edge cases` → `$PHASE_ARG=12`, `$EXTRA_INSTRUCTIONS="focus on edge cases"`
19
-
20
- If no phase argument provided:
21
-
22
- ```
23
- ERROR: Phase number required
24
- Usage: /ez:add-tests <phase> [additional instructions]
25
- Example: /ez:add-tests 12
26
- Example: /ez:add-tests 12 focus on edge cases in the pricing module
27
- ```
28
-
29
- Exit.
30
- </step>
31
-
32
- <step name="init_context">
33
- Load phase operation context:
34
-
35
- ```bash
36
- INIT=$(node "$HOME/.claude/ez-agents/bin/ez-tools.cjs" init phase-op "${PHASE_ARG}")
37
- if [[ "$INIT" == @file:* ]]; then INIT=$(cat "${INIT#@file:}"); fi
38
- ```
39
-
40
- Extract from init JSON: `phase_dir`, `phase_number`, `phase_name`.
41
-
42
- Verify the phase directory exists. If not:
43
- ```
44
- ERROR: Phase directory not found for phase ${PHASE_ARG}
45
- Ensure the phase exists in .planning/phases/
46
- ```
47
- Exit.
48
-
49
- Read the phase artifacts (in order of priority):
50
- 1. `${phase_dir}/*-SUMMARY.md` — what was implemented, files changed
51
- 2. `${phase_dir}/CONTEXT.md` — acceptance criteria, decisions
52
- 3. `${phase_dir}/*-VERIFICATION.md` — user-verified scenarios (if UAT was done)
53
-
54
- If no SUMMARY.md exists:
55
- ```
56
- ERROR: No SUMMARY.md found for phase ${PHASE_ARG}
57
- This command works on completed phases. Run /ez:execute-phase first.
58
- ```
59
- Exit.
60
-
61
- Present banner:
62
- ```
63
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
64
- GSD ► ADD TESTS — Phase ${phase_number}: ${phase_name}
65
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
66
- ```
67
- </step>
68
-
69
- <step name="analyze_implementation">
70
- Extract the list of files modified by the phase from SUMMARY.md ("Files Changed" or equivalent section).
71
-
72
- For each file, classify into one of three categories:
73
-
74
- | Category | Criteria | Test Type |
75
- |----------|----------|-----------|
76
- | **TDD** | Pure functions where `expect(fn(input)).toBe(output)` is writable | Unit tests |
77
- | **E2E** | UI behavior verifiable by browser automation | Playwright/E2E tests |
78
- | **Skip** | Not meaningfully testable or already covered | None |
79
-
80
- **TDD classification — apply when:**
81
- - Business logic: calculations, pricing, tax rules, validation
82
- - Data transformations: mapping, filtering, aggregation, formatting
83
- - Parsers: CSV, JSON, XML, custom format parsing
84
- - Validators: input validation, schema validation, business rules
85
- - State machines: status transitions, workflow steps
86
- - Utilities: string manipulation, date handling, number formatting
87
-
88
- **E2E classification — apply when:**
89
- - Keyboard shortcuts: key bindings, modifier keys, chord sequences
90
- - Navigation: page transitions, routing, breadcrumbs, back/forward
91
- - Form interactions: submit, validation errors, field focus, autocomplete
92
- - Selection: row selection, multi-select, shift-click ranges
93
- - Drag and drop: reordering, moving between containers
94
- - Modal dialogs: open, close, confirm, cancel
95
- - Data grids: sorting, filtering, inline editing, column resize
96
-
97
- **Skip classification — apply when:**
98
- - UI layout/styling: CSS classes, visual appearance, responsive breakpoints
99
- - Configuration: config files, environment variables, feature flags
100
- - Glue code: dependency injection setup, middleware registration, routing tables
101
- - Migrations: database migrations, schema changes
102
- - Simple CRUD: basic create/read/update/delete with no business logic
103
- - Type definitions: records, DTOs, interfaces with no logic
104
-
105
- Read each file to verify classification. Don't classify based on filename alone.
106
- </step>
107
-
108
- <step name="present_classification">
109
- Present the classification to the user for confirmation before proceeding:
110
-
111
- ```
112
- AskUserQuestion(
113
- header: "Test Classification",
114
- question: |
115
- ## Files classified for testing
116
-
117
- ### TDD (Unit Tests) — {N} files
118
- {list of files with brief reason}
119
-
120
- ### E2E (Browser Tests) — {M} files
121
- {list of files with brief reason}
122
-
123
- ### Skip — {K} files
124
- {list of files with brief reason}
125
-
126
- {if $EXTRA_INSTRUCTIONS: "Additional instructions: ${EXTRA_INSTRUCTIONS}"}
127
-
128
- How would you like to proceed?
129
- options:
130
- - "Approve and generate test plan"
131
- - "Adjust classification (I'll specify changes)"
132
- - "Cancel"
133
- )
134
- ```
135
-
136
- If user selects "Adjust classification": apply their changes and re-present.
137
- If user selects "Cancel": exit gracefully.
138
- </step>
139
-
140
- <step name="discover_test_structure">
141
- Before generating the test plan, discover the project's existing test structure:
142
-
143
- ```bash
144
- # Find existing test directories
145
- find . -type d \( -name "*test*" -o -name "*spec*" -o -name "*__tests__*" \) 2>/dev/null | head -20
146
- # Find existing test files for convention matching
147
- find . -type f \( -name "*.test.*" -o -name "*.spec.*" -o -name "*Tests.fs" -o -name "*Test.fs" \) 2>/dev/null | head -20
148
- # Check for test runners
149
- ls package.json *.sln 2>/dev/null
150
- ```
151
-
152
- Identify:
153
- - Test directory structure (where unit tests live, where E2E tests live)
154
- - Naming conventions (`.test.ts`, `.spec.ts`, `*Tests.fs`, etc.)
155
- - Test runner commands (how to execute unit tests, how to execute E2E tests)
156
- - Test framework (xUnit, NUnit, Jest, Playwright, etc.)
157
-
158
- If test structure is ambiguous, ask the user:
159
- ```
160
- AskUserQuestion(
161
- header: "Test Structure",
162
- question: "I found multiple test locations. Where should I create tests?",
163
- options: [list discovered locations]
164
- )
165
- ```
166
- </step>
167
-
168
- <step name="generate_test_plan">
169
- For each approved file, create a detailed test plan.
170
-
171
- **For TDD files**, plan tests following RED-GREEN-REFACTOR:
172
- 1. Identify testable functions/methods in the file
173
- 2. For each function: list input scenarios, expected outputs, edge cases
174
- 3. Note: since code already exists, tests may pass immediately — that's OK, but verify they test the RIGHT behavior
175
-
176
- **For E2E files**, plan tests following RED-GREEN gates:
177
- 1. Identify user scenarios from CONTEXT.md/VERIFICATION.md
178
- 2. For each scenario: describe the user action, expected outcome, assertions
179
- 3. Note: RED gate means confirming the test would fail if the feature were broken
180
-
181
- Present the complete test plan:
182
-
183
- ```
184
- AskUserQuestion(
185
- header: "Test Plan",
186
- question: |
187
- ## Test Generation Plan
188
-
189
- ### Unit Tests ({N} tests across {M} files)
190
- {for each file: test file path, list of test cases}
191
-
192
- ### E2E Tests ({P} tests across {Q} files)
193
- {for each file: test file path, list of test scenarios}
194
-
195
- ### Test Commands
196
- - Unit: {discovered test command}
197
- - E2E: {discovered e2e command}
198
-
199
- Ready to generate?
200
- options:
201
- - "Generate all"
202
- - "Cherry-pick (I'll specify which)"
203
- - "Adjust plan"
204
- )
205
- ```
206
-
207
- If "Cherry-pick": ask user which tests to include.
208
- If "Adjust plan": apply changes and re-present.
209
- </step>
210
-
211
- <step name="execute_tdd_generation">
212
- For each approved TDD test:
213
-
214
- 1. **Create test file** following discovered project conventions (directory, naming, imports)
215
-
216
- 2. **Write test** with clear arrange/act/assert structure:
217
- ```
218
- // Arrange — set up inputs and expected outputs
219
- // Act — call the function under test
220
- // Assert — verify the output matches expectations
221
- ```
222
-
223
- 3. **Run the test**:
224
- ```bash
225
- {discovered test command}
226
- ```
227
-
228
- 4. **Evaluate result:**
229
- - **Test passes**: Good — the implementation satisfies the test. Verify the test checks meaningful behavior (not just that it compiles).
230
- - **Test fails with assertion error**: This may be a genuine bug discovered by the test. Flag it:
231
- ```
232
- ⚠️ Potential bug found: {test name}
233
- Expected: {expected}
234
- Actual: {actual}
235
- File: {implementation file}
236
- ```
237
- Do NOT fix the implementation — this is a test-generation command, not a fix command. Record the finding.
238
- - **Test fails with error (import, syntax, etc.)**: This is a test error. Fix the test and re-run.
239
- </step>
240
-
241
- <step name="execute_e2e_generation">
242
- For each approved E2E test:
243
-
244
- 1. **Check for existing tests** covering the same scenario:
245
- ```bash
246
- grep -r "{scenario keyword}" {e2e test directory} 2>/dev/null
247
- ```
248
- If found, extend rather than duplicate.
249
-
250
- 2. **Create test file** targeting the user scenario from CONTEXT.md/VERIFICATION.md
251
-
252
- 3. **Run the E2E test**:
253
- ```bash
254
- {discovered e2e command}
255
- ```
256
-
257
- 4. **Evaluate result:**
258
- - **GREEN (passes)**: Record success
259
- - **RED (fails)**: Determine if it's a test issue or a genuine application bug. Flag bugs:
260
- ```
261
- ⚠️ E2E failure: {test name}
262
- Scenario: {description}
263
- Error: {error message}
264
- ```
265
- - **Cannot run**: Report blocker. Do NOT mark as complete.
266
- ```
267
- 🛑 E2E blocker: {reason tests cannot run}
268
- ```
269
-
270
- **No-skip rule:** If E2E tests cannot execute (missing dependencies, environment issues), report the blocker and mark the test as incomplete. Never mark success without actually running the test.
271
- </step>
272
-
273
- <step name="summary_and_commit">
274
- Create a test coverage report and present to user:
275
-
276
- ```
277
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
278
- GSD ► TEST GENERATION COMPLETE
279
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
280
-
281
- ## Results
282
-
283
- | Category | Generated | Passing | Failing | Blocked |
284
- |----------|-----------|---------|---------|---------|
285
- | Unit | {N} | {n1} | {n2} | {n3} |
286
- | E2E | {M} | {m1} | {m2} | {m3} |
287
-
288
- ## Files Created/Modified
289
- {list of test files with paths}
290
-
291
- ## Coverage Gaps
292
- {areas that couldn't be tested and why}
293
-
294
- ## Bugs Discovered
295
- {any assertion failures that indicate implementation bugs}
296
- ```
297
-
298
- Record test generation in project state:
299
- ```bash
300
- node "$HOME/.claude/ez-agents/bin/ez-tools.cjs" state-snapshot
301
- ```
302
-
303
- If there are passing tests to commit:
304
-
305
- ```bash
306
- git add {test files}
307
- git commit -m "test(phase-${phase_number}): add unit and E2E tests from add-tests command"
308
- ```
309
-
310
- Present next steps:
311
-
312
- ```
313
- ---
314
-
315
- ## ▶ Next Up
316
-
317
- {if bugs discovered:}
318
- **Fix discovered bugs:** `/ez:quick fix the {N} test failures discovered in phase ${phase_number}`
319
-
320
- {if blocked tests:}
321
- **Resolve test blockers:** {description of what's needed}
322
-
323
- {otherwise:}
324
- **All tests passing!** Phase ${phase_number} is fully tested.
325
-
326
- ---
327
-
328
- **Also available:**
329
- - `/ez:add-tests {next_phase}` — test another phase
330
- - `/ez:verify-work ${phase_number}` — run UAT verification
331
-
332
- ---
333
- ```
334
- </step>
335
-
336
- </process>
337
-
338
- <success_criteria>
339
- - [ ] Phase artifacts loaded (SUMMARY.md, CONTEXT.md, optionally VERIFICATION.md)
340
- - [ ] All changed files classified into TDD/E2E/Skip categories
341
- - [ ] Classification presented to user and approved
342
- - [ ] Project test structure discovered (directories, conventions, runners)
343
- - [ ] Test plan presented to user and approved
344
- - [ ] TDD tests generated with arrange/act/assert structure
345
- - [ ] E2E tests generated targeting user scenarios
346
- - [ ] All tests executed — no untested tests marked as passing
347
- - [ ] Bugs discovered by tests flagged (not fixed)
348
- - [ ] Test files committed with proper message
349
- - [ ] Coverage gaps documented
350
- - [ ] Next steps presented to user
351
- </success_criteria>
1
+ <purpose>
2
+ Generate unit and E2E tests for a completed phase based on its SUMMARY.md, CONTEXT.md, and implementation. Classifies each changed file into TDD (unit), E2E (browser), or Skip categories, presents a test plan for user approval, then generates tests following RED-GREEN conventions.
3
+
4
+ Users currently hand-craft `/ez:quick` prompts for test generation after each phase. This workflow standardizes the process with proper classification, quality gates, and gap reporting.
5
+ </purpose>
6
+
7
+ <required_reading>
8
+ Read all files referenced by the invoking prompt's execution_context before starting.
9
+ </required_reading>
10
+
11
+ <process>
12
+
13
+ <step name="parse_arguments">
14
+ Parse `$ARGUMENTS` for:
15
+ - Phase number (integer, decimal, or letter-suffix) → store as `$PHASE_ARG`
16
+ - Remaining text after phase number → store as `$EXTRA_INSTRUCTIONS` (optional)
17
+
18
+ Example: `/ez:add-tests 12 focus on edge cases` → `$PHASE_ARG=12`, `$EXTRA_INSTRUCTIONS="focus on edge cases"`
19
+
20
+ If no phase argument provided:
21
+
22
+ ```
23
+ ERROR: Phase number required
24
+ Usage: /ez:add-tests <phase> [additional instructions]
25
+ Example: /ez:add-tests 12
26
+ Example: /ez:add-tests 12 focus on edge cases in the pricing module
27
+ ```
28
+
29
+ Exit.
30
+ </step>
31
+
32
+ <step name="init_context">
33
+ Load phase operation context:
34
+
35
+ ```bash
36
+ INIT=$(node "$HOME/.claude/ez-agents/bin/ez-tools.cjs" init phase-op "${PHASE_ARG}")
37
+ if [[ "$INIT" == @file:* ]]; then INIT=$(cat "${INIT#@file:}"); fi
38
+ ```
39
+
40
+ Extract from init JSON: `phase_dir`, `phase_number`, `phase_name`.
41
+
42
+ Verify the phase directory exists. If not:
43
+ ```
44
+ ERROR: Phase directory not found for phase ${PHASE_ARG}
45
+ Ensure the phase exists in .planning/phases/
46
+ ```
47
+ Exit.
48
+
49
+ Read the phase artifacts (in order of priority):
50
+ 1. `${phase_dir}/*-SUMMARY.md` — what was implemented, files changed
51
+ 2. `${phase_dir}/CONTEXT.md` — acceptance criteria, decisions
52
+ 3. `${phase_dir}/*-VERIFICATION.md` — user-verified scenarios (if UAT was done)
53
+
54
+ If no SUMMARY.md exists:
55
+ ```
56
+ ERROR: No SUMMARY.md found for phase ${PHASE_ARG}
57
+ This command works on completed phases. Run /ez:execute-phase first.
58
+ ```
59
+ Exit.
60
+
61
+ Present banner:
62
+ ```
63
+ ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
64
+ GSD ► ADD TESTS — Phase ${phase_number}: ${phase_name}
65
+ ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
66
+ ```
67
+ </step>
68
+
69
+ <step name="analyze_implementation">
70
+ Extract the list of files modified by the phase from SUMMARY.md ("Files Changed" or equivalent section).
71
+
72
+ For each file, classify into one of three categories:
73
+
74
+ | Category | Criteria | Test Type |
75
+ |----------|----------|-----------|
76
+ | **TDD** | Pure functions where `expect(fn(input)).toBe(output)` is writable | Unit tests |
77
+ | **E2E** | UI behavior verifiable by browser automation | Playwright/E2E tests |
78
+ | **Skip** | Not meaningfully testable or already covered | None |
79
+
80
+ **TDD classification — apply when:**
81
+ - Business logic: calculations, pricing, tax rules, validation
82
+ - Data transformations: mapping, filtering, aggregation, formatting
83
+ - Parsers: CSV, JSON, XML, custom format parsing
84
+ - Validators: input validation, schema validation, business rules
85
+ - State machines: status transitions, workflow steps
86
+ - Utilities: string manipulation, date handling, number formatting
87
+
88
+ **E2E classification — apply when:**
89
+ - Keyboard shortcuts: key bindings, modifier keys, chord sequences
90
+ - Navigation: page transitions, routing, breadcrumbs, back/forward
91
+ - Form interactions: submit, validation errors, field focus, autocomplete
92
+ - Selection: row selection, multi-select, shift-click ranges
93
+ - Drag and drop: reordering, moving between containers
94
+ - Modal dialogs: open, close, confirm, cancel
95
+ - Data grids: sorting, filtering, inline editing, column resize
96
+
97
+ **Skip classification — apply when:**
98
+ - UI layout/styling: CSS classes, visual appearance, responsive breakpoints
99
+ - Configuration: config files, environment variables, feature flags
100
+ - Glue code: dependency injection setup, middleware registration, routing tables
101
+ - Migrations: database migrations, schema changes
102
+ - Simple CRUD: basic create/read/update/delete with no business logic
103
+ - Type definitions: records, DTOs, interfaces with no logic
104
+
105
+ Read each file to verify classification. Don't classify based on filename alone.
106
+ </step>
107
+
108
+ <step name="present_classification">
109
+ Present the classification to the user for confirmation before proceeding:
110
+
111
+ ```
112
+ AskUserQuestion(
113
+ header: "Test Classification",
114
+ question: |
115
+ ## Files classified for testing
116
+
117
+ ### TDD (Unit Tests) — {N} files
118
+ {list of files with brief reason}
119
+
120
+ ### E2E (Browser Tests) — {M} files
121
+ {list of files with brief reason}
122
+
123
+ ### Skip — {K} files
124
+ {list of files with brief reason}
125
+
126
+ {if $EXTRA_INSTRUCTIONS: "Additional instructions: ${EXTRA_INSTRUCTIONS}"}
127
+
128
+ How would you like to proceed?
129
+ options:
130
+ - "Approve and generate test plan"
131
+ - "Adjust classification (I'll specify changes)"
132
+ - "Cancel"
133
+ )
134
+ ```
135
+
136
+ If user selects "Adjust classification": apply their changes and re-present.
137
+ If user selects "Cancel": exit gracefully.
138
+ </step>
139
+
140
+ <step name="discover_test_structure">
141
+ Before generating the test plan, discover the project's existing test structure:
142
+
143
+ ```bash
144
+ # Find existing test directories
145
+ find . -type d \( -name "*test*" -o -name "*spec*" -o -name "*__tests__*" \) 2>/dev/null | head -20
146
+ # Find existing test files for convention matching
147
+ find . -type f \( -name "*.test.*" -o -name "*.spec.*" -o -name "*Tests.fs" -o -name "*Test.fs" \) 2>/dev/null | head -20
148
+ # Check for test runners
149
+ ls package.json *.sln 2>/dev/null
150
+ ```
151
+
152
+ Identify:
153
+ - Test directory structure (where unit tests live, where E2E tests live)
154
+ - Naming conventions (`.test.ts`, `.spec.ts`, `*Tests.fs`, etc.)
155
+ - Test runner commands (how to execute unit tests, how to execute E2E tests)
156
+ - Test framework (xUnit, NUnit, Jest, Playwright, etc.)
157
+
158
+ If test structure is ambiguous, ask the user:
159
+ ```
160
+ AskUserQuestion(
161
+ header: "Test Structure",
162
+ question: "I found multiple test locations. Where should I create tests?",
163
+ options: [list discovered locations]
164
+ )
165
+ ```
166
+ </step>
167
+
168
+ <step name="generate_test_plan">
169
+ For each approved file, create a detailed test plan.
170
+
171
+ **For TDD files**, plan tests following RED-GREEN-REFACTOR:
172
+ 1. Identify testable functions/methods in the file
173
+ 2. For each function: list input scenarios, expected outputs, edge cases
174
+ 3. Note: since code already exists, tests may pass immediately — that's OK, but verify they test the RIGHT behavior
175
+
176
+ **For E2E files**, plan tests following RED-GREEN gates:
177
+ 1. Identify user scenarios from CONTEXT.md/VERIFICATION.md
178
+ 2. For each scenario: describe the user action, expected outcome, assertions
179
+ 3. Note: RED gate means confirming the test would fail if the feature were broken
180
+
181
+ Present the complete test plan:
182
+
183
+ ```
184
+ AskUserQuestion(
185
+ header: "Test Plan",
186
+ question: |
187
+ ## Test Generation Plan
188
+
189
+ ### Unit Tests ({N} tests across {M} files)
190
+ {for each file: test file path, list of test cases}
191
+
192
+ ### E2E Tests ({P} tests across {Q} files)
193
+ {for each file: test file path, list of test scenarios}
194
+
195
+ ### Test Commands
196
+ - Unit: {discovered test command}
197
+ - E2E: {discovered e2e command}
198
+
199
+ Ready to generate?
200
+ options:
201
+ - "Generate all"
202
+ - "Cherry-pick (I'll specify which)"
203
+ - "Adjust plan"
204
+ )
205
+ ```
206
+
207
+ If "Cherry-pick": ask user which tests to include.
208
+ If "Adjust plan": apply changes and re-present.
209
+ </step>
210
+
211
+ <step name="execute_tdd_generation">
212
+ For each approved TDD test:
213
+
214
+ 1. **Create test file** following discovered project conventions (directory, naming, imports)
215
+
216
+ 2. **Write test** with clear arrange/act/assert structure:
217
+ ```
218
+ // Arrange — set up inputs and expected outputs
219
+ // Act — call the function under test
220
+ // Assert — verify the output matches expectations
221
+ ```
222
+
223
+ 3. **Run the test**:
224
+ ```bash
225
+ {discovered test command}
226
+ ```
227
+
228
+ 4. **Evaluate result:**
229
+ - **Test passes**: Good — the implementation satisfies the test. Verify the test checks meaningful behavior (not just that it compiles).
230
+ - **Test fails with assertion error**: This may be a genuine bug discovered by the test. Flag it:
231
+ ```
232
+ ⚠️ Potential bug found: {test name}
233
+ Expected: {expected}
234
+ Actual: {actual}
235
+ File: {implementation file}
236
+ ```
237
+ Do NOT fix the implementation — this is a test-generation command, not a fix command. Record the finding.
238
+ - **Test fails with error (import, syntax, etc.)**: This is a test error. Fix the test and re-run.
239
+ </step>
240
+
241
+ <step name="execute_e2e_generation">
242
+ For each approved E2E test:
243
+
244
+ 1. **Check for existing tests** covering the same scenario:
245
+ ```bash
246
+ grep -r "{scenario keyword}" {e2e test directory} 2>/dev/null
247
+ ```
248
+ If found, extend rather than duplicate.
249
+
250
+ 2. **Create test file** targeting the user scenario from CONTEXT.md/VERIFICATION.md
251
+
252
+ 3. **Run the E2E test**:
253
+ ```bash
254
+ {discovered e2e command}
255
+ ```
256
+
257
+ 4. **Evaluate result:**
258
+ - **GREEN (passes)**: Record success
259
+ - **RED (fails)**: Determine if it's a test issue or a genuine application bug. Flag bugs:
260
+ ```
261
+ ⚠️ E2E failure: {test name}
262
+ Scenario: {description}
263
+ Error: {error message}
264
+ ```
265
+ - **Cannot run**: Report blocker. Do NOT mark as complete.
266
+ ```
267
+ 🛑 E2E blocker: {reason tests cannot run}
268
+ ```
269
+
270
+ **No-skip rule:** If E2E tests cannot execute (missing dependencies, environment issues), report the blocker and mark the test as incomplete. Never mark success without actually running the test.
271
+ </step>
272
+
273
+ <step name="summary_and_commit">
274
+ Create a test coverage report and present to user:
275
+
276
+ ```
277
+ ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
278
+ GSD ► TEST GENERATION COMPLETE
279
+ ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
280
+
281
+ ## Results
282
+
283
+ | Category | Generated | Passing | Failing | Blocked |
284
+ |----------|-----------|---------|---------|---------|
285
+ | Unit | {N} | {n1} | {n2} | {n3} |
286
+ | E2E | {M} | {m1} | {m2} | {m3} |
287
+
288
+ ## Files Created/Modified
289
+ {list of test files with paths}
290
+
291
+ ## Coverage Gaps
292
+ {areas that couldn't be tested and why}
293
+
294
+ ## Bugs Discovered
295
+ {any assertion failures that indicate implementation bugs}
296
+ ```
297
+
298
+ Record test generation in project state:
299
+ ```bash
300
+ node "$HOME/.claude/ez-agents/bin/ez-tools.cjs" state-snapshot
301
+ ```
302
+
303
+ If there are passing tests to commit:
304
+
305
+ ```bash
306
+ git add {test files}
307
+ git commit -m "test(phase-${phase_number}): add unit and E2E tests from add-tests command"
308
+ ```
309
+
310
+ Present next steps:
311
+
312
+ ```
313
+ ---
314
+
315
+ ## ▶ Next Up
316
+
317
+ {if bugs discovered:}
318
+ **Fix discovered bugs:** `/ez:quick fix the {N} test failures discovered in phase ${phase_number}`
319
+
320
+ {if blocked tests:}
321
+ **Resolve test blockers:** {description of what's needed}
322
+
323
+ {otherwise:}
324
+ **All tests passing!** Phase ${phase_number} is fully tested.
325
+
326
+ ---
327
+
328
+ **Also available:**
329
+ - `/ez:add-tests {next_phase}` — test another phase
330
+ - `/ez:verify-work ${phase_number}` — run UAT verification
331
+
332
+ ---
333
+ ```
334
+ </step>
335
+
336
+ </process>
337
+
338
+ <success_criteria>
339
+ - [ ] Phase artifacts loaded (SUMMARY.md, CONTEXT.md, optionally VERIFICATION.md)
340
+ - [ ] All changed files classified into TDD/E2E/Skip categories
341
+ - [ ] Classification presented to user and approved
342
+ - [ ] Project test structure discovered (directories, conventions, runners)
343
+ - [ ] Test plan presented to user and approved
344
+ - [ ] TDD tests generated with arrange/act/assert structure
345
+ - [ ] E2E tests generated targeting user scenarios
346
+ - [ ] All tests executed — no untested tests marked as passing
347
+ - [ ] Bugs discovered by tests flagged (not fixed)
348
+ - [ ] Test files committed with proper message
349
+ - [ ] Coverage gaps documented
350
+ - [ ] Next steps presented to user
351
+ </success_criteria>