gsd-antigravity-kit 2.0.1 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (251)
  1. package/.agent/skills/gsd/SKILL.md +26 -4
  2. package/.agent/skills/gsd/VERSION +1 -1
  3. package/.agent/skills/gsd/assets/templates/AI-SPEC.md +246 -0
  4. package/.agent/skills/gsd/assets/templates/DEBUG.md +7 -2
  5. package/.agent/skills/gsd/assets/templates/config.json +56 -48
  6. package/.agent/skills/gsd/assets/templates/research.md +40 -0
  7. package/.agent/skills/gsd/assets/templates/spec.md +307 -0
  8. package/.agent/skills/gsd/assets/templates/state.md +8 -0
  9. package/.agent/skills/gsd/bin/gsd-tools.cjs +212 -11
  10. package/.agent/skills/gsd/bin/help-manifest.json +8 -2
  11. package/.agent/skills/gsd/bin/hooks/gsd-check-update-worker.js +108 -0
  12. package/.agent/skills/gsd/bin/hooks/gsd-check-update.js +14 -89
  13. package/.agent/skills/gsd/bin/hooks/gsd-context-monitor.js +34 -5
  14. package/.agent/skills/gsd/bin/hooks/gsd-phase-boundary.sh +1 -0
  15. package/.agent/skills/gsd/bin/hooks/gsd-prompt-guard.js +1 -1
  16. package/.agent/skills/gsd/bin/hooks/gsd-read-guard.js +6 -1
  17. package/.agent/skills/gsd/bin/hooks/gsd-session-state.sh +1 -0
  18. package/.agent/skills/gsd/bin/hooks/gsd-statusline.js +150 -16
  19. package/.agent/skills/gsd/bin/hooks/gsd-validate-commit.sh +1 -0
  20. package/.agent/skills/gsd/bin/hooks/gsd-workflow-guard.js +1 -1
  21. package/.agent/skills/gsd/bin/lib/audit.cjs +757 -0
  22. package/.agent/skills/gsd/bin/lib/commands.cjs +17 -7
  23. package/.agent/skills/gsd/bin/lib/config.cjs +66 -20
  24. package/.agent/skills/gsd/bin/lib/core.cjs +212 -12
  25. package/.agent/skills/gsd/bin/lib/frontmatter.cjs +6 -8
  26. package/.agent/skills/gsd/bin/lib/graphify.cjs +494 -0
  27. package/.agent/skills/gsd/bin/lib/gsd2-import.cjs +511 -0
  28. package/.agent/skills/gsd/bin/lib/init.cjs +371 -18
  29. package/.agent/skills/gsd/bin/lib/intel.cjs +9 -30
  30. package/.agent/skills/gsd/bin/lib/milestone.cjs +18 -17
  31. package/.agent/skills/gsd/bin/lib/model-profiles.cjs +1 -0
  32. package/.agent/skills/gsd/bin/lib/phase.cjs +225 -98
  33. package/.agent/skills/gsd/bin/lib/profile-output.cjs +17 -5
  34. package/.agent/skills/gsd/bin/lib/roadmap.cjs +12 -5
  35. package/.agent/skills/gsd/bin/lib/state.cjs +394 -129
  36. package/.agent/skills/gsd/bin/lib/template.cjs +8 -4
  37. package/.agent/skills/gsd/bin/lib/uat.cjs +2 -1
  38. package/.agent/skills/gsd/bin/lib/verify.cjs +111 -42
  39. package/.agent/skills/gsd/migration_report.md +2 -2
  40. package/.agent/skills/gsd/references/agents/gsd-advisor-researcher.md +23 -0
  41. package/.agent/skills/gsd/references/agents/gsd-ai-researcher.md +133 -0
  42. package/.agent/skills/gsd/references/agents/gsd-code-fixer.md +11 -10
  43. package/.agent/skills/gsd/references/agents/gsd-code-reviewer.md +2 -2
  44. package/.agent/skills/gsd/references/agents/gsd-codebase-mapper.md +13 -2
  45. package/.agent/skills/gsd/references/agents/gsd-debug-session-manager.md +314 -0
  46. package/.agent/skills/gsd/references/agents/gsd-debugger.md +147 -76
  47. package/.agent/skills/gsd/references/agents/gsd-doc-verifier.md +1 -1
  48. package/.agent/skills/gsd/references/agents/gsd-doc-writer.md +615 -602
  49. package/.agent/skills/gsd/references/agents/gsd-domain-researcher.md +153 -0
  50. package/.agent/skills/gsd/references/agents/gsd-eval-auditor.md +175 -0
  51. package/.agent/skills/gsd/references/agents/gsd-eval-planner.md +154 -0
  52. package/.agent/skills/gsd/references/agents/gsd-executor.md +108 -38
  53. package/.agent/skills/gsd/references/agents/gsd-framework-selector.md +160 -0
  54. package/.agent/skills/gsd/references/agents/gsd-integration-checker.md +454 -443
  55. package/.agent/skills/gsd/references/agents/gsd-intel-updater.md +40 -20
  56. package/.agent/skills/gsd/references/agents/gsd-nyquist-auditor.md +187 -176
  57. package/.agent/skills/gsd/references/agents/gsd-pattern-mapper.md +335 -0
  58. package/.agent/skills/gsd/references/agents/gsd-phase-researcher.md +112 -13
  59. package/.agent/skills/gsd/references/agents/gsd-plan-checker.md +104 -10
  60. package/.agent/skills/gsd/references/agents/gsd-planner.md +125 -167
  61. package/.agent/skills/gsd/references/agents/gsd-project-researcher.md +25 -2
  62. package/.agent/skills/gsd/references/agents/gsd-research-synthesizer.md +3 -3
  63. package/.agent/skills/gsd/references/agents/gsd-roadmapper.md +12 -1
  64. package/.agent/skills/gsd/references/agents/gsd-security-auditor.md +139 -128
  65. package/.agent/skills/gsd/references/agents/gsd-ui-auditor.md +3 -3
  66. package/.agent/skills/gsd/references/agents/gsd-ui-checker.md +11 -2
  67. package/.agent/skills/gsd/references/agents/gsd-ui-researcher.md +27 -4
  68. package/.agent/skills/gsd/references/agents/gsd-verifier.md +13 -19
  69. package/.agent/skills/gsd/references/commands/atomic/add-todo.md +2 -2
  70. package/.agent/skills/gsd/references/commands/atomic/check-todos.md +2 -2
  71. package/.agent/skills/gsd/references/commands/atomic/cleanup.md +2 -2
  72. package/.agent/skills/gsd/references/commands/atomic/do.md +2 -2
  73. package/.agent/skills/gsd/references/commands/atomic/help.md +2 -2
  74. package/.agent/skills/gsd/references/commands/atomic/join-discord.md +2 -2
  75. package/.agent/skills/gsd/references/commands/atomic/note.md +2 -2
  76. package/.agent/skills/gsd/references/commands/atomic/session-report.md +2 -2
  77. package/.agent/skills/gsd/references/commands/atomic/ship.md +2 -2
  78. package/.agent/skills/gsd/references/commands/atomic/stats.md +2 -2
  79. package/.agent/skills/gsd/references/commands/atomic/thread.md +141 -41
  80. package/.agent/skills/gsd/references/commands/atomic/undo.md +2 -2
  81. package/.agent/skills/gsd/references/commands/milestone/add-backlog.md +15 -12
  82. package/.agent/skills/gsd/references/commands/milestone/audit-milestone.md +2 -2
  83. package/.agent/skills/gsd/references/commands/milestone/complete-milestone.md +2 -2
  84. package/.agent/skills/gsd/references/commands/milestone/milestone-summary.md +2 -2
  85. package/.agent/skills/gsd/references/commands/milestone/new-milestone.md +2 -2
  86. package/.agent/skills/gsd/references/commands/milestone/plan-milestone-gaps.md +2 -2
  87. package/.agent/skills/gsd/references/commands/milestone/plant-seed.md +2 -2
  88. package/.agent/skills/gsd/references/commands/milestone/review-backlog.md +4 -4
  89. package/.agent/skills/gsd/references/commands/misc/ai-integration-phase.md +38 -0
  90. package/.agent/skills/gsd/references/commands/misc/audit-fix.md +2 -2
  91. package/.agent/skills/gsd/references/commands/misc/audit-uat.md +2 -2
  92. package/.agent/skills/gsd/references/commands/misc/eval-review.md +34 -0
  93. package/.agent/skills/gsd/references/commands/misc/extract_learnings.md +24 -0
  94. package/.agent/skills/gsd/references/commands/misc/from-gsd2.md +49 -0
  95. package/.agent/skills/gsd/references/commands/misc/graphify.md +203 -0
  96. package/.agent/skills/gsd/references/commands/misc/inbox.md +40 -0
  97. package/.agent/skills/gsd/references/commands/misc/next.md +5 -3
  98. package/.agent/skills/gsd/references/commands/misc/progress.md +4 -3
  99. package/.agent/skills/gsd/references/commands/misc/sketch-wrap-up.md +33 -0
  100. package/.agent/skills/gsd/references/commands/misc/sketch.md +47 -0
  101. package/.agent/skills/gsd/references/commands/misc/spec-phase.md +64 -0
  102. package/.agent/skills/gsd/references/commands/misc/spike-wrap-up.md +33 -0
  103. package/.agent/skills/gsd/references/commands/misc/spike.md +43 -0
  104. package/.agent/skills/gsd/references/commands/misc/verify-work.md +2 -2
  105. package/.agent/skills/gsd/references/commands/phase/add-phase.md +2 -2
  106. package/.agent/skills/gsd/references/commands/phase/add-tests.md +2 -2
  107. package/.agent/skills/gsd/references/commands/phase/discuss-phase.md +5 -5
  108. package/.agent/skills/gsd/references/commands/phase/execute-phase.md +4 -4
  109. package/.agent/skills/gsd/references/commands/phase/insert-phase.md +2 -2
  110. package/.agent/skills/gsd/references/commands/phase/list-phase-assumptions.md +2 -2
  111. package/.agent/skills/gsd/references/commands/phase/plan-phase.md +3 -3
  112. package/.agent/skills/gsd/references/commands/phase/remove-phase.md +2 -2
  113. package/.agent/skills/gsd/references/commands/phase/research-phase.md +5 -5
  114. package/.agent/skills/gsd/references/commands/phase/secure-phase.md +2 -2
  115. package/.agent/skills/gsd/references/commands/phase/ui-phase.md +2 -2
  116. package/.agent/skills/gsd/references/commands/phase/ui-review.md +2 -2
  117. package/.agent/skills/gsd/references/commands/phase/validate-phase.md +2 -2
  118. package/.agent/skills/gsd/references/commands/phase/workstreams.md +9 -9
  119. package/.agent/skills/gsd/references/commands/project/analyze-dependencies.md +2 -2
  120. package/.agent/skills/gsd/references/commands/project/explore.md +2 -2
  121. package/.agent/skills/gsd/references/commands/project/import.md +2 -2
  122. package/.agent/skills/gsd/references/commands/project/intel.md +10 -10
  123. package/.agent/skills/gsd/references/commands/project/list-workspaces.md +2 -2
  124. package/.agent/skills/gsd/references/commands/project/map-codebase.md +2 -2
  125. package/.agent/skills/gsd/references/commands/project/new-project.md +2 -2
  126. package/.agent/skills/gsd/references/commands/project/new-workspace.md +2 -2
  127. package/.agent/skills/gsd/references/commands/project/remove-workspace.md +2 -2
  128. package/.agent/skills/gsd/references/commands/project/scan.md +2 -2
  129. package/.agent/skills/gsd/references/commands/system/autonomous.md +4 -3
  130. package/.agent/skills/gsd/references/commands/system/code-review-fix.md +3 -3
  131. package/.agent/skills/gsd/references/commands/system/code-review.md +3 -3
  132. package/.agent/skills/gsd/references/commands/system/debug.md +177 -100
  133. package/.agent/skills/gsd/references/commands/system/docs-update.md +2 -2
  134. package/.agent/skills/gsd/references/commands/system/fast.md +2 -2
  135. package/.agent/skills/gsd/references/commands/system/forensics.md +2 -2
  136. package/.agent/skills/gsd/references/commands/system/gsd-tools.md +153 -6
  137. package/.agent/skills/gsd/references/commands/system/health.md +2 -2
  138. package/.agent/skills/gsd/references/commands/system/manager.md +3 -3
  139. package/.agent/skills/gsd/references/commands/system/pause-work.md +2 -2
  140. package/.agent/skills/gsd/references/commands/system/pr-branch.md +2 -2
  141. package/.agent/skills/gsd/references/commands/system/profile-user.md +2 -2
  142. package/.agent/skills/gsd/references/commands/system/quick.md +127 -3
  143. package/.agent/skills/gsd/references/commands/system/reapply-patches.md +45 -6
  144. package/.agent/skills/gsd/references/commands/system/resume-work.md +2 -2
  145. package/.agent/skills/gsd/references/commands/system/review.md +6 -4
  146. package/.agent/skills/gsd/references/commands/system/set-profile.md +3 -3
  147. package/.agent/skills/gsd/references/commands/system/settings.md +2 -2
  148. package/.agent/skills/gsd/references/commands/system/update.md +2 -2
  149. package/.agent/skills/gsd/references/docs/ai-evals.md +156 -0
  150. package/.agent/skills/gsd/references/docs/ai-frameworks.md +186 -0
  151. package/.agent/skills/gsd/references/docs/artifact-types.md +18 -0
  152. package/.agent/skills/gsd/references/docs/autonomous-smart-discuss.md +277 -0
  153. package/.agent/skills/gsd/references/docs/checkpoints.md +30 -0
  154. package/.agent/skills/gsd/references/docs/common-bug-patterns.md +49 -49
  155. package/.agent/skills/gsd/references/docs/continuation-format.md +11 -7
  156. package/.agent/skills/gsd/references/docs/debugger-philosophy.md +76 -0
  157. package/.agent/skills/gsd/references/docs/decimal-phase-calculation.md +64 -64
  158. package/.agent/skills/gsd/references/docs/executor-examples.md +110 -0
  159. package/.agent/skills/gsd/references/docs/git-integration.md +4 -4
  160. package/.agent/skills/gsd/references/docs/git-planning-commit.md +40 -38
  161. package/.agent/skills/gsd/references/docs/ios-scaffold.md +123 -0
  162. package/.agent/skills/gsd/references/docs/mandatory-initial-read.md +2 -0
  163. package/.agent/skills/gsd/references/docs/phase-argument-parsing.md +61 -61
  164. package/.agent/skills/gsd/references/docs/planner-antipatterns.md +89 -0
  165. package/.agent/skills/gsd/references/docs/planner-revision.md +87 -87
  166. package/.agent/skills/gsd/references/docs/planner-source-audit.md +73 -0
  167. package/.agent/skills/gsd/references/docs/planning-config.md +33 -8
  168. package/.agent/skills/gsd/references/docs/project-skills-discovery.md +19 -0
  169. package/.agent/skills/gsd/references/docs/sketch-interactivity.md +41 -0
  170. package/.agent/skills/gsd/references/docs/sketch-theme-system.md +94 -0
  171. package/.agent/skills/gsd/references/docs/sketch-tooling.md +45 -0
  172. package/.agent/skills/gsd/references/docs/sketch-variant-patterns.md +81 -0
  173. package/.agent/skills/gsd/references/docs/tdd.md +67 -0
  174. package/.agent/skills/gsd/references/docs/universal-anti-patterns.md +5 -0
  175. package/.agent/skills/gsd/references/docs/workstream-flag.md +11 -11
  176. package/.agent/skills/gsd/references/mapping.md +1 -1
  177. package/.agent/skills/gsd/references/workflows/add-phase.md +112 -112
  178. package/.agent/skills/gsd/references/workflows/add-tests.md +6 -3
  179. package/.agent/skills/gsd/references/workflows/add-todo.md +5 -3
  180. package/.agent/skills/gsd/references/workflows/ai-integration-phase.md +284 -0
  181. package/.agent/skills/gsd/references/workflows/audit-fix.md +157 -157
  182. package/.agent/skills/gsd/references/workflows/audit-milestone.md +340 -340
  183. package/.agent/skills/gsd/references/workflows/audit-uat.md +109 -109
  184. package/.agent/skills/gsd/references/workflows/autonomous.md +20 -288
  185. package/.agent/skills/gsd/references/workflows/check-todos.md +4 -2
  186. package/.agent/skills/gsd/references/workflows/cleanup.md +3 -1
  187. package/.agent/skills/gsd/references/workflows/code-review-fix.md +497 -497
  188. package/.agent/skills/gsd/references/workflows/code-review.md +515 -515
  189. package/.agent/skills/gsd/references/workflows/complete-milestone.md +97 -24
  190. package/.agent/skills/gsd/references/workflows/diagnose-issues.md +238 -238
  191. package/.agent/skills/gsd/references/workflows/discovery-phase.md +2 -0
  192. package/.agent/skills/gsd/references/workflows/discuss-phase-assumptions.md +11 -11
  193. package/.agent/skills/gsd/references/workflows/discuss-phase.md +143 -19
  194. package/.agent/skills/gsd/references/workflows/do.md +8 -2
  195. package/.agent/skills/gsd/references/workflows/docs-update.md +5 -3
  196. package/.agent/skills/gsd/references/workflows/eval-review.md +155 -0
  197. package/.agent/skills/gsd/references/workflows/execute-phase.md +338 -54
  198. package/.agent/skills/gsd/references/workflows/execute-plan.md +80 -104
  199. package/.agent/skills/gsd/references/workflows/explore.md +3 -1
  200. package/.agent/skills/gsd/references/workflows/extract_learnings.md +232 -0
  201. package/.agent/skills/gsd/references/workflows/forensics.md +3 -3
  202. package/.agent/skills/gsd/references/workflows/health.md +2 -2
  203. package/.agent/skills/gsd/references/workflows/help.md +59 -1
  204. package/.agent/skills/gsd/references/workflows/import.md +3 -1
  205. package/.agent/skills/gsd/references/workflows/inbox.md +387 -384
  206. package/.agent/skills/gsd/references/workflows/insert-phase.md +130 -130
  207. package/.agent/skills/gsd/references/workflows/list-workspaces.md +56 -56
  208. package/.agent/skills/gsd/references/workflows/manager.md +5 -3
  209. package/.agent/skills/gsd/references/workflows/map-codebase.md +19 -5
  210. package/.agent/skills/gsd/references/workflows/milestone-summary.md +6 -6
  211. package/.agent/skills/gsd/references/workflows/new-milestone.md +63 -9
  212. package/.agent/skills/gsd/references/workflows/new-project.md +126 -22
  213. package/.agent/skills/gsd/references/workflows/new-workspace.md +6 -4
  214. package/.agent/skills/gsd/references/workflows/next.md +220 -153
  215. package/.agent/skills/gsd/references/workflows/note.md +2 -0
  216. package/.agent/skills/gsd/references/workflows/pause-work.md +11 -7
  217. package/.agent/skills/gsd/references/workflows/plan-milestone-gaps.md +273 -273
  218. package/.agent/skills/gsd/references/workflows/plan-phase.md +281 -62
  219. package/.agent/skills/gsd/references/workflows/plant-seed.md +4 -1
  220. package/.agent/skills/gsd/references/workflows/pr-branch.md +41 -13
  221. package/.agent/skills/gsd/references/workflows/profile-user.md +15 -13
  222. package/.agent/skills/gsd/references/workflows/progress.md +133 -21
  223. package/.agent/skills/gsd/references/workflows/quick.md +67 -27
  224. package/.agent/skills/gsd/references/workflows/remove-phase.md +155 -155
  225. package/.agent/skills/gsd/references/workflows/remove-workspace.md +4 -2
  226. package/.agent/skills/gsd/references/workflows/research-phase.md +3 -3
  227. package/.agent/skills/gsd/references/workflows/resume-project.md +3 -3
  228. package/.agent/skills/gsd/references/workflows/review.md +71 -8
  229. package/.agent/skills/gsd/references/workflows/scan.md +102 -102
  230. package/.agent/skills/gsd/references/workflows/secure-phase.md +7 -5
  231. package/.agent/skills/gsd/references/workflows/settings.md +24 -7
  232. package/.agent/skills/gsd/references/workflows/ship.md +71 -6
  233. package/.agent/skills/gsd/references/workflows/sketch-wrap-up.md +283 -0
  234. package/.agent/skills/gsd/references/workflows/sketch.md +263 -0
  235. package/.agent/skills/gsd/references/workflows/spec-phase.md +262 -0
  236. package/.agent/skills/gsd/references/workflows/spike-wrap-up.md +273 -0
  237. package/.agent/skills/gsd/references/workflows/spike.md +270 -0
  238. package/.agent/skills/gsd/references/workflows/stats.md +60 -60
  239. package/.agent/skills/gsd/references/workflows/transition.md +671 -671
  240. package/.agent/skills/gsd/references/workflows/ui-phase.md +33 -12
  241. package/.agent/skills/gsd/references/workflows/ui-review.md +6 -4
  242. package/.agent/skills/gsd/references/workflows/undo.md +3 -1
  243. package/.agent/skills/gsd/references/workflows/update.md +113 -2
  244. package/.agent/skills/gsd/references/workflows/validate-phase.md +7 -5
  245. package/.agent/skills/gsd/references/workflows/verify-phase.md +93 -10
  246. package/.agent/skills/gsd/references/workflows/verify-work.md +50 -10
  247. package/.agent/skills/gsd-converter/references/mapping.md +1 -1
  248. package/.agent/skills/gsd-converter/scripts/convert.py +36 -17
  249. package/.agent/skills/gsd-converter/scripts/regression_test.py +68 -33
  250. package/README.md +3 -2
  251. package/package.json +1 -1
@@ -1,6 +1,6 @@
1
1
  ---
2
2
  name: gsd
3
- version: 1.34.2
3
+ version: 1.37.1
4
4
  description: "Antigravity GSD (Get Stuff Done) - A spec-driven hierarchical planning and execution system. Triggers on project planning, phase management, and GSD slash commands."
5
5
  ---
6
6
 
@@ -25,6 +25,7 @@ This skill should be used when:
25
25
  - `gsd:add-phase`
26
26
  - `gsd:add-tests`
27
27
  - `gsd:add-todo`
28
+ - `gsd:ai-integration-phase`
28
29
  - `gsd:analyze-dependencies`
29
30
  - `gsd:audit-fix`
30
31
  - `gsd:audit-milestone`
@@ -39,14 +40,19 @@ This skill should be used when:
39
40
  - `gsd:discuss-phase`
40
41
  - `gsd:do`
41
42
  - `gsd:docs-update`
43
+ - `gsd:eval-review`
42
44
  - `gsd:execute-phase`
43
45
  - `gsd:explore`
46
+ - `gsd:extract_learnings`
44
47
  - `gsd:fast`
45
48
  - `gsd:forensics`
49
+ - `gsd:from-gsd2`
50
+ - `gsd:graphify`
46
51
  - `gsd:gsd-tools`
47
52
  - `gsd:health`
48
53
  - `gsd:help`
49
54
  - `gsd:import`
55
+ - `gsd:inbox`
50
56
  - `gsd:insert-phase`
51
57
  - `gsd:intel`
52
58
  - `gsd:join-discord`
@@ -81,6 +87,11 @@ This skill should be used when:
81
87
  - `gsd:set-profile`
82
88
  - `gsd:settings`
83
89
  - `gsd:ship`
90
+ - `gsd:sketch`
91
+ - `gsd:sketch-wrap-up`
92
+ - `gsd:spec-phase`
93
+ - `gsd:spike`
94
+ - `gsd:spike-wrap-up`
84
95
  - `gsd:stats`
85
96
  - `gsd:thread`
86
97
  - `gsd:ui-phase`
@@ -128,16 +139,27 @@ The following slash commands are available in this skill. Use them to drive the
128
139
  - **[`gsd:review-backlog`](references/commands/milestone/review-backlog.md)**: Review and promote backlog items to active milestone
129
140
 
130
141
  ### Misc Commands
142
+ - **[`gsd:ai-integration-phase`](references/commands/misc/ai-integration-phase.md)**: Generate AI design contract (AI-SPEC.md) for phases that involve building AI systems — framework selection, implementation guidance from official docs, and evaluation strategy
131
143
  - **[`gsd:audit-fix`](references/commands/misc/audit-fix.md)**: Autonomous audit-to-fix pipeline — find issues, classify, fix, test, commit
132
144
  - **[`gsd:audit-uat`](references/commands/misc/audit-uat.md)**: Cross-phase audit of all outstanding UAT and verification items
145
+ - **[`gsd:eval-review`](references/commands/misc/eval-review.md)**: Retroactively audit an executed AI phase's evaluation coverage — scores each eval dimension as COVERED/PARTIAL/MISSING and produces an actionable EVAL-REVIEW.md with remediation plan
146
+ - **[`gsd:extract_learnings`](references/commands/misc/extract_learnings.md)**: Extract decisions, lessons, patterns, and surprises from completed phase artifacts
147
+ - **[`gsd:from-gsd2`](references/commands/misc/from-gsd2.md)**: Import a GSD-2 (.gsd/) project back to GSD v1 (.planning/) format
148
+ - **[`gsd:graphify`](references/commands/misc/graphify.md)**: Build, query, and inspect the project knowledge graph in .planning/graphs/
149
+ - **[`gsd:inbox`](references/commands/misc/inbox.md)**: Triage and review all open GitHub issues and PRs against project templates and contribution guidelines
133
150
  - **[`gsd:next`](references/commands/misc/next.md)**: Automatically advance to the next logical step in the GSD workflow
134
- - **[`gsd:progress`](references/commands/misc/progress.md)**: Check project progress, show context, and route to next action (execute or plan)
151
+ - **[`gsd:progress`](references/commands/misc/progress.md)**: Check project progress, show context, and route to next action (execute or plan). Use --forensic to append a 6-check integrity audit after the standard report.
152
+ - **[`gsd:sketch-wrap-up`](references/commands/misc/sketch-wrap-up.md)**: Package sketch design findings into a persistent project skill for future build conversations
153
+ - **[`gsd:sketch`](references/commands/misc/sketch.md)**: Rapidly sketch UI/design ideas using throwaway HTML mockups with multi-variant exploration
154
+ - **[`gsd:spec-phase`](references/commands/misc/spec-phase.md)**: Socratic spec refinement — clarify WHAT a phase delivers with ambiguity scoring before discuss-phase. Produces a SPEC.md with falsifiable requirements locked before implementation decisions begin.
155
+ - **[`gsd:spike-wrap-up`](references/commands/misc/spike-wrap-up.md)**: Package spike findings into a persistent project skill for future build conversations
156
+ - **[`gsd:spike`](references/commands/misc/spike.md)**: Rapidly spike an idea with throwaway experiments to validate feasibility before planning
135
157
  - **[`gsd:verify-work`](references/commands/misc/verify-work.md)**: Validate built features through conversational UAT
136
158
 
137
159
  ### Phase Commands
138
160
  - **[`gsd:add-phase`](references/commands/phase/add-phase.md)**: Add phase to end of current milestone in roadmap
139
161
  - **[`gsd:add-tests`](references/commands/phase/add-tests.md)**: Generate tests for a completed phase based on UAT criteria and implementation
140
- - **[`gsd:discuss-phase`](references/commands/phase/discuss-phase.md)**: Gather phase context through adaptive questioning before planning. Use --auto to skip interactive questions (Antigravity picks recommended defaults). Use --chain for interactive discuss followed by automatic plan+execute. Use --power for bulk question generation into a file-based UI (answer at your own pace).
162
+ - **[`gsd:discuss-phase`](references/commands/phase/discuss-phase.md)**: Gather phase context through adaptive questioning before planning. Use --all to skip area selection and discuss all gray areas interactively. Use --auto to skip interactive questions (Antigravity picks recommended defaults). Use --chain for interactive discuss followed by automatic plan+execute. Use --power for bulk question generation into a file-based UI (answer at your own pace).
141
163
  - **[`gsd:execute-phase`](references/commands/phase/execute-phase.md)**: Execute all plans in a phase with wave-based parallelization
142
164
  - **[`gsd:insert-phase`](references/commands/phase/insert-phase.md)**: Insert urgent work as decimal phase (e.g., 72.1) between existing phases
143
165
  - **[`gsd:list-phase-assumptions`](references/commands/phase/list-phase-assumptions.md)**: Surface Antigravity's assumptions about a phase approach before planning
@@ -218,4 +240,4 @@ General documentation on the GSD philosophy, usage patterns, and configuration.
218
240
  5. **CLI Invocation**: `gsd-tools` is **NOT** a global command. Always invoke it with the full node path: `node .agent/skills/gsd/bin/gsd-tools.cjs <command> [args]`. Never run `gsd-tools` bare.
219
241
 
220
242
  ---
221
- *Generated by gsd-converter on 2026-04-08*
243
+ *Generated by gsd-converter on 2026-04-18*
@@ -1 +1 @@
1
- 1.34.2
1
+ 1.37.1
@@ -0,0 +1,246 @@
1
+ # AI-SPEC — Phase {N}: {phase_name}
2
+
3
+ > AI design contract generated by `gsd:ai-integration-phase`. Consumed by `gsd-planner` and `gsd-eval-auditor`.
4
+ > Locks framework selection, implementation guidance, and evaluation strategy before planning begins.
5
+
6
+ ---
7
+
8
+ ## 1. System Classification
9
+
10
+ **System Type:** <!-- RAG | Multi-Agent | Conversational | Extraction | Autonomous Agent | Content Generation | Code Automation | Hybrid -->
11
+
12
+ **Description:**
13
+ <!-- One-paragraph description of what this AI system does, who uses it, and what "good" looks like -->
14
+
15
+ **Critical Failure Modes:**
16
+ <!-- The 3-5 behaviors that absolutely cannot go wrong in this system -->
17
+ 1.
18
+ 2.
19
+ 3.
20
+
21
+ ---
22
+
23
+ ## 1b. Domain Context
24
+
25
+ > Researched by `gsd-domain-researcher`. Grounds the evaluation strategy in domain expert knowledge.
26
+
27
+ **Industry Vertical:** <!-- healthcare | legal | finance | customer service | education | developer tooling | e-commerce | etc. -->
28
+
29
+ **User Population:** <!-- who uses this system and in what context -->
30
+
31
+ **Stakes Level:** <!-- Low | Medium | High | Critical -->
32
+
33
+ **Output Consequence:** <!-- what happens downstream when the AI output is acted on -->
34
+
35
+ ### What Domain Experts Evaluate Against
36
+
37
+ <!-- Domain-specific rubric ingredients — in practitioner language, not AI jargon -->
38
+ <!-- Format: Dimension / Good (expert accepts) / Bad (expert flags) / Stakes / Source -->
39
+
40
+ ### Known Failure Modes in This Domain
41
+
42
+ <!-- Domain-specific failure modes from research — not generic hallucination, but how it manifests here -->
43
+
44
+ ### Regulatory / Compliance Context
45
+
46
+ <!-- Relevant regulations or constraints — or "None identified" if genuinely none apply -->
47
+
48
+ ### Domain Expert Roles for Evaluation
49
+
50
+ | Role | Responsibility |
51
+ |------|---------------|
52
+ | <!-- e.g., Senior practitioner --> | <!-- Dataset labeling / rubric calibration / production sampling --> |
53
+
54
+ ---
55
+
56
+ ## 2. Framework Decision
57
+
58
+ **Selected Framework:** <!-- e.g., LlamaIndex v0.10.x -->
59
+
60
+ **Version:** <!-- Pin the version -->
61
+
62
+ **Rationale:**
63
+ <!-- Why this framework fits this system type, team context, and production requirements -->
64
+
65
+ **Alternatives Considered:**
66
+
67
+ | Framework | Ruled Out Because |
68
+ |-----------|------------------|
69
+ | | |
70
+
71
+ **Vendor Lock-In Accepted:** <!-- Yes / No / Partial — document the trade-off consciously -->
72
+
73
+ ---
74
+
75
+ ## 3. Framework Quick Reference
76
+
77
+ > Fetched from official docs by `gsd-ai-researcher`. Distilled for this specific use case.
78
+
79
+ ### Installation
80
+ ```bash
81
+ # Install command(s)
82
+ ```
83
+
84
+ ### Core Imports
85
+ ```python
86
+ # Key imports for this use case
87
+ ```
88
+
89
+ ### Entry Point Pattern
90
+ ```python
91
+ # Minimal working example for this system type
92
+ ```
93
+
94
+ ### Key Abstractions
95
+ <!-- Framework-specific concepts the developer must understand before coding -->
96
+ | Concept | What It Is | When You Use It |
97
+ |---------|-----------|-----------------|
98
+ | | | |
99
+
100
+ ### Common Pitfalls
101
+ <!-- Gotchas specific to this framework and system type — from docs, issues, and community reports -->
102
+ 1.
103
+ 2.
104
+ 3.
105
+
106
+ ### Recommended Project Structure
107
+ ```
108
+ project/
109
+ ├── # Framework-specific folder layout
110
+ ```
111
+
112
+ ---
113
+
114
+ ## 4. Implementation Guidance
115
+
116
+ **Model Configuration:**
117
+ <!-- Which model(s), temperature, max tokens, and other key parameters -->
118
+
119
+ **Core Pattern:**
120
+ <!-- The primary implementation pattern for this system type in this framework -->
121
+
122
+ **Tool Use:**
123
+ <!-- Tools/integrations needed and how to configure them -->
124
+
125
+ **State Management:**
126
+ <!-- How state is persisted, retrieved, and updated -->
127
+
128
+ **Context Window Strategy:**
129
+ <!-- How to manage context limits for this system type -->
130
+
131
+ ---
132
+
133
+ ## 4b. AI Systems Best Practices
134
+
135
+ > Written by `gsd-ai-researcher`. Cross-cutting patterns every developer building AI systems needs — independent of framework choice.
136
+
137
+ ### Structured Outputs with Pydantic
138
+
139
+ <!-- Framework-specific Pydantic integration pattern for this use case -->
140
+ <!-- Include: output model definition, how the framework uses it, retry logic on validation failure -->
141
+
142
+ ```python
143
+ # Pydantic output model for this system type
144
+ ```
145
+
146
+ ### Async-First Design
147
+
148
+ <!-- How async is handled in this framework, the one common mistake, and when to stream vs. await -->
149
+
150
+ ### Prompt Engineering Discipline
151
+
152
+ <!-- System vs. user prompt separation, few-shot guidance, token budget strategy -->
153
+
154
+ ### Context Window Management
155
+
156
+ <!-- Strategy specific to this system type: RAG chunking / conversation summarisation / agent compaction -->
157
+
158
+ ### Cost and Latency Budget
159
+
160
+ <!-- Per-call cost estimate, caching strategy, sub-task model routing -->
161
+
162
+ ---
163
+
164
+ ## 5. Evaluation Strategy
165
+
166
+ ### Dimensions
167
+
168
+ | Dimension | Rubric (Pass/Fail or 1-5) | Measurement Approach | Priority |
169
+ |-----------|--------------------------|---------------------|----------|
170
+ | | | Code / LLM Judge / Human | Critical / High / Medium |
171
+
172
+ ### Eval Tooling
173
+
174
+ **Primary Tool:** <!-- e.g., RAGAS + Langfuse -->
175
+
176
+ **Setup:**
177
+ ```bash
178
+ # Install and configure
179
+ ```
180
+
181
+ **CI/CD Integration:**
182
+ ```bash
183
+ # Command to run evals in CI/CD pipeline
184
+ ```
185
+
186
+ ### Reference Dataset
187
+
188
+ **Size:** <!-- e.g., 20 examples to start -->
189
+
190
+ **Composition:**
191
+ <!-- What scenario types the dataset covers: critical paths, edge cases, failure modes -->
192
+
193
+ **Labeling:**
194
+ <!-- Who labels examples and how (domain expert, LLM judge with calibration, etc.) -->
195
+
196
+ ---
197
+
198
+ ## 6. Guardrails
199
+
200
+ ### Online (Real-Time)
201
+
202
+ | Guardrail | Trigger | Intervention |
203
+ |-----------|---------|--------------|
204
+ | | | Block / Escalate / Flag |
205
+
206
+ ### Offline (Flywheel)
207
+
208
+ | Metric | Sampling Strategy | Action on Degradation |
209
+ |--------|------------------|----------------------|
210
+ | | | |
211
+
212
+ ---
213
+
214
+ ## 7. Production Monitoring
215
+
216
+ **Tracing Tool:** <!-- e.g., Langfuse self-hosted -->
217
+
218
+ **Key Metrics to Track:**
219
+ <!-- 3-5 metrics that will be monitored in production -->
220
+
221
+ **Alert Thresholds:**
222
+ <!-- When to page/alert -->
223
+
224
+ **Smart Sampling Strategy:**
225
+ <!-- How to select interactions for human review — signal-based filters -->
226
+
227
+ ---
228
+
229
+ ## Checklist
230
+
231
+ - [ ] System type classified
232
+ - [ ] Critical failure modes identified (≥ 3)
233
+ - [ ] Domain context researched (Section 1b: vertical, stakes, expert criteria, failure modes)
234
+ - [ ] Regulatory/compliance context identified or explicitly noted as none
235
+ - [ ] Domain expert roles defined for evaluation involvement
236
+ - [ ] Framework selected with rationale documented
237
+ - [ ] Alternatives considered and ruled out
238
+ - [ ] Framework quick reference written (install, imports, pattern, pitfalls)
239
+ - [ ] AI systems best practices written (Section 4b: Pydantic, async, prompt discipline, context, cost/latency budget)
240
+ - [ ] Evaluation dimensions grounded in domain rubric ingredients
241
+ - [ ] Each eval dimension has a concrete rubric (Good/Bad in domain language)
242
+ - [ ] Eval tooling selected — Arize Phoenix default confirmed or override noted
243
+ - [ ] Reference dataset spec written (size ≥ 10, composition + labeling defined)
244
+ - [ ] CI/CD eval integration specified
245
+ - [ ] Online guardrails defined
246
+ - [ ] Production monitoring configured (tracing tool + sampling strategy)
@@ -20,7 +20,9 @@ updated: [ISO timestamp]
20
20
  hypothesis: [current theory being tested]
21
21
  test: [how the hypothesis is being tested]
22
22
  expecting: [what the result means if the hypothesis is true/false]
23
- next_action: [immediate next step]
23
+ next_action: [immediate next step — be specific, not "continue investigating"]
24
+ reasoning_checkpoint: null <!-- populated before every fix attempt — see structured_returns -->
25
+ tdd_checkpoint: null <!-- populated when tdd_mode is active after root cause confirmed -->
24
26
 
25
27
  ## Symptoms
26
28
  <!-- Written during gathering, then immutable -->
@@ -69,7 +71,10 @@ files_changed: []
69
71
  - OVERWRITE entirely on each update
70
72
  - Always reflects what Antigravity is doing RIGHT NOW
71
73
  - If Antigravity reads this after /clear, it knows exactly where to resume
72
- - Fields: hypothesis, test, expecting, next_action
74
+ - Fields: hypothesis, test, expecting, next_action, reasoning_checkpoint, tdd_checkpoint
75
+ - `next_action`: must be concrete and actionable — bad: "continue investigating"; good: "Add logging at line 47 of auth.js to observe token value before jwt.verify()"
76
+ - `reasoning_checkpoint`: OVERWRITE before every fix_and_verify — five-field structured reasoning record (hypothesis, confirming_evidence, falsification_test, fix_rationale, blind_spots)
77
+ - `tdd_checkpoint`: OVERWRITE during TDD red/green phases — test file, test name, status, failure output
73
78
 
74
79
  **Symptoms:**
75
80
  - Written during initial gathering phase
@@ -1,48 +1,56 @@
1
- {
2
- "mode": "interactive",
3
- "granularity": "standard",
4
- "workflow": {
5
- "research": true,
6
- "plan_check": true,
7
- "verifier": true,
8
- "auto_advance": false,
9
- "nyquist_validation": true,
10
- "security_enforcement": true,
11
- "security_asvs_level": 1,
12
- "security_block_on": "high",
13
- "discuss_mode": "discuss",
14
- "research_before_questions": false
15
- },
16
- "planning": {
17
- "commit_docs": true,
18
- "search_gitignored": false,
19
- "sub_repos": []
20
- },
21
- "parallelization": {
22
- "enabled": true,
23
- "plan_level": true,
24
- "task_level": false,
25
- "skip_checkpoints": true,
26
- "max_concurrent_agents": 3,
27
- "min_plans_for_parallel": 2
28
- },
29
- "gates": {
30
- "confirm_project": true,
31
- "confirm_phases": true,
32
- "confirm_roadmap": true,
33
- "confirm_breakdown": true,
34
- "confirm_plan": true,
35
- "execute_next_plan": true,
36
- "issues_review": true,
37
- "confirm_transition": true
38
- },
39
- "safety": {
40
- "always_confirm_destructive": true,
41
- "always_confirm_external_services": true
42
- },
43
- "hooks": {
44
- "context_warnings": true
45
- },
46
- "project_code": null,
47
- "agent_skills": {}
48
- }
1
+ {
2
+ "mode": "interactive",
3
+ "granularity": "standard",
4
+ "workflow": {
5
+ "research": true,
6
+ "plan_check": true,
7
+ "verifier": true,
8
+ "auto_advance": false,
9
+ "nyquist_validation": true,
10
+ "security_enforcement": true,
11
+ "security_asvs_level": 1,
12
+ "security_block_on": "high",
13
+ "discuss_mode": "discuss",
14
+ "research_before_questions": false,
15
+ "code_review_command": null,
16
+ "plan_bounce": false,
17
+ "plan_bounce_script": null,
18
+ "plan_bounce_passes": 2,
19
+ "cross_ai_execution": false,
20
+ "cross_ai_command": "",
21
+ "cross_ai_timeout": 300
22
+ },
23
+ "planning": {
24
+ "commit_docs": true,
25
+ "search_gitignored": false,
26
+ "sub_repos": []
27
+ },
28
+ "parallelization": {
29
+ "enabled": true,
30
+ "plan_level": true,
31
+ "task_level": false,
32
+ "skip_checkpoints": true,
33
+ "max_concurrent_agents": 3,
34
+ "min_plans_for_parallel": 2
35
+ },
36
+ "gates": {
37
+ "confirm_project": true,
38
+ "confirm_phases": true,
39
+ "confirm_roadmap": true,
40
+ "confirm_breakdown": true,
41
+ "confirm_plan": true,
42
+ "execute_next_plan": true,
43
+ "issues_review": true,
44
+ "confirm_transition": true
45
+ },
46
+ "safety": {
47
+ "always_confirm_destructive": true,
48
+ "always_confirm_external_services": true
49
+ },
50
+ "hooks": {
51
+ "context_warnings": true
52
+ },
53
+ "project_code": null,
54
+ "agent_skills": {},
55
+ "antigravity_md_path": "./ANTIGRAVITY.md"
56
+ }
@@ -38,6 +38,18 @@ Template for `.planning/phases/XX-name/{phase_num}-RESEARCH.md` - comprehensive
38
38
  **If no CONTEXT.md exists:** Write "No user constraints - all decisions at Antigravity's discretion"
39
39
  </user_constraints>
40
40
 
41
+ <architectural_responsibility_map>
42
+ ## Architectural Responsibility Map
43
+
44
+ Map each phase capability to its standard architectural tier owner before diving into framework research. This prevents tier misassignment from propagating into plans.
45
+
46
+ | Capability | Primary Tier | Secondary Tier | Rationale |
47
+ |------------|-------------|----------------|-----------|
48
+ | [capability from phase description] | [Browser/Client, Frontend Server, API/Backend, CDN/Static, or Database/Storage] | [secondary tier or —] | [why this tier owns it] |
49
+
50
+ **If single-tier application:** Write "Single-tier application — all capabilities reside in [tier]" and omit the table.
51
+ </architectural_responsibility_map>
52
+
41
53
  <research_summary>
42
54
  ## Summary
43
55
 
@@ -82,6 +94,20 @@ yarn add [packages]
82
94
  <architecture_patterns>
83
95
  ## Architecture Patterns
84
96
 
97
+ ### System Architecture Diagram
98
+
99
+ Architecture diagrams MUST show data flow through conceptual components, not file listings.
100
+
101
+ Requirements:
102
+ - Show entry points (how data/requests enter the system)
103
+ - Show processing stages (what transformations happen, in what order)
104
+ - Show decision points and branching paths
105
+ - Show external dependencies and service boundaries
106
+ - Use arrows to indicate data flow direction
107
+ - A reader should be able to trace the primary use case from input to output by following the arrows
108
+
109
+ File-to-implementation mapping belongs in the Component Responsibilities table, not in the diagram.
110
+
85
111
  ### Recommended Project Structure
86
112
  ```
87
113
  src/
@@ -300,6 +326,20 @@ npm install three @react-three/fiber @react-three/drei @react-three/rapier zusta
300
326
  <architecture_patterns>
301
327
  ## Architecture Patterns
302
328
 
329
+ ### System Architecture Diagram
330
+
331
+ Architecture diagrams MUST show data flow through conceptual components, not file listings.
332
+
333
+ Requirements:
334
+ - Show entry points (how data/requests enter the system)
335
+ - Show processing stages (what transformations happen, in what order)
336
+ - Show decision points and branching paths
337
+ - Show external dependencies and service boundaries
338
+ - Use arrows to indicate data flow direction
339
+ - A reader should be able to trace the primary use case from input to output by following the arrows
340
+
341
+ File-to-implementation mapping belongs in the Component Responsibilities table, not in the diagram.
342
+
303
343
  ### Recommended Project Structure
304
344
  ```
305
345
  src/