gsd-trae 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (763) hide show
  1. package/.claude/settings.local.json +8 -0
  2. package/.gitmodules +6 -0
  3. package/.trae/project_rules.md +56 -0
  4. package/.trae/rules/project_rules.md +56 -0
  5. package/.vscode/code-counter/code-counter.db +0 -0
  6. package/.vscode/settings.json +5 -0
  7. package/README.md +193 -0
  8. package/bin/cli.js +13 -0
  9. package/install.sh +77 -0
  10. package/package.json +29 -0
  11. package/refs/gsd/.github/CODEOWNERS +2 -0
  12. package/refs/gsd/.github/FUNDING.yml +1 -0
  13. package/refs/gsd/.github/ISSUE_TEMPLATE/bug_report.yml +59 -0
  14. package/refs/gsd/.github/ISSUE_TEMPLATE/feature_request.yml +37 -0
  15. package/refs/gsd/.github/pull_request_template.md +24 -0
  16. package/refs/gsd/.github/workflows/auto-label-issues.yml +21 -0
  17. package/refs/gsd/CHANGELOG.md +1520 -0
  18. package/refs/gsd/LICENSE +21 -0
  19. package/refs/gsd/README.md +704 -0
  20. package/refs/gsd/SECURITY.md +33 -0
  21. package/refs/gsd/agents/gsd-codebase-mapper.md +764 -0
  22. package/refs/gsd/agents/gsd-debugger.md +1246 -0
  23. package/refs/gsd/agents/gsd-executor.md +469 -0
  24. package/refs/gsd/agents/gsd-integration-checker.md +443 -0
  25. package/refs/gsd/agents/gsd-phase-researcher.md +546 -0
  26. package/refs/gsd/agents/gsd-plan-checker.md +690 -0
  27. package/refs/gsd/agents/gsd-planner.md +1275 -0
  28. package/refs/gsd/agents/gsd-project-researcher.md +621 -0
  29. package/refs/gsd/agents/gsd-research-synthesizer.md +239 -0
  30. package/refs/gsd/agents/gsd-roadmapper.md +642 -0
  31. package/refs/gsd/agents/gsd-verifier.md +573 -0
  32. package/refs/gsd/assets/gsd-logo-2000-transparent.png +0 -0
  33. package/refs/gsd/assets/gsd-logo-2000-transparent.svg +17 -0
  34. package/refs/gsd/assets/gsd-logo-2000.png +0 -0
  35. package/refs/gsd/assets/gsd-logo-2000.svg +21 -0
  36. package/refs/gsd/assets/terminal.svg +68 -0
  37. package/refs/gsd/bin/install.js +2090 -0
  38. package/refs/gsd/commands/gsd/add-phase.md +43 -0
  39. package/refs/gsd/commands/gsd/add-tests.md +41 -0
  40. package/refs/gsd/commands/gsd/add-todo.md +47 -0
  41. package/refs/gsd/commands/gsd/audit-milestone.md +36 -0
  42. package/refs/gsd/commands/gsd/check-todos.md +45 -0
  43. package/refs/gsd/commands/gsd/cleanup.md +18 -0
  44. package/refs/gsd/commands/gsd/complete-milestone.md +136 -0
  45. package/refs/gsd/commands/gsd/debug.md +167 -0
  46. package/refs/gsd/commands/gsd/discuss-phase.md +83 -0
  47. package/refs/gsd/commands/gsd/execute-phase.md +41 -0
  48. package/refs/gsd/commands/gsd/health.md +22 -0
  49. package/refs/gsd/commands/gsd/help.md +22 -0
  50. package/refs/gsd/commands/gsd/insert-phase.md +32 -0
  51. package/refs/gsd/commands/gsd/join-discord.md +18 -0
  52. package/refs/gsd/commands/gsd/list-phase-assumptions.md +46 -0
  53. package/refs/gsd/commands/gsd/map-codebase.md +71 -0
  54. package/refs/gsd/commands/gsd/new-milestone.md +44 -0
  55. package/refs/gsd/commands/gsd/new-project.md +42 -0
  56. package/refs/gsd/commands/gsd/new-project.md.bak +1041 -0
  57. package/refs/gsd/commands/gsd/pause-work.md +38 -0
  58. package/refs/gsd/commands/gsd/plan-milestone-gaps.md +34 -0
  59. package/refs/gsd/commands/gsd/plan-phase.md +45 -0
  60. package/refs/gsd/commands/gsd/progress.md +24 -0
  61. package/refs/gsd/commands/gsd/quick.md +41 -0
  62. package/refs/gsd/commands/gsd/reapply-patches.md +110 -0
  63. package/refs/gsd/commands/gsd/remove-phase.md +31 -0
  64. package/refs/gsd/commands/gsd/research-phase.md +189 -0
  65. package/refs/gsd/commands/gsd/resume-work.md +40 -0
  66. package/refs/gsd/commands/gsd/set-profile.md +34 -0
  67. package/refs/gsd/commands/gsd/settings.md +36 -0
  68. package/refs/gsd/commands/gsd/update.md +37 -0
  69. package/refs/gsd/commands/gsd/verify-work.md +38 -0
  70. package/refs/gsd/docs/USER-GUIDE.md +471 -0
  71. package/refs/gsd/docs/context-monitor.md +96 -0
  72. package/refs/gsd/get-shit-done/bin/gsd-tools.cjs +585 -0
  73. package/refs/gsd/get-shit-done/bin/lib/commands.cjs +553 -0
  74. package/refs/gsd/get-shit-done/bin/lib/config.cjs +162 -0
  75. package/refs/gsd/get-shit-done/bin/lib/core.cjs +411 -0
  76. package/refs/gsd/get-shit-done/bin/lib/frontmatter.cjs +299 -0
  77. package/refs/gsd/get-shit-done/bin/lib/init.cjs +710 -0
  78. package/refs/gsd/get-shit-done/bin/lib/milestone.cjs +215 -0
  79. package/refs/gsd/get-shit-done/bin/lib/phase.cjs +870 -0
  80. package/refs/gsd/get-shit-done/bin/lib/roadmap.cjs +298 -0
  81. package/refs/gsd/get-shit-done/bin/lib/state.cjs +521 -0
  82. package/refs/gsd/get-shit-done/bin/lib/template.cjs +222 -0
  83. package/refs/gsd/get-shit-done/bin/lib/verify.cjs +772 -0
  84. package/refs/gsd/get-shit-done/references/checkpoints.md +776 -0
  85. package/refs/gsd/get-shit-done/references/continuation-format.md +249 -0
  86. package/refs/gsd/get-shit-done/references/decimal-phase-calculation.md +65 -0
  87. package/refs/gsd/get-shit-done/references/git-integration.md +248 -0
  88. package/refs/gsd/get-shit-done/references/git-planning-commit.md +38 -0
  89. package/refs/gsd/get-shit-done/references/model-profile-resolution.md +34 -0
  90. package/refs/gsd/get-shit-done/references/model-profiles.md +92 -0
  91. package/refs/gsd/get-shit-done/references/phase-argument-parsing.md +61 -0
  92. package/refs/gsd/get-shit-done/references/planning-config.md +196 -0
  93. package/refs/gsd/get-shit-done/references/questioning.md +145 -0
  94. package/refs/gsd/get-shit-done/references/tdd.md +263 -0
  95. package/refs/gsd/get-shit-done/references/ui-brand.md +160 -0
  96. package/refs/gsd/get-shit-done/references/verification-patterns.md +612 -0
  97. package/refs/gsd/get-shit-done/templates/DEBUG.md +164 -0
  98. package/refs/gsd/get-shit-done/templates/UAT.md +247 -0
  99. package/refs/gsd/get-shit-done/templates/VALIDATION.md +76 -0
  100. package/refs/gsd/get-shit-done/templates/codebase/architecture.md +255 -0
  101. package/refs/gsd/get-shit-done/templates/codebase/concerns.md +310 -0
  102. package/refs/gsd/get-shit-done/templates/codebase/conventions.md +307 -0
  103. package/refs/gsd/get-shit-done/templates/codebase/integrations.md +280 -0
  104. package/refs/gsd/get-shit-done/templates/codebase/stack.md +186 -0
  105. package/refs/gsd/get-shit-done/templates/codebase/structure.md +285 -0
  106. package/refs/gsd/get-shit-done/templates/codebase/testing.md +480 -0
  107. package/refs/gsd/get-shit-done/templates/config.json +37 -0
  108. package/refs/gsd/get-shit-done/templates/context.md +283 -0
  109. package/refs/gsd/get-shit-done/templates/continue-here.md +78 -0
  110. package/refs/gsd/get-shit-done/templates/debug-subagent-prompt.md +91 -0
  111. package/refs/gsd/get-shit-done/templates/discovery.md +146 -0
  112. package/refs/gsd/get-shit-done/templates/milestone-archive.md +123 -0
  113. package/refs/gsd/get-shit-done/templates/milestone.md +115 -0
  114. package/refs/gsd/get-shit-done/templates/phase-prompt.md +569 -0
  115. package/refs/gsd/get-shit-done/templates/planner-subagent-prompt.md +117 -0
  116. package/refs/gsd/get-shit-done/templates/project.md +184 -0
  117. package/refs/gsd/get-shit-done/templates/requirements.md +231 -0
  118. package/refs/gsd/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -0
  119. package/refs/gsd/get-shit-done/templates/research-project/FEATURES.md +147 -0
  120. package/refs/gsd/get-shit-done/templates/research-project/PITFALLS.md +200 -0
  121. package/refs/gsd/get-shit-done/templates/research-project/STACK.md +120 -0
  122. package/refs/gsd/get-shit-done/templates/research-project/SUMMARY.md +170 -0
  123. package/refs/gsd/get-shit-done/templates/research.md +552 -0
  124. package/refs/gsd/get-shit-done/templates/retrospective.md +54 -0
  125. package/refs/gsd/get-shit-done/templates/roadmap.md +202 -0
  126. package/refs/gsd/get-shit-done/templates/state.md +176 -0
  127. package/refs/gsd/get-shit-done/templates/summary-complex.md +59 -0
  128. package/refs/gsd/get-shit-done/templates/summary-minimal.md +41 -0
  129. package/refs/gsd/get-shit-done/templates/summary-standard.md +48 -0
  130. package/refs/gsd/get-shit-done/templates/summary.md +248 -0
  131. package/refs/gsd/get-shit-done/templates/user-setup.md +311 -0
  132. package/refs/gsd/get-shit-done/templates/verification-report.md +322 -0
  133. package/refs/gsd/get-shit-done/workflows/add-phase.md +111 -0
  134. package/refs/gsd/get-shit-done/workflows/add-tests.md +350 -0
  135. package/refs/gsd/get-shit-done/workflows/add-todo.md +157 -0
  136. package/refs/gsd/get-shit-done/workflows/audit-milestone.md +297 -0
  137. package/refs/gsd/get-shit-done/workflows/check-todos.md +176 -0
  138. package/refs/gsd/get-shit-done/workflows/cleanup.md +152 -0
  139. package/refs/gsd/get-shit-done/workflows/complete-milestone.md +763 -0
  140. package/refs/gsd/get-shit-done/workflows/diagnose-issues.md +219 -0
  141. package/refs/gsd/get-shit-done/workflows/discovery-phase.md +289 -0
  142. package/refs/gsd/get-shit-done/workflows/discuss-phase.md +542 -0
  143. package/refs/gsd/get-shit-done/workflows/execute-phase.md +449 -0
  144. package/refs/gsd/get-shit-done/workflows/execute-plan.md +448 -0
  145. package/refs/gsd/get-shit-done/workflows/health.md +156 -0
  146. package/refs/gsd/get-shit-done/workflows/help.md +489 -0
  147. package/refs/gsd/get-shit-done/workflows/insert-phase.md +129 -0
  148. package/refs/gsd/get-shit-done/workflows/list-phase-assumptions.md +178 -0
  149. package/refs/gsd/get-shit-done/workflows/map-codebase.md +315 -0
  150. package/refs/gsd/get-shit-done/workflows/new-milestone.md +382 -0
  151. package/refs/gsd/get-shit-done/workflows/new-project.md +1116 -0
  152. package/refs/gsd/get-shit-done/workflows/pause-work.md +122 -0
  153. package/refs/gsd/get-shit-done/workflows/plan-milestone-gaps.md +274 -0
  154. package/refs/gsd/get-shit-done/workflows/plan-phase.md +569 -0
  155. package/refs/gsd/get-shit-done/workflows/progress.md +381 -0
  156. package/refs/gsd/get-shit-done/workflows/quick.md +453 -0
  157. package/refs/gsd/get-shit-done/workflows/remove-phase.md +154 -0
  158. package/refs/gsd/get-shit-done/workflows/research-phase.md +73 -0
  159. package/refs/gsd/get-shit-done/workflows/resume-project.md +306 -0
  160. package/refs/gsd/get-shit-done/workflows/set-profile.md +80 -0
  161. package/refs/gsd/get-shit-done/workflows/settings.md +213 -0
  162. package/refs/gsd/get-shit-done/workflows/transition.md +544 -0
  163. package/refs/gsd/get-shit-done/workflows/update.md +219 -0
  164. package/refs/gsd/get-shit-done/workflows/verify-phase.md +242 -0
  165. package/refs/gsd/get-shit-done/workflows/verify-work.md +569 -0
  166. package/refs/gsd/hooks/gsd-check-update.js +62 -0
  167. package/refs/gsd/hooks/gsd-context-monitor.js +122 -0
  168. package/refs/gsd/hooks/gsd-statusline.js +108 -0
  169. package/refs/gsd/package.json +50 -0
  170. package/refs/gsd/scripts/build-hooks.js +43 -0
  171. package/refs/gsd/tests/commands.test.cjs +661 -0
  172. package/refs/gsd/tests/helpers.cjs +40 -0
  173. package/refs/gsd/tests/init.test.cjs +205 -0
  174. package/refs/gsd/tests/milestone.test.cjs +98 -0
  175. package/refs/gsd/tests/phase.test.cjs +1241 -0
  176. package/refs/gsd/tests/roadmap.test.cjs +265 -0
  177. package/refs/gsd/tests/state.test.cjs +302 -0
  178. package/refs/gsd/tests/verify.test.cjs +80 -0
  179. package/refs/vbenchmark/.agent/agents/codebase-explorer.md +224 -0
  180. package/refs/vbenchmark/.agent/agents/debugger.md +180 -0
  181. package/refs/vbenchmark/.agent/agents/documenter.md +166 -0
  182. package/refs/vbenchmark/.agent/agents/implementer.md +70 -0
  183. package/refs/vbenchmark/.agent/agents/orchestrator.md +212 -0
  184. package/refs/vbenchmark/.agent/agents/researcher.md +80 -0
  185. package/refs/vbenchmark/.agent/agents/reviewer.md +184 -0
  186. package/refs/vbenchmark/.agent/agents/tester.md +170 -0
  187. package/refs/vbenchmark/.agent/commands/commit.md +29 -0
  188. package/refs/vbenchmark/.agent/commands/debug.md +59 -0
  189. package/refs/vbenchmark/.agent/commands/document.md +52 -0
  190. package/refs/vbenchmark/.agent/commands/gather-context.md +58 -0
  191. package/refs/vbenchmark/.agent/commands/init.md +56 -0
  192. package/refs/vbenchmark/.agent/commands/preset-help.md +50 -0
  193. package/refs/vbenchmark/.agent/commands/refactor.md +71 -0
  194. package/refs/vbenchmark/.agent/commands/research.md +37 -0
  195. package/refs/vbenchmark/.agent/commands/review.md +38 -0
  196. package/refs/vbenchmark/.agent/commands/test.md +61 -0
  197. package/refs/vbenchmark/.agent/rules/01-code-quality.md +33 -0
  198. package/refs/vbenchmark/.agent/rules/02-typescript-go.md +46 -0
  199. package/refs/vbenchmark/.agent/rules/03-security-git.md +34 -0
  200. package/refs/vbenchmark/.agent/rules/04-architecture.md +40 -0
  201. package/refs/vbenchmark/.agent/sync.js +536 -0
  202. package/refs/vbenchmark/.agent/workflows/commit.md +29 -0
  203. package/refs/vbenchmark/.agent/workflows/debug.md +59 -0
  204. package/refs/vbenchmark/.agent/workflows/document.md +52 -0
  205. package/refs/vbenchmark/.agent/workflows/gather-context.md +58 -0
  206. package/refs/vbenchmark/.agent/workflows/init.md +56 -0
  207. package/refs/vbenchmark/.agent/workflows/preset-help.md +50 -0
  208. package/refs/vbenchmark/.agent/workflows/refactor.md +71 -0
  209. package/refs/vbenchmark/.agent/workflows/research.md +37 -0
  210. package/refs/vbenchmark/.agent/workflows/review.md +38 -0
  211. package/refs/vbenchmark/.agent/workflows/test.md +61 -0
  212. package/refs/vbenchmark/.claude/commands/agentic-dev/apply.md +222 -0
  213. package/refs/vbenchmark/.claude/commands/agentic-dev/done.md +166 -0
  214. package/refs/vbenchmark/.claude/commands/agentic-dev/proposal.md +220 -0
  215. package/refs/vbenchmark/.claude/commands/openspec/apply.md +23 -0
  216. package/refs/vbenchmark/.claude/commands/openspec/archive.md +27 -0
  217. package/refs/vbenchmark/.claude/commands/openspec/proposal.md +28 -0
  218. package/refs/vbenchmark/.clinerules/01-rules.md +73 -0
  219. package/refs/vbenchmark/.clinerules/02-agents.md +34 -0
  220. package/refs/vbenchmark/.cursor/commands/commit.md +29 -0
  221. package/refs/vbenchmark/.cursor/commands/debug.md +59 -0
  222. package/refs/vbenchmark/.cursor/commands/document.md +52 -0
  223. package/refs/vbenchmark/.cursor/commands/gather-context.md +58 -0
  224. package/refs/vbenchmark/.cursor/commands/init.md +56 -0
  225. package/refs/vbenchmark/.cursor/commands/preset-help.md +50 -0
  226. package/refs/vbenchmark/.cursor/commands/refactor.md +71 -0
  227. package/refs/vbenchmark/.cursor/commands/research.md +37 -0
  228. package/refs/vbenchmark/.cursor/commands/review.md +38 -0
  229. package/refs/vbenchmark/.cursor/commands/test.md +61 -0
  230. package/refs/vbenchmark/.cursor/rules/agents.mdc +1357 -0
  231. package/refs/vbenchmark/.factory/droids/codebase-explorer.md +224 -0
  232. package/refs/vbenchmark/.factory/droids/debugger.md +180 -0
  233. package/refs/vbenchmark/.factory/droids/documenter.md +166 -0
  234. package/refs/vbenchmark/.factory/droids/implementer.md +70 -0
  235. package/refs/vbenchmark/.factory/droids/orchestrator.md +212 -0
  236. package/refs/vbenchmark/.factory/droids/researcher.md +80 -0
  237. package/refs/vbenchmark/.factory/droids/reviewer.md +184 -0
  238. package/refs/vbenchmark/.factory/droids/tester.md +170 -0
  239. package/refs/vbenchmark/.gemini/workflows/commit.md +29 -0
  240. package/refs/vbenchmark/.gemini/workflows/debug.md +59 -0
  241. package/refs/vbenchmark/.gemini/workflows/document.md +52 -0
  242. package/refs/vbenchmark/.gemini/workflows/gather-context.md +58 -0
  243. package/refs/vbenchmark/.gemini/workflows/init.md +56 -0
  244. package/refs/vbenchmark/.gemini/workflows/preset-help.md +50 -0
  245. package/refs/vbenchmark/.gemini/workflows/refactor.md +71 -0
  246. package/refs/vbenchmark/.gemini/workflows/research.md +37 -0
  247. package/refs/vbenchmark/.gemini/workflows/review.md +38 -0
  248. package/refs/vbenchmark/.gemini/workflows/test.md +61 -0
  249. package/refs/vbenchmark/.github/CODEOWNERS +20 -0
  250. package/refs/vbenchmark/.github/FUNDING.yml +4 -0
  251. package/refs/vbenchmark/.github/ISSUE_TEMPLATE/bug-report.yml +76 -0
  252. package/refs/vbenchmark/.github/ISSUE_TEMPLATE/new-task.yml +106 -0
  253. package/refs/vbenchmark/.github/PULL_REQUEST_TEMPLATE.md +38 -0
  254. package/refs/vbenchmark/.github/copilot-instructions.md +73 -0
  255. package/refs/vbenchmark/.github/workflows/ci.yaml +33 -0
  256. package/refs/vbenchmark/.github/workflows/vercel-auto-pr.yml +478 -0
  257. package/refs/vbenchmark/.github/workflows/vercel-deploy.yaml +487 -0
  258. package/refs/vbenchmark/.github/workflows/vercel-pr-command.yaml +337 -0
  259. package/refs/vbenchmark/.github/workflows/vercel-project-init.yaml +208 -0
  260. package/refs/vbenchmark/.opencode/agent/codebase-explorer.md +224 -0
  261. package/refs/vbenchmark/.opencode/agent/debugger.md +180 -0
  262. package/refs/vbenchmark/.opencode/agent/documenter.md +166 -0
  263. package/refs/vbenchmark/.opencode/agent/implementer.md +70 -0
  264. package/refs/vbenchmark/.opencode/agent/orchestrator.md +212 -0
  265. package/refs/vbenchmark/.opencode/agent/researcher.md +80 -0
  266. package/refs/vbenchmark/.opencode/agent/reviewer.md +184 -0
  267. package/refs/vbenchmark/.opencode/agent/tester.md +170 -0
  268. package/refs/vbenchmark/.opencode/command/commit.md +29 -0
  269. package/refs/vbenchmark/.opencode/command/debug.md +59 -0
  270. package/refs/vbenchmark/.opencode/command/document.md +52 -0
  271. package/refs/vbenchmark/.opencode/command/gather-context.md +58 -0
  272. package/refs/vbenchmark/.opencode/command/init.md +56 -0
  273. package/refs/vbenchmark/.opencode/command/preset-help.md +50 -0
  274. package/refs/vbenchmark/.opencode/command/refactor.md +71 -0
  275. package/refs/vbenchmark/.opencode/command/research.md +37 -0
  276. package/refs/vbenchmark/.opencode/command/review.md +38 -0
  277. package/refs/vbenchmark/.opencode/command/test.md +61 -0
  278. package/refs/vbenchmark/.trae/project_rules.md +73 -0
  279. package/refs/vbenchmark/.windsurf/rules/rules.md +85 -0
  280. package/refs/vbenchmark/AGENTS.md +73 -0
  281. package/refs/vbenchmark/CONTRIBUTING.md +332 -0
  282. package/refs/vbenchmark/Caddyfile +3 -0
  283. package/refs/vbenchmark/LICENSE +47 -0
  284. package/refs/vbenchmark/README.md +354 -0
  285. package/refs/vbenchmark/docker-compose.prod.yaml +35 -0
  286. package/refs/vbenchmark/docker-compose.yaml +53 -0
  287. package/refs/vbenchmark/docs/TASK_EXPANSION_PLAN.md +211 -0
  288. package/refs/vbenchmark/docs/THESIS.md +441 -0
  289. package/refs/vbenchmark/docs/categories/code-evolution.md +138 -0
  290. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/design.md +111 -0
  291. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/proposal.md +15 -0
  292. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/evaluation/spec.md +105 -0
  293. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/leaderboard/spec.md +68 -0
  294. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/task-definition/spec.md +45 -0
  295. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/task-runner/spec.md +49 -0
  296. package/refs/vbenchmark/openspec/changes/init-vibecodingbench/tasks.md +413 -0
  297. package/refs/vbenchmark/package.json +51 -0
  298. package/refs/vbenchmark/packages/cli/eslint.config.js +16 -0
  299. package/refs/vbenchmark/packages/cli/package.json +35 -0
  300. package/refs/vbenchmark/packages/cli/src/agents/index.ts +655 -0
  301. package/refs/vbenchmark/packages/cli/src/commands/eval.ts +197 -0
  302. package/refs/vbenchmark/packages/cli/src/commands/list.ts +63 -0
  303. package/refs/vbenchmark/packages/cli/src/commands/run.ts +147 -0
  304. package/refs/vbenchmark/packages/cli/src/evaluator.ts +125 -0
  305. package/refs/vbenchmark/packages/cli/src/index.ts +21 -0
  306. package/refs/vbenchmark/packages/cli/src/lib/task-variation.ts +153 -0
  307. package/refs/vbenchmark/packages/cli/src/loader.ts +258 -0
  308. package/refs/vbenchmark/packages/cli/src/reporter.ts +222 -0
  309. package/refs/vbenchmark/packages/cli/src/runtime/docker.ts +385 -0
  310. package/refs/vbenchmark/packages/cli/tsconfig.json +8 -0
  311. package/refs/vbenchmark/packages/dashboard/Dockerfile +42 -0
  312. package/refs/vbenchmark/packages/dashboard/index.html +21 -0
  313. package/refs/vbenchmark/packages/dashboard/package.json +29 -0
  314. package/refs/vbenchmark/packages/dashboard/postcss.config.js +6 -0
  315. package/refs/vbenchmark/packages/dashboard/public/favicon.svg +24 -0
  316. package/refs/vbenchmark/packages/dashboard/public/logo.png +0 -0
  317. package/refs/vbenchmark/packages/dashboard/public/logo.svg +39 -0
  318. package/refs/vbenchmark/packages/dashboard/src/App.tsx +1468 -0
  319. package/refs/vbenchmark/packages/dashboard/src/data/category-performance.json +1 -0
  320. package/refs/vbenchmark/packages/dashboard/src/data/leaderboard.json +1 -0
  321. package/refs/vbenchmark/packages/dashboard/src/data/task-results.json +1 -0
  322. package/refs/vbenchmark/packages/dashboard/src/data/tasks.json +1 -0
  323. package/refs/vbenchmark/packages/dashboard/src/index.css +3 -0
  324. package/refs/vbenchmark/packages/dashboard/src/main.tsx +13 -0
  325. package/refs/vbenchmark/packages/dashboard/src/vite-env.d.ts +9 -0
  326. package/refs/vbenchmark/packages/dashboard/tailwind.config.js +11 -0
  327. package/refs/vbenchmark/packages/dashboard/tsconfig.json +21 -0
  328. package/refs/vbenchmark/packages/dashboard/tsconfig.node.json +11 -0
  329. package/refs/vbenchmark/packages/dashboard/vercel.json +6 -0
  330. package/refs/vbenchmark/packages/dashboard/vite.config.ts +28 -0
  331. package/refs/vbenchmark/packages/evaluator/eslint.config.js +16 -0
  332. package/refs/vbenchmark/packages/evaluator/package.json +24 -0
  333. package/refs/vbenchmark/packages/evaluator/src/index.ts +15 -0
  334. package/refs/vbenchmark/packages/evaluator/src/runners/functional.ts +88 -0
  335. package/refs/vbenchmark/packages/evaluator/src/runners/quality.ts +140 -0
  336. package/refs/vbenchmark/packages/evaluator/src/runners/security.ts +94 -0
  337. package/refs/vbenchmark/packages/evaluator/src/runners/visual.ts +108 -0
  338. package/refs/vbenchmark/packages/evaluator/src/types.d.ts +19 -0
  339. package/refs/vbenchmark/packages/evaluator/tsconfig.json +8 -0
  340. package/refs/vbenchmark/packages/leaderboard/Dockerfile +38 -0
  341. package/refs/vbenchmark/packages/leaderboard/drizzle.config.ts +10 -0
  342. package/refs/vbenchmark/packages/leaderboard/eslint.config.js +16 -0
  343. package/refs/vbenchmark/packages/leaderboard/fly.toml +29 -0
  344. package/refs/vbenchmark/packages/leaderboard/package.json +36 -0
  345. package/refs/vbenchmark/packages/leaderboard/src/app.ts +29 -0
  346. package/refs/vbenchmark/packages/leaderboard/src/components/BrowserPreview.tsx +190 -0
  347. package/refs/vbenchmark/packages/leaderboard/src/components/ComparisonView.tsx +205 -0
  348. package/refs/vbenchmark/packages/leaderboard/src/components/LeaderboardTable.tsx +150 -0
  349. package/refs/vbenchmark/packages/leaderboard/src/components/LiveRunCard.tsx +133 -0
  350. package/refs/vbenchmark/packages/leaderboard/src/components/SubmissionForm.tsx +406 -0
  351. package/refs/vbenchmark/packages/leaderboard/src/components/SubmitForm.tsx +293 -0
  352. package/refs/vbenchmark/packages/leaderboard/src/components/TerminalStream.tsx +111 -0
  353. package/refs/vbenchmark/packages/leaderboard/src/config/pricing.ts +206 -0
  354. package/refs/vbenchmark/packages/leaderboard/src/db/index.ts +31 -0
  355. package/refs/vbenchmark/packages/leaderboard/src/db/schema.ts +125 -0
  356. package/refs/vbenchmark/packages/leaderboard/src/index.ts +13 -0
  357. package/refs/vbenchmark/packages/leaderboard/src/lib/websocket.ts +124 -0
  358. package/refs/vbenchmark/packages/leaderboard/src/routes/leaderboard.ts +698 -0
  359. package/refs/vbenchmark/packages/leaderboard/src/routes/live.ts +175 -0
  360. package/refs/vbenchmark/packages/leaderboard/src/routes/submissions.ts +183 -0
  361. package/refs/vbenchmark/packages/leaderboard/src/routes/tasks.ts +215 -0
  362. package/refs/vbenchmark/packages/leaderboard/tests/api.test.ts +228 -0
  363. package/refs/vbenchmark/packages/leaderboard/tsconfig.json +9 -0
  364. package/refs/vbenchmark/scripts/deploy.sh +70 -0
  365. package/refs/vbenchmark/tasks/ai-integration/advanced/context-management/PROMPT.md +15 -0
  366. package/refs/vbenchmark/tasks/ai-integration/advanced/context-management/task.yaml +16 -0
  367. package/refs/vbenchmark/tasks/ai-integration/advanced/evaluation-framework/PROMPT.md +15 -0
  368. package/refs/vbenchmark/tasks/ai-integration/advanced/evaluation-framework/task.yaml +16 -0
  369. package/refs/vbenchmark/tasks/ai-integration/advanced/guardrails-safety/PROMPT.md +15 -0
  370. package/refs/vbenchmark/tasks/ai-integration/advanced/guardrails-safety/task.yaml +16 -0
  371. package/refs/vbenchmark/tasks/ai-integration/advanced/memory-system/PROMPT.md +15 -0
  372. package/refs/vbenchmark/tasks/ai-integration/advanced/memory-system/task.yaml +16 -0
  373. package/refs/vbenchmark/tasks/ai-integration/advanced/model-routing/PROMPT.md +15 -0
  374. package/refs/vbenchmark/tasks/ai-integration/advanced/model-routing/task.yaml +16 -0
  375. package/refs/vbenchmark/tasks/ai-integration/advanced/multi-agent-system/PROMPT.md +15 -0
  376. package/refs/vbenchmark/tasks/ai-integration/advanced/multi-agent-system/task.yaml +16 -0
  377. package/refs/vbenchmark/tasks/ai-integration/advanced/prompt-optimization/PROMPT.md +15 -0
  378. package/refs/vbenchmark/tasks/ai-integration/advanced/prompt-optimization/task.yaml +16 -0
  379. package/refs/vbenchmark/tasks/ai-integration/advanced/reasoning-chain/PROMPT.md +15 -0
  380. package/refs/vbenchmark/tasks/ai-integration/advanced/reasoning-chain/task.yaml +16 -0
  381. package/refs/vbenchmark/tasks/ai-integration/advanced/streaming-pipeline/PROMPT.md +15 -0
  382. package/refs/vbenchmark/tasks/ai-integration/advanced/streaming-pipeline/task.yaml +16 -0
  383. package/refs/vbenchmark/tasks/ai-integration/advanced/tool-use-orchestration/PROMPT.md +15 -0
  384. package/refs/vbenchmark/tasks/ai-integration/advanced/tool-use-orchestration/task.yaml +16 -0
  385. package/refs/vbenchmark/tasks/ai-integration/agents/code-review-agent/PROMPT.md +64 -0
  386. package/refs/vbenchmark/tasks/ai-integration/agents/code-review-agent/task.yaml +24 -0
  387. package/refs/vbenchmark/tasks/ai-integration/agents/research-agent/PROMPT.md +61 -0
  388. package/refs/vbenchmark/tasks/ai-integration/agents/research-agent/task.yaml +24 -0
  389. package/refs/vbenchmark/tasks/ai-integration/agents/web-scraper-agent/PROMPT.md +57 -0
  390. package/refs/vbenchmark/tasks/ai-integration/agents/web-scraper-agent/task.yaml +24 -0
  391. package/refs/vbenchmark/tasks/ai-integration/embeddings/duplicate-detection/PROMPT.md +50 -0
  392. package/refs/vbenchmark/tasks/ai-integration/embeddings/duplicate-detection/task.yaml +24 -0
  393. package/refs/vbenchmark/tasks/ai-integration/embeddings/recommendation-engine/PROMPT.md +51 -0
  394. package/refs/vbenchmark/tasks/ai-integration/embeddings/recommendation-engine/task.yaml +24 -0
  395. package/refs/vbenchmark/tasks/ai-integration/embeddings/semantic-search/PROMPT.md +50 -0
  396. package/refs/vbenchmark/tasks/ai-integration/embeddings/semantic-search/task.yaml +24 -0
  397. package/refs/vbenchmark/tasks/ai-integration/fine-tuning/classification-model/PROMPT.md +50 -0
  398. package/refs/vbenchmark/tasks/ai-integration/fine-tuning/classification-model/task.yaml +24 -0
  399. package/refs/vbenchmark/tasks/ai-integration/function-calling/api-orchestrator/PROMPT.md +60 -0
  400. package/refs/vbenchmark/tasks/ai-integration/function-calling/api-orchestrator/task.yaml +24 -0
  401. package/refs/vbenchmark/tasks/ai-integration/function-calling/calendar-assistant/PROMPT.md +50 -0
  402. package/refs/vbenchmark/tasks/ai-integration/function-calling/calendar-assistant/task.yaml +24 -0
  403. package/refs/vbenchmark/tasks/ai-integration/function-calling/database-query/PROMPT.md +62 -0
  404. package/refs/vbenchmark/tasks/ai-integration/function-calling/database-query/task.yaml +24 -0
  405. package/refs/vbenchmark/tasks/ai-integration/multimodal/chart-interpreter/PROMPT.md +60 -0
  406. package/refs/vbenchmark/tasks/ai-integration/multimodal/chart-interpreter/task.yaml +24 -0
  407. package/refs/vbenchmark/tasks/ai-integration/multimodal/image-captioning/PROMPT.md +49 -0
  408. package/refs/vbenchmark/tasks/ai-integration/multimodal/image-captioning/task.yaml +24 -0
  409. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/code-assistant/PROMPT.md +51 -0
  410. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/code-assistant/task.yaml +24 -0
  411. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/doc-search/PROMPT.md +51 -0
  412. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/doc-search/task.yaml +24 -0
  413. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/PROMPT.md +76 -0
  414. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/docker-compose.yaml +30 -0
  415. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/task.yaml +30 -0
  416. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/tests/functional/qa.test.py +146 -0
  417. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/support-bot/PROMPT.md +51 -0
  418. package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/support-bot/task.yaml +24 -0
  419. package/refs/vbenchmark/tasks/ai-integration/structured-output/contract-analyzer/PROMPT.md +67 -0
  420. package/refs/vbenchmark/tasks/ai-integration/structured-output/contract-analyzer/task.yaml +24 -0
  421. package/refs/vbenchmark/tasks/ai-integration/structured-output/invoice-parser/PROMPT.md +61 -0
  422. package/refs/vbenchmark/tasks/ai-integration/structured-output/invoice-parser/task.yaml +27 -0
  423. package/refs/vbenchmark/tasks/ai-integration/structured-output/receipt-scanner/PROMPT.md +65 -0
  424. package/refs/vbenchmark/tasks/ai-integration/structured-output/receipt-scanner/task.yaml +24 -0
  425. package/refs/vbenchmark/tasks/ai-integration/structured-output/resume-parser/PROMPT.md +70 -0
  426. package/refs/vbenchmark/tasks/ai-integration/structured-output/resume-parser/task.yaml +24 -0
  427. package/refs/vbenchmark/tasks/api-integrations/advanced/api-analytics/PROMPT.md +15 -0
  428. package/refs/vbenchmark/tasks/api-integrations/advanced/api-analytics/task.yaml +16 -0
  429. package/refs/vbenchmark/tasks/api-integrations/advanced/api-gateway/PROMPT.md +15 -0
  430. package/refs/vbenchmark/tasks/api-integrations/advanced/api-gateway/task.yaml +16 -0
  431. package/refs/vbenchmark/tasks/api-integrations/advanced/api-mocking/PROMPT.md +15 -0
  432. package/refs/vbenchmark/tasks/api-integrations/advanced/api-mocking/task.yaml +16 -0
  433. package/refs/vbenchmark/tasks/api-integrations/advanced/contract-testing/PROMPT.md +15 -0
  434. package/refs/vbenchmark/tasks/api-integrations/advanced/contract-testing/task.yaml +16 -0
  435. package/refs/vbenchmark/tasks/api-integrations/advanced/graphql-federation/PROMPT.md +15 -0
  436. package/refs/vbenchmark/tasks/api-integrations/advanced/graphql-federation/task.yaml +16 -0
  437. package/refs/vbenchmark/tasks/api-integrations/advanced/grpc-gateway/PROMPT.md +15 -0
  438. package/refs/vbenchmark/tasks/api-integrations/advanced/grpc-gateway/task.yaml +16 -0
  439. package/refs/vbenchmark/tasks/api-integrations/advanced/rate-limiter/PROMPT.md +15 -0
  440. package/refs/vbenchmark/tasks/api-integrations/advanced/rate-limiter/task.yaml +16 -0
  441. package/refs/vbenchmark/tasks/api-integrations/advanced/request-validator/PROMPT.md +15 -0
  442. package/refs/vbenchmark/tasks/api-integrations/advanced/request-validator/task.yaml +16 -0
  443. package/refs/vbenchmark/tasks/api-integrations/advanced/sdk-generator/PROMPT.md +15 -0
  444. package/refs/vbenchmark/tasks/api-integrations/advanced/sdk-generator/task.yaml +16 -0
  445. package/refs/vbenchmark/tasks/api-integrations/advanced/webhook-processor/PROMPT.md +15 -0
  446. package/refs/vbenchmark/tasks/api-integrations/advanced/webhook-processor/task.yaml +16 -0
  447. package/refs/vbenchmark/tasks/api-integrations/analytics/mixpanel-events/PROMPT.md +42 -0
  448. package/refs/vbenchmark/tasks/api-integrations/analytics/mixpanel-events/task.yaml +24 -0
  449. package/refs/vbenchmark/tasks/api-integrations/analytics/segment-tracking/PROMPT.md +42 -0
  450. package/refs/vbenchmark/tasks/api-integrations/analytics/segment-tracking/task.yaml +24 -0
  451. package/refs/vbenchmark/tasks/api-integrations/auth-provider/oauth2-github/PROMPT.md +42 -0
  452. package/refs/vbenchmark/tasks/api-integrations/auth-provider/oauth2-github/task.yaml +24 -0
  453. package/refs/vbenchmark/tasks/api-integrations/auth-provider/okta-integration/PROMPT.md +44 -0
  454. package/refs/vbenchmark/tasks/api-integrations/auth-provider/okta-integration/task.yaml +24 -0
  455. package/refs/vbenchmark/tasks/api-integrations/auth-provider/saml-sso/PROMPT.md +42 -0
  456. package/refs/vbenchmark/tasks/api-integrations/auth-provider/saml-sso/task.yaml +24 -0
  457. package/refs/vbenchmark/tasks/api-integrations/communication/discord-webhook/PROMPT.md +44 -0
  458. package/refs/vbenchmark/tasks/api-integrations/communication/discord-webhook/task.yaml +24 -0
  459. package/refs/vbenchmark/tasks/api-integrations/communication/slack-bot/PROMPT.md +42 -0
  460. package/refs/vbenchmark/tasks/api-integrations/communication/slack-bot/task.yaml +24 -0
  461. package/refs/vbenchmark/tasks/api-integrations/communication/twilio-sms/PROMPT.md +42 -0
  462. package/refs/vbenchmark/tasks/api-integrations/communication/twilio-sms/task.yaml +24 -0
  463. package/refs/vbenchmark/tasks/api-integrations/email/transactional/PROMPT.md +82 -0
  464. package/refs/vbenchmark/tasks/api-integrations/email/transactional/task.yaml +27 -0
  465. package/refs/vbenchmark/tasks/api-integrations/maps/google-maps-geocoding/PROMPT.md +41 -0
  466. package/refs/vbenchmark/tasks/api-integrations/maps/google-maps-geocoding/task.yaml +24 -0
  467. package/refs/vbenchmark/tasks/api-integrations/maps/mapbox-directions/PROMPT.md +41 -0
  468. package/refs/vbenchmark/tasks/api-integrations/maps/mapbox-directions/task.yaml +24 -0
  469. package/refs/vbenchmark/tasks/api-integrations/payment/crypto-payments/PROMPT.md +43 -0
  470. package/refs/vbenchmark/tasks/api-integrations/payment/crypto-payments/task.yaml +24 -0
  471. package/refs/vbenchmark/tasks/api-integrations/payment/paypal-integration/PROMPT.md +41 -0
  472. package/refs/vbenchmark/tasks/api-integrations/payment/paypal-integration/task.yaml +24 -0
  473. package/refs/vbenchmark/tasks/api-integrations/social/twitter-api/PROMPT.md +41 -0
  474. package/refs/vbenchmark/tasks/api-integrations/social/twitter-api/task.yaml +24 -0
  475. package/refs/vbenchmark/tasks/api-integrations/storage/cloudinary-upload/PROMPT.md +43 -0
  476. package/refs/vbenchmark/tasks/api-integrations/storage/cloudinary-upload/task.yaml +24 -0
  477. package/refs/vbenchmark/tasks/api-integrations/storage/gcs-streaming/PROMPT.md +43 -0
  478. package/refs/vbenchmark/tasks/api-integrations/storage/gcs-streaming/task.yaml +24 -0
  479. package/refs/vbenchmark/tasks/api-integrations/storage/s3-presigned-urls/PROMPT.md +41 -0
  480. package/refs/vbenchmark/tasks/api-integrations/storage/s3-presigned-urls/task.yaml +24 -0
  481. package/refs/vbenchmark/tasks/api-integrations/stripe/checkout-session/PROMPT.md +41 -0
  482. package/refs/vbenchmark/tasks/api-integrations/stripe/checkout-session/task.yaml +24 -0
  483. package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/PROMPT.md +60 -0
  484. package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/docker-compose.yaml +38 -0
  485. package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/task.yaml +31 -0
  486. package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/tests/webhook.test.ts +193 -0
  487. package/refs/vbenchmark/tasks/api-integrations/stripe/subscription-portal/PROMPT.md +41 -0
  488. package/refs/vbenchmark/tasks/api-integrations/stripe/subscription-portal/task.yaml +24 -0
  489. package/refs/vbenchmark/tasks/code-evolution/advanced/api-deprecation/PROMPT.md +15 -0
  490. package/refs/vbenchmark/tasks/code-evolution/advanced/api-deprecation/task.yaml +16 -0
  491. package/refs/vbenchmark/tasks/code-evolution/advanced/ast-refactoring/PROMPT.md +15 -0
  492. package/refs/vbenchmark/tasks/code-evolution/advanced/ast-refactoring/task.yaml +16 -0
  493. package/refs/vbenchmark/tasks/code-evolution/advanced/concurrency-fix/PROMPT.md +15 -0
  494. package/refs/vbenchmark/tasks/code-evolution/advanced/concurrency-fix/task.yaml +16 -0
  495. package/refs/vbenchmark/tasks/code-evolution/advanced/database-schema-migration/PROMPT.md +15 -0
  496. package/refs/vbenchmark/tasks/code-evolution/advanced/database-schema-migration/task.yaml +16 -0
  497. package/refs/vbenchmark/tasks/code-evolution/advanced/dead-code-elimination/PROMPT.md +15 -0
  498. package/refs/vbenchmark/tasks/code-evolution/advanced/dead-code-elimination/task.yaml +16 -0
  499. package/refs/vbenchmark/tasks/code-evolution/advanced/dependency-upgrade/PROMPT.md +15 -0
  500. package/refs/vbenchmark/tasks/code-evolution/advanced/dependency-upgrade/task.yaml +16 -0
  501. package/refs/vbenchmark/tasks/code-evolution/advanced/memory-optimization/PROMPT.md +15 -0
  502. package/refs/vbenchmark/tasks/code-evolution/advanced/memory-optimization/task.yaml +16 -0
  503. package/refs/vbenchmark/tasks/code-evolution/advanced/monorepo-extraction/PROMPT.md +15 -0
  504. package/refs/vbenchmark/tasks/code-evolution/advanced/monorepo-extraction/task.yaml +16 -0
  505. package/refs/vbenchmark/tasks/code-evolution/advanced/performance-profiling/PROMPT.md +15 -0
  506. package/refs/vbenchmark/tasks/code-evolution/advanced/performance-profiling/task.yaml +16 -0
  507. package/refs/vbenchmark/tasks/code-evolution/advanced/type-migration/PROMPT.md +15 -0
  508. package/refs/vbenchmark/tasks/code-evolution/advanced/type-migration/task.yaml +16 -0
  509. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/callback-to-async/PROMPT.md +47 -0
  510. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/callback-to-async/task.yaml +24 -0
  511. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/PROMPT.md +49 -0
  512. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/base-code/src/app.ts +22 -0
  513. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/task.yaml +37 -0
  514. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/tests/api.test.ts +70 -0
  515. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/flask-to-fastapi/PROMPT.md +46 -0
  516. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/flask-to-fastapi/task.yaml +24 -0
  517. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/java-to-kotlin/PROMPT.md +45 -0
  518. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/java-to-kotlin/task.yaml +24 -0
  519. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/jquery-to-react/PROMPT.md +47 -0
  520. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/jquery-to-react/task.yaml +24 -0
  521. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/rest-to-grpc/PROMPT.md +47 -0
  522. package/refs/vbenchmark/tasks/code-evolution/legacy-migration/rest-to-grpc/task.yaml +24 -0
  523. package/refs/vbenchmark/tasks/code-evolution/performance/async-refactor/PROMPT.md +47 -0
  524. package/refs/vbenchmark/tasks/code-evolution/performance/async-refactor/task.yaml +24 -0
  525. package/refs/vbenchmark/tasks/code-evolution/performance/memory-leak-fix/PROMPT.md +47 -0
  526. package/refs/vbenchmark/tasks/code-evolution/performance/memory-leak-fix/task.yaml +24 -0
  527. package/refs/vbenchmark/tasks/code-evolution/performance/query-optimization/PROMPT.md +49 -0
  528. package/refs/vbenchmark/tasks/code-evolution/performance/query-optimization/task.yaml +24 -0
  529. package/refs/vbenchmark/tasks/code-evolution/refactoring/class-to-hooks/PROMPT.md +96 -0
  530. package/refs/vbenchmark/tasks/code-evolution/refactoring/class-to-hooks/task.yaml +27 -0
  531. package/refs/vbenchmark/tasks/code-evolution/refactoring/dependency-injection/PROMPT.md +47 -0
  532. package/refs/vbenchmark/tasks/code-evolution/refactoring/dependency-injection/task.yaml +24 -0
  533. package/refs/vbenchmark/tasks/code-evolution/refactoring/error-handling/PROMPT.md +48 -0
  534. package/refs/vbenchmark/tasks/code-evolution/refactoring/error-handling/task.yaml +24 -0
  535. package/refs/vbenchmark/tasks/code-evolution/refactoring/monolith-to-modules/PROMPT.md +50 -0
  536. package/refs/vbenchmark/tasks/code-evolution/refactoring/monolith-to-modules/task.yaml +24 -0
  537. package/refs/vbenchmark/tasks/code-evolution/refactoring/orm-migration/PROMPT.md +47 -0
  538. package/refs/vbenchmark/tasks/code-evolution/refactoring/orm-migration/task.yaml +24 -0
  539. package/refs/vbenchmark/tasks/code-evolution/security/secrets-rotation/PROMPT.md +49 -0
  540. package/refs/vbenchmark/tasks/code-evolution/security/secrets-rotation/task.yaml +24 -0
  541. package/refs/vbenchmark/tasks/code-evolution/security/sql-injection-fix/PROMPT.md +50 -0
  542. package/refs/vbenchmark/tasks/code-evolution/security/sql-injection-fix/task.yaml +24 -0
  543. package/refs/vbenchmark/tasks/code-evolution/security/xss-prevention/PROMPT.md +47 -0
  544. package/refs/vbenchmark/tasks/code-evolution/security/xss-prevention/task.yaml +24 -0
  545. package/refs/vbenchmark/tasks/code-evolution/testing/add-unit-tests/PROMPT.md +48 -0
  546. package/refs/vbenchmark/tasks/code-evolution/testing/add-unit-tests/task.yaml +24 -0
  547. package/refs/vbenchmark/tasks/code-evolution/testing/e2e-playwright/PROMPT.md +50 -0
  548. package/refs/vbenchmark/tasks/code-evolution/testing/e2e-playwright/task.yaml +24 -0
  549. package/refs/vbenchmark/tasks/code-evolution/testing/pytest-fixtures/PROMPT.md +47 -0
  550. package/refs/vbenchmark/tasks/code-evolution/testing/pytest-fixtures/task.yaml +24 -0
  551. package/refs/vbenchmark/tasks/frontend/accessibility/keyboard-shortcuts/PROMPT.md +44 -0
  552. package/refs/vbenchmark/tasks/frontend/accessibility/keyboard-shortcuts/task.yaml +24 -0
  553. package/refs/vbenchmark/tasks/frontend/accessibility/screen-reader-nav/PROMPT.md +44 -0
  554. package/refs/vbenchmark/tasks/frontend/accessibility/screen-reader-nav/task.yaml +24 -0
  555. package/refs/vbenchmark/tasks/frontend/advanced/canvas-editor/PROMPT.md +15 -0
  556. package/refs/vbenchmark/tasks/frontend/advanced/canvas-editor/task.yaml +16 -0
  557. package/refs/vbenchmark/tasks/frontend/advanced/micro-frontend/PROMPT.md +15 -0
  558. package/refs/vbenchmark/tasks/frontend/advanced/micro-frontend/task.yaml +16 -0
  559. package/refs/vbenchmark/tasks/frontend/advanced/offline-first/PROMPT.md +15 -0
  560. package/refs/vbenchmark/tasks/frontend/advanced/offline-first/task.yaml +16 -0
  561. package/refs/vbenchmark/tasks/frontend/advanced/realtime-collab/PROMPT.md +15 -0
  562. package/refs/vbenchmark/tasks/frontend/advanced/realtime-collab/task.yaml +16 -0
  563. package/refs/vbenchmark/tasks/frontend/advanced/service-worker/PROMPT.md +15 -0
  564. package/refs/vbenchmark/tasks/frontend/advanced/service-worker/task.yaml +16 -0
  565. package/refs/vbenchmark/tasks/frontend/advanced/state-machine/PROMPT.md +15 -0
  566. package/refs/vbenchmark/tasks/frontend/advanced/state-machine/task.yaml +16 -0
  567. package/refs/vbenchmark/tasks/frontend/advanced/virtual-list/PROMPT.md +15 -0
  568. package/refs/vbenchmark/tasks/frontend/advanced/virtual-list/task.yaml +16 -0
  569. package/refs/vbenchmark/tasks/frontend/advanced/wasm-integration/PROMPT.md +15 -0
  570. package/refs/vbenchmark/tasks/frontend/advanced/wasm-integration/task.yaml +16 -0
  571. package/refs/vbenchmark/tasks/frontend/advanced/web-worker/PROMPT.md +15 -0
  572. package/refs/vbenchmark/tasks/frontend/advanced/web-worker/task.yaml +16 -0
  573. package/refs/vbenchmark/tasks/frontend/advanced/webgl-visualization/PROMPT.md +15 -0
  574. package/refs/vbenchmark/tasks/frontend/advanced/webgl-visualization/task.yaml +16 -0
  575. package/refs/vbenchmark/tasks/frontend/animation/page-transitions/PROMPT.md +44 -0
  576. package/refs/vbenchmark/tasks/frontend/animation/page-transitions/task.yaml +24 -0
  577. package/refs/vbenchmark/tasks/frontend/components/data-grid/PROMPT.md +59 -0
  578. package/refs/vbenchmark/tasks/frontend/components/data-grid/task.yaml +24 -0
  579. package/refs/vbenchmark/tasks/frontend/components/date-range-picker/PROMPT.md +57 -0
  580. package/refs/vbenchmark/tasks/frontend/components/date-range-picker/task.yaml +24 -0
  581. package/refs/vbenchmark/tasks/frontend/components/file-uploader/PROMPT.md +55 -0
  582. package/refs/vbenchmark/tasks/frontend/components/file-uploader/task.yaml +24 -0
  583. package/refs/vbenchmark/tasks/frontend/components/form-builder/PROMPT.md +96 -0
  584. package/refs/vbenchmark/tasks/frontend/components/form-builder/task.yaml +28 -0
  585. package/refs/vbenchmark/tasks/frontend/components/rich-text-editor/PROMPT.md +45 -0
  586. package/refs/vbenchmark/tasks/frontend/components/rich-text-editor/task.yaml +24 -0
  587. package/refs/vbenchmark/tasks/frontend/figma-to-code/dashboard-layout/PROMPT.md +50 -0
  588. package/refs/vbenchmark/tasks/frontend/figma-to-code/dashboard-layout/task.yaml +25 -0
  589. package/refs/vbenchmark/tasks/frontend/figma-to-code/landing-page/PROMPT.md +49 -0
  590. package/refs/vbenchmark/tasks/frontend/figma-to-code/landing-page/task.yaml +25 -0
  591. package/refs/vbenchmark/tasks/frontend/figma-to-code/mobile-app-screen/PROMPT.md +51 -0
  592. package/refs/vbenchmark/tasks/frontend/figma-to-code/mobile-app-screen/task.yaml +24 -0
  593. package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/PROMPT.md +93 -0
  594. package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/docker-compose.yaml +23 -0
  595. package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/task.yaml +30 -0
  596. package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/tests/visual/diff.test.ts +107 -0
  597. package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/tests/visual/interaction.test.ts +88 -0
  598. package/refs/vbenchmark/tasks/frontend/performance/image-lazy-load/PROMPT.md +43 -0
  599. package/refs/vbenchmark/tasks/frontend/performance/image-lazy-load/task.yaml +24 -0
  600. package/refs/vbenchmark/tasks/frontend/performance/infinite-scroll/PROMPT.md +44 -0
  601. package/refs/vbenchmark/tasks/frontend/performance/infinite-scroll/task.yaml +24 -0
  602. package/refs/vbenchmark/tasks/frontend/state-management/collaborative-editor/PROMPT.md +44 -0
  603. package/refs/vbenchmark/tasks/frontend/state-management/collaborative-editor/task.yaml +24 -0
  604. package/refs/vbenchmark/tasks/frontend/state-management/shopping-cart/PROMPT.md +53 -0
  605. package/refs/vbenchmark/tasks/frontend/state-management/shopping-cart/task.yaml +24 -0
  606. package/refs/vbenchmark/tasks/frontend/visualization/chart-dashboard/PROMPT.md +83 -0
  607. package/refs/vbenchmark/tasks/frontend/visualization/chart-dashboard/task.yaml +28 -0
  608. package/refs/vbenchmark/tasks/frontend/visualization/gantt-chart/PROMPT.md +57 -0
  609. package/refs/vbenchmark/tasks/frontend/visualization/gantt-chart/task.yaml +24 -0
  610. package/refs/vbenchmark/tasks/frontend/visualization/map-dashboard/PROMPT.md +44 -0
  611. package/refs/vbenchmark/tasks/frontend/visualization/map-dashboard/task.yaml +24 -0
  612. package/refs/vbenchmark/tasks/frontend/visualization/realtime-charts/PROMPT.md +43 -0
  613. package/refs/vbenchmark/tasks/frontend/visualization/realtime-charts/task.yaml +24 -0
  614. package/refs/vbenchmark/tasks/glue-code/advanced/blue-green-deploy/PROMPT.md +15 -0
  615. package/refs/vbenchmark/tasks/glue-code/advanced/blue-green-deploy/task.yaml +16 -0
  616. package/refs/vbenchmark/tasks/glue-code/advanced/canary-release/PROMPT.md +15 -0
  617. package/refs/vbenchmark/tasks/glue-code/advanced/canary-release/task.yaml +16 -0
  618. package/refs/vbenchmark/tasks/glue-code/advanced/change-data-capture/PROMPT.md +15 -0
  619. package/refs/vbenchmark/tasks/glue-code/advanced/change-data-capture/task.yaml +16 -0
  620. package/refs/vbenchmark/tasks/glue-code/advanced/config-management/PROMPT.md +15 -0
  621. package/refs/vbenchmark/tasks/glue-code/advanced/config-management/task.yaml +16 -0
  622. package/refs/vbenchmark/tasks/glue-code/advanced/data-pipeline/PROMPT.md +15 -0
  623. package/refs/vbenchmark/tasks/glue-code/advanced/data-pipeline/task.yaml +16 -0
  624. package/refs/vbenchmark/tasks/glue-code/advanced/distributed-tracing/PROMPT.md +15 -0
  625. package/refs/vbenchmark/tasks/glue-code/advanced/distributed-tracing/task.yaml +16 -0
  626. package/refs/vbenchmark/tasks/glue-code/advanced/log-aggregation/PROMPT.md +15 -0
  627. package/refs/vbenchmark/tasks/glue-code/advanced/log-aggregation/task.yaml +16 -0
  628. package/refs/vbenchmark/tasks/glue-code/advanced/schema-registry/PROMPT.md +15 -0
  629. package/refs/vbenchmark/tasks/glue-code/advanced/schema-registry/task.yaml +16 -0
  630. package/refs/vbenchmark/tasks/glue-code/advanced/secret-rotation/PROMPT.md +15 -0
  631. package/refs/vbenchmark/tasks/glue-code/advanced/secret-rotation/task.yaml +16 -0
  632. package/refs/vbenchmark/tasks/glue-code/advanced/stream-processing/PROMPT.md +15 -0
  633. package/refs/vbenchmark/tasks/glue-code/advanced/stream-processing/task.yaml +16 -0
  634. package/refs/vbenchmark/tasks/glue-code/api-sync/rest-to-graphql/PROMPT.md +66 -0
  635. package/refs/vbenchmark/tasks/glue-code/api-sync/rest-to-graphql/task.yaml +27 -0
  636. package/refs/vbenchmark/tasks/glue-code/caching/redis-cache/PROMPT.md +82 -0
  637. package/refs/vbenchmark/tasks/glue-code/caching/redis-cache/task.yaml +27 -0
  638. package/refs/vbenchmark/tasks/glue-code/data-transform/avro-schema-evolution/PROMPT.md +51 -0
  639. package/refs/vbenchmark/tasks/glue-code/data-transform/avro-schema-evolution/task.yaml +24 -0
  640. package/refs/vbenchmark/tasks/glue-code/data-transform/csv-normalizer/PROMPT.md +49 -0
  641. package/refs/vbenchmark/tasks/glue-code/data-transform/csv-normalizer/task.yaml +24 -0
  642. package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/PROMPT.md +67 -0
  643. package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/task.yaml +28 -0
  644. package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/tests/transform.test.py +137 -0
  645. package/refs/vbenchmark/tasks/glue-code/data-transform/json-to-xml/PROMPT.md +45 -0
  646. package/refs/vbenchmark/tasks/glue-code/data-transform/json-to-xml/task.yaml +24 -0
  647. package/refs/vbenchmark/tasks/glue-code/data-transform/protobuf-converter/PROMPT.md +44 -0
  648. package/refs/vbenchmark/tasks/glue-code/data-transform/protobuf-converter/task.yaml +24 -0
  649. package/refs/vbenchmark/tasks/glue-code/etl/cdc-pipeline/PROMPT.md +52 -0
  650. package/refs/vbenchmark/tasks/glue-code/etl/cdc-pipeline/task.yaml +27 -0
  651. package/refs/vbenchmark/tasks/glue-code/etl/database-sync/PROMPT.md +51 -0
  652. package/refs/vbenchmark/tasks/glue-code/etl/database-sync/task.yaml +24 -0
  653. package/refs/vbenchmark/tasks/glue-code/etl/s3-to-warehouse/PROMPT.md +50 -0
  654. package/refs/vbenchmark/tasks/glue-code/etl/s3-to-warehouse/task.yaml +24 -0
  655. package/refs/vbenchmark/tasks/glue-code/file-processing/image-resizer/PROMPT.md +52 -0
  656. package/refs/vbenchmark/tasks/glue-code/file-processing/image-resizer/task.yaml +24 -0
  657. package/refs/vbenchmark/tasks/glue-code/file-processing/pdf-merger/PROMPT.md +50 -0
  658. package/refs/vbenchmark/tasks/glue-code/file-processing/pdf-merger/task.yaml +24 -0
  659. package/refs/vbenchmark/tasks/glue-code/file-processing/video-transcoder/PROMPT.md +50 -0
  660. package/refs/vbenchmark/tasks/glue-code/file-processing/video-transcoder/task.yaml +27 -0
  661. package/refs/vbenchmark/tasks/glue-code/migration/data-backfill/PROMPT.md +50 -0
  662. package/refs/vbenchmark/tasks/glue-code/migration/data-backfill/task.yaml +24 -0
  663. package/refs/vbenchmark/tasks/glue-code/migration/database-versioning/PROMPT.md +50 -0
  664. package/refs/vbenchmark/tasks/glue-code/migration/database-versioning/task.yaml +24 -0
  665. package/refs/vbenchmark/tasks/glue-code/queue/kafka-producer/PROMPT.md +49 -0
  666. package/refs/vbenchmark/tasks/glue-code/queue/kafka-producer/task.yaml +27 -0
  667. package/refs/vbenchmark/tasks/glue-code/queue/rabbitmq-consumer/PROMPT.md +50 -0
  668. package/refs/vbenchmark/tasks/glue-code/queue/rabbitmq-consumer/task.yaml +27 -0
  669. package/refs/vbenchmark/tasks/glue-code/queue/sqs-batch-processor/PROMPT.md +47 -0
  670. package/refs/vbenchmark/tasks/glue-code/queue/sqs-batch-processor/task.yaml +24 -0
  671. package/refs/vbenchmark/tasks/glue-code/scheduler/cron-job-manager/PROMPT.md +52 -0
  672. package/refs/vbenchmark/tasks/glue-code/scheduler/cron-job-manager/task.yaml +27 -0
  673. package/refs/vbenchmark/tasks/glue-code/scheduler/delayed-tasks/PROMPT.md +51 -0
  674. package/refs/vbenchmark/tasks/glue-code/scheduler/delayed-tasks/task.yaml +27 -0
  675. package/refs/vbenchmark/tasks/saas-core/advanced/api-versioning/PROMPT.md +15 -0
  676. package/refs/vbenchmark/tasks/saas-core/advanced/api-versioning/task.yaml +16 -0
  677. package/refs/vbenchmark/tasks/saas-core/advanced/circuit-breaker/PROMPT.md +13 -0
  678. package/refs/vbenchmark/tasks/saas-core/advanced/circuit-breaker/task.yaml +16 -0
  679. package/refs/vbenchmark/tasks/saas-core/advanced/compliance-gdpr/PROMPT.md +15 -0
  680. package/refs/vbenchmark/tasks/saas-core/advanced/compliance-gdpr/task.yaml +16 -0
  681. package/refs/vbenchmark/tasks/saas-core/advanced/cqrs-pattern/PROMPT.md +13 -0
  682. package/refs/vbenchmark/tasks/saas-core/advanced/cqrs-pattern/task.yaml +16 -0
  683. package/refs/vbenchmark/tasks/saas-core/advanced/data-encryption/PROMPT.md +15 -0
  684. package/refs/vbenchmark/tasks/saas-core/advanced/data-encryption/task.yaml +16 -0
  685. package/refs/vbenchmark/tasks/saas-core/advanced/distributed-locking/PROMPT.md +46 -0
  686. package/refs/vbenchmark/tasks/saas-core/advanced/distributed-locking/task.yaml +24 -0
  687. package/refs/vbenchmark/tasks/saas-core/advanced/event-sourcing/PROMPT.md +23 -0
  688. package/refs/vbenchmark/tasks/saas-core/advanced/event-sourcing/task.yaml +16 -0
  689. package/refs/vbenchmark/tasks/saas-core/advanced/feature-flags-ab/PROMPT.md +15 -0
  690. package/refs/vbenchmark/tasks/saas-core/advanced/feature-flags-ab/task.yaml +16 -0
  691. package/refs/vbenchmark/tasks/saas-core/advanced/saga-orchestration/PROMPT.md +13 -0
  692. package/refs/vbenchmark/tasks/saas-core/advanced/saga-orchestration/task.yaml +16 -0
  693. package/refs/vbenchmark/tasks/saas-core/advanced/webhook-delivery/PROMPT.md +15 -0
  694. package/refs/vbenchmark/tasks/saas-core/advanced/webhook-delivery/task.yaml +16 -0
  695. package/refs/vbenchmark/tasks/saas-core/audit/activity-logging/PROMPT.md +50 -0
  696. package/refs/vbenchmark/tasks/saas-core/audit/activity-logging/task.yaml +27 -0
  697. package/refs/vbenchmark/tasks/saas-core/auth/jwt-refresh-tokens/PROMPT.md +50 -0
  698. package/refs/vbenchmark/tasks/saas-core/auth/jwt-refresh-tokens/task.yaml +27 -0
  699. package/refs/vbenchmark/tasks/saas-core/auth/magic-link-email/PROMPT.md +53 -0
  700. package/refs/vbenchmark/tasks/saas-core/auth/magic-link-email/task.yaml +27 -0
  701. package/refs/vbenchmark/tasks/saas-core/auth/mfa-totp/PROMPT.md +79 -0
  702. package/refs/vbenchmark/tasks/saas-core/auth/mfa-totp/task.yaml +27 -0
  703. package/refs/vbenchmark/tasks/saas-core/auth/rbac-permissions/PROMPT.md +51 -0
  704. package/refs/vbenchmark/tasks/saas-core/auth/rbac-permissions/task.yaml +27 -0
  705. package/refs/vbenchmark/tasks/saas-core/auth/session-management/PROMPT.md +52 -0
  706. package/refs/vbenchmark/tasks/saas-core/auth/session-management/task.yaml +27 -0
  707. package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/PROMPT.md +45 -0
  708. package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/docker-compose.yaml +47 -0
  709. package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/task.yaml +32 -0
  710. package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/tests/auth.test.ts +59 -0
  711. package/refs/vbenchmark/tasks/saas-core/billing/invoice-generation/PROMPT.md +53 -0
  712. package/refs/vbenchmark/tasks/saas-core/billing/invoice-generation/task.yaml +27 -0
  713. package/refs/vbenchmark/tasks/saas-core/billing/stripe-subscriptions/PROMPT.md +51 -0
  714. package/refs/vbenchmark/tasks/saas-core/billing/stripe-subscriptions/task.yaml +27 -0
  715. package/refs/vbenchmark/tasks/saas-core/billing/usage-metering/PROMPT.md +52 -0
  716. package/refs/vbenchmark/tasks/saas-core/billing/usage-metering/task.yaml +27 -0
  717. package/refs/vbenchmark/tasks/saas-core/crud/dashboard-table/PROMPT.md +48 -0
  718. package/refs/vbenchmark/tasks/saas-core/crud/dashboard-table/task.yaml +28 -0
  719. package/refs/vbenchmark/tasks/saas-core/multi-tenant/org-isolation/PROMPT.md +50 -0
  720. package/refs/vbenchmark/tasks/saas-core/multi-tenant/org-isolation/task.yaml +27 -0
  721. package/refs/vbenchmark/tasks/saas-core/multi-tenant/subdomain-routing/PROMPT.md +50 -0
  722. package/refs/vbenchmark/tasks/saas-core/multi-tenant/subdomain-routing/task.yaml +27 -0
  723. package/refs/vbenchmark/tasks/saas-core/notifications/email-queue/PROMPT.md +53 -0
  724. package/refs/vbenchmark/tasks/saas-core/notifications/email-queue/task.yaml +27 -0
  725. package/refs/vbenchmark/tasks/saas-core/notifications/in-app-alerts/PROMPT.md +51 -0
  726. package/refs/vbenchmark/tasks/saas-core/notifications/in-app-alerts/task.yaml +27 -0
  727. package/refs/vbenchmark/tasks/saas-core/notifications/push-notifications/PROMPT.md +51 -0
  728. package/refs/vbenchmark/tasks/saas-core/notifications/push-notifications/task.yaml +27 -0
  729. package/refs/vbenchmark/tasks/saas-core/realtime/websocket-chat/PROMPT.md +80 -0
  730. package/refs/vbenchmark/tasks/saas-core/realtime/websocket-chat/task.yaml +27 -0
  731. package/refs/vbenchmark/tasks/saas-core/search/full-text-search/PROMPT.md +51 -0
  732. package/refs/vbenchmark/tasks/saas-core/search/full-text-search/task.yaml +27 -0
  733. package/refs/vbenchmark/tasks/saas-core/security/rate-limiter/PROMPT.md +99 -0
  734. package/refs/vbenchmark/tasks/saas-core/security/rate-limiter/task.yaml +27 -0
  735. package/refs/vbenchmark/tasks/saas-core/settings/user-preferences/PROMPT.md +78 -0
  736. package/refs/vbenchmark/tasks/saas-core/settings/user-preferences/task.yaml +27 -0
  737. package/refs/vbenchmark/templates/fastapi-postgres/docker-compose.yaml +36 -0
  738. package/refs/vbenchmark/templates/fastapi-postgres/pyproject.toml +34 -0
  739. package/refs/vbenchmark/templates/fastapi-postgres/src/__init__.py +0 -0
  740. package/refs/vbenchmark/templates/fastapi-postgres/src/config.py +12 -0
  741. package/refs/vbenchmark/templates/fastapi-postgres/src/database.py +15 -0
  742. package/refs/vbenchmark/templates/fastapi-postgres/src/main.py +51 -0
  743. package/refs/vbenchmark/templates/fastapi-postgres/src/models.py +12 -0
  744. package/refs/vbenchmark/templates/fastapi-postgres/src/schemas.py +20 -0
  745. package/refs/vbenchmark/templates/go-fiber/docker-compose.yaml +34 -0
  746. package/refs/vbenchmark/templates/go-fiber/go.mod +33 -0
  747. package/refs/vbenchmark/templates/go-fiber/go.sum +68 -0
  748. package/refs/vbenchmark/templates/go-fiber/main.go +98 -0
  749. package/refs/vbenchmark/templates/nextjs-supabase/.env.example +3 -0
  750. package/refs/vbenchmark/templates/nextjs-supabase/docker-compose.yaml +68 -0
  751. package/refs/vbenchmark/templates/nextjs-supabase/src/app/globals.css +13 -0
  752. package/refs/vbenchmark/templates/nextjs-supabase/src/app/layout.tsx +19 -0
  753. package/refs/vbenchmark/templates/nextjs-supabase/src/app/page.tsx +38 -0
  754. package/refs/vbenchmark/templates/nextjs-supabase/src/lib/supabase/client.ts +8 -0
  755. package/refs/vbenchmark/templates/nextjs-supabase/src/lib/supabase/server.ts +32 -0
  756. package/refs/vbenchmark/templates/rust-axum/Cargo.lock +2371 -0
  757. package/refs/vbenchmark/templates/rust-axum/Cargo.toml +16 -0
  758. package/refs/vbenchmark/templates/rust-axum/docker-compose.yaml +34 -0
  759. package/refs/vbenchmark/templates/rust-axum/migrations/20240101000000_init.sql +20 -0
  760. package/refs/vbenchmark/templates/rust-axum/src/main.rs +121 -0
  761. package/refs/vbenchmark/tsconfig.base.json +18 -0
  762. package/refs/vbenchmark/turbo.json +23 -0
  763. package/refs/vbenchmark/vercel.json +10 -0
@@ -0,0 +1,38 @@
1
+ ---
2
+ name: gsd:verify-work
3
+ description: Validate built features through conversational UAT
4
+ argument-hint: "[phase number, e.g., '4']"
5
+ allowed-tools:
6
+ - Read
7
+ - Bash
8
+ - Glob
9
+ - Grep
10
+ - Edit
11
+ - Write
12
+ - Task
13
+ ---
14
+ <objective>
15
+ Validate built features through conversational testing with persistent state.
16
+
17
+ Purpose: Confirm that what Claude built actually works from the user's perspective. One test at a time, plain text responses, no interrogation. When issues are found, automatically diagnose, plan fixes, and prepare for execution.
18
+
19
+ Output: {phase_num}-UAT.md tracking all test results. If issues are found: diagnosed gaps and verified fix plans ready for /gsd:execute-phase.
20
+ </objective>
21
+
22
+ <execution_context>
23
+ @~/.claude/get-shit-done/workflows/verify-work.md
24
+ @~/.claude/get-shit-done/templates/UAT.md
25
+ </execution_context>
26
+
27
+ <context>
28
+ Phase: $ARGUMENTS (optional)
29
+ - If provided: Test specific phase (e.g., "4")
30
+ - If not provided: Check for active sessions or prompt for phase
31
+
32
+ Context files are resolved inside the workflow (`init verify-work`) and delegated via `<files_to_read>` blocks.
33
+ </context>
34
+
35
+ <process>
36
+ Execute the verify-work workflow from @~/.claude/get-shit-done/workflows/verify-work.md end-to-end.
37
+ Preserve all workflow gates (session management, test presentation, diagnosis, fix planning, routing).
38
+ </process>
@@ -0,0 +1,471 @@
1
+ # GSD User Guide
2
+
3
+ A detailed reference for workflows, troubleshooting, and configuration. For quick-start setup, see the [README](../README.md).
4
+
5
+ ---
6
+
7
+ ## Table of Contents
8
+
9
+ - [Workflow Diagrams](#workflow-diagrams)
10
+ - [Command Reference](#command-reference)
11
+ - [Configuration Reference](#configuration-reference)
12
+ - [Usage Examples](#usage-examples)
13
+ - [Troubleshooting](#troubleshooting)
14
+ - [Recovery Quick Reference](#recovery-quick-reference)
15
+
16
+ ---
17
+
18
+ ## Workflow Diagrams
19
+
20
+ ### Full Project Lifecycle
21
+
22
+ ```
23
+ ┌──────────────────────────────────────────────────┐
24
+ │ NEW PROJECT │
25
+ │ /gsd:new-project │
26
+ │ Questions -> Research -> Requirements -> Roadmap│
27
+ └─────────────────────────┬────────────────────────┘
28
+
29
+ ┌──────────────▼─────────────┐
30
+ │ FOR EACH PHASE: │
31
+ │ │
32
+ │ ┌────────────────────┐ │
33
+ │ │ /gsd:discuss-phase │ │ <- Lock in preferences
34
+ │ └──────────┬─────────┘ │
35
+ │ │ │
36
+ │ ┌──────────▼─────────┐ │
37
+ │ │ /gsd:plan-phase │ │ <- Research + Plan + Verify
38
+ │ └──────────┬─────────┘ │
39
+ │ │ │
40
+ │ ┌──────────▼─────────┐ │
41
+ │ │ /gsd:execute-phase │ │ <- Parallel execution
42
+ │ └──────────┬─────────┘ │
43
+ │ │ │
44
+ │ ┌──────────▼─────────┐ │
45
+ │ │ /gsd:verify-work │ │ <- Manual UAT
46
+ │ └──────────┬─────────┘ │
47
+ │ │ │
48
+ │ Next Phase?────────────┘
49
+ │ │ No
50
+ └─────────────┼──────────────┘
51
+
52
+ ┌───────────────▼──────────────┐
53
+ │ /gsd:audit-milestone │
54
+ │ /gsd:complete-milestone │
55
+ └───────────────┬──────────────┘
56
+
57
+ Another milestone?
58
+ │ │
59
+ Yes No -> Done!
60
+
61
+ ┌───────▼──────────────┐
62
+ │ /gsd:new-milestone │
63
+ └──────────────────────┘
64
+ ```
65
+
66
+ ### Planning Agent Coordination
67
+
68
+ ```
69
+ /gsd:plan-phase N
70
+
71
+ ├── Phase Researcher (x4 parallel)
72
+ │ ├── Stack researcher
73
+ │ ├── Features researcher
74
+ │ ├── Architecture researcher
75
+ │ └── Pitfalls researcher
76
+ │ │
77
+ │ ┌──────▼──────┐
78
+ │ │ RESEARCH.md │
79
+ │ └──────┬──────┘
80
+ │ │
81
+ │ ┌──────▼──────┐
82
+ │ │ Planner │ <- Reads PROJECT.md, REQUIREMENTS.md,
83
+ │ │ │ CONTEXT.md, RESEARCH.md
84
+ │ └──────┬──────┘
85
+ │ │
86
+ │ ┌──────▼───────────┐ ┌────────┐
87
+ │ │ Plan Checker │────>│ PASS? │
88
+ │ └──────────────────┘ └───┬────┘
89
+ │ │
90
+ │ Yes │ No
91
+ │ │ │ │
92
+ │ │ └───┘ (loop, up to 3x)
93
+ │ │
94
+ │ ┌─────▼──────┐
95
+ │ │ PLAN files │
96
+ │ └────────────┘
97
+ └── Done
98
+ ```
99
+
100
+ ### Validation Architecture (Nyquist Layer)
101
+
102
+ During plan-phase research, GSD now maps automated test coverage to each phase
103
+ requirement before any code is written. This ensures that when Claude's executor
104
+ commits a task, a feedback mechanism already exists to verify it within seconds.
105
+
106
+ The researcher detects your existing test infrastructure, maps each requirement to
107
+ a specific test command, and identifies any test scaffolding that must be created
108
+ before implementation begins (Wave 0 tasks).
109
+
110
+ The plan-checker enforces this as an 8th verification dimension: plans where tasks
111
+ lack automated verify commands will not be approved.
112
+
113
+ **Output:** `{phase}-VALIDATION.md` -- the feedback contract for the phase.
114
+
115
+ **Disable:** Set `workflow.nyquist_validation: false` in `/gsd:settings` for
116
+ rapid prototyping phases where test infrastructure isn't the focus.
117
+
118
+ ### Execution Wave Coordination
119
+
120
+ ```
121
+ /gsd:execute-phase N
122
+
123
+ ├── Analyze plan dependencies
124
+
125
+ ├── Wave 1 (independent plans):
126
+ │ ├── Executor A (fresh 200K context) -> commit
127
+ │ └── Executor B (fresh 200K context) -> commit
128
+
129
+ ├── Wave 2 (depends on Wave 1):
130
+ │ └── Executor C (fresh 200K context) -> commit
131
+
132
+ └── Verifier
133
+ └── Check codebase against phase goals
134
+
135
+ ├── PASS -> VERIFICATION.md (success)
136
+ └── FAIL -> Issues logged for /gsd:verify-work
137
+ ```
138
+
139
+ ### Brownfield Workflow (Existing Codebase)
140
+
141
+ ```
142
+ /gsd:map-codebase
143
+
144
+ ├── Stack Mapper -> codebase/STACK.md
145
+ ├── Arch Mapper -> codebase/ARCHITECTURE.md
146
+ ├── Convention Mapper -> codebase/CONVENTIONS.md
147
+ └── Concern Mapper -> codebase/CONCERNS.md
148
+
149
+ ┌───────▼──────────┐
150
+ │ /gsd:new-project │ <- Questions focus on what you're ADDING
151
+ └──────────────────┘
152
+ ```
153
+
154
+ ---
155
+
156
+ ## Command Reference
157
+
158
+ ### Core Workflow
159
+
160
+ | Command | Purpose | When to Use |
161
+ |---------|---------|-------------|
162
+ | `/gsd:new-project` | Full project init: questions, research, requirements, roadmap | Start of a new project |
163
+ | `/gsd:new-project --auto @idea.md` | Automated init from document | Have a PRD or idea doc ready |
164
+ | `/gsd:discuss-phase [N]` | Capture implementation decisions | Before planning, to shape how it gets built |
165
+ | `/gsd:plan-phase [N]` | Research + plan + verify | Before executing a phase |
166
+ | `/gsd:execute-phase <N>` | Execute all plans in parallel waves | After planning is complete |
167
+ | `/gsd:verify-work [N]` | Manual UAT with auto-diagnosis | After execution completes |
168
+ | `/gsd:audit-milestone` | Verify milestone met its definition of done | Before completing milestone |
169
+ | `/gsd:complete-milestone` | Archive milestone, tag release | All phases verified |
170
+ | `/gsd:new-milestone [name]` | Start next version cycle | After completing a milestone |
171
+
172
+ ### Navigation
173
+
174
+ | Command | Purpose | When to Use |
175
+ |---------|---------|-------------|
176
+ | `/gsd:progress` | Show status and next steps | Anytime -- "where am I?" |
177
+ | `/gsd:resume-work` | Restore full context from last session | Starting a new session |
178
+ | `/gsd:pause-work` | Save context handoff | Stopping mid-phase |
179
+ | `/gsd:help` | Show all commands | Quick reference |
180
+ | `/gsd:update` | Update GSD with changelog preview | Check for new versions |
181
+ | `/gsd:join-discord` | Open Discord community invite | Questions or community |
182
+
183
+ ### Phase Management
184
+
185
+ | Command | Purpose | When to Use |
186
+ |---------|---------|-------------|
187
+ | `/gsd:add-phase` | Append new phase to roadmap | Scope grows after initial planning |
188
+ | `/gsd:insert-phase [N]` | Insert urgent work (decimal numbering) | Urgent fix mid-milestone |
189
+ | `/gsd:remove-phase [N]` | Remove future phase and renumber | Descoping a feature |
190
+ | `/gsd:list-phase-assumptions [N]` | Preview Claude's intended approach | Before planning, to validate direction |
191
+ | `/gsd:plan-milestone-gaps` | Create phases for audit gaps | After audit finds missing items |
192
+ | `/gsd:research-phase [N]` | Deep ecosystem research only | Complex or unfamiliar domain |
193
+
194
+ ### Brownfield & Utilities
195
+
196
+ | Command | Purpose | When to Use |
197
+ |---------|---------|-------------|
198
+ | `/gsd:map-codebase` | Analyze existing codebase | Before `/gsd:new-project` on existing code |
199
+ | `/gsd:quick` | Ad-hoc task with GSD guarantees | Bug fixes, small features, config changes |
200
+ | `/gsd:debug [desc]` | Systematic debugging with persistent state | When something breaks |
201
+ | `/gsd:add-todo [desc]` | Capture an idea for later | Think of something during a session |
202
+ | `/gsd:check-todos` | List pending todos | Review captured ideas |
203
+ | `/gsd:settings` | Configure workflow toggles and model profile | Change model, toggle agents |
204
+ | `/gsd:set-profile <profile>` | Quick profile switch | Change cost/quality tradeoff |
205
+ | `/gsd:reapply-patches` | Restore local modifications after update | After `/gsd:update` if you had local edits |
206
+
207
+ ---
208
+
209
+ ## Configuration Reference
210
+
211
+ GSD stores project settings in `.planning/config.json`. Configure during `/gsd:new-project` or update later with `/gsd:settings`.
212
+
213
+ ### Full config.json Schema
214
+
215
+ ```json
216
+ {
217
+ "mode": "interactive",
218
+ "depth": "standard",
219
+ "model_profile": "balanced",
220
+ "planning": {
221
+ "commit_docs": true,
222
+ "search_gitignored": false
223
+ },
224
+ "workflow": {
225
+ "research": true,
226
+ "plan_check": true,
227
+ "verifier": true,
228
+ "nyquist_validation": true
229
+ },
230
+ "git": {
231
+ "branching_strategy": "none",
232
+ "phase_branch_template": "gsd/phase-{phase}-{slug}",
233
+ "milestone_branch_template": "gsd/{milestone}-{slug}"
234
+ }
235
+ }
236
+ ```
237
+
238
+ ### Core Settings
239
+
240
+ | Setting | Options | Default | What it Controls |
241
+ |---------|---------|---------|------------------|
242
+ | `mode` | `interactive`, `yolo` | `interactive` | `yolo` auto-approves decisions; `interactive` confirms at each step |
243
+ | `depth` | `quick`, `standard`, `comprehensive` | `standard` | Planning thoroughness: 3-5, 5-8, or 8-12 phases |
244
+ | `model_profile` | `quality`, `balanced`, `budget` | `balanced` | Model tier for each agent (see table below) |
245
+
246
+ ### Planning Settings
247
+
248
+ | Setting | Options | Default | What it Controls |
249
+ |---------|---------|---------|------------------|
250
+ | `planning.commit_docs` | `true`, `false` | `true` | Whether `.planning/` files are committed to git |
251
+ | `planning.search_gitignored` | `true`, `false` | `false` | Add `--no-ignore` to broad searches to include `.planning/` |
252
+
253
+ > **Note:** If `.planning/` is in `.gitignore`, `commit_docs` is automatically `false` regardless of the config value.
254
+
255
+ ### Workflow Toggles
256
+
257
+ | Setting | Options | Default | What it Controls |
258
+ |---------|---------|---------|------------------|
259
+ | `workflow.research` | `true`, `false` | `true` | Domain investigation before planning |
260
+ | `workflow.plan_check` | `true`, `false` | `true` | Plan verification loop (up to 3 iterations) |
261
+ | `workflow.verifier` | `true`, `false` | `true` | Post-execution verification against phase goals |
262
+ | `workflow.nyquist_validation` | `true`, `false` | `true` | Validation architecture research during plan-phase; 8th plan-check dimension |
263
+
264
+ Disable these to speed up phases in familiar domains or when conserving tokens.
265
+
266
+ ### Git Branching
267
+
268
+ | Setting | Options | Default | What it Controls |
269
+ |---------|---------|---------|------------------|
270
+ | `git.branching_strategy` | `none`, `phase`, `milestone` | `none` | When and how branches are created |
271
+ | `git.phase_branch_template` | Template string | `gsd/phase-{phase}-{slug}` | Branch name for phase strategy |
272
+ | `git.milestone_branch_template` | Template string | `gsd/{milestone}-{slug}` | Branch name for milestone strategy |
273
+
274
+ **Branching strategies explained:**
275
+
276
+ | Strategy | Creates Branch | Scope | Best For |
277
+ |----------|---------------|-------|----------|
278
+ | `none` | Never | N/A | Solo development, simple projects |
279
+ | `phase` | At each `execute-phase` | One phase per branch | Code review per phase, granular rollback |
280
+ | `milestone` | At first `execute-phase` | All phases share one branch | Release branches, PR per version |
281
+
282
+ **Template variables:** `{phase}` = zero-padded number (e.g., "03"), `{slug}` = lowercase hyphenated name, `{milestone}` = version (e.g., "v1.0").
283
+
284
+ ### Model Profiles (Per-Agent Breakdown)
285
+
286
+ | Agent | `quality` | `balanced` | `budget` |
287
+ |-------|-----------|------------|----------|
288
+ | gsd-planner | Opus | Opus | Sonnet |
289
+ | gsd-roadmapper | Opus | Sonnet | Sonnet |
290
+ | gsd-executor | Opus | Sonnet | Sonnet |
291
+ | gsd-phase-researcher | Opus | Sonnet | Haiku |
292
+ | gsd-project-researcher | Opus | Sonnet | Haiku |
293
+ | gsd-research-synthesizer | Sonnet | Sonnet | Haiku |
294
+ | gsd-debugger | Opus | Sonnet | Sonnet |
295
+ | gsd-codebase-mapper | Sonnet | Haiku | Haiku |
296
+ | gsd-verifier | Sonnet | Sonnet | Haiku |
297
+ | gsd-plan-checker | Sonnet | Sonnet | Haiku |
298
+ | gsd-integration-checker | Sonnet | Sonnet | Haiku |
299
+
300
+ **Profile philosophy:**
301
+ - **quality** -- Opus for all decision-making agents, Sonnet for read-only verification. Use when quota is available and the work is critical.
302
+ - **balanced** -- Opus only for planning (where architecture decisions happen), Sonnet for nearly everything else (the codebase mapper uses Haiku). The default for good reason.
303
+ - **budget** -- Sonnet for anything that writes code, Haiku for research and verification. Use for high-volume work or less critical phases.
304
+
305
+ ---
306
+
307
+ ## Usage Examples
308
+
309
+ ### New Project (Full Cycle)
310
+
311
+ ```bash
312
+ claude --dangerously-skip-permissions
313
+ /gsd:new-project # Answer questions, configure, approve roadmap
314
+ /clear
315
+ /gsd:discuss-phase 1 # Lock in your preferences
316
+ /gsd:plan-phase 1 # Research + plan + verify
317
+ /gsd:execute-phase 1 # Parallel execution
318
+ /gsd:verify-work 1 # Manual UAT
319
+ /clear
320
+ /gsd:discuss-phase 2 # Repeat for each phase
321
+ ...
322
+ /gsd:audit-milestone # Check everything shipped
323
+ /gsd:complete-milestone # Archive, tag, done
324
+ ```
325
+
326
+ ### New Project from Existing Document
327
+
328
+ ```bash
329
+ /gsd:new-project --auto @prd.md # Auto-runs research/requirements/roadmap from your doc
330
+ /clear
331
+ /gsd:discuss-phase 1 # Normal flow from here
332
+ ```
333
+
334
+ ### Existing Codebase
335
+
336
+ ```bash
337
+ /gsd:map-codebase # Analyze what exists (parallel agents)
338
+ /gsd:new-project # Questions focus on what you're ADDING
339
+ # (normal phase workflow from here)
340
+ ```
341
+
342
+ ### Quick Bug Fix
343
+
344
+ ```bash
345
+ /gsd:quick
346
+ > "Fix the login button not responding on mobile Safari"
347
+ ```
348
+
349
+ ### Resuming After a Break
350
+
351
+ ```bash
352
+ /gsd:progress # See where you left off and what's next
353
+ # or
354
+ /gsd:resume-work # Full context restoration from last session
355
+ ```
356
+
357
+ ### Preparing for Release
358
+
359
+ ```bash
360
+ /gsd:audit-milestone # Check requirements coverage, detect stubs
361
+ /gsd:plan-milestone-gaps # If audit found gaps, create phases to close them
362
+ /gsd:complete-milestone # Archive, tag, done
363
+ ```
364
+
365
+ ### Speed vs Quality Presets
366
+
367
+ | Scenario | Mode | Depth | Profile | Research | Plan Check | Verifier |
368
+ |----------|------|-------|---------|----------|------------|----------|
369
+ | Prototyping | `yolo` | `quick` | `budget` | off | off | off |
370
+ | Normal dev | `interactive` | `standard` | `balanced` | on | on | on |
371
+ | Production | `interactive` | `comprehensive` | `quality` | on | on | on |
372
+
373
+ ### Mid-Milestone Scope Changes
374
+
375
+ ```bash
376
+ /gsd:add-phase # Append a new phase to the roadmap
377
+ # or
378
+ /gsd:insert-phase 3 # Insert urgent work between phases 3 and 4
379
+ # or
380
+ /gsd:remove-phase 7 # Descope phase 7 and renumber
381
+ ```
382
+
383
+ ---
384
+
385
+ ## Troubleshooting
386
+
387
+ ### "Project already initialized"
388
+
389
+ You ran `/gsd:new-project` but `.planning/PROJECT.md` already exists. This is a safety check. If you want to start over, delete the `.planning/` directory first.
390
+
391
+ ### Context Degradation During Long Sessions
392
+
393
+ Clear your context window between major commands: `/clear` in Claude Code. GSD is designed around fresh contexts -- every subagent gets a clean 200K window. If quality is dropping in the main session, clear and use `/gsd:resume-work` or `/gsd:progress` to restore state.
394
+
395
+ ### Plans Seem Wrong or Misaligned
396
+
397
+ Run `/gsd:discuss-phase [N]` before planning. Most plan quality issues come from Claude making assumptions that `CONTEXT.md` would have prevented. You can also run `/gsd:list-phase-assumptions [N]` to see what Claude intends to do before committing to a plan.
398
+
399
+ ### Execution Fails or Produces Stubs
400
+
401
+ Check that the plan was not too ambitious. Plans should have 2-3 tasks maximum. If tasks are too large, they exceed what a single context window can produce reliably. Re-plan with smaller scope.
402
+
403
+ ### Lost Track of Where You Are
404
+
405
+ Run `/gsd:progress`. It reads all state files and tells you exactly where you are and what to do next.
406
+
407
+ ### Need to Change Something After Execution
408
+
409
+ Do not re-run `/gsd:execute-phase`. Use `/gsd:quick` for targeted fixes, or `/gsd:verify-work` to systematically identify and fix issues through UAT.
410
+
411
+ ### Model Costs Too High
412
+
413
+ Switch to budget profile: `/gsd:set-profile budget`. Disable research and plan-check agents via `/gsd:settings` if the domain is familiar to you (or to Claude).
414
+
415
+ ### Working on a Sensitive/Private Project
416
+
417
+ Set `planning.commit_docs` to `false` during `/gsd:new-project` or via `/gsd:settings`. Add `.planning/` to your `.gitignore`. Planning artifacts stay local and never touch git.
418
+
419
+ ### GSD Update Overwrote My Local Changes
420
+
421
+ Since v1.17, the installer backs up locally modified files to `gsd-local-patches/`. Run `/gsd:reapply-patches` to merge your changes back.
422
+
423
+ ### Subagent Appears to Fail but Work Was Done
424
+
425
+ This is a known Claude Code classification bug: a subagent can be reported as failed even though its work completed. As a workaround, GSD's orchestrators (execute-phase, quick) spot-check actual output before reporting failure. If you see a failure message but commits were made, check `git log` -- the work may have succeeded.
426
+
427
+ ---
428
+
429
+ ## Recovery Quick Reference
430
+
431
+ | Problem | Solution |
432
+ |---------|----------|
433
+ | Lost context / new session | `/gsd:resume-work` or `/gsd:progress` |
434
+ | Phase went wrong | `git revert` the phase commits, then re-plan |
435
+ | Need to change scope | `/gsd:add-phase`, `/gsd:insert-phase`, or `/gsd:remove-phase` |
436
+ | Milestone audit found gaps | `/gsd:plan-milestone-gaps` |
437
+ | Something broke | `/gsd:debug "description"` |
438
+ | Quick targeted fix | `/gsd:quick` |
439
+ | Plan doesn't match your vision | `/gsd:discuss-phase [N]` then re-plan |
440
+ | Costs running high | `/gsd:set-profile budget` and `/gsd:settings` to toggle agents off |
441
+ | Update broke local changes | `/gsd:reapply-patches` |
442
+
443
+ ---
444
+
445
+ ## Project File Structure
446
+
447
+ For reference, here is what GSD creates in your project:
448
+
449
+ ```
450
+ .planning/
451
+ PROJECT.md # Project vision and context (always loaded)
452
+ REQUIREMENTS.md # Scoped v1/v2 requirements with IDs
453
+ ROADMAP.md # Phase breakdown with status tracking
454
+ STATE.md # Decisions, blockers, session memory
455
+ config.json # Workflow configuration
456
+ MILESTONES.md # Completed milestone archive
457
+ research/ # Domain research from /gsd:new-project
458
+ todos/
459
+ pending/ # Captured ideas awaiting work
460
+ done/ # Completed todos
461
+ debug/ # Active debug sessions
462
+ resolved/ # Archived debug sessions
463
+ codebase/ # Brownfield codebase mapping (from /gsd:map-codebase)
464
+ phases/
465
+ XX-phase-name/
466
+ XX-YY-PLAN.md # Atomic execution plans
467
+ XX-YY-SUMMARY.md # Execution outcomes and decisions
468
+ CONTEXT.md # Your implementation preferences
469
+ RESEARCH.md # Ecosystem research findings
470
+ VERIFICATION.md # Post-execution verification results
471
+ ```
@@ -0,0 +1,96 @@
1
+ # Context Window Monitor
2
+
3
+ A PostToolUse hook that warns the agent when context window usage is high.
4
+
5
+ ## Problem
6
+
7
+ The statusline shows context usage to the **user**, but the **agent** has no awareness of context limits. When context runs low, the agent continues working until it hits the wall — potentially mid-task with no state saved.
8
+
9
+ ## How It Works
10
+
11
+ 1. The statusline hook writes context metrics to `/tmp/claude-ctx-{session_id}.json`
12
+ 2. After each tool use, the context monitor reads these metrics
13
+ 3. When remaining context drops below thresholds, it injects a warning as `additionalContext`
14
+ 4. The agent receives the warning in its conversation and can act accordingly
15
+
16
+ ## Thresholds
17
+
18
+ | Level | Remaining | Agent Behavior |
19
+ |-------|-----------|----------------|
20
+ | Normal | > 35% | No warning |
21
+ | WARNING | <= 35% and > 25% | Wrap up current task, avoid starting new complex work |
22
+ | CRITICAL | <= 25% | Stop immediately, save state (`/gsd:pause-work`) |
23
+
24
+ ## Debounce
25
+
26
+ To avoid spamming the agent with repeated warnings:
27
+ - First warning always fires immediately
28
+ - Subsequent warnings require 5 tool uses between them
29
+ - Severity escalation (WARNING -> CRITICAL) bypasses debounce
30
+
31
+ ## Architecture
32
+
33
+ ```
34
+ Statusline Hook (gsd-statusline.js)
35
+ | writes
36
+ v
37
+ /tmp/claude-ctx-{session_id}.json
38
+ ^ reads
39
+ |
40
+ Context Monitor (gsd-context-monitor.js, PostToolUse)
41
+ | injects
42
+ v
43
+ additionalContext -> Agent sees warning
44
+ ```
45
+
46
+ The bridge file is a simple JSON object:
47
+
48
+ ```json
49
+ {
50
+ "session_id": "abc123",
51
+ "remaining_percentage": 28.5,
52
+ "used_pct": 71,
53
+ "timestamp": 1708200000
54
+ }
55
+ ```
56
+
57
+ ## Integration with GSD
58
+
59
+ GSD's `/gsd:pause-work` command saves execution state. The WARNING message suggests using it. The CRITICAL message instructs immediate state save.
60
+
61
+ ## Setup
62
+
63
+ Both hooks are automatically registered during `npx get-shit-done-cc` installation:
64
+
65
+ - **Statusline** (writes bridge file): Registered as `statusLine` in settings.json
66
+ - **Context Monitor** (reads bridge file): Registered as `PostToolUse` hook in settings.json
67
+
68
+ Manual registration in `~/.claude/settings.json`:
69
+
70
+ ```json
71
+ {
72
+ "statusLine": {
73
+ "type": "command",
74
+ "command": "node ~/.claude/hooks/gsd-statusline.js"
75
+ },
76
+ "hooks": {
77
+ "PostToolUse": [
78
+ {
79
+ "hooks": [
80
+ {
81
+ "type": "command",
82
+ "command": "node ~/.claude/hooks/gsd-context-monitor.js"
83
+ }
84
+ ]
85
+ }
86
+ ]
87
+ }
88
+ }
89
+ ```
90
+
91
+ ## Safety
92
+
93
+ - The hook wraps everything in try/catch and exits silently on error
94
+ - It never blocks tool execution — a broken monitor should not break the agent's workflow
95
+ - Stale metrics (older than 60s) are ignored
96
+ - Missing bridge files are handled gracefully (subagents, fresh sessions)