gsd-trae 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/settings.local.json +8 -0
- package/.gitmodules +6 -0
- package/.trae/project_rules.md +56 -0
- package/.trae/rules/project_rules.md +56 -0
- package/.vscode/code-counter/code-counter.db +0 -0
- package/.vscode/settings.json +5 -0
- package/README.md +193 -0
- package/bin/cli.js +13 -0
- package/install.sh +77 -0
- package/package.json +29 -0
- package/refs/gsd/.github/CODEOWNERS +2 -0
- package/refs/gsd/.github/FUNDING.yml +1 -0
- package/refs/gsd/.github/ISSUE_TEMPLATE/bug_report.yml +59 -0
- package/refs/gsd/.github/ISSUE_TEMPLATE/feature_request.yml +37 -0
- package/refs/gsd/.github/pull_request_template.md +24 -0
- package/refs/gsd/.github/workflows/auto-label-issues.yml +21 -0
- package/refs/gsd/CHANGELOG.md +1520 -0
- package/refs/gsd/LICENSE +21 -0
- package/refs/gsd/README.md +704 -0
- package/refs/gsd/SECURITY.md +33 -0
- package/refs/gsd/agents/gsd-codebase-mapper.md +764 -0
- package/refs/gsd/agents/gsd-debugger.md +1246 -0
- package/refs/gsd/agents/gsd-executor.md +469 -0
- package/refs/gsd/agents/gsd-integration-checker.md +443 -0
- package/refs/gsd/agents/gsd-phase-researcher.md +546 -0
- package/refs/gsd/agents/gsd-plan-checker.md +690 -0
- package/refs/gsd/agents/gsd-planner.md +1275 -0
- package/refs/gsd/agents/gsd-project-researcher.md +621 -0
- package/refs/gsd/agents/gsd-research-synthesizer.md +239 -0
- package/refs/gsd/agents/gsd-roadmapper.md +642 -0
- package/refs/gsd/agents/gsd-verifier.md +573 -0
- package/refs/gsd/assets/gsd-logo-2000-transparent.png +0 -0
- package/refs/gsd/assets/gsd-logo-2000-transparent.svg +17 -0
- package/refs/gsd/assets/gsd-logo-2000.png +0 -0
- package/refs/gsd/assets/gsd-logo-2000.svg +21 -0
- package/refs/gsd/assets/terminal.svg +68 -0
- package/refs/gsd/bin/install.js +2090 -0
- package/refs/gsd/commands/gsd/add-phase.md +43 -0
- package/refs/gsd/commands/gsd/add-tests.md +41 -0
- package/refs/gsd/commands/gsd/add-todo.md +47 -0
- package/refs/gsd/commands/gsd/audit-milestone.md +36 -0
- package/refs/gsd/commands/gsd/check-todos.md +45 -0
- package/refs/gsd/commands/gsd/cleanup.md +18 -0
- package/refs/gsd/commands/gsd/complete-milestone.md +136 -0
- package/refs/gsd/commands/gsd/debug.md +167 -0
- package/refs/gsd/commands/gsd/discuss-phase.md +83 -0
- package/refs/gsd/commands/gsd/execute-phase.md +41 -0
- package/refs/gsd/commands/gsd/health.md +22 -0
- package/refs/gsd/commands/gsd/help.md +22 -0
- package/refs/gsd/commands/gsd/insert-phase.md +32 -0
- package/refs/gsd/commands/gsd/join-discord.md +18 -0
- package/refs/gsd/commands/gsd/list-phase-assumptions.md +46 -0
- package/refs/gsd/commands/gsd/map-codebase.md +71 -0
- package/refs/gsd/commands/gsd/new-milestone.md +44 -0
- package/refs/gsd/commands/gsd/new-project.md +42 -0
- package/refs/gsd/commands/gsd/new-project.md.bak +1041 -0
- package/refs/gsd/commands/gsd/pause-work.md +38 -0
- package/refs/gsd/commands/gsd/plan-milestone-gaps.md +34 -0
- package/refs/gsd/commands/gsd/plan-phase.md +45 -0
- package/refs/gsd/commands/gsd/progress.md +24 -0
- package/refs/gsd/commands/gsd/quick.md +41 -0
- package/refs/gsd/commands/gsd/reapply-patches.md +110 -0
- package/refs/gsd/commands/gsd/remove-phase.md +31 -0
- package/refs/gsd/commands/gsd/research-phase.md +189 -0
- package/refs/gsd/commands/gsd/resume-work.md +40 -0
- package/refs/gsd/commands/gsd/set-profile.md +34 -0
- package/refs/gsd/commands/gsd/settings.md +36 -0
- package/refs/gsd/commands/gsd/update.md +37 -0
- package/refs/gsd/commands/gsd/verify-work.md +38 -0
- package/refs/gsd/docs/USER-GUIDE.md +471 -0
- package/refs/gsd/docs/context-monitor.md +96 -0
- package/refs/gsd/get-shit-done/bin/gsd-tools.cjs +585 -0
- package/refs/gsd/get-shit-done/bin/lib/commands.cjs +553 -0
- package/refs/gsd/get-shit-done/bin/lib/config.cjs +162 -0
- package/refs/gsd/get-shit-done/bin/lib/core.cjs +411 -0
- package/refs/gsd/get-shit-done/bin/lib/frontmatter.cjs +299 -0
- package/refs/gsd/get-shit-done/bin/lib/init.cjs +710 -0
- package/refs/gsd/get-shit-done/bin/lib/milestone.cjs +215 -0
- package/refs/gsd/get-shit-done/bin/lib/phase.cjs +870 -0
- package/refs/gsd/get-shit-done/bin/lib/roadmap.cjs +298 -0
- package/refs/gsd/get-shit-done/bin/lib/state.cjs +521 -0
- package/refs/gsd/get-shit-done/bin/lib/template.cjs +222 -0
- package/refs/gsd/get-shit-done/bin/lib/verify.cjs +772 -0
- package/refs/gsd/get-shit-done/references/checkpoints.md +776 -0
- package/refs/gsd/get-shit-done/references/continuation-format.md +249 -0
- package/refs/gsd/get-shit-done/references/decimal-phase-calculation.md +65 -0
- package/refs/gsd/get-shit-done/references/git-integration.md +248 -0
- package/refs/gsd/get-shit-done/references/git-planning-commit.md +38 -0
- package/refs/gsd/get-shit-done/references/model-profile-resolution.md +34 -0
- package/refs/gsd/get-shit-done/references/model-profiles.md +92 -0
- package/refs/gsd/get-shit-done/references/phase-argument-parsing.md +61 -0
- package/refs/gsd/get-shit-done/references/planning-config.md +196 -0
- package/refs/gsd/get-shit-done/references/questioning.md +145 -0
- package/refs/gsd/get-shit-done/references/tdd.md +263 -0
- package/refs/gsd/get-shit-done/references/ui-brand.md +160 -0
- package/refs/gsd/get-shit-done/references/verification-patterns.md +612 -0
- package/refs/gsd/get-shit-done/templates/DEBUG.md +164 -0
- package/refs/gsd/get-shit-done/templates/UAT.md +247 -0
- package/refs/gsd/get-shit-done/templates/VALIDATION.md +76 -0
- package/refs/gsd/get-shit-done/templates/codebase/architecture.md +255 -0
- package/refs/gsd/get-shit-done/templates/codebase/concerns.md +310 -0
- package/refs/gsd/get-shit-done/templates/codebase/conventions.md +307 -0
- package/refs/gsd/get-shit-done/templates/codebase/integrations.md +280 -0
- package/refs/gsd/get-shit-done/templates/codebase/stack.md +186 -0
- package/refs/gsd/get-shit-done/templates/codebase/structure.md +285 -0
- package/refs/gsd/get-shit-done/templates/codebase/testing.md +480 -0
- package/refs/gsd/get-shit-done/templates/config.json +37 -0
- package/refs/gsd/get-shit-done/templates/context.md +283 -0
- package/refs/gsd/get-shit-done/templates/continue-here.md +78 -0
- package/refs/gsd/get-shit-done/templates/debug-subagent-prompt.md +91 -0
- package/refs/gsd/get-shit-done/templates/discovery.md +146 -0
- package/refs/gsd/get-shit-done/templates/milestone-archive.md +123 -0
- package/refs/gsd/get-shit-done/templates/milestone.md +115 -0
- package/refs/gsd/get-shit-done/templates/phase-prompt.md +569 -0
- package/refs/gsd/get-shit-done/templates/planner-subagent-prompt.md +117 -0
- package/refs/gsd/get-shit-done/templates/project.md +184 -0
- package/refs/gsd/get-shit-done/templates/requirements.md +231 -0
- package/refs/gsd/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -0
- package/refs/gsd/get-shit-done/templates/research-project/FEATURES.md +147 -0
- package/refs/gsd/get-shit-done/templates/research-project/PITFALLS.md +200 -0
- package/refs/gsd/get-shit-done/templates/research-project/STACK.md +120 -0
- package/refs/gsd/get-shit-done/templates/research-project/SUMMARY.md +170 -0
- package/refs/gsd/get-shit-done/templates/research.md +552 -0
- package/refs/gsd/get-shit-done/templates/retrospective.md +54 -0
- package/refs/gsd/get-shit-done/templates/roadmap.md +202 -0
- package/refs/gsd/get-shit-done/templates/state.md +176 -0
- package/refs/gsd/get-shit-done/templates/summary-complex.md +59 -0
- package/refs/gsd/get-shit-done/templates/summary-minimal.md +41 -0
- package/refs/gsd/get-shit-done/templates/summary-standard.md +48 -0
- package/refs/gsd/get-shit-done/templates/summary.md +248 -0
- package/refs/gsd/get-shit-done/templates/user-setup.md +311 -0
- package/refs/gsd/get-shit-done/templates/verification-report.md +322 -0
- package/refs/gsd/get-shit-done/workflows/add-phase.md +111 -0
- package/refs/gsd/get-shit-done/workflows/add-tests.md +350 -0
- package/refs/gsd/get-shit-done/workflows/add-todo.md +157 -0
- package/refs/gsd/get-shit-done/workflows/audit-milestone.md +297 -0
- package/refs/gsd/get-shit-done/workflows/check-todos.md +176 -0
- package/refs/gsd/get-shit-done/workflows/cleanup.md +152 -0
- package/refs/gsd/get-shit-done/workflows/complete-milestone.md +763 -0
- package/refs/gsd/get-shit-done/workflows/diagnose-issues.md +219 -0
- package/refs/gsd/get-shit-done/workflows/discovery-phase.md +289 -0
- package/refs/gsd/get-shit-done/workflows/discuss-phase.md +542 -0
- package/refs/gsd/get-shit-done/workflows/execute-phase.md +449 -0
- package/refs/gsd/get-shit-done/workflows/execute-plan.md +448 -0
- package/refs/gsd/get-shit-done/workflows/health.md +156 -0
- package/refs/gsd/get-shit-done/workflows/help.md +489 -0
- package/refs/gsd/get-shit-done/workflows/insert-phase.md +129 -0
- package/refs/gsd/get-shit-done/workflows/list-phase-assumptions.md +178 -0
- package/refs/gsd/get-shit-done/workflows/map-codebase.md +315 -0
- package/refs/gsd/get-shit-done/workflows/new-milestone.md +382 -0
- package/refs/gsd/get-shit-done/workflows/new-project.md +1116 -0
- package/refs/gsd/get-shit-done/workflows/pause-work.md +122 -0
- package/refs/gsd/get-shit-done/workflows/plan-milestone-gaps.md +274 -0
- package/refs/gsd/get-shit-done/workflows/plan-phase.md +569 -0
- package/refs/gsd/get-shit-done/workflows/progress.md +381 -0
- package/refs/gsd/get-shit-done/workflows/quick.md +453 -0
- package/refs/gsd/get-shit-done/workflows/remove-phase.md +154 -0
- package/refs/gsd/get-shit-done/workflows/research-phase.md +73 -0
- package/refs/gsd/get-shit-done/workflows/resume-project.md +306 -0
- package/refs/gsd/get-shit-done/workflows/set-profile.md +80 -0
- package/refs/gsd/get-shit-done/workflows/settings.md +213 -0
- package/refs/gsd/get-shit-done/workflows/transition.md +544 -0
- package/refs/gsd/get-shit-done/workflows/update.md +219 -0
- package/refs/gsd/get-shit-done/workflows/verify-phase.md +242 -0
- package/refs/gsd/get-shit-done/workflows/verify-work.md +569 -0
- package/refs/gsd/hooks/gsd-check-update.js +62 -0
- package/refs/gsd/hooks/gsd-context-monitor.js +122 -0
- package/refs/gsd/hooks/gsd-statusline.js +108 -0
- package/refs/gsd/package.json +50 -0
- package/refs/gsd/scripts/build-hooks.js +43 -0
- package/refs/gsd/tests/commands.test.cjs +661 -0
- package/refs/gsd/tests/helpers.cjs +40 -0
- package/refs/gsd/tests/init.test.cjs +205 -0
- package/refs/gsd/tests/milestone.test.cjs +98 -0
- package/refs/gsd/tests/phase.test.cjs +1241 -0
- package/refs/gsd/tests/roadmap.test.cjs +265 -0
- package/refs/gsd/tests/state.test.cjs +302 -0
- package/refs/gsd/tests/verify.test.cjs +80 -0
- package/refs/vbenchmark/.agent/agents/codebase-explorer.md +224 -0
- package/refs/vbenchmark/.agent/agents/debugger.md +180 -0
- package/refs/vbenchmark/.agent/agents/documenter.md +166 -0
- package/refs/vbenchmark/.agent/agents/implementer.md +70 -0
- package/refs/vbenchmark/.agent/agents/orchestrator.md +212 -0
- package/refs/vbenchmark/.agent/agents/researcher.md +80 -0
- package/refs/vbenchmark/.agent/agents/reviewer.md +184 -0
- package/refs/vbenchmark/.agent/agents/tester.md +170 -0
- package/refs/vbenchmark/.agent/commands/commit.md +29 -0
- package/refs/vbenchmark/.agent/commands/debug.md +59 -0
- package/refs/vbenchmark/.agent/commands/document.md +52 -0
- package/refs/vbenchmark/.agent/commands/gather-context.md +58 -0
- package/refs/vbenchmark/.agent/commands/init.md +56 -0
- package/refs/vbenchmark/.agent/commands/preset-help.md +50 -0
- package/refs/vbenchmark/.agent/commands/refactor.md +71 -0
- package/refs/vbenchmark/.agent/commands/research.md +37 -0
- package/refs/vbenchmark/.agent/commands/review.md +38 -0
- package/refs/vbenchmark/.agent/commands/test.md +61 -0
- package/refs/vbenchmark/.agent/rules/01-code-quality.md +33 -0
- package/refs/vbenchmark/.agent/rules/02-typescript-go.md +46 -0
- package/refs/vbenchmark/.agent/rules/03-security-git.md +34 -0
- package/refs/vbenchmark/.agent/rules/04-architecture.md +40 -0
- package/refs/vbenchmark/.agent/sync.js +536 -0
- package/refs/vbenchmark/.agent/workflows/commit.md +29 -0
- package/refs/vbenchmark/.agent/workflows/debug.md +59 -0
- package/refs/vbenchmark/.agent/workflows/document.md +52 -0
- package/refs/vbenchmark/.agent/workflows/gather-context.md +58 -0
- package/refs/vbenchmark/.agent/workflows/init.md +56 -0
- package/refs/vbenchmark/.agent/workflows/preset-help.md +50 -0
- package/refs/vbenchmark/.agent/workflows/refactor.md +71 -0
- package/refs/vbenchmark/.agent/workflows/research.md +37 -0
- package/refs/vbenchmark/.agent/workflows/review.md +38 -0
- package/refs/vbenchmark/.agent/workflows/test.md +61 -0
- package/refs/vbenchmark/.claude/commands/agentic-dev/apply.md +222 -0
- package/refs/vbenchmark/.claude/commands/agentic-dev/done.md +166 -0
- package/refs/vbenchmark/.claude/commands/agentic-dev/proposal.md +220 -0
- package/refs/vbenchmark/.claude/commands/openspec/apply.md +23 -0
- package/refs/vbenchmark/.claude/commands/openspec/archive.md +27 -0
- package/refs/vbenchmark/.claude/commands/openspec/proposal.md +28 -0
- package/refs/vbenchmark/.clinerules/01-rules.md +73 -0
- package/refs/vbenchmark/.clinerules/02-agents.md +34 -0
- package/refs/vbenchmark/.cursor/commands/commit.md +29 -0
- package/refs/vbenchmark/.cursor/commands/debug.md +59 -0
- package/refs/vbenchmark/.cursor/commands/document.md +52 -0
- package/refs/vbenchmark/.cursor/commands/gather-context.md +58 -0
- package/refs/vbenchmark/.cursor/commands/init.md +56 -0
- package/refs/vbenchmark/.cursor/commands/preset-help.md +50 -0
- package/refs/vbenchmark/.cursor/commands/refactor.md +71 -0
- package/refs/vbenchmark/.cursor/commands/research.md +37 -0
- package/refs/vbenchmark/.cursor/commands/review.md +38 -0
- package/refs/vbenchmark/.cursor/commands/test.md +61 -0
- package/refs/vbenchmark/.cursor/rules/agents.mdc +1357 -0
- package/refs/vbenchmark/.factory/droids/codebase-explorer.md +224 -0
- package/refs/vbenchmark/.factory/droids/debugger.md +180 -0
- package/refs/vbenchmark/.factory/droids/documenter.md +166 -0
- package/refs/vbenchmark/.factory/droids/implementer.md +70 -0
- package/refs/vbenchmark/.factory/droids/orchestrator.md +212 -0
- package/refs/vbenchmark/.factory/droids/researcher.md +80 -0
- package/refs/vbenchmark/.factory/droids/reviewer.md +184 -0
- package/refs/vbenchmark/.factory/droids/tester.md +170 -0
- package/refs/vbenchmark/.gemini/workflows/commit.md +29 -0
- package/refs/vbenchmark/.gemini/workflows/debug.md +59 -0
- package/refs/vbenchmark/.gemini/workflows/document.md +52 -0
- package/refs/vbenchmark/.gemini/workflows/gather-context.md +58 -0
- package/refs/vbenchmark/.gemini/workflows/init.md +56 -0
- package/refs/vbenchmark/.gemini/workflows/preset-help.md +50 -0
- package/refs/vbenchmark/.gemini/workflows/refactor.md +71 -0
- package/refs/vbenchmark/.gemini/workflows/research.md +37 -0
- package/refs/vbenchmark/.gemini/workflows/review.md +38 -0
- package/refs/vbenchmark/.gemini/workflows/test.md +61 -0
- package/refs/vbenchmark/.github/CODEOWNERS +20 -0
- package/refs/vbenchmark/.github/FUNDING.yml +4 -0
- package/refs/vbenchmark/.github/ISSUE_TEMPLATE/bug-report.yml +76 -0
- package/refs/vbenchmark/.github/ISSUE_TEMPLATE/new-task.yml +106 -0
- package/refs/vbenchmark/.github/PULL_REQUEST_TEMPLATE.md +38 -0
- package/refs/vbenchmark/.github/copilot-instructions.md +73 -0
- package/refs/vbenchmark/.github/workflows/ci.yaml +33 -0
- package/refs/vbenchmark/.github/workflows/vercel-auto-pr.yml +478 -0
- package/refs/vbenchmark/.github/workflows/vercel-deploy.yaml +487 -0
- package/refs/vbenchmark/.github/workflows/vercel-pr-command.yaml +337 -0
- package/refs/vbenchmark/.github/workflows/vercel-project-init.yaml +208 -0
- package/refs/vbenchmark/.opencode/agent/codebase-explorer.md +224 -0
- package/refs/vbenchmark/.opencode/agent/debugger.md +180 -0
- package/refs/vbenchmark/.opencode/agent/documenter.md +166 -0
- package/refs/vbenchmark/.opencode/agent/implementer.md +70 -0
- package/refs/vbenchmark/.opencode/agent/orchestrator.md +212 -0
- package/refs/vbenchmark/.opencode/agent/researcher.md +80 -0
- package/refs/vbenchmark/.opencode/agent/reviewer.md +184 -0
- package/refs/vbenchmark/.opencode/agent/tester.md +170 -0
- package/refs/vbenchmark/.opencode/command/commit.md +29 -0
- package/refs/vbenchmark/.opencode/command/debug.md +59 -0
- package/refs/vbenchmark/.opencode/command/document.md +52 -0
- package/refs/vbenchmark/.opencode/command/gather-context.md +58 -0
- package/refs/vbenchmark/.opencode/command/init.md +56 -0
- package/refs/vbenchmark/.opencode/command/preset-help.md +50 -0
- package/refs/vbenchmark/.opencode/command/refactor.md +71 -0
- package/refs/vbenchmark/.opencode/command/research.md +37 -0
- package/refs/vbenchmark/.opencode/command/review.md +38 -0
- package/refs/vbenchmark/.opencode/command/test.md +61 -0
- package/refs/vbenchmark/.trae/project_rules.md +73 -0
- package/refs/vbenchmark/.windsurf/rules/rules.md +85 -0
- package/refs/vbenchmark/AGENTS.md +73 -0
- package/refs/vbenchmark/CONTRIBUTING.md +332 -0
- package/refs/vbenchmark/Caddyfile +3 -0
- package/refs/vbenchmark/LICENSE +47 -0
- package/refs/vbenchmark/README.md +354 -0
- package/refs/vbenchmark/docker-compose.prod.yaml +35 -0
- package/refs/vbenchmark/docker-compose.yaml +53 -0
- package/refs/vbenchmark/docs/TASK_EXPANSION_PLAN.md +211 -0
- package/refs/vbenchmark/docs/THESIS.md +441 -0
- package/refs/vbenchmark/docs/categories/code-evolution.md +138 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/design.md +111 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/proposal.md +15 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/evaluation/spec.md +105 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/leaderboard/spec.md +68 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/task-definition/spec.md +45 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/specs/task-runner/spec.md +49 -0
- package/refs/vbenchmark/openspec/changes/init-vibecodingbench/tasks.md +413 -0
- package/refs/vbenchmark/package.json +51 -0
- package/refs/vbenchmark/packages/cli/eslint.config.js +16 -0
- package/refs/vbenchmark/packages/cli/package.json +35 -0
- package/refs/vbenchmark/packages/cli/src/agents/index.ts +655 -0
- package/refs/vbenchmark/packages/cli/src/commands/eval.ts +197 -0
- package/refs/vbenchmark/packages/cli/src/commands/list.ts +63 -0
- package/refs/vbenchmark/packages/cli/src/commands/run.ts +147 -0
- package/refs/vbenchmark/packages/cli/src/evaluator.ts +125 -0
- package/refs/vbenchmark/packages/cli/src/index.ts +21 -0
- package/refs/vbenchmark/packages/cli/src/lib/task-variation.ts +153 -0
- package/refs/vbenchmark/packages/cli/src/loader.ts +258 -0
- package/refs/vbenchmark/packages/cli/src/reporter.ts +222 -0
- package/refs/vbenchmark/packages/cli/src/runtime/docker.ts +385 -0
- package/refs/vbenchmark/packages/cli/tsconfig.json +8 -0
- package/refs/vbenchmark/packages/dashboard/Dockerfile +42 -0
- package/refs/vbenchmark/packages/dashboard/index.html +21 -0
- package/refs/vbenchmark/packages/dashboard/package.json +29 -0
- package/refs/vbenchmark/packages/dashboard/postcss.config.js +6 -0
- package/refs/vbenchmark/packages/dashboard/public/favicon.svg +24 -0
- package/refs/vbenchmark/packages/dashboard/public/logo.png +0 -0
- package/refs/vbenchmark/packages/dashboard/public/logo.svg +39 -0
- package/refs/vbenchmark/packages/dashboard/src/App.tsx +1468 -0
- package/refs/vbenchmark/packages/dashboard/src/data/category-performance.json +1 -0
- package/refs/vbenchmark/packages/dashboard/src/data/leaderboard.json +1 -0
- package/refs/vbenchmark/packages/dashboard/src/data/task-results.json +1 -0
- package/refs/vbenchmark/packages/dashboard/src/data/tasks.json +1 -0
- package/refs/vbenchmark/packages/dashboard/src/index.css +3 -0
- package/refs/vbenchmark/packages/dashboard/src/main.tsx +13 -0
- package/refs/vbenchmark/packages/dashboard/src/vite-env.d.ts +9 -0
- package/refs/vbenchmark/packages/dashboard/tailwind.config.js +11 -0
- package/refs/vbenchmark/packages/dashboard/tsconfig.json +21 -0
- package/refs/vbenchmark/packages/dashboard/tsconfig.node.json +11 -0
- package/refs/vbenchmark/packages/dashboard/vercel.json +6 -0
- package/refs/vbenchmark/packages/dashboard/vite.config.ts +28 -0
- package/refs/vbenchmark/packages/evaluator/eslint.config.js +16 -0
- package/refs/vbenchmark/packages/evaluator/package.json +24 -0
- package/refs/vbenchmark/packages/evaluator/src/index.ts +15 -0
- package/refs/vbenchmark/packages/evaluator/src/runners/functional.ts +88 -0
- package/refs/vbenchmark/packages/evaluator/src/runners/quality.ts +140 -0
- package/refs/vbenchmark/packages/evaluator/src/runners/security.ts +94 -0
- package/refs/vbenchmark/packages/evaluator/src/runners/visual.ts +108 -0
- package/refs/vbenchmark/packages/evaluator/src/types.d.ts +19 -0
- package/refs/vbenchmark/packages/evaluator/tsconfig.json +8 -0
- package/refs/vbenchmark/packages/leaderboard/Dockerfile +38 -0
- package/refs/vbenchmark/packages/leaderboard/drizzle.config.ts +10 -0
- package/refs/vbenchmark/packages/leaderboard/eslint.config.js +16 -0
- package/refs/vbenchmark/packages/leaderboard/fly.toml +29 -0
- package/refs/vbenchmark/packages/leaderboard/package.json +36 -0
- package/refs/vbenchmark/packages/leaderboard/src/app.ts +29 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/BrowserPreview.tsx +190 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/ComparisonView.tsx +205 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/LeaderboardTable.tsx +150 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/LiveRunCard.tsx +133 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/SubmissionForm.tsx +406 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/SubmitForm.tsx +293 -0
- package/refs/vbenchmark/packages/leaderboard/src/components/TerminalStream.tsx +111 -0
- package/refs/vbenchmark/packages/leaderboard/src/config/pricing.ts +206 -0
- package/refs/vbenchmark/packages/leaderboard/src/db/index.ts +31 -0
- package/refs/vbenchmark/packages/leaderboard/src/db/schema.ts +125 -0
- package/refs/vbenchmark/packages/leaderboard/src/index.ts +13 -0
- package/refs/vbenchmark/packages/leaderboard/src/lib/websocket.ts +124 -0
- package/refs/vbenchmark/packages/leaderboard/src/routes/leaderboard.ts +698 -0
- package/refs/vbenchmark/packages/leaderboard/src/routes/live.ts +175 -0
- package/refs/vbenchmark/packages/leaderboard/src/routes/submissions.ts +183 -0
- package/refs/vbenchmark/packages/leaderboard/src/routes/tasks.ts +215 -0
- package/refs/vbenchmark/packages/leaderboard/tests/api.test.ts +228 -0
- package/refs/vbenchmark/packages/leaderboard/tsconfig.json +9 -0
- package/refs/vbenchmark/scripts/deploy.sh +70 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/context-management/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/context-management/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/evaluation-framework/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/evaluation-framework/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/guardrails-safety/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/guardrails-safety/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/memory-system/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/memory-system/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/model-routing/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/model-routing/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/multi-agent-system/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/multi-agent-system/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/prompt-optimization/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/prompt-optimization/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/reasoning-chain/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/reasoning-chain/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/streaming-pipeline/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/streaming-pipeline/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/tool-use-orchestration/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/ai-integration/advanced/tool-use-orchestration/task.yaml +16 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/code-review-agent/PROMPT.md +64 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/code-review-agent/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/research-agent/PROMPT.md +61 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/research-agent/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/web-scraper-agent/PROMPT.md +57 -0
- package/refs/vbenchmark/tasks/ai-integration/agents/web-scraper-agent/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/duplicate-detection/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/duplicate-detection/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/recommendation-engine/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/recommendation-engine/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/semantic-search/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/ai-integration/embeddings/semantic-search/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/fine-tuning/classification-model/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/ai-integration/fine-tuning/classification-model/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/api-orchestrator/PROMPT.md +60 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/api-orchestrator/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/calendar-assistant/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/calendar-assistant/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/database-query/PROMPT.md +62 -0
- package/refs/vbenchmark/tasks/ai-integration/function-calling/database-query/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/multimodal/chart-interpreter/PROMPT.md +60 -0
- package/refs/vbenchmark/tasks/ai-integration/multimodal/chart-interpreter/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/multimodal/image-captioning/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/ai-integration/multimodal/image-captioning/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/code-assistant/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/code-assistant/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/doc-search/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/doc-search/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/PROMPT.md +76 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/docker-compose.yaml +30 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/task.yaml +30 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/pdf-qa/tests/functional/qa.test.py +146 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/support-bot/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/ai-integration/rag-chatbot/support-bot/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/contract-analyzer/PROMPT.md +67 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/contract-analyzer/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/invoice-parser/PROMPT.md +61 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/invoice-parser/task.yaml +27 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/receipt-scanner/PROMPT.md +65 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/receipt-scanner/task.yaml +24 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/resume-parser/PROMPT.md +70 -0
- package/refs/vbenchmark/tasks/ai-integration/structured-output/resume-parser/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-analytics/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-analytics/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-gateway/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-gateway/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-mocking/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/api-mocking/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/contract-testing/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/contract-testing/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/graphql-federation/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/graphql-federation/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/grpc-gateway/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/grpc-gateway/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/rate-limiter/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/rate-limiter/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/request-validator/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/request-validator/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/sdk-generator/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/sdk-generator/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/webhook-processor/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/api-integrations/advanced/webhook-processor/task.yaml +16 -0
- package/refs/vbenchmark/tasks/api-integrations/analytics/mixpanel-events/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/analytics/mixpanel-events/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/analytics/segment-tracking/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/analytics/segment-tracking/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/oauth2-github/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/oauth2-github/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/okta-integration/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/okta-integration/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/saml-sso/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/auth-provider/saml-sso/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/discord-webhook/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/discord-webhook/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/slack-bot/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/slack-bot/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/twilio-sms/PROMPT.md +42 -0
- package/refs/vbenchmark/tasks/api-integrations/communication/twilio-sms/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/email/transactional/PROMPT.md +82 -0
- package/refs/vbenchmark/tasks/api-integrations/email/transactional/task.yaml +27 -0
- package/refs/vbenchmark/tasks/api-integrations/maps/google-maps-geocoding/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/maps/google-maps-geocoding/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/maps/mapbox-directions/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/maps/mapbox-directions/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/payment/crypto-payments/PROMPT.md +43 -0
- package/refs/vbenchmark/tasks/api-integrations/payment/crypto-payments/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/payment/paypal-integration/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/payment/paypal-integration/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/social/twitter-api/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/social/twitter-api/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/cloudinary-upload/PROMPT.md +43 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/cloudinary-upload/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/gcs-streaming/PROMPT.md +43 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/gcs-streaming/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/s3-presigned-urls/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/storage/s3-presigned-urls/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/checkout-session/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/checkout-session/task.yaml +24 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/PROMPT.md +60 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/docker-compose.yaml +38 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/task.yaml +31 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/payment-webhook/tests/webhook.test.ts +193 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/subscription-portal/PROMPT.md +41 -0
- package/refs/vbenchmark/tasks/api-integrations/stripe/subscription-portal/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/api-deprecation/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/api-deprecation/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/ast-refactoring/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/ast-refactoring/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/concurrency-fix/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/concurrency-fix/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/database-schema-migration/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/database-schema-migration/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/dead-code-elimination/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/dead-code-elimination/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/dependency-upgrade/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/dependency-upgrade/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/memory-optimization/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/memory-optimization/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/monorepo-extraction/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/monorepo-extraction/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/performance-profiling/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/performance-profiling/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/type-migration/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/code-evolution/advanced/type-migration/task.yaml +16 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/callback-to-async/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/callback-to-async/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/base-code/src/app.ts +22 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/task.yaml +37 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/express-to-fastify/tests/api.test.ts +70 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/flask-to-fastapi/PROMPT.md +46 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/flask-to-fastapi/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/java-to-kotlin/PROMPT.md +45 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/java-to-kotlin/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/jquery-to-react/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/jquery-to-react/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/rest-to-grpc/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/legacy-migration/rest-to-grpc/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/async-refactor/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/async-refactor/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/memory-leak-fix/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/memory-leak-fix/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/query-optimization/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/code-evolution/performance/query-optimization/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/class-to-hooks/PROMPT.md +96 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/class-to-hooks/task.yaml +27 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/dependency-injection/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/dependency-injection/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/error-handling/PROMPT.md +48 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/error-handling/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/monolith-to-modules/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/monolith-to-modules/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/orm-migration/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/refactoring/orm-migration/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/security/secrets-rotation/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/code-evolution/security/secrets-rotation/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/security/sql-injection-fix/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/code-evolution/security/sql-injection-fix/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/security/xss-prevention/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/security/xss-prevention/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/add-unit-tests/PROMPT.md +48 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/add-unit-tests/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/e2e-playwright/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/e2e-playwright/task.yaml +24 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/pytest-fixtures/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/code-evolution/testing/pytest-fixtures/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/accessibility/keyboard-shortcuts/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/accessibility/keyboard-shortcuts/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/accessibility/screen-reader-nav/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/accessibility/screen-reader-nav/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/advanced/canvas-editor/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/canvas-editor/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/micro-frontend/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/micro-frontend/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/offline-first/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/offline-first/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/realtime-collab/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/realtime-collab/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/service-worker/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/service-worker/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/state-machine/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/state-machine/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/virtual-list/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/virtual-list/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/wasm-integration/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/wasm-integration/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/web-worker/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/web-worker/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/advanced/webgl-visualization/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/frontend/advanced/webgl-visualization/task.yaml +16 -0
- package/refs/vbenchmark/tasks/frontend/animation/page-transitions/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/animation/page-transitions/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/components/data-grid/PROMPT.md +59 -0
- package/refs/vbenchmark/tasks/frontend/components/data-grid/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/components/date-range-picker/PROMPT.md +57 -0
- package/refs/vbenchmark/tasks/frontend/components/date-range-picker/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/components/file-uploader/PROMPT.md +55 -0
- package/refs/vbenchmark/tasks/frontend/components/file-uploader/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/components/form-builder/PROMPT.md +96 -0
- package/refs/vbenchmark/tasks/frontend/components/form-builder/task.yaml +28 -0
- package/refs/vbenchmark/tasks/frontend/components/rich-text-editor/PROMPT.md +45 -0
- package/refs/vbenchmark/tasks/frontend/components/rich-text-editor/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/dashboard-layout/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/dashboard-layout/task.yaml +25 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/landing-page/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/landing-page/task.yaml +25 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/mobile-app-screen/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/mobile-app-screen/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/PROMPT.md +93 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/docker-compose.yaml +23 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/task.yaml +30 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/tests/visual/diff.test.ts +107 -0
- package/refs/vbenchmark/tasks/frontend/figma-to-code/pricing-card/tests/visual/interaction.test.ts +88 -0
- package/refs/vbenchmark/tasks/frontend/performance/image-lazy-load/PROMPT.md +43 -0
- package/refs/vbenchmark/tasks/frontend/performance/image-lazy-load/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/performance/infinite-scroll/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/performance/infinite-scroll/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/state-management/collaborative-editor/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/state-management/collaborative-editor/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/state-management/shopping-cart/PROMPT.md +53 -0
- package/refs/vbenchmark/tasks/frontend/state-management/shopping-cart/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/visualization/chart-dashboard/PROMPT.md +83 -0
- package/refs/vbenchmark/tasks/frontend/visualization/chart-dashboard/task.yaml +28 -0
- package/refs/vbenchmark/tasks/frontend/visualization/gantt-chart/PROMPT.md +57 -0
- package/refs/vbenchmark/tasks/frontend/visualization/gantt-chart/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/visualization/map-dashboard/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/frontend/visualization/map-dashboard/task.yaml +24 -0
- package/refs/vbenchmark/tasks/frontend/visualization/realtime-charts/PROMPT.md +43 -0
- package/refs/vbenchmark/tasks/frontend/visualization/realtime-charts/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/blue-green-deploy/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/blue-green-deploy/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/canary-release/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/canary-release/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/change-data-capture/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/change-data-capture/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/config-management/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/config-management/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/data-pipeline/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/data-pipeline/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/distributed-tracing/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/distributed-tracing/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/log-aggregation/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/log-aggregation/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/schema-registry/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/schema-registry/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/secret-rotation/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/secret-rotation/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/stream-processing/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/glue-code/advanced/stream-processing/task.yaml +16 -0
- package/refs/vbenchmark/tasks/glue-code/api-sync/rest-to-graphql/PROMPT.md +66 -0
- package/refs/vbenchmark/tasks/glue-code/api-sync/rest-to-graphql/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/caching/redis-cache/PROMPT.md +82 -0
- package/refs/vbenchmark/tasks/glue-code/caching/redis-cache/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/avro-schema-evolution/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/avro-schema-evolution/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/csv-normalizer/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/csv-normalizer/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/PROMPT.md +67 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/task.yaml +28 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/excel-to-json/tests/transform.test.py +137 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/json-to-xml/PROMPT.md +45 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/json-to-xml/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/protobuf-converter/PROMPT.md +44 -0
- package/refs/vbenchmark/tasks/glue-code/data-transform/protobuf-converter/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/etl/cdc-pipeline/PROMPT.md +52 -0
- package/refs/vbenchmark/tasks/glue-code/etl/cdc-pipeline/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/etl/database-sync/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/glue-code/etl/database-sync/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/etl/s3-to-warehouse/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/etl/s3-to-warehouse/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/image-resizer/PROMPT.md +52 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/image-resizer/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/pdf-merger/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/pdf-merger/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/video-transcoder/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/file-processing/video-transcoder/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/migration/data-backfill/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/migration/data-backfill/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/migration/database-versioning/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/migration/database-versioning/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/queue/kafka-producer/PROMPT.md +49 -0
- package/refs/vbenchmark/tasks/glue-code/queue/kafka-producer/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/queue/rabbitmq-consumer/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/glue-code/queue/rabbitmq-consumer/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/queue/sqs-batch-processor/PROMPT.md +47 -0
- package/refs/vbenchmark/tasks/glue-code/queue/sqs-batch-processor/task.yaml +24 -0
- package/refs/vbenchmark/tasks/glue-code/scheduler/cron-job-manager/PROMPT.md +52 -0
- package/refs/vbenchmark/tasks/glue-code/scheduler/cron-job-manager/task.yaml +27 -0
- package/refs/vbenchmark/tasks/glue-code/scheduler/delayed-tasks/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/glue-code/scheduler/delayed-tasks/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/api-versioning/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/api-versioning/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/circuit-breaker/PROMPT.md +13 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/circuit-breaker/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/compliance-gdpr/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/compliance-gdpr/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/cqrs-pattern/PROMPT.md +13 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/cqrs-pattern/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/data-encryption/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/data-encryption/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/distributed-locking/PROMPT.md +46 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/distributed-locking/task.yaml +24 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/event-sourcing/PROMPT.md +23 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/event-sourcing/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/feature-flags-ab/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/feature-flags-ab/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/saga-orchestration/PROMPT.md +13 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/saga-orchestration/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/webhook-delivery/PROMPT.md +15 -0
- package/refs/vbenchmark/tasks/saas-core/advanced/webhook-delivery/task.yaml +16 -0
- package/refs/vbenchmark/tasks/saas-core/audit/activity-logging/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/saas-core/audit/activity-logging/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/jwt-refresh-tokens/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/saas-core/auth/jwt-refresh-tokens/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/magic-link-email/PROMPT.md +53 -0
- package/refs/vbenchmark/tasks/saas-core/auth/magic-link-email/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/mfa-totp/PROMPT.md +79 -0
- package/refs/vbenchmark/tasks/saas-core/auth/mfa-totp/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/rbac-permissions/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/saas-core/auth/rbac-permissions/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/session-management/PROMPT.md +52 -0
- package/refs/vbenchmark/tasks/saas-core/auth/session-management/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/PROMPT.md +45 -0
- package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/docker-compose.yaml +47 -0
- package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/task.yaml +32 -0
- package/refs/vbenchmark/tasks/saas-core/auth/supabase-oauth/tests/auth.test.ts +59 -0
- package/refs/vbenchmark/tasks/saas-core/billing/invoice-generation/PROMPT.md +53 -0
- package/refs/vbenchmark/tasks/saas-core/billing/invoice-generation/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/billing/stripe-subscriptions/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/saas-core/billing/stripe-subscriptions/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/billing/usage-metering/PROMPT.md +52 -0
- package/refs/vbenchmark/tasks/saas-core/billing/usage-metering/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/crud/dashboard-table/PROMPT.md +48 -0
- package/refs/vbenchmark/tasks/saas-core/crud/dashboard-table/task.yaml +28 -0
- package/refs/vbenchmark/tasks/saas-core/multi-tenant/org-isolation/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/saas-core/multi-tenant/org-isolation/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/multi-tenant/subdomain-routing/PROMPT.md +50 -0
- package/refs/vbenchmark/tasks/saas-core/multi-tenant/subdomain-routing/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/email-queue/PROMPT.md +53 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/email-queue/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/in-app-alerts/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/in-app-alerts/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/push-notifications/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/saas-core/notifications/push-notifications/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/realtime/websocket-chat/PROMPT.md +80 -0
- package/refs/vbenchmark/tasks/saas-core/realtime/websocket-chat/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/search/full-text-search/PROMPT.md +51 -0
- package/refs/vbenchmark/tasks/saas-core/search/full-text-search/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/security/rate-limiter/PROMPT.md +99 -0
- package/refs/vbenchmark/tasks/saas-core/security/rate-limiter/task.yaml +27 -0
- package/refs/vbenchmark/tasks/saas-core/settings/user-preferences/PROMPT.md +78 -0
- package/refs/vbenchmark/tasks/saas-core/settings/user-preferences/task.yaml +27 -0
- package/refs/vbenchmark/templates/fastapi-postgres/docker-compose.yaml +36 -0
- package/refs/vbenchmark/templates/fastapi-postgres/pyproject.toml +34 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/__init__.py +0 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/config.py +12 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/database.py +15 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/main.py +51 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/models.py +12 -0
- package/refs/vbenchmark/templates/fastapi-postgres/src/schemas.py +20 -0
- package/refs/vbenchmark/templates/go-fiber/docker-compose.yaml +34 -0
- package/refs/vbenchmark/templates/go-fiber/go.mod +33 -0
- package/refs/vbenchmark/templates/go-fiber/go.sum +68 -0
- package/refs/vbenchmark/templates/go-fiber/main.go +98 -0
- package/refs/vbenchmark/templates/nextjs-supabase/.env.example +3 -0
- package/refs/vbenchmark/templates/nextjs-supabase/docker-compose.yaml +68 -0
- package/refs/vbenchmark/templates/nextjs-supabase/src/app/globals.css +13 -0
- package/refs/vbenchmark/templates/nextjs-supabase/src/app/layout.tsx +19 -0
- package/refs/vbenchmark/templates/nextjs-supabase/src/app/page.tsx +38 -0
- package/refs/vbenchmark/templates/nextjs-supabase/src/lib/supabase/client.ts +8 -0
- package/refs/vbenchmark/templates/nextjs-supabase/src/lib/supabase/server.ts +32 -0
- package/refs/vbenchmark/templates/rust-axum/Cargo.lock +2371 -0
- package/refs/vbenchmark/templates/rust-axum/Cargo.toml +16 -0
- package/refs/vbenchmark/templates/rust-axum/docker-compose.yaml +34 -0
- package/refs/vbenchmark/templates/rust-axum/migrations/20240101000000_init.sql +20 -0
- package/refs/vbenchmark/templates/rust-axum/src/main.rs +121 -0
- package/refs/vbenchmark/tsconfig.base.json +18 -0
- package/refs/vbenchmark/turbo.json +23 -0
- package/refs/vbenchmark/vercel.json +10 -0
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: gsd:verify-work
|
|
3
|
+
description: Validate built features through conversational UAT
|
|
4
|
+
argument-hint: "[phase number, e.g., '4']"
|
|
5
|
+
allowed-tools:
|
|
6
|
+
- Read
|
|
7
|
+
- Bash
|
|
8
|
+
- Glob
|
|
9
|
+
- Grep
|
|
10
|
+
- Edit
|
|
11
|
+
- Write
|
|
12
|
+
- Task
|
|
13
|
+
---
|
|
14
|
+
<objective>
|
|
15
|
+
Validate built features through conversational testing with persistent state.
|
|
16
|
+
|
|
17
|
+
Purpose: Confirm what Claude built actually works from the user's perspective. One test at a time, plain text responses, no interrogation. When issues are found, automatically diagnose, plan fixes, and prepare for execution.
|
|
18
|
+
|
|
19
|
+
Output: {phase_num}-UAT.md tracking all test results. If issues are found: diagnosed gaps and verified fix plans ready for /gsd:execute-phase.
|
|
20
|
+
</objective>
|
|
21
|
+
|
|
22
|
+
<execution_context>
|
|
23
|
+
@~/.claude/get-shit-done/workflows/verify-work.md
|
|
24
|
+
@~/.claude/get-shit-done/templates/UAT.md
|
|
25
|
+
</execution_context>
|
|
26
|
+
|
|
27
|
+
<context>
|
|
28
|
+
Phase: $ARGUMENTS (optional)
|
|
29
|
+
- If provided: Test specific phase (e.g., "4")
|
|
30
|
+
- If not provided: Check for active sessions or prompt for phase
|
|
31
|
+
|
|
32
|
+
Context files are resolved inside the workflow (`init verify-work`) and delegated via `<files_to_read>` blocks.
|
|
33
|
+
</context>
|
|
34
|
+
|
|
35
|
+
<process>
|
|
36
|
+
Execute the verify-work workflow from @~/.claude/get-shit-done/workflows/verify-work.md end-to-end.
|
|
37
|
+
Preserve all workflow gates (session management, test presentation, diagnosis, fix planning, routing).
|
|
38
|
+
</process>
|
|
@@ -0,0 +1,471 @@
|
|
|
1
|
+
# GSD User Guide
|
|
2
|
+
|
|
3
|
+
A detailed reference for workflows, troubleshooting, and configuration. For quick-start setup, see the [README](../README.md).
|
|
4
|
+
|
|
5
|
+
---
|
|
6
|
+
|
|
7
|
+
## Table of Contents
|
|
8
|
+
|
|
9
|
+
- [Workflow Diagrams](#workflow-diagrams)
|
|
10
|
+
- [Command Reference](#command-reference)
|
|
11
|
+
- [Configuration Reference](#configuration-reference)
|
|
12
|
+
- [Usage Examples](#usage-examples)
|
|
13
|
+
- [Troubleshooting](#troubleshooting)
|
|
14
|
+
- [Recovery Quick Reference](#recovery-quick-reference)
|
|
15
|
+
|
|
16
|
+
---
|
|
17
|
+
|
|
18
|
+
## Workflow Diagrams
|
|
19
|
+
|
|
20
|
+
### Full Project Lifecycle
|
|
21
|
+
|
|
22
|
+
```
|
|
23
|
+
┌──────────────────────────────────────────────────┐
|
|
24
|
+
│ NEW PROJECT │
|
|
25
|
+
│ /gsd:new-project │
|
|
26
|
+
│ Questions -> Research -> Requirements -> Roadmap│
|
|
27
|
+
└─────────────────────────┬────────────────────────┘
|
|
28
|
+
│
|
|
29
|
+
┌──────────────▼─────────────┐
|
|
30
|
+
│ FOR EACH PHASE: │
|
|
31
|
+
│ │
|
|
32
|
+
│ ┌────────────────────┐ │
|
|
33
|
+
│ │ /gsd:discuss-phase │ │ <- Lock in preferences
|
|
34
|
+
│ └──────────┬─────────┘ │
|
|
35
|
+
│ │ │
|
|
36
|
+
│ ┌──────────▼─────────┐ │
|
|
37
|
+
│ │ /gsd:plan-phase │ │ <- Research + Plan + Verify
|
|
38
|
+
│ └──────────┬─────────┘ │
|
|
39
|
+
│ │ │
|
|
40
|
+
│ ┌──────────▼─────────┐ │
|
|
41
|
+
│ │ /gsd:execute-phase │ │ <- Parallel execution
|
|
42
|
+
│ └──────────┬─────────┘ │
|
|
43
|
+
│ │ │
|
|
44
|
+
│ ┌──────────▼─────────┐ │
|
|
45
|
+
│ │ /gsd:verify-work │ │ <- Manual UAT
|
|
46
|
+
│ └──────────┬─────────┘ │
|
|
47
|
+
│ │ │
|
|
48
|
+
│ Next Phase?────────────┘
|
|
49
|
+
│ │ No
|
|
50
|
+
└─────────────┼──────────────┘
|
|
51
|
+
│
|
|
52
|
+
┌───────────────▼──────────────┐
|
|
53
|
+
│ /gsd:audit-milestone │
|
|
54
|
+
│ /gsd:complete-milestone │
|
|
55
|
+
└───────────────┬──────────────┘
|
|
56
|
+
│
|
|
57
|
+
Another milestone?
|
|
58
|
+
│ │
|
|
59
|
+
Yes No -> Done!
|
|
60
|
+
│
|
|
61
|
+
┌───────▼──────────────┐
|
|
62
|
+
│ /gsd:new-milestone │
|
|
63
|
+
└──────────────────────┘
|
|
64
|
+
```
|
|
65
|
+
|
|
66
|
+
### Planning Agent Coordination
|
|
67
|
+
|
|
68
|
+
```
|
|
69
|
+
/gsd:plan-phase N
|
|
70
|
+
│
|
|
71
|
+
├── Phase Researcher (x4 parallel)
|
|
72
|
+
│ ├── Stack researcher
|
|
73
|
+
│ ├── Features researcher
|
|
74
|
+
│ ├── Architecture researcher
|
|
75
|
+
│ └── Pitfalls researcher
|
|
76
|
+
│ │
|
|
77
|
+
│ ┌──────▼──────┐
|
|
78
|
+
│ │ RESEARCH.md │
|
|
79
|
+
│ └──────┬──────┘
|
|
80
|
+
│ │
|
|
81
|
+
│ ┌──────▼──────┐
|
|
82
|
+
│ │ Planner │ <- Reads PROJECT.md, REQUIREMENTS.md,
|
|
83
|
+
│ │ │ CONTEXT.md, RESEARCH.md
|
|
84
|
+
│ └──────┬──────┘
|
|
85
|
+
│ │
|
|
86
|
+
│ ┌──────▼───────────┐ ┌────────┐
|
|
87
|
+
│ │ Plan Checker │────>│ PASS? │
|
|
88
|
+
│ └──────────────────┘ └───┬────┘
|
|
89
|
+
│ │
|
|
90
|
+
│ Yes │ No
|
|
91
|
+
│ │ │ │
|
|
92
|
+
│ │ └───┘ (loop, up to 3x)
|
|
93
|
+
│ │
|
|
94
|
+
│ ┌─────▼──────┐
|
|
95
|
+
│ │ PLAN files │
|
|
96
|
+
│ └────────────┘
|
|
97
|
+
└── Done
|
|
98
|
+
```
|
|
99
|
+
|
|
100
|
+
### Validation Architecture (Nyquist Layer)
|
|
101
|
+
|
|
102
|
+
During plan-phase research, GSD now maps automated test coverage to each phase
|
|
103
|
+
requirement before any code is written. This ensures that when Claude's executor
|
|
104
|
+
commits a task, a feedback mechanism already exists to verify it within seconds.
|
|
105
|
+
|
|
106
|
+
The researcher detects your existing test infrastructure, maps each requirement to
|
|
107
|
+
a specific test command, and identifies any test scaffolding that must be created
|
|
108
|
+
before implementation begins (Wave 0 tasks).
|
|
109
|
+
|
|
110
|
+
The plan-checker enforces this as an 8th verification dimension: plans where tasks
|
|
111
|
+
lack automated verify commands will not be approved.
|
|
112
|
+
|
|
113
|
+
**Output:** `{phase}-VALIDATION.md` -- the feedback contract for the phase.
|
|
114
|
+
|
|
115
|
+
**Disable:** Set `workflow.nyquist_validation: false` in `/gsd:settings` for
|
|
116
|
+
rapid prototyping phases where test infrastructure isn't the focus.
|
|
117
|
+
|
|
118
|
+
### Execution Wave Coordination
|
|
119
|
+
|
|
120
|
+
```
|
|
121
|
+
/gsd:execute-phase N
|
|
122
|
+
│
|
|
123
|
+
├── Analyze plan dependencies
|
|
124
|
+
│
|
|
125
|
+
├── Wave 1 (independent plans):
|
|
126
|
+
│ ├── Executor A (fresh 200K context) -> commit
|
|
127
|
+
│ └── Executor B (fresh 200K context) -> commit
|
|
128
|
+
│
|
|
129
|
+
├── Wave 2 (depends on Wave 1):
|
|
130
|
+
│ └── Executor C (fresh 200K context) -> commit
|
|
131
|
+
│
|
|
132
|
+
└── Verifier
|
|
133
|
+
└── Check codebase against phase goals
|
|
134
|
+
│
|
|
135
|
+
├── PASS -> VERIFICATION.md (success)
|
|
136
|
+
└── FAIL -> Issues logged for /gsd:verify-work
|
|
137
|
+
```
|
|
138
|
+
|
|
139
|
+
### Brownfield Workflow (Existing Codebase)
|
|
140
|
+
|
|
141
|
+
```
|
|
142
|
+
/gsd:map-codebase
|
|
143
|
+
│
|
|
144
|
+
├── Stack Mapper -> codebase/STACK.md
|
|
145
|
+
├── Arch Mapper -> codebase/ARCHITECTURE.md
|
|
146
|
+
├── Convention Mapper -> codebase/CONVENTIONS.md
|
|
147
|
+
└── Concern Mapper -> codebase/CONCERNS.md
|
|
148
|
+
│
|
|
149
|
+
┌───────▼──────────┐
|
|
150
|
+
│ /gsd:new-project │ <- Questions focus on what you're ADDING
|
|
151
|
+
└──────────────────┘
|
|
152
|
+
```
|
|
153
|
+
|
|
154
|
+
---
|
|
155
|
+
|
|
156
|
+
## Command Reference
|
|
157
|
+
|
|
158
|
+
### Core Workflow
|
|
159
|
+
|
|
160
|
+
| Command | Purpose | When to Use |
|
|
161
|
+
|---------|---------|-------------|
|
|
162
|
+
| `/gsd:new-project` | Full project init: questions, research, requirements, roadmap | Start of a new project |
|
|
163
|
+
| `/gsd:new-project --auto @idea.md` | Automated init from document | Have a PRD or idea doc ready |
|
|
164
|
+
| `/gsd:discuss-phase [N]` | Capture implementation decisions | Before planning, to shape how it gets built |
|
|
165
|
+
| `/gsd:plan-phase [N]` | Research + plan + verify | Before executing a phase |
|
|
166
|
+
| `/gsd:execute-phase <N>` | Execute all plans in parallel waves | After planning is complete |
|
|
167
|
+
| `/gsd:verify-work [N]` | Manual UAT with auto-diagnosis | After execution completes |
|
|
168
|
+
| `/gsd:audit-milestone` | Verify milestone met its definition of done | Before completing milestone |
|
|
169
|
+
| `/gsd:complete-milestone` | Archive milestone, tag release | All phases verified |
|
|
170
|
+
| `/gsd:new-milestone [name]` | Start next version cycle | After completing a milestone |
|
|
171
|
+
|
|
172
|
+
### Navigation
|
|
173
|
+
|
|
174
|
+
| Command | Purpose | When to Use |
|
|
175
|
+
|---------|---------|-------------|
|
|
176
|
+
| `/gsd:progress` | Show status and next steps | Anytime -- "where am I?" |
|
|
177
|
+
| `/gsd:resume-work` | Restore full context from last session | Starting a new session |
|
|
178
|
+
| `/gsd:pause-work` | Save context handoff | Stopping mid-phase |
|
|
179
|
+
| `/gsd:help` | Show all commands | Quick reference |
|
|
180
|
+
| `/gsd:update` | Update GSD with changelog preview | Check for new versions |
|
|
181
|
+
| `/gsd:join-discord` | Open Discord community invite | Questions or community |
|
|
182
|
+
|
|
183
|
+
### Phase Management
|
|
184
|
+
|
|
185
|
+
| Command | Purpose | When to Use |
|
|
186
|
+
|---------|---------|-------------|
|
|
187
|
+
| `/gsd:add-phase` | Append new phase to roadmap | Scope grows after initial planning |
|
|
188
|
+
| `/gsd:insert-phase [N]` | Insert urgent work (decimal numbering) | Urgent fix mid-milestone |
|
|
189
|
+
| `/gsd:remove-phase [N]` | Remove future phase and renumber | Descoping a feature |
|
|
190
|
+
| `/gsd:list-phase-assumptions [N]` | Preview Claude's intended approach | Before planning, to validate direction |
|
|
191
|
+
| `/gsd:plan-milestone-gaps` | Create phases for audit gaps | After audit finds missing items |
|
|
192
|
+
| `/gsd:research-phase [N]` | Deep ecosystem research only | Complex or unfamiliar domain |
|
|
193
|
+
|
|
194
|
+
### Brownfield & Utilities
|
|
195
|
+
|
|
196
|
+
| Command | Purpose | When to Use |
|
|
197
|
+
|---------|---------|-------------|
|
|
198
|
+
| `/gsd:map-codebase` | Analyze existing codebase | Before `/gsd:new-project` on existing code |
|
|
199
|
+
| `/gsd:quick` | Ad-hoc task with GSD guarantees | Bug fixes, small features, config changes |
|
|
200
|
+
| `/gsd:debug [desc]` | Systematic debugging with persistent state | When something breaks |
|
|
201
|
+
| `/gsd:add-todo [desc]` | Capture an idea for later | Think of something during a session |
|
|
202
|
+
| `/gsd:check-todos` | List pending todos | Review captured ideas |
|
|
203
|
+
| `/gsd:settings` | Configure workflow toggles and model profile | Change model, toggle agents |
|
|
204
|
+
| `/gsd:set-profile <profile>` | Quick profile switch | Change cost/quality tradeoff |
|
|
205
|
+
| `/gsd:reapply-patches` | Restore local modifications after update | After `/gsd:update` if you had local edits |
|
|
206
|
+
|
|
207
|
+
---
|
|
208
|
+
|
|
209
|
+
## Configuration Reference
|
|
210
|
+
|
|
211
|
+
GSD stores project settings in `.planning/config.json`. Configure during `/gsd:new-project` or update later with `/gsd:settings`.
|
|
212
|
+
|
|
213
|
+
### Full config.json Schema
|
|
214
|
+
|
|
215
|
+
```json
|
|
216
|
+
{
|
|
217
|
+
"mode": "interactive",
|
|
218
|
+
"depth": "standard",
|
|
219
|
+
"model_profile": "balanced",
|
|
220
|
+
"planning": {
|
|
221
|
+
"commit_docs": true,
|
|
222
|
+
"search_gitignored": false
|
|
223
|
+
},
|
|
224
|
+
"workflow": {
|
|
225
|
+
"research": true,
|
|
226
|
+
"plan_check": true,
|
|
227
|
+
"verifier": true,
|
|
228
|
+
"nyquist_validation": true
|
|
229
|
+
},
|
|
230
|
+
"git": {
|
|
231
|
+
"branching_strategy": "none",
|
|
232
|
+
"phase_branch_template": "gsd/phase-{phase}-{slug}",
|
|
233
|
+
"milestone_branch_template": "gsd/{milestone}-{slug}"
|
|
234
|
+
}
|
|
235
|
+
}
|
|
236
|
+
```
|
|
237
|
+
|
|
238
|
+
### Core Settings
|
|
239
|
+
|
|
240
|
+
| Setting | Options | Default | What it Controls |
|
|
241
|
+
|---------|---------|---------|------------------|
|
|
242
|
+
| `mode` | `interactive`, `yolo` | `interactive` | `yolo` auto-approves decisions; `interactive` confirms at each step |
|
|
243
|
+
| `depth` | `quick`, `standard`, `comprehensive` | `standard` | Planning thoroughness: 3-5, 5-8, or 8-12 phases |
|
|
244
|
+
| `model_profile` | `quality`, `balanced`, `budget` | `balanced` | Model tier for each agent (see table below) |
|
|
245
|
+
|
|
246
|
+
### Planning Settings
|
|
247
|
+
|
|
248
|
+
| Setting | Options | Default | What it Controls |
|
|
249
|
+
|---------|---------|---------|------------------|
|
|
250
|
+
| `planning.commit_docs` | `true`, `false` | `true` | Whether `.planning/` files are committed to git |
|
|
251
|
+
| `planning.search_gitignored` | `true`, `false` | `false` | Add `--no-ignore` to broad searches to include `.planning/` |
|
|
252
|
+
|
|
253
|
+
> **Note:** If `.planning/` is in `.gitignore`, `commit_docs` is automatically `false` regardless of the config value.
|
|
254
|
+
|
|
255
|
+
### Workflow Toggles
|
|
256
|
+
|
|
257
|
+
| Setting | Options | Default | What it Controls |
|
|
258
|
+
|---------|---------|---------|------------------|
|
|
259
|
+
| `workflow.research` | `true`, `false` | `true` | Domain investigation before planning |
|
|
260
|
+
| `workflow.plan_check` | `true`, `false` | `true` | Plan verification loop (up to 3 iterations) |
|
|
261
|
+
| `workflow.verifier` | `true`, `false` | `true` | Post-execution verification against phase goals |
|
|
262
|
+
| `workflow.nyquist_validation` | `true`, `false` | `true` | Validation architecture research during plan-phase; 8th plan-check dimension |
|
|
263
|
+
|
|
264
|
+
Disable these to speed up phases in familiar domains or when conserving tokens.
|
|
265
|
+
|
|
266
|
+
### Git Branching
|
|
267
|
+
|
|
268
|
+
| Setting | Options | Default | What it Controls |
|
|
269
|
+
|---------|---------|---------|------------------|
|
|
270
|
+
| `git.branching_strategy` | `none`, `phase`, `milestone` | `none` | When and how branches are created |
|
|
271
|
+
| `git.phase_branch_template` | Template string | `gsd/phase-{phase}-{slug}` | Branch name for phase strategy |
|
|
272
|
+
| `git.milestone_branch_template` | Template string | `gsd/{milestone}-{slug}` | Branch name for milestone strategy |
|
|
273
|
+
|
|
274
|
+
**Branching strategies explained:**
|
|
275
|
+
|
|
276
|
+
| Strategy | Creates Branch | Scope | Best For |
|
|
277
|
+
|----------|---------------|-------|----------|
|
|
278
|
+
| `none` | Never | N/A | Solo development, simple projects |
|
|
279
|
+
| `phase` | At each `execute-phase` | One phase per branch | Code review per phase, granular rollback |
|
|
280
|
+
| `milestone` | At first `execute-phase` | All phases share one branch | Release branches, PR per version |
|
|
281
|
+
|
|
282
|
+
**Template variables:** `{phase}` = zero-padded number (e.g., "03"), `{slug}` = lowercase hyphenated name, `{milestone}` = version (e.g., "v1.0").
|
|
283
|
+
|
|
284
|
+
### Model Profiles (Per-Agent Breakdown)
|
|
285
|
+
|
|
286
|
+
| Agent | `quality` | `balanced` | `budget` |
|
|
287
|
+
|-------|-----------|------------|----------|
|
|
288
|
+
| gsd-planner | Opus | Opus | Sonnet |
|
|
289
|
+
| gsd-roadmapper | Opus | Sonnet | Sonnet |
|
|
290
|
+
| gsd-executor | Opus | Sonnet | Sonnet |
|
|
291
|
+
| gsd-phase-researcher | Opus | Sonnet | Haiku |
|
|
292
|
+
| gsd-project-researcher | Opus | Sonnet | Haiku |
|
|
293
|
+
| gsd-research-synthesizer | Sonnet | Sonnet | Haiku |
|
|
294
|
+
| gsd-debugger | Opus | Sonnet | Sonnet |
|
|
295
|
+
| gsd-codebase-mapper | Sonnet | Haiku | Haiku |
|
|
296
|
+
| gsd-verifier | Sonnet | Sonnet | Haiku |
|
|
297
|
+
| gsd-plan-checker | Sonnet | Sonnet | Haiku |
|
|
298
|
+
| gsd-integration-checker | Sonnet | Sonnet | Haiku |
|
|
299
|
+
|
|
300
|
+
**Profile philosophy:**
|
|
301
|
+
- **quality** -- Opus for all decision-making agents, Sonnet for read-only verification. Use when quota is available and the work is critical.
|
|
302
|
+
- **balanced** -- Opus only for planning (where architecture decisions happen), Sonnet for nearly everything else (the codebase mapper uses Haiku). The default for good reason.
|
|
303
|
+
- **budget** -- Sonnet for anything that writes code, Haiku for research and verification. Use for high-volume work or less critical phases.
|
|
304
|
+
|
|
305
|
+
---
|
|
306
|
+
|
|
307
|
+
## Usage Examples
|
|
308
|
+
|
|
309
|
+
### New Project (Full Cycle)
|
|
310
|
+
|
|
311
|
+
```bash
|
|
312
|
+
claude --dangerously-skip-permissions
|
|
313
|
+
/gsd:new-project # Answer questions, configure, approve roadmap
|
|
314
|
+
/clear
|
|
315
|
+
/gsd:discuss-phase 1 # Lock in your preferences
|
|
316
|
+
/gsd:plan-phase 1 # Research + plan + verify
|
|
317
|
+
/gsd:execute-phase 1 # Parallel execution
|
|
318
|
+
/gsd:verify-work 1 # Manual UAT
|
|
319
|
+
/clear
|
|
320
|
+
/gsd:discuss-phase 2 # Repeat for each phase
|
|
321
|
+
...
|
|
322
|
+
/gsd:audit-milestone # Check everything shipped
|
|
323
|
+
/gsd:complete-milestone # Archive, tag, done
|
|
324
|
+
```
|
|
325
|
+
|
|
326
|
+
### New Project from Existing Document
|
|
327
|
+
|
|
328
|
+
```bash
|
|
329
|
+
/gsd:new-project --auto @prd.md # Auto-runs research/requirements/roadmap from your doc
|
|
330
|
+
/clear
|
|
331
|
+
/gsd:discuss-phase 1 # Normal flow from here
|
|
332
|
+
```
|
|
333
|
+
|
|
334
|
+
### Existing Codebase
|
|
335
|
+
|
|
336
|
+
```bash
|
|
337
|
+
/gsd:map-codebase # Analyze what exists (parallel agents)
|
|
338
|
+
/gsd:new-project # Questions focus on what you're ADDING
|
|
339
|
+
# (normal phase workflow from here)
|
|
340
|
+
```
|
|
341
|
+
|
|
342
|
+
### Quick Bug Fix
|
|
343
|
+
|
|
344
|
+
```bash
|
|
345
|
+
/gsd:quick
|
|
346
|
+
> "Fix the login button not responding on mobile Safari"
|
|
347
|
+
```
|
|
348
|
+
|
|
349
|
+
### Resuming After a Break
|
|
350
|
+
|
|
351
|
+
```bash
|
|
352
|
+
/gsd:progress # See where you left off and what's next
|
|
353
|
+
# or
|
|
354
|
+
/gsd:resume-work # Full context restoration from last session
|
|
355
|
+
```
|
|
356
|
+
|
|
357
|
+
### Preparing for Release
|
|
358
|
+
|
|
359
|
+
```bash
|
|
360
|
+
/gsd:audit-milestone # Check requirements coverage, detect stubs
|
|
361
|
+
/gsd:plan-milestone-gaps # If audit found gaps, create phases to close them
|
|
362
|
+
/gsd:complete-milestone # Archive, tag, done
|
|
363
|
+
```
|
|
364
|
+
|
|
365
|
+
### Speed vs Quality Presets
|
|
366
|
+
|
|
367
|
+
| Scenario | Mode | Depth | Profile | Research | Plan Check | Verifier |
|
|
368
|
+
|----------|------|-------|---------|----------|------------|----------|
|
|
369
|
+
| Prototyping | `yolo` | `quick` | `budget` | off | off | off |
|
|
370
|
+
| Normal dev | `interactive` | `standard` | `balanced` | on | on | on |
|
|
371
|
+
| Production | `interactive` | `comprehensive` | `quality` | on | on | on |
|
|
372
|
+
|
|
373
|
+
### Mid-Milestone Scope Changes
|
|
374
|
+
|
|
375
|
+
```bash
|
|
376
|
+
/gsd:add-phase # Append a new phase to the roadmap
|
|
377
|
+
# or
|
|
378
|
+
/gsd:insert-phase 3 # Insert urgent work between phases 3 and 4
|
|
379
|
+
# or
|
|
380
|
+
/gsd:remove-phase 7 # Descope phase 7 and renumber
|
|
381
|
+
```
|
|
382
|
+
|
|
383
|
+
---
|
|
384
|
+
|
|
385
|
+
## Troubleshooting
|
|
386
|
+
|
|
387
|
+
### "Project already initialized"
|
|
388
|
+
|
|
389
|
+
You ran `/gsd:new-project` but `.planning/PROJECT.md` already exists. This is a safety check. If you want to start over, delete the `.planning/` directory first.
|
|
390
|
+
|
|
391
|
+
### Context Degradation During Long Sessions
|
|
392
|
+
|
|
393
|
+
Clear your context window between major commands by running `/clear` in Claude Code. GSD is designed around fresh contexts -- every subagent gets a clean 200K window. If quality is dropping in the main session, clear and use `/gsd:resume-work` or `/gsd:progress` to restore state.
|
|
394
|
+
|
|
395
|
+
### Plans Seem Wrong or Misaligned
|
|
396
|
+
|
|
397
|
+
Run `/gsd:discuss-phase [N]` before planning. Most plan quality issues come from Claude making assumptions that `CONTEXT.md` would have prevented. You can also run `/gsd:list-phase-assumptions [N]` to see what Claude intends to do before committing to a plan.
|
|
398
|
+
|
|
399
|
+
### Execution Fails or Produces Stubs
|
|
400
|
+
|
|
401
|
+
Check that the plan was not too ambitious. Plans should have 2-3 tasks maximum. If tasks are too large, they exceed what a single context window can produce reliably. Re-plan with smaller scope.
|
|
402
|
+
|
|
403
|
+
### Lost Track of Where You Are
|
|
404
|
+
|
|
405
|
+
Run `/gsd:progress`. It reads all state files and tells you exactly where you are and what to do next.
|
|
406
|
+
|
|
407
|
+
### Need to Change Something After Execution
|
|
408
|
+
|
|
409
|
+
Do not re-run `/gsd:execute-phase`. Use `/gsd:quick` for targeted fixes, or `/gsd:verify-work` to systematically identify and fix issues through UAT.
|
|
410
|
+
|
|
411
|
+
### Model Costs Too High
|
|
412
|
+
|
|
413
|
+
Switch to budget profile: `/gsd:set-profile budget`. Disable research and plan-check agents via `/gsd:settings` if the domain is familiar to you (or to Claude).
|
|
414
|
+
|
|
415
|
+
### Working on a Sensitive/Private Project
|
|
416
|
+
|
|
417
|
+
Set `planning.commit_docs: false` during `/gsd:new-project` or via `/gsd:settings`. Add `.planning/` to your `.gitignore`. Planning artifacts stay local and never touch git.
|
|
418
|
+
|
|
419
|
+
### GSD Update Overwrote My Local Changes
|
|
420
|
+
|
|
421
|
+
Since v1.17, the installer backs up locally modified files to `gsd-local-patches/`. Run `/gsd:reapply-patches` to merge your changes back.
|
|
422
|
+
|
|
423
|
+
### Subagent Appears to Fail but Work Was Done
|
|
424
|
+
|
|
425
|
+
A known workaround exists for a Claude Code classification bug. GSD's orchestrators (execute-phase, quick) spot-check actual output before reporting failure. If you see a failure message but commits were made, check `git log` -- the work may have succeeded.
|
|
426
|
+
|
|
427
|
+
---
|
|
428
|
+
|
|
429
|
+
## Recovery Quick Reference
|
|
430
|
+
|
|
431
|
+
| Problem | Solution |
|
|
432
|
+
|---------|----------|
|
|
433
|
+
| Lost context / new session | `/gsd:resume-work` or `/gsd:progress` |
|
|
434
|
+
| Phase went wrong | `git revert` the phase commits, then re-plan |
|
|
435
|
+
| Need to change scope | `/gsd:add-phase`, `/gsd:insert-phase`, or `/gsd:remove-phase` |
|
|
436
|
+
| Milestone audit found gaps | `/gsd:plan-milestone-gaps` |
|
|
437
|
+
| Something broke | `/gsd:debug "description"` |
|
|
438
|
+
| Quick targeted fix | `/gsd:quick` |
|
|
439
|
+
| Plan doesn't match your vision | `/gsd:discuss-phase [N]` then re-plan |
|
|
440
|
+
| Costs running high | `/gsd:set-profile budget` and `/gsd:settings` to toggle agents off |
|
|
441
|
+
| Update broke local changes | `/gsd:reapply-patches` |
|
|
442
|
+
|
|
443
|
+
---
|
|
444
|
+
|
|
445
|
+
## Project File Structure
|
|
446
|
+
|
|
447
|
+
For reference, here is what GSD creates in your project:
|
|
448
|
+
|
|
449
|
+
```
|
|
450
|
+
.planning/
|
|
451
|
+
PROJECT.md # Project vision and context (always loaded)
|
|
452
|
+
REQUIREMENTS.md # Scoped v1/v2 requirements with IDs
|
|
453
|
+
ROADMAP.md # Phase breakdown with status tracking
|
|
454
|
+
STATE.md # Decisions, blockers, session memory
|
|
455
|
+
config.json # Workflow configuration
|
|
456
|
+
MILESTONES.md # Completed milestone archive
|
|
457
|
+
research/ # Domain research from /gsd:new-project
|
|
458
|
+
todos/
|
|
459
|
+
pending/ # Captured ideas awaiting work
|
|
460
|
+
done/ # Completed todos
|
|
461
|
+
debug/ # Active debug sessions
|
|
462
|
+
resolved/ # Archived debug sessions
|
|
463
|
+
codebase/ # Brownfield codebase mapping (from /gsd:map-codebase)
|
|
464
|
+
phases/
|
|
465
|
+
XX-phase-name/
|
|
466
|
+
XX-YY-PLAN.md # Atomic execution plans
|
|
467
|
+
XX-YY-SUMMARY.md # Execution outcomes and decisions
|
|
468
|
+
CONTEXT.md # Your implementation preferences
|
|
469
|
+
RESEARCH.md # Ecosystem research findings
|
|
470
|
+
VERIFICATION.md # Post-execution verification results
|
|
471
|
+
```
|
|
@@ -0,0 +1,96 @@
|
|
|
1
|
+
# Context Window Monitor
|
|
2
|
+
|
|
3
|
+
A PostToolUse hook that warns the agent when context window usage is high.
|
|
4
|
+
|
|
5
|
+
## Problem
|
|
6
|
+
|
|
7
|
+
The statusline shows context usage to the **user**, but the **agent** has no awareness of context limits. When context runs low, the agent continues working until it hits the wall — potentially mid-task with no state saved.
|
|
8
|
+
|
|
9
|
+
## How It Works
|
|
10
|
+
|
|
11
|
+
1. The statusline hook writes context metrics to `/tmp/claude-ctx-{session_id}.json`
|
|
12
|
+
2. After each tool use, the context monitor reads these metrics
|
|
13
|
+
3. When remaining context drops below thresholds, it injects a warning as `additionalContext`
|
|
14
|
+
4. The agent receives the warning in its conversation and can act accordingly
|
|
15
|
+
|
|
16
|
+
## Thresholds
|
|
17
|
+
|
|
18
|
+
| Level | Remaining | Agent Behavior |
|
|
19
|
+
|-------|-----------|----------------|
|
|
20
|
+
| Normal | > 35% | No warning |
|
|
21
|
+
| WARNING | <= 35% (and > 25%) | Wrap up current task, avoid starting new complex work |
|
|
22
|
+
| CRITICAL | <= 25% | Stop immediately, save state (`/gsd:pause-work`) |
|
|
23
|
+
|
|
24
|
+
## Debounce
|
|
25
|
+
|
|
26
|
+
To avoid spamming the agent with repeated warnings:
|
|
27
|
+
- First warning always fires immediately
|
|
28
|
+
- Subsequent warnings require 5 tool uses between them
|
|
29
|
+
- Severity escalation (WARNING -> CRITICAL) bypasses debounce
|
|
30
|
+
|
|
31
|
+
## Architecture
|
|
32
|
+
|
|
33
|
+
```
|
|
34
|
+
Statusline Hook (gsd-statusline.js)
|
|
35
|
+
| writes
|
|
36
|
+
v
|
|
37
|
+
/tmp/claude-ctx-{session_id}.json
|
|
38
|
+
^ reads
|
|
39
|
+
|
|
|
40
|
+
Context Monitor (gsd-context-monitor.js, PostToolUse)
|
|
41
|
+
| injects
|
|
42
|
+
v
|
|
43
|
+
additionalContext -> Agent sees warning
|
|
44
|
+
```
|
|
45
|
+
|
|
46
|
+
The bridge file is a simple JSON object:
|
|
47
|
+
|
|
48
|
+
```json
|
|
49
|
+
{
|
|
50
|
+
"session_id": "abc123",
|
|
51
|
+
"remaining_percentage": 28.5,
|
|
52
|
+
"used_pct": 71,
|
|
53
|
+
"timestamp": 1708200000
|
|
54
|
+
}
|
|
55
|
+
```
|
|
56
|
+
|
|
57
|
+
## Integration with GSD
|
|
58
|
+
|
|
59
|
+
GSD's `/gsd:pause-work` command saves execution state. The WARNING message suggests using it. The CRITICAL message instructs immediate state save.
|
|
60
|
+
|
|
61
|
+
## Setup
|
|
62
|
+
|
|
63
|
+
Both hooks are automatically registered during `npx get-shit-done-cc` installation:
|
|
64
|
+
|
|
65
|
+
- **Statusline** (writes bridge file): Registered as `statusLine` in settings.json
|
|
66
|
+
- **Context Monitor** (reads bridge file): Registered as `PostToolUse` hook in settings.json
|
|
67
|
+
|
|
68
|
+
Manual registration in `~/.claude/settings.json`:
|
|
69
|
+
|
|
70
|
+
```json
|
|
71
|
+
{
|
|
72
|
+
"statusLine": {
|
|
73
|
+
"type": "command",
|
|
74
|
+
"command": "node ~/.claude/hooks/gsd-statusline.js"
|
|
75
|
+
},
|
|
76
|
+
"hooks": {
|
|
77
|
+
"PostToolUse": [
|
|
78
|
+
{
|
|
79
|
+
"hooks": [
|
|
80
|
+
{
|
|
81
|
+
"type": "command",
|
|
82
|
+
"command": "node ~/.claude/hooks/gsd-context-monitor.js"
|
|
83
|
+
}
|
|
84
|
+
]
|
|
85
|
+
}
|
|
86
|
+
]
|
|
87
|
+
}
|
|
88
|
+
}
|
|
89
|
+
```
|
|
90
|
+
|
|
91
|
+
## Safety
|
|
92
|
+
|
|
93
|
+
- The hook wraps everything in try/catch and exits silently on error
|
|
94
|
+
- It never blocks tool execution — a broken monitor should not break the agent's workflow
|
|
95
|
+
- Stale metrics (older than 60s) are ignored
|
|
96
|
+
- Missing bridge files are handled gracefully (e.g., in subagents or fresh sessions where the statusline has not written metrics yet)
|