autonomous-coding-toolkit 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (324) hide show
  1. package/.claude-plugin/marketplace.json +22 -0
  2. package/.claude-plugin/plugin.json +13 -0
  3. package/LICENSE +21 -0
  4. package/Makefile +21 -0
  5. package/README.md +140 -0
  6. package/SECURITY.md +28 -0
  7. package/agents/bash-expert.md +113 -0
  8. package/agents/dependency-auditor.md +138 -0
  9. package/agents/integration-tester.md +120 -0
  10. package/agents/lesson-scanner.md +149 -0
  11. package/agents/python-expert.md +179 -0
  12. package/agents/service-monitor.md +141 -0
  13. package/agents/shell-expert.md +147 -0
  14. package/benchmarks/runner.sh +147 -0
  15. package/benchmarks/tasks/01-rest-endpoint/rubric.sh +29 -0
  16. package/benchmarks/tasks/01-rest-endpoint/task.md +17 -0
  17. package/benchmarks/tasks/02-refactor-module/task.md +8 -0
  18. package/benchmarks/tasks/03-fix-integration-bug/task.md +8 -0
  19. package/benchmarks/tasks/04-add-test-coverage/task.md +8 -0
  20. package/benchmarks/tasks/05-multi-file-feature/task.md +8 -0
  21. package/bin/act.js +238 -0
  22. package/commands/autocode.md +6 -0
  23. package/commands/cancel-ralph.md +18 -0
  24. package/commands/code-factory.md +53 -0
  25. package/commands/create-prd.md +55 -0
  26. package/commands/ralph-loop.md +18 -0
  27. package/commands/run-plan.md +117 -0
  28. package/commands/submit-lesson.md +122 -0
  29. package/docs/ARCHITECTURE.md +630 -0
  30. package/docs/CONTRIBUTING.md +125 -0
  31. package/docs/lessons/0001-bare-exception-swallowing.md +34 -0
  32. package/docs/lessons/0002-async-def-without-await.md +28 -0
  33. package/docs/lessons/0003-create-task-without-callback.md +28 -0
  34. package/docs/lessons/0004-hardcoded-test-counts.md +28 -0
  35. package/docs/lessons/0005-sqlite-without-closing.md +33 -0
  36. package/docs/lessons/0006-venv-pip-path.md +27 -0
  37. package/docs/lessons/0007-runner-state-self-rejection.md +35 -0
  38. package/docs/lessons/0008-quality-gate-blind-spot.md +33 -0
  39. package/docs/lessons/0009-parser-overcount-empty-batches.md +36 -0
  40. package/docs/lessons/0010-local-outside-function-bash.md +33 -0
  41. package/docs/lessons/0011-batch-tests-for-unimplemented-code.md +36 -0
  42. package/docs/lessons/0012-api-markdown-unescaped-chars.md +33 -0
  43. package/docs/lessons/0013-export-prefix-env-parsing.md +33 -0
  44. package/docs/lessons/0014-decorator-registry-import-side-effect.md +43 -0
  45. package/docs/lessons/0015-frontend-backend-schema-drift.md +43 -0
  46. package/docs/lessons/0016-event-driven-cold-start-seeding.md +44 -0
  47. package/docs/lessons/0017-copy-paste-logic-diverges.md +43 -0
  48. package/docs/lessons/0018-layer-passes-pipeline-broken.md +45 -0
  49. package/docs/lessons/0019-systemd-envfile-ignores-export.md +41 -0
  50. package/docs/lessons/0020-persist-state-incrementally.md +44 -0
  51. package/docs/lessons/0021-dual-axis-testing.md +48 -0
  52. package/docs/lessons/0022-jsx-factory-shadowing.md +43 -0
  53. package/docs/lessons/0023-static-analysis-spiral.md +51 -0
  54. package/docs/lessons/0024-shared-pipeline-implementation.md +55 -0
  55. package/docs/lessons/0025-defense-in-depth-all-entry-points.md +65 -0
  56. package/docs/lessons/0026-linter-no-rules-false-enforcement.md +54 -0
  57. package/docs/lessons/0027-jsx-silent-prop-drop.md +64 -0
  58. package/docs/lessons/0028-no-infrastructure-in-client-code.md +49 -0
  59. package/docs/lessons/0029-never-write-secrets-to-files.md +61 -0
  60. package/docs/lessons/0030-cache-merge-not-replace.md +62 -0
  61. package/docs/lessons/0031-verify-units-at-boundaries.md +66 -0
  62. package/docs/lessons/0032-module-lifecycle-subscribe-unsubscribe.md +89 -0
  63. package/docs/lessons/0033-async-iteration-mutable-snapshot.md +72 -0
  64. package/docs/lessons/0034-caller-missing-await-silent-discard.md +65 -0
  65. package/docs/lessons/0035-duplicate-registration-silent-overwrite.md +85 -0
  66. package/docs/lessons/0036-websocket-dirty-disconnect.md +33 -0
  67. package/docs/lessons/0037-parallel-agents-worktree-corruption.md +31 -0
  68. package/docs/lessons/0038-subscribe-no-stored-ref.md +36 -0
  69. package/docs/lessons/0039-fallback-or-default-hides-bugs.md +34 -0
  70. package/docs/lessons/0040-event-firehose-filter-first.md +36 -0
  71. package/docs/lessons/0041-ambiguous-base-dir-path-nesting.md +32 -0
  72. package/docs/lessons/0042-spec-compliance-insufficient.md +36 -0
  73. package/docs/lessons/0043-exact-count-extensible-collections.md +32 -0
  74. package/docs/lessons/0044-relative-file-deps-worktree.md +39 -0
  75. package/docs/lessons/0045-iterative-design-improvement.md +33 -0
  76. package/docs/lessons/0046-plan-assertion-math-bugs.md +38 -0
  77. package/docs/lessons/0047-pytest-single-threaded-default.md +37 -0
  78. package/docs/lessons/0048-integration-wiring-batch.md +40 -0
  79. package/docs/lessons/0049-ab-verification.md +41 -0
  80. package/docs/lessons/0050-editing-sourced-files-during-execution.md +33 -0
  81. package/docs/lessons/0051-infrastructure-fixes-cant-self-heal.md +30 -0
  82. package/docs/lessons/0052-uncommitted-changes-poison-quality-gates.md +31 -0
  83. package/docs/lessons/0053-jq-compact-flag-inconsistency.md +31 -0
  84. package/docs/lessons/0054-parser-matches-inside-code-blocks.md +30 -0
  85. package/docs/lessons/0055-agents-compensate-for-garbled-prompts.md +31 -0
  86. package/docs/lessons/0056-grep-count-exit-code-on-zero.md +42 -0
  87. package/docs/lessons/0057-new-artifacts-break-git-clean-gates.md +42 -0
  88. package/docs/lessons/0058-dead-config-keys-never-consumed.md +49 -0
  89. package/docs/lessons/0059-contract-test-shared-structures.md +53 -0
  90. package/docs/lessons/0060-set-e-silent-death-in-runners.md +53 -0
  91. package/docs/lessons/0061-context-injection-dirty-state.md +50 -0
  92. package/docs/lessons/0062-sibling-bug-neighborhood-scan.md +29 -0
  93. package/docs/lessons/0063-one-flag-two-lifetimes.md +31 -0
  94. package/docs/lessons/0064-test-passes-wrong-reason.md +31 -0
  95. package/docs/lessons/0065-pipefail-grep-count-double-output.md +39 -0
  96. package/docs/lessons/0066-local-keyword-outside-function.md +37 -0
  97. package/docs/lessons/0067-stdin-hang-non-interactive-shell.md +36 -0
  98. package/docs/lessons/0068-agent-builds-wrong-thing-correctly.md +31 -0
  99. package/docs/lessons/0069-plan-quality-dominates-execution.md +30 -0
  100. package/docs/lessons/0070-spec-echo-back-prevents-drift.md +31 -0
  101. package/docs/lessons/0071-positive-instructions-outperform-negative.md +30 -0
  102. package/docs/lessons/0072-lost-in-the-middle-context-placement.md +30 -0
  103. package/docs/lessons/0073-unscoped-lessons-cause-false-positives.md +30 -0
  104. package/docs/lessons/0074-stale-context-injection-wrong-batch.md +32 -0
  105. package/docs/lessons/0075-research-artifacts-must-persist.md +32 -0
  106. package/docs/lessons/0076-wrong-decomposition-contaminates-downstream.md +30 -0
  107. package/docs/lessons/0077-cherry-pick-merges-need-manual-resolution.md +30 -0
  108. package/docs/lessons/0078-static-review-without-live-test.md +30 -0
  109. package/docs/lessons/0079-integration-wiring-batch-required.md +32 -0
  110. package/docs/lessons/FRAMEWORK.md +161 -0
  111. package/docs/lessons/SUMMARY.md +201 -0
  112. package/docs/lessons/TEMPLATE.md +85 -0
  113. package/docs/plans/2026-02-21-code-factory-v2-design.md +204 -0
  114. package/docs/plans/2026-02-21-code-factory-v2-implementation-plan.md +2189 -0
  115. package/docs/plans/2026-02-21-code-factory-v2-phase4-design.md +537 -0
  116. package/docs/plans/2026-02-21-code-factory-v2-phase4-implementation-plan.md +2012 -0
  117. package/docs/plans/2026-02-21-hardening-pass-design.md +108 -0
  118. package/docs/plans/2026-02-21-hardening-pass-plan.md +1378 -0
  119. package/docs/plans/2026-02-21-mab-research-report.md +406 -0
  120. package/docs/plans/2026-02-21-marketplace-restructure-design.md +240 -0
  121. package/docs/plans/2026-02-21-marketplace-restructure-plan.md +832 -0
  122. package/docs/plans/2026-02-21-phase4-completion-plan.md +697 -0
  123. package/docs/plans/2026-02-21-validator-suite-design.md +148 -0
  124. package/docs/plans/2026-02-21-validator-suite-plan.md +540 -0
  125. package/docs/plans/2026-02-22-mab-research-round2.md +556 -0
  126. package/docs/plans/2026-02-22-mab-run-design.md +462 -0
  127. package/docs/plans/2026-02-22-mab-run-plan.md +2046 -0
  128. package/docs/plans/2026-02-22-operations-design-methodology-research.md +681 -0
  129. package/docs/plans/2026-02-22-research-agent-failure-taxonomy.md +532 -0
  130. package/docs/plans/2026-02-22-research-code-guideline-policies.md +886 -0
  131. package/docs/plans/2026-02-22-research-codebase-audit-refactoring.md +908 -0
  132. package/docs/plans/2026-02-22-research-coding-standards-documentation.md +541 -0
  133. package/docs/plans/2026-02-22-research-competitive-landscape.md +687 -0
  134. package/docs/plans/2026-02-22-research-comprehensive-testing.md +1076 -0
  135. package/docs/plans/2026-02-22-research-context-utilization.md +459 -0
  136. package/docs/plans/2026-02-22-research-cost-quality-tradeoff.md +548 -0
  137. package/docs/plans/2026-02-22-research-lesson-transferability.md +508 -0
  138. package/docs/plans/2026-02-22-research-multi-agent-coordination.md +312 -0
  139. package/docs/plans/2026-02-22-research-phase-integration.md +602 -0
  140. package/docs/plans/2026-02-22-research-plan-quality.md +428 -0
  141. package/docs/plans/2026-02-22-research-prompt-engineering.md +558 -0
  142. package/docs/plans/2026-02-22-research-unconventional-perspectives.md +528 -0
  143. package/docs/plans/2026-02-22-research-user-adoption.md +638 -0
  144. package/docs/plans/2026-02-22-research-verification-effectiveness.md +433 -0
  145. package/docs/plans/2026-02-23-agent-suite-design.md +299 -0
  146. package/docs/plans/2026-02-23-agent-suite-plan.md +578 -0
  147. package/docs/plans/2026-02-23-phase3-cost-infrastructure-design.md +148 -0
  148. package/docs/plans/2026-02-23-phase3-cost-infrastructure-plan.md +1062 -0
  149. package/docs/plans/2026-02-23-research-bash-expert-agent.md +543 -0
  150. package/docs/plans/2026-02-23-research-dependency-auditor-agent.md +564 -0
  151. package/docs/plans/2026-02-23-research-improving-existing-agents.md +503 -0
  152. package/docs/plans/2026-02-23-research-integration-tester-agent.md +454 -0
  153. package/docs/plans/2026-02-23-research-python-expert-agent.md +429 -0
  154. package/docs/plans/2026-02-23-research-service-monitor-agent.md +425 -0
  155. package/docs/plans/2026-02-23-research-shell-expert-agent.md +533 -0
  156. package/docs/plans/2026-02-23-roadmap-to-completion.md +530 -0
  157. package/docs/plans/2026-02-24-headless-module-split-design.md +98 -0
  158. package/docs/plans/2026-02-24-headless-module-split.md +443 -0
  159. package/docs/plans/2026-02-24-lesson-scope-metadata-design.md +228 -0
  160. package/docs/plans/2026-02-24-lesson-scope-metadata-plan.md +968 -0
  161. package/docs/plans/2026-02-24-npm-packaging-design.md +841 -0
  162. package/docs/plans/2026-02-24-npm-packaging-plan.md +1965 -0
  163. package/docs/plans/audit-findings.md +186 -0
  164. package/docs/telegram-notification-format.md +98 -0
  165. package/examples/example-plan.md +51 -0
  166. package/examples/example-prd.json +72 -0
  167. package/examples/example-roadmap.md +33 -0
  168. package/examples/quickstart-plan.md +63 -0
  169. package/hooks/hooks.json +26 -0
  170. package/hooks/setup-symlinks.sh +48 -0
  171. package/hooks/stop-hook.sh +135 -0
  172. package/package.json +47 -0
  173. package/policies/bash.md +71 -0
  174. package/policies/python.md +71 -0
  175. package/policies/testing.md +61 -0
  176. package/policies/universal.md +60 -0
  177. package/scripts/analyze-report.sh +97 -0
  178. package/scripts/architecture-map.sh +145 -0
  179. package/scripts/auto-compound.sh +273 -0
  180. package/scripts/batch-audit.sh +42 -0
  181. package/scripts/batch-test.sh +101 -0
  182. package/scripts/entropy-audit.sh +221 -0
  183. package/scripts/failure-digest.sh +51 -0
  184. package/scripts/generate-ast-rules.sh +96 -0
  185. package/scripts/init.sh +112 -0
  186. package/scripts/lesson-check.sh +428 -0
  187. package/scripts/lib/common.sh +61 -0
  188. package/scripts/lib/cost-tracking.sh +153 -0
  189. package/scripts/lib/ollama.sh +60 -0
  190. package/scripts/lib/progress-writer.sh +128 -0
  191. package/scripts/lib/run-plan-context.sh +215 -0
  192. package/scripts/lib/run-plan-echo-back.sh +231 -0
  193. package/scripts/lib/run-plan-headless.sh +396 -0
  194. package/scripts/lib/run-plan-notify.sh +57 -0
  195. package/scripts/lib/run-plan-parser.sh +81 -0
  196. package/scripts/lib/run-plan-prompt.sh +215 -0
  197. package/scripts/lib/run-plan-quality-gate.sh +132 -0
  198. package/scripts/lib/run-plan-routing.sh +315 -0
  199. package/scripts/lib/run-plan-sampling.sh +170 -0
  200. package/scripts/lib/run-plan-scoring.sh +146 -0
  201. package/scripts/lib/run-plan-state.sh +142 -0
  202. package/scripts/lib/run-plan-team.sh +199 -0
  203. package/scripts/lib/telegram.sh +54 -0
  204. package/scripts/lib/thompson-sampling.sh +176 -0
  205. package/scripts/license-check.sh +74 -0
  206. package/scripts/mab-run.sh +575 -0
  207. package/scripts/module-size-check.sh +146 -0
  208. package/scripts/patterns/async-no-await.yml +5 -0
  209. package/scripts/patterns/bare-except.yml +6 -0
  210. package/scripts/patterns/empty-catch.yml +6 -0
  211. package/scripts/patterns/hardcoded-localhost.yml +9 -0
  212. package/scripts/patterns/retry-loop-no-backoff.yml +12 -0
  213. package/scripts/pipeline-status.sh +197 -0
  214. package/scripts/policy-check.sh +226 -0
  215. package/scripts/prior-art-search.sh +133 -0
  216. package/scripts/promote-mab-lessons.sh +126 -0
  217. package/scripts/prompts/agent-a-superpowers.md +29 -0
  218. package/scripts/prompts/agent-b-ralph.md +29 -0
  219. package/scripts/prompts/judge-agent.md +61 -0
  220. package/scripts/prompts/planner-agent.md +44 -0
  221. package/scripts/pull-community-lessons.sh +90 -0
  222. package/scripts/quality-gate.sh +266 -0
  223. package/scripts/research-gate.sh +90 -0
  224. package/scripts/run-plan.sh +329 -0
  225. package/scripts/scope-infer.sh +159 -0
  226. package/scripts/setup-ralph-loop.sh +155 -0
  227. package/scripts/telemetry.sh +230 -0
  228. package/scripts/tests/run-all-tests.sh +52 -0
  229. package/scripts/tests/test-act-cli.sh +46 -0
  230. package/scripts/tests/test-agents-md.sh +87 -0
  231. package/scripts/tests/test-analyze-report.sh +114 -0
  232. package/scripts/tests/test-architecture-map.sh +89 -0
  233. package/scripts/tests/test-auto-compound.sh +169 -0
  234. package/scripts/tests/test-batch-test.sh +65 -0
  235. package/scripts/tests/test-benchmark-runner.sh +25 -0
  236. package/scripts/tests/test-common.sh +168 -0
  237. package/scripts/tests/test-cost-tracking.sh +158 -0
  238. package/scripts/tests/test-echo-back.sh +180 -0
  239. package/scripts/tests/test-entropy-audit.sh +146 -0
  240. package/scripts/tests/test-failure-digest.sh +66 -0
  241. package/scripts/tests/test-generate-ast-rules.sh +145 -0
  242. package/scripts/tests/test-helpers.sh +82 -0
  243. package/scripts/tests/test-init.sh +47 -0
  244. package/scripts/tests/test-lesson-check.sh +278 -0
  245. package/scripts/tests/test-lesson-local.sh +55 -0
  246. package/scripts/tests/test-license-check.sh +109 -0
  247. package/scripts/tests/test-mab-run.sh +182 -0
  248. package/scripts/tests/test-ollama-lib.sh +49 -0
  249. package/scripts/tests/test-ollama.sh +60 -0
  250. package/scripts/tests/test-pipeline-status.sh +198 -0
  251. package/scripts/tests/test-policy-check.sh +124 -0
  252. package/scripts/tests/test-prior-art-search.sh +96 -0
  253. package/scripts/tests/test-progress-writer.sh +140 -0
  254. package/scripts/tests/test-promote-mab-lessons.sh +110 -0
  255. package/scripts/tests/test-pull-community-lessons.sh +149 -0
  256. package/scripts/tests/test-quality-gate.sh +241 -0
  257. package/scripts/tests/test-research-gate.sh +132 -0
  258. package/scripts/tests/test-run-plan-cli.sh +86 -0
  259. package/scripts/tests/test-run-plan-context.sh +305 -0
  260. package/scripts/tests/test-run-plan-e2e.sh +153 -0
  261. package/scripts/tests/test-run-plan-headless.sh +424 -0
  262. package/scripts/tests/test-run-plan-notify.sh +124 -0
  263. package/scripts/tests/test-run-plan-parser.sh +217 -0
  264. package/scripts/tests/test-run-plan-prompt.sh +254 -0
  265. package/scripts/tests/test-run-plan-quality-gate.sh +222 -0
  266. package/scripts/tests/test-run-plan-routing.sh +178 -0
  267. package/scripts/tests/test-run-plan-scoring.sh +148 -0
  268. package/scripts/tests/test-run-plan-state.sh +261 -0
  269. package/scripts/tests/test-run-plan-team.sh +157 -0
  270. package/scripts/tests/test-scope-infer.sh +150 -0
  271. package/scripts/tests/test-setup-ralph-loop.sh +63 -0
  272. package/scripts/tests/test-telegram-env.sh +38 -0
  273. package/scripts/tests/test-telegram.sh +121 -0
  274. package/scripts/tests/test-telemetry.sh +46 -0
  275. package/scripts/tests/test-thompson-sampling.sh +139 -0
  276. package/scripts/tests/test-validate-all.sh +60 -0
  277. package/scripts/tests/test-validate-commands.sh +89 -0
  278. package/scripts/tests/test-validate-hooks.sh +98 -0
  279. package/scripts/tests/test-validate-lessons.sh +150 -0
  280. package/scripts/tests/test-validate-plan-quality.sh +235 -0
  281. package/scripts/tests/test-validate-plans.sh +187 -0
  282. package/scripts/tests/test-validate-plugin.sh +106 -0
  283. package/scripts/tests/test-validate-prd.sh +184 -0
  284. package/scripts/tests/test-validate-skills.sh +134 -0
  285. package/scripts/validate-all.sh +57 -0
  286. package/scripts/validate-commands.sh +67 -0
  287. package/scripts/validate-hooks.sh +89 -0
  288. package/scripts/validate-lessons.sh +98 -0
  289. package/scripts/validate-plan-quality.sh +369 -0
  290. package/scripts/validate-plans.sh +120 -0
  291. package/scripts/validate-plugin.sh +86 -0
  292. package/scripts/validate-policies.sh +42 -0
  293. package/scripts/validate-prd.sh +118 -0
  294. package/scripts/validate-skills.sh +96 -0
  295. package/skills/autocode/SKILL.md +285 -0
  296. package/skills/autocode/ab-verification.md +51 -0
  297. package/skills/autocode/code-quality-standards.md +37 -0
  298. package/skills/autocode/competitive-mode.md +364 -0
  299. package/skills/brainstorming/SKILL.md +97 -0
  300. package/skills/capture-lesson/SKILL.md +187 -0
  301. package/skills/check-lessons/SKILL.md +116 -0
  302. package/skills/dispatching-parallel-agents/SKILL.md +110 -0
  303. package/skills/executing-plans/SKILL.md +85 -0
  304. package/skills/finishing-a-development-branch/SKILL.md +201 -0
  305. package/skills/receiving-code-review/SKILL.md +72 -0
  306. package/skills/requesting-code-review/SKILL.md +59 -0
  307. package/skills/requesting-code-review/code-reviewer.md +82 -0
  308. package/skills/research/SKILL.md +145 -0
  309. package/skills/roadmap/SKILL.md +115 -0
  310. package/skills/subagent-driven-development/SKILL.md +98 -0
  311. package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +18 -0
  312. package/skills/subagent-driven-development/implementer-prompt.md +73 -0
  313. package/skills/subagent-driven-development/spec-reviewer-prompt.md +57 -0
  314. package/skills/systematic-debugging/SKILL.md +134 -0
  315. package/skills/systematic-debugging/condition-based-waiting.md +64 -0
  316. package/skills/systematic-debugging/defense-in-depth.md +32 -0
  317. package/skills/systematic-debugging/root-cause-tracing.md +55 -0
  318. package/skills/test-driven-development/SKILL.md +167 -0
  319. package/skills/using-git-worktrees/SKILL.md +219 -0
  320. package/skills/using-superpowers/SKILL.md +54 -0
  321. package/skills/verification-before-completion/SKILL.md +140 -0
  322. package/skills/verify/SKILL.md +82 -0
  323. package/skills/writing-plans/SKILL.md +128 -0
  324. package/skills/writing-skills/SKILL.md +93 -0
@@ -0,0 +1,54 @@
1
+ ---
2
+ name: using-superpowers
3
+ description: Use when starting any conversation - establishes how to find and use skills, requiring Skill tool invocation before ANY response including clarifying questions
4
+ version: 1.0.0
5
+ ---
6
+
7
+ <EXTREMELY-IMPORTANT>
8
+ If you think there is even a 1% chance a skill might apply to what you are doing, you ABSOLUTELY MUST invoke the skill.
9
+
10
+ IF A SKILL APPLIES TO YOUR TASK, YOU DO NOT HAVE A CHOICE. YOU MUST USE IT.
11
+
12
+ This is not negotiable. This is not optional. You cannot rationalize your way out of this.
13
+ </EXTREMELY-IMPORTANT>
14
+
15
+ ## How to Access Skills
16
+
17
+ **In Claude Code:** Use the `Skill` tool. When you invoke a skill, its content is loaded and presented to you—follow it directly. Never use the Read tool on skill files.
18
+
19
+ **In other environments:** Check your platform's documentation for how skills are loaded.
20
+
21
+ # Using Skills
22
+
23
+ ## The Rule
24
+
25
+ **Invoke relevant or requested skills BEFORE any response or action.** Even a 1% chance a skill might apply means that you should invoke the skill to check.
26
+
27
+ ## Red Flags
28
+
29
+ These thoughts mean STOP—you're rationalizing:
30
+
31
+ | Thought | Reality |
32
+ |---------|---------|
33
+ | "This is just a simple question" | Questions are tasks. Check for skills. |
34
+ | "I need more context first" | Skill check comes BEFORE clarifying questions. |
35
+ | "Let me explore the codebase first" | Skills tell you HOW to explore. Check first. |
36
+ | "This doesn't need a formal skill" | If a skill exists, use it. |
37
+ | "I remember this skill" | Skills evolve. Invoke the skill to load its current version. |
38
+ | "The skill is overkill" | Simple things become complex. Use it. |
39
+
40
+ ## Skill Priority
41
+
42
+ When multiple skills could apply, use this order:
43
+
44
+ 1. **Process skills first** (brainstorming, debugging) - these determine HOW to approach the task
45
+ 2. **Implementation skills second** (frontend-design, mcp-builder) - these guide execution
46
+
47
+ ## Skill Types
48
+
49
+ **Rigid** (TDD, debugging): Follow exactly. Don't adapt away discipline.
50
+ **Flexible** (patterns): Adapt principles to context.
51
+
52
+ ## User Instructions
53
+
54
+ Instructions say WHAT, not HOW. "Add X" or "Fix Y" doesn't mean skip workflows.
@@ -0,0 +1,140 @@
1
+ ---
2
+ name: verification-before-completion
3
+ description: Use when about to claim work is complete, fixed, or passing, before committing or creating PRs - requires running verification commands and confirming output before making any success claims; evidence before assertions always
4
+ version: 1.0.0
5
+ ---
6
+
7
+ # Verification Before Completion
8
+
9
+ ## Overview
10
+
11
+ Claiming work is complete without verification is dishonesty, not efficiency.
12
+
13
+ **Core principle:** Evidence before claims, always.
14
+
15
+ **Violating the letter of this rule is violating the spirit of this rule.**
16
+
17
+ ## The Iron Law
18
+
19
+ ```
20
+ NO COMPLETION CLAIMS WITHOUT FRESH VERIFICATION EVIDENCE
21
+ ```
22
+
23
+ If you haven't run the verification command in this message, you cannot claim it passes.
24
+
25
+ ## The Gate Function
26
+
27
+ ```
28
+ BEFORE claiming any status or expressing satisfaction:
29
+
30
+ 1. IDENTIFY: What command proves this claim?
31
+ 2. RUN: Execute the FULL command (fresh, complete)
32
+ 3. READ: Full output, check exit code, count failures
33
+ 4. VERIFY: Does output confirm the claim?
34
+ - If NO: State actual status with evidence
35
+ - If YES: State claim WITH evidence
36
+ 5. ONLY THEN: Make the claim
37
+
38
+ Skip any step = lying, not verifying
39
+ ```
40
+
41
+ ## Common Failures
42
+
43
+ | Claim | Requires | Not Sufficient |
44
+ |-------|----------|----------------|
45
+ | Tests pass | Test command output: 0 failures | Previous run, "should pass" |
46
+ | Linter clean | Linter output: 0 errors | Partial check, extrapolation |
47
+ | Build succeeds | Build command: exit 0 | Linter passing, logs look good |
48
+ | Bug fixed | Test original symptom: passes | Code changed, assumed fixed |
49
+ | Regression test works | Red-green cycle verified | Test passes once |
50
+ | Agent completed | VCS diff shows changes | Agent reports "success" |
51
+ | Requirements met | Line-by-line checklist | Tests passing |
52
+
53
+ ## Red Flags - STOP
54
+
55
+ - Using "should", "probably", "seems to"
56
+ - Expressing satisfaction before verification ("Great!", "Perfect!", "Done!", etc.)
57
+ - About to commit/push/PR without verification
58
+ - Trusting agent success reports
59
+ - Relying on partial verification
60
+ - Thinking "just this once"
61
+ - Tired and wanting work over
62
+ - **ANY wording implying success without having run verification**
63
+
64
+ ## Rationalization Prevention
65
+
66
+ | Excuse | Reality |
67
+ |--------|---------|
68
+ | "Should work now" | RUN the verification |
69
+ | "I'm confident" | Confidence ≠ evidence |
70
+ | "Just this once" | No exceptions |
71
+ | "Linter passed" | Linter ≠ compiler |
72
+ | "Agent said success" | Verify independently |
73
+ | "I'm tired" | Exhaustion ≠ excuse |
74
+ | "Partial check is enough" | Partial proves nothing |
75
+ | "Different words so rule doesn't apply" | Spirit over letter |
76
+
77
+ ## Key Patterns
78
+
79
+ **Tests:**
80
+ ```
81
+ ✅ [Run test command] [See: 34/34 pass] "All tests pass"
82
+ ❌ "Should pass now" / "Looks correct"
83
+ ```
84
+
85
+ **Regression tests (TDD Red-Green):**
86
+ ```
87
+ ✅ Write → Run (pass) → Revert fix → Run (MUST FAIL) → Restore → Run (pass)
88
+ ❌ "I've written a regression test" (without red-green verification)
89
+ ```
90
+
91
+ **Build:**
92
+ ```
93
+ ✅ [Run build] [See: exit 0] "Build passes"
94
+ ❌ "Linter passed" (linter doesn't check compilation)
95
+ ```
96
+
97
+ **Requirements:**
98
+ ```
99
+ ✅ Re-read plan → Create checklist → Verify each → Report gaps or completion
100
+ ❌ "Tests pass, phase complete"
101
+ ```
102
+
103
+ **Agent delegation:**
104
+ ```
105
+ ✅ Agent reports success → Check VCS diff → Verify changes → Report actual state
106
+ ❌ Trust agent report
107
+ ```
108
+
109
+ ## Why This Matters
110
+
111
+ From 24 failure memories:
112
+ - Your human partner said "I don't believe you" - trust broken
113
+ - Undefined functions shipped - would crash
114
+ - Missing requirements shipped - incomplete features
115
+ - Time wasted on false completion → redirect → rework
116
+ - Violates: "Honesty is a core value. If you lie, you'll be replaced."
117
+
118
+ ## When To Apply
119
+
120
+ **ALWAYS before:**
121
+ - ANY variation of success/completion claims
122
+ - ANY expression of satisfaction
123
+ - ANY positive statement about work state
124
+ - Committing, PR creation, task completion
125
+ - Moving to next task
126
+ - Delegating to agents
127
+
128
+ **Rule applies to:**
129
+ - Exact phrases
130
+ - Paraphrases and synonyms
131
+ - Implications of success
132
+ - ANY communication suggesting completion/correctness
133
+
134
+ ## The Bottom Line
135
+
136
+ **No shortcuts for verification.**
137
+
138
+ Run the command. Read the output. THEN claim the result.
139
+
140
+ This is non-negotiable.
@@ -0,0 +1,82 @@
1
+ ---
2
+ name: verify
3
+ description: Self-verification checklist — run before declaring work complete, committing, or creating PRs
4
+ disable-model-invocation: true
5
+ version: 1.0.0
6
+ ---
7
+
8
+ ## Dependencies
9
+ - Bash tool (git, test runners, linters)
10
+
11
+ Run a verification pass on the work just completed. Do NOT skip steps.
12
+
13
+ ## Step 1: Check what changed
14
+
15
+ 1. `git diff --stat` — list modified files
16
+ 2. `git diff --cached --stat` — list staged files
17
+ 3. If no git repo, list files you created or modified this session
18
+
19
+ ## Step 2: Run automated checks (if available)
20
+
21
+ Try each in order, skip if not applicable:
22
+
23
+ 1. **Tests:** Look for test runner config. Run tests. Report pass/fail count.
24
+ 2. **Linter:** Look for linter config. Run linter. Report issue count.
25
+ 3. **Type check:** Look for `tsconfig.json` or `mypy.ini`. Run type checker.
26
+ 4. **Build:** If there's a build step, run it.
27
+
28
+ ## Step 2.5: Integration Wiring + Lesson Scanner
29
+
30
+ **Run this step if the session built multiple components across batches.**
31
+
32
+ 1. **Integration wiring check:** Confirm every shared module built this session is imported/called by its consumer.
33
+ 2. **Lesson scanner:** Dispatch `lesson-scanner` agent against modified files.
34
+ 3. **Contract tests:** For parallel feature lists, verify a contract test exists.
35
+
36
+ ## Step 3: Pipeline testing (if service has API, UI, or multi-layer data flow)
37
+
38
+ ### 3a: Horizontal sweep — every endpoint/interface works
39
+
40
+ Hit every API endpoint, CLI command, and static file with a known input. Confirms the **surface exists and responds.**
41
+
42
+ ### 3b: Vertical trace — one input flows through the entire stack
43
+
44
+ Submit one real input and trace it through every layer. Confirms **data flows end-to-end and state accumulates correctly.**
45
+
46
+ ### Why both axes are required
47
+
48
+ Horizontal catches: missing routes, broken static files, schema errors, 500s.
49
+ Vertical catches: path prefix mismatches, missing state updates, aggregate bugs.
50
+
51
+ **If time-constrained:** Run the vertical trace — it catches more integration bugs per minute.
52
+
53
+ ## Step 4: Manual verification checklist
54
+
55
+ For each file changed, verify:
56
+
57
+ - [ ] Does the change do what was asked?
58
+ - [ ] No secrets committed
59
+ - [ ] No debug artifacts left
60
+ - [ ] File permissions correct
61
+ - [ ] If config changed: service reloaded/restarted?
62
+
63
+ ## Step 5: Report
64
+
65
+ Present as:
66
+
67
+ ```
68
+ VERIFICATION — <date>
69
+ Files changed: N
70
+ Tests: X passed, Y failed (or N/A)
71
+ Lint: X issues (or N/A)
72
+ Types: clean (or N/A)
73
+ Pipeline (horizontal): X/Y endpoints pass (or N/A)
74
+ Pipeline (vertical): data traced input→output / [list gaps] (or N/A)
75
+ Manual checks: all clear / [list issues]
76
+ ```
77
+
78
+ ## Anti-patterns
79
+
80
+ - NEVER say "looks good" without running actual commands
81
+ - NEVER skip the git diff
82
+ - NEVER declare work complete if any test fails
@@ -0,0 +1,128 @@
1
+ ---
2
+ name: writing-plans
3
+ description: Use when you have a spec or requirements for a multi-step task, before touching code
4
+ version: 1.0.0
5
+ ---
6
+
7
+ # Writing Plans
8
+
9
+ ## Overview
10
+
11
+ Write comprehensive implementation plans assuming the engineer has zero context for our codebase and questionable taste. Document everything they need to know: which files to touch for each task, code, testing, docs they might need to check, how to test it. Give them the whole plan as bite-sized tasks. DRY. YAGNI. TDD. Frequent commits.
12
+
13
+ Assume they are a skilled developer, but know almost nothing about our toolset or problem domain. Assume they don't know good test design very well.
14
+
15
+ **Announce at start:** "I'm using the writing-plans skill to create the implementation plan."
16
+
17
+ **Context:** This should be run in a dedicated worktree (created by the brainstorming skill).
18
+
19
+ **Save plans to:** `docs/plans/YYYY-MM-DD-<feature-name>.md`
20
+
21
+ ## Bite-Sized Task Granularity
22
+
23
+ **Each step is one action (2-5 minutes):**
24
+ - "Write the failing test" - step
25
+ - "Run it to make sure it fails" - step
26
+ - "Implement the minimal code to make the test pass" - step
27
+ - "Run the tests and make sure they pass" - step
28
+ - "Commit" - step
29
+
30
+ ## Plan Document Header
31
+
32
+ **Every plan MUST start with this header:**
33
+
34
+ ```markdown
35
+ # [Feature Name] Implementation Plan
36
+
37
+ > **For Claude:** REQUIRED SUB-SKILL: Use superpowers:executing-plans to implement this plan task-by-task.
38
+
39
+ **Goal:** [One sentence describing what this builds]
40
+
41
+ **Architecture:** [2-3 sentences about approach]
42
+
43
+ **Tech Stack:** [Key technologies/libraries]
44
+
45
+ ---
46
+ ```
47
+
48
+ ## Task Structure
49
+
50
+ ````markdown
51
+ ### Task N: [Component Name]
52
+
53
+ **Files:**
54
+ - Create: `exact/path/to/file.py`
55
+ - Modify: `exact/path/to/existing.py:123-145`
56
+ - Test: `tests/exact/path/to/test.py`
57
+
58
+ **Step 1: Write the failing test**
59
+
60
+ ```python
61
+ def test_specific_behavior():
62
+     result = function(input)
63
+     assert result == expected
64
+ ```
65
+
66
+ **Step 2: Run test to verify it fails**
67
+
68
+ Run: `pytest tests/path/test.py::test_name -v`
69
+ Expected: FAIL with "NameError: name 'function' is not defined"
70
+
71
+ **Step 3: Write minimal implementation**
72
+
73
+ ```python
74
+ def function(input):
75
+     return expected
76
+ ```
77
+
78
+ **Step 4: Run test to verify it passes**
79
+
80
+ Run: `pytest tests/path/test.py::test_name -v`
81
+ Expected: PASS
82
+
83
+ **Step 5: Commit**
84
+
85
+ ```bash
86
+ git add tests/path/test.py src/path/file.py
87
+ git commit -m "feat: add specific feature"
88
+ ```
89
+ ````
90
+
91
+ ## Remember
92
+ - Exact file paths always
93
+ - Complete code in plan (not "add validation")
94
+ - Exact commands with expected output
95
+ - Reference relevant skills with @ syntax
96
+ - DRY, YAGNI, TDD, frequent commits
97
+
98
+ ## Execution Handoff
99
+
100
+ After saving the plan, offer execution choice:
101
+
102
+ **"Plan complete and saved to `docs/plans/<filename>.md`. Three execution options:**
103
+
104
+ **1. Subagent-Driven (this session)** - I dispatch a fresh subagent per task with two-stage review, fast iteration, you watch progress
105
+
106
+ **2. Parallel Session (separate)** - Open new session with executing-plans, batch execution with human review checkpoints
107
+
108
+ **3. Headless (walk away)** - Run `scripts/run-plan.sh` in the background. Fresh `claude -p` per batch, quality gates between batches, resume on interruption. Best for 5+ batch plans.
109
+
110
+ **Which approach?"**
111
+
112
+ **If Subagent-Driven chosen:**
113
+ - **REQUIRED SUB-SKILL:** Use superpowers:subagent-driven-development
114
+ - Stay in this session
115
+ - Fresh subagent per task + code review
116
+
117
+ **If Parallel Session chosen:**
118
+ - Guide them to open new session in worktree
119
+ - **REQUIRED SUB-SKILL:** New session uses superpowers:executing-plans
120
+
121
+ **If Headless chosen:**
122
+ - Generate the run command with appropriate flags:
123
+ ```bash
124
+ scripts/run-plan.sh docs/plans/<plan-file>.md --quality-gate "scripts/quality-gate.sh --project-root ."
125
+ ```
126
+ - If the plan has critical batches, suggest `--mode competitive --competitive-batches N,M`
127
+ - For long plans (10+ batches), suggest `--on-failure retry --max-retries 3`
128
+ - Remind them: `--resume` picks up where it left off after interruption
@@ -0,0 +1,93 @@
1
+ ---
2
+ name: writing-skills
3
+ description: Use when creating new skills, editing existing skills, or verifying skills work before deployment
4
+ version: 1.0.0
5
+ ---
6
+
7
+ # Writing Skills
8
+
9
+ ## Overview
10
+
11
+ **Writing skills IS Test-Driven Development applied to process documentation.**
12
+
13
+ You write test cases (pressure scenarios with subagents), watch them fail (baseline behavior), write the skill (documentation), watch tests pass (agents comply), and refactor (close loopholes).
14
+
15
+ **Core principle:** If you didn't watch an agent fail without the skill, you don't know if the skill teaches the right thing.
16
+
17
+ ## What is a Skill?
18
+
19
+ A **skill** is a reference guide for proven techniques, patterns, or tools. Skills help future Claude instances find and apply effective approaches.
20
+
21
+ **Skills are:** Reusable techniques, patterns, tools, reference guides
22
+ **Skills are NOT:** Narratives about how you solved a problem once
23
+
24
+ ## SKILL.md Structure
25
+
26
+ **Frontmatter (YAML):**
27
+ - Two required fields: `name` and `description` (skills in this toolkit also carry an optional `version` field)
28
+ - Max 1024 characters total
29
+ - `name`: Use letters, numbers, and hyphens only
30
+ - `description`: Third-person, describes ONLY when to use (NOT what it does)
31
+
32
+ ```markdown
33
+ ---
34
+ name: skill-name-with-hyphens
35
+ description: Use when [specific triggering conditions and symptoms]
36
+ ---
37
+
38
+ # Skill Name
39
+
40
+ ## Overview
41
+ What is this? Core principle in 1-2 sentences.
42
+
43
+ ## When to Use
44
+ Bullet list with SYMPTOMS and use cases
45
+
46
+ ## Core Pattern
47
+ Before/after code comparison
48
+
49
+ ## Quick Reference
50
+ Table or bullets for scanning
51
+
52
+ ## Common Mistakes
53
+ What goes wrong + fixes
54
+ ```
55
+
56
+ ## The Iron Law (Same as TDD)
57
+
58
+ ```
59
+ NO SKILL WITHOUT A FAILING TEST FIRST
60
+ ```
61
+
62
+ Write skill before testing? Delete it. Start over.
63
+
64
+ ## RED-GREEN-REFACTOR for Skills
65
+
66
+ ### RED: Write Failing Test (Baseline)
67
+ Run pressure scenario with subagent WITHOUT the skill. Document exact behavior.
68
+
69
+ ### GREEN: Write Minimal Skill
70
+ Write skill that addresses those specific rationalizations. Run same scenarios WITH skill.
71
+
72
+ ### REFACTOR: Close Loopholes
73
+ Agent found new rationalization? Add explicit counter. Re-test until bulletproof.
74
+
75
+ ## Skill Creation Checklist
76
+
77
+ **RED Phase:**
78
+ - [ ] Create pressure scenarios
79
+ - [ ] Run scenarios WITHOUT skill - document baseline
80
+ - [ ] Identify patterns in rationalizations/failures
81
+
82
+ **GREEN Phase:**
83
+ - [ ] Name uses only letters, numbers, hyphens
84
+ - [ ] YAML frontmatter with `name` and `description` (plus optional `version`)
85
+ - [ ] Description starts with "Use when..."
86
+ - [ ] Address specific baseline failures
87
+ - [ ] Run scenarios WITH skill - verify compliance
88
+
89
+ **REFACTOR Phase:**
90
+ - [ ] Identify NEW rationalizations from testing
91
+ - [ ] Add explicit counters
92
+ - [ ] Build rationalization table
93
+ - [ ] Re-test until bulletproof