cognitive-core 0.2.0 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (397)
  1. package/.claude/settings.json +111 -2
  2. package/.sessionlog/settings.json +4 -0
  3. package/dist/atlas.d.ts +10 -0
  4. package/dist/atlas.d.ts.map +1 -1
  5. package/dist/atlas.js +65 -0
  6. package/dist/atlas.js.map +1 -1
  7. package/dist/index.d.ts +1 -1
  8. package/dist/index.d.ts.map +1 -1
  9. package/dist/index.js +5 -1
  10. package/dist/index.js.map +1 -1
  11. package/dist/learning/index.d.ts +1 -1
  12. package/dist/learning/index.d.ts.map +1 -1
  13. package/dist/learning/index.js.map +1 -1
  14. package/dist/learning/pipeline.d.ts +4 -31
  15. package/dist/learning/pipeline.d.ts.map +1 -1
  16. package/dist/learning/pipeline.js +12 -64
  17. package/dist/learning/pipeline.js.map +1 -1
  18. package/dist/learning/unified-pipeline.d.ts +30 -0
  19. package/dist/learning/unified-pipeline.d.ts.map +1 -1
  20. package/dist/learning/unified-pipeline.js +207 -0
  21. package/dist/learning/unified-pipeline.js.map +1 -1
  22. package/dist/memory/candidate-retrieval.d.ts.map +1 -1
  23. package/dist/memory/candidate-retrieval.js +3 -1
  24. package/dist/memory/candidate-retrieval.js.map +1 -1
  25. package/dist/memory/curated-loader.d.ts +21 -4
  26. package/dist/memory/curated-loader.d.ts.map +1 -1
  27. package/dist/memory/curated-loader.js +53 -16
  28. package/dist/memory/curated-loader.js.map +1 -1
  29. package/dist/memory/index.d.ts +2 -1
  30. package/dist/memory/index.d.ts.map +1 -1
  31. package/dist/memory/index.js +3 -1
  32. package/dist/memory/index.js.map +1 -1
  33. package/dist/memory/playbook.d.ts +6 -0
  34. package/dist/memory/playbook.d.ts.map +1 -1
  35. package/dist/memory/playbook.js +15 -0
  36. package/dist/memory/playbook.js.map +1 -1
  37. package/dist/memory/source-resolver.d.ts +120 -0
  38. package/dist/memory/source-resolver.d.ts.map +1 -0
  39. package/dist/memory/source-resolver.js +300 -0
  40. package/dist/memory/source-resolver.js.map +1 -0
  41. package/dist/types/config.d.ts +141 -0
  42. package/dist/types/config.d.ts.map +1 -1
  43. package/dist/types/config.js +40 -0
  44. package/dist/types/config.js.map +1 -1
  45. package/dist/types/index.d.ts +1 -1
  46. package/dist/types/index.d.ts.map +1 -1
  47. package/dist/types/index.js +1 -1
  48. package/dist/types/index.js.map +1 -1
  49. package/dist/utils/error-classifier.js +8 -8
  50. package/dist/utils/error-classifier.js.map +1 -1
  51. package/dist/workspace/efficacy-toolkit.d.ts +164 -0
  52. package/dist/workspace/efficacy-toolkit.d.ts.map +1 -0
  53. package/dist/workspace/efficacy-toolkit.js +281 -0
  54. package/dist/workspace/efficacy-toolkit.js.map +1 -0
  55. package/dist/workspace/index.d.ts +2 -1
  56. package/dist/workspace/index.d.ts.map +1 -1
  57. package/dist/workspace/index.js +3 -1
  58. package/dist/workspace/index.js.map +1 -1
  59. package/dist/workspace/templates/index.d.ts +3 -0
  60. package/dist/workspace/templates/index.d.ts.map +1 -1
  61. package/dist/workspace/templates/index.js +6 -0
  62. package/dist/workspace/templates/index.js.map +1 -1
  63. package/dist/workspace/templates/playbook-decay-detection.d.ts +46 -0
  64. package/dist/workspace/templates/playbook-decay-detection.d.ts.map +1 -0
  65. package/dist/workspace/templates/playbook-decay-detection.js +197 -0
  66. package/dist/workspace/templates/playbook-decay-detection.js.map +1 -0
  67. package/dist/workspace/templates/playbook-efficacy-audit.d.ts +46 -0
  68. package/dist/workspace/templates/playbook-efficacy-audit.d.ts.map +1 -0
  69. package/dist/workspace/templates/playbook-efficacy-audit.js +160 -0
  70. package/dist/workspace/templates/playbook-efficacy-audit.js.map +1 -0
  71. package/dist/workspace/templates/playbook-lifecycle-review.d.ts +51 -0
  72. package/dist/workspace/templates/playbook-lifecycle-review.d.ts.map +1 -0
  73. package/dist/workspace/templates/playbook-lifecycle-review.js +187 -0
  74. package/dist/workspace/templates/playbook-lifecycle-review.js.map +1 -0
  75. package/dist/workspace/types.d.ts +12 -54
  76. package/dist/workspace/types.d.ts.map +1 -1
  77. package/dist/workspace/types.js.map +1 -1
  78. package/package.json +8 -2
  79. package/playbooks/compound-engineering/adversarial-review.json +51 -0
  80. package/playbooks/compound-engineering/agent-native-architecture.json +59 -0
  81. package/playbooks/compound-engineering/agent-native-review.json +54 -0
  82. package/playbooks/compound-engineering/api-contract-review.json +52 -0
  83. package/playbooks/compound-engineering/brainstorm-requirements.json +55 -0
  84. package/playbooks/compound-engineering/bug-reproduction.json +62 -0
  85. package/playbooks/compound-engineering/confidence-calibration.json +49 -0
  86. package/playbooks/compound-engineering/correctness-review.json +49 -0
  87. package/playbooks/compound-engineering/data-migration-safety.json +59 -0
  88. package/playbooks/compound-engineering/deployment-verification.json +63 -0
  89. package/playbooks/compound-engineering/error-recovery-patterns.json +53 -0
  90. package/playbooks/compound-engineering/implementation-planning.json +64 -0
  91. package/playbooks/compound-engineering/issue-pattern-analysis.json +53 -0
  92. package/playbooks/compound-engineering/knowledge-compounding.json +63 -0
  93. package/playbooks/compound-engineering/learnings-research.json +54 -0
  94. package/playbooks/compound-engineering/maintainability-review.json +49 -0
  95. package/playbooks/compound-engineering/performance-review.json +54 -0
  96. package/playbooks/compound-engineering/plan-adversarial-review.json +56 -0
  97. package/playbooks/compound-engineering/plan-feasibility-review.json +56 -0
  98. package/playbooks/compound-engineering/project-standards-review.json +52 -0
  99. package/playbooks/compound-engineering/reliability-review.json +53 -0
  100. package/playbooks/compound-engineering/review-orchestration.json +64 -0
  101. package/playbooks/compound-engineering/security-review.json +54 -0
  102. package/playbooks/compound-engineering/systematic-execution.json +64 -0
  103. package/playbooks/compound-engineering/testing-review.json +50 -0
  104. package/src/atlas.ts +96 -0
  105. package/src/index.ts +27 -0
  106. package/src/learning/index.ts +1 -0
  107. package/src/learning/unified-pipeline.ts +271 -1
  108. package/src/memory/candidate-retrieval.ts +2 -1
  109. package/src/memory/curated-loader.ts +69 -16
  110. package/src/memory/index.ts +16 -0
  111. package/src/memory/playbook.ts +19 -0
  112. package/src/memory/source-resolver.ts +422 -0
  113. package/src/types/config.ts +46 -0
  114. package/src/types/index.ts +4 -0
  115. package/src/utils/error-classifier.ts +8 -8
  116. package/src/workspace/efficacy-toolkit.ts +496 -0
  117. package/src/workspace/index.ts +29 -0
  118. package/src/workspace/templates/index.ts +24 -0
  119. package/src/workspace/templates/playbook-decay-detection.ts +272 -0
  120. package/src/workspace/templates/playbook-efficacy-audit.ts +246 -0
  121. package/src/workspace/templates/playbook-lifecycle-review.ts +274 -0
  122. package/src/workspace/types.ts +22 -78
  123. package/tests/fixtures/behavioral-trajectories.ts +210 -0
  124. package/tests/integration/curated-sources-e2e.test.ts +502 -0
  125. package/tests/integration/pipeline-data-correctness.test.ts +794 -0
  126. package/tests/learning/meta-learner.test.ts +418 -0
  127. package/tests/learning/pipeline-memory-updates.test.ts +721 -0
  128. package/tests/learning/unified-pipeline-efficacy.test.ts +232 -0
  129. package/tests/memory/candidate-retrieval.test.ts +167 -0
  130. package/tests/memory/compound-engineering-seed.test.ts +338 -0
  131. package/tests/memory/curated-loader-extended.test.ts +225 -0
  132. package/tests/memory/meta.test.ts +399 -0
  133. package/tests/memory/playbook-quality-validation.test.ts +430 -0
  134. package/tests/memory/source-resolver.test.ts +700 -0
  135. package/tests/search/evaluator.test.ts +257 -0
  136. package/tests/search/verification-runner.test.ts +357 -0
  137. package/tests/utils/error-classifier.test.ts +149 -0
  138. package/tests/utils/trajectory-helpers.test.ts +163 -0
  139. package/tests/workspace/efficacy-toolkit.test.ts +404 -0
  140. package/tests/workspace/templates/playbook-efficacy.test.ts +377 -0
  141. package/.claude/settings.local.json +0 -11
  142. package/dist/learning/llm-extractor.d.ts +0 -88
  143. package/dist/learning/llm-extractor.d.ts.map +0 -1
  144. package/dist/learning/llm-extractor.js +0 -372
  145. package/dist/learning/llm-extractor.js.map +0 -1
  146. package/dist/learning/loop-coordinator.d.ts +0 -61
  147. package/dist/learning/loop-coordinator.d.ts.map +0 -1
  148. package/dist/learning/loop-coordinator.js +0 -96
  149. package/dist/learning/loop-coordinator.js.map +0 -1
  150. package/references/agent-workspace/CLAUDE.md +0 -74
  151. package/references/agent-workspace/README.md +0 -587
  152. package/references/agent-workspace/media/banner.png +0 -0
  153. package/references/agent-workspace/package-lock.json +0 -2061
  154. package/references/agent-workspace/package.json +0 -54
  155. package/references/agent-workspace/src/handle.ts +0 -122
  156. package/references/agent-workspace/src/index.ts +0 -32
  157. package/references/agent-workspace/src/manager.ts +0 -102
  158. package/references/agent-workspace/src/readers/json.ts +0 -71
  159. package/references/agent-workspace/src/readers/markdown.ts +0 -37
  160. package/references/agent-workspace/src/readers/raw.ts +0 -27
  161. package/references/agent-workspace/src/types.ts +0 -68
  162. package/references/agent-workspace/src/validation.ts +0 -93
  163. package/references/agent-workspace/src/writers/json.ts +0 -17
  164. package/references/agent-workspace/src/writers/markdown.ts +0 -27
  165. package/references/agent-workspace/src/writers/raw.ts +0 -22
  166. package/references/agent-workspace/tests/errors.test.ts +0 -652
  167. package/references/agent-workspace/tests/handle.test.ts +0 -144
  168. package/references/agent-workspace/tests/manager.test.ts +0 -124
  169. package/references/agent-workspace/tests/readers.test.ts +0 -205
  170. package/references/agent-workspace/tests/validation.test.ts +0 -196
  171. package/references/agent-workspace/tests/writers.test.ts +0 -108
  172. package/references/agent-workspace/tsconfig.json +0 -20
  173. package/references/agent-workspace/tsup.config.ts +0 -9
  174. package/references/minimem/.claude/settings.json +0 -7
  175. package/references/minimem/.sudocode/issues.jsonl +0 -18
  176. package/references/minimem/.sudocode/specs.jsonl +0 -1
  177. package/references/minimem/CLAUDE.md +0 -310
  178. package/references/minimem/README.md +0 -556
  179. package/references/minimem/claude-plugin/.claude-plugin/plugin.json +0 -10
  180. package/references/minimem/claude-plugin/.mcp.json +0 -7
  181. package/references/minimem/claude-plugin/README.md +0 -158
  182. package/references/minimem/claude-plugin/commands/recall.md +0 -47
  183. package/references/minimem/claude-plugin/commands/remember.md +0 -41
  184. package/references/minimem/claude-plugin/hooks/__tests__/hooks.test.ts +0 -272
  185. package/references/minimem/claude-plugin/hooks/hooks.json +0 -27
  186. package/references/minimem/claude-plugin/hooks/session-end.sh +0 -86
  187. package/references/minimem/claude-plugin/hooks/session-start.sh +0 -85
  188. package/references/minimem/claude-plugin/skills/memory/SKILL.md +0 -108
  189. package/references/minimem/package-lock.json +0 -5373
  190. package/references/minimem/package.json +0 -60
  191. package/references/minimem/scripts/postbuild.js +0 -35
  192. package/references/minimem/src/__tests__/edge-cases.test.ts +0 -371
  193. package/references/minimem/src/__tests__/errors.test.ts +0 -265
  194. package/references/minimem/src/__tests__/helpers.ts +0 -199
  195. package/references/minimem/src/__tests__/internal.test.ts +0 -407
  196. package/references/minimem/src/__tests__/knowledge.test.ts +0 -287
  197. package/references/minimem/src/__tests__/minimem.integration.test.ts +0 -1127
  198. package/references/minimem/src/__tests__/session.test.ts +0 -190
  199. package/references/minimem/src/cli/__tests__/commands.test.ts +0 -759
  200. package/references/minimem/src/cli/commands/__tests__/conflicts.test.ts +0 -141
  201. package/references/minimem/src/cli/commands/append.ts +0 -76
  202. package/references/minimem/src/cli/commands/config.ts +0 -262
  203. package/references/minimem/src/cli/commands/conflicts.ts +0 -413
  204. package/references/minimem/src/cli/commands/daemon.ts +0 -169
  205. package/references/minimem/src/cli/commands/index.ts +0 -12
  206. package/references/minimem/src/cli/commands/init.ts +0 -88
  207. package/references/minimem/src/cli/commands/mcp.ts +0 -177
  208. package/references/minimem/src/cli/commands/push-pull.ts +0 -213
  209. package/references/minimem/src/cli/commands/search.ts +0 -158
  210. package/references/minimem/src/cli/commands/status.ts +0 -84
  211. package/references/minimem/src/cli/commands/sync-init.ts +0 -290
  212. package/references/minimem/src/cli/commands/sync.ts +0 -70
  213. package/references/minimem/src/cli/commands/upsert.ts +0 -197
  214. package/references/minimem/src/cli/config.ts +0 -584
  215. package/references/minimem/src/cli/index.ts +0 -264
  216. package/references/minimem/src/cli/shared.ts +0 -161
  217. package/references/minimem/src/cli/sync/__tests__/central.test.ts +0 -152
  218. package/references/minimem/src/cli/sync/__tests__/conflicts.test.ts +0 -209
  219. package/references/minimem/src/cli/sync/__tests__/daemon.test.ts +0 -118
  220. package/references/minimem/src/cli/sync/__tests__/detection.test.ts +0 -207
  221. package/references/minimem/src/cli/sync/__tests__/integration.test.ts +0 -476
  222. package/references/minimem/src/cli/sync/__tests__/registry.test.ts +0 -363
  223. package/references/minimem/src/cli/sync/__tests__/state.test.ts +0 -255
  224. package/references/minimem/src/cli/sync/__tests__/validation.test.ts +0 -193
  225. package/references/minimem/src/cli/sync/__tests__/watcher.test.ts +0 -178
  226. package/references/minimem/src/cli/sync/central.ts +0 -292
  227. package/references/minimem/src/cli/sync/conflicts.ts +0 -204
  228. package/references/minimem/src/cli/sync/daemon.ts +0 -407
  229. package/references/minimem/src/cli/sync/detection.ts +0 -138
  230. package/references/minimem/src/cli/sync/index.ts +0 -107
  231. package/references/minimem/src/cli/sync/operations.ts +0 -373
  232. package/references/minimem/src/cli/sync/registry.ts +0 -279
  233. package/references/minimem/src/cli/sync/state.ts +0 -355
  234. package/references/minimem/src/cli/sync/validation.ts +0 -206
  235. package/references/minimem/src/cli/sync/watcher.ts +0 -234
  236. package/references/minimem/src/cli/version.ts +0 -34
  237. package/references/minimem/src/core/index.ts +0 -9
  238. package/references/minimem/src/core/indexer.ts +0 -628
  239. package/references/minimem/src/core/searcher.ts +0 -221
  240. package/references/minimem/src/db/schema.ts +0 -183
  241. package/references/minimem/src/db/sqlite-vec.ts +0 -24
  242. package/references/minimem/src/embeddings/__tests__/embeddings.test.ts +0 -431
  243. package/references/minimem/src/embeddings/batch-gemini.ts +0 -392
  244. package/references/minimem/src/embeddings/batch-openai.ts +0 -409
  245. package/references/minimem/src/embeddings/embeddings.ts +0 -434
  246. package/references/minimem/src/index.ts +0 -109
  247. package/references/minimem/src/internal.ts +0 -299
  248. package/references/minimem/src/minimem.ts +0 -1276
  249. package/references/minimem/src/search/__tests__/hybrid.test.ts +0 -247
  250. package/references/minimem/src/search/graph.ts +0 -234
  251. package/references/minimem/src/search/hybrid.ts +0 -151
  252. package/references/minimem/src/search/search.ts +0 -256
  253. package/references/minimem/src/server/__tests__/mcp.test.ts +0 -341
  254. package/references/minimem/src/server/__tests__/tools.test.ts +0 -364
  255. package/references/minimem/src/server/mcp.ts +0 -326
  256. package/references/minimem/src/server/tools.ts +0 -720
  257. package/references/minimem/src/session.ts +0 -460
  258. package/references/minimem/tsconfig.json +0 -19
  259. package/references/minimem/tsup.config.ts +0 -26
  260. package/references/minimem/vitest.config.ts +0 -24
  261. package/references/sessionlog/.husky/pre-commit +0 -1
  262. package/references/sessionlog/.lintstagedrc.json +0 -4
  263. package/references/sessionlog/.prettierignore +0 -4
  264. package/references/sessionlog/.prettierrc.json +0 -11
  265. package/references/sessionlog/LICENSE +0 -21
  266. package/references/sessionlog/README.md +0 -453
  267. package/references/sessionlog/eslint.config.js +0 -58
  268. package/references/sessionlog/package-lock.json +0 -3672
  269. package/references/sessionlog/package.json +0 -65
  270. package/references/sessionlog/src/__tests__/agent-hooks.test.ts +0 -570
  271. package/references/sessionlog/src/__tests__/agent-registry.test.ts +0 -127
  272. package/references/sessionlog/src/__tests__/claude-code-hooks.test.ts +0 -225
  273. package/references/sessionlog/src/__tests__/claude-generator.test.ts +0 -46
  274. package/references/sessionlog/src/__tests__/commit-msg.test.ts +0 -86
  275. package/references/sessionlog/src/__tests__/cursor-agent.test.ts +0 -224
  276. package/references/sessionlog/src/__tests__/e2e-live.test.ts +0 -890
  277. package/references/sessionlog/src/__tests__/event-log.test.ts +0 -183
  278. package/references/sessionlog/src/__tests__/flush-sentinel.test.ts +0 -105
  279. package/references/sessionlog/src/__tests__/gemini-agent.test.ts +0 -375
  280. package/references/sessionlog/src/__tests__/git-hooks.test.ts +0 -78
  281. package/references/sessionlog/src/__tests__/hook-managers.test.ts +0 -121
  282. package/references/sessionlog/src/__tests__/lifecycle-tasks.test.ts +0 -759
  283. package/references/sessionlog/src/__tests__/opencode-agent.test.ts +0 -338
  284. package/references/sessionlog/src/__tests__/redaction.test.ts +0 -136
  285. package/references/sessionlog/src/__tests__/session-repo.test.ts +0 -353
  286. package/references/sessionlog/src/__tests__/session-store.test.ts +0 -166
  287. package/references/sessionlog/src/__tests__/setup-ccweb.test.ts +0 -466
  288. package/references/sessionlog/src/__tests__/skill-live.test.ts +0 -461
  289. package/references/sessionlog/src/__tests__/summarize.test.ts +0 -348
  290. package/references/sessionlog/src/__tests__/task-plan-e2e.test.ts +0 -610
  291. package/references/sessionlog/src/__tests__/task-plan-live.test.ts +0 -632
  292. package/references/sessionlog/src/__tests__/transcript-timestamp.test.ts +0 -121
  293. package/references/sessionlog/src/__tests__/types.test.ts +0 -166
  294. package/references/sessionlog/src/__tests__/utils.test.ts +0 -333
  295. package/references/sessionlog/src/__tests__/validation.test.ts +0 -103
  296. package/references/sessionlog/src/__tests__/worktree.test.ts +0 -57
  297. package/references/sessionlog/src/agent/agents/claude-code.ts +0 -1089
  298. package/references/sessionlog/src/agent/agents/cursor.ts +0 -361
  299. package/references/sessionlog/src/agent/agents/gemini-cli.ts +0 -632
  300. package/references/sessionlog/src/agent/agents/opencode.ts +0 -540
  301. package/references/sessionlog/src/agent/registry.ts +0 -143
  302. package/references/sessionlog/src/agent/session-types.ts +0 -113
  303. package/references/sessionlog/src/agent/types.ts +0 -220
  304. package/references/sessionlog/src/cli.ts +0 -597
  305. package/references/sessionlog/src/commands/clean.ts +0 -133
  306. package/references/sessionlog/src/commands/disable.ts +0 -84
  307. package/references/sessionlog/src/commands/doctor.ts +0 -145
  308. package/references/sessionlog/src/commands/enable.ts +0 -202
  309. package/references/sessionlog/src/commands/explain.ts +0 -261
  310. package/references/sessionlog/src/commands/reset.ts +0 -105
  311. package/references/sessionlog/src/commands/resume.ts +0 -180
  312. package/references/sessionlog/src/commands/rewind.ts +0 -195
  313. package/references/sessionlog/src/commands/setup-ccweb.ts +0 -275
  314. package/references/sessionlog/src/commands/status.ts +0 -172
  315. package/references/sessionlog/src/config.ts +0 -165
  316. package/references/sessionlog/src/events/event-log.ts +0 -126
  317. package/references/sessionlog/src/git-operations.ts +0 -558
  318. package/references/sessionlog/src/hooks/git-hooks.ts +0 -165
  319. package/references/sessionlog/src/hooks/lifecycle.ts +0 -391
  320. package/references/sessionlog/src/index.ts +0 -650
  321. package/references/sessionlog/src/security/redaction.ts +0 -283
  322. package/references/sessionlog/src/session/state-machine.ts +0 -452
  323. package/references/sessionlog/src/store/checkpoint-store.ts +0 -509
  324. package/references/sessionlog/src/store/native-store.ts +0 -173
  325. package/references/sessionlog/src/store/provider-types.ts +0 -99
  326. package/references/sessionlog/src/store/session-store.ts +0 -266
  327. package/references/sessionlog/src/strategy/attribution.ts +0 -296
  328. package/references/sessionlog/src/strategy/common.ts +0 -207
  329. package/references/sessionlog/src/strategy/content-overlap.ts +0 -228
  330. package/references/sessionlog/src/strategy/manual-commit.ts +0 -988
  331. package/references/sessionlog/src/strategy/types.ts +0 -279
  332. package/references/sessionlog/src/summarize/claude-generator.ts +0 -115
  333. package/references/sessionlog/src/summarize/summarize.ts +0 -432
  334. package/references/sessionlog/src/types.ts +0 -508
  335. package/references/sessionlog/src/utils/chunk-files.ts +0 -49
  336. package/references/sessionlog/src/utils/commit-message.ts +0 -65
  337. package/references/sessionlog/src/utils/detect-agent.ts +0 -36
  338. package/references/sessionlog/src/utils/hook-managers.ts +0 -125
  339. package/references/sessionlog/src/utils/ide-tags.ts +0 -32
  340. package/references/sessionlog/src/utils/paths.ts +0 -79
  341. package/references/sessionlog/src/utils/preview-rewind.ts +0 -80
  342. package/references/sessionlog/src/utils/rewind-conflict.ts +0 -121
  343. package/references/sessionlog/src/utils/shadow-branch.ts +0 -109
  344. package/references/sessionlog/src/utils/string-utils.ts +0 -46
  345. package/references/sessionlog/src/utils/todo-extract.ts +0 -188
  346. package/references/sessionlog/src/utils/trailers.ts +0 -187
  347. package/references/sessionlog/src/utils/transcript-parse.ts +0 -177
  348. package/references/sessionlog/src/utils/transcript-timestamp.ts +0 -59
  349. package/references/sessionlog/src/utils/tree-ops.ts +0 -219
  350. package/references/sessionlog/src/utils/tty.ts +0 -72
  351. package/references/sessionlog/src/utils/validation.ts +0 -65
  352. package/references/sessionlog/src/utils/worktree.ts +0 -58
  353. package/references/sessionlog/src/wire-types.ts +0 -59
  354. package/references/sessionlog/templates/setup-env.sh +0 -153
  355. package/references/sessionlog/tsconfig.json +0 -18
  356. package/references/sessionlog/vitest.config.ts +0 -12
  357. package/references/skill-tree/.claude/settings.json +0 -6
  358. package/references/skill-tree/.sudocode/issues.jsonl +0 -19
  359. package/references/skill-tree/.sudocode/specs.jsonl +0 -3
  360. package/references/skill-tree/CLAUDE.md +0 -126
  361. package/references/skill-tree/README.md +0 -372
  362. package/references/skill-tree/docs/GAPS_v1.md +0 -221
  363. package/references/skill-tree/docs/INTEGRATION_PLAN.md +0 -467
  364. package/references/skill-tree/docs/TODOS.md +0 -91
  365. package/references/skill-tree/docs/anthropic_skill_guide.md +0 -1364
  366. package/references/skill-tree/docs/design/federated-skill-trees.md +0 -524
  367. package/references/skill-tree/docs/design/multi-agent-sync.md +0 -759
  368. package/references/skill-tree/docs/scraper/BRAINSTORM.md +0 -583
  369. package/references/skill-tree/docs/scraper/POC_PLAN.md +0 -420
  370. package/references/skill-tree/docs/scraper/README.md +0 -170
  371. package/references/skill-tree/examples/basic-usage.ts +0 -164
  372. package/references/skill-tree/package-lock.json +0 -1852
  373. package/references/skill-tree/package.json +0 -66
  374. package/references/skill-tree/scraper/README.md +0 -123
  375. package/references/skill-tree/scraper/docs/DESIGN.md +0 -683
  376. package/references/skill-tree/scraper/docs/PLAN.md +0 -336
  377. package/references/skill-tree/scraper/drizzle.config.ts +0 -10
  378. package/references/skill-tree/scraper/package-lock.json +0 -6329
  379. package/references/skill-tree/scraper/package.json +0 -68
  380. package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-description.md +0 -7
  381. package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-name.md +0 -7
  382. package/references/skill-tree/scraper/test/fixtures/minimal-skill/SKILL.md +0 -27
  383. package/references/skill-tree/scraper/test/fixtures/skill-json/SKILL.json +0 -21
  384. package/references/skill-tree/scraper/test/fixtures/skill-with-meta/SKILL.md +0 -54
  385. package/references/skill-tree/scraper/test/fixtures/skill-with-meta/_meta.json +0 -24
  386. package/references/skill-tree/scraper/test/fixtures/valid-skill/SKILL.md +0 -93
  387. package/references/skill-tree/scraper/test/fixtures/valid-skill/_meta.json +0 -22
  388. package/references/skill-tree/scraper/tsup.config.ts +0 -14
  389. package/references/skill-tree/scraper/vitest.config.ts +0 -17
  390. package/references/skill-tree/scripts/convert-to-vitest.ts +0 -166
  391. package/references/skill-tree/skills/skill-writer/SKILL.md +0 -339
  392. package/references/skill-tree/skills/skill-writer/references/examples.md +0 -326
  393. package/references/skill-tree/skills/skill-writer/references/patterns.md +0 -210
  394. package/references/skill-tree/skills/skill-writer/references/quality-checklist.md +0 -123
  395. package/references/skill-tree/test/run-all.ts +0 -106
  396. package/references/skill-tree/test/utils.ts +0 -128
  397. package/references/skill-tree/vitest.config.ts +0 -16
@@ -0,0 +1,54 @@
1
+ {
2
+ "name": "learnings-research",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 3,
7
+ "applicability": {
8
+ "situations": [
9
+ "Looking up institutional knowledge before starting work",
10
+ "Finding past solutions for similar problems during debugging",
11
+ "Preventing repeated mistakes by surfacing known patterns and gotchas"
12
+ ],
13
+ "triggers": [
14
+ "search knowledge",
15
+ "past solutions",
16
+ "known issues",
17
+ "institutional knowledge",
18
+ "what do we know about"
19
+ ],
20
+ "antiPatterns": [
21
+ "Searching for information that doesn't exist in the knowledge base yet",
22
+ "Searching full document text as the first step instead of grep-first filtering on frontmatter fields",
23
+ "Reading all files sequentially instead of parallel keyword search"
24
+ ],
25
+ "domains": ["knowledge-management", "research", "debugging"]
26
+ },
27
+ "guidance": {
28
+ "strategy": "Grep-first filtering: extract keywords, narrow by category, run parallel content searches on frontmatter fields, then read only strong/moderate matches. Never read all files — always pre-filter.",
29
+ "tactics": [
30
+ "Extract keywords from the current task/problem description",
31
+ "Category narrowing (if clear): focus on the relevant knowledge subdirectory first",
32
+ "Parallel content-search: search on frontmatter fields (title, tags, module, component) using multiple keywords in parallel; use case-insensitive matching; use OR for synonyms",
33
+ "Score matches into four categories: Strong (module + tags match), Moderate (problem_type relevant + tags), Weak (tangential), None — only read Strong and Moderate",
34
+ "Always check critical-patterns document regardless of grep results — it contains must-know patterns for all work",
35
+ "Distill summaries from matched documents — surface actionable insights, not raw content",
36
+ "Assess overlap on 5 dimensions: problem statement, root cause, solution, referenced files, prevention rules",
37
+ "Run multiple searches in parallel — never sequentially"
38
+ ]
39
+ },
40
+ "verification": {
41
+ "successIndicators": [
42
+ "Relevant documents found and ranked by relevance strength",
43
+ "Critical patterns checked and incorporated",
44
+ "Summaries are distilled and actionable (not raw file dumps)",
45
+ "Search used grep-first filtering, not sequential file reading"
46
+ ],
47
+ "failureIndicators": [
48
+ "All files read sequentially instead of pre-filtered",
49
+ "Tangentially related entries included, adding noise",
50
+ "Critical patterns document skipped",
51
+ "Searches run sequentially instead of in parallel"
52
+ ]
53
+ }
54
+ }
@@ -0,0 +1,49 @@
1
+ {
2
+ "name": "maintainability-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 3,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code for long-term carrying cost and maintainability",
10
+ "Evaluating abstractions, indirection, and naming clarity",
11
+ "Checking for dead code, unnecessary coupling, and premature complexity"
12
+ ],
13
+ "triggers": [
14
+ "code review",
15
+ "maintainability",
16
+ "complexity",
17
+ "refactoring"
18
+ ],
19
+ "antiPatterns": [
20
+ "Reviewing for correctness bugs — use correctness review instead",
21
+ "Style preferences that don't affect comprehension",
22
+ "Debating naming conventions already established in the codebase"
23
+ ],
24
+ "domains": ["code-review", "maintainability", "quality-assurance"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "Apply the future developer lens: will the next person who touches this in 6 months understand it quickly? Every abstraction must earn its keep with 3+ implementations or proven variation.",
28
+ "tactics": [
29
+ "Hunt for: premature abstraction (interface/factory with one user), unnecessary indirection (>2 delegation levels), dead code (commented-out, unused exports, unreachable), coupling between unrelated modules, naming that obscures intent",
30
+ "Anti-pattern catalog: generic solution for specific problem, wrapper with no added value, config for unchanging values, unused extension points, circular dependencies, shared mutable state",
31
+ "Abstractions must earn their keep: 3+ implementations or proven variation axis — otherwise inline",
32
+ "Indirection must add clear value: if a function just delegates to another without transformation, it's overhead",
33
+ "Naming describes what, not how: booleans have is/has/should prefixes; functions describe outcome not mechanism",
34
+ "Confidence calibration: HIGH (0.80+) when objectively provable (abstraction has 1 user visible in codebase); MODERATE (0.60-0.79) for naming/abstraction boundary judgments; suppress below 0.60 for style preferences"
35
+ ]
36
+ },
37
+ "verification": {
38
+ "successIndicators": [
39
+ "All flagged abstractions are objectively underused (provable from codebase search)",
40
+ "Indirection findings show concrete delegation chain with no value-add",
41
+ "Dead code findings are verifiable via search (no callers/importers)"
42
+ ],
43
+ "failureIndicators": [
44
+ "Finding is really a style preference, not a maintainability concern",
45
+ "Abstraction flagged as premature but actually has 3+ users",
46
+ "Naming critique is subjective rather than clarity-impacting"
47
+ ]
48
+ }
49
+ }
@@ -0,0 +1,54 @@
1
+ {
2
+ "name": "performance-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code that touches database queries, loops, caching, or I/O-intensive paths",
10
+ "Evaluating scalability of new features at 10x/100x/1000x current data volumes",
11
+ "Checking for production-observable performance regressions"
12
+ ],
13
+ "triggers": [
14
+ "performance review",
15
+ "N+1 query",
16
+ "slow query",
17
+ "memory leak",
18
+ "pagination",
19
+ "caching"
20
+ ],
21
+ "antiPatterns": [
22
+ "Micro-optimizations in cold paths (startup, migrations, admin tools, one-time initialization)",
23
+ "Premature caching suggestions without evidence of actual slowness",
24
+ "Theoretical scale issues in MVP/prototype code",
25
+ "Style-based performance opinions (for vs forEach, Map vs plain object)"
26
+ ],
27
+ "domains": ["code-review", "performance", "quality-assurance"]
28
+ },
29
+ "guidance": {
30
+ "strategy": "Read code through the lens of 'what happens when this runs 10,000 times' or 'when the table has a million rows'. Focus on measurable, production-observable problems — not theoretical micro-optimizations. Project performance at 10x, 100x, and 1000x current volumes.",
31
+ "tactics": [
32
+ "N+1 queries: flag database queries inside loops that should be batched or eager-loaded; count loop iterations against expected data size",
33
+ "Unbounded memory: flag loading entire tables without pagination, caches without eviction policies, string concatenation in loops, large object allocations",
34
+ "Missing pagination: flag endpoints returning all results without limit/offset/cursor/streaming",
35
+ "Hot-path allocations: flag object creation, regex compilation, or expensive computation inside loops or per-request paths",
36
+ "Blocking I/O in async: flag synchronous file reads, blocking HTTP calls, CPU-intensive computation on the event loop",
37
+ "Algorithmic complexity: flag O(n^2) or worse without justification; verify all database queries use appropriate indexes",
38
+ "Performance benchmarks: API responses under 200ms for standard operations, bundle size increases under 5KB per feature, background jobs process in batches",
39
+ "Confidence calibration: HIGH (0.80+) when impact is provable from code (N+1 clearly in loop, unbounded query on large table); MODERATE (0.60-0.79) when pattern present but impact depends on unconfirmed data size; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Each finding identifies a specific code path with measurable impact at expected scale",
45
+ "N+1 findings show the loop and the query inside it",
46
+ "No micro-optimization findings on cold paths"
47
+ ],
48
+ "failureIndicators": [
49
+ "Finding is speculative optimization without evidence of hot path",
50
+ "Caching recommendation without evidence of repeated expensive computation",
51
+ "Flagging cold-path code (startup, migrations) for performance"
52
+ ]
53
+ }
54
+ }
@@ -0,0 +1,56 @@
1
+ {
2
+ "name": "plan-adversarial-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 5,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing implementation plans or requirement documents before execution",
10
+ "Stress-testing planning assumptions, premises, and scope decisions",
11
+ "Catching contradictions, scope creep, and unstated assumptions in plans"
12
+ ],
13
+ "triggers": [
14
+ "review plan",
15
+ "plan review",
16
+ "challenge assumptions",
17
+ "scope review",
18
+ "requirements review"
19
+ ],
20
+ "antiPatterns": [
21
+ "Implementation style or technology selection choices",
22
+ "Product strategy or priority preferences",
23
+ "Security, design, or feasibility concerns (use plan-feasibility-review instead)",
24
+ "The plan is already in execution — too late for adversarial review"
25
+ ],
26
+ "domains": ["planning", "requirements", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Challenge premises before solutions. Surface unstated assumptions. Stress-test decisions for reversal cost. Check for internal contradictions and scope-goal misalignment. Apply three lenses: adversarial (break assumptions), coherence (internal consistency), and scope guardian (right-sized).",
30
+ "tactics": [
31
+ "Premise challenging: Is this the right problem? Does the solution match the problem? What if we did nothing? What would make this fail? Surface framing effects that bias toward one solution",
32
+ "Assumption surfacing: identify environmental assumptions (infrastructure exists, APIs stable), user behavior assumptions (adoption, usage patterns), scale assumptions (data volume, concurrency), temporal assumptions (availability, ordering)",
33
+ "Decision stress-testing: for each major decision, apply falsification test (what evidence would prove this wrong?), reversal cost (how expensive to change later?), and decision-scope mismatch (is decision bigger/smaller than the problem?)",
34
+ "Simplification pressure: audit abstractions (how many consumers?), find minimum viable version, apply subtraction test (remove each component — does plan still work?), enforce complexity budget",
35
+ "Coherence checking: catch contradictions between sections, terminology drift (same concept with different names), forward references to undefined terms, ungrouped requirements spanning multiple concerns",
36
+ "Scope-goal alignment: flag scope exceeding goals (building more than needed), goals exceeding scope (promising more than plan delivers), new abstractions with one implementation, framework-ahead-of-need, configuration without consumers",
37
+ "Alternative blindness: check for omitted alternatives, build-vs-use analysis, do-nothing baseline comparison",
38
+ "Depth calibration: Quick (short docs, <5 requirements) = max 3 findings; Standard = proportional to decision density; Deep (>10 requirements, high-stakes) = multiple passes with assumption chain tracing",
39
+ "Confidence calibration: HIGH (0.80+) when specific text can be quoted showing gap; MODERATE (0.60-0.79) when gap likely but requires context not in document; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Findings quote specific text from the plan showing the gap or contradiction",
45
+ "Assumptions surfaced are testable and actionable",
46
+ "Scope-goal alignment checked with concrete evidence",
47
+ "No findings that belong to feasibility, security, or design review"
48
+ ],
49
+ "failureIndicators": [
50
+ "Findings are vague concerns without quoting specific plan text",
51
+ "Assumptions identified are untestable or irrelevant",
52
+ "Scope opinions based on preference rather than goal alignment",
53
+ "Contradictions flagged that are reconcilable with charitable reading"
54
+ ]
55
+ }
56
+ }
@@ -0,0 +1,56 @@
1
+ {
2
+ "name": "plan-feasibility-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 5,
7
+ "applicability": {
8
+ "situations": [
9
+ "Evaluating technical feasibility of implementation plans",
10
+ "Checking product-market fit and strategic alignment of proposed features",
11
+ "Reviewing plans for security gaps, design completeness, and migration safety"
12
+ ],
13
+ "triggers": [
14
+ "feasibility review",
15
+ "plan feasibility",
16
+ "technical review",
17
+ "can we build this",
18
+ "is this plan viable"
19
+ ],
20
+ "antiPatterns": [
21
+ "Implementation style choices that don't affect feasibility",
22
+ "Code organization preferences",
23
+ "Theoretical scalability without evidence",
24
+ "Scope or assumption concerns (use plan-adversarial-review instead)"
25
+ ],
26
+ "domains": ["planning", "architecture", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Evaluate plans across four dimensions: technical feasibility (can we build it?), product fit (should we build it?), security readiness (is it safe?), and design completeness (is it specified enough?). Each dimension has a distinct lens.",
30
+ "tactics": [
31
+ "Technical feasibility: verify plan acknowledges existing code/services/infrastructure; check for architecture conflicts with current stack; validate that referenced file paths and interfaces actually exist; check framework compatibility",
32
+ "Shadow path tracing: for each feature, trace the happy path, nil/empty input path, error path, and concurrent access path — plans that only cover happy path will fail in implementation",
33
+ "Migration safety: verify concrete migration path (not 'migrate later'), backward compatibility during rollout, rollback strategy, data volume estimates, and operation ordering",
34
+ "Product lens: challenge the premise — is this the right problem? What's the actual outcome? What happens if we do nothing? Is there an 80% value at 20% cost alternative? Check goal-requirement alignment (orphan requirements, unserved goals)",
35
+ "Security lens: inventory attack surfaces (endpoints, data stores, integrations, user inputs), check auth/authz per endpoint, identify sensitive data flows, assess third-party trust boundaries, outline top-3 threat model (most likely, highest impact, most subtle exploit)",
36
+ "Design completeness: check interaction state coverage (loading, empty, error, success, partial for every interactive element), user flow completeness (entry points, happy path, 2-3 edge cases, exit points), responsive/accessibility considerations",
37
+ "Dependency analysis: verify external dependencies are available and compatible; identify implicit assumptions about infrastructure, APIs, or services",
38
+ "Performance feasibility: back-of-envelope math for expected load, data volumes, and response time requirements",
39
+ "Confidence calibration: HIGH (0.80+) when specific technical constraint blocks the approach; MODERATE (0.60-0.79) when constraint likely but depends on implementation details; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Technical blockers identified with specific evidence (missing API, framework incompatibility)",
45
+ "Shadow paths traced — plan covers more than just the happy path",
46
+ "Security attack surfaces inventoried with mitigation gaps flagged",
47
+ "Product alignment verified — goals trace to requirements"
48
+ ],
49
+ "failureIndicators": [
50
+ "Feasibility concerns are vague without specific technical evidence",
51
+ "Only happy path evaluated — error/empty/concurrent paths ignored",
52
+ "Security review is generic OWASP checklist without plan-specific analysis",
53
+ "Product concerns are preference-based rather than goal-alignment-based"
54
+ ]
55
+ }
56
+ }
@@ -0,0 +1,52 @@
1
+ {
2
+ "name": "project-standards-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "simple",
6
+ "estimatedEffort": 2,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing changes for compliance with the project's own standards (CLAUDE.md, AGENTS.md, contributing guides)",
10
+ "Enforcing naming conventions, file placement, and configuration rules",
11
+ "Auditing changes against established project conventions"
12
+ ],
13
+ "triggers": [
14
+ "standards review",
15
+ "convention check",
16
+ "CLAUDE.md compliance",
17
+ "project rules"
18
+ ],
19
+ "antiPatterns": [
20
+ "Rules that don't apply to the changed file type",
21
+ "Violations already caught by automated linters or CI",
22
+ "Pre-existing violations in unchanged code",
23
+ "Generic best practices not documented in the project's standards files",
24
+ "Opinions about quality of the standards themselves"
25
+ ],
26
+ "domains": ["code-review", "standards", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Audit changes against the project's own documented standards. Every finding must cite a specific rule from the standards file AND a specific violation in the diff. Without both, drop the finding.",
30
+ "tactics": [
31
+ "Discover standards: read CLAUDE.md, AGENTS.md, and any contributing/convention files in the changed file's ancestor directories",
32
+ "Match rules to file types: only apply rules relevant to the specific files being changed",
33
+ "Evidence requirement: for each finding, provide (1) exact quote/section from standards file defining the rule, and (2) specific line(s) in diff violating the rule",
34
+ "Common violations: missing required frontmatter fields, names not matching directory/file names, wrong reference inclusion mode, shell commands where native tools are required, misplaced files in wrong directories",
35
+ "Language violations: second-person 'you should' where standards require imperative form, hedge words (might/could/consider) leaving behavior undefined",
36
+ "Protected artifacts: never flag documented protected paths (docs/, plans/, solutions/) for deletion",
37
+ "Confidence calibration: HIGH (0.80+) when specific rule quote and specific diff violation are both identifiable; MODERATE (0.60-0.79) when rule exists but applying it requires judgment; suppress below 0.60"
38
+ ]
39
+ },
40
+ "verification": {
41
+ "successIndicators": [
42
+ "Every finding cites both the rule source and the specific violation",
43
+ "Only rules from the project's actual standards files are enforced",
44
+ "No findings about unchanged code or generic best practices"
45
+ ],
46
+ "failureIndicators": [
47
+ "Finding enforces a rule not documented in any standards file",
48
+ "Finding about pre-existing code that wasn't changed in this diff",
49
+ "Generic best practice advice without project-specific rule citation"
50
+ ]
51
+ }
52
+ }
@@ -0,0 +1,53 @@
1
+ {
2
+ "name": "reliability-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code with external dependencies, I/O boundaries, or error handling",
10
+ "Evaluating failure modes, retry logic, and cascading failure paths",
11
+ "Checking resilience of services that depend on other services"
12
+ ],
13
+ "triggers": [
14
+ "reliability review",
15
+ "error handling",
16
+ "retry",
17
+ "timeout",
18
+ "circuit breaker",
19
+ "cascade failure"
20
+ ],
21
+ "antiPatterns": [
22
+ "Flagging internal pure functions that cannot fail (string formatting, math, in-memory transforms)",
23
+ "Test helper error handling",
24
+ "Error message formatting choices",
25
+ "Theoretical cascading failures without traceable evidence"
26
+ ],
27
+ "domains": ["code-review", "reliability", "quality-assurance"]
28
+ },
29
+ "guidance": {
30
+ "strategy": "Ask 'what happens when this dependency is down?' for every external call. Think about partial failures, retry storms, and cascading timeouts. Read code by assuming the environment can be hostile.",
31
+ "tactics": [
32
+ "Missing error handling on I/O boundaries: flag HTTP calls, database queries, file operations, and message queue interactions without try/catch or error callbacks",
33
+ "Retry loops without backoff/limits: immediate indefinite retries create retry storms — require exponential backoff and max attempt limits",
34
+ "Missing timeouts on external calls: HTTP clients, database connections, and RPC without explicit timeouts can hang indefinitely and exhaust connection pools",
35
+ "Error swallowing: flag catch blocks that ignore errors, silent failures that return misleading defaults, and error handlers that don't log or propagate",
36
+ "Cascading failure paths: trace how failure in service A causes B to retry aggressively, overloading C; how slow dependencies fill request queues causing health check failures, restarts, and cold-start storms",
37
+ "Recovery-induced failures: retries creating duplicates, rollbacks leaving orphaned state, circuit breakers preventing legitimate recovery",
38
+ "Confidence calibration: HIGH (0.80+) when reliability gap is directly visible (HTTP call without timeout, retry without max attempts, catch swallowing error); MODERATE (0.60-0.79) when code lacks protection but framework defaults might handle it; suppress below 0.60"
39
+ ]
40
+ },
41
+ "verification": {
42
+ "successIndicators": [
43
+ "Each finding points to a specific I/O boundary without protection",
44
+ "Retry findings show the loop and its missing backoff/limit",
45
+ "Cascade findings trace the multi-service failure chain"
46
+ ],
47
+ "failureIndicators": [
48
+ "Flagging pure functions or in-memory operations for error handling",
49
+ "Overlooking that framework middleware already handles the concern",
50
+ "Architectural concerns that can't be confirmed from the diff"
51
+ ]
52
+ }
53
+ }
@@ -0,0 +1,64 @@
1
+ {
2
+ "name": "review-orchestration",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 8,
7
+ "applicability": {
8
+ "situations": [
9
+ "Code review before creating a PR",
10
+ "Reviewing changes after completing a task during iterative implementation",
11
+ "Structured multi-persona code review for quality assurance"
12
+ ],
13
+ "triggers": [
14
+ "review code",
15
+ "code review",
16
+ "check changes",
17
+ "pre-PR review"
18
+ ],
19
+ "antiPatterns": [
20
+ "Reviewing trivial formatting-only changes",
21
+ "Reviewing auto-generated code that will be regenerated",
22
+ "Single-line config changes that don't affect behavior"
23
+ ],
24
+ "domains": ["code-review", "quality-assurance", "software-engineering"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "Deploy tiered reviewer personas in parallel, then merge and deduplicate findings. Always-on reviewers run on every review; conditional reviewers are selected based on the diff content.",
28
+ "tactics": [
29
+ "Always-on reviewers: correctness (logic bugs), testing (coverage gaps), maintainability (coupling/complexity), project-standards (convention compliance), agent-native (action/context parity), learnings-researcher (institutional knowledge)",
30
+ "Conditional reviewers selected per-diff: security (auth/injection), performance (N+1/memory), API-contract (breaking changes), data-migrations (schema safety), reliability (error handling), adversarial (edge cases), stack-specific language reviewers",
31
+ "Each reviewer returns structured findings with severity (P0-P3), confidence (0.0-1.0), and autofix_class (safe_auto/gated_auto/manual/advisory)",
32
+ "Suppress all findings below 0.60 confidence to prevent noise",
33
+ "Merge/deduplicate findings by fingerprint: (file + line_bucket (+/- 3 lines) + normalized_title). On conflict, keep the highest severity and the highest confidence",
34
+ "Route actions by class: safe_auto findings get auto-fixed; gated_auto/manual findings go to human review; advisory findings are informational only",
35
+ "Maximum 2 rounds of autofix to prevent loops"
36
+ ],
37
+ "steps": [
38
+ "1. Detect scope of changes (files, languages, domains affected)",
39
+ "2. Discover intent from commit messages, PR description, or task context",
40
+ "3. Select conditional reviewers based on scope (security for auth files, performance for queries, etc.)",
41
+ "4. Dispatch all selected reviewers in parallel — each reads the diff independently",
42
+ "5. Collect structured JSON findings from all reviewers",
43
+ "6. Merge findings: deduplicate by fingerprint, resolve severity conflicts conservatively",
44
+ "7. Synthesize final report with verdict: Ready / Ready with fixes / Not ready"
45
+ ]
46
+ },
47
+ "verification": {
48
+ "successIndicators": [
49
+ "All P0 findings are genuine breakage traceable to specific code paths",
50
+ "Line numbers point to exact buggy code, not nearby lines",
51
+ "Each finding is actionable with a clear fix path",
52
+ "No false positives from style issues that linters catch",
53
+ "Deduplication produces no redundant findings"
54
+ ],
55
+ "failureIndicators": [
56
+ "P0 findings that are actually style nits",
57
+ "False positives exceeding 20% of total findings",
58
+ "Same issue reported multiple times after deduplication",
59
+ "Findings that require runtime observation to confirm (not provable from code)",
60
+ "Protected artifacts (docs, plans, brainstorms) flagged for deletion"
61
+ ],
62
+ "rollbackStrategy": "Review findings are advisory — no code changes until human approval (except safe_auto in autofix mode)"
63
+ }
64
+ }
@@ -0,0 +1,54 @@
1
+ {
2
+ "name": "security-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code changes that touch auth, user input, public endpoints, or permissions",
10
+ "Auditing for exploitable vulnerabilities before deployment",
11
+ "Systematic OWASP Top 10 compliance checking"
12
+ ],
13
+ "triggers": [
14
+ "security review",
15
+ "auth",
16
+ "injection",
17
+ "XSS",
18
+ "CSRF",
19
+ "user input",
20
+ "public endpoint"
21
+ ],
22
+ "antiPatterns": [
23
+ "Defense-in-depth on already-protected code",
24
+ "Theoretical attacks requiring physical access",
25
+ "HTTP vs HTTPS in dev/test configs",
26
+ "Generic hardening advice without specific exploitable findings"
27
+ ],
28
+ "domains": ["code-review", "security", "quality-assurance"]
29
+ },
30
+ "guidance": {
31
+ "strategy": "Think like an attacker looking for one exploitable path through the code. Trace data from entry point to dangerous sink. Combine targeted attack-path analysis with systematic OWASP Top 10 coverage.",
32
+ "tactics": [
33
+ "Injection vectors: trace untrusted input to SQL queries, HTML output (XSS), shell commands, template engines, innerHTML/dangerouslySetInnerHTML — flag when no sanitization between entry and sink",
34
+ "Auth/authz bypasses: check for missing auth middleware, broken ownership checks (user A accessing user B's resources), privilege escalation, CSRF on state-changing endpoints",
35
+ "Secrets exposure: scan for hardcoded keys/tokens/passwords, sensitive data in error messages or logs, PII in responses without need-to-know filtering",
36
+ "Insecure deserialization: flag pickle, Marshal, unserialize, JSON.parse of executable content from untrusted sources",
37
+ "SSRF and path traversal: flag user-controlled URLs or file paths passed to fetch/open without allowlist validation",
38
+ "Systematic OWASP Top 10 check: input validation on all entry points (req.body, req.params, req.query), SQL parameterization, XSS escaping + CSP headers, auth on all endpoints, encryption for sensitive data at rest and in transit",
39
+ "Confidence calibration: HIGH (0.80+) when full attack path is traceable from untrusted input to dangerous sink without sanitization; MODERATE (0.60-0.79) when dangerous pattern present but exploitability unconfirmed; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Each finding traces a complete attack path: untrusted input → specific code path → exploitable outcome",
45
+ "No false positives from already-protected code or dev-only configs",
46
+ "OWASP categories systematically checked, not just obvious injection"
47
+ ],
48
+ "failureIndicators": [
49
+ "Finding requires physical access or internal-only network to exploit",
50
+ "Generic 'could be vulnerable' without tracing specific input to specific sink",
51
+ "Flagging defense-in-depth that's already behind validated auth"
52
+ ]
53
+ }
54
+ }
@@ -0,0 +1,64 @@
1
+ {
2
+ "name": "systematic-execution",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 10,
7
+ "applicability": {
8
+ "situations": [
9
+ "Executing an implementation plan systematically",
10
+ "Shipping a feature with testing, review, and quality gates",
11
+ "Multi-unit implementation requiring incremental progress and verification"
12
+ ],
13
+ "triggers": [
14
+ "execute plan",
15
+ "start work",
16
+ "implement this",
17
+ "ship feature"
18
+ ],
19
+ "antiPatterns": [
20
+ "No plan exists — create one first",
21
+ "Exploratory work where requirements aren't defined",
22
+ "Hotfix that needs to ship immediately without full process"
23
+ ],
24
+ "domains": ["execution", "implementation", "software-engineering"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "Treat the plan as a decision artifact, not an instruction script. Execute implementation units in dependency order, testing continuously, with incremental commits after each logical unit. Simplify after every 2-3 units.",
28
+ "tactics": [
29
+ "Read plan's Implementation Units; honor execution posture (test-first, characterization-first) when annotated; check 'Deferred to Implementation' questions before starting",
30
+ "Strategy selection by scale: inline (1-2 small tasks), serial subagents (3+ with dependencies), parallel subagents (3+ independent), swarm (10+ with coordination)",
31
+ "Test as you go, not at end: run tests after each significant change; never batch testing to the end",
32
+ "System-wide test check before marking task done: trace callbacks/middleware/observers two levels out; write integration tests with real objects through full chain; verify failure doesn't leave orphaned state; check if other interfaces expose same behavior",
33
+ "Incremental commits after each complete logical unit — messages describe complete valuable changes, not WIP",
34
+ "Simplify after every 2-3 units: review changed files for consolidation opportunities, dead code, naming improvements",
35
+ "Pattern following discipline: read referenced files from plan before implementing — don't invent new conventions",
36
+ "Feature completeness first: don't move to next feature until current one ships"
37
+ ],
38
+ "steps": [
39
+ "1. Read plan, clarify any ambiguities, set up environment",
40
+ "2. Create task tracking for all implementation units",
41
+ "3. Execute units in dependency order: implement → test → verify → commit",
42
+ "4. After every 2-3 units, review for simplification opportunities",
43
+ "5. Run quality checks: tests pass, linting passes, code follows existing patterns",
44
+ "6. Prepare PR: summary (what/why/decisions), testing notes, post-deploy monitoring plan",
45
+ "7. Update plan status"
46
+ ]
47
+ },
48
+ "verification": {
49
+ "successIndicators": [
50
+ "All implementation units completed and tested",
51
+ "Tests pass and linting passes",
52
+ "Code follows existing patterns — no new conventions invented",
53
+ "Each commit describes a complete valuable change",
54
+ "PR includes post-deploy monitoring plan with concrete metrics"
55
+ ],
56
+ "failureIndicators": [
57
+ "Testing batched to the end, so issues were found late",
58
+ "New conventions invented instead of following existing patterns",
59
+ "Commits contain WIP or incomplete changes",
60
+ "Moved on to the next feature before the current one fully shipped",
61
+ "System-wide test check skipped for code with callbacks or error handling"
62
+ ]
63
+ }
64
+ }
@@ -0,0 +1,50 @@
1
+ {
2
+ "name": "testing-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 3,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing test quality and coverage for code changes",
10
+ "Evaluating whether tests prove code works or provide false confidence",
11
+ "Checking for untested branches, weak assertions, and missing error paths"
12
+ ],
13
+ "triggers": [
14
+ "code review",
15
+ "test coverage",
16
+ "test quality",
17
+ "missing tests"
18
+ ],
19
+ "antiPatterns": [
20
+ "Reviewing test infrastructure or test framework setup",
21
+ "Evaluating test performance or execution speed",
22
+ "Coverage percentage targets without considering test quality"
23
+ ],
24
+ "domains": ["code-review", "testing", "quality-assurance"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "For every new branch (if/else/switch/try/catch) in the diff, verify at least one test exercises it. Focus on whether tests prove behavior, not just that code doesn't throw.",
28
+ "tactics": [
29
+ "Hunt for: untested branches (new if/else/switch/try/catch), tests that don't assert behavior (only assert 'doesn't throw'), implementation-coupled brittle tests (assert on mocks, test private methods, snapshot internals), missing error path coverage",
30
+ "Branch coverage discipline: each new branch must have at least one test; trace all paths through the new code",
31
+ "Behavior assertion rigor: assert specific values not just truthiness; verify both happy path AND sad path",
32
+ "Check that error paths are tested: catch blocks, fallback branches, error returns should have dedicated tests",
33
+ "Flag implementation-coupled tests: tests that break when refactoring without behavior change are brittle",
34
+ "Confidence calibration: HIGH (0.80+) when test gap is provable from diff (new branch, no test); MODERATE (0.60-0.79) when inferred from structure (parser.ts with no parser.test.ts); suppress below 0.60 when coverage may exist in integration tests"
35
+ ]
36
+ },
37
+ "verification": {
38
+ "successIndicators": [
39
+ "All new branches have corresponding test cases",
40
+ "Tests assert actual behavior with specific expected values",
41
+ "Error paths have dedicated tests, not just happy path",
42
+ "No implementation-coupled brittleness identified"
43
+ ],
44
+ "failureIndicators": [
45
+ "New branches found without any test coverage",
46
+ "Tests only assert 'doesn't throw' or truthiness without checking values",
47
+ "Error handling code has no test exercising the error path"
48
+ ]
49
+ }
50
+ }