cognitive-core 0.2.1 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (331)
  1. package/dist/atlas.d.ts +10 -0
  2. package/dist/atlas.d.ts.map +1 -1
  3. package/dist/atlas.js +65 -0
  4. package/dist/atlas.js.map +1 -1
  5. package/dist/learning/pipeline.d.ts +4 -31
  6. package/dist/learning/pipeline.d.ts.map +1 -1
  7. package/dist/learning/pipeline.js +12 -64
  8. package/dist/learning/pipeline.js.map +1 -1
  9. package/dist/memory/curated-loader.d.ts +21 -4
  10. package/dist/memory/curated-loader.d.ts.map +1 -1
  11. package/dist/memory/curated-loader.js +53 -16
  12. package/dist/memory/curated-loader.js.map +1 -1
  13. package/dist/memory/index.d.ts +2 -1
  14. package/dist/memory/index.d.ts.map +1 -1
  15. package/dist/memory/index.js +3 -1
  16. package/dist/memory/index.js.map +1 -1
  17. package/dist/memory/playbook.d.ts +6 -0
  18. package/dist/memory/playbook.d.ts.map +1 -1
  19. package/dist/memory/playbook.js +15 -0
  20. package/dist/memory/playbook.js.map +1 -1
  21. package/dist/memory/source-resolver.d.ts +120 -0
  22. package/dist/memory/source-resolver.d.ts.map +1 -0
  23. package/dist/memory/source-resolver.js +300 -0
  24. package/dist/memory/source-resolver.js.map +1 -0
  25. package/dist/types/config.d.ts +141 -0
  26. package/dist/types/config.d.ts.map +1 -1
  27. package/dist/types/config.js +40 -0
  28. package/dist/types/config.js.map +1 -1
  29. package/dist/types/index.d.ts +1 -1
  30. package/dist/types/index.d.ts.map +1 -1
  31. package/dist/types/index.js +1 -1
  32. package/dist/types/index.js.map +1 -1
  33. package/dist/workspace/types.d.ts +12 -54
  34. package/dist/workspace/types.d.ts.map +1 -1
  35. package/dist/workspace/types.js.map +1 -1
  36. package/package.json +2 -2
  37. package/playbooks/compound-engineering/adversarial-review.json +51 -0
  38. package/playbooks/compound-engineering/agent-native-architecture.json +59 -0
  39. package/playbooks/compound-engineering/agent-native-review.json +54 -0
  40. package/playbooks/compound-engineering/api-contract-review.json +52 -0
  41. package/playbooks/compound-engineering/brainstorm-requirements.json +55 -0
  42. package/playbooks/compound-engineering/bug-reproduction.json +62 -0
  43. package/playbooks/compound-engineering/confidence-calibration.json +49 -0
  44. package/playbooks/compound-engineering/correctness-review.json +49 -0
  45. package/playbooks/compound-engineering/data-migration-safety.json +59 -0
  46. package/playbooks/compound-engineering/deployment-verification.json +63 -0
  47. package/playbooks/compound-engineering/error-recovery-patterns.json +53 -0
  48. package/playbooks/compound-engineering/implementation-planning.json +64 -0
  49. package/playbooks/compound-engineering/issue-pattern-analysis.json +53 -0
  50. package/playbooks/compound-engineering/knowledge-compounding.json +63 -0
  51. package/playbooks/compound-engineering/learnings-research.json +54 -0
  52. package/playbooks/compound-engineering/maintainability-review.json +49 -0
  53. package/playbooks/compound-engineering/performance-review.json +54 -0
  54. package/playbooks/compound-engineering/plan-adversarial-review.json +56 -0
  55. package/playbooks/compound-engineering/plan-feasibility-review.json +56 -0
  56. package/playbooks/compound-engineering/project-standards-review.json +52 -0
  57. package/playbooks/compound-engineering/reliability-review.json +53 -0
  58. package/playbooks/compound-engineering/review-orchestration.json +64 -0
  59. package/playbooks/compound-engineering/security-review.json +54 -0
  60. package/playbooks/compound-engineering/systematic-execution.json +64 -0
  61. package/playbooks/compound-engineering/testing-review.json +50 -0
  62. package/src/atlas.ts +96 -0
  63. package/src/memory/curated-loader.ts +69 -16
  64. package/src/memory/index.ts +16 -0
  65. package/src/memory/playbook.ts +19 -0
  66. package/src/memory/source-resolver.ts +422 -0
  67. package/src/types/config.ts +46 -0
  68. package/src/types/index.ts +4 -0
  69. package/src/workspace/types.ts +22 -78
  70. package/tests/integration/curated-sources-e2e.test.ts +502 -0
  71. package/tests/memory/compound-engineering-seed.test.ts +338 -0
  72. package/tests/memory/curated-loader-extended.test.ts +225 -0
  73. package/tests/memory/playbook-quality-validation.test.ts +430 -0
  74. package/tests/memory/source-resolver.test.ts +700 -0
  75. package/.claude/settings.local.json +0 -11
  76. package/dist/learning/llm-extractor.d.ts +0 -88
  77. package/dist/learning/llm-extractor.d.ts.map +0 -1
  78. package/dist/learning/llm-extractor.js +0 -372
  79. package/dist/learning/llm-extractor.js.map +0 -1
  80. package/dist/learning/loop-coordinator.d.ts +0 -61
  81. package/dist/learning/loop-coordinator.d.ts.map +0 -1
  82. package/dist/learning/loop-coordinator.js +0 -96
  83. package/dist/learning/loop-coordinator.js.map +0 -1
  84. package/references/agent-workspace/CLAUDE.md +0 -74
  85. package/references/agent-workspace/README.md +0 -587
  86. package/references/agent-workspace/media/banner.png +0 -0
  87. package/references/agent-workspace/package-lock.json +0 -2061
  88. package/references/agent-workspace/package.json +0 -54
  89. package/references/agent-workspace/src/handle.ts +0 -122
  90. package/references/agent-workspace/src/index.ts +0 -32
  91. package/references/agent-workspace/src/manager.ts +0 -102
  92. package/references/agent-workspace/src/readers/json.ts +0 -71
  93. package/references/agent-workspace/src/readers/markdown.ts +0 -37
  94. package/references/agent-workspace/src/readers/raw.ts +0 -27
  95. package/references/agent-workspace/src/types.ts +0 -68
  96. package/references/agent-workspace/src/validation.ts +0 -93
  97. package/references/agent-workspace/src/writers/json.ts +0 -17
  98. package/references/agent-workspace/src/writers/markdown.ts +0 -27
  99. package/references/agent-workspace/src/writers/raw.ts +0 -22
  100. package/references/agent-workspace/tests/errors.test.ts +0 -652
  101. package/references/agent-workspace/tests/handle.test.ts +0 -144
  102. package/references/agent-workspace/tests/manager.test.ts +0 -124
  103. package/references/agent-workspace/tests/readers.test.ts +0 -205
  104. package/references/agent-workspace/tests/validation.test.ts +0 -196
  105. package/references/agent-workspace/tests/writers.test.ts +0 -108
  106. package/references/agent-workspace/tsconfig.json +0 -20
  107. package/references/agent-workspace/tsup.config.ts +0 -9
  108. package/references/minimem/.claude/settings.json +0 -7
  109. package/references/minimem/.sudocode/issues.jsonl +0 -18
  110. package/references/minimem/.sudocode/specs.jsonl +0 -1
  111. package/references/minimem/CLAUDE.md +0 -310
  112. package/references/minimem/README.md +0 -556
  113. package/references/minimem/claude-plugin/.claude-plugin/plugin.json +0 -10
  114. package/references/minimem/claude-plugin/.mcp.json +0 -7
  115. package/references/minimem/claude-plugin/README.md +0 -158
  116. package/references/minimem/claude-plugin/commands/recall.md +0 -47
  117. package/references/minimem/claude-plugin/commands/remember.md +0 -41
  118. package/references/minimem/claude-plugin/hooks/__tests__/hooks.test.ts +0 -272
  119. package/references/minimem/claude-plugin/hooks/hooks.json +0 -27
  120. package/references/minimem/claude-plugin/hooks/session-end.sh +0 -86
  121. package/references/minimem/claude-plugin/hooks/session-start.sh +0 -85
  122. package/references/minimem/claude-plugin/skills/memory/SKILL.md +0 -108
  123. package/references/minimem/package-lock.json +0 -5373
  124. package/references/minimem/package.json +0 -60
  125. package/references/minimem/scripts/postbuild.js +0 -35
  126. package/references/minimem/src/__tests__/edge-cases.test.ts +0 -371
  127. package/references/minimem/src/__tests__/errors.test.ts +0 -265
  128. package/references/minimem/src/__tests__/helpers.ts +0 -199
  129. package/references/minimem/src/__tests__/internal.test.ts +0 -407
  130. package/references/minimem/src/__tests__/knowledge.test.ts +0 -287
  131. package/references/minimem/src/__tests__/minimem.integration.test.ts +0 -1127
  132. package/references/minimem/src/__tests__/session.test.ts +0 -190
  133. package/references/minimem/src/cli/__tests__/commands.test.ts +0 -759
  134. package/references/minimem/src/cli/commands/__tests__/conflicts.test.ts +0 -141
  135. package/references/minimem/src/cli/commands/append.ts +0 -76
  136. package/references/minimem/src/cli/commands/config.ts +0 -262
  137. package/references/minimem/src/cli/commands/conflicts.ts +0 -413
  138. package/references/minimem/src/cli/commands/daemon.ts +0 -169
  139. package/references/minimem/src/cli/commands/index.ts +0 -12
  140. package/references/minimem/src/cli/commands/init.ts +0 -88
  141. package/references/minimem/src/cli/commands/mcp.ts +0 -177
  142. package/references/minimem/src/cli/commands/push-pull.ts +0 -213
  143. package/references/minimem/src/cli/commands/search.ts +0 -158
  144. package/references/minimem/src/cli/commands/status.ts +0 -84
  145. package/references/minimem/src/cli/commands/sync-init.ts +0 -290
  146. package/references/minimem/src/cli/commands/sync.ts +0 -70
  147. package/references/minimem/src/cli/commands/upsert.ts +0 -197
  148. package/references/minimem/src/cli/config.ts +0 -584
  149. package/references/minimem/src/cli/index.ts +0 -264
  150. package/references/minimem/src/cli/shared.ts +0 -161
  151. package/references/minimem/src/cli/sync/__tests__/central.test.ts +0 -152
  152. package/references/minimem/src/cli/sync/__tests__/conflicts.test.ts +0 -209
  153. package/references/minimem/src/cli/sync/__tests__/daemon.test.ts +0 -118
  154. package/references/minimem/src/cli/sync/__tests__/detection.test.ts +0 -207
  155. package/references/minimem/src/cli/sync/__tests__/integration.test.ts +0 -476
  156. package/references/minimem/src/cli/sync/__tests__/registry.test.ts +0 -363
  157. package/references/minimem/src/cli/sync/__tests__/state.test.ts +0 -255
  158. package/references/minimem/src/cli/sync/__tests__/validation.test.ts +0 -193
  159. package/references/minimem/src/cli/sync/__tests__/watcher.test.ts +0 -178
  160. package/references/minimem/src/cli/sync/central.ts +0 -292
  161. package/references/minimem/src/cli/sync/conflicts.ts +0 -204
  162. package/references/minimem/src/cli/sync/daemon.ts +0 -407
  163. package/references/minimem/src/cli/sync/detection.ts +0 -138
  164. package/references/minimem/src/cli/sync/index.ts +0 -107
  165. package/references/minimem/src/cli/sync/operations.ts +0 -373
  166. package/references/minimem/src/cli/sync/registry.ts +0 -279
  167. package/references/minimem/src/cli/sync/state.ts +0 -355
  168. package/references/minimem/src/cli/sync/validation.ts +0 -206
  169. package/references/minimem/src/cli/sync/watcher.ts +0 -234
  170. package/references/minimem/src/cli/version.ts +0 -34
  171. package/references/minimem/src/core/index.ts +0 -9
  172. package/references/minimem/src/core/indexer.ts +0 -628
  173. package/references/minimem/src/core/searcher.ts +0 -221
  174. package/references/minimem/src/db/schema.ts +0 -183
  175. package/references/minimem/src/db/sqlite-vec.ts +0 -24
  176. package/references/minimem/src/embeddings/__tests__/embeddings.test.ts +0 -431
  177. package/references/minimem/src/embeddings/batch-gemini.ts +0 -392
  178. package/references/minimem/src/embeddings/batch-openai.ts +0 -409
  179. package/references/minimem/src/embeddings/embeddings.ts +0 -434
  180. package/references/minimem/src/index.ts +0 -109
  181. package/references/minimem/src/internal.ts +0 -299
  182. package/references/minimem/src/minimem.ts +0 -1276
  183. package/references/minimem/src/search/__tests__/hybrid.test.ts +0 -247
  184. package/references/minimem/src/search/graph.ts +0 -234
  185. package/references/minimem/src/search/hybrid.ts +0 -151
  186. package/references/minimem/src/search/search.ts +0 -256
  187. package/references/minimem/src/server/__tests__/mcp.test.ts +0 -341
  188. package/references/minimem/src/server/__tests__/tools.test.ts +0 -364
  189. package/references/minimem/src/server/mcp.ts +0 -326
  190. package/references/minimem/src/server/tools.ts +0 -720
  191. package/references/minimem/src/session.ts +0 -460
  192. package/references/minimem/tsconfig.json +0 -19
  193. package/references/minimem/tsup.config.ts +0 -26
  194. package/references/minimem/vitest.config.ts +0 -24
  195. package/references/sessionlog/.husky/pre-commit +0 -1
  196. package/references/sessionlog/.lintstagedrc.json +0 -4
  197. package/references/sessionlog/.prettierignore +0 -4
  198. package/references/sessionlog/.prettierrc.json +0 -11
  199. package/references/sessionlog/LICENSE +0 -21
  200. package/references/sessionlog/README.md +0 -453
  201. package/references/sessionlog/eslint.config.js +0 -58
  202. package/references/sessionlog/package-lock.json +0 -3672
  203. package/references/sessionlog/package.json +0 -65
  204. package/references/sessionlog/src/__tests__/agent-hooks.test.ts +0 -570
  205. package/references/sessionlog/src/__tests__/agent-registry.test.ts +0 -127
  206. package/references/sessionlog/src/__tests__/claude-code-hooks.test.ts +0 -225
  207. package/references/sessionlog/src/__tests__/claude-generator.test.ts +0 -46
  208. package/references/sessionlog/src/__tests__/commit-msg.test.ts +0 -86
  209. package/references/sessionlog/src/__tests__/cursor-agent.test.ts +0 -224
  210. package/references/sessionlog/src/__tests__/e2e-live.test.ts +0 -890
  211. package/references/sessionlog/src/__tests__/event-log.test.ts +0 -183
  212. package/references/sessionlog/src/__tests__/flush-sentinel.test.ts +0 -105
  213. package/references/sessionlog/src/__tests__/gemini-agent.test.ts +0 -375
  214. package/references/sessionlog/src/__tests__/git-hooks.test.ts +0 -78
  215. package/references/sessionlog/src/__tests__/hook-managers.test.ts +0 -121
  216. package/references/sessionlog/src/__tests__/lifecycle-tasks.test.ts +0 -759
  217. package/references/sessionlog/src/__tests__/opencode-agent.test.ts +0 -338
  218. package/references/sessionlog/src/__tests__/redaction.test.ts +0 -136
  219. package/references/sessionlog/src/__tests__/session-repo.test.ts +0 -353
  220. package/references/sessionlog/src/__tests__/session-store.test.ts +0 -166
  221. package/references/sessionlog/src/__tests__/setup-ccweb.test.ts +0 -466
  222. package/references/sessionlog/src/__tests__/skill-live.test.ts +0 -461
  223. package/references/sessionlog/src/__tests__/summarize.test.ts +0 -348
  224. package/references/sessionlog/src/__tests__/task-plan-e2e.test.ts +0 -610
  225. package/references/sessionlog/src/__tests__/task-plan-live.test.ts +0 -632
  226. package/references/sessionlog/src/__tests__/transcript-timestamp.test.ts +0 -121
  227. package/references/sessionlog/src/__tests__/types.test.ts +0 -166
  228. package/references/sessionlog/src/__tests__/utils.test.ts +0 -333
  229. package/references/sessionlog/src/__tests__/validation.test.ts +0 -103
  230. package/references/sessionlog/src/__tests__/worktree.test.ts +0 -57
  231. package/references/sessionlog/src/agent/agents/claude-code.ts +0 -1089
  232. package/references/sessionlog/src/agent/agents/cursor.ts +0 -361
  233. package/references/sessionlog/src/agent/agents/gemini-cli.ts +0 -632
  234. package/references/sessionlog/src/agent/agents/opencode.ts +0 -540
  235. package/references/sessionlog/src/agent/registry.ts +0 -143
  236. package/references/sessionlog/src/agent/session-types.ts +0 -113
  237. package/references/sessionlog/src/agent/types.ts +0 -220
  238. package/references/sessionlog/src/cli.ts +0 -597
  239. package/references/sessionlog/src/commands/clean.ts +0 -133
  240. package/references/sessionlog/src/commands/disable.ts +0 -84
  241. package/references/sessionlog/src/commands/doctor.ts +0 -145
  242. package/references/sessionlog/src/commands/enable.ts +0 -202
  243. package/references/sessionlog/src/commands/explain.ts +0 -261
  244. package/references/sessionlog/src/commands/reset.ts +0 -105
  245. package/references/sessionlog/src/commands/resume.ts +0 -180
  246. package/references/sessionlog/src/commands/rewind.ts +0 -195
  247. package/references/sessionlog/src/commands/setup-ccweb.ts +0 -275
  248. package/references/sessionlog/src/commands/status.ts +0 -172
  249. package/references/sessionlog/src/config.ts +0 -165
  250. package/references/sessionlog/src/events/event-log.ts +0 -126
  251. package/references/sessionlog/src/git-operations.ts +0 -558
  252. package/references/sessionlog/src/hooks/git-hooks.ts +0 -165
  253. package/references/sessionlog/src/hooks/lifecycle.ts +0 -391
  254. package/references/sessionlog/src/index.ts +0 -650
  255. package/references/sessionlog/src/security/redaction.ts +0 -283
  256. package/references/sessionlog/src/session/state-machine.ts +0 -452
  257. package/references/sessionlog/src/store/checkpoint-store.ts +0 -509
  258. package/references/sessionlog/src/store/native-store.ts +0 -173
  259. package/references/sessionlog/src/store/provider-types.ts +0 -99
  260. package/references/sessionlog/src/store/session-store.ts +0 -266
  261. package/references/sessionlog/src/strategy/attribution.ts +0 -296
  262. package/references/sessionlog/src/strategy/common.ts +0 -207
  263. package/references/sessionlog/src/strategy/content-overlap.ts +0 -228
  264. package/references/sessionlog/src/strategy/manual-commit.ts +0 -988
  265. package/references/sessionlog/src/strategy/types.ts +0 -279
  266. package/references/sessionlog/src/summarize/claude-generator.ts +0 -115
  267. package/references/sessionlog/src/summarize/summarize.ts +0 -432
  268. package/references/sessionlog/src/types.ts +0 -508
  269. package/references/sessionlog/src/utils/chunk-files.ts +0 -49
  270. package/references/sessionlog/src/utils/commit-message.ts +0 -65
  271. package/references/sessionlog/src/utils/detect-agent.ts +0 -36
  272. package/references/sessionlog/src/utils/hook-managers.ts +0 -125
  273. package/references/sessionlog/src/utils/ide-tags.ts +0 -32
  274. package/references/sessionlog/src/utils/paths.ts +0 -79
  275. package/references/sessionlog/src/utils/preview-rewind.ts +0 -80
  276. package/references/sessionlog/src/utils/rewind-conflict.ts +0 -121
  277. package/references/sessionlog/src/utils/shadow-branch.ts +0 -109
  278. package/references/sessionlog/src/utils/string-utils.ts +0 -46
  279. package/references/sessionlog/src/utils/todo-extract.ts +0 -188
  280. package/references/sessionlog/src/utils/trailers.ts +0 -187
  281. package/references/sessionlog/src/utils/transcript-parse.ts +0 -177
  282. package/references/sessionlog/src/utils/transcript-timestamp.ts +0 -59
  283. package/references/sessionlog/src/utils/tree-ops.ts +0 -219
  284. package/references/sessionlog/src/utils/tty.ts +0 -72
  285. package/references/sessionlog/src/utils/validation.ts +0 -65
  286. package/references/sessionlog/src/utils/worktree.ts +0 -58
  287. package/references/sessionlog/src/wire-types.ts +0 -59
  288. package/references/sessionlog/templates/setup-env.sh +0 -153
  289. package/references/sessionlog/tsconfig.json +0 -18
  290. package/references/sessionlog/vitest.config.ts +0 -12
  291. package/references/skill-tree/.claude/settings.json +0 -6
  292. package/references/skill-tree/.sudocode/issues.jsonl +0 -19
  293. package/references/skill-tree/.sudocode/specs.jsonl +0 -3
  294. package/references/skill-tree/CLAUDE.md +0 -126
  295. package/references/skill-tree/README.md +0 -372
  296. package/references/skill-tree/docs/GAPS_v1.md +0 -221
  297. package/references/skill-tree/docs/INTEGRATION_PLAN.md +0 -467
  298. package/references/skill-tree/docs/TODOS.md +0 -91
  299. package/references/skill-tree/docs/anthropic_skill_guide.md +0 -1364
  300. package/references/skill-tree/docs/design/federated-skill-trees.md +0 -524
  301. package/references/skill-tree/docs/design/multi-agent-sync.md +0 -759
  302. package/references/skill-tree/docs/scraper/BRAINSTORM.md +0 -583
  303. package/references/skill-tree/docs/scraper/POC_PLAN.md +0 -420
  304. package/references/skill-tree/docs/scraper/README.md +0 -170
  305. package/references/skill-tree/examples/basic-usage.ts +0 -164
  306. package/references/skill-tree/package-lock.json +0 -1852
  307. package/references/skill-tree/package.json +0 -66
  308. package/references/skill-tree/scraper/README.md +0 -123
  309. package/references/skill-tree/scraper/docs/DESIGN.md +0 -683
  310. package/references/skill-tree/scraper/docs/PLAN.md +0 -336
  311. package/references/skill-tree/scraper/drizzle.config.ts +0 -10
  312. package/references/skill-tree/scraper/package-lock.json +0 -6329
  313. package/references/skill-tree/scraper/package.json +0 -68
  314. package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-description.md +0 -7
  315. package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-name.md +0 -7
  316. package/references/skill-tree/scraper/test/fixtures/minimal-skill/SKILL.md +0 -27
  317. package/references/skill-tree/scraper/test/fixtures/skill-json/SKILL.json +0 -21
  318. package/references/skill-tree/scraper/test/fixtures/skill-with-meta/SKILL.md +0 -54
  319. package/references/skill-tree/scraper/test/fixtures/skill-with-meta/_meta.json +0 -24
  320. package/references/skill-tree/scraper/test/fixtures/valid-skill/SKILL.md +0 -93
  321. package/references/skill-tree/scraper/test/fixtures/valid-skill/_meta.json +0 -22
  322. package/references/skill-tree/scraper/tsup.config.ts +0 -14
  323. package/references/skill-tree/scraper/vitest.config.ts +0 -17
  324. package/references/skill-tree/scripts/convert-to-vitest.ts +0 -166
  325. package/references/skill-tree/skills/skill-writer/SKILL.md +0 -339
  326. package/references/skill-tree/skills/skill-writer/references/examples.md +0 -326
  327. package/references/skill-tree/skills/skill-writer/references/patterns.md +0 -210
  328. package/references/skill-tree/skills/skill-writer/references/quality-checklist.md +0 -123
  329. package/references/skill-tree/test/run-all.ts +0 -106
  330. package/references/skill-tree/test/utils.ts +0 -128
  331. package/references/skill-tree/vitest.config.ts +0 -16
@@ -0,0 +1,54 @@
1
+ {
2
+ "name": "performance-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code that touches database queries, loops, caching, or I/O-intensive paths",
10
+ "Evaluating scalability of new features at 10x/100x/1000x current data volumes",
11
+ "Checking for production-observable performance regressions"
12
+ ],
13
+ "triggers": [
14
+ "performance review",
15
+ "N+1 query",
16
+ "slow query",
17
+ "memory leak",
18
+ "pagination",
19
+ "caching"
20
+ ],
21
+ "antiPatterns": [
22
+ "Micro-optimizations in cold paths (startup, migrations, admin tools, one-time initialization)",
23
+ "Premature caching suggestions without evidence of actual slowness",
24
+ "Theoretical scale issues in MVP/prototype code",
25
+ "Style-based performance opinions (for vs forEach, Map vs plain object)"
26
+ ],
27
+ "domains": ["code-review", "performance", "quality-assurance"]
28
+ },
29
+ "guidance": {
30
+ "strategy": "Read code through the lens of 'what happens when this runs 10,000 times' or 'when the table has a million rows'. Focus on measurable, production-observable problems — not theoretical micro-optimizations. Project performance at 10x, 100x, and 1000x current volumes.",
31
+ "tactics": [
32
+ "N+1 queries: flag database queries inside loops that should be batched or eager-loaded; count loop iterations against expected data size",
33
+ "Unbounded memory: flag loading entire tables without pagination, caches without eviction policies, string concatenation in loops, large object allocations",
34
+ "Missing pagination: flag endpoints returning all results without limit/offset/cursor/streaming",
35
+ "Hot-path allocations: flag object creation, regex compilation, or expensive computation inside loops or per-request paths",
36
+ "Blocking I/O in async: flag synchronous file reads, blocking HTTP calls, CPU-intensive computation on the event loop",
37
+ "Algorithmic complexity: flag O(n^2) or worse without justification; verify all database queries use appropriate indexes",
38
+ "Performance benchmarks: API responses under 200ms for standard operations, bundle size increases under 5KB per feature, background jobs processed in batches",
39
+ "Confidence calibration: HIGH (0.80+) when impact is provable from code (N+1 clearly in loop, unbounded query on large table); MODERATE (0.60-0.79) when pattern present but impact depends on unconfirmed data size; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Each finding identifies a specific code path with measurable impact at expected scale",
45
+ "N+1 findings show the loop and the query inside it",
46
+ "No micro-optimization findings on cold paths"
47
+ ],
48
+ "failureIndicators": [
49
+ "Finding is speculative optimization without evidence of hot path",
50
+ "Caching recommendation without evidence of repeated expensive computation",
51
+ "Flagging cold-path code (startup, migrations) for performance"
52
+ ]
53
+ }
54
+ }
@@ -0,0 +1,56 @@
1
+ {
2
+ "name": "plan-adversarial-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 5,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing implementation plans or requirement documents before execution",
10
+ "Stress-testing planning assumptions, premises, and scope decisions",
11
+ "Catching contradictions, scope creep, and unstated assumptions in plans"
12
+ ],
13
+ "triggers": [
14
+ "review plan",
15
+ "plan review",
16
+ "challenge assumptions",
17
+ "scope review",
18
+ "requirements review"
19
+ ],
20
+ "antiPatterns": [
21
+ "Implementation style or technology selection choices",
22
+ "Product strategy or priority preferences",
23
+ "Security, design, or feasibility concerns (use plan-feasibility-review instead)",
24
+ "The plan is already in execution — too late for adversarial review"
25
+ ],
26
+ "domains": ["planning", "requirements", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Challenge premises before solutions. Surface unstated assumptions. Stress-test decisions for reversal cost. Check for internal contradictions and scope-goal misalignment. Apply three lenses: adversarial (break assumptions), coherence (internal consistency), and scope guardian (right-sized).",
30
+ "tactics": [
31
+ "Premise challenging: Is this the right problem? Does the solution match the problem? What if we did nothing? What would make this fail? Surface framing effects that bias toward one solution",
32
+ "Assumption surfacing: identify environmental assumptions (infrastructure exists, APIs stable), user behavior assumptions (adoption, usage patterns), scale assumptions (data volume, concurrency), temporal assumptions (availability, ordering)",
33
+ "Decision stress-testing: for each major decision, apply falsification test (what evidence would prove this wrong?), reversal cost (how expensive to change later?), and decision-scope mismatch (is decision bigger/smaller than the problem?)",
34
+ "Simplification pressure: audit abstractions (how many consumers?), find minimum viable version, apply subtraction test (remove each component — does plan still work?), enforce complexity budget",
35
+ "Coherence checking: catch contradictions between sections, terminology drift (same concept with different names), forward references to undefined terms, ungrouped requirements spanning multiple concerns",
36
+ "Scope-goal alignment: flag scope exceeding goals (building more than needed), goals exceeding scope (promising more than plan delivers), new abstractions with one implementation, framework-ahead-of-need, configuration without consumers",
37
+ "Alternative blindness: check for omitted alternatives, build-vs-use analysis, do-nothing baseline comparison",
38
+ "Depth calibration: Quick (short docs, <5 requirements) = max 3 findings; Standard = proportional to decision density; Deep (>10 requirements, high-stakes) = multiple passes with assumption chain tracing",
39
+ "Confidence calibration: HIGH (0.80+) when specific text can be quoted showing gap; MODERATE (0.60-0.79) when gap likely but requires context not in document; suppress below 0.50"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Findings quote specific text from the plan showing the gap or contradiction",
45
+ "Assumptions surfaced are testable and actionable",
46
+ "Scope-goal alignment checked with concrete evidence",
47
+ "No findings that belong to feasibility, security, or design review"
48
+ ],
49
+ "failureIndicators": [
50
+ "Findings are vague concerns without quoting specific plan text",
51
+ "Assumptions identified are untestable or irrelevant",
52
+ "Scope opinions based on preference rather than goal alignment",
53
+ "Contradictions flagged that are reconcilable with charitable reading"
54
+ ]
55
+ }
56
+ }
@@ -0,0 +1,56 @@
1
+ {
2
+ "name": "plan-feasibility-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 5,
7
+ "applicability": {
8
+ "situations": [
9
+ "Evaluating technical feasibility of implementation plans",
10
+ "Checking product-market fit and strategic alignment of proposed features",
11
+ "Reviewing plans for security gaps, design completeness, and migration safety"
12
+ ],
13
+ "triggers": [
14
+ "feasibility review",
15
+ "plan feasibility",
16
+ "technical review",
17
+ "can we build this",
18
+ "is this plan viable"
19
+ ],
20
+ "antiPatterns": [
21
+ "Implementation style choices that don't affect feasibility",
22
+ "Code organization preferences",
23
+ "Theoretical scalability without evidence",
24
+ "Scope or assumption concerns (use plan-adversarial-review instead)"
25
+ ],
26
+ "domains": ["planning", "architecture", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Evaluate plans across four dimensions: technical feasibility (can we build it?), product fit (should we build it?), security readiness (is it safe?), and design completeness (is it specified enough?). Each dimension has a distinct lens.",
30
+ "tactics": [
31
+ "Technical feasibility: verify plan acknowledges existing code/services/infrastructure; check for architecture conflicts with current stack; validate that referenced file paths and interfaces actually exist; check framework compatibility",
32
+ "Shadow path tracing: for each feature, trace the happy path, nil/empty input path, error path, and concurrent access path — plans that only cover happy path will fail in implementation",
33
+ "Migration safety: verify concrete migration path (not 'migrate later'), backward compatibility during rollout, rollback strategy, data volume estimates, and operation ordering",
34
+ "Product lens: challenge the premise — is this the right problem? What's the actual outcome? What happens if we do nothing? Is there an alternative that delivers 80% of the value at 20% of the cost? Check goal-requirement alignment (orphan requirements, unserved goals)",
35
+ "Security lens: inventory attack surfaces (endpoints, data stores, integrations, user inputs), check auth/authz per endpoint, identify sensitive data flows, assess third-party trust boundaries, outline top-3 threat model (most likely, highest impact, most subtle exploit)",
36
+ "Design completeness: check interaction state coverage (loading, empty, error, success, partial for every interactive element), user flow completeness (entry points, happy path, 2-3 edge cases, exit points), responsive/accessibility considerations",
37
+ "Dependency analysis: verify external dependencies are available and compatible; identify implicit assumptions about infrastructure, APIs, or services",
38
+ "Performance feasibility: back-of-envelope math for expected load, data volumes, and response time requirements",
39
+ "Confidence calibration: HIGH (0.80+) when specific technical constraint blocks the approach; MODERATE (0.60-0.79) when constraint likely but depends on implementation details; suppress below 0.50"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Technical blockers identified with specific evidence (missing API, framework incompatibility)",
45
+ "Shadow paths traced — plan covers more than just the happy path",
46
+ "Security attack surfaces inventoried with mitigation gaps flagged",
47
+ "Product alignment verified — goals trace to requirements"
48
+ ],
49
+ "failureIndicators": [
50
+ "Feasibility concerns are vague without specific technical evidence",
51
+ "Only happy path evaluated — error/empty/concurrent paths ignored",
52
+ "Security review is generic OWASP checklist without plan-specific analysis",
53
+ "Product concerns are preference-based rather than goal-alignment-based"
54
+ ]
55
+ }
56
+ }
@@ -0,0 +1,52 @@
1
+ {
2
+ "name": "project-standards-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "simple",
6
+ "estimatedEffort": 2,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing changes for compliance with the project's own standards (CLAUDE.md, AGENTS.md, contributing guides)",
10
+ "Enforcing naming conventions, file placement, and configuration rules",
11
+ "Auditing changes against established project conventions"
12
+ ],
13
+ "triggers": [
14
+ "standards review",
15
+ "convention check",
16
+ "CLAUDE.md compliance",
17
+ "project rules"
18
+ ],
19
+ "antiPatterns": [
20
+ "Rules that don't apply to the changed file type",
21
+ "Violations already caught by automated linters or CI",
22
+ "Pre-existing violations in unchanged code",
23
+ "Generic best practices not documented in the project's standards files",
24
+ "Opinions about quality of the standards themselves"
25
+ ],
26
+ "domains": ["code-review", "standards", "quality-assurance"]
27
+ },
28
+ "guidance": {
29
+ "strategy": "Audit changes against the project's own documented standards. Every finding must cite a specific rule from the standards file AND a specific violation in the diff. Without both, drop the finding.",
30
+ "tactics": [
31
+ "Discover standards: read CLAUDE.md, AGENTS.md, and any contributing/convention files in the changed file's ancestor directories",
32
+ "Match rules to file types: only apply rules relevant to the specific files being changed",
33
+ "Evidence requirement: for each finding, provide (1) exact quote/section from standards file defining the rule, and (2) specific line(s) in diff violating the rule",
34
+ "Common violations: missing required frontmatter fields, names not matching directory/file names, wrong reference inclusion mode, shell commands where native tools are required, misplaced files in wrong directories",
35
+ "Language violations: second-person 'you should' where standards require imperative form, hedge words (might/could/consider) leaving behavior undefined",
36
+ "Protected artifacts: never flag documented protected paths (docs/, plans/, solutions/) for deletion",
37
+ "Confidence calibration: HIGH (0.80+) when specific rule quote and specific diff violation are both identifiable; MODERATE (0.60-0.79) when rule exists but applying it requires judgment; suppress below 0.60"
38
+ ]
39
+ },
40
+ "verification": {
41
+ "successIndicators": [
42
+ "Every finding cites both the rule source and the specific violation",
43
+ "Only rules from the project's actual standards files are enforced",
44
+ "No findings about unchanged code or generic best practices"
45
+ ],
46
+ "failureIndicators": [
47
+ "Finding enforces a rule not documented in any standards file",
48
+ "Finding about pre-existing code that wasn't changed in this diff",
49
+ "Generic best practice advice without project-specific rule citation"
50
+ ]
51
+ }
52
+ }
@@ -0,0 +1,53 @@
1
+ {
2
+ "name": "reliability-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code with external dependencies, I/O boundaries, or error handling",
10
+ "Evaluating failure modes, retry logic, and cascading failure paths",
11
+ "Checking resilience of services that depend on other services"
12
+ ],
13
+ "triggers": [
14
+ "reliability review",
15
+ "error handling",
16
+ "retry",
17
+ "timeout",
18
+ "circuit breaker",
19
+ "cascade failure"
20
+ ],
21
+ "antiPatterns": [
22
+ "Flagging internal pure functions that cannot fail (string formatting, math, in-memory transforms)",
23
+ "Test helper error handling",
24
+ "Error message formatting choices",
25
+ "Theoretical cascading failures without traceable evidence"
26
+ ],
27
+ "domains": ["code-review", "reliability", "quality-assurance"]
28
+ },
29
+ "guidance": {
30
+ "strategy": "Ask 'what happens when this dependency is down?' for every external call. Think about partial failures, retry storms, and cascading timeouts. Read code by assuming the environment can be hostile.",
31
+ "tactics": [
32
+ "Missing error handling on I/O boundaries: flag HTTP calls, database queries, file operations, and message queue interactions without try/catch or error callbacks",
33
+ "Retry loops without backoff/limits: immediate indefinite retries create retry storms — require exponential backoff and max attempt limits",
34
+ "Missing timeouts on external calls: HTTP clients, database connections, and RPC without explicit timeouts can hang indefinitely and exhaust connection pools",
35
+ "Error swallowing: flag catch blocks that ignore errors, silent failures that return misleading defaults, and error handlers that don't log or propagate",
36
+ "Cascading failure paths: trace how failure in service A causes B to retry aggressively, overloading C; how slow dependencies fill request queues causing health check failures, restarts, and cold-start storms",
37
+ "Recovery-induced failures: retries creating duplicates, rollbacks leaving orphaned state, circuit breakers preventing legitimate recovery",
38
+ "Confidence calibration: HIGH (0.80+) when reliability gap is directly visible (HTTP call without timeout, retry without max attempts, catch swallowing error); MODERATE (0.60-0.79) when code lacks protection but framework defaults might handle it; suppress below 0.60"
39
+ ]
40
+ },
41
+ "verification": {
42
+ "successIndicators": [
43
+ "Each finding points to a specific I/O boundary without protection",
44
+ "Retry findings show the loop and its missing backoff/limit",
45
+ "Cascade findings trace the multi-service failure chain"
46
+ ],
47
+ "failureIndicators": [
48
+ "Flagging pure functions or in-memory operations for error handling",
49
+ "Missing that framework middleware already handles the concern",
50
+ "Architectural concerns that can't be confirmed from the diff"
51
+ ]
52
+ }
53
+ }
@@ -0,0 +1,64 @@
1
+ {
2
+ "name": "review-orchestration",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 8,
7
+ "applicability": {
8
+ "situations": [
9
+ "Code review before creating a PR",
10
+ "Reviewing changes after completing a task during iterative implementation",
11
+ "Structured multi-persona code review for quality assurance"
12
+ ],
13
+ "triggers": [
14
+ "review code",
15
+ "code review",
16
+ "check changes",
17
+ "pre-PR review"
18
+ ],
19
+ "antiPatterns": [
20
+ "Reviewing trivial formatting-only changes",
21
+ "Reviewing auto-generated code that will be regenerated",
22
+ "Single-line config changes that don't affect behavior"
23
+ ],
24
+ "domains": ["code-review", "quality-assurance", "software-engineering"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "Deploy tiered reviewer personas in parallel, then merge and deduplicate findings. Always-on reviewers run on every review; conditional reviewers are selected based on the diff content.",
28
+ "tactics": [
29
+ "Always-on reviewers: correctness (logic bugs), testing (coverage gaps), maintainability (coupling/complexity), project-standards (convention compliance), agent-native (action/context parity), learnings-researcher (institutional knowledge)",
30
+ "Conditional reviewers selected per-diff: security (auth/injection), performance (N+1/memory), API-contract (breaking changes), data-migrations (schema safety), reliability (error handling), adversarial (edge cases), stack-specific language reviewers",
31
+ "Each reviewer returns structured findings with severity (P0-P3), confidence (0.0-1.0), and autofix_class (safe_auto/gated_auto/manual/advisory)",
32
+ "Suppress all findings below 0.60 confidence to prevent noise",
33
+ "Merge/deduplicate findings by fingerprint: (file + line_bucket (within +/- 3 lines) + normalized_title). On conflict, keep the highest severity and the strongest confidence",
34
+ "Route actions by class: safe_auto findings get auto-fixed; gated_auto/manual findings go to human review; advisory findings are informational only",
35
+ "Maximum 2 rounds of autofix to prevent loops"
36
+ ],
37
+ "steps": [
38
+ "1. Detect scope of changes (files, languages, domains affected)",
39
+ "2. Discover intent from commit messages, PR description, or task context",
40
+ "3. Select conditional reviewers based on scope (security for auth files, performance for queries, etc.)",
41
+ "4. Dispatch all selected reviewers in parallel — each reads the diff independently",
42
+ "5. Collect structured JSON findings from all reviewers",
43
+ "6. Merge findings: deduplicate by fingerprint, resolve severity conflicts conservatively",
44
+ "7. Synthesize final report with verdict: Ready / Ready with fixes / Not ready"
45
+ ]
46
+ },
47
+ "verification": {
48
+ "successIndicators": [
49
+ "All P0 findings are genuine breakage traceable to specific code paths",
50
+ "Line numbers point to exact buggy code, not nearby lines",
51
+ "Each finding is actionable with a clear fix path",
52
+ "No false positives from style issues that linters catch",
53
+ "Deduplication produces no redundant findings"
54
+ ],
55
+ "failureIndicators": [
56
+ "P0 findings that are actually style nits",
57
+ "False positives exceeding 20% of total findings",
58
+ "Same issue reported multiple times after deduplication",
59
+ "Findings that require runtime observation to confirm (not provable from code)",
60
+ "Protected artifacts (docs, plans, brainstorms) flagged for deletion"
61
+ ],
62
+ "rollbackStrategy": "Review findings are advisory — no code changes until human approval (except safe_auto in autofix mode)"
63
+ }
64
+ }
@@ -0,0 +1,54 @@
1
+ {
2
+ "name": "security-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 4,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing code changes that touch auth, user input, public endpoints, or permissions",
10
+ "Auditing for exploitable vulnerabilities before deployment",
11
+ "Systematic OWASP Top 10 compliance checking"
12
+ ],
13
+ "triggers": [
14
+ "security review",
15
+ "auth",
16
+ "injection",
17
+ "XSS",
18
+ "CSRF",
19
+ "user input",
20
+ "public endpoint"
21
+ ],
22
+ "antiPatterns": [
23
+ "Defense-in-depth on already-protected code",
24
+ "Theoretical attacks requiring physical access",
25
+ "HTTP vs HTTPS in dev/test configs",
26
+ "Generic hardening advice without specific exploitable findings"
27
+ ],
28
+ "domains": ["code-review", "security", "quality-assurance"]
29
+ },
30
+ "guidance": {
31
+ "strategy": "Think like an attacker looking for one exploitable path through the code. Trace data from entry point to dangerous sink. Combine targeted attack-path analysis with systematic OWASP Top 10 coverage.",
32
+ "tactics": [
33
+ "Injection vectors: trace untrusted input to SQL queries, HTML output (XSS), shell commands, template engines, innerHTML/dangerouslySetInnerHTML — flag when there is no sanitization between entry and sink",
34
+ "Auth/authz bypasses: check for missing auth middleware, broken ownership checks (user A accessing user B's resources), privilege escalation, CSRF on state-changing endpoints",
35
+ "Secrets exposure: scan for hardcoded keys/tokens/passwords, sensitive data in error messages or logs, PII in responses without need-to-know filtering",
36
+ "Insecure deserialization: flag pickle, Marshal, unserialize, JSON.parse of executable content from untrusted sources",
37
+ "SSRF and path traversal: flag user-controlled URLs or file paths passed to fetch/open without allowlist validation",
38
+ "Systematic OWASP Top 10 check: input validation on all entry points (req.body, req.params, req.query), SQL parameterization, XSS escaping + CSP headers, auth on all endpoints, encryption for sensitive data at rest and in transit",
39
+ "Confidence calibration: HIGH (0.80+) when full attack path is traceable from untrusted input to dangerous sink without sanitization; MODERATE (0.60-0.79) when dangerous pattern present but exploitability unconfirmed; suppress below 0.60"
40
+ ]
41
+ },
42
+ "verification": {
43
+ "successIndicators": [
44
+ "Each finding traces a complete attack path: untrusted input → specific code path → exploitable outcome",
45
+ "No false positives from already-protected code or dev-only configs",
46
+ "OWASP categories systematically checked, not just obvious injection"
47
+ ],
48
+ "failureIndicators": [
49
+ "Finding requires physical access or internal-only network to exploit",
50
+ "Generic 'could be vulnerable' without tracing specific input to specific sink",
51
+ "Flagging defense-in-depth that's already behind validated auth"
52
+ ]
53
+ }
54
+ }
@@ -0,0 +1,64 @@
1
+ {
2
+ "name": "systematic-execution",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.8,
5
+ "complexity": "complex",
6
+ "estimatedEffort": 10,
7
+ "applicability": {
8
+ "situations": [
9
+ "Executing an implementation plan systematically",
10
+ "Shipping a feature with testing, review, and quality gates",
11
+ "Multi-unit implementation requiring incremental progress and verification"
12
+ ],
13
+ "triggers": [
14
+ "execute plan",
15
+ "start work",
16
+ "implement this",
17
+ "ship feature"
18
+ ],
19
+ "antiPatterns": [
20
+ "No plan exists — create one first",
21
+ "Exploratory work where requirements aren't defined",
22
+ "Hotfix that needs to ship immediately without full process"
23
+ ],
24
+ "domains": ["execution", "implementation", "software-engineering"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "Treat the plan as a decision artifact, not an instruction script. Execute implementation units in dependency order, testing continuously, with incremental commits after each logical unit. Simplify after every 2-3 units.",
28
+ "tactics": [
29
+ "Read plan's Implementation Units; honor execution posture (test-first, characterization-first) when annotated; check 'Deferred to Implementation' questions before starting",
30
+ "Strategy selection by scale: inline (1-2 small tasks), serial subagents (3+ with dependencies), parallel subagents (3+ independent), swarm (10+ with coordination)",
31
+ "Test as you go, not at end: run tests after each significant change; never batch testing to the end",
32
+ "System-wide test check before marking task done: trace callbacks/middleware/observers two levels out; write integration tests with real objects through full chain; verify failure doesn't leave orphaned state; check if other interfaces expose same behavior",
33
+ "Incremental commits after each complete logical unit — messages describe complete valuable changes, not WIP",
34
+ "Simplify after every 2-3 units: review changed files for consolidation opportunities, dead code, naming improvements",
35
+ "Pattern following discipline: read referenced files from plan before implementing — don't invent new conventions",
36
+ "Feature completeness first: don't move to next feature until current one ships"
37
+ ],
38
+ "steps": [
39
+ "1. Read plan, clarify any ambiguities, set up environment",
40
+ "2. Create task tracking for all implementation units",
41
+ "3. Execute units in dependency order: implement → test → verify → commit",
42
+ "4. After every 2-3 units, review for simplification opportunities",
43
+ "5. Run quality checks: tests pass, linting passes, code follows existing patterns",
44
+ "6. Prepare PR: summary (what/why/decisions), testing notes, post-deploy monitoring plan",
45
+ "7. Update plan status"
46
+ ]
47
+ },
48
+ "verification": {
49
+ "successIndicators": [
50
+ "All implementation units completed and tested",
51
+ "Tests pass and linting passes",
52
+ "Code follows existing patterns — no new conventions invented",
53
+ "Each commit describes a complete valuable change",
54
+ "PR includes post-deploy monitoring plan with concrete metrics"
55
+ ],
56
+ "failureIndicators": [
57
+ "Tests batched to end and found late-breaking issues",
58
+ "New conventions invented instead of following existing patterns",
59
+ "Commits contain WIP or incomplete changes",
60
+ "Moved on to the next feature before the current one fully shipped",
61
+ "System-wide test check skipped for code with callbacks or error handling"
62
+ ]
63
+ }
64
+ }
@@ -0,0 +1,50 @@
1
+ {
2
+ "name": "testing-review",
3
+ "curatedBy": "compound-engineering",
4
+ "confidence": 0.85,
5
+ "complexity": "moderate",
6
+ "estimatedEffort": 3,
7
+ "applicability": {
8
+ "situations": [
9
+ "Reviewing test quality and coverage for code changes",
10
+ "Evaluating whether tests prove code works or provide false confidence",
11
+ "Checking for untested branches, weak assertions, and missing error paths"
12
+ ],
13
+ "triggers": [
14
+ "code review",
15
+ "test coverage",
16
+ "test quality",
17
+ "missing tests"
18
+ ],
19
+ "antiPatterns": [
20
+ "Reviewing test infrastructure or test framework setup",
21
+ "Evaluating test performance or execution speed",
22
+ "Coverage percentage targets without considering test quality"
23
+ ],
24
+ "domains": ["code-review", "testing", "quality-assurance"]
25
+ },
26
+ "guidance": {
27
+ "strategy": "For every new branch (if/else/switch/try/catch) in the diff, verify at least one test exercises it. Focus on whether tests prove behavior, not just that code doesn't throw.",
28
+ "tactics": [
29
+ "Hunt for: untested branches (new if/else/switch/try/catch), tests that don't assert behavior (only assert 'doesn't throw'), implementation-coupled brittle tests (assert on mocks, test private methods, snapshot internals), missing error path coverage",
30
+ "Branch coverage discipline: each new branch must have at least one test; trace all paths through the new code",
31
+ "Behavior assertion rigor: assert specific values not just truthiness; verify both happy path AND sad path",
32
+ "Check that error paths are tested: catch blocks, fallback branches, error returns should have dedicated tests",
33
+ "Flag implementation-coupled tests: tests that break when refactoring without behavior change are brittle",
34
+ "Confidence calibration: HIGH (0.80+) when test gap is provable from diff (new branch, no test); MODERATE (0.60-0.79) when inferred from structure (parser.ts with no parser.test.ts); suppress below 0.60 when coverage may exist in integration tests"
35
+ ]
36
+ },
37
+ "verification": {
38
+ "successIndicators": [
39
+ "All new branches have corresponding test cases",
40
+ "Tests assert actual behavior with specific expected values",
41
+ "Error paths have dedicated tests, not just happy path",
42
+ "No implementation-coupled brittleness identified"
43
+ ],
44
+ "failureIndicators": [
45
+ "New branches found without any test coverage",
46
+ "Tests only assert 'doesn't throw' or truthiness without checking values",
47
+ "Error handling code has no test exercising the error path"
48
+ ]
49
+ }
50
+ }
package/src/atlas.ts CHANGED
@@ -9,6 +9,15 @@ import type {
9
9
  import type { KnowledgeMatch } from './types/knowledge.js';
10
10
  import { createDefaultConfig } from './types/index.js';
11
11
  import { MemorySystem, createMemorySystem, type TeamExperience } from './memory/index.js';
12
+ import {
13
+ loadCuratedPlaybooks as loadCuratedPlaybooksFn,
14
+ BUNDLED_SEED_PACK_DIR,
15
+ } from './memory/curated-loader.js';
16
+ import {
17
+ resolvePlaybookSource,
18
+ sourceStateKey,
19
+ type SourceState,
20
+ } from './memory/source-resolver.js';
12
21
  import {
13
22
  UnifiedLearningPipeline,
14
23
  createUnifiedPipeline,
@@ -271,6 +280,9 @@ export class Atlas {
271
280
 
272
281
  // Initialize playbook-based components if playbooks are available
273
282
  if (this.memory.playbooks) {
283
+ // Load curated playbooks (bundled seed pack + additional dirs)
284
+ await this.loadCuratedPlaybooks();
285
+
274
286
  this.skillLibrary = createSkillLibrary(
275
287
  this.memory.playbooks,
276
288
  this.config.skillLibrary
@@ -290,6 +302,90 @@ export class Atlas {
290
302
  }
291
303
  }
292
304
 
305
/**
 * Populate the playbook library with curated playbooks.
 *
 * Loads, in this order:
 *  1. the bundled seed pack, when `loadBundledSeedPack` is set;
 *  2. every directory listed in `additionalDirs`;
 *  3. every entry of `sources`, each delegated to `loadFromSource()`.
 *
 * When `recreateOnInit` is set, every load is asked to recreate.
 * Invoked while initializing the playbook-based components, before the
 * skill library is created.
 */
private async loadCuratedPlaybooks(): Promise<void> {
  const settings = this.config.curatedPlaybooks;
  const shouldRecreate = settings.recreateOnInit;

  // `recreate` is only present when requested; a normal load passes just the source id.
  const optionsFor = (sourceId: string) =>
    shouldRecreate ? { recreate: true, sourceId } : { sourceId };

  // Seed pack shipped with cognitive-core.
  if (settings.loadBundledSeedPack) {
    await loadCuratedPlaybooksFn(
      BUNDLED_SEED_PACK_DIR,
      this.memory.playbooks,
      optionsFor('bundled'),
    );
  }

  // Plain directories (kept for backward compatibility); the directory doubles as the source id.
  for (const extraDir of settings.additionalDirs) {
    await loadCuratedPlaybooksFn(extraDir, this.memory.playbooks, optionsFor(extraDir));
  }

  // Nothing left to do when no resolvable sources are configured.
  if (settings.sources.length === 0) return;

  // Sources (local paths + git repos) share one cache directory under the storage base dir.
  const sourceCacheDir = join(this.config.storage.baseDir, settings.cache.dir);
  for (const entry of settings.sources) {
    await this.loadFromSource(entry, sourceCacheDir, shouldRecreate);
  }
}
342
+
343
/**
 * Resolve one configured source and load the playbooks it provides.
 *
 * @param source - Source entry as configured (local path or git repo).
 * @param cacheDir - Cache directory handed to the resolver.
 * @param recreate - When true, forces the resolver to update and asks the
 *   loader to recreate playbooks.
 */
private async loadFromSource(
  source: string,
  cacheDir: string,
  recreate: boolean,
): Promise<void> {
  const { cache } = this.config.curatedPlaybooks;

  // The resolver reads and writes its per-source state through the persistence layer.
  const resolution = await resolvePlaybookSource(source, {
    cacheDir,
    maxAgeMs: cache.maxAgeMs,
    forceUpdate: recreate,
    getSourceState: (src) =>
      this.persistence.getSystemState<SourceState>(sourceStateKey(src)),
    setSourceState: (src, nextState) =>
      this.persistence.setSystemState(sourceStateKey(src), nextState),
  });

  // The resolver produced nothing to load.
  if (!resolution) return;

  // A git source that was not updated already has its playbooks in the library
  // from a previous init, so it is skipped unless a recreate was requested.
  // Local paths are always loaded (the loader handles dedup via getByName).
  const unchangedGitSource = resolution.isGit && !resolution.updated;
  if (unchangedGitSource && !recreate) return;

  const outcome = await loadCuratedPlaybooksFn(
    resolution.playbookDir,
    this.memory.playbooks,
    recreate
      ? { recreate: true, sourceId: resolution.sourceId }
      : { sourceId: resolution.sourceId },
  );

  // Record how many playbooks were loaded, but only if state already exists for this source.
  const key = sourceStateKey(source);
  const stored = this.persistence.getSystemState<SourceState>(key);
  if (!stored) return;

  stored.playbookCount = outcome.loaded;
  this.persistence.setSystemState(key, stored);
}
388
+
293
389
  /**
294
390
  * Set the LLM provider for solving (deprecated)
295
391
  * @deprecated Use setAgentManager() with backends for real execution