cognitive-core 0.2.0 → 0.2.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/settings.json +111 -2
- package/.sessionlog/settings.json +4 -0
- package/dist/atlas.d.ts +10 -0
- package/dist/atlas.d.ts.map +1 -1
- package/dist/atlas.js +65 -0
- package/dist/atlas.js.map +1 -1
- package/dist/index.d.ts +1 -1
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +5 -1
- package/dist/index.js.map +1 -1
- package/dist/learning/index.d.ts +1 -1
- package/dist/learning/index.d.ts.map +1 -1
- package/dist/learning/index.js.map +1 -1
- package/dist/learning/pipeline.d.ts +4 -31
- package/dist/learning/pipeline.d.ts.map +1 -1
- package/dist/learning/pipeline.js +12 -64
- package/dist/learning/pipeline.js.map +1 -1
- package/dist/learning/unified-pipeline.d.ts +30 -0
- package/dist/learning/unified-pipeline.d.ts.map +1 -1
- package/dist/learning/unified-pipeline.js +207 -0
- package/dist/learning/unified-pipeline.js.map +1 -1
- package/dist/memory/candidate-retrieval.d.ts.map +1 -1
- package/dist/memory/candidate-retrieval.js +3 -1
- package/dist/memory/candidate-retrieval.js.map +1 -1
- package/dist/memory/curated-loader.d.ts +21 -4
- package/dist/memory/curated-loader.d.ts.map +1 -1
- package/dist/memory/curated-loader.js +53 -16
- package/dist/memory/curated-loader.js.map +1 -1
- package/dist/memory/index.d.ts +2 -1
- package/dist/memory/index.d.ts.map +1 -1
- package/dist/memory/index.js +3 -1
- package/dist/memory/index.js.map +1 -1
- package/dist/memory/playbook.d.ts +6 -0
- package/dist/memory/playbook.d.ts.map +1 -1
- package/dist/memory/playbook.js +15 -0
- package/dist/memory/playbook.js.map +1 -1
- package/dist/memory/source-resolver.d.ts +120 -0
- package/dist/memory/source-resolver.d.ts.map +1 -0
- package/dist/memory/source-resolver.js +300 -0
- package/dist/memory/source-resolver.js.map +1 -0
- package/dist/types/config.d.ts +141 -0
- package/dist/types/config.d.ts.map +1 -1
- package/dist/types/config.js +40 -0
- package/dist/types/config.js.map +1 -1
- package/dist/types/index.d.ts +1 -1
- package/dist/types/index.d.ts.map +1 -1
- package/dist/types/index.js +1 -1
- package/dist/types/index.js.map +1 -1
- package/dist/utils/error-classifier.js +8 -8
- package/dist/utils/error-classifier.js.map +1 -1
- package/dist/workspace/efficacy-toolkit.d.ts +164 -0
- package/dist/workspace/efficacy-toolkit.d.ts.map +1 -0
- package/dist/workspace/efficacy-toolkit.js +281 -0
- package/dist/workspace/efficacy-toolkit.js.map +1 -0
- package/dist/workspace/index.d.ts +2 -1
- package/dist/workspace/index.d.ts.map +1 -1
- package/dist/workspace/index.js +3 -1
- package/dist/workspace/index.js.map +1 -1
- package/dist/workspace/templates/index.d.ts +3 -0
- package/dist/workspace/templates/index.d.ts.map +1 -1
- package/dist/workspace/templates/index.js +6 -0
- package/dist/workspace/templates/index.js.map +1 -1
- package/dist/workspace/templates/playbook-decay-detection.d.ts +46 -0
- package/dist/workspace/templates/playbook-decay-detection.d.ts.map +1 -0
- package/dist/workspace/templates/playbook-decay-detection.js +197 -0
- package/dist/workspace/templates/playbook-decay-detection.js.map +1 -0
- package/dist/workspace/templates/playbook-efficacy-audit.d.ts +46 -0
- package/dist/workspace/templates/playbook-efficacy-audit.d.ts.map +1 -0
- package/dist/workspace/templates/playbook-efficacy-audit.js +160 -0
- package/dist/workspace/templates/playbook-efficacy-audit.js.map +1 -0
- package/dist/workspace/templates/playbook-lifecycle-review.d.ts +51 -0
- package/dist/workspace/templates/playbook-lifecycle-review.d.ts.map +1 -0
- package/dist/workspace/templates/playbook-lifecycle-review.js +187 -0
- package/dist/workspace/templates/playbook-lifecycle-review.js.map +1 -0
- package/dist/workspace/types.d.ts +12 -54
- package/dist/workspace/types.d.ts.map +1 -1
- package/dist/workspace/types.js.map +1 -1
- package/package.json +8 -2
- package/playbooks/compound-engineering/adversarial-review.json +51 -0
- package/playbooks/compound-engineering/agent-native-architecture.json +59 -0
- package/playbooks/compound-engineering/agent-native-review.json +54 -0
- package/playbooks/compound-engineering/api-contract-review.json +52 -0
- package/playbooks/compound-engineering/brainstorm-requirements.json +55 -0
- package/playbooks/compound-engineering/bug-reproduction.json +62 -0
- package/playbooks/compound-engineering/confidence-calibration.json +49 -0
- package/playbooks/compound-engineering/correctness-review.json +49 -0
- package/playbooks/compound-engineering/data-migration-safety.json +59 -0
- package/playbooks/compound-engineering/deployment-verification.json +63 -0
- package/playbooks/compound-engineering/error-recovery-patterns.json +53 -0
- package/playbooks/compound-engineering/implementation-planning.json +64 -0
- package/playbooks/compound-engineering/issue-pattern-analysis.json +53 -0
- package/playbooks/compound-engineering/knowledge-compounding.json +63 -0
- package/playbooks/compound-engineering/learnings-research.json +54 -0
- package/playbooks/compound-engineering/maintainability-review.json +49 -0
- package/playbooks/compound-engineering/performance-review.json +54 -0
- package/playbooks/compound-engineering/plan-adversarial-review.json +56 -0
- package/playbooks/compound-engineering/plan-feasibility-review.json +56 -0
- package/playbooks/compound-engineering/project-standards-review.json +52 -0
- package/playbooks/compound-engineering/reliability-review.json +53 -0
- package/playbooks/compound-engineering/review-orchestration.json +64 -0
- package/playbooks/compound-engineering/security-review.json +54 -0
- package/playbooks/compound-engineering/systematic-execution.json +64 -0
- package/playbooks/compound-engineering/testing-review.json +50 -0
- package/src/atlas.ts +96 -0
- package/src/index.ts +27 -0
- package/src/learning/index.ts +1 -0
- package/src/learning/unified-pipeline.ts +271 -1
- package/src/memory/candidate-retrieval.ts +2 -1
- package/src/memory/curated-loader.ts +69 -16
- package/src/memory/index.ts +16 -0
- package/src/memory/playbook.ts +19 -0
- package/src/memory/source-resolver.ts +422 -0
- package/src/types/config.ts +46 -0
- package/src/types/index.ts +4 -0
- package/src/utils/error-classifier.ts +8 -8
- package/src/workspace/efficacy-toolkit.ts +496 -0
- package/src/workspace/index.ts +29 -0
- package/src/workspace/templates/index.ts +24 -0
- package/src/workspace/templates/playbook-decay-detection.ts +272 -0
- package/src/workspace/templates/playbook-efficacy-audit.ts +246 -0
- package/src/workspace/templates/playbook-lifecycle-review.ts +274 -0
- package/src/workspace/types.ts +22 -78
- package/tests/fixtures/behavioral-trajectories.ts +210 -0
- package/tests/integration/curated-sources-e2e.test.ts +502 -0
- package/tests/integration/pipeline-data-correctness.test.ts +794 -0
- package/tests/learning/meta-learner.test.ts +418 -0
- package/tests/learning/pipeline-memory-updates.test.ts +721 -0
- package/tests/learning/unified-pipeline-efficacy.test.ts +232 -0
- package/tests/memory/candidate-retrieval.test.ts +167 -0
- package/tests/memory/compound-engineering-seed.test.ts +338 -0
- package/tests/memory/curated-loader-extended.test.ts +225 -0
- package/tests/memory/meta.test.ts +399 -0
- package/tests/memory/playbook-quality-validation.test.ts +430 -0
- package/tests/memory/source-resolver.test.ts +700 -0
- package/tests/search/evaluator.test.ts +257 -0
- package/tests/search/verification-runner.test.ts +357 -0
- package/tests/utils/error-classifier.test.ts +149 -0
- package/tests/utils/trajectory-helpers.test.ts +163 -0
- package/tests/workspace/efficacy-toolkit.test.ts +404 -0
- package/tests/workspace/templates/playbook-efficacy.test.ts +377 -0
- package/.claude/settings.local.json +0 -11
- package/dist/learning/llm-extractor.d.ts +0 -88
- package/dist/learning/llm-extractor.d.ts.map +0 -1
- package/dist/learning/llm-extractor.js +0 -372
- package/dist/learning/llm-extractor.js.map +0 -1
- package/dist/learning/loop-coordinator.d.ts +0 -61
- package/dist/learning/loop-coordinator.d.ts.map +0 -1
- package/dist/learning/loop-coordinator.js +0 -96
- package/dist/learning/loop-coordinator.js.map +0 -1
- package/references/agent-workspace/CLAUDE.md +0 -74
- package/references/agent-workspace/README.md +0 -587
- package/references/agent-workspace/media/banner.png +0 -0
- package/references/agent-workspace/package-lock.json +0 -2061
- package/references/agent-workspace/package.json +0 -54
- package/references/agent-workspace/src/handle.ts +0 -122
- package/references/agent-workspace/src/index.ts +0 -32
- package/references/agent-workspace/src/manager.ts +0 -102
- package/references/agent-workspace/src/readers/json.ts +0 -71
- package/references/agent-workspace/src/readers/markdown.ts +0 -37
- package/references/agent-workspace/src/readers/raw.ts +0 -27
- package/references/agent-workspace/src/types.ts +0 -68
- package/references/agent-workspace/src/validation.ts +0 -93
- package/references/agent-workspace/src/writers/json.ts +0 -17
- package/references/agent-workspace/src/writers/markdown.ts +0 -27
- package/references/agent-workspace/src/writers/raw.ts +0 -22
- package/references/agent-workspace/tests/errors.test.ts +0 -652
- package/references/agent-workspace/tests/handle.test.ts +0 -144
- package/references/agent-workspace/tests/manager.test.ts +0 -124
- package/references/agent-workspace/tests/readers.test.ts +0 -205
- package/references/agent-workspace/tests/validation.test.ts +0 -196
- package/references/agent-workspace/tests/writers.test.ts +0 -108
- package/references/agent-workspace/tsconfig.json +0 -20
- package/references/agent-workspace/tsup.config.ts +0 -9
- package/references/minimem/.claude/settings.json +0 -7
- package/references/minimem/.sudocode/issues.jsonl +0 -18
- package/references/minimem/.sudocode/specs.jsonl +0 -1
- package/references/minimem/CLAUDE.md +0 -310
- package/references/minimem/README.md +0 -556
- package/references/minimem/claude-plugin/.claude-plugin/plugin.json +0 -10
- package/references/minimem/claude-plugin/.mcp.json +0 -7
- package/references/minimem/claude-plugin/README.md +0 -158
- package/references/minimem/claude-plugin/commands/recall.md +0 -47
- package/references/minimem/claude-plugin/commands/remember.md +0 -41
- package/references/minimem/claude-plugin/hooks/__tests__/hooks.test.ts +0 -272
- package/references/minimem/claude-plugin/hooks/hooks.json +0 -27
- package/references/minimem/claude-plugin/hooks/session-end.sh +0 -86
- package/references/minimem/claude-plugin/hooks/session-start.sh +0 -85
- package/references/minimem/claude-plugin/skills/memory/SKILL.md +0 -108
- package/references/minimem/package-lock.json +0 -5373
- package/references/minimem/package.json +0 -60
- package/references/minimem/scripts/postbuild.js +0 -35
- package/references/minimem/src/__tests__/edge-cases.test.ts +0 -371
- package/references/minimem/src/__tests__/errors.test.ts +0 -265
- package/references/minimem/src/__tests__/helpers.ts +0 -199
- package/references/minimem/src/__tests__/internal.test.ts +0 -407
- package/references/minimem/src/__tests__/knowledge.test.ts +0 -287
- package/references/minimem/src/__tests__/minimem.integration.test.ts +0 -1127
- package/references/minimem/src/__tests__/session.test.ts +0 -190
- package/references/minimem/src/cli/__tests__/commands.test.ts +0 -759
- package/references/minimem/src/cli/commands/__tests__/conflicts.test.ts +0 -141
- package/references/minimem/src/cli/commands/append.ts +0 -76
- package/references/minimem/src/cli/commands/config.ts +0 -262
- package/references/minimem/src/cli/commands/conflicts.ts +0 -413
- package/references/minimem/src/cli/commands/daemon.ts +0 -169
- package/references/minimem/src/cli/commands/index.ts +0 -12
- package/references/minimem/src/cli/commands/init.ts +0 -88
- package/references/minimem/src/cli/commands/mcp.ts +0 -177
- package/references/minimem/src/cli/commands/push-pull.ts +0 -213
- package/references/minimem/src/cli/commands/search.ts +0 -158
- package/references/minimem/src/cli/commands/status.ts +0 -84
- package/references/minimem/src/cli/commands/sync-init.ts +0 -290
- package/references/minimem/src/cli/commands/sync.ts +0 -70
- package/references/minimem/src/cli/commands/upsert.ts +0 -197
- package/references/minimem/src/cli/config.ts +0 -584
- package/references/minimem/src/cli/index.ts +0 -264
- package/references/minimem/src/cli/shared.ts +0 -161
- package/references/minimem/src/cli/sync/__tests__/central.test.ts +0 -152
- package/references/minimem/src/cli/sync/__tests__/conflicts.test.ts +0 -209
- package/references/minimem/src/cli/sync/__tests__/daemon.test.ts +0 -118
- package/references/minimem/src/cli/sync/__tests__/detection.test.ts +0 -207
- package/references/minimem/src/cli/sync/__tests__/integration.test.ts +0 -476
- package/references/minimem/src/cli/sync/__tests__/registry.test.ts +0 -363
- package/references/minimem/src/cli/sync/__tests__/state.test.ts +0 -255
- package/references/minimem/src/cli/sync/__tests__/validation.test.ts +0 -193
- package/references/minimem/src/cli/sync/__tests__/watcher.test.ts +0 -178
- package/references/minimem/src/cli/sync/central.ts +0 -292
- package/references/minimem/src/cli/sync/conflicts.ts +0 -204
- package/references/minimem/src/cli/sync/daemon.ts +0 -407
- package/references/minimem/src/cli/sync/detection.ts +0 -138
- package/references/minimem/src/cli/sync/index.ts +0 -107
- package/references/minimem/src/cli/sync/operations.ts +0 -373
- package/references/minimem/src/cli/sync/registry.ts +0 -279
- package/references/minimem/src/cli/sync/state.ts +0 -355
- package/references/minimem/src/cli/sync/validation.ts +0 -206
- package/references/minimem/src/cli/sync/watcher.ts +0 -234
- package/references/minimem/src/cli/version.ts +0 -34
- package/references/minimem/src/core/index.ts +0 -9
- package/references/minimem/src/core/indexer.ts +0 -628
- package/references/minimem/src/core/searcher.ts +0 -221
- package/references/minimem/src/db/schema.ts +0 -183
- package/references/minimem/src/db/sqlite-vec.ts +0 -24
- package/references/minimem/src/embeddings/__tests__/embeddings.test.ts +0 -431
- package/references/minimem/src/embeddings/batch-gemini.ts +0 -392
- package/references/minimem/src/embeddings/batch-openai.ts +0 -409
- package/references/minimem/src/embeddings/embeddings.ts +0 -434
- package/references/minimem/src/index.ts +0 -109
- package/references/minimem/src/internal.ts +0 -299
- package/references/minimem/src/minimem.ts +0 -1276
- package/references/minimem/src/search/__tests__/hybrid.test.ts +0 -247
- package/references/minimem/src/search/graph.ts +0 -234
- package/references/minimem/src/search/hybrid.ts +0 -151
- package/references/minimem/src/search/search.ts +0 -256
- package/references/minimem/src/server/__tests__/mcp.test.ts +0 -341
- package/references/minimem/src/server/__tests__/tools.test.ts +0 -364
- package/references/minimem/src/server/mcp.ts +0 -326
- package/references/minimem/src/server/tools.ts +0 -720
- package/references/minimem/src/session.ts +0 -460
- package/references/minimem/tsconfig.json +0 -19
- package/references/minimem/tsup.config.ts +0 -26
- package/references/minimem/vitest.config.ts +0 -24
- package/references/sessionlog/.husky/pre-commit +0 -1
- package/references/sessionlog/.lintstagedrc.json +0 -4
- package/references/sessionlog/.prettierignore +0 -4
- package/references/sessionlog/.prettierrc.json +0 -11
- package/references/sessionlog/LICENSE +0 -21
- package/references/sessionlog/README.md +0 -453
- package/references/sessionlog/eslint.config.js +0 -58
- package/references/sessionlog/package-lock.json +0 -3672
- package/references/sessionlog/package.json +0 -65
- package/references/sessionlog/src/__tests__/agent-hooks.test.ts +0 -570
- package/references/sessionlog/src/__tests__/agent-registry.test.ts +0 -127
- package/references/sessionlog/src/__tests__/claude-code-hooks.test.ts +0 -225
- package/references/sessionlog/src/__tests__/claude-generator.test.ts +0 -46
- package/references/sessionlog/src/__tests__/commit-msg.test.ts +0 -86
- package/references/sessionlog/src/__tests__/cursor-agent.test.ts +0 -224
- package/references/sessionlog/src/__tests__/e2e-live.test.ts +0 -890
- package/references/sessionlog/src/__tests__/event-log.test.ts +0 -183
- package/references/sessionlog/src/__tests__/flush-sentinel.test.ts +0 -105
- package/references/sessionlog/src/__tests__/gemini-agent.test.ts +0 -375
- package/references/sessionlog/src/__tests__/git-hooks.test.ts +0 -78
- package/references/sessionlog/src/__tests__/hook-managers.test.ts +0 -121
- package/references/sessionlog/src/__tests__/lifecycle-tasks.test.ts +0 -759
- package/references/sessionlog/src/__tests__/opencode-agent.test.ts +0 -338
- package/references/sessionlog/src/__tests__/redaction.test.ts +0 -136
- package/references/sessionlog/src/__tests__/session-repo.test.ts +0 -353
- package/references/sessionlog/src/__tests__/session-store.test.ts +0 -166
- package/references/sessionlog/src/__tests__/setup-ccweb.test.ts +0 -466
- package/references/sessionlog/src/__tests__/skill-live.test.ts +0 -461
- package/references/sessionlog/src/__tests__/summarize.test.ts +0 -348
- package/references/sessionlog/src/__tests__/task-plan-e2e.test.ts +0 -610
- package/references/sessionlog/src/__tests__/task-plan-live.test.ts +0 -632
- package/references/sessionlog/src/__tests__/transcript-timestamp.test.ts +0 -121
- package/references/sessionlog/src/__tests__/types.test.ts +0 -166
- package/references/sessionlog/src/__tests__/utils.test.ts +0 -333
- package/references/sessionlog/src/__tests__/validation.test.ts +0 -103
- package/references/sessionlog/src/__tests__/worktree.test.ts +0 -57
- package/references/sessionlog/src/agent/agents/claude-code.ts +0 -1089
- package/references/sessionlog/src/agent/agents/cursor.ts +0 -361
- package/references/sessionlog/src/agent/agents/gemini-cli.ts +0 -632
- package/references/sessionlog/src/agent/agents/opencode.ts +0 -540
- package/references/sessionlog/src/agent/registry.ts +0 -143
- package/references/sessionlog/src/agent/session-types.ts +0 -113
- package/references/sessionlog/src/agent/types.ts +0 -220
- package/references/sessionlog/src/cli.ts +0 -597
- package/references/sessionlog/src/commands/clean.ts +0 -133
- package/references/sessionlog/src/commands/disable.ts +0 -84
- package/references/sessionlog/src/commands/doctor.ts +0 -145
- package/references/sessionlog/src/commands/enable.ts +0 -202
- package/references/sessionlog/src/commands/explain.ts +0 -261
- package/references/sessionlog/src/commands/reset.ts +0 -105
- package/references/sessionlog/src/commands/resume.ts +0 -180
- package/references/sessionlog/src/commands/rewind.ts +0 -195
- package/references/sessionlog/src/commands/setup-ccweb.ts +0 -275
- package/references/sessionlog/src/commands/status.ts +0 -172
- package/references/sessionlog/src/config.ts +0 -165
- package/references/sessionlog/src/events/event-log.ts +0 -126
- package/references/sessionlog/src/git-operations.ts +0 -558
- package/references/sessionlog/src/hooks/git-hooks.ts +0 -165
- package/references/sessionlog/src/hooks/lifecycle.ts +0 -391
- package/references/sessionlog/src/index.ts +0 -650
- package/references/sessionlog/src/security/redaction.ts +0 -283
- package/references/sessionlog/src/session/state-machine.ts +0 -452
- package/references/sessionlog/src/store/checkpoint-store.ts +0 -509
- package/references/sessionlog/src/store/native-store.ts +0 -173
- package/references/sessionlog/src/store/provider-types.ts +0 -99
- package/references/sessionlog/src/store/session-store.ts +0 -266
- package/references/sessionlog/src/strategy/attribution.ts +0 -296
- package/references/sessionlog/src/strategy/common.ts +0 -207
- package/references/sessionlog/src/strategy/content-overlap.ts +0 -228
- package/references/sessionlog/src/strategy/manual-commit.ts +0 -988
- package/references/sessionlog/src/strategy/types.ts +0 -279
- package/references/sessionlog/src/summarize/claude-generator.ts +0 -115
- package/references/sessionlog/src/summarize/summarize.ts +0 -432
- package/references/sessionlog/src/types.ts +0 -508
- package/references/sessionlog/src/utils/chunk-files.ts +0 -49
- package/references/sessionlog/src/utils/commit-message.ts +0 -65
- package/references/sessionlog/src/utils/detect-agent.ts +0 -36
- package/references/sessionlog/src/utils/hook-managers.ts +0 -125
- package/references/sessionlog/src/utils/ide-tags.ts +0 -32
- package/references/sessionlog/src/utils/paths.ts +0 -79
- package/references/sessionlog/src/utils/preview-rewind.ts +0 -80
- package/references/sessionlog/src/utils/rewind-conflict.ts +0 -121
- package/references/sessionlog/src/utils/shadow-branch.ts +0 -109
- package/references/sessionlog/src/utils/string-utils.ts +0 -46
- package/references/sessionlog/src/utils/todo-extract.ts +0 -188
- package/references/sessionlog/src/utils/trailers.ts +0 -187
- package/references/sessionlog/src/utils/transcript-parse.ts +0 -177
- package/references/sessionlog/src/utils/transcript-timestamp.ts +0 -59
- package/references/sessionlog/src/utils/tree-ops.ts +0 -219
- package/references/sessionlog/src/utils/tty.ts +0 -72
- package/references/sessionlog/src/utils/validation.ts +0 -65
- package/references/sessionlog/src/utils/worktree.ts +0 -58
- package/references/sessionlog/src/wire-types.ts +0 -59
- package/references/sessionlog/templates/setup-env.sh +0 -153
- package/references/sessionlog/tsconfig.json +0 -18
- package/references/sessionlog/vitest.config.ts +0 -12
- package/references/skill-tree/.claude/settings.json +0 -6
- package/references/skill-tree/.sudocode/issues.jsonl +0 -19
- package/references/skill-tree/.sudocode/specs.jsonl +0 -3
- package/references/skill-tree/CLAUDE.md +0 -126
- package/references/skill-tree/README.md +0 -372
- package/references/skill-tree/docs/GAPS_v1.md +0 -221
- package/references/skill-tree/docs/INTEGRATION_PLAN.md +0 -467
- package/references/skill-tree/docs/TODOS.md +0 -91
- package/references/skill-tree/docs/anthropic_skill_guide.md +0 -1364
- package/references/skill-tree/docs/design/federated-skill-trees.md +0 -524
- package/references/skill-tree/docs/design/multi-agent-sync.md +0 -759
- package/references/skill-tree/docs/scraper/BRAINSTORM.md +0 -583
- package/references/skill-tree/docs/scraper/POC_PLAN.md +0 -420
- package/references/skill-tree/docs/scraper/README.md +0 -170
- package/references/skill-tree/examples/basic-usage.ts +0 -164
- package/references/skill-tree/package-lock.json +0 -1852
- package/references/skill-tree/package.json +0 -66
- package/references/skill-tree/scraper/README.md +0 -123
- package/references/skill-tree/scraper/docs/DESIGN.md +0 -683
- package/references/skill-tree/scraper/docs/PLAN.md +0 -336
- package/references/skill-tree/scraper/drizzle.config.ts +0 -10
- package/references/skill-tree/scraper/package-lock.json +0 -6329
- package/references/skill-tree/scraper/package.json +0 -68
- package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-description.md +0 -7
- package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-name.md +0 -7
- package/references/skill-tree/scraper/test/fixtures/minimal-skill/SKILL.md +0 -27
- package/references/skill-tree/scraper/test/fixtures/skill-json/SKILL.json +0 -21
- package/references/skill-tree/scraper/test/fixtures/skill-with-meta/SKILL.md +0 -54
- package/references/skill-tree/scraper/test/fixtures/skill-with-meta/_meta.json +0 -24
- package/references/skill-tree/scraper/test/fixtures/valid-skill/SKILL.md +0 -93
- package/references/skill-tree/scraper/test/fixtures/valid-skill/_meta.json +0 -22
- package/references/skill-tree/scraper/tsup.config.ts +0 -14
- package/references/skill-tree/scraper/vitest.config.ts +0 -17
- package/references/skill-tree/scripts/convert-to-vitest.ts +0 -166
- package/references/skill-tree/skills/skill-writer/SKILL.md +0 -339
- package/references/skill-tree/skills/skill-writer/references/examples.md +0 -326
- package/references/skill-tree/skills/skill-writer/references/patterns.md +0 -210
- package/references/skill-tree/skills/skill-writer/references/quality-checklist.md +0 -123
- package/references/skill-tree/test/run-all.ts +0 -106
- package/references/skill-tree/test/utils.ts +0 -128
- package/references/skill-tree/vitest.config.ts +0 -16
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "learnings-research",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 3,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Looking up institutional knowledge before starting work",
|
|
10
|
+
"Finding past solutions for similar problems during debugging",
|
|
11
|
+
"Preventing repeated mistakes by surfacing known patterns and gotchas"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"search knowledge",
|
|
15
|
+
"past solutions",
|
|
16
|
+
"known issues",
|
|
17
|
+
"institutional knowledge",
|
|
18
|
+
"what do we know about"
|
|
19
|
+
],
|
|
20
|
+
"antiPatterns": [
|
|
21
|
+
"Searching for information that doesn't exist in the knowledge base yet",
|
|
22
|
+
"Using full-text search as the first step instead of grep-first filtering",
|
|
23
|
+
"Reading all files sequentially instead of parallel keyword search"
|
|
24
|
+
],
|
|
25
|
+
"domains": ["knowledge-management", "research", "debugging"]
|
|
26
|
+
},
|
|
27
|
+
"guidance": {
|
|
28
|
+
"strategy": "Grep-first filtering: extract keywords, narrow by category, run parallel content searches on frontmatter fields, then read only strong/moderate matches. Never read all files — always pre-filter.",
|
|
29
|
+
"tactics": [
|
|
30
|
+
"Extract keywords from the current task/problem description",
|
|
31
|
+
"Category narrowing (if clear): focus on the relevant knowledge subdirectory first",
|
|
32
|
+
"Parallel content-search: search on frontmatter fields (title, tags, module, component) using multiple keywords in parallel; use case-insensitive matching; use OR for synonyms",
|
|
33
|
+
"Score matches into four categories: Strong (module + tags match), Moderate (problem_type relevant + tags), Weak (tangential), None — only read Strong and Moderate",
|
|
34
|
+
"Always check critical-patterns document regardless of grep results — it contains must-know patterns for all work",
|
|
35
|
+
"Distill summaries from matched documents — surface actionable insights, not raw content",
|
|
36
|
+
"Assess overlap on 5 dimensions: problem statement, root cause, solution, referenced files, prevention rules",
|
|
37
|
+
"Run multiple searches in parallel — never sequentially"
|
|
38
|
+
]
|
|
39
|
+
},
|
|
40
|
+
"verification": {
|
|
41
|
+
"successIndicators": [
|
|
42
|
+
"Relevant documents found and ranked by relevance strength",
|
|
43
|
+
"Critical patterns checked and incorporated",
|
|
44
|
+
"Summaries are distilled and actionable (not raw file dumps)",
|
|
45
|
+
"Search used grep-first filtering, not sequential file reading"
|
|
46
|
+
],
|
|
47
|
+
"failureIndicators": [
|
|
48
|
+
"All files read sequentially instead of pre-filtered",
|
|
49
|
+
"Tangentially related entries included, adding noise",
|
|
50
|
+
"Critical patterns document skipped",
|
|
51
|
+
"Searches run sequentially instead of in parallel"
|
|
52
|
+
]
|
|
53
|
+
}
|
|
54
|
+
}
|
|
@@ -0,0 +1,49 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "maintainability-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 3,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing code for long-term carrying cost and maintainability",
|
|
10
|
+
"Evaluating abstractions, indirection, and naming clarity",
|
|
11
|
+
"Checking for dead code, unnecessary coupling, and premature complexity"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"code review",
|
|
15
|
+
"maintainability",
|
|
16
|
+
"complexity",
|
|
17
|
+
"refactoring"
|
|
18
|
+
],
|
|
19
|
+
"antiPatterns": [
|
|
20
|
+
"Reviewing for correctness bugs — use correctness-review instead",
|
|
21
|
+
"Style preferences that don't affect comprehension",
|
|
22
|
+
"Debating naming conventions already established in the codebase"
|
|
23
|
+
],
|
|
24
|
+
"domains": ["code-review", "maintainability", "quality-assurance"]
|
|
25
|
+
},
|
|
26
|
+
"guidance": {
|
|
27
|
+
"strategy": "Apply the future developer lens: will the next person who touches this in 6 months understand it quickly? Every abstraction must earn its keep with 3+ implementations or proven variation.",
|
|
28
|
+
"tactics": [
|
|
29
|
+
"Hunt for: premature abstraction (interface/factory with one user), unnecessary indirection (>2 delegation levels), dead code (commented-out code, unused exports, unreachable code), coupling between unrelated modules, naming that obscures intent",
|
|
30
|
+
"Anti-pattern catalog: generic solution for specific problem, wrapper with no added value, config for unchanging values, unused extension points, circular dependencies, shared mutable state",
|
|
31
|
+
"Abstractions must earn their keep: 3+ implementations or proven variation axis — otherwise inline",
|
|
32
|
+
"Indirection must add clear value: if a function just delegates to another without transformation, it's overhead",
|
|
33
|
+
"Naming describes what, not how: booleans have is/has/should prefixes; functions describe outcome not mechanism",
|
|
34
|
+
"Confidence calibration: HIGH (0.80+) when objectively provable (abstraction has 1 user visible in codebase); MODERATE (0.60-0.79) for naming/abstraction boundary judgments; suppress below 0.60 for style preferences"
|
|
35
|
+
]
|
|
36
|
+
},
|
|
37
|
+
"verification": {
|
|
38
|
+
"successIndicators": [
|
|
39
|
+
"All flagged abstractions are objectively underused (provable from codebase search)",
|
|
40
|
+
"Indirection findings show concrete delegation chain with no value-add",
|
|
41
|
+
"Dead code findings are verifiable via search (no callers/importers)"
|
|
42
|
+
],
|
|
43
|
+
"failureIndicators": [
|
|
44
|
+
"Finding is really a style preference, not a maintainability concern",
|
|
45
|
+
"Abstraction flagged as premature but actually has 3+ users",
|
|
46
|
+
"Naming critique is subjective rather than clarity-impacting"
|
|
47
|
+
]
|
|
48
|
+
}
|
|
49
|
+
}
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "performance-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 4,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing code that touches database queries, loops, caching, or I/O-intensive paths",
|
|
10
|
+
"Evaluating scalability of new features at 10x/100x/1000x current data volumes",
|
|
11
|
+
"Checking for production-observable performance regressions"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"performance review",
|
|
15
|
+
"N+1 query",
|
|
16
|
+
"slow query",
|
|
17
|
+
"memory leak",
|
|
18
|
+
"pagination",
|
|
19
|
+
"caching"
|
|
20
|
+
],
|
|
21
|
+
"antiPatterns": [
|
|
22
|
+
"Micro-optimizations in cold paths (startup, migrations, admin tools, one-time initialization)",
|
|
23
|
+
"Premature caching suggestions without evidence of actual slowness",
|
|
24
|
+
"Theoretical scale issues in MVP/prototype code",
|
|
25
|
+
"Style-based performance opinions (for vs forEach, Map vs plain object)"
|
|
26
|
+
],
|
|
27
|
+
"domains": ["code-review", "performance", "quality-assurance"]
|
|
28
|
+
},
|
|
29
|
+
"guidance": {
|
|
30
|
+
"strategy": "Read code through the lens of 'what happens when this runs 10,000 times' or 'when the table has a million rows'. Focus on measurable, production-observable problems — not theoretical micro-optimizations. Project performance at 10x, 100x, and 1000x current volumes.",
|
|
31
|
+
"tactics": [
|
|
32
|
+
"N+1 queries: flag database queries inside loops that should be batched or eager-loaded; count loop iterations against expected data size",
|
|
33
|
+
"Unbounded memory: flag loading entire tables without pagination, caches without eviction policies, string concatenation in loops, large object allocations",
|
|
34
|
+
"Missing pagination: flag endpoints returning all results without limit/offset/cursor/streaming",
|
|
35
|
+
"Hot-path allocations: flag object creation, regex compilation, or expensive computation inside loops or per-request paths",
|
|
36
|
+
"Blocking I/O in async: flag synchronous file reads, blocking HTTP calls, CPU-intensive computation on the event loop",
|
|
37
|
+
"Algorithmic complexity: flag O(n^2) or worse without justification; verify all database queries use appropriate indexes",
|
|
38
|
+
"Performance benchmarks: API responses under 200ms for standard operations, bundle size increases under 5KB per feature, background jobs process in batches",
|
|
39
|
+
"Confidence calibration: HIGH (0.80+) when impact is provable from code (N+1 clearly in loop, unbounded query on large table); MODERATE (0.60-0.79) when pattern present but impact depends on unconfirmed data size; suppress below 0.60"
|
|
40
|
+
]
|
|
41
|
+
},
|
|
42
|
+
"verification": {
|
|
43
|
+
"successIndicators": [
|
|
44
|
+
"Each finding identifies a specific code path with measurable impact at expected scale",
|
|
45
|
+
"N+1 findings show the loop and the query inside it",
|
|
46
|
+
"No micro-optimization findings on cold paths"
|
|
47
|
+
],
|
|
48
|
+
"failureIndicators": [
|
|
49
|
+
"Finding is speculative optimization without evidence of hot path",
|
|
50
|
+
"Caching recommendation without evidence of repeated expensive computation",
|
|
51
|
+
"Flagging cold-path code (startup, migrations) for performance"
|
|
52
|
+
]
|
|
53
|
+
}
|
|
54
|
+
}
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "plan-adversarial-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.8,
|
|
5
|
+
"complexity": "complex",
|
|
6
|
+
"estimatedEffort": 5,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing implementation plans or requirement documents before execution",
|
|
10
|
+
"Stress-testing planning assumptions, premises, and scope decisions",
|
|
11
|
+
"Catching contradictions, scope creep, and unstated assumptions in plans"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"review plan",
|
|
15
|
+
"plan review",
|
|
16
|
+
"challenge assumptions",
|
|
17
|
+
"scope review",
|
|
18
|
+
"requirements review"
|
|
19
|
+
],
|
|
20
|
+
"antiPatterns": [
|
|
21
|
+
"Implementation style or technology selection choices",
|
|
22
|
+
"Product strategy or priority preferences",
|
|
23
|
+
"Security, design, or feasibility concerns (use plan-feasibility-review instead)",
|
|
24
|
+
"The plan is already in execution — too late for adversarial review"
|
|
25
|
+
],
|
|
26
|
+
"domains": ["planning", "requirements", "quality-assurance"]
|
|
27
|
+
},
|
|
28
|
+
"guidance": {
|
|
29
|
+
"strategy": "Challenge premises before solutions. Surface unstated assumptions. Stress-test decisions for reversal cost. Check for internal contradictions and scope-goal misalignment. Apply three lenses: adversarial (break assumptions), coherence (internal consistency), and scope guardian (right-sized).",
|
|
30
|
+
"tactics": [
|
|
31
|
+
"Premise challenging: Is this the right problem? Does the solution match the problem? What if we did nothing? What would make this fail? Surface framing effects that bias toward one solution",
|
|
32
|
+
"Assumption surfacing: identify environmental assumptions (infrastructure exists, APIs stable), user behavior assumptions (adoption, usage patterns), scale assumptions (data volume, concurrency), temporal assumptions (availability, ordering)",
|
|
33
|
+
"Decision stress-testing: for each major decision, apply falsification test (what evidence would prove this wrong?), reversal cost (how expensive to change later?), and decision-scope mismatch (is decision bigger/smaller than the problem?)",
|
|
34
|
+
"Simplification pressure: audit abstractions (how many consumers?), find minimum viable version, apply subtraction test (remove each component — does plan still work?), enforce complexity budget",
|
|
35
|
+
"Coherence checking: catch contradictions between sections, terminology drift (same concept with different names), forward references to undefined terms, ungrouped requirements spanning multiple concerns",
|
|
36
|
+
"Scope-goal alignment: flag scope exceeding goals (building more than needed), goals exceeding scope (promising more than plan delivers), new abstractions with one implementation, framework-ahead-of-need, configuration without consumers",
|
|
37
|
+
"Alternative blindness: check for omitted alternatives, build-vs-use analysis, do-nothing baseline comparison",
|
|
38
|
+
"Depth calibration: Quick (short docs, <5 requirements) = max 3 findings; Standard = proportional to decision density; Deep (>10 requirements, high-stakes) = multiple passes with assumption chain tracing",
|
|
39
|
+
"Confidence calibration: HIGH (0.80+) when specific text can be quoted showing gap; MODERATE (0.60-0.79) when gap likely but requires context not in document; suppress below 0.50"
|
|
40
|
+
]
|
|
41
|
+
},
|
|
42
|
+
"verification": {
|
|
43
|
+
"successIndicators": [
|
|
44
|
+
"Findings quote specific text from the plan showing the gap or contradiction",
|
|
45
|
+
"Assumptions surfaced are testable and actionable",
|
|
46
|
+
"Scope-goal alignment checked with concrete evidence",
|
|
47
|
+
"No findings that belong to feasibility, security, or design review"
|
|
48
|
+
],
|
|
49
|
+
"failureIndicators": [
|
|
50
|
+
"Findings are vague concerns without quoting specific plan text",
|
|
51
|
+
"Assumptions identified are untestable or irrelevant",
|
|
52
|
+
"Scope opinions based on preference rather than goal alignment",
|
|
53
|
+
"Contradictions flagged that are reconcilable with charitable reading"
|
|
54
|
+
]
|
|
55
|
+
}
|
|
56
|
+
}
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "plan-feasibility-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.8,
|
|
5
|
+
"complexity": "complex",
|
|
6
|
+
"estimatedEffort": 5,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Evaluating technical feasibility of implementation plans",
|
|
10
|
+
"Checking product-market fit and strategic alignment of proposed features",
|
|
11
|
+
"Reviewing plans for security gaps, design completeness, and migration safety"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"feasibility review",
|
|
15
|
+
"plan feasibility",
|
|
16
|
+
"technical review",
|
|
17
|
+
"can we build this",
|
|
18
|
+
"is this plan viable"
|
|
19
|
+
],
|
|
20
|
+
"antiPatterns": [
|
|
21
|
+
"Implementation style choices that don't affect feasibility",
|
|
22
|
+
"Code organization preferences",
|
|
23
|
+
"Theoretical scalability without evidence",
|
|
24
|
+
"Scope or assumption concerns (use plan-adversarial-review instead)"
|
|
25
|
+
],
|
|
26
|
+
"domains": ["planning", "architecture", "quality-assurance"]
|
|
27
|
+
},
|
|
28
|
+
"guidance": {
|
|
29
|
+
"strategy": "Evaluate plans across four dimensions: technical feasibility (can we build it?), product fit (should we build it?), security readiness (is it safe?), and design completeness (is it specified enough?). Each dimension has a distinct lens.",
|
|
30
|
+
"tactics": [
|
|
31
|
+
"Technical feasibility: verify plan acknowledges existing code/services/infrastructure; check for architecture conflicts with current stack; validate that referenced file paths and interfaces actually exist; check framework compatibility",
|
|
32
|
+
"Shadow path tracing: for each feature, trace the happy path, nil/empty input path, error path, and concurrent access path — plans that only cover happy path will fail in implementation",
|
|
33
|
+
"Migration safety: verify concrete migration path (not 'migrate later'), backward compatibility during rollout, rollback strategy, data volume estimates, and operation ordering",
|
|
34
|
+
"Product lens: challenge the premise — is this the right problem? What's the actual outcome? What happens if we do nothing? Is there an 80% value at 20% cost alternative? Check goal-requirement alignment (orphan requirements, unserved goals)",
|
|
35
|
+
"Security lens: inventory attack surfaces (endpoints, data stores, integrations, user inputs), check auth/authz per endpoint, identify sensitive data flows, assess third-party trust boundaries, outline top-3 threat model (most likely, highest impact, most subtle exploit)",
|
|
36
|
+
"Design completeness: check interaction state coverage (loading, empty, error, success, partial for every interactive element), user flow completeness (entry points, happy path, 2-3 edge cases, exit points), responsive/accessibility considerations",
|
|
37
|
+
"Dependency analysis: verify external dependencies are available and compatible; identify implicit assumptions about infrastructure, APIs, or services",
|
|
38
|
+
"Performance feasibility: back-of-envelope math for expected load, data volumes, and response time requirements",
|
|
39
|
+
"Confidence calibration: HIGH (0.80+) when specific technical constraint blocks the approach; MODERATE (0.60-0.79) when constraint likely but depends on implementation details; suppress below 0.50"
|
|
40
|
+
]
|
|
41
|
+
},
|
|
42
|
+
"verification": {
|
|
43
|
+
"successIndicators": [
|
|
44
|
+
"Technical blockers identified with specific evidence (missing API, framework incompatibility)",
|
|
45
|
+
"Shadow paths traced — plan covers more than just the happy path",
|
|
46
|
+
"Security attack surfaces inventoried with mitigation gaps flagged",
|
|
47
|
+
"Product alignment verified — goals trace to requirements"
|
|
48
|
+
],
|
|
49
|
+
"failureIndicators": [
|
|
50
|
+
"Feasibility concerns are vague without specific technical evidence",
|
|
51
|
+
"Only happy path evaluated — error/empty/concurrent paths ignored",
|
|
52
|
+
"Security review is generic OWASP checklist without plan-specific analysis",
|
|
53
|
+
"Product concerns are preference-based rather than goal-alignment-based"
|
|
54
|
+
]
|
|
55
|
+
}
|
|
56
|
+
}
|
|
@@ -0,0 +1,52 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "project-standards-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "simple",
|
|
6
|
+
"estimatedEffort": 2,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing changes for compliance with the project's own standards (CLAUDE.md, AGENTS.md, contributing guides)",
|
|
10
|
+
"Enforcing naming conventions, file placement, and configuration rules",
|
|
11
|
+
"Auditing changes against established project conventions"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"standards review",
|
|
15
|
+
"convention check",
|
|
16
|
+
"CLAUDE.md compliance",
|
|
17
|
+
"project rules"
|
|
18
|
+
],
|
|
19
|
+
"antiPatterns": [
|
|
20
|
+
"Rules that don't apply to the changed file type",
|
|
21
|
+
"Violations already caught by automated linters or CI",
|
|
22
|
+
"Pre-existing violations in unchanged code",
|
|
23
|
+
"Generic best practices not documented in the project's standards files",
|
|
24
|
+
"Opinions about quality of the standards themselves"
|
|
25
|
+
],
|
|
26
|
+
"domains": ["code-review", "standards", "quality-assurance"]
|
|
27
|
+
},
|
|
28
|
+
"guidance": {
|
|
29
|
+
"strategy": "Audit changes against the project's own documented standards. Every finding must cite a specific rule from the standards file AND a specific violation in the diff. Without both, drop the finding.",
|
|
30
|
+
"tactics": [
|
|
31
|
+
"Discover standards: read CLAUDE.md, AGENTS.md, and any contributing/convention files in the changed file's ancestor directories",
|
|
32
|
+
"Match rules to file types: only apply rules relevant to the specific files being changed",
|
|
33
|
+
"Evidence requirement: for each finding, provide (1) exact quote/section from standards file defining the rule, and (2) specific line(s) in diff violating the rule",
|
|
34
|
+
"Common violations: missing required frontmatter fields, names not matching directory/file names, wrong reference inclusion mode, shell commands where native tools are required, misplaced files in wrong directories",
|
|
35
|
+
"Language violations: second-person 'you should' where standards require imperative form, hedge words (might/could/consider) leaving behavior undefined",
|
|
36
|
+
"Protected artifacts: never flag documented protected paths (docs/, plans/, solutions/) for deletion",
|
|
37
|
+
"Confidence calibration: HIGH (0.80+) when specific rule quote and specific diff violation are both identifiable; MODERATE (0.60-0.79) when rule exists but applying it requires judgment; suppress below 0.60"
|
|
38
|
+
]
|
|
39
|
+
},
|
|
40
|
+
"verification": {
|
|
41
|
+
"successIndicators": [
|
|
42
|
+
"Every finding cites both the rule source and the specific violation",
|
|
43
|
+
"Only rules from the project's actual standards files are enforced",
|
|
44
|
+
"No findings about unchanged code or generic best practices"
|
|
45
|
+
],
|
|
46
|
+
"failureIndicators": [
|
|
47
|
+
"Finding enforces a rule not documented in any standards file",
|
|
48
|
+
"Finding about pre-existing code that wasn't changed in this diff",
|
|
49
|
+
"Generic best practice advice without project-specific rule citation"
|
|
50
|
+
]
|
|
51
|
+
}
|
|
52
|
+
}
|
|
@@ -0,0 +1,53 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "reliability-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 4,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing code with external dependencies, I/O boundaries, or error handling",
|
|
10
|
+
"Evaluating failure modes, retry logic, and cascading failure paths",
|
|
11
|
+
"Checking resilience of services that depend on other services"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"reliability review",
|
|
15
|
+
"error handling",
|
|
16
|
+
"retry",
|
|
17
|
+
"timeout",
|
|
18
|
+
"circuit breaker",
|
|
19
|
+
"cascade failure"
|
|
20
|
+
],
|
|
21
|
+
"antiPatterns": [
|
|
22
|
+
"Flagging internal pure functions that cannot fail (string formatting, math, in-memory transforms)",
|
|
23
|
+
"Test helper error handling",
|
|
24
|
+
"Error message formatting choices",
|
|
25
|
+
"Theoretical cascading failures without traceable evidence"
|
|
26
|
+
],
|
|
27
|
+
"domains": ["code-review", "reliability", "quality-assurance"]
|
|
28
|
+
},
|
|
29
|
+
"guidance": {
|
|
30
|
+
"strategy": "Ask 'what happens when this dependency is down?' for every external call. Think about partial failures, retry storms, and cascading timeouts. Read code by assuming the environment can be hostile.",
|
|
31
|
+
"tactics": [
|
|
32
|
+
"Missing error handling on I/O boundaries: flag HTTP calls, database queries, file operations, and message queue interactions without try/catch or error callbacks",
|
|
33
|
+
"Retry loops without backoff/limits: immediate indefinite retries create retry storms — require exponential backoff and max attempt limits",
|
|
34
|
+
"Missing timeouts on external calls: HTTP clients, database connections, and RPC without explicit timeouts can hang indefinitely and exhaust connection pools",
|
|
35
|
+
"Error swallowing: flag catch blocks that ignore errors, silent failures that return misleading defaults, and error handlers that don't log or propagate",
|
|
36
|
+
"Cascading failure paths: trace how failure in service A causes B to retry aggressively, overloading C; how slow dependencies fill request queues causing health check failures, restarts, and cold-start storms",
|
|
37
|
+
"Recovery-induced failures: retries creating duplicates, rollbacks leaving orphaned state, circuit breakers preventing legitimate recovery",
|
|
38
|
+
"Confidence calibration: HIGH (0.80+) when reliability gap is directly visible (HTTP call without timeout, retry without max attempts, catch swallowing error); MODERATE (0.60-0.79) when code lacks protection but framework defaults might handle it; suppress below 0.60"
|
|
39
|
+
]
|
|
40
|
+
},
|
|
41
|
+
"verification": {
|
|
42
|
+
"successIndicators": [
|
|
43
|
+
"Each finding points to a specific I/O boundary without protection",
|
|
44
|
+
"Retry findings show the loop and its missing backoff/limit",
|
|
45
|
+
"Cascade findings trace the multi-service failure chain"
|
|
46
|
+
],
|
|
47
|
+
"failureIndicators": [
|
|
48
|
+
"Flagging pure functions or in-memory operations for error handling",
|
|
49
|
+
"Missing that framework middleware already handles the concern",
|
|
50
|
+
"Architectural concerns that can't be confirmed from the diff"
|
|
51
|
+
]
|
|
52
|
+
}
|
|
53
|
+
}
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "review-orchestration",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.8,
|
|
5
|
+
"complexity": "complex",
|
|
6
|
+
"estimatedEffort": 8,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Code review before creating a PR",
|
|
10
|
+
"Reviewing changes after completing a task during iterative implementation",
|
|
11
|
+
"Structured multi-persona code review for quality assurance"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"review code",
|
|
15
|
+
"code review",
|
|
16
|
+
"check changes",
|
|
17
|
+
"pre-PR review"
|
|
18
|
+
],
|
|
19
|
+
"antiPatterns": [
|
|
20
|
+
"Reviewing trivial formatting-only changes",
|
|
21
|
+
"Reviewing auto-generated code that will be regenerated",
|
|
22
|
+
"Single-line config changes that don't affect behavior"
|
|
23
|
+
],
|
|
24
|
+
"domains": ["code-review", "quality-assurance", "software-engineering"]
|
|
25
|
+
},
|
|
26
|
+
"guidance": {
|
|
27
|
+
"strategy": "Deploy tiered reviewer personas in parallel, then merge and deduplicate findings. Always-on reviewers run on every review; conditional reviewers are selected based on the diff content.",
|
|
28
|
+
"tactics": [
|
|
29
|
+
"Always-on reviewers: correctness (logic bugs), testing (coverage gaps), maintainability (coupling/complexity), project-standards (convention compliance), agent-native (action/context parity), learnings-researcher (institutional knowledge)",
|
|
30
|
+
"Conditional reviewers selected per-diff: security (auth/injection), performance (N+1/memory), API-contract (breaking changes), data-migrations (schema safety), reliability (error handling), adversarial (edge cases), stack-specific language reviewers",
|
|
31
|
+
"Each reviewer returns structured findings with severity (P0-P3), confidence (0.0-1.0), and autofix_class (safe_auto/gated_auto/manual/advisory)",
|
|
32
|
+
"Suppress all findings below 0.60 confidence to prevent noise",
|
|
33
|
+
"Merge/deduplicate findings by fingerprint: (file + line_bucket +/- 3 lines + normalized_title). On conflict, keep highest severity and strongest confidence",
|
|
34
|
+
"Route actions by class: safe_auto findings get auto-fixed; gated_auto/manual findings go to human review; advisory findings are informational only",
|
|
35
|
+
"Maximum 2 rounds of autofix to prevent loops"
|
|
36
|
+
],
|
|
37
|
+
"steps": [
|
|
38
|
+
"1. Detect scope of changes (files, languages, domains affected)",
|
|
39
|
+
"2. Discover intent from commit messages, PR description, or task context",
|
|
40
|
+
"3. Select conditional reviewers based on scope (security for auth files, performance for queries, etc.)",
|
|
41
|
+
"4. Dispatch all selected reviewers in parallel — each reads the diff independently",
|
|
42
|
+
"5. Collect structured JSON findings from all reviewers",
|
|
43
|
+
"6. Merge findings: deduplicate by fingerprint, resolve severity conflicts conservatively",
|
|
44
|
+
"7. Synthesize final report with verdict: Ready / Ready with fixes / Not ready"
|
|
45
|
+
]
|
|
46
|
+
},
|
|
47
|
+
"verification": {
|
|
48
|
+
"successIndicators": [
|
|
49
|
+
"All P0 findings are genuine breakage traceable to specific code paths",
|
|
50
|
+
"Line numbers point to exact buggy code, not nearby lines",
|
|
51
|
+
"Each finding is actionable with a clear fix path",
|
|
52
|
+
"No false positives from style issues that linters catch",
|
|
53
|
+
"Deduplication produces no redundant findings"
|
|
54
|
+
],
|
|
55
|
+
"failureIndicators": [
|
|
56
|
+
"P0 findings that are actually style nits",
|
|
57
|
+
"False positives exceeding 20% of total findings",
|
|
58
|
+
"Same issue reported multiple times after deduplication",
|
|
59
|
+
"Findings that require runtime observation to confirm (not provable from code)",
|
|
60
|
+
"Protected artifacts (docs, plans, brainstorms) flagged for deletion"
|
|
61
|
+
],
|
|
62
|
+
"rollbackStrategy": "Review findings are advisory — no code changes until human approval (except safe_auto in autofix mode)"
|
|
63
|
+
}
|
|
64
|
+
}
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "security-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 4,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing code changes that touch auth, user input, public endpoints, or permissions",
|
|
10
|
+
"Auditing for exploitable vulnerabilities before deployment",
|
|
11
|
+
"Systematic OWASP Top 10 compliance checking"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"security review",
|
|
15
|
+
"auth",
|
|
16
|
+
"injection",
|
|
17
|
+
"XSS",
|
|
18
|
+
"CSRF",
|
|
19
|
+
"user input",
|
|
20
|
+
"public endpoint"
|
|
21
|
+
],
|
|
22
|
+
"antiPatterns": [
|
|
23
|
+
"Defense-in-depth on already-protected code",
|
|
24
|
+
"Theoretical attacks requiring physical access",
|
|
25
|
+
"HTTP vs HTTPS in dev/test configs",
|
|
26
|
+
"Generic hardening advice without specific exploitable findings"
|
|
27
|
+
],
|
|
28
|
+
"domains": ["code-review", "security", "quality-assurance"]
|
|
29
|
+
},
|
|
30
|
+
"guidance": {
|
|
31
|
+
"strategy": "Think like an attacker looking for one exploitable path through the code. Trace data from entry point to dangerous sink. Combine targeted attack-path analysis with systematic OWASP Top 10 coverage.",
|
|
32
|
+
"tactics": [
|
|
33
|
+
"Injection vectors: trace untrusted input to SQL, XSS, shell commands, template engines, innerHTML/dangerouslySetInnerHTML — flag when no sanitization between entry and sink",
|
|
34
|
+
"Auth/authz bypasses: check for missing auth middleware, broken ownership checks (user A accessing user B's resources), privilege escalation, CSRF on state-changing endpoints",
|
|
35
|
+
"Secrets exposure: scan for hardcoded keys/tokens/passwords, sensitive data in error messages or logs, PII in responses without need-to-know filtering",
|
|
36
|
+
"Insecure deserialization: flag pickle, Marshal, unserialize, JSON.parse of executable content from untrusted sources",
|
|
37
|
+
"SSRF and path traversal: flag user-controlled URLs or file paths passed to fetch/open without allowlist validation",
|
|
38
|
+
"Systematic OWASP Top 10 check: input validation on all entry points (req.body, req.params, req.query), SQL parameterization, XSS escaping + CSP headers, auth on all endpoints, encryption for sensitive data at rest and in transit",
|
|
39
|
+
"Confidence calibration: HIGH (0.80+) when full attack path is traceable from untrusted input to dangerous sink without sanitization; MODERATE (0.60-0.79) when dangerous pattern present but exploitability unconfirmed; suppress below 0.60"
|
|
40
|
+
]
|
|
41
|
+
},
|
|
42
|
+
"verification": {
|
|
43
|
+
"successIndicators": [
|
|
44
|
+
"Each finding traces a complete attack path: untrusted input → specific code path → exploitable outcome",
|
|
45
|
+
"No false positives from already-protected code or dev-only configs",
|
|
46
|
+
"OWASP categories systematically checked, not just obvious injection"
|
|
47
|
+
],
|
|
48
|
+
"failureIndicators": [
|
|
49
|
+
"Finding requires physical access or internal-only network to exploit",
|
|
50
|
+
"Generic 'could be vulnerable' without tracing specific input to specific sink",
|
|
51
|
+
"Flagging defense-in-depth that's already behind validated auth"
|
|
52
|
+
]
|
|
53
|
+
}
|
|
54
|
+
}
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "systematic-execution",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.8,
|
|
5
|
+
"complexity": "complex",
|
|
6
|
+
"estimatedEffort": 10,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Executing an implementation plan systematically",
|
|
10
|
+
"Shipping a feature with testing, review, and quality gates",
|
|
11
|
+
"Multi-unit implementation requiring incremental progress and verification"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"execute plan",
|
|
15
|
+
"start work",
|
|
16
|
+
"implement this",
|
|
17
|
+
"ship feature"
|
|
18
|
+
],
|
|
19
|
+
"antiPatterns": [
|
|
20
|
+
"No plan exists — create one first",
|
|
21
|
+
"Exploratory work where requirements aren't defined",
|
|
22
|
+
"Hotfix that needs to ship immediately without full process"
|
|
23
|
+
],
|
|
24
|
+
"domains": ["execution", "implementation", "software-engineering"]
|
|
25
|
+
},
|
|
26
|
+
"guidance": {
|
|
27
|
+
"strategy": "Treat the plan as a decision artifact, not an instruction script. Execute implementation units in dependency order, testing continuously, with incremental commits after each logical unit. Simplify after every 2-3 units.",
|
|
28
|
+
"tactics": [
|
|
29
|
+
"Read plan's Implementation Units; honor execution posture (test-first, characterization-first) when annotated; check 'Deferred to Implementation' questions before starting",
|
|
30
|
+
"Strategy selection by scale: inline (1-2 small tasks), serial subagents (3+ with dependencies), parallel subagents (3+ independent), swarm (10+ with coordination)",
|
|
31
|
+
"Test as you go, not at end: run tests after each significant change; never batch testing to the end",
|
|
32
|
+
"System-wide test check before marking task done: trace callbacks/middleware/observers two levels out; write integration tests with real objects through full chain; verify failure doesn't leave orphaned state; check if other interfaces expose same behavior",
|
|
33
|
+
"Incremental commits after each complete logical unit — messages describe complete valuable changes, not WIP",
|
|
34
|
+
"Simplify after every 2-3 units: review changed files for consolidation opportunities, dead code, naming improvements",
|
|
35
|
+
"Pattern following discipline: read referenced files from plan before implementing — don't invent new conventions",
|
|
36
|
+
"Feature completeness first: don't move to next feature until current one ships"
|
|
37
|
+
],
|
|
38
|
+
"steps": [
|
|
39
|
+
"1. Read plan, clarify any ambiguities, set up environment",
|
|
40
|
+
"2. Create task tracking for all implementation units",
|
|
41
|
+
"3. Execute units in dependency order: implement → test → verify → commit",
|
|
42
|
+
"4. After every 2-3 units, review for simplification opportunities",
|
|
43
|
+
"5. Run quality checks: tests pass, linting passes, code follows existing patterns",
|
|
44
|
+
"6. Prepare PR: summary (what/why/decisions), testing notes, post-deploy monitoring plan",
|
|
45
|
+
"7. Update plan status"
|
|
46
|
+
]
|
|
47
|
+
},
|
|
48
|
+
"verification": {
|
|
49
|
+
"successIndicators": [
|
|
50
|
+
"All implementation units completed and tested",
|
|
51
|
+
"Tests pass and linting passes",
|
|
52
|
+
"Code follows existing patterns — no new conventions invented",
|
|
53
|
+
"Each commit describes a complete valuable change",
|
|
54
|
+
"PR includes post-deploy monitoring plan with concrete metrics"
|
|
55
|
+
],
|
|
56
|
+
"failureIndicators": [
|
|
57
|
+
"Tests batched to end and found late-breaking issues",
|
|
58
|
+
"New conventions invented instead of following existing patterns",
|
|
59
|
+
"Commits contain WIP or incomplete changes",
|
|
60
|
+
"Feature moved on before current one fully shipped",
|
|
61
|
+
"System-wide test check skipped for code with callbacks or error handling"
|
|
62
|
+
]
|
|
63
|
+
}
|
|
64
|
+
}
|
|
@@ -0,0 +1,50 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "testing-review",
|
|
3
|
+
"curatedBy": "compound-engineering",
|
|
4
|
+
"confidence": 0.85,
|
|
5
|
+
"complexity": "moderate",
|
|
6
|
+
"estimatedEffort": 3,
|
|
7
|
+
"applicability": {
|
|
8
|
+
"situations": [
|
|
9
|
+
"Reviewing test quality and coverage for code changes",
|
|
10
|
+
"Evaluating whether tests prove code works or provide false confidence",
|
|
11
|
+
"Checking for untested branches, weak assertions, and missing error paths"
|
|
12
|
+
],
|
|
13
|
+
"triggers": [
|
|
14
|
+
"code review",
|
|
15
|
+
"test coverage",
|
|
16
|
+
"test quality",
|
|
17
|
+
"missing tests"
|
|
18
|
+
],
|
|
19
|
+
"antiPatterns": [
|
|
20
|
+
"Reviewing test infrastructure or test framework setup",
|
|
21
|
+
"Evaluating test performance or execution speed",
|
|
22
|
+
"Coverage percentage targets without considering test quality"
|
|
23
|
+
],
|
|
24
|
+
"domains": ["code-review", "testing", "quality-assurance"]
|
|
25
|
+
},
|
|
26
|
+
"guidance": {
|
|
27
|
+
"strategy": "For every new branch (if/else/switch/try/catch) in the diff, verify at least one test exercises it. Focus on whether tests prove behavior, not just that code doesn't throw.",
|
|
28
|
+
"tactics": [
|
|
29
|
+
"Hunt for: untested branches (new if/else/switch/try/catch), tests that don't assert behavior (only assert 'doesn't throw'), implementation-coupled brittle tests (assert on mocks, test private methods, snapshot internals), missing error path coverage",
|
|
30
|
+
"Branch coverage discipline: each new branch must have at least one test; trace all paths through the new code",
|
|
31
|
+
"Behavior assertion rigor: assert specific values not just truthiness; verify both happy path AND sad path",
|
|
32
|
+
"Check that error paths are tested: catch blocks, fallback branches, error returns should have dedicated tests",
|
|
33
|
+
"Flag implementation-coupled tests: tests that break when refactoring without behavior change are brittle",
|
|
34
|
+
"Confidence calibration: HIGH (0.80+) when test gap is provable from diff (new branch, no test); MODERATE (0.60-0.79) when inferred from structure (parser.ts with no parser.test.ts); suppress below 0.60 when coverage may exist in integration tests"
|
|
35
|
+
]
|
|
36
|
+
},
|
|
37
|
+
"verification": {
|
|
38
|
+
"successIndicators": [
|
|
39
|
+
"All new branches have corresponding test cases",
|
|
40
|
+
"Tests assert actual behavior with specific expected values",
|
|
41
|
+
"Error paths have dedicated tests, not just happy path",
|
|
42
|
+
"No implementation-coupled brittleness identified"
|
|
43
|
+
],
|
|
44
|
+
"failureIndicators": [
|
|
45
|
+
"New branches found without any test coverage",
|
|
46
|
+
"Tests only assert 'doesn't throw' or truthiness without checking values",
|
|
47
|
+
"Error handling code has no test exercising the error path"
|
|
48
|
+
]
|
|
49
|
+
}
|
|
50
|
+
}
|