npm - cognitive-core - Versions diffs - 0.2.0 → 0.2.2 - Mend

cognitive-core 0.2.0 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (397) hide show

package/.claude/settings.json +111 -2
package/.sessionlog/settings.json +4 -0
package/dist/atlas.d.ts +10 -0
package/dist/atlas.d.ts.map +1 -1
package/dist/atlas.js +65 -0
package/dist/atlas.js.map +1 -1
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +5 -1
package/dist/index.js.map +1 -1
package/dist/learning/index.d.ts +1 -1
package/dist/learning/index.d.ts.map +1 -1
package/dist/learning/index.js.map +1 -1
package/dist/learning/pipeline.d.ts +4 -31
package/dist/learning/pipeline.d.ts.map +1 -1
package/dist/learning/pipeline.js +12 -64
package/dist/learning/pipeline.js.map +1 -1
package/dist/learning/unified-pipeline.d.ts +30 -0
package/dist/learning/unified-pipeline.d.ts.map +1 -1
package/dist/learning/unified-pipeline.js +207 -0
package/dist/learning/unified-pipeline.js.map +1 -1
package/dist/memory/candidate-retrieval.d.ts.map +1 -1
package/dist/memory/candidate-retrieval.js +3 -1
package/dist/memory/candidate-retrieval.js.map +1 -1
package/dist/memory/curated-loader.d.ts +21 -4
package/dist/memory/curated-loader.d.ts.map +1 -1
package/dist/memory/curated-loader.js +53 -16
package/dist/memory/curated-loader.js.map +1 -1
package/dist/memory/index.d.ts +2 -1
package/dist/memory/index.d.ts.map +1 -1
package/dist/memory/index.js +3 -1
package/dist/memory/index.js.map +1 -1
package/dist/memory/playbook.d.ts +6 -0
package/dist/memory/playbook.d.ts.map +1 -1
package/dist/memory/playbook.js +15 -0
package/dist/memory/playbook.js.map +1 -1
package/dist/memory/source-resolver.d.ts +120 -0
package/dist/memory/source-resolver.d.ts.map +1 -0
package/dist/memory/source-resolver.js +300 -0
package/dist/memory/source-resolver.js.map +1 -0
package/dist/types/config.d.ts +141 -0
package/dist/types/config.d.ts.map +1 -1
package/dist/types/config.js +40 -0
package/dist/types/config.js.map +1 -1
package/dist/types/index.d.ts +1 -1
package/dist/types/index.d.ts.map +1 -1
package/dist/types/index.js +1 -1
package/dist/types/index.js.map +1 -1
package/dist/utils/error-classifier.js +8 -8
package/dist/utils/error-classifier.js.map +1 -1
package/dist/workspace/efficacy-toolkit.d.ts +164 -0
package/dist/workspace/efficacy-toolkit.d.ts.map +1 -0
package/dist/workspace/efficacy-toolkit.js +281 -0
package/dist/workspace/efficacy-toolkit.js.map +1 -0
package/dist/workspace/index.d.ts +2 -1
package/dist/workspace/index.d.ts.map +1 -1
package/dist/workspace/index.js +3 -1
package/dist/workspace/index.js.map +1 -1
package/dist/workspace/templates/index.d.ts +3 -0
package/dist/workspace/templates/index.d.ts.map +1 -1
package/dist/workspace/templates/index.js +6 -0
package/dist/workspace/templates/index.js.map +1 -1
package/dist/workspace/templates/playbook-decay-detection.d.ts +46 -0
package/dist/workspace/templates/playbook-decay-detection.d.ts.map +1 -0
package/dist/workspace/templates/playbook-decay-detection.js +197 -0
package/dist/workspace/templates/playbook-decay-detection.js.map +1 -0
package/dist/workspace/templates/playbook-efficacy-audit.d.ts +46 -0
package/dist/workspace/templates/playbook-efficacy-audit.d.ts.map +1 -0
package/dist/workspace/templates/playbook-efficacy-audit.js +160 -0
package/dist/workspace/templates/playbook-efficacy-audit.js.map +1 -0
package/dist/workspace/templates/playbook-lifecycle-review.d.ts +51 -0
package/dist/workspace/templates/playbook-lifecycle-review.d.ts.map +1 -0
package/dist/workspace/templates/playbook-lifecycle-review.js +187 -0
package/dist/workspace/templates/playbook-lifecycle-review.js.map +1 -0
package/dist/workspace/types.d.ts +12 -54
package/dist/workspace/types.d.ts.map +1 -1
package/dist/workspace/types.js.map +1 -1
package/package.json +8 -2
package/playbooks/compound-engineering/adversarial-review.json +51 -0
package/playbooks/compound-engineering/agent-native-architecture.json +59 -0
package/playbooks/compound-engineering/agent-native-review.json +54 -0
package/playbooks/compound-engineering/api-contract-review.json +52 -0
package/playbooks/compound-engineering/brainstorm-requirements.json +55 -0
package/playbooks/compound-engineering/bug-reproduction.json +62 -0
package/playbooks/compound-engineering/confidence-calibration.json +49 -0
package/playbooks/compound-engineering/correctness-review.json +49 -0
package/playbooks/compound-engineering/data-migration-safety.json +59 -0
package/playbooks/compound-engineering/deployment-verification.json +63 -0
package/playbooks/compound-engineering/error-recovery-patterns.json +53 -0
package/playbooks/compound-engineering/implementation-planning.json +64 -0
package/playbooks/compound-engineering/issue-pattern-analysis.json +53 -0
package/playbooks/compound-engineering/knowledge-compounding.json +63 -0
package/playbooks/compound-engineering/learnings-research.json +54 -0
package/playbooks/compound-engineering/maintainability-review.json +49 -0
package/playbooks/compound-engineering/performance-review.json +54 -0
package/playbooks/compound-engineering/plan-adversarial-review.json +56 -0
package/playbooks/compound-engineering/plan-feasibility-review.json +56 -0
package/playbooks/compound-engineering/project-standards-review.json +52 -0
package/playbooks/compound-engineering/reliability-review.json +53 -0
package/playbooks/compound-engineering/review-orchestration.json +64 -0
package/playbooks/compound-engineering/security-review.json +54 -0
package/playbooks/compound-engineering/systematic-execution.json +64 -0
package/playbooks/compound-engineering/testing-review.json +50 -0
package/src/atlas.ts +96 -0
package/src/index.ts +27 -0
package/src/learning/index.ts +1 -0
package/src/learning/unified-pipeline.ts +271 -1
package/src/memory/candidate-retrieval.ts +2 -1
package/src/memory/curated-loader.ts +69 -16
package/src/memory/index.ts +16 -0
package/src/memory/playbook.ts +19 -0
package/src/memory/source-resolver.ts +422 -0
package/src/types/config.ts +46 -0
package/src/types/index.ts +4 -0
package/src/utils/error-classifier.ts +8 -8
package/src/workspace/efficacy-toolkit.ts +496 -0
package/src/workspace/index.ts +29 -0
package/src/workspace/templates/index.ts +24 -0
package/src/workspace/templates/playbook-decay-detection.ts +272 -0
package/src/workspace/templates/playbook-efficacy-audit.ts +246 -0
package/src/workspace/templates/playbook-lifecycle-review.ts +274 -0
package/src/workspace/types.ts +22 -78
package/tests/fixtures/behavioral-trajectories.ts +210 -0
package/tests/integration/curated-sources-e2e.test.ts +502 -0
package/tests/integration/pipeline-data-correctness.test.ts +794 -0
package/tests/learning/meta-learner.test.ts +418 -0
package/tests/learning/pipeline-memory-updates.test.ts +721 -0
package/tests/learning/unified-pipeline-efficacy.test.ts +232 -0
package/tests/memory/candidate-retrieval.test.ts +167 -0
package/tests/memory/compound-engineering-seed.test.ts +338 -0
package/tests/memory/curated-loader-extended.test.ts +225 -0
package/tests/memory/meta.test.ts +399 -0
package/tests/memory/playbook-quality-validation.test.ts +430 -0
package/tests/memory/source-resolver.test.ts +700 -0
package/tests/search/evaluator.test.ts +257 -0
package/tests/search/verification-runner.test.ts +357 -0
package/tests/utils/error-classifier.test.ts +149 -0
package/tests/utils/trajectory-helpers.test.ts +163 -0
package/tests/workspace/efficacy-toolkit.test.ts +404 -0
package/tests/workspace/templates/playbook-efficacy.test.ts +377 -0
package/.claude/settings.local.json +0 -11
package/dist/learning/llm-extractor.d.ts +0 -88
package/dist/learning/llm-extractor.d.ts.map +0 -1
package/dist/learning/llm-extractor.js +0 -372
package/dist/learning/llm-extractor.js.map +0 -1
package/dist/learning/loop-coordinator.d.ts +0 -61
package/dist/learning/loop-coordinator.d.ts.map +0 -1
package/dist/learning/loop-coordinator.js +0 -96
package/dist/learning/loop-coordinator.js.map +0 -1
package/references/agent-workspace/CLAUDE.md +0 -74
package/references/agent-workspace/README.md +0 -587
package/references/agent-workspace/media/banner.png +0 -0
package/references/agent-workspace/package-lock.json +0 -2061
package/references/agent-workspace/package.json +0 -54
package/references/agent-workspace/src/handle.ts +0 -122
package/references/agent-workspace/src/index.ts +0 -32
package/references/agent-workspace/src/manager.ts +0 -102
package/references/agent-workspace/src/readers/json.ts +0 -71
package/references/agent-workspace/src/readers/markdown.ts +0 -37
package/references/agent-workspace/src/readers/raw.ts +0 -27
package/references/agent-workspace/src/types.ts +0 -68
package/references/agent-workspace/src/validation.ts +0 -93
package/references/agent-workspace/src/writers/json.ts +0 -17
package/references/agent-workspace/src/writers/markdown.ts +0 -27
package/references/agent-workspace/src/writers/raw.ts +0 -22
package/references/agent-workspace/tests/errors.test.ts +0 -652
package/references/agent-workspace/tests/handle.test.ts +0 -144
package/references/agent-workspace/tests/manager.test.ts +0 -124
package/references/agent-workspace/tests/readers.test.ts +0 -205
package/references/agent-workspace/tests/validation.test.ts +0 -196
package/references/agent-workspace/tests/writers.test.ts +0 -108
package/references/agent-workspace/tsconfig.json +0 -20
package/references/agent-workspace/tsup.config.ts +0 -9
package/references/minimem/.claude/settings.json +0 -7
package/references/minimem/.sudocode/issues.jsonl +0 -18
package/references/minimem/.sudocode/specs.jsonl +0 -1
package/references/minimem/CLAUDE.md +0 -310
package/references/minimem/README.md +0 -556
package/references/minimem/claude-plugin/.claude-plugin/plugin.json +0 -10
package/references/minimem/claude-plugin/.mcp.json +0 -7
package/references/minimem/claude-plugin/README.md +0 -158
package/references/minimem/claude-plugin/commands/recall.md +0 -47
package/references/minimem/claude-plugin/commands/remember.md +0 -41
package/references/minimem/claude-plugin/hooks/__tests__/hooks.test.ts +0 -272
package/references/minimem/claude-plugin/hooks/hooks.json +0 -27
package/references/minimem/claude-plugin/hooks/session-end.sh +0 -86
package/references/minimem/claude-plugin/hooks/session-start.sh +0 -85
package/references/minimem/claude-plugin/skills/memory/SKILL.md +0 -108
package/references/minimem/package-lock.json +0 -5373
package/references/minimem/package.json +0 -60
package/references/minimem/scripts/postbuild.js +0 -35
package/references/minimem/src/__tests__/edge-cases.test.ts +0 -371
package/references/minimem/src/__tests__/errors.test.ts +0 -265
package/references/minimem/src/__tests__/helpers.ts +0 -199
package/references/minimem/src/__tests__/internal.test.ts +0 -407
package/references/minimem/src/__tests__/knowledge.test.ts +0 -287
package/references/minimem/src/__tests__/minimem.integration.test.ts +0 -1127
package/references/minimem/src/__tests__/session.test.ts +0 -190
package/references/minimem/src/cli/__tests__/commands.test.ts +0 -759
package/references/minimem/src/cli/commands/__tests__/conflicts.test.ts +0 -141
package/references/minimem/src/cli/commands/append.ts +0 -76
package/references/minimem/src/cli/commands/config.ts +0 -262
package/references/minimem/src/cli/commands/conflicts.ts +0 -413
package/references/minimem/src/cli/commands/daemon.ts +0 -169
package/references/minimem/src/cli/commands/index.ts +0 -12
package/references/minimem/src/cli/commands/init.ts +0 -88
package/references/minimem/src/cli/commands/mcp.ts +0 -177
package/references/minimem/src/cli/commands/push-pull.ts +0 -213
package/references/minimem/src/cli/commands/search.ts +0 -158
package/references/minimem/src/cli/commands/status.ts +0 -84
package/references/minimem/src/cli/commands/sync-init.ts +0 -290
package/references/minimem/src/cli/commands/sync.ts +0 -70
package/references/minimem/src/cli/commands/upsert.ts +0 -197
package/references/minimem/src/cli/config.ts +0 -584
package/references/minimem/src/cli/index.ts +0 -264
package/references/minimem/src/cli/shared.ts +0 -161
package/references/minimem/src/cli/sync/__tests__/central.test.ts +0 -152
package/references/minimem/src/cli/sync/__tests__/conflicts.test.ts +0 -209
package/references/minimem/src/cli/sync/__tests__/daemon.test.ts +0 -118
package/references/minimem/src/cli/sync/__tests__/detection.test.ts +0 -207
package/references/minimem/src/cli/sync/__tests__/integration.test.ts +0 -476
package/references/minimem/src/cli/sync/__tests__/registry.test.ts +0 -363
package/references/minimem/src/cli/sync/__tests__/state.test.ts +0 -255
package/references/minimem/src/cli/sync/__tests__/validation.test.ts +0 -193
package/references/minimem/src/cli/sync/__tests__/watcher.test.ts +0 -178
package/references/minimem/src/cli/sync/central.ts +0 -292
package/references/minimem/src/cli/sync/conflicts.ts +0 -204
package/references/minimem/src/cli/sync/daemon.ts +0 -407
package/references/minimem/src/cli/sync/detection.ts +0 -138
package/references/minimem/src/cli/sync/index.ts +0 -107
package/references/minimem/src/cli/sync/operations.ts +0 -373
package/references/minimem/src/cli/sync/registry.ts +0 -279
package/references/minimem/src/cli/sync/state.ts +0 -355
package/references/minimem/src/cli/sync/validation.ts +0 -206
package/references/minimem/src/cli/sync/watcher.ts +0 -234
package/references/minimem/src/cli/version.ts +0 -34
package/references/minimem/src/core/index.ts +0 -9
package/references/minimem/src/core/indexer.ts +0 -628
package/references/minimem/src/core/searcher.ts +0 -221
package/references/minimem/src/db/schema.ts +0 -183
package/references/minimem/src/db/sqlite-vec.ts +0 -24
package/references/minimem/src/embeddings/__tests__/embeddings.test.ts +0 -431
package/references/minimem/src/embeddings/batch-gemini.ts +0 -392
package/references/minimem/src/embeddings/batch-openai.ts +0 -409
package/references/minimem/src/embeddings/embeddings.ts +0 -434
package/references/minimem/src/index.ts +0 -109
package/references/minimem/src/internal.ts +0 -299
package/references/minimem/src/minimem.ts +0 -1276
package/references/minimem/src/search/__tests__/hybrid.test.ts +0 -247
package/references/minimem/src/search/graph.ts +0 -234
package/references/minimem/src/search/hybrid.ts +0 -151
package/references/minimem/src/search/search.ts +0 -256
package/references/minimem/src/server/__tests__/mcp.test.ts +0 -341
package/references/minimem/src/server/__tests__/tools.test.ts +0 -364
package/references/minimem/src/server/mcp.ts +0 -326
package/references/minimem/src/server/tools.ts +0 -720
package/references/minimem/src/session.ts +0 -460
package/references/minimem/tsconfig.json +0 -19
package/references/minimem/tsup.config.ts +0 -26
package/references/minimem/vitest.config.ts +0 -24
package/references/sessionlog/.husky/pre-commit +0 -1
package/references/sessionlog/.lintstagedrc.json +0 -4
package/references/sessionlog/.prettierignore +0 -4
package/references/sessionlog/.prettierrc.json +0 -11
package/references/sessionlog/LICENSE +0 -21
package/references/sessionlog/README.md +0 -453
package/references/sessionlog/eslint.config.js +0 -58
package/references/sessionlog/package-lock.json +0 -3672
package/references/sessionlog/package.json +0 -65
package/references/sessionlog/src/__tests__/agent-hooks.test.ts +0 -570
package/references/sessionlog/src/__tests__/agent-registry.test.ts +0 -127
package/references/sessionlog/src/__tests__/claude-code-hooks.test.ts +0 -225
package/references/sessionlog/src/__tests__/claude-generator.test.ts +0 -46
package/references/sessionlog/src/__tests__/commit-msg.test.ts +0 -86
package/references/sessionlog/src/__tests__/cursor-agent.test.ts +0 -224
package/references/sessionlog/src/__tests__/e2e-live.test.ts +0 -890
package/references/sessionlog/src/__tests__/event-log.test.ts +0 -183
package/references/sessionlog/src/__tests__/flush-sentinel.test.ts +0 -105
package/references/sessionlog/src/__tests__/gemini-agent.test.ts +0 -375
package/references/sessionlog/src/__tests__/git-hooks.test.ts +0 -78
package/references/sessionlog/src/__tests__/hook-managers.test.ts +0 -121
package/references/sessionlog/src/__tests__/lifecycle-tasks.test.ts +0 -759
package/references/sessionlog/src/__tests__/opencode-agent.test.ts +0 -338
package/references/sessionlog/src/__tests__/redaction.test.ts +0 -136
package/references/sessionlog/src/__tests__/session-repo.test.ts +0 -353
package/references/sessionlog/src/__tests__/session-store.test.ts +0 -166
package/references/sessionlog/src/__tests__/setup-ccweb.test.ts +0 -466
package/references/sessionlog/src/__tests__/skill-live.test.ts +0 -461
package/references/sessionlog/src/__tests__/summarize.test.ts +0 -348
package/references/sessionlog/src/__tests__/task-plan-e2e.test.ts +0 -610
package/references/sessionlog/src/__tests__/task-plan-live.test.ts +0 -632
package/references/sessionlog/src/__tests__/transcript-timestamp.test.ts +0 -121
package/references/sessionlog/src/__tests__/types.test.ts +0 -166
package/references/sessionlog/src/__tests__/utils.test.ts +0 -333
package/references/sessionlog/src/__tests__/validation.test.ts +0 -103
package/references/sessionlog/src/__tests__/worktree.test.ts +0 -57
package/references/sessionlog/src/agent/agents/claude-code.ts +0 -1089
package/references/sessionlog/src/agent/agents/cursor.ts +0 -361
package/references/sessionlog/src/agent/agents/gemini-cli.ts +0 -632
package/references/sessionlog/src/agent/agents/opencode.ts +0 -540
package/references/sessionlog/src/agent/registry.ts +0 -143
package/references/sessionlog/src/agent/session-types.ts +0 -113
package/references/sessionlog/src/agent/types.ts +0 -220
package/references/sessionlog/src/cli.ts +0 -597
package/references/sessionlog/src/commands/clean.ts +0 -133
package/references/sessionlog/src/commands/disable.ts +0 -84
package/references/sessionlog/src/commands/doctor.ts +0 -145
package/references/sessionlog/src/commands/enable.ts +0 -202
package/references/sessionlog/src/commands/explain.ts +0 -261
package/references/sessionlog/src/commands/reset.ts +0 -105
package/references/sessionlog/src/commands/resume.ts +0 -180
package/references/sessionlog/src/commands/rewind.ts +0 -195
package/references/sessionlog/src/commands/setup-ccweb.ts +0 -275
package/references/sessionlog/src/commands/status.ts +0 -172
package/references/sessionlog/src/config.ts +0 -165
package/references/sessionlog/src/events/event-log.ts +0 -126
package/references/sessionlog/src/git-operations.ts +0 -558
package/references/sessionlog/src/hooks/git-hooks.ts +0 -165
package/references/sessionlog/src/hooks/lifecycle.ts +0 -391
package/references/sessionlog/src/index.ts +0 -650
package/references/sessionlog/src/security/redaction.ts +0 -283
package/references/sessionlog/src/session/state-machine.ts +0 -452
package/references/sessionlog/src/store/checkpoint-store.ts +0 -509
package/references/sessionlog/src/store/native-store.ts +0 -173
package/references/sessionlog/src/store/provider-types.ts +0 -99
package/references/sessionlog/src/store/session-store.ts +0 -266
package/references/sessionlog/src/strategy/attribution.ts +0 -296
package/references/sessionlog/src/strategy/common.ts +0 -207
package/references/sessionlog/src/strategy/content-overlap.ts +0 -228
package/references/sessionlog/src/strategy/manual-commit.ts +0 -988
package/references/sessionlog/src/strategy/types.ts +0 -279
package/references/sessionlog/src/summarize/claude-generator.ts +0 -115
package/references/sessionlog/src/summarize/summarize.ts +0 -432
package/references/sessionlog/src/types.ts +0 -508
package/references/sessionlog/src/utils/chunk-files.ts +0 -49
package/references/sessionlog/src/utils/commit-message.ts +0 -65
package/references/sessionlog/src/utils/detect-agent.ts +0 -36
package/references/sessionlog/src/utils/hook-managers.ts +0 -125
package/references/sessionlog/src/utils/ide-tags.ts +0 -32
package/references/sessionlog/src/utils/paths.ts +0 -79
package/references/sessionlog/src/utils/preview-rewind.ts +0 -80
package/references/sessionlog/src/utils/rewind-conflict.ts +0 -121
package/references/sessionlog/src/utils/shadow-branch.ts +0 -109
package/references/sessionlog/src/utils/string-utils.ts +0 -46
package/references/sessionlog/src/utils/todo-extract.ts +0 -188
package/references/sessionlog/src/utils/trailers.ts +0 -187
package/references/sessionlog/src/utils/transcript-parse.ts +0 -177
package/references/sessionlog/src/utils/transcript-timestamp.ts +0 -59
package/references/sessionlog/src/utils/tree-ops.ts +0 -219
package/references/sessionlog/src/utils/tty.ts +0 -72
package/references/sessionlog/src/utils/validation.ts +0 -65
package/references/sessionlog/src/utils/worktree.ts +0 -58
package/references/sessionlog/src/wire-types.ts +0 -59
package/references/sessionlog/templates/setup-env.sh +0 -153
package/references/sessionlog/tsconfig.json +0 -18
package/references/sessionlog/vitest.config.ts +0 -12
package/references/skill-tree/.claude/settings.json +0 -6
package/references/skill-tree/.sudocode/issues.jsonl +0 -19
package/references/skill-tree/.sudocode/specs.jsonl +0 -3
package/references/skill-tree/CLAUDE.md +0 -126
package/references/skill-tree/README.md +0 -372
package/references/skill-tree/docs/GAPS_v1.md +0 -221
package/references/skill-tree/docs/INTEGRATION_PLAN.md +0 -467
package/references/skill-tree/docs/TODOS.md +0 -91
package/references/skill-tree/docs/anthropic_skill_guide.md +0 -1364
package/references/skill-tree/docs/design/federated-skill-trees.md +0 -524
package/references/skill-tree/docs/design/multi-agent-sync.md +0 -759
package/references/skill-tree/docs/scraper/BRAINSTORM.md +0 -583
package/references/skill-tree/docs/scraper/POC_PLAN.md +0 -420
package/references/skill-tree/docs/scraper/README.md +0 -170
package/references/skill-tree/examples/basic-usage.ts +0 -164
package/references/skill-tree/package-lock.json +0 -1852
package/references/skill-tree/package.json +0 -66
package/references/skill-tree/scraper/README.md +0 -123
package/references/skill-tree/scraper/docs/DESIGN.md +0 -683
package/references/skill-tree/scraper/docs/PLAN.md +0 -336
package/references/skill-tree/scraper/drizzle.config.ts +0 -10
package/references/skill-tree/scraper/package-lock.json +0 -6329
package/references/skill-tree/scraper/package.json +0 -68
package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-description.md +0 -7
package/references/skill-tree/scraper/test/fixtures/invalid-skill/missing-name.md +0 -7
package/references/skill-tree/scraper/test/fixtures/minimal-skill/SKILL.md +0 -27
package/references/skill-tree/scraper/test/fixtures/skill-json/SKILL.json +0 -21
package/references/skill-tree/scraper/test/fixtures/skill-with-meta/SKILL.md +0 -54
package/references/skill-tree/scraper/test/fixtures/skill-with-meta/_meta.json +0 -24
package/references/skill-tree/scraper/test/fixtures/valid-skill/SKILL.md +0 -93
package/references/skill-tree/scraper/test/fixtures/valid-skill/_meta.json +0 -22
package/references/skill-tree/scraper/tsup.config.ts +0 -14
package/references/skill-tree/scraper/vitest.config.ts +0 -17
package/references/skill-tree/scripts/convert-to-vitest.ts +0 -166
package/references/skill-tree/skills/skill-writer/SKILL.md +0 -339
package/references/skill-tree/skills/skill-writer/references/examples.md +0 -326
package/references/skill-tree/skills/skill-writer/references/patterns.md +0 -210
package/references/skill-tree/skills/skill-writer/references/quality-checklist.md +0 -123
package/references/skill-tree/test/run-all.ts +0 -106
package/references/skill-tree/test/utils.ts +0 -128
package/references/skill-tree/vitest.config.ts +0 -16

package/playbooks/compound-engineering/learnings-research.json ADDED Viewed

@@ -0,0 +1,54 @@
+{
+  "name": "learnings-research",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 3,
+  "applicability": {
+    "situations": [
+      "Looking up institutional knowledge before starting work",
+      "Finding past solutions for similar problems during debugging",
+      "Preventing repeated mistakes by surfacing known patterns and gotchas"
+    ],
+    "triggers": [
+      "search knowledge",
+      "past solutions",
+      "known issues",
+      "institutional knowledge",
+      "what do we know about"
+    ],
+    "antiPatterns": [
+      "Searching for information that doesn't exist in the knowledge base yet",
+      "Using full-text search as the first step instead of grep-first filtering",
+      "Reading all files sequentially instead of parallel keyword search"
+    ],
+    "domains": ["knowledge-management", "research", "debugging"]
+  },
+  "guidance": {
+    "strategy": "Grep-first filtering: extract keywords, narrow by category, run parallel content searches on frontmatter fields, then read only strong/moderate matches. Never read all files — always pre-filter.",
+    "tactics": [
+      "Extract keywords from the current task/problem description",
+      "Category narrowing (if clear): focus on the relevant knowledge subdirectory first",
+      "Parallel content-search: search on frontmatter fields (title, tags, module, component) using multiple keywords in parallel; use case-insensitive matching; use OR for synonyms",
+      "Score matches into four categories: Strong (module + tags match), Moderate (problem_type relevant + tags), Weak (tangential), None — only read Strong and Moderate",
+      "Always check critical-patterns document regardless of grep results — it contains must-know patterns for all work",
+      "Distill summaries from matched documents — surface actionable insights, not raw content",
+      "Assess overlap on 5 dimensions: problem statement, root cause, solution, referenced files, prevention rules",
+      "Run multiple searches in parallel — never sequentially"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Relevant documents found and ranked by relevance strength",
+      "Critical patterns checked and incorporated",
+      "Summaries are distilled and actionable (not raw file dumps)",
+      "Search used grep-first filtering, not sequential file reading"
+    ],
+    "failureIndicators": [
+      "All files read sequentially instead of pre-filtered",
+      "Tangentially related entries included, adding noise",
+      "Critical patterns document skipped",
+      "Searches run sequentially instead of in parallel"
+    ]
+  }
+}

package/playbooks/compound-engineering/maintainability-review.json ADDED Viewed

@@ -0,0 +1,49 @@
+{
+  "name": "maintainability-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 3,
+  "applicability": {
+    "situations": [
+      "Reviewing code for long-term carrying cost and maintainability",
+      "Evaluating abstractions, indirection, and naming clarity",
+      "Checking for dead code, unnecessary coupling, and premature complexity"
+    ],
+    "triggers": [
+      "code review",
+      "maintainability",
+      "complexity",
+      "refactoring"
+    ],
+    "antiPatterns": [
+      "Reviewing for correctness bugs — use correctness review instead",
+      "Style preferences that don't affect comprehension",
+      "Debating naming conventions already established in the codebase"
+    ],
+    "domains": ["code-review", "maintainability", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Apply the future developer lens: will the next person who touches this in 6 months understand it quickly? Every abstraction must earn its keep with 3+ implementations or proven variation.",
+    "tactics": [
+      "Hunt for: premature abstraction (interface/factory with one user), unnecessary indirection (>2 delegation levels), dead code (commented, unused exports, unreachable), unrelated module coupling, naming that obscures intent",
+      "Anti-pattern catalog: generic solution for specific problem, wrapper with no added value, config for unchanging values, unused extension points, circular dependencies, shared mutable state",
+      "Abstractions must earn their keep: 3+ implementations or proven variation axis — otherwise inline",
+      "Indirection must add clear value: if a function just delegates to another without transformation, it's overhead",
+      "Naming describes what, not how: booleans have is/has/should prefixes; functions describe outcome not mechanism",
+      "Confidence calibration: HIGH (0.80+) when objectively provable (abstraction has 1 user visible in codebase); MODERATE (0.60-0.79) for naming/abstraction boundary judgments; suppress below 0.60 for style preferences"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "All flagged abstractions are objectively underused (provable from codebase search)",
+      "Indirection findings show concrete delegation chain with no value-add",
+      "Dead code findings are verifiable via search (no callers/importers)"
+    ],
+    "failureIndicators": [
+      "Finding is really a style preference, not a maintainability concern",
+      "Abstraction flagged as premature but actually has 3+ users",
+      "Naming critique is subjective rather than clarity-impacting"
+    ]
+  }
+}

package/playbooks/compound-engineering/performance-review.json ADDED Viewed

@@ -0,0 +1,54 @@
+{
+  "name": "performance-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 4,
+  "applicability": {
+    "situations": [
+      "Reviewing code that touches database queries, loops, caching, or I/O-intensive paths",
+      "Evaluating scalability of new features at 10x/100x/1000x current data volumes",
+      "Checking for production-observable performance regressions"
+    ],
+    "triggers": [
+      "performance review",
+      "N+1 query",
+      "slow query",
+      "memory leak",
+      "pagination",
+      "caching"
+    ],
+    "antiPatterns": [
+      "Micro-optimizations in cold paths (startup, migrations, admin tools, one-time initialization)",
+      "Premature caching suggestions without evidence of actual slowness",
+      "Theoretical scale issues in MVP/prototype code",
+      "Style-based performance opinions (for vs forEach, Map vs plain object)"
+    ],
+    "domains": ["code-review", "performance", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Read code through the lens of 'what happens when this runs 10,000 times' or 'when the table has a million rows'. Focus on measurable, production-observable problems — not theoretical micro-optimizations. Project performance at 10x, 100x, and 1000x current volumes.",
+    "tactics": [
+      "N+1 queries: flag database queries inside loops that should be batched or eager-loaded; count loop iterations against expected data size",
+      "Unbounded memory: flag loading entire tables without pagination, caches without eviction policies, string concatenation in loops, large object allocations",
+      "Missing pagination: flag endpoints returning all results without limit/offset/cursor/streaming",
+      "Hot-path allocations: flag object creation, regex compilation, or expensive computation inside loops or per-request paths",
+      "Blocking I/O in async: flag synchronous file reads, blocking HTTP calls, CPU-intensive computation on the event loop",
+      "Algorithmic complexity: flag O(n^2) or worse without justification; verify all database queries use appropriate indexes",
+      "Performance benchmarks: API responses under 200ms for standard operations, bundle size increases under 5KB per feature, background jobs process in batches",
+      "Confidence calibration: HIGH (0.80+) when impact is provable from code (N+1 clearly in loop, unbounded query on large table); MODERATE (0.60-0.79) when pattern present but impact depends on unconfirmed data size; suppress below 0.60"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Each finding identifies a specific code path with measurable impact at expected scale",
+      "N+1 findings show the loop and the query inside it",
+      "No micro-optimization findings on cold paths"
+    ],
+    "failureIndicators": [
+      "Finding is speculative optimization without evidence of hot path",
+      "Caching recommendation without evidence of repeated expensive computation",
+      "Flagging cold-path code (startup, migrations) for performance"
+    ]
+  }
+}

package/playbooks/compound-engineering/plan-adversarial-review.json ADDED Viewed

@@ -0,0 +1,56 @@
+{
+  "name": "plan-adversarial-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.8,
+  "complexity": "complex",
+  "estimatedEffort": 5,
+  "applicability": {
+    "situations": [
+      "Reviewing implementation plans or requirement documents before execution",
+      "Stress-testing planning assumptions, premises, and scope decisions",
+      "Catching contradictions, scope creep, and unstated assumptions in plans"
+    ],
+    "triggers": [
+      "review plan",
+      "plan review",
+      "challenge assumptions",
+      "scope review",
+      "requirements review"
+    ],
+    "antiPatterns": [
+      "Implementation style or technology selection choices",
+      "Product strategy or priority preferences",
+      "Security, design, or feasibility concerns (use plan-feasibility-review instead)",
+      "The plan is already in execution — too late for adversarial review"
+    ],
+    "domains": ["planning", "requirements", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Challenge premises before solutions. Surface unstated assumptions. Stress-test decisions for reversal cost. Check for internal contradictions and scope-goal misalignment. Apply three lenses: adversarial (break assumptions), coherence (internal consistency), and scope guardian (right-sized).",
+    "tactics": [
+      "Premise challenging: Is this the right problem? Does the solution match the problem? What if we did nothing? What would make this fail? Surface framing effects that bias toward one solution",
+      "Assumption surfacing: identify environmental assumptions (infrastructure exists, APIs stable), user behavior assumptions (adoption, usage patterns), scale assumptions (data volume, concurrency), temporal assumptions (availability, ordering)",
+      "Decision stress-testing: for each major decision, apply falsification test (what evidence would prove this wrong?), reversal cost (how expensive to change later?), and decision-scope mismatch (is decision bigger/smaller than the problem?)",
+      "Simplification pressure: audit abstractions (how many consumers?), find minimum viable version, apply subtraction test (remove each component — does plan still work?), enforce complexity budget",
+      "Coherence checking: catch contradictions between sections, terminology drift (same concept with different names), forward references to undefined terms, ungrouped requirements spanning multiple concerns",
+      "Scope-goal alignment: flag scope exceeding goals (building more than needed), goals exceeding scope (promising more than plan delivers), new abstractions with one implementation, framework-ahead-of-need, configuration without consumers",
+      "Alternative blindness: check for omitted alternatives, build-vs-use analysis, do-nothing baseline comparison",
+      "Depth calibration: Quick (short docs, <5 requirements) = max 3 findings; Standard = proportional to decision density; Deep (>10 requirements, high-stakes) = multiple passes with assumption chain tracing",
+      "Confidence calibration: HIGH (0.80+) when specific text can be quoted showing gap; MODERATE (0.60-0.79) when gap likely but requires context not in document; suppress below 0.50"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Findings quote specific text from the plan showing the gap or contradiction",
+      "Assumptions surfaced are testable and actionable",
+      "Scope-goal alignment checked with concrete evidence",
+      "No findings that belong to feasibility, security, or design review"
+    ],
+    "failureIndicators": [
+      "Findings are vague concerns without quoting specific plan text",
+      "Assumptions identified are untestable or irrelevant",
+      "Scope opinions based on preference rather than goal alignment",
+      "Contradictions flagged that are reconcilable with charitable reading"
+    ]
+  }
+}

package/playbooks/compound-engineering/plan-feasibility-review.json ADDED Viewed

@@ -0,0 +1,56 @@
+{
+  "name": "plan-feasibility-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.8,
+  "complexity": "complex",
+  "estimatedEffort": 5,
+  "applicability": {
+    "situations": [
+      "Evaluating technical feasibility of implementation plans",
+      "Checking product-market fit and strategic alignment of proposed features",
+      "Reviewing plans for security gaps, design completeness, and migration safety"
+    ],
+    "triggers": [
+      "feasibility review",
+      "plan feasibility",
+      "technical review",
+      "can we build this",
+      "is this plan viable"
+    ],
+    "antiPatterns": [
+      "Implementation style choices that don't affect feasibility",
+      "Code organization preferences",
+      "Theoretical scalability without evidence",
+      "Scope or assumption concerns (use plan-adversarial-review instead)"
+    ],
+    "domains": ["planning", "architecture", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Evaluate plans across four dimensions: technical feasibility (can we build it?), product fit (should we build it?), security readiness (is it safe?), and design completeness (is it specified enough?). Each dimension has a distinct lens.",
+    "tactics": [
+      "Technical feasibility: verify plan acknowledges existing code/services/infrastructure; check for architecture conflicts with current stack; validate that referenced file paths and interfaces actually exist; check framework compatibility",
+      "Shadow path tracing: for each feature, trace the happy path, nil/empty input path, error path, and concurrent access path — plans that only cover happy path will fail in implementation",
+      "Migration safety: verify concrete migration path (not 'migrate later'), backward compatibility during rollout, rollback strategy, data volume estimates, and operation ordering",
+      "Product lens: challenge the premise — is this the right problem? What's the actual outcome? What happens if we do nothing? Is there an 80% value at 20% cost alternative? Check goal-requirement alignment (orphan requirements, unserved goals)",
+      "Security lens: inventory attack surfaces (endpoints, data stores, integrations, user inputs), check auth/authz per endpoint, identify sensitive data flows, assess third-party trust boundaries, outline top-3 threat model (most likely, highest impact, most subtle exploit)",
+      "Design completeness: check interaction state coverage (loading, empty, error, success, partial for every interactive element), user flow completeness (entry points, happy path, 2-3 edge cases, exit points), responsive/accessibility considerations",
+      "Dependency analysis: verify external dependencies are available and compatible; identify implicit assumptions about infrastructure, APIs, or services",
+      "Performance feasibility: back-of-envelope math for expected load, data volumes, and response time requirements",
+      "Confidence calibration: HIGH (0.80+) when specific technical constraint blocks the approach; MODERATE (0.60-0.79) when constraint likely but depends on implementation details; suppress below 0.50"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Technical blockers identified with specific evidence (missing API, framework incompatibility)",
+      "Shadow paths traced — plan covers more than just the happy path",
+      "Security attack surfaces inventoried with mitigation gaps flagged",
+      "Product alignment verified — goals trace to requirements"
+    ],
+    "failureIndicators": [
+      "Feasibility concerns are vague without specific technical evidence",
+      "Only happy path evaluated — error/empty/concurrent paths ignored",
+      "Security review is generic OWASP checklist without plan-specific analysis",
+      "Product concerns are preference-based rather than goal-alignment-based"
+    ]
+  }
+}

package/playbooks/compound-engineering/project-standards-review.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "name": "project-standards-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "simple",
+  "estimatedEffort": 2,
+  "applicability": {
+    "situations": [
+      "Reviewing changes for compliance with the project's own standards (CLAUDE.md, AGENTS.md, contributing guides)",
+      "Enforcing naming conventions, file placement, and configuration rules",
+      "Auditing changes against established project conventions"
+    ],
+    "triggers": [
+      "standards review",
+      "convention check",
+      "CLAUDE.md compliance",
+      "project rules"
+    ],
+    "antiPatterns": [
+      "Rules that don't apply to the changed file type",
+      "Violations already caught by automated linters or CI",
+      "Pre-existing violations in unchanged code",
+      "Generic best practices not documented in the project's standards files",
+      "Opinions about quality of the standards themselves"
+    ],
+    "domains": ["code-review", "standards", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Audit changes against the project's own documented standards. Every finding must cite a specific rule from the standards file AND a specific violation in the diff. Without both, drop the finding.",
+    "tactics": [
+      "Discover standards: read CLAUDE.md, AGENTS.md, and any contributing/convention files in the changed file's ancestor directories",
+      "Match rules to file types: only apply rules relevant to the specific files being changed",
+      "Evidence requirement: for each finding, provide (1) exact quote/section from standards file defining the rule, and (2) specific line(s) in diff violating the rule",
+      "Common violations: missing required frontmatter fields, names not matching directory/file names, wrong reference inclusion mode, shell commands where native tools are required, misplaced files in wrong directories",
+      "Language violations: second-person 'you should' where standards require imperative form, hedge words (might/could/consider) leaving behavior undefined",
+      "Protected artifacts: never flag documented protected paths (docs/, plans/, solutions/) for deletion",
+      "Confidence calibration: HIGH (0.80+) when specific rule quote and specific diff violation are both identifiable; MODERATE (0.60-0.79) when rule exists but applying it requires judgment; suppress below 0.60"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Every finding cites both the rule source and the specific violation",
+      "Only rules from the project's actual standards files are enforced",
+      "No findings about unchanged code or generic best practices"
+    ],
+    "failureIndicators": [
+      "Finding enforces a rule not documented in any standards file",
+      "Finding about pre-existing code that wasn't changed in this diff",
+      "Generic best practice advice without project-specific rule citation"
+    ]
+  }
+}

package/playbooks/compound-engineering/reliability-review.json ADDED Viewed

@@ -0,0 +1,53 @@
+{
+  "name": "reliability-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 4,
+  "applicability": {
+    "situations": [
+      "Reviewing code with external dependencies, I/O boundaries, or error handling",
+      "Evaluating failure modes, retry logic, and cascading failure paths",
+      "Checking resilience of services that depend on other services"
+    ],
+    "triggers": [
+      "reliability review",
+      "error handling",
+      "retry",
+      "timeout",
+      "circuit breaker",
+      "cascade failure"
+    ],
+    "antiPatterns": [
+      "Flagging internal pure functions that cannot fail (string formatting, math, in-memory transforms)",
+      "Test helper error handling",
+      "Error message formatting choices",
+      "Theoretical cascading failures without traceable evidence"
+    ],
+    "domains": ["code-review", "reliability", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Ask 'what happens when this dependency is down?' for every external call. Think about partial failures, retry storms, and cascading timeouts. Read code by assuming the environment can be hostile.",
+    "tactics": [
+      "Missing error handling on I/O boundaries: flag HTTP calls, database queries, file operations, and message queue interactions without try/catch or error callbacks",
+      "Retry loops without backoff/limits: immediate indefinite retries create retry storms — require exponential backoff and max attempt limits",
+      "Missing timeouts on external calls: HTTP clients, database connections, and RPC without explicit timeouts can hang indefinitely and exhaust connection pools",
+      "Error swallowing: flag catch blocks that ignore errors, silent failures that return misleading defaults, and error handlers that don't log or propagate",
+      "Cascading failure paths: trace how failure in service A causes B to retry aggressively, overloading C; how slow dependencies fill request queues causing health check failures, restarts, and cold-start storms",
+      "Recovery-induced failures: retries creating duplicates, rollbacks leaving orphaned state, circuit breakers preventing legitimate recovery",
+      "Confidence calibration: HIGH (0.80+) when reliability gap is directly visible (HTTP call without timeout, retry without max attempts, catch swallowing error); MODERATE (0.60-0.79) when code lacks protection but framework defaults might handle it; suppress below 0.60"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Each finding points to a specific I/O boundary without protection",
+      "Retry findings show the loop and its missing backoff/limit",
+      "Cascade findings trace the multi-service failure chain"
+    ],
+    "failureIndicators": [
+      "Flagging pure functions or in-memory operations for error handling",
+      "Overlooking that framework middleware already handles the concern",
+      "Architectural concerns that can't be confirmed from the diff"
+    ]
+  }
+}

package/playbooks/compound-engineering/review-orchestration.json ADDED Viewed

@@ -0,0 +1,64 @@
+{
+  "name": "review-orchestration",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.8,
+  "complexity": "complex",
+  "estimatedEffort": 8,
+  "applicability": {
+    "situations": [
+      "Code review before creating a PR",
+      "Reviewing changes after completing a task during iterative implementation",
+      "Structured multi-persona code review for quality assurance"
+    ],
+    "triggers": [
+      "review code",
+      "code review",
+      "check changes",
+      "pre-PR review"
+    ],
+    "antiPatterns": [
+      "Reviewing trivial formatting-only changes",
+      "Reviewing auto-generated code that will be regenerated",
+      "Single-line config changes that don't affect behavior"
+    ],
+    "domains": ["code-review", "quality-assurance", "software-engineering"]
+  },
+  "guidance": {
+    "strategy": "Deploy tiered reviewer personas in parallel, then merge and deduplicate findings. Always-on reviewers run on every review; conditional reviewers are selected based on the diff content.",
+    "tactics": [
+      "Always-on reviewers: correctness (logic bugs), testing (coverage gaps), maintainability (coupling/complexity), project-standards (convention compliance), agent-native (action/context parity), learnings-researcher (institutional knowledge)",
+      "Conditional reviewers selected per-diff: security (auth/injection), performance (N+1/memory), API-contract (breaking changes), data-migrations (schema safety), reliability (error handling), adversarial (edge cases), stack-specific language reviewers",
+      "Each reviewer returns structured findings with severity (P0-P3), confidence (0.0-1.0), and autofix_class (safe_auto/gated_auto/manual/advisory)",
+      "Suppress all findings below 0.60 confidence to prevent noise",
+      "Merge/deduplicate findings by fingerprint: file, line bucket (lines within +/- 3 of each other), and normalized_title. On conflict, keep highest severity and strongest confidence",
+      "Route actions by class: safe_auto findings get auto-fixed; gated_auto/manual findings go to human review; advisory findings are informational only",
+      "Maximum 2 rounds of autofix to prevent loops"
+    ],
+    "steps": [
+      "1. Detect scope of changes (files, languages, domains affected)",
+      "2. Discover intent from commit messages, PR description, or task context",
+      "3. Select conditional reviewers based on scope (security for auth files, performance for queries, etc.)",
+      "4. Dispatch all selected reviewers in parallel — each reads the diff independently",
+      "5. Collect structured JSON findings from all reviewers",
+      "6. Merge findings: deduplicate by fingerprint, resolve severity conflicts conservatively",
+      "7. Synthesize final report with verdict: Ready / Ready with fixes / Not ready"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "All P0 findings are genuine breakage traceable to specific code paths",
+      "Line numbers point to exact buggy code, not nearby lines",
+      "Each finding is actionable with a clear fix path",
+      "No false positives from style issues that linters catch",
+      "Deduplication produces no redundant findings"
+    ],
+    "failureIndicators": [
+      "P0 findings that are actually style nits",
+      "False positives exceeding 20% of total findings",
+      "Same issue reported multiple times after deduplication",
+      "Findings that require runtime observation to confirm (not provable from code)",
+      "Protected artifacts (docs, plans, brainstorms) flagged for deletion"
+    ],
+    "rollbackStrategy": "Review findings are advisory — no code changes until human approval (except safe_auto in autofix mode)"
+  }
+}

package/playbooks/compound-engineering/security-review.json ADDED Viewed

@@ -0,0 +1,54 @@
+{
+  "name": "security-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 4,
+  "applicability": {
+    "situations": [
+      "Reviewing code changes that touch auth, user input, public endpoints, or permissions",
+      "Auditing for exploitable vulnerabilities before deployment",
+      "Systematic OWASP Top 10 compliance checking"
+    ],
+    "triggers": [
+      "security review",
+      "auth",
+      "injection",
+      "XSS",
+      "CSRF",
+      "user input",
+      "public endpoint"
+    ],
+    "antiPatterns": [
+      "Defense-in-depth on already-protected code",
+      "Theoretical attacks requiring physical access",
+      "HTTP vs HTTPS in dev/test configs",
+      "Generic hardening advice without specific exploitable findings"
+    ],
+    "domains": ["code-review", "security", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "Think like an attacker looking for one exploitable path through the code. Trace data from entry point to dangerous sink. Combine targeted attack-path analysis with systematic OWASP Top 10 coverage.",
+    "tactics": [
+      "Injection vectors: trace untrusted input to SQL, XSS, shell commands, template engines, innerHTML/dangerouslySetInnerHTML — flag when no sanitization between entry and sink",
+      "Auth/authz bypasses: check for missing auth middleware, broken ownership checks (user A accessing user B's resources), privilege escalation, CSRF on state-changing endpoints",
+      "Secrets exposure: scan for hardcoded keys/tokens/passwords, sensitive data in error messages or logs, PII in responses without need-to-know filtering",
+      "Insecure deserialization: flag pickle, Marshal, unserialize, JSON.parse of executable content from untrusted sources",
+      "SSRF and path traversal: flag user-controlled URLs or file paths passed to fetch/open without allowlist validation",
+      "Systematic OWASP Top 10 check: input validation on all entry points (req.body, req.params, req.query), SQL parameterization, XSS escaping + CSP headers, auth on all endpoints, encryption for sensitive data at rest and in transit",
+      "Confidence calibration: HIGH (0.80+) when full attack path is traceable from untrusted input to dangerous sink without sanitization; MODERATE (0.60-0.79) when dangerous pattern present but exploitability unconfirmed; suppress below 0.60"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "Each finding traces a complete attack path: untrusted input → specific code path → exploitable outcome",
+      "No false positives from already-protected code or dev-only configs",
+      "OWASP categories systematically checked, not just obvious injection"
+    ],
+    "failureIndicators": [
+      "Finding requires physical access or internal-only network to exploit",
+      "Generic 'could be vulnerable' without tracing specific input to specific sink",
+      "Flagging defense-in-depth that's already behind validated auth"
+    ]
+  }
+}

package/playbooks/compound-engineering/systematic-execution.json ADDED Viewed

@@ -0,0 +1,64 @@
+{
+  "name": "systematic-execution",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.8,
+  "complexity": "complex",
+  "estimatedEffort": 10,
+  "applicability": {
+    "situations": [
+      "Executing an implementation plan systematically",
+      "Shipping a feature with testing, review, and quality gates",
+      "Multi-unit implementation requiring incremental progress and verification"
+    ],
+    "triggers": [
+      "execute plan",
+      "start work",
+      "implement this",
+      "ship feature"
+    ],
+    "antiPatterns": [
+      "No plan exists — create one first",
+      "Exploratory work where requirements aren't defined",
+      "Hotfix that needs to ship immediately without full process"
+    ],
+    "domains": ["execution", "implementation", "software-engineering"]
+  },
+  "guidance": {
+    "strategy": "Treat the plan as a decision artifact, not an instruction script. Execute implementation units in dependency order, testing continuously, with incremental commits after each logical unit. Simplify after every 2-3 units.",
+    "tactics": [
+      "Read plan's Implementation Units; honor execution posture (test-first, characterization-first) when annotated; check 'Deferred to Implementation' questions before starting",
+      "Strategy selection by scale: inline (1-2 small tasks), serial subagents (3+ with dependencies), parallel subagents (3+ independent), swarm (10+ with coordination)",
+      "Test as you go, not at end: run tests after each significant change; never batch testing to the end",
+      "System-wide test check before marking task done: trace callbacks/middleware/observers two levels out; write integration tests with real objects through full chain; verify failure doesn't leave orphaned state; check if other interfaces expose same behavior",
+      "Incremental commits after each complete logical unit — messages describe complete valuable changes, not WIP",
+      "Simplify after every 2-3 units: review changed files for consolidation opportunities, dead code, naming improvements",
+      "Pattern following discipline: read referenced files from plan before implementing — don't invent new conventions",
+      "Feature completeness first: don't move to next feature until current one ships"
+    ],
+    "steps": [
+      "1. Read plan, clarify any ambiguities, set up environment",
+      "2. Create task tracking for all implementation units",
+      "3. Execute units in dependency order: implement → test → verify → commit",
+      "4. After every 2-3 units, review for simplification opportunities",
+      "5. Run quality checks: tests pass, linting passes, code follows existing patterns",
+      "6. Prepare PR: summary (what/why/decisions), testing notes, post-deploy monitoring plan",
+      "7. Update plan status"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "All implementation units completed and tested",
+      "Tests pass and linting passes",
+      "Code follows existing patterns — no new conventions invented",
+      "Each commit describes a complete valuable change",
+      "PR includes post-deploy monitoring plan with concrete metrics"
+    ],
+    "failureIndicators": [
+      "Testing batched to the end, so issues were discovered late",
+      "New conventions invented instead of following existing patterns",
+      "Commits contain WIP or incomplete changes",
+      "Moved on to the next feature before the current one fully shipped",
+      "System-wide test check skipped for code with callbacks or error handling"
+    ]
+  }
+}

package/playbooks/compound-engineering/testing-review.json ADDED Viewed

@@ -0,0 +1,50 @@
+{
+  "name": "testing-review",
+  "curatedBy": "compound-engineering",
+  "confidence": 0.85,
+  "complexity": "moderate",
+  "estimatedEffort": 3,
+  "applicability": {
+    "situations": [
+      "Reviewing test quality and coverage for code changes",
+      "Evaluating whether tests prove code works or provide false confidence",
+      "Checking for untested branches, weak assertions, and missing error paths"
+    ],
+    "triggers": [
+      "code review",
+      "test coverage",
+      "test quality",
+      "missing tests"
+    ],
+    "antiPatterns": [
+      "Reviewing test infrastructure or test framework setup",
+      "Evaluating test performance or execution speed",
+      "Coverage percentage targets without considering test quality"
+    ],
+    "domains": ["code-review", "testing", "quality-assurance"]
+  },
+  "guidance": {
+    "strategy": "For every new branch (if/else/switch/try/catch) in the diff, verify at least one test exercises it. Focus on whether tests prove behavior, not just that code doesn't throw.",
+    "tactics": [
+      "Hunt for: untested branches (new if/else/switch/try/catch), tests that don't assert behavior (only assert 'doesn't throw'), implementation-coupled brittle tests (assert on mocks, test private methods, snapshot internals), missing error path coverage",
+      "Branch coverage discipline: each new branch must have at least one test; trace all paths through the new code",
+      "Behavior assertion rigor: assert specific values not just truthiness; verify both happy path AND sad path",
+      "Check that error paths are tested: catch blocks, fallback branches, error returns should have dedicated tests",
+      "Flag implementation-coupled tests: tests that break when refactoring without behavior change are brittle",
+      "Confidence calibration: HIGH (0.80+) when test gap is provable from diff (new branch, no test); MODERATE (0.60-0.79) when inferred from structure (parser.ts with no parser.test.ts); suppress below 0.60 (e.g. when coverage may exist in integration tests)"
+    ]
+  },
+  "verification": {
+    "successIndicators": [
+      "All new branches have corresponding test cases",
+      "Tests assert actual behavior with specific expected values",
+      "Error paths have dedicated tests, not just happy path",
+      "No implementation-coupled brittleness identified"
+    ],
+    "failureIndicators": [
+      "New branches found without any test coverage",
+      "Tests only assert 'doesn't throw' or truthiness without checking values",
+      "Error handling code has no test exercising the error path"
+    ]
+  }
+}