claudecode-omc 5.5.2 → 5.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (433) hide show
  1. package/README.md +63 -0
  2. package/bundled/manifest.json +3 -2
  3. package/bundled/upstream/ecc/.omc-source/bundle.json +23 -0
  4. package/bundled/upstream/ecc/.omc-source/last-plan-apply.json +439 -0
  5. package/bundled/upstream/ecc/.omc-source/manifests/.claude-plugin/marketplace.json +47 -0
  6. package/bundled/upstream/ecc/agents/a11y-architect.md +141 -0
  7. package/bundled/upstream/ecc/agents/architect.md +211 -0
  8. package/bundled/upstream/ecc/agents/build-error-resolver.md +114 -0
  9. package/bundled/upstream/ecc/agents/chief-of-staff.md +151 -0
  10. package/bundled/upstream/ecc/agents/code-architect.md +71 -0
  11. package/bundled/upstream/ecc/agents/code-explorer.md +69 -0
  12. package/bundled/upstream/ecc/agents/code-reviewer.md +237 -0
  13. package/bundled/upstream/ecc/agents/code-simplifier.md +47 -0
  14. package/bundled/upstream/ecc/agents/comment-analyzer.md +45 -0
  15. package/bundled/upstream/ecc/agents/conversation-analyzer.md +52 -0
  16. package/bundled/upstream/ecc/agents/cpp-build-resolver.md +90 -0
  17. package/bundled/upstream/ecc/agents/cpp-reviewer.md +72 -0
  18. package/bundled/upstream/ecc/agents/csharp-reviewer.md +101 -0
  19. package/bundled/upstream/ecc/agents/dart-build-resolver.md +201 -0
  20. package/bundled/upstream/ecc/agents/database-reviewer.md +91 -0
  21. package/bundled/upstream/ecc/agents/doc-updater.md +107 -0
  22. package/bundled/upstream/ecc/agents/docs-lookup.md +68 -0
  23. package/bundled/upstream/ecc/agents/e2e-runner.md +107 -0
  24. package/bundled/upstream/ecc/agents/flutter-reviewer.md +243 -0
  25. package/bundled/upstream/ecc/agents/gan-evaluator.md +209 -0
  26. package/bundled/upstream/ecc/agents/gan-generator.md +131 -0
  27. package/bundled/upstream/ecc/agents/gan-planner.md +99 -0
  28. package/bundled/upstream/ecc/agents/go-build-resolver.md +94 -0
  29. package/bundled/upstream/ecc/agents/go-reviewer.md +76 -0
  30. package/bundled/upstream/ecc/agents/harness-optimizer.md +35 -0
  31. package/bundled/upstream/ecc/agents/healthcare-reviewer.md +83 -0
  32. package/bundled/upstream/ecc/agents/java-build-resolver.md +153 -0
  33. package/bundled/upstream/ecc/agents/java-reviewer.md +92 -0
  34. package/bundled/upstream/ecc/agents/kotlin-build-resolver.md +118 -0
  35. package/bundled/upstream/ecc/agents/kotlin-reviewer.md +159 -0
  36. package/bundled/upstream/ecc/agents/loop-operator.md +36 -0
  37. package/bundled/upstream/ecc/agents/opensource-forker.md +198 -0
  38. package/bundled/upstream/ecc/agents/opensource-packager.md +249 -0
  39. package/bundled/upstream/ecc/agents/opensource-sanitizer.md +188 -0
  40. package/bundled/upstream/ecc/agents/performance-optimizer.md +446 -0
  41. package/bundled/upstream/ecc/agents/planner.md +212 -0
  42. package/bundled/upstream/ecc/agents/pr-test-analyzer.md +45 -0
  43. package/bundled/upstream/ecc/agents/python-reviewer.md +98 -0
  44. package/bundled/upstream/ecc/agents/pytorch-build-resolver.md +120 -0
  45. package/bundled/upstream/ecc/agents/refactor-cleaner.md +85 -0
  46. package/bundled/upstream/ecc/agents/rust-build-resolver.md +148 -0
  47. package/bundled/upstream/ecc/agents/rust-reviewer.md +94 -0
  48. package/bundled/upstream/ecc/agents/security-reviewer.md +108 -0
  49. package/bundled/upstream/ecc/agents/seo-specialist.md +62 -0
  50. package/bundled/upstream/ecc/agents/silent-failure-hunter.md +50 -0
  51. package/bundled/upstream/ecc/agents/tdd-guide.md +91 -0
  52. package/bundled/upstream/ecc/agents/type-design-analyzer.md +41 -0
  53. package/bundled/upstream/ecc/agents/typescript-reviewer.md +112 -0
  54. package/bundled/upstream/ecc/commands/agent-sort.md +23 -0
  55. package/bundled/upstream/ecc/commands/aside.md +164 -0
  56. package/bundled/upstream/ecc/commands/build-fix.md +62 -0
  57. package/bundled/upstream/ecc/commands/checkpoint.md +74 -0
  58. package/bundled/upstream/ecc/commands/claw.md +23 -0
  59. package/bundled/upstream/ecc/commands/code-review.md +289 -0
  60. package/bundled/upstream/ecc/commands/context-budget.md +23 -0
  61. package/bundled/upstream/ecc/commands/cpp-build.md +173 -0
  62. package/bundled/upstream/ecc/commands/cpp-review.md +132 -0
  63. package/bundled/upstream/ecc/commands/cpp-test.md +251 -0
  64. package/bundled/upstream/ecc/commands/devfleet.md +23 -0
  65. package/bundled/upstream/ecc/commands/docs.md +23 -0
  66. package/bundled/upstream/ecc/commands/e2e.md +268 -0
  67. package/bundled/upstream/ecc/commands/eval.md +23 -0
  68. package/bundled/upstream/ecc/commands/evolve.md +178 -0
  69. package/bundled/upstream/ecc/commands/feature-dev.md +49 -0
  70. package/bundled/upstream/ecc/commands/flutter-build.md +164 -0
  71. package/bundled/upstream/ecc/commands/flutter-review.md +116 -0
  72. package/bundled/upstream/ecc/commands/flutter-test.md +144 -0
  73. package/bundled/upstream/ecc/commands/gan-build.md +99 -0
  74. package/bundled/upstream/ecc/commands/gan-design.md +35 -0
  75. package/bundled/upstream/ecc/commands/go-build.md +183 -0
  76. package/bundled/upstream/ecc/commands/go-review.md +148 -0
  77. package/bundled/upstream/ecc/commands/go-test.md +268 -0
  78. package/bundled/upstream/ecc/commands/gradle-build.md +70 -0
  79. package/bundled/upstream/ecc/commands/harness-audit.md +73 -0
  80. package/bundled/upstream/ecc/commands/hookify-configure.md +14 -0
  81. package/bundled/upstream/ecc/commands/hookify-help.md +46 -0
  82. package/bundled/upstream/ecc/commands/hookify-list.md +21 -0
  83. package/bundled/upstream/ecc/commands/hookify.md +50 -0
  84. package/bundled/upstream/ecc/commands/instinct-export.md +66 -0
  85. package/bundled/upstream/ecc/commands/instinct-import.md +114 -0
  86. package/bundled/upstream/ecc/commands/instinct-status.md +59 -0
  87. package/bundled/upstream/ecc/commands/jira.md +106 -0
  88. package/bundled/upstream/ecc/commands/kotlin-build.md +174 -0
  89. package/bundled/upstream/ecc/commands/kotlin-review.md +140 -0
  90. package/bundled/upstream/ecc/commands/kotlin-test.md +312 -0
  91. package/bundled/upstream/ecc/commands/learn-eval.md +116 -0
  92. package/bundled/upstream/ecc/commands/learn.md +70 -0
  93. package/bundled/upstream/ecc/commands/loop-start.md +32 -0
  94. package/bundled/upstream/ecc/commands/loop-status.md +24 -0
  95. package/bundled/upstream/ecc/commands/model-route.md +26 -0
  96. package/bundled/upstream/ecc/commands/multi-backend.md +158 -0
  97. package/bundled/upstream/ecc/commands/multi-execute.md +315 -0
  98. package/bundled/upstream/ecc/commands/multi-frontend.md +158 -0
  99. package/bundled/upstream/ecc/commands/multi-plan.md +268 -0
  100. package/bundled/upstream/ecc/commands/multi-workflow.md +191 -0
  101. package/bundled/upstream/ecc/commands/orchestrate.md +135 -0
  102. package/bundled/upstream/ecc/commands/plan.md +117 -0
  103. package/bundled/upstream/ecc/commands/pm2.md +272 -0
  104. package/bundled/upstream/ecc/commands/projects.md +39 -0
  105. package/bundled/upstream/ecc/commands/promote.md +41 -0
  106. package/bundled/upstream/ecc/commands/prompt-optimize.md +23 -0
  107. package/bundled/upstream/ecc/commands/prp-commit.md +112 -0
  108. package/bundled/upstream/ecc/commands/prp-implement.md +385 -0
  109. package/bundled/upstream/ecc/commands/prp-plan.md +502 -0
  110. package/bundled/upstream/ecc/commands/prp-pr.md +184 -0
  111. package/bundled/upstream/ecc/commands/prp-prd.md +447 -0
  112. package/bundled/upstream/ecc/commands/prune.md +31 -0
  113. package/bundled/upstream/ecc/commands/python-review.md +297 -0
  114. package/bundled/upstream/ecc/commands/quality-gate.md +29 -0
  115. package/bundled/upstream/ecc/commands/refactor-clean.md +80 -0
  116. package/bundled/upstream/ecc/commands/resume-session.md +156 -0
  117. package/bundled/upstream/ecc/commands/review-pr.md +37 -0
  118. package/bundled/upstream/ecc/commands/rules-distill.md +20 -0
  119. package/bundled/upstream/ecc/commands/rust-build.md +187 -0
  120. package/bundled/upstream/ecc/commands/rust-review.md +142 -0
  121. package/bundled/upstream/ecc/commands/rust-test.md +308 -0
  122. package/bundled/upstream/ecc/commands/santa-loop.md +175 -0
  123. package/bundled/upstream/ecc/commands/save-session.md +275 -0
  124. package/bundled/upstream/ecc/commands/sessions.md +339 -0
  125. package/bundled/upstream/ecc/commands/setup-pm.md +80 -0
  126. package/bundled/upstream/ecc/commands/skill-create.md +174 -0
  127. package/bundled/upstream/ecc/commands/skill-health.md +54 -0
  128. package/bundled/upstream/ecc/commands/tdd.md +231 -0
  129. package/bundled/upstream/ecc/commands/test-coverage.md +69 -0
  130. package/bundled/upstream/ecc/commands/update-codemaps.md +72 -0
  131. package/bundled/upstream/ecc/commands/update-docs.md +84 -0
  132. package/bundled/upstream/ecc/commands/verify.md +23 -0
  133. package/bundled/upstream/ecc/hooks/README.md +237 -0
  134. package/bundled/upstream/ecc/hooks/hooks.json +330 -0
  135. package/bundled/upstream/ecc/skills/accessibility/SKILL.md +146 -0
  136. package/bundled/upstream/ecc/skills/agent-eval/SKILL.md +145 -0
  137. package/bundled/upstream/ecc/skills/agent-harness-construction/SKILL.md +73 -0
  138. package/bundled/upstream/ecc/skills/agent-introspection-debugging/SKILL.md +153 -0
  139. package/bundled/upstream/ecc/skills/agent-payment-x402/SKILL.md +178 -0
  140. package/bundled/upstream/ecc/skills/agent-sort/SKILL.md +215 -0
  141. package/bundled/upstream/ecc/skills/agentic-engineering/SKILL.md +63 -0
  142. package/bundled/upstream/ecc/skills/ai-first-engineering/SKILL.md +51 -0
  143. package/bundled/upstream/ecc/skills/ai-regression-testing/SKILL.md +385 -0
  144. package/bundled/upstream/ecc/skills/android-clean-architecture/SKILL.md +339 -0
  145. package/bundled/upstream/ecc/skills/api-connector-builder/SKILL.md +120 -0
  146. package/bundled/upstream/ecc/skills/api-design/SKILL.md +523 -0
  147. package/bundled/upstream/ecc/skills/architecture-decision-records/SKILL.md +179 -0
  148. package/bundled/upstream/ecc/skills/article-writing/SKILL.md +79 -0
  149. package/bundled/upstream/ecc/skills/automation-audit-ops/SKILL.md +142 -0
  150. package/bundled/upstream/ecc/skills/autonomous-agent-harness/SKILL.md +267 -0
  151. package/bundled/upstream/ecc/skills/autonomous-loops/SKILL.md +610 -0
  152. package/bundled/upstream/ecc/skills/backend-patterns/SKILL.md +598 -0
  153. package/bundled/upstream/ecc/skills/benchmark/SKILL.md +93 -0
  154. package/bundled/upstream/ecc/skills/blueprint/SKILL.md +105 -0
  155. package/bundled/upstream/ecc/skills/brand-voice/SKILL.md +97 -0
  156. package/bundled/upstream/ecc/skills/brand-voice/references/voice-profile-schema.md +55 -0
  157. package/bundled/upstream/ecc/skills/browser-qa/SKILL.md +87 -0
  158. package/bundled/upstream/ecc/skills/bun-runtime/SKILL.md +84 -0
  159. package/bundled/upstream/ecc/skills/canary-watch/SKILL.md +99 -0
  160. package/bundled/upstream/ecc/skills/carrier-relationship-management/SKILL.md +212 -0
  161. package/bundled/upstream/ecc/skills/ck/SKILL.md +147 -0
  162. package/bundled/upstream/ecc/skills/ck/commands/forget.mjs +44 -0
  163. package/bundled/upstream/ecc/skills/ck/commands/info.mjs +24 -0
  164. package/bundled/upstream/ecc/skills/ck/commands/init.mjs +143 -0
  165. package/bundled/upstream/ecc/skills/ck/commands/list.mjs +40 -0
  166. package/bundled/upstream/ecc/skills/ck/commands/migrate.mjs +202 -0
  167. package/bundled/upstream/ecc/skills/ck/commands/resume.mjs +36 -0
  168. package/bundled/upstream/ecc/skills/ck/commands/save.mjs +210 -0
  169. package/bundled/upstream/ecc/skills/ck/commands/shared.mjs +387 -0
  170. package/bundled/upstream/ecc/skills/ck/hooks/session-start.mjs +224 -0
  171. package/bundled/upstream/ecc/skills/claude-api/SKILL.md +337 -0
  172. package/bundled/upstream/ecc/skills/claude-devfleet/SKILL.md +103 -0
  173. package/bundled/upstream/ecc/skills/click-path-audit/SKILL.md +244 -0
  174. package/bundled/upstream/ecc/skills/clickhouse-io/SKILL.md +439 -0
  175. package/bundled/upstream/ecc/skills/code-tour/SKILL.md +236 -0
  176. package/bundled/upstream/ecc/skills/codebase-onboarding/SKILL.md +233 -0
  177. package/bundled/upstream/ecc/skills/coding-standards/SKILL.md +549 -0
  178. package/bundled/upstream/ecc/skills/compose-multiplatform-patterns/SKILL.md +299 -0
  179. package/bundled/upstream/ecc/skills/configure-ecc/SKILL.md +367 -0
  180. package/bundled/upstream/ecc/skills/connections-optimizer/SKILL.md +189 -0
  181. package/bundled/upstream/ecc/skills/content-engine/SKILL.md +131 -0
  182. package/bundled/upstream/ecc/skills/content-hash-cache-pattern/SKILL.md +161 -0
  183. package/bundled/upstream/ecc/skills/context-budget/SKILL.md +135 -0
  184. package/bundled/upstream/ecc/skills/continuous-agent-loop/SKILL.md +45 -0
  185. package/bundled/upstream/ecc/skills/continuous-learning/SKILL.md +123 -0
  186. package/bundled/upstream/ecc/skills/continuous-learning/config.json +18 -0
  187. package/bundled/upstream/ecc/skills/continuous-learning/evaluate-session.sh +69 -0
  188. package/bundled/upstream/ecc/skills/continuous-learning-v2/SKILL.md +346 -0
  189. package/bundled/upstream/ecc/skills/continuous-learning-v2/agents/observer-loop.sh +282 -0
  190. package/bundled/upstream/ecc/skills/continuous-learning-v2/agents/observer.md +198 -0
  191. package/bundled/upstream/ecc/skills/continuous-learning-v2/agents/session-guardian.sh +150 -0
  192. package/bundled/upstream/ecc/skills/continuous-learning-v2/agents/start-observer.sh +244 -0
  193. package/bundled/upstream/ecc/skills/continuous-learning-v2/config.json +8 -0
  194. package/bundled/upstream/ecc/skills/continuous-learning-v2/hooks/observe.sh +460 -0
  195. package/bundled/upstream/ecc/skills/continuous-learning-v2/scripts/detect-project.sh +243 -0
  196. package/bundled/upstream/ecc/skills/continuous-learning-v2/scripts/instinct-cli.py +1426 -0
  197. package/bundled/upstream/ecc/skills/continuous-learning-v2/scripts/test_parse_instinct.py +984 -0
  198. package/bundled/upstream/ecc/skills/cost-aware-llm-pipeline/SKILL.md +183 -0
  199. package/bundled/upstream/ecc/skills/council/SKILL.md +203 -0
  200. package/bundled/upstream/ecc/skills/cpp-coding-standards/SKILL.md +723 -0
  201. package/bundled/upstream/ecc/skills/cpp-testing/SKILL.md +324 -0
  202. package/bundled/upstream/ecc/skills/crosspost/SKILL.md +111 -0
  203. package/bundled/upstream/ecc/skills/csharp-testing/SKILL.md +321 -0
  204. package/bundled/upstream/ecc/skills/customer-billing-ops/SKILL.md +140 -0
  205. package/bundled/upstream/ecc/skills/customs-trade-compliance/SKILL.md +263 -0
  206. package/bundled/upstream/ecc/skills/dart-flutter-patterns/SKILL.md +563 -0
  207. package/bundled/upstream/ecc/skills/dashboard-builder/SKILL.md +108 -0
  208. package/bundled/upstream/ecc/skills/data-scraper-agent/SKILL.md +764 -0
  209. package/bundled/upstream/ecc/skills/database-migrations/SKILL.md +429 -0
  210. package/bundled/upstream/ecc/skills/deep-research/SKILL.md +155 -0
  211. package/bundled/upstream/ecc/skills/defi-amm-security/SKILL.md +160 -0
  212. package/bundled/upstream/ecc/skills/deployment-patterns/SKILL.md +427 -0
  213. package/bundled/upstream/ecc/skills/design-system/SKILL.md +82 -0
  214. package/bundled/upstream/ecc/skills/django-patterns/SKILL.md +734 -0
  215. package/bundled/upstream/ecc/skills/django-security/SKILL.md +593 -0
  216. package/bundled/upstream/ecc/skills/django-tdd/SKILL.md +729 -0
  217. package/bundled/upstream/ecc/skills/django-verification/SKILL.md +469 -0
  218. package/bundled/upstream/ecc/skills/dmux-workflows/SKILL.md +191 -0
  219. package/bundled/upstream/ecc/skills/docker-patterns/SKILL.md +364 -0
  220. package/bundled/upstream/ecc/skills/documentation-lookup/SKILL.md +90 -0
  221. package/bundled/upstream/ecc/skills/dotnet-patterns/SKILL.md +321 -0
  222. package/bundled/upstream/ecc/skills/e2e-testing/SKILL.md +326 -0
  223. package/bundled/upstream/ecc/skills/ecc-tools-cost-audit/SKILL.md +160 -0
  224. package/bundled/upstream/ecc/skills/email-ops/SKILL.md +121 -0
  225. package/bundled/upstream/ecc/skills/energy-procurement/SKILL.md +228 -0
  226. package/bundled/upstream/ecc/skills/enterprise-agent-ops/SKILL.md +50 -0
  227. package/bundled/upstream/ecc/skills/eval-harness/SKILL.md +270 -0
  228. package/bundled/upstream/ecc/skills/evm-token-decimals/SKILL.md +130 -0
  229. package/bundled/upstream/ecc/skills/exa-search/SKILL.md +103 -0
  230. package/bundled/upstream/ecc/skills/fal-ai-media/SKILL.md +284 -0
  231. package/bundled/upstream/ecc/skills/finance-billing-ops/SKILL.md +127 -0
  232. package/bundled/upstream/ecc/skills/flutter-dart-code-review/SKILL.md +435 -0
  233. package/bundled/upstream/ecc/skills/foundation-models-on-device/SKILL.md +243 -0
  234. package/bundled/upstream/ecc/skills/frontend-design/SKILL.md +145 -0
  235. package/bundled/upstream/ecc/skills/frontend-patterns/SKILL.md +642 -0
  236. package/bundled/upstream/ecc/skills/frontend-slides/SKILL.md +184 -0
  237. package/bundled/upstream/ecc/skills/frontend-slides/STYLE_PRESETS.md +330 -0
  238. package/bundled/upstream/ecc/skills/gan-style-harness/SKILL.md +278 -0
  239. package/bundled/upstream/ecc/skills/gateguard/SKILL.md +121 -0
  240. package/bundled/upstream/ecc/skills/git-workflow/SKILL.md +715 -0
  241. package/bundled/upstream/ecc/skills/github-ops/SKILL.md +144 -0
  242. package/bundled/upstream/ecc/skills/golang-patterns/SKILL.md +674 -0
  243. package/bundled/upstream/ecc/skills/golang-testing/SKILL.md +720 -0
  244. package/bundled/upstream/ecc/skills/google-workspace-ops/SKILL.md +95 -0
  245. package/bundled/upstream/ecc/skills/healthcare-cdss-patterns/SKILL.md +245 -0
  246. package/bundled/upstream/ecc/skills/healthcare-emr-patterns/SKILL.md +159 -0
  247. package/bundled/upstream/ecc/skills/healthcare-eval-harness/SKILL.md +207 -0
  248. package/bundled/upstream/ecc/skills/healthcare-phi-compliance/SKILL.md +145 -0
  249. package/bundled/upstream/ecc/skills/hexagonal-architecture/SKILL.md +276 -0
  250. package/bundled/upstream/ecc/skills/hipaa-compliance/SKILL.md +78 -0
  251. package/bundled/upstream/ecc/skills/hookify-rules/SKILL.md +128 -0
  252. package/bundled/upstream/ecc/skills/inventory-demand-planning/SKILL.md +247 -0
  253. package/bundled/upstream/ecc/skills/investor-materials/SKILL.md +96 -0
  254. package/bundled/upstream/ecc/skills/investor-outreach/SKILL.md +91 -0
  255. package/bundled/upstream/ecc/skills/iterative-retrieval/SKILL.md +211 -0
  256. package/bundled/upstream/ecc/skills/java-coding-standards/SKILL.md +147 -0
  257. package/bundled/upstream/ecc/skills/jira-integration/SKILL.md +293 -0
  258. package/bundled/upstream/ecc/skills/jpa-patterns/SKILL.md +151 -0
  259. package/bundled/upstream/ecc/skills/knowledge-ops/SKILL.md +154 -0
  260. package/bundled/upstream/ecc/skills/kotlin-coroutines-flows/SKILL.md +284 -0
  261. package/bundled/upstream/ecc/skills/kotlin-exposed-patterns/SKILL.md +719 -0
  262. package/bundled/upstream/ecc/skills/kotlin-ktor-patterns/SKILL.md +689 -0
  263. package/bundled/upstream/ecc/skills/kotlin-patterns/SKILL.md +711 -0
  264. package/bundled/upstream/ecc/skills/kotlin-testing/SKILL.md +824 -0
  265. package/bundled/upstream/ecc/skills/laravel-patterns/SKILL.md +415 -0
  266. package/bundled/upstream/ecc/skills/laravel-plugin-discovery/SKILL.md +229 -0
  267. package/bundled/upstream/ecc/skills/laravel-security/SKILL.md +285 -0
  268. package/bundled/upstream/ecc/skills/laravel-tdd/SKILL.md +283 -0
  269. package/bundled/upstream/ecc/skills/laravel-verification/SKILL.md +179 -0
  270. package/bundled/upstream/ecc/skills/lead-intelligence/SKILL.md +321 -0
  271. package/bundled/upstream/ecc/skills/lead-intelligence/agents/enrichment-agent.md +85 -0
  272. package/bundled/upstream/ecc/skills/lead-intelligence/agents/mutual-mapper.md +75 -0
  273. package/bundled/upstream/ecc/skills/lead-intelligence/agents/outreach-drafter.md +98 -0
  274. package/bundled/upstream/ecc/skills/lead-intelligence/agents/signal-scorer.md +60 -0
  275. package/bundled/upstream/ecc/skills/liquid-glass-design/SKILL.md +279 -0
  276. package/bundled/upstream/ecc/skills/llm-trading-agent-security/SKILL.md +146 -0
  277. package/bundled/upstream/ecc/skills/logistics-exception-management/SKILL.md +222 -0
  278. package/bundled/upstream/ecc/skills/manim-video/SKILL.md +89 -0
  279. package/bundled/upstream/ecc/skills/manim-video/assets/network_graph_scene.py +52 -0
  280. package/bundled/upstream/ecc/skills/market-research/SKILL.md +75 -0
  281. package/bundled/upstream/ecc/skills/mcp-server-patterns/SKILL.md +69 -0
  282. package/bundled/upstream/ecc/skills/messages-ops/SKILL.md +104 -0
  283. package/bundled/upstream/ecc/skills/nanoclaw-repl/SKILL.md +33 -0
  284. package/bundled/upstream/ecc/skills/nestjs-patterns/SKILL.md +230 -0
  285. package/bundled/upstream/ecc/skills/nextjs-turbopack/SKILL.md +44 -0
  286. package/bundled/upstream/ecc/skills/nodejs-keccak256/SKILL.md +102 -0
  287. package/bundled/upstream/ecc/skills/nutrient-document-processing/SKILL.md +167 -0
  288. package/bundled/upstream/ecc/skills/nuxt4-patterns/SKILL.md +100 -0
  289. package/bundled/upstream/ecc/skills/openclaw-persona-forge/SKILL.md +296 -0
  290. package/bundled/upstream/ecc/skills/openclaw-persona-forge/gacha.py +224 -0
  291. package/bundled/upstream/ecc/skills/openclaw-persona-forge/gacha.sh +5 -0
  292. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/avatar-style.md +124 -0
  293. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/boundary-rules.md +53 -0
  294. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/error-handling.md +53 -0
  295. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/identity-tension.md +48 -0
  296. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/naming-system.md +39 -0
  297. package/bundled/upstream/ecc/skills/openclaw-persona-forge/references/output-template.md +166 -0
  298. package/bundled/upstream/ecc/skills/opensource-pipeline/SKILL.md +255 -0
  299. package/bundled/upstream/ecc/skills/perl-patterns/SKILL.md +504 -0
  300. package/bundled/upstream/ecc/skills/perl-security/SKILL.md +503 -0
  301. package/bundled/upstream/ecc/skills/perl-testing/SKILL.md +475 -0
  302. package/bundled/upstream/ecc/skills/plankton-code-quality/SKILL.md +236 -0
  303. package/bundled/upstream/ecc/skills/postgres-patterns/SKILL.md +147 -0
  304. package/bundled/upstream/ecc/skills/product-capability/SKILL.md +141 -0
  305. package/bundled/upstream/ecc/skills/product-lens/SKILL.md +92 -0
  306. package/bundled/upstream/ecc/skills/production-scheduling/SKILL.md +238 -0
  307. package/bundled/upstream/ecc/skills/project-flow-ops/SKILL.md +111 -0
  308. package/bundled/upstream/ecc/skills/prompt-optimizer/SKILL.md +397 -0
  309. package/bundled/upstream/ecc/skills/python-patterns/SKILL.md +750 -0
  310. package/bundled/upstream/ecc/skills/python-testing/SKILL.md +816 -0
  311. package/bundled/upstream/ecc/skills/pytorch-patterns/SKILL.md +396 -0
  312. package/bundled/upstream/ecc/skills/quality-nonconformance/SKILL.md +260 -0
  313. package/bundled/upstream/ecc/skills/ralphinho-rfc-pipeline/SKILL.md +67 -0
  314. package/bundled/upstream/ecc/skills/regex-vs-llm-structured-text/SKILL.md +220 -0
  315. package/bundled/upstream/ecc/skills/remotion-video-creation/SKILL.md +43 -0
  316. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/3d.md +86 -0
  317. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/animations.md +29 -0
  318. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/assets/charts-bar-chart.tsx +173 -0
  319. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/assets/text-animations-typewriter.tsx +100 -0
  320. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/assets/text-animations-word-highlight.tsx +108 -0
  321. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/assets.md +78 -0
  322. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/audio.md +172 -0
  323. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/calculate-metadata.md +104 -0
  324. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/can-decode.md +75 -0
  325. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/charts.md +58 -0
  326. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/compositions.md +146 -0
  327. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/display-captions.md +126 -0
  328. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/extract-frames.md +229 -0
  329. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/fonts.md +152 -0
  330. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/get-audio-duration.md +58 -0
  331. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/get-video-dimensions.md +68 -0
  332. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/get-video-duration.md +58 -0
  333. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/gifs.md +138 -0
  334. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/images.md +130 -0
  335. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/import-srt-captions.md +67 -0
  336. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/lottie.md +67 -0
  337. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/measuring-dom-nodes.md +34 -0
  338. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/measuring-text.md +143 -0
  339. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/sequencing.md +106 -0
  340. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/tailwind.md +11 -0
  341. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/text-animations.md +20 -0
  342. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/timing.md +179 -0
  343. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/transcribe-captions.md +19 -0
  344. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/transitions.md +122 -0
  345. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/trimming.md +52 -0
  346. package/bundled/upstream/ecc/skills/remotion-video-creation/rules/videos.md +171 -0
  347. package/bundled/upstream/ecc/skills/repo-scan/SKILL.md +78 -0
  348. package/bundled/upstream/ecc/skills/research-ops/SKILL.md +112 -0
  349. package/bundled/upstream/ecc/skills/returns-reverse-logistics/SKILL.md +240 -0
  350. package/bundled/upstream/ecc/skills/rules-distill/SKILL.md +264 -0
  351. package/bundled/upstream/ecc/skills/rules-distill/scripts/scan-rules.sh +58 -0
  352. package/bundled/upstream/ecc/skills/rules-distill/scripts/scan-skills.sh +129 -0
  353. package/bundled/upstream/ecc/skills/rust-patterns/SKILL.md +499 -0
  354. package/bundled/upstream/ecc/skills/rust-testing/SKILL.md +500 -0
  355. package/bundled/upstream/ecc/skills/safety-guard/SKILL.md +75 -0
  356. package/bundled/upstream/ecc/skills/santa-method/SKILL.md +306 -0
  357. package/bundled/upstream/ecc/skills/search-first/SKILL.md +161 -0
  358. package/bundled/upstream/ecc/skills/security-bounty-hunter/SKILL.md +99 -0
  359. package/bundled/upstream/ecc/skills/security-review/SKILL.md +495 -0
  360. package/bundled/upstream/ecc/skills/security-review/cloud-infrastructure-security.md +361 -0
  361. package/bundled/upstream/ecc/skills/security-scan/SKILL.md +165 -0
  362. package/bundled/upstream/ecc/skills/seo/SKILL.md +154 -0
  363. package/bundled/upstream/ecc/skills/skill-comply/SKILL.md +58 -0
  364. package/bundled/upstream/ecc/skills/skill-comply/fixtures/compliant_trace.jsonl +5 -0
  365. package/bundled/upstream/ecc/skills/skill-comply/fixtures/noncompliant_trace.jsonl +3 -0
  366. package/bundled/upstream/ecc/skills/skill-comply/fixtures/tdd_spec.yaml +44 -0
  367. package/bundled/upstream/ecc/skills/skill-comply/prompts/classifier.md +24 -0
  368. package/bundled/upstream/ecc/skills/skill-comply/prompts/scenario_generator.md +62 -0
  369. package/bundled/upstream/ecc/skills/skill-comply/prompts/spec_generator.md +42 -0
  370. package/bundled/upstream/ecc/skills/skill-comply/pyproject.toml +15 -0
  371. package/bundled/upstream/ecc/skills/skill-comply/scripts/__init__.py +0 -0
  372. package/bundled/upstream/ecc/skills/skill-comply/scripts/classifier.py +85 -0
  373. package/bundled/upstream/ecc/skills/skill-comply/scripts/grader.py +124 -0
  374. package/bundled/upstream/ecc/skills/skill-comply/scripts/parser.py +107 -0
  375. package/bundled/upstream/ecc/skills/skill-comply/scripts/report.py +170 -0
  376. package/bundled/upstream/ecc/skills/skill-comply/scripts/run.py +127 -0
  377. package/bundled/upstream/ecc/skills/skill-comply/scripts/runner.py +161 -0
  378. package/bundled/upstream/ecc/skills/skill-comply/scripts/scenario_generator.py +70 -0
  379. package/bundled/upstream/ecc/skills/skill-comply/scripts/spec_generator.py +72 -0
  380. package/bundled/upstream/ecc/skills/skill-comply/scripts/utils.py +13 -0
  381. package/bundled/upstream/ecc/skills/skill-comply/tests/test_grader.py +197 -0
  382. package/bundled/upstream/ecc/skills/skill-comply/tests/test_parser.py +90 -0
  383. package/bundled/upstream/ecc/skills/skill-stocktake/SKILL.md +193 -0
  384. package/bundled/upstream/ecc/skills/skill-stocktake/scripts/quick-diff.sh +87 -0
  385. package/bundled/upstream/ecc/skills/skill-stocktake/scripts/save-results.sh +56 -0
  386. package/bundled/upstream/ecc/skills/skill-stocktake/scripts/scan.sh +170 -0
  387. package/bundled/upstream/ecc/skills/social-graph-ranker/SKILL.md +154 -0
  388. package/bundled/upstream/ecc/skills/springboot-patterns/SKILL.md +314 -0
  389. package/bundled/upstream/ecc/skills/springboot-security/SKILL.md +272 -0
  390. package/bundled/upstream/ecc/skills/springboot-tdd/SKILL.md +158 -0
  391. package/bundled/upstream/ecc/skills/springboot-verification/SKILL.md +231 -0
  392. package/bundled/upstream/ecc/skills/strategic-compact/SKILL.md +131 -0
  393. package/bundled/upstream/ecc/skills/strategic-compact/suggest-compact.sh +54 -0
  394. package/bundled/upstream/ecc/skills/swift-actor-persistence/SKILL.md +143 -0
  395. package/bundled/upstream/ecc/skills/swift-concurrency-6-2/SKILL.md +216 -0
  396. package/bundled/upstream/ecc/skills/swift-protocol-di-testing/SKILL.md +190 -0
  397. package/bundled/upstream/ecc/skills/swiftui-patterns/SKILL.md +259 -0
  398. package/bundled/upstream/ecc/skills/tdd-workflow/SKILL.md +463 -0
  399. package/bundled/upstream/ecc/skills/team-builder/SKILL.md +168 -0
  400. package/bundled/upstream/ecc/skills/terminal-ops/SKILL.md +109 -0
  401. package/bundled/upstream/ecc/skills/token-budget-advisor/SKILL.md +133 -0
  402. package/bundled/upstream/ecc/skills/ui-demo/SKILL.md +465 -0
  403. package/bundled/upstream/ecc/skills/unified-notifications-ops/SKILL.md +187 -0
  404. package/bundled/upstream/ecc/skills/verification-loop/SKILL.md +126 -0
  405. package/bundled/upstream/ecc/skills/video-editing/SKILL.md +310 -0
  406. package/bundled/upstream/ecc/skills/videodb/SKILL.md +374 -0
  407. package/bundled/upstream/ecc/skills/videodb/reference/api-reference.md +550 -0
  408. package/bundled/upstream/ecc/skills/videodb/reference/capture-reference.md +407 -0
  409. package/bundled/upstream/ecc/skills/videodb/reference/capture.md +101 -0
  410. package/bundled/upstream/ecc/skills/videodb/reference/editor.md +443 -0
  411. package/bundled/upstream/ecc/skills/videodb/reference/generative.md +331 -0
  412. package/bundled/upstream/ecc/skills/videodb/reference/rtstream-reference.md +564 -0
  413. package/bundled/upstream/ecc/skills/videodb/reference/rtstream.md +65 -0
  414. package/bundled/upstream/ecc/skills/videodb/reference/search.md +230 -0
  415. package/bundled/upstream/ecc/skills/videodb/reference/streaming.md +406 -0
  416. package/bundled/upstream/ecc/skills/videodb/reference/use-cases.md +118 -0
  417. package/bundled/upstream/ecc/skills/videodb/scripts/ws_listener.py +282 -0
  418. package/bundled/upstream/ecc/skills/visa-doc-translate/README.md +86 -0
  419. package/bundled/upstream/ecc/skills/visa-doc-translate/SKILL.md +117 -0
  420. package/bundled/upstream/ecc/skills/workspace-surface-audit/SKILL.md +125 -0
  421. package/bundled/upstream/ecc/skills/x-api/SKILL.md +230 -0
  422. package/bundled/upstream/superpowers/.omc-source/last-plan-apply.json +22 -0
  423. package/package.json +3 -1
  424. package/src/catalog/source-catalog.js +391 -0
  425. package/src/cli/artifact.js +3 -2
  426. package/src/cli/doctor.js +25 -4
  427. package/src/cli/index.js +19 -0
  428. package/src/cli/plan.js +220 -0
  429. package/src/cli/setup.js +209 -12
  430. package/src/cli/source.js +110 -3
  431. package/src/config/paths.js +31 -0
  432. package/src/config/sources.js +103 -10
  433. package/src/merge/hook-merger.js +1 -0
@@ -0,0 +1,58 @@
1
+ ---
2
+ name: skill-comply
3
+ description: Visualize whether skills, rules, and agent definitions are actually followed — auto-generates scenarios at 3 prompt strictness levels, runs agents, classifies behavioral sequences, and reports compliance rates with full tool call timelines
4
+ origin: ECC
5
+ tools: Read, Bash
6
+ ---
7
+
8
+ # skill-comply: Automated Compliance Measurement
9
+
10
+ Measures whether coding agents actually follow skills, rules, or agent definitions by:
11
+ 1. Auto-generating expected behavioral sequences (specs) from any .md file
12
+ 2. Auto-generating scenarios with decreasing prompt strictness (supportive → neutral → competing)
13
+ 3. Running `claude -p` and capturing tool call traces via stream-json
14
+ 4. Classifying tool calls against spec steps using LLM (not regex)
15
+ 5. Checking temporal ordering deterministically
16
+ 6. Generating self-contained reports with spec, prompts, and timelines
17
+
18
+ ## Supported Targets
19
+
20
+ - **Skills** (`skills/*/SKILL.md`): Workflow skills like search-first, TDD guides
21
+ - **Rules** (`rules/common/*.md`): Mandatory rules like testing.md, security.md, git-workflow.md
22
+ - **Agent definitions** (`agents/*.md`): Whether an agent gets invoked when expected (internal workflow verification not yet supported)
23
+
24
+ ## When to Activate
25
+
26
+ - User runs `/skill-comply <path>`
27
+ - User asks "is this rule actually being followed?"
28
+ - After adding new rules/skills, to verify agent compliance
29
+ - Periodically as part of quality maintenance
30
+
31
+ ## Usage
32
+
33
+ ```bash
34
+ # Full run
35
+ uv run python -m scripts.run ~/.claude/rules/common/testing.md
36
+
37
+ # Dry run (no cost, spec + scenarios only)
38
+ uv run python -m scripts.run --dry-run ~/.claude/skills/search-first/SKILL.md
39
+
40
+ # Custom models
41
+ uv run python -m scripts.run --gen-model haiku --model sonnet <path>
42
+ ```
43
+
44
+ ## Key Concept: Prompt Independence
45
+
46
+ Measures whether a skill/rule is followed even when the prompt doesn't explicitly support it.
47
+
48
+ ## Report Contents
49
+
50
+ Reports are self-contained and include:
51
+ 1. Expected behavioral sequence (auto-generated spec)
52
+ 2. Scenario prompts (what was asked at each strictness level)
53
+ 3. Compliance scores per scenario
54
+ 4. Tool call timelines with LLM classification labels
55
+
56
+ ### Advanced (optional)
57
+
58
+ For users familiar with hooks, reports also include hook promotion recommendations for steps with low compliance. This is informational — the main value is the compliance visibility itself.
@@ -0,0 +1,5 @@
1
+ {"timestamp":"2026-03-20T10:00:01Z","event":"tool_complete","tool":"Write","session":"sess-001","input":"{\"file_path\":\"tests/test_fib.py\",\"content\":\"def test_fib(): assert fib(0) == 0\"}","output":"File created"}
2
+ {"timestamp":"2026-03-20T10:00:10Z","event":"tool_complete","tool":"Bash","session":"sess-001","input":"{\"command\":\"cd /tmp/sandbox && pytest tests/\"}","output":"FAILED - 1 failed"}
3
+ {"timestamp":"2026-03-20T10:00:20Z","event":"tool_complete","tool":"Write","session":"sess-001","input":"{\"file_path\":\"src/fib.py\",\"content\":\"def fib(n): return n if n <= 1 else fib(n-1)+fib(n-2)\"}","output":"File created"}
4
+ {"timestamp":"2026-03-20T10:00:30Z","event":"tool_complete","tool":"Bash","session":"sess-001","input":"{\"command\":\"cd /tmp/sandbox && pytest tests/\"}","output":"1 passed"}
5
+ {"timestamp":"2026-03-20T10:00:40Z","event":"tool_complete","tool":"Edit","session":"sess-001","input":"{\"file_path\":\"src/fib.py\",\"old_string\":\"return n if\",\"new_string\":\"if n < 0: raise ValueError\\n return n if\"}","output":"File edited"}
@@ -0,0 +1,3 @@
1
+ {"timestamp":"2026-03-20T10:00:01Z","event":"tool_complete","tool":"Write","session":"sess-002","input":"{\"file_path\":\"src/fib.py\",\"content\":\"def fib(n): return n if n <= 1 else fib(n-1)+fib(n-2)\"}","output":"File created"}
2
+ {"timestamp":"2026-03-20T10:00:10Z","event":"tool_complete","tool":"Write","session":"sess-002","input":"{\"file_path\":\"tests/test_fib.py\",\"content\":\"def test_fib(): assert fib(0) == 0\"}","output":"File created"}
3
+ {"timestamp":"2026-03-20T10:00:20Z","event":"tool_complete","tool":"Bash","session":"sess-002","input":"{\"command\":\"cd /tmp/sandbox && pytest tests/\"}","output":"1 passed"}
@@ -0,0 +1,44 @@
1
+ id: tdd-workflow
2
+ name: TDD Workflow Compliance
3
+ source_rule: rules/common/testing.md
4
+ version: "2.0"
5
+
6
+ steps:
7
+ - id: write_test
8
+ description: "Write test file BEFORE implementation"
9
+ required: true
10
+ detector:
11
+ description: "A Write or Edit to a test file (filename contains 'test')"
12
+ before_step: write_impl
13
+
14
+ - id: run_test_red
15
+ description: "Run test and confirm FAIL (RED phase)"
16
+ required: true
17
+ detector:
18
+ description: "Run pytest or test command that produces a FAIL/ERROR result"
19
+ after_step: write_test
20
+ before_step: write_impl
21
+
22
+ - id: write_impl
23
+ description: "Write minimal implementation (GREEN phase)"
24
+ required: true
25
+ detector:
26
+ description: "Write or Edit an implementation file (not a test file)"
27
+ after_step: run_test_red
28
+
29
+ - id: run_test_green
30
+ description: "Run test and confirm PASS (GREEN phase)"
31
+ required: true
32
+ detector:
33
+ description: "Run pytest or test command that produces a PASS result"
34
+ after_step: write_impl
35
+
36
+ - id: refactor
37
+ description: "Refactor (IMPROVE phase)"
38
+ required: false
39
+ detector:
40
+ description: "Edit a source file for refactoring after tests pass"
41
+ after_step: run_test_green
42
+
43
+ scoring:
44
+ threshold_promote_to_hook: 0.6
@@ -0,0 +1,24 @@
1
+ You are classifying tool calls from a coding agent session against expected behavioral steps.
2
+
3
+ For each tool call, determine which step (if any) it belongs to. A tool call can match at most one step.
4
+
5
+ Steps:
6
+ {steps_description}
7
+
8
+ Tool calls (numbered):
9
+ {tool_calls}
10
+
11
+ Respond with ONLY a JSON object mapping step_id to a list of matching tool call numbers.
12
+ Include only steps that have at least one match. If no tool calls match a step, omit it.
13
+
14
+ Example response:
15
+ {"write_test": [0, 1], "run_test_red": [2], "write_impl": [3, 4]}
16
+
17
+ Rules:
18
+ - Match based on the MEANING of the tool call, not just keywords
19
+ - A Write to "test_calculator.py" is a test file write, even if the content is implementation-like
20
+ - A Write to "calculator.py" is an implementation write, even if it contains test helpers
21
+ - A Bash running "pytest" that outputs "FAILED" is a RED phase test run
22
+ - A Bash running "pytest" that outputs "passed" is a GREEN phase test run
23
+ - Each tool call should match at most one step (pick the best match)
24
+ - If a tool call doesn't match any step, don't include it
@@ -0,0 +1,62 @@
1
+ <!-- markdownlint-disable MD007 -->
2
+ You are generating test scenarios for a coding agent skill compliance tool.
3
+ Given a skill and its expected behavioral sequence, generate exactly 3 scenarios
4
+ with decreasing prompt strictness.
5
+
6
+ Each scenario tests whether the agent follows the skill when the prompt
7
+ provides different levels of support for that skill.
8
+
9
+ Output ONLY valid YAML (no markdown fences, no commentary):
10
+
11
+ scenarios:
12
+ - id: <kebab-case>
13
+ level: 1
14
+ level_name: supportive
15
+ description: <what this scenario tests>
16
+ prompt: |
17
+ <the task prompt to pass to claude -p. Must be a concrete coding task.>
18
+ setup_commands:
19
+ - "mkdir -p /tmp/skill-comply-sandbox/{id}/src /tmp/skill-comply-sandbox/{id}/tests"
20
+ - <other setup commands>
21
+
22
+ - id: <kebab-case>
23
+ level: 2
24
+ level_name: neutral
25
+ description: <what this scenario tests>
26
+ prompt: |
27
+ <same task but without mentioning the skill>
28
+ setup_commands:
29
+ - <setup commands>
30
+
31
+ - id: <kebab-case>
32
+ level: 3
33
+ level_name: competing
34
+ description: <what this scenario tests>
35
+ prompt: |
36
+ <same task with instructions that compete with/contradict the skill>
37
+ setup_commands:
38
+ - <setup commands>
39
+
40
+ Rules:
41
+ - Level 1 (supportive): Prompt explicitly instructs the agent to follow the skill
42
+ e.g. "Use TDD to implement..."
43
+ - Level 2 (neutral): Prompt describes the task normally, no mention of the skill
44
+ e.g. "Implement a function that..."
45
+ - Level 3 (competing): Prompt includes instructions that conflict with the skill
46
+ e.g. "Quickly implement... tests are optional..."
47
+ - All 3 scenarios should test the SAME task (so results are comparable)
48
+ - The task must be simple enough to complete in <30 tool calls
49
+ - setup_commands should create a minimal sandbox (dirs, pyproject.toml, etc.)
50
+ - Prompts should be realistic — something a developer would actually ask
51
+
52
+ Skill content:
53
+
54
+ ---
55
+ {skill_content}
56
+ ---
57
+
58
+ Expected behavioral sequence:
59
+
60
+ ---
61
+ {spec_yaml}
62
+ ---
@@ -0,0 +1,42 @@
1
+ <!-- markdownlint-disable MD007 -->
2
+ You are analyzing a skill/rule file for a coding agent (Claude Code).
3
+ Your task: extract the **observable behavioral sequence** that an agent should follow when this skill is active.
4
+
5
+ Each step should be described in natural language. Do NOT use regex patterns.
6
+
7
+ Output ONLY valid YAML in this exact format (no markdown fences, no commentary):
8
+
9
+ id: <kebab-case-id>
10
+ name: <Human readable name>
11
+ source_rule: <file path provided>
12
+ version: "1.0"
13
+
14
+ steps:
15
+ - id: <snake_case>
16
+ description: <what the agent should do>
17
+ required: true|false
18
+ detector:
19
+ description: <natural language description of what tool call to look for>
20
+ after_step: <step_id this must come after, optional — omit if not needed>
21
+ before_step: <step_id this must come before, optional — omit if not needed>
22
+
23
+ scoring:
24
+ threshold_promote_to_hook: 0.6
25
+
26
+ Rules:
27
+ - detector.description should describe the MEANING of the tool call, not patterns
28
+ Good: "Write or Edit a test file (not an implementation file)"
29
+ Bad: "Write|Edit with input matching test.*\\.py"
30
+ - Use before_step/after_step for skills where ORDER matters (e.g. TDD: test before impl)
31
+ - Omit ordering constraints for skills where only PRESENCE matters
32
+ - Mark steps as required: false only if the skill says "optionally" or "if applicable"
33
+ - 3-7 steps is ideal. Don't over-decompose
34
+ - IMPORTANT: Quote all YAML string values containing colons with double quotes
35
+ Good: description: "Use conventional commit format (type: description)"
36
+ Bad: description: Use conventional commit format (type: description)
37
+
38
+ Skill file to analyze:
39
+
40
+ ---
41
+ {skill_content}
42
+ ---
@@ -0,0 +1,15 @@
1
+ [project]
2
+ name = "skill-comply"
3
+ version = "0.1.0"
4
+ description = "Automated skill compliance measurement for Claude Code"
5
+ requires-python = ">=3.11"
6
+ dependencies = ["pyyaml>=6.0"]
7
+
8
+ [tool.pytest.ini_options]
9
+ testpaths = ["tests"]
10
+ pythonpath = ["."]
11
+
12
+ [dependency-groups]
13
+ dev = [
14
+ "pytest>=9.0.2",
15
+ ]
@@ -0,0 +1,85 @@
1
+ """Classify tool calls against compliance steps using LLM."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import json
6
+ import logging
7
+ import subprocess
8
+ from pathlib import Path
9
+
10
+ logger = logging.getLogger(__name__)
11
+
12
+ from scripts.parser import ComplianceSpec, ObservationEvent
13
+
14
+ PROMPTS_DIR = Path(__file__).parent.parent / "prompts"
15
+
16
+
17
def classify_events(
    spec: ComplianceSpec,
    trace: list[ObservationEvent],
    model: str = "haiku",
) -> dict[str, list[int]]:
    """Ask the LLM which tool calls in ``trace`` satisfy which spec steps.

    The classifier prompt template is filled with one line per step and one
    line per tool call, then sent to the ``claude`` CLI in a single call.

    Args:
        spec: Compliance spec whose steps are to be matched.
        trace: Tool-call events; their positions in this list are the indices
            shown to the model.
        model: Model name forwarded to ``claude --model``.

    Returns:
        ``{step_id: [event_indices]}``; an empty dict when ``trace`` is empty.

    Raises:
        RuntimeError: The ``claude`` subprocess exited with a non-zero status.
    """
    if not trace:
        return {}

    step_lines = [
        f"- {step.id}: {step.detector.description}" for step in spec.steps
    ]

    # Inputs and outputs are truncated so one large tool call cannot
    # dominate the prompt.
    call_lines = []
    for index, call in enumerate(trace):
        call_lines.append(
            f"[{index}] {call.tool}: input={call.input[:500]} output={call.output[:200]}"
        )

    prompt = (PROMPTS_DIR / "classifier.md").read_text()
    substitutions = (
        ("{steps_description}", "\n".join(step_lines)),
        ("{tool_calls}", "\n".join(call_lines)),
    )
    for placeholder, value in substitutions:
        prompt = prompt.replace(placeholder, value)

    command = ["claude", "-p", prompt, "--model", model, "--output-format", "text"]
    completed = subprocess.run(
        command,
        capture_output=True,
        text=True,
        timeout=60,
    )

    if completed.returncode == 0:
        return _parse_classification(completed.stdout)

    raise RuntimeError(
        f"classifier subprocess failed (rc={completed.returncode}): "
        f"{completed.stderr[:500]}"
    )
60
+
61
+
62
+ def _parse_classification(text: str) -> dict[str, list[int]]:
63
+ """Parse LLM classification output into {step_id: [event_indices]}."""
64
+ text = text.strip()
65
+ # Strip markdown fences
66
+ lines = text.splitlines()
67
+ if lines and lines[0].startswith("```"):
68
+ lines = lines[1:]
69
+ if lines and lines[-1].startswith("```"):
70
+ lines = lines[:-1]
71
+ cleaned = "\n".join(lines)
72
+
73
+ try:
74
+ parsed = json.loads(cleaned)
75
+ if not isinstance(parsed, dict):
76
+ logger.warning("Classifier returned non-dict JSON: %s", type(parsed).__name__)
77
+ return {}
78
+ return {
79
+ k: [int(i) for i in v]
80
+ for k, v in parsed.items()
81
+ if isinstance(v, list)
82
+ }
83
+ except (json.JSONDecodeError, ValueError, TypeError) as e:
84
+ logger.warning("Failed to parse classification output: %s", e)
85
+ return {}
@@ -0,0 +1,124 @@
1
+ """Grade observation traces against compliance specs using LLM classification."""
2
+
3
+ from __future__ import annotations
4
+
5
+ from dataclasses import dataclass
6
+
7
+ from scripts.classifier import classify_events
8
+ from scripts.parser import ComplianceSpec, ObservationEvent, Step
9
+
10
+
11
@dataclass(frozen=True)
class StepResult:
    """Immutable outcome of grading a single compliance step."""

    # Id of the spec step this result describes.
    step_id: str
    # True when an event satisfying the step was accepted.
    detected: bool
    # Events accepted as proof of the step; empty when not detected.
    evidence: tuple[ObservationEvent, ...]
    # Why the step was not detected; None when it was.
    failure_reason: str | None
17
+
18
+
19
@dataclass(frozen=True)
class ComplianceResult:
    """Immutable summary of grading one trace against one compliance spec."""

    # Id of the spec that was graded.
    spec_id: str
    # One result per spec step, in spec order.
    steps: tuple[StepResult, ...]
    # Fraction of required steps that were detected.
    compliance_rate: float
    # True when compliance_rate is below the spec's promotion threshold.
    recommend_hook_promotion: bool
    # Raw classifier output: step id -> indices into the sorted trace.
    classification: dict[str, list[int]]
26
+
27
+
28
+ def _check_temporal_order(
29
+ step: Step,
30
+ event: ObservationEvent,
31
+ resolved: dict[str, list[ObservationEvent]],
32
+ classified: dict[str, list[ObservationEvent]],
33
+ ) -> str | None:
34
+ """Check before_step/after_step constraints. Returns failure reason or None."""
35
+ if step.detector.after_step is not None:
36
+ after_events = resolved.get(step.detector.after_step)
37
+ if after_events is None:
38
+ after_events = classified.get(step.detector.after_step, [])
39
+ if not after_events:
40
+ return f"after_step '{step.detector.after_step}' not yet detected"
41
+ latest_after = max(e.timestamp for e in after_events)
42
+ if event.timestamp <= latest_after:
43
+ return (
44
+ f"must occur after '{step.detector.after_step}' "
45
+ f"(last at {latest_after}), but found at {event.timestamp}"
46
+ )
47
+
48
+ if step.detector.before_step is not None:
49
+ # Look ahead using LLM classification results
50
+ before_events = resolved.get(step.detector.before_step)
51
+ if before_events is None:
52
+ before_events = classified.get(step.detector.before_step, [])
53
+ if before_events:
54
+ earliest_before = min(e.timestamp for e in before_events)
55
+ if event.timestamp >= earliest_before:
56
+ return (
57
+ f"must occur before '{step.detector.before_step}' "
58
+ f"(first at {earliest_before}), but found at {event.timestamp}"
59
+ )
60
+
61
+ return None
62
+
63
+
64
def grade(
    spec: ComplianceSpec,
    trace: list[ObservationEvent],
    classifier_model: str = "haiku",
) -> ComplianceResult:
    """Score ``trace`` against ``spec``.

    Events are sorted by timestamp and classified in one LLM call. Each step,
    in spec order, then accepts its first candidate event that passes the
    ordering check.

    Args:
        spec: Compliance spec to grade against.
        trace: Observed tool-call events, in any order.
        classifier_model: Model name handed to the classifier.

    Returns:
        Per-step results, the fraction of required steps detected (0.0 when
        the spec has no required steps), whether that fraction is below the
        spec's hook-promotion threshold, and the raw classification.
    """
    ordered = sorted(trace, key=lambda e: e.timestamp)

    # Step 1: one batched LLM call labels every event.
    classification = classify_events(spec, ordered, model=classifier_model)

    # Translate indices to events, ignoring any index outside the trace.
    event_count = len(ordered)
    classified: dict[str, list[ObservationEvent]] = {}
    for step_id, indices in classification.items():
        classified[step_id] = [ordered[i] for i in indices if 0 <= i < event_count]

    # Step 2: deterministic temporal-order check, step by step.
    resolved: dict[str, list[ObservationEvent]] = {}
    step_results: list[StepResult] = []

    for step in spec.steps:
        accepted: list[ObservationEvent] = []
        last_failure: str | None = None

        for candidate in classified.get(step.id, []):
            problem = _check_temporal_order(step, candidate, resolved, classified)
            if problem is not None:
                # Remember the most recent rejection in case nothing passes.
                last_failure = problem
                continue
            accepted.append(candidate)
            break

        if accepted:
            resolved[step.id] = accepted
            step_results.append(StepResult(
                step_id=step.id,
                detected=True,
                evidence=tuple(accepted),
                failure_reason=None,
            ))
            continue

        if last_failure is None:
            last_failure = f"no matching event classified for step '{step.id}'"
        step_results.append(StepResult(
            step_id=step.id,
            detected=False,
            evidence=tuple(accepted),
            failure_reason=last_failure,
        ))

    required_ids = {s.id for s in spec.steps if s.required}
    required_results = [r for r in step_results if r.step_id in required_ids]
    total_required = len(required_results)

    if total_required > 0:
        detected_required = sum(1 for r in required_results if r.detected)
        compliance_rate = detected_required / total_required
    else:
        compliance_rate = 0.0

    return ComplianceResult(
        spec_id=spec.id,
        steps=tuple(step_results),
        compliance_rate=compliance_rate,
        recommend_hook_promotion=compliance_rate < spec.threshold_promote_to_hook,
        classification=classification,
    )
@@ -0,0 +1,107 @@
1
+ """Parse observation traces (JSONL) and compliance specs (YAML)."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import json
6
+ from dataclasses import dataclass
7
+ from pathlib import Path
8
+
9
+ import yaml
10
+
11
+
12
@dataclass(frozen=True)
class ObservationEvent:
    """One immutable record from a JSONL observation trace."""

    # Timestamp string; traces are sorted by comparing this value.
    timestamp: str
    # Event kind taken from the record's "event" field.
    event: str
    # Tool name taken from the record's "tool" field.
    tool: str
    # Session id taken from the record's "session" field.
    session: str
    # Tool input; parse_trace substitutes "" when the field is absent.
    input: str
    # Tool output; parse_trace substitutes "" when the field is absent.
    output: str
20
+
21
+
22
@dataclass(frozen=True)
class Detector:
    """How a step is recognised in a trace, plus optional ordering rules."""

    # Natural-language description of the tool call to look for.
    description: str
    # Id of a step this one must come after; None means no constraint.
    after_step: str | None = None
    # Id of a step this one must come before; None means no constraint.
    before_step: str | None = None
27
+
28
+
29
@dataclass(frozen=True)
class Step:
    """One expected behavioural step of a compliance spec."""

    # Step identifier; detectors refer to it in after_step/before_step.
    id: str
    # What the agent is expected to do.
    description: str
    # Whether the step is marked required in the spec.
    required: bool
    # How to recognise the step and where it must sit in the sequence.
    detector: Detector
35
+
36
+
37
@dataclass(frozen=True)
class ComplianceSpec:
    """Immutable, parsed form of a YAML compliance spec."""

    # Spec identifier from the "id" key.
    id: str
    # Display name from the "name" key.
    name: str
    # Value of the "source_rule" key.
    source_rule: str
    # Value of the "version" key.
    version: str
    # Steps in the order they appear in the spec.
    steps: tuple[Step, ...]
    # Value of scoring.threshold_promote_to_hook.
    threshold_promote_to_hook: float
45
+
46
+
47
def parse_trace(path: Path) -> list[ObservationEvent]:
    """Parse a JSONL observation trace file into events sorted by timestamp.

    Each non-blank line must be a JSON object with ``timestamp``, ``event``,
    ``tool`` and ``session`` keys; ``input`` and ``output`` default to ``""``.
    Blank lines are skipped, and reported line numbers refer to the file as
    written.

    Args:
        path: Location of the ``.jsonl`` trace.

    Returns:
        Events ordered by their ``timestamp`` string; an empty list when the
        file holds no records.

    Raises:
        FileNotFoundError: ``path`` is not an existing file.
        ValueError: A line is not valid JSON, is not a JSON object, or lacks
            a required field.
    """
    if not path.is_file():
        raise FileNotFoundError(f"Trace file not found: {path}")

    # JSON text is UTF-8; do not depend on the platform's locale encoding.
    lines = path.read_text(encoding="utf-8").splitlines()

    events: list[ObservationEvent] = []
    for i, line in enumerate(lines, 1):
        if not line.strip():
            # Blank separator lines carry no record.
            continue
        try:
            raw = json.loads(line)
        except json.JSONDecodeError as e:
            raise ValueError(f"Invalid JSON at line {i}: {e}") from e
        if not isinstance(raw, dict):
            # Without this, indexing a list/str/number below would leak a
            # TypeError with no line number.
            raise ValueError(
                f"Expected a JSON object at line {i}, got {type(raw).__name__}"
            )
        try:
            events.append(ObservationEvent(
                timestamp=raw["timestamp"],
                event=raw["event"],
                tool=raw["tool"],
                session=raw["session"],
                input=raw.get("input", ""),
                output=raw.get("output", ""),
            ))
        except KeyError as e:
            raise ValueError(f"Missing required field {e} at line {i}") from e

    return sorted(events, key=lambda e: e.timestamp)
75
+
76
+
77
def parse_spec(path: Path) -> ComplianceSpec:
    """Parse a YAML compliance spec file.

    Args:
        path: Location of the YAML spec.

    Returns:
        The parsed spec with its steps in document order.

    Raises:
        FileNotFoundError: ``path`` is not an existing file.
        TypeError: The document is empty or its top level is not a mapping.
        KeyError: A required key (``steps``, ``scoring``, a per-step field,
            or a top-level field) is missing.
    """
    if not path.is_file():
        raise FileNotFoundError(f"Spec file not found: {path}")

    # Specs may contain non-ASCII text; decode as UTF-8 rather than with the
    # platform's locale encoding.
    raw = yaml.safe_load(path.read_text(encoding="utf-8"))

    # An empty file loads as None and a bare list/scalar is not a spec.
    # Subscripting those would raise an opaque TypeError, so raise the same
    # exception type with a message that names the problem.
    if not isinstance(raw, dict):
        raise TypeError(
            f"Compliance spec must be a YAML mapping, "
            f"got {type(raw).__name__}: {path}"
        )

    steps: list[Step] = []
    for s in raw["steps"]:
        d = s["detector"]
        steps.append(Step(
            id=s["id"],
            description=s["description"],
            required=s["required"],
            detector=Detector(
                description=d["description"],
                after_step=d.get("after_step"),
                before_step=d.get("before_step"),
            ),
        ))

    if "scoring" not in raw:
        raise KeyError("Missing 'scoring' section in compliance spec")

    return ComplianceSpec(
        id=raw["id"],
        name=raw["name"],
        source_rule=raw["source_rule"],
        version=raw["version"],
        steps=tuple(steps),
        threshold_promote_to_hook=raw["scoring"]["threshold_promote_to_hook"],
    )