xtrm-tools 0.7.0 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (632)
  1. package/.xtrm/config/README.md +10 -0
  2. package/{config/mcp_servers.json → .xtrm/config/claude.mcp.json} +0 -28
  3. package/{config → .xtrm/config}/instructions/agents-top.md +12 -3
  4. package/{config → .xtrm/config}/instructions/claude-top.md +12 -3
  5. package/{config → .xtrm/config}/pi/extensions/beads/index.ts +44 -13
  6. package/{config → .xtrm/config}/pi/extensions/custom-footer/index.ts +59 -82
  7. package/{config → .xtrm/config}/pi/extensions/xtrm-ui/index.ts +2 -2
  8. package/{config → .xtrm/config}/pi/install-schema.json +2 -2
  9. package/.xtrm/config/pi.mcp.json +39 -0
  10. package/.xtrm/config/settings.json +41 -0
  11. package/.xtrm/extensions/auto-session-name/index.ts +29 -0
  12. package/.xtrm/extensions/auto-session-name/package.json +16 -0
  13. package/.xtrm/extensions/auto-update/index.ts +71 -0
  14. package/.xtrm/extensions/auto-update/package.json +16 -0
  15. package/.xtrm/extensions/beads/index.ts +232 -0
  16. package/.xtrm/extensions/beads/package.json +19 -0
  17. package/.xtrm/extensions/compact-header/index.ts +69 -0
  18. package/.xtrm/extensions/compact-header/package.json +16 -0
  19. package/.xtrm/extensions/core/adapter.ts +52 -0
  20. package/.xtrm/extensions/core/guard-rules.ts +100 -0
  21. package/.xtrm/extensions/core/lib.ts +3 -0
  22. package/.xtrm/extensions/core/logger.ts +45 -0
  23. package/.xtrm/extensions/core/package.json +18 -0
  24. package/.xtrm/extensions/core/runner.ts +71 -0
  25. package/.xtrm/extensions/core/session-state.ts +59 -0
  26. package/.xtrm/extensions/custom-footer/index.ts +398 -0
  27. package/.xtrm/extensions/custom-footer/package.json +19 -0
  28. package/.xtrm/extensions/custom-provider-qwen-cli/index.ts +363 -0
  29. package/.xtrm/extensions/custom-provider-qwen-cli/package.json +1 -0
  30. package/.xtrm/extensions/git-checkpoint/index.ts +53 -0
  31. package/.xtrm/extensions/git-checkpoint/package.json +16 -0
  32. package/.xtrm/extensions/lsp-bootstrap/index.ts +134 -0
  33. package/.xtrm/extensions/lsp-bootstrap/package.json +17 -0
  34. package/.xtrm/extensions/pi-serena-compact/index.ts +121 -0
  35. package/.xtrm/extensions/pi-serena-compact/package.json +16 -0
  36. package/.xtrm/extensions/quality-gates/index.ts +66 -0
  37. package/.xtrm/extensions/quality-gates/package.json +19 -0
  38. package/.xtrm/extensions/service-skills/index.ts +108 -0
  39. package/.xtrm/extensions/service-skills/package.json +19 -0
  40. package/.xtrm/extensions/session-flow/index.ts +96 -0
  41. package/.xtrm/extensions/session-flow/package.json +19 -0
  42. package/.xtrm/extensions/xtrm-loader/index.ts +152 -0
  43. package/.xtrm/extensions/xtrm-loader/package.json +19 -0
  44. package/.xtrm/extensions/xtrm-ui/format.ts +93 -0
  45. package/.xtrm/extensions/xtrm-ui/index.ts +1044 -0
  46. package/.xtrm/extensions/xtrm-ui/package.json +10 -0
  47. package/.xtrm/extensions/xtrm-ui/themes/pidex-dark.json +85 -0
  48. package/.xtrm/extensions/xtrm-ui/themes/pidex-light.json +85 -0
  49. package/{hooks → .xtrm/hooks}/README.md +2 -1
  50. package/{hooks → .xtrm/hooks}/beads-commit-gate.mjs +4 -0
  51. package/.xtrm/hooks/beads-memory-gate.mjs +119 -0
  52. package/{plugins/xtrm-tools → .xtrm}/hooks/quality-check-env.mjs +1 -4
  53. package/.xtrm/hooks/statusline.mjs +156 -0
  54. package/{plugins/xtrm-tools → .xtrm}/hooks/using-xtrm-reminder.mjs +8 -7
  55. package/.xtrm/registry.json +1323 -0
  56. package/CHANGELOG.md +27 -0
  57. package/README.md +3 -1
  58. package/cli/dist/index.cjs +27158 -31320
  59. package/cli/dist/index.cjs.map +1 -1
  60. package/cli/package.json +2 -1
  61. package/package.json +12 -12
  62. package/.claude-plugin/marketplace.json +0 -19
  63. package/.claude-plugin/plugin.json +0 -9
  64. package/config/hooks.json +0 -83
  65. package/config/settings.json +0 -70
  66. package/hooks/beads-memory-gate.mjs +0 -94
  67. package/hooks/quality-check-env.mjs +0 -79
  68. package/hooks/statusline.mjs +0 -183
  69. package/hooks/tsconfig-cache.json +0 -4
  70. package/hooks/using-xtrm-reminder.mjs +0 -47
  71. package/plugins/xtrm-tools/.claude-plugin/plugin.json +0 -9
  72. package/plugins/xtrm-tools/.mcp.json +0 -18
  73. package/plugins/xtrm-tools/hooks/README.md +0 -61
  74. package/plugins/xtrm-tools/hooks/beads-claim-sync.mjs +0 -154
  75. package/plugins/xtrm-tools/hooks/beads-commit-gate.mjs +0 -70
  76. package/plugins/xtrm-tools/hooks/beads-compact-restore.mjs +0 -77
  77. package/plugins/xtrm-tools/hooks/beads-compact-save.mjs +0 -63
  78. package/plugins/xtrm-tools/hooks/beads-edit-gate.mjs +0 -85
  79. package/plugins/xtrm-tools/hooks/beads-gate-core.mjs +0 -236
  80. package/plugins/xtrm-tools/hooks/beads-gate-messages.mjs +0 -75
  81. package/plugins/xtrm-tools/hooks/beads-gate-utils.mjs +0 -176
  82. package/plugins/xtrm-tools/hooks/beads-memory-gate.mjs +0 -94
  83. package/plugins/xtrm-tools/hooks/beads-stop-gate.mjs +0 -53
  84. package/plugins/xtrm-tools/hooks/gitnexus/gitnexus-hook.cjs +0 -222
  85. package/plugins/xtrm-tools/hooks/hooks.json +0 -129
  86. package/plugins/xtrm-tools/hooks/quality-check.cjs +0 -1286
  87. package/plugins/xtrm-tools/hooks/quality-check.py +0 -345
  88. package/plugins/xtrm-tools/hooks/statusline.mjs +0 -183
  89. package/plugins/xtrm-tools/hooks/tsconfig-cache.json +0 -4
  90. package/plugins/xtrm-tools/hooks/worktree-boundary.mjs +0 -33
  91. package/plugins/xtrm-tools/hooks/xtrm-logger.mjs +0 -123
  92. package/plugins/xtrm-tools/hooks/xtrm-session-logger.mjs +0 -27
  93. package/plugins/xtrm-tools/hooks/xtrm-tool-logger.mjs +0 -53
  94. package/plugins/xtrm-tools/skills/README.txt +0 -31
  95. package/plugins/xtrm-tools/skills/clean-code/SKILL.md +0 -201
  96. package/plugins/xtrm-tools/skills/creating-service-skills/SKILL.md +0 -433
  97. package/plugins/xtrm-tools/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  98. package/plugins/xtrm-tools/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  99. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/bootstrap.py +0 -326
  100. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  101. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  102. package/plugins/xtrm-tools/skills/delegating/SKILL.md +0 -196
  103. package/plugins/xtrm-tools/skills/delegating/config.yaml +0 -210
  104. package/plugins/xtrm-tools/skills/delegating/references/orchestration-protocols.md +0 -41
  105. package/plugins/xtrm-tools/skills/docker-expert/SKILL.md +0 -409
  106. package/plugins/xtrm-tools/skills/documenting/CHANGELOG.md +0 -23
  107. package/plugins/xtrm-tools/skills/documenting/README.md +0 -148
  108. package/plugins/xtrm-tools/skills/documenting/SKILL.md +0 -113
  109. package/plugins/xtrm-tools/skills/documenting/examples/example_pattern.md +0 -70
  110. package/plugins/xtrm-tools/skills/documenting/examples/example_reference.md +0 -70
  111. package/plugins/xtrm-tools/skills/documenting/examples/example_ssot_analytics.md +0 -64
  112. package/plugins/xtrm-tools/skills/documenting/examples/example_workflow.md +0 -141
  113. package/plugins/xtrm-tools/skills/documenting/references/changelog-format.md +0 -97
  114. package/plugins/xtrm-tools/skills/documenting/references/metadata-schema.md +0 -136
  115. package/plugins/xtrm-tools/skills/documenting/references/taxonomy.md +0 -81
  116. package/plugins/xtrm-tools/skills/documenting/references/versioning-rules.md +0 -78
  117. package/plugins/xtrm-tools/skills/documenting/scripts/bump_version.sh +0 -60
  118. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/__init__.py +0 -0
  119. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/add_entry.py +0 -216
  120. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/bump_release.py +0 -117
  121. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/init_changelog.py +0 -54
  122. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/validate_changelog.py +0 -128
  123. package/plugins/xtrm-tools/skills/documenting/scripts/drift_detector.py +0 -266
  124. package/plugins/xtrm-tools/skills/documenting/scripts/generate_template.py +0 -311
  125. package/plugins/xtrm-tools/skills/documenting/scripts/list_by_category.sh +0 -84
  126. package/plugins/xtrm-tools/skills/documenting/scripts/orchestrator.py +0 -255
  127. package/plugins/xtrm-tools/skills/documenting/scripts/validate_metadata.py +0 -242
  128. package/plugins/xtrm-tools/skills/documenting/templates/CHANGELOG.md.template +0 -13
  129. package/plugins/xtrm-tools/skills/documenting/tests/integration_test.sh +0 -70
  130. package/plugins/xtrm-tools/skills/documenting/tests/test_changelog.py +0 -201
  131. package/plugins/xtrm-tools/skills/documenting/tests/test_drift_detector.py +0 -80
  132. package/plugins/xtrm-tools/skills/documenting/tests/test_orchestrator.py +0 -52
  133. package/plugins/xtrm-tools/skills/documenting/tests/test_validate_metadata.py +0 -64
  134. package/plugins/xtrm-tools/skills/find-skills/SKILL.md +0 -133
  135. package/plugins/xtrm-tools/skills/gitnexus-exploring/SKILL.md +0 -75
  136. package/plugins/xtrm-tools/skills/gitnexus-impact-analysis/SKILL.md +0 -94
  137. package/plugins/xtrm-tools/skills/gitnexus-refactoring/SKILL.md +0 -113
  138. package/plugins/xtrm-tools/skills/hook-development/SKILL.md +0 -797
  139. package/plugins/xtrm-tools/skills/hook-development/examples/load-context.sh +0 -55
  140. package/plugins/xtrm-tools/skills/hook-development/examples/quality-check.js +0 -1168
  141. package/plugins/xtrm-tools/skills/hook-development/examples/validate-bash.sh +0 -43
  142. package/plugins/xtrm-tools/skills/hook-development/examples/validate-write.sh +0 -38
  143. package/plugins/xtrm-tools/skills/hook-development/references/advanced.md +0 -527
  144. package/plugins/xtrm-tools/skills/hook-development/references/migration.md +0 -369
  145. package/plugins/xtrm-tools/skills/hook-development/references/patterns.md +0 -412
  146. package/plugins/xtrm-tools/skills/hook-development/scripts/README.md +0 -164
  147. package/plugins/xtrm-tools/skills/hook-development/scripts/hook-linter.sh +0 -153
  148. package/plugins/xtrm-tools/skills/hook-development/scripts/test-hook.sh +0 -252
  149. package/plugins/xtrm-tools/skills/hook-development/scripts/validate-hook-schema.sh +0 -159
  150. package/plugins/xtrm-tools/skills/obsidian-cli/SKILL.md +0 -106
  151. package/plugins/xtrm-tools/skills/orchestrating-agents/SKILL.md +0 -135
  152. package/plugins/xtrm-tools/skills/orchestrating-agents/config.yaml +0 -45
  153. package/plugins/xtrm-tools/skills/orchestrating-agents/references/agent-context-integration.md +0 -37
  154. package/plugins/xtrm-tools/skills/orchestrating-agents/references/examples.md +0 -45
  155. package/plugins/xtrm-tools/skills/orchestrating-agents/references/handover-protocol.md +0 -31
  156. package/plugins/xtrm-tools/skills/orchestrating-agents/references/workflows.md +0 -42
  157. package/plugins/xtrm-tools/skills/orchestrating-agents/scripts/detect_neighbors.py +0 -23
  158. package/plugins/xtrm-tools/skills/planning/SKILL.md +0 -405
  159. package/plugins/xtrm-tools/skills/planning/evals/evals.json +0 -19
  160. package/plugins/xtrm-tools/skills/prompt-improving/README.md +0 -162
  161. package/plugins/xtrm-tools/skills/prompt-improving/SKILL.md +0 -74
  162. package/plugins/xtrm-tools/skills/prompt-improving/references/analysis_commands.md +0 -24
  163. package/plugins/xtrm-tools/skills/prompt-improving/references/chain_of_thought.md +0 -24
  164. package/plugins/xtrm-tools/skills/prompt-improving/references/mcp_definitions.md +0 -20
  165. package/plugins/xtrm-tools/skills/prompt-improving/references/multishot.md +0 -23
  166. package/plugins/xtrm-tools/skills/prompt-improving/references/xml_core.md +0 -60
  167. package/plugins/xtrm-tools/skills/python-testing/SKILL.md +0 -815
  168. package/plugins/xtrm-tools/skills/scoping-service-skills/SKILL.md +0 -231
  169. package/plugins/xtrm-tools/skills/scoping-service-skills/scripts/scope.py +0 -74
  170. package/plugins/xtrm-tools/skills/senior-backend/SKILL.md +0 -209
  171. package/plugins/xtrm-tools/skills/senior-backend/references/api_design_patterns.md +0 -103
  172. package/plugins/xtrm-tools/skills/senior-backend/references/backend_security_practices.md +0 -103
  173. package/plugins/xtrm-tools/skills/senior-backend/references/database_optimization_guide.md +0 -103
  174. package/plugins/xtrm-tools/skills/senior-backend/scripts/api_load_tester.py +0 -114
  175. package/plugins/xtrm-tools/skills/senior-backend/scripts/api_scaffolder.py +0 -114
  176. package/plugins/xtrm-tools/skills/senior-backend/scripts/database_migration_tool.py +0 -114
  177. package/plugins/xtrm-tools/skills/senior-data-scientist/SKILL.md +0 -226
  178. package/plugins/xtrm-tools/skills/senior-data-scientist/references/experiment_design_frameworks.md +0 -80
  179. package/plugins/xtrm-tools/skills/senior-data-scientist/references/feature_engineering_patterns.md +0 -80
  180. package/plugins/xtrm-tools/skills/senior-data-scientist/references/statistical_methods_advanced.md +0 -80
  181. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/experiment_designer.py +0 -100
  182. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/feature_engineering_pipeline.py +0 -100
  183. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/model_evaluation_suite.py +0 -100
  184. package/plugins/xtrm-tools/skills/senior-devops/SKILL.md +0 -209
  185. package/plugins/xtrm-tools/skills/senior-devops/references/cicd_pipeline_guide.md +0 -103
  186. package/plugins/xtrm-tools/skills/senior-devops/references/deployment_strategies.md +0 -103
  187. package/plugins/xtrm-tools/skills/senior-devops/references/infrastructure_as_code.md +0 -103
  188. package/plugins/xtrm-tools/skills/senior-devops/scripts/deployment_manager.py +0 -114
  189. package/plugins/xtrm-tools/skills/senior-devops/scripts/pipeline_generator.py +0 -114
  190. package/plugins/xtrm-tools/skills/senior-devops/scripts/terraform_scaffolder.py +0 -114
  191. package/plugins/xtrm-tools/skills/senior-security/SKILL.md +0 -209
  192. package/plugins/xtrm-tools/skills/senior-security/references/cryptography_implementation.md +0 -103
  193. package/plugins/xtrm-tools/skills/senior-security/references/penetration_testing_guide.md +0 -103
  194. package/plugins/xtrm-tools/skills/senior-security/references/security_architecture_patterns.md +0 -103
  195. package/plugins/xtrm-tools/skills/senior-security/scripts/pentest_automator.py +0 -114
  196. package/plugins/xtrm-tools/skills/senior-security/scripts/security_auditor.py +0 -114
  197. package/plugins/xtrm-tools/skills/senior-security/scripts/threat_modeler.py +0 -114
  198. package/plugins/xtrm-tools/skills/skill-creator/LICENSE.txt +0 -202
  199. package/plugins/xtrm-tools/skills/skill-creator/SKILL.md +0 -479
  200. package/plugins/xtrm-tools/skills/skill-creator/agents/analyzer.md +0 -274
  201. package/plugins/xtrm-tools/skills/skill-creator/agents/comparator.md +0 -202
  202. package/plugins/xtrm-tools/skills/skill-creator/agents/grader.md +0 -223
  203. package/plugins/xtrm-tools/skills/skill-creator/assets/eval_review.html +0 -146
  204. package/plugins/xtrm-tools/skills/skill-creator/eval-viewer/generate_review.py +0 -471
  205. package/plugins/xtrm-tools/skills/skill-creator/eval-viewer/viewer.html +0 -1325
  206. package/plugins/xtrm-tools/skills/skill-creator/references/schemas.md +0 -430
  207. package/plugins/xtrm-tools/skills/skill-creator/scripts/__init__.py +0 -0
  208. package/plugins/xtrm-tools/skills/skill-creator/scripts/aggregate_benchmark.py +0 -401
  209. package/plugins/xtrm-tools/skills/skill-creator/scripts/generate_report.py +0 -326
  210. package/plugins/xtrm-tools/skills/skill-creator/scripts/improve_description.py +0 -248
  211. package/plugins/xtrm-tools/skills/skill-creator/scripts/package_skill.py +0 -136
  212. package/plugins/xtrm-tools/skills/skill-creator/scripts/quick_validate.py +0 -103
  213. package/plugins/xtrm-tools/skills/skill-creator/scripts/run_eval.py +0 -310
  214. package/plugins/xtrm-tools/skills/skill-creator/scripts/run_loop.py +0 -332
  215. package/plugins/xtrm-tools/skills/skill-creator/scripts/utils.py +0 -47
  216. package/plugins/xtrm-tools/skills/sync-docs/SKILL.md +0 -286
  217. package/plugins/xtrm-tools/skills/sync-docs/evals/evals.json +0 -89
  218. package/plugins/xtrm-tools/skills/sync-docs/references/doc-structure.md +0 -99
  219. package/plugins/xtrm-tools/skills/sync-docs/references/schema.md +0 -103
  220. package/plugins/xtrm-tools/skills/sync-docs/scripts/changelog/add_entry.py +0 -216
  221. package/plugins/xtrm-tools/skills/sync-docs/scripts/context_gatherer.py +0 -240
  222. package/plugins/xtrm-tools/skills/sync-docs/scripts/doc_structure_analyzer.py +0 -495
  223. package/plugins/xtrm-tools/skills/sync-docs/scripts/drift_detector.py +0 -563
  224. package/plugins/xtrm-tools/skills/sync-docs/scripts/validate_doc.py +0 -365
  225. package/plugins/xtrm-tools/skills/sync-docs/scripts/validate_metadata.py +0 -185
  226. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/benchmark.json +0 -293
  227. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/benchmark.md +0 -13
  228. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/eval_metadata.json +0 -27
  229. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/outputs/result.md +0 -210
  230. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/grading.json +0 -28
  231. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  232. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/outputs/result.md +0 -101
  233. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/grading.json +0 -28
  234. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  235. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/timing.json +0 -5
  236. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/eval_metadata.json +0 -27
  237. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/outputs/result.md +0 -198
  238. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/grading.json +0 -28
  239. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  240. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/outputs/result.md +0 -94
  241. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/grading.json +0 -28
  242. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/timing.json +0 -1
  243. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/eval_metadata.json +0 -27
  244. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/outputs/result.md +0 -237
  245. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/grading.json +0 -28
  246. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  247. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/outputs/result.md +0 -134
  248. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/grading.json +0 -28
  249. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/timing.json +0 -1
  250. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/benchmark.json +0 -297
  251. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/benchmark.md +0 -13
  252. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/eval_metadata.json +0 -27
  253. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/outputs/result.md +0 -137
  254. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/grading.json +0 -92
  255. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  256. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/outputs/result.md +0 -134
  257. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/grading.json +0 -86
  258. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/timing.json +0 -1
  259. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/eval_metadata.json +0 -27
  260. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/outputs/result.md +0 -193
  261. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/grading.json +0 -72
  262. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  263. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/outputs/result.md +0 -211
  264. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/grading.json +0 -91
  265. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  266. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/eval_metadata.json +0 -27
  267. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/outputs/result.md +0 -182
  268. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  269. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  270. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/outputs/result.md +0 -222
  271. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/grading.json +0 -88
  272. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  273. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/benchmark.json +0 -298
  274. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/benchmark.md +0 -13
  275. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/eval_metadata.json +0 -27
  276. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/outputs/result.md +0 -125
  277. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/grading.json +0 -97
  278. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/timing.json +0 -5
  279. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/outputs/result.md +0 -144
  280. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/grading.json +0 -78
  281. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  282. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/eval_metadata.json +0 -27
  283. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/outputs/result.md +0 -104
  284. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/grading.json +0 -91
  285. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/timing.json +0 -5
  286. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/outputs/result.md +0 -79
  287. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/grading.json +0 -82
  288. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  289. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/eval_metadata.json +0 -27
  290. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase1_context.json +0 -302
  291. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase2_drift.txt +0 -33
  292. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase3_analysis.json +0 -114
  293. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase4_fix.txt +0 -118
  294. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase5_validate.txt +0 -38
  295. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/result.md +0 -158
  296. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  297. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/timing.json +0 -5
  298. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/outputs/result.md +0 -71
  299. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/grading.json +0 -90
  300. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  301. package/plugins/xtrm-tools/skills/test-planning/SKILL.md +0 -465
  302. package/plugins/xtrm-tools/skills/test-planning/evals/evals.json +0 -23
  303. package/plugins/xtrm-tools/skills/updating-service-skills/SKILL.md +0 -136
  304. package/plugins/xtrm-tools/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  305. package/plugins/xtrm-tools/skills/using-quality-gates/SKILL.md +0 -254
  306. package/plugins/xtrm-tools/skills/using-serena-lsp/README.md +0 -8
  307. package/plugins/xtrm-tools/skills/using-serena-lsp/REFERENCE.md +0 -194
  308. package/plugins/xtrm-tools/skills/using-serena-lsp/SKILL.md +0 -82
  309. package/plugins/xtrm-tools/skills/using-service-skills/SKILL.md +0 -108
  310. package/plugins/xtrm-tools/skills/using-service-skills/scripts/cataloger.py +0 -74
  311. package/plugins/xtrm-tools/skills/using-service-skills/scripts/skill_activator.py +0 -152
  312. package/plugins/xtrm-tools/skills/using-service-skills/scripts/test_skill_activator.py +0 -58
  313. package/plugins/xtrm-tools/skills/using-tdd/SKILL.md +0 -410
  314. package/plugins/xtrm-tools/skills/using-xtrm/SKILL.md +0 -127
  315. package/plugins/xtrm-tools/skills/xt-debugging/SKILL.md +0 -149
  316. package/plugins/xtrm-tools/skills/xt-end/SKILL.md +0 -297
  317. package/plugins/xtrm-tools/skills/xt-merge/SKILL.md +0 -313
  318. package/project-skills/quality-gates/.claude/hooks/hook-config.json +0 -66
  319. package/project-skills/quality-gates/.claude/hooks/quality-check.cjs +0 -1286
  320. package/project-skills/quality-gates/.claude/hooks/quality-check.py +0 -334
  321. package/project-skills/quality-gates/.claude/settings.json +0 -3
  322. package/project-skills/quality-gates/.claude/skills/using-quality-gates/SKILL.md +0 -254
  323. package/project-skills/quality-gates/README.md +0 -109
  324. package/project-skills/quality-gates/evals/evals.json +0 -181
  325. package/project-skills/quality-gates/workspace/iteration-1/FINAL-EVAL-SUMMARY.md +0 -75
  326. package/project-skills/quality-gates/workspace/iteration-1/edge-case-auto-fix-verification/with_skill/outputs/response.md +0 -59
  327. package/project-skills/quality-gates/workspace/iteration-1/edge-case-mixed-language-project/with_skill/outputs/response.md +0 -60
  328. package/project-skills/quality-gates/workspace/iteration-1/eval-summary.md +0 -105
  329. package/project-skills/quality-gates/workspace/iteration-1/partial-install-python-only/with_skill/outputs/response.md +0 -93
  330. package/project-skills/quality-gates/workspace/iteration-1/python-refactor-request/with_skill/outputs/response.md +0 -104
  331. package/project-skills/quality-gates/workspace/iteration-1/quality-gate-error-fix/with_skill/outputs/response.md +0 -74
  332. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-general-chat/with_skill/outputs/response.md +0 -18
  333. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-math-question/with_skill/outputs/response.md +0 -18
  334. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-unrelated-coding/with_skill/outputs/response.md +0 -56
  335. package/project-skills/quality-gates/workspace/iteration-1/tdd-guard-blocking-confusion/with_skill/outputs/response.md +0 -67
  336. package/project-skills/quality-gates/workspace/iteration-1/typescript-feature-with-tests/with_skill/outputs/response.md +0 -97
  337. package/project-skills/service-skills-set/.claude/git-hooks/doc_reminder.py +0 -67
  338. package/project-skills/service-skills-set/.claude/git-hooks/skill_staleness.py +0 -194
  339. package/project-skills/service-skills-set/.claude/service-registry.json +0 -4
  340. package/project-skills/service-skills-set/.claude/settings.json +0 -37
  341. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/SKILL.md +0 -433
  342. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  343. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  344. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/bootstrap.py +0 -308
  345. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  346. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  347. package/project-skills/service-skills-set/.claude/skills/scoping-service-skills/SKILL.md +0 -231
  348. package/project-skills/service-skills-set/.claude/skills/scoping-service-skills/scripts/scope.py +0 -74
  349. package/project-skills/service-skills-set/.claude/skills/updating-service-skills/SKILL.md +0 -136
  350. package/project-skills/service-skills-set/.claude/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  351. package/project-skills/service-skills-set/.claude/skills/using-service-skills/SKILL.md +0 -108
  352. package/project-skills/service-skills-set/.claude/skills/using-service-skills/scripts/cataloger.py +0 -74
  353. package/project-skills/service-skills-set/.claude/skills/using-service-skills/scripts/skill_activator.py +0 -152
  354. package/project-skills/service-skills-set/README.md +0 -93
  355. package/project-skills/service-skills-set/install-service-skills.py +0 -193
  356. package/project-skills/service-skills-set/service-skills-readme.md +0 -236
  357. package/skills/README.txt +0 -31
  358. package/skills/clean-code/SKILL.md +0 -201
  359. package/skills/creating-service-skills/SKILL.md +0 -433
  360. package/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  361. package/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  362. package/skills/creating-service-skills/scripts/bootstrap.py +0 -326
  363. package/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  364. package/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  365. package/skills/delegating/SKILL.md +0 -196
  366. package/skills/delegating/config.yaml +0 -210
  367. package/skills/delegating/references/orchestration-protocols.md +0 -41
  368. package/skills/docker-expert/SKILL.md +0 -409
  369. package/skills/documenting/CHANGELOG.md +0 -23
  370. package/skills/documenting/README.md +0 -148
  371. package/skills/documenting/SKILL.md +0 -113
  372. package/skills/documenting/examples/example_pattern.md +0 -70
  373. package/skills/documenting/examples/example_reference.md +0 -70
  374. package/skills/documenting/examples/example_ssot_analytics.md +0 -64
  375. package/skills/documenting/examples/example_workflow.md +0 -141
  376. package/skills/documenting/references/changelog-format.md +0 -97
  377. package/skills/documenting/references/metadata-schema.md +0 -136
  378. package/skills/documenting/references/taxonomy.md +0 -81
  379. package/skills/documenting/references/versioning-rules.md +0 -78
  380. package/skills/documenting/scripts/bump_version.sh +0 -60
  381. package/skills/documenting/scripts/changelog/__init__.py +0 -0
  382. package/skills/documenting/scripts/changelog/add_entry.py +0 -216
  383. package/skills/documenting/scripts/changelog/bump_release.py +0 -117
  384. package/skills/documenting/scripts/changelog/init_changelog.py +0 -54
  385. package/skills/documenting/scripts/changelog/validate_changelog.py +0 -128
  386. package/skills/documenting/scripts/drift_detector.py +0 -266
  387. package/skills/documenting/scripts/generate_template.py +0 -311
  388. package/skills/documenting/scripts/list_by_category.sh +0 -84
  389. package/skills/documenting/scripts/orchestrator.py +0 -255
  390. package/skills/documenting/scripts/validate_metadata.py +0 -242
  391. package/skills/documenting/templates/CHANGELOG.md.template +0 -13
  392. package/skills/find-skills/SKILL.md +0 -133
  393. package/skills/gitnexus-exploring/SKILL.md +0 -75
  394. package/skills/gitnexus-impact-analysis/SKILL.md +0 -94
  395. package/skills/gitnexus-refactoring/SKILL.md +0 -113
  396. package/skills/hook-development/SKILL.md +0 -797
  397. package/skills/hook-development/examples/load-context.sh +0 -55
  398. package/skills/hook-development/examples/quality-check.js +0 -1168
  399. package/skills/hook-development/examples/validate-bash.sh +0 -43
  400. package/skills/hook-development/examples/validate-write.sh +0 -38
  401. package/skills/hook-development/references/advanced.md +0 -527
  402. package/skills/hook-development/references/migration.md +0 -369
  403. package/skills/hook-development/references/patterns.md +0 -412
  404. package/skills/hook-development/scripts/README.md +0 -164
  405. package/skills/hook-development/scripts/hook-linter.sh +0 -153
  406. package/skills/hook-development/scripts/test-hook.sh +0 -252
  407. package/skills/hook-development/scripts/validate-hook-schema.sh +0 -159
  408. package/skills/obsidian-cli/SKILL.md +0 -106
  409. package/skills/orchestrating-agents/SKILL.md +0 -135
  410. package/skills/orchestrating-agents/config.yaml +0 -45
  411. package/skills/orchestrating-agents/references/agent-context-integration.md +0 -37
  412. package/skills/orchestrating-agents/references/examples.md +0 -45
  413. package/skills/orchestrating-agents/references/handover-protocol.md +0 -31
  414. package/skills/orchestrating-agents/references/workflows.md +0 -42
  415. package/skills/orchestrating-agents/scripts/detect_neighbors.py +0 -23
  416. package/skills/planning/SKILL.md +0 -405
  417. package/skills/planning/evals/evals.json +0 -19
  418. package/skills/prompt-improving/README.md +0 -162
  419. package/skills/prompt-improving/SKILL.md +0 -74
  420. package/skills/prompt-improving/references/analysis_commands.md +0 -24
  421. package/skills/prompt-improving/references/chain_of_thought.md +0 -24
  422. package/skills/prompt-improving/references/mcp_definitions.md +0 -20
  423. package/skills/prompt-improving/references/multishot.md +0 -23
  424. package/skills/prompt-improving/references/xml_core.md +0 -60
  425. package/skills/python-testing/SKILL.md +0 -815
  426. package/skills/scoping-service-skills/SKILL.md +0 -231
  427. package/skills/scoping-service-skills/scripts/scope.py +0 -74
  428. package/skills/senior-backend/SKILL.md +0 -209
  429. package/skills/senior-backend/references/api_design_patterns.md +0 -103
  430. package/skills/senior-backend/references/backend_security_practices.md +0 -103
  431. package/skills/senior-backend/references/database_optimization_guide.md +0 -103
  432. package/skills/senior-backend/scripts/api_load_tester.py +0 -114
  433. package/skills/senior-backend/scripts/api_scaffolder.py +0 -114
  434. package/skills/senior-backend/scripts/database_migration_tool.py +0 -114
  435. package/skills/senior-data-scientist/SKILL.md +0 -226
  436. package/skills/senior-data-scientist/references/experiment_design_frameworks.md +0 -80
  437. package/skills/senior-data-scientist/references/feature_engineering_patterns.md +0 -80
  438. package/skills/senior-data-scientist/references/statistical_methods_advanced.md +0 -80
  439. package/skills/senior-data-scientist/scripts/experiment_designer.py +0 -100
  440. package/skills/senior-data-scientist/scripts/feature_engineering_pipeline.py +0 -100
  441. package/skills/senior-data-scientist/scripts/model_evaluation_suite.py +0 -100
  442. package/skills/senior-devops/SKILL.md +0 -209
  443. package/skills/senior-devops/references/cicd_pipeline_guide.md +0 -103
  444. package/skills/senior-devops/references/deployment_strategies.md +0 -103
  445. package/skills/senior-devops/references/infrastructure_as_code.md +0 -103
  446. package/skills/senior-devops/scripts/deployment_manager.py +0 -114
  447. package/skills/senior-devops/scripts/pipeline_generator.py +0 -114
  448. package/skills/senior-devops/scripts/terraform_scaffolder.py +0 -114
  449. package/skills/senior-security/SKILL.md +0 -209
  450. package/skills/senior-security/references/cryptography_implementation.md +0 -103
  451. package/skills/senior-security/references/penetration_testing_guide.md +0 -103
  452. package/skills/senior-security/references/security_architecture_patterns.md +0 -103
  453. package/skills/senior-security/scripts/pentest_automator.py +0 -114
  454. package/skills/senior-security/scripts/security_auditor.py +0 -114
  455. package/skills/senior-security/scripts/threat_modeler.py +0 -114
  456. package/skills/skill-creator/LICENSE.txt +0 -202
  457. package/skills/skill-creator/SKILL.md +0 -479
  458. package/skills/skill-creator/agents/analyzer.md +0 -274
  459. package/skills/skill-creator/agents/comparator.md +0 -202
  460. package/skills/skill-creator/agents/grader.md +0 -223
  461. package/skills/skill-creator/assets/eval_review.html +0 -146
  462. package/skills/skill-creator/eval-viewer/generate_review.py +0 -471
  463. package/skills/skill-creator/eval-viewer/viewer.html +0 -1325
  464. package/skills/skill-creator/references/schemas.md +0 -430
  465. package/skills/skill-creator/scripts/__init__.py +0 -0
  466. package/skills/skill-creator/scripts/aggregate_benchmark.py +0 -401
  467. package/skills/skill-creator/scripts/generate_report.py +0 -326
  468. package/skills/skill-creator/scripts/improve_description.py +0 -248
  469. package/skills/skill-creator/scripts/package_skill.py +0 -136
  470. package/skills/skill-creator/scripts/quick_validate.py +0 -103
  471. package/skills/skill-creator/scripts/run_eval.py +0 -310
  472. package/skills/skill-creator/scripts/run_loop.py +0 -332
  473. package/skills/skill-creator/scripts/utils.py +0 -47
  474. package/skills/sync-docs/SKILL.md +0 -286
  475. package/skills/sync-docs/evals/evals.json +0 -89
  476. package/skills/sync-docs/references/doc-structure.md +0 -99
  477. package/skills/sync-docs/references/schema.md +0 -103
  478. package/skills/sync-docs/scripts/changelog/add_entry.py +0 -216
  479. package/skills/sync-docs/scripts/context_gatherer.py +0 -240
  480. package/skills/sync-docs/scripts/doc_structure_analyzer.py +0 -495
  481. package/skills/sync-docs/scripts/drift_detector.py +0 -563
  482. package/skills/sync-docs/scripts/validate_doc.py +0 -365
  483. package/skills/sync-docs/scripts/validate_metadata.py +0 -185
  484. package/skills/sync-docs-workspace/iteration-1/benchmark.json +0 -293
  485. package/skills/sync-docs-workspace/iteration-1/benchmark.md +0 -13
  486. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/eval_metadata.json +0 -27
  487. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/outputs/result.md +0 -210
  488. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/grading.json +0 -28
  489. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  490. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/outputs/result.md +0 -101
  491. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/grading.json +0 -28
  492. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  493. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/timing.json +0 -5
  494. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/eval_metadata.json +0 -27
  495. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/outputs/result.md +0 -198
  496. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/grading.json +0 -28
  497. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  498. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/outputs/result.md +0 -94
  499. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/grading.json +0 -28
  500. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/timing.json +0 -1
  501. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/eval_metadata.json +0 -27
  502. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/outputs/result.md +0 -237
  503. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/grading.json +0 -28
  504. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  505. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/outputs/result.md +0 -134
  506. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/grading.json +0 -28
  507. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/timing.json +0 -1
  508. package/skills/sync-docs-workspace/iteration-2/benchmark.json +0 -297
  509. package/skills/sync-docs-workspace/iteration-2/benchmark.md +0 -13
  510. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/eval_metadata.json +0 -27
  511. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/outputs/result.md +0 -137
  512. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/grading.json +0 -92
  513. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  514. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/outputs/result.md +0 -134
  515. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/grading.json +0 -86
  516. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/timing.json +0 -1
  517. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/eval_metadata.json +0 -27
  518. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/outputs/result.md +0 -193
  519. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/grading.json +0 -72
  520. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  521. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/outputs/result.md +0 -211
  522. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/grading.json +0 -91
  523. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  524. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/eval_metadata.json +0 -27
  525. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/outputs/result.md +0 -182
  526. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  527. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  528. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/outputs/result.md +0 -222
  529. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/grading.json +0 -88
  530. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  531. package/skills/sync-docs-workspace/iteration-3/benchmark.json +0 -298
  532. package/skills/sync-docs-workspace/iteration-3/benchmark.md +0 -13
  533. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/eval_metadata.json +0 -27
  534. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/outputs/result.md +0 -125
  535. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/grading.json +0 -97
  536. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/timing.json +0 -5
  537. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/outputs/result.md +0 -144
  538. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/grading.json +0 -78
  539. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  540. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/eval_metadata.json +0 -27
  541. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/outputs/result.md +0 -104
  542. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/grading.json +0 -91
  543. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/timing.json +0 -5
  544. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/outputs/result.md +0 -79
  545. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/grading.json +0 -82
  546. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  547. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/eval_metadata.json +0 -27
  548. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase1_context.json +0 -302
  549. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase2_drift.txt +0 -33
  550. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase3_analysis.json +0 -114
  551. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase4_fix.txt +0 -118
  552. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase5_validate.txt +0 -38
  553. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/result.md +0 -158
  554. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  555. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/timing.json +0 -5
  556. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/outputs/result.md +0 -71
  557. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/grading.json +0 -90
  558. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  559. package/skills/test-planning/SKILL.md +0 -465
  560. package/skills/test-planning/evals/evals.json +0 -23
  561. package/skills/updating-service-skills/SKILL.md +0 -136
  562. package/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  563. package/skills/using-quality-gates/SKILL.md +0 -254
  564. package/skills/using-serena-lsp/README.md +0 -8
  565. package/skills/using-serena-lsp/REFERENCE.md +0 -194
  566. package/skills/using-serena-lsp/SKILL.md +0 -82
  567. package/skills/using-service-skills/SKILL.md +0 -108
  568. package/skills/using-service-skills/scripts/cataloger.py +0 -74
  569. package/skills/using-service-skills/scripts/skill_activator.py +0 -152
  570. package/skills/using-service-skills/scripts/test_skill_activator.py +0 -58
  571. package/skills/using-tdd/SKILL.md +0 -410
  572. package/skills/using-xtrm/SKILL.md +0 -127
  573. package/skills/xt-debugging/SKILL.md +0 -149
  574. package/skills/xt-end/SKILL.md +0 -297
  575. package/skills/xt-merge/SKILL.md +0 -313
  576. /package/{config → .xtrm/config}/.env.example +0 -0
  577. /package/{config/mcp_servers_optional.json → .xtrm/config/claude.mcp.optional.json} +0 -0
  578. /package/{hooks → .xtrm/config}/hooks.json +0 -0
  579. /package/{config → .xtrm/config}/pi/auth.json.template +0 -0
  580. /package/{config → .xtrm/config}/pi/extensions/auto-session-name/index.ts +0 -0
  581. /package/{config → .xtrm/config}/pi/extensions/auto-session-name/package.json +0 -0
  582. /package/{config → .xtrm/config}/pi/extensions/auto-update/index.ts +0 -0
  583. /package/{config → .xtrm/config}/pi/extensions/auto-update/package.json +0 -0
  584. /package/{config → .xtrm/config}/pi/extensions/beads/package.json +0 -0
  585. /package/{config → .xtrm/config}/pi/extensions/compact-header/index.ts +0 -0
  586. /package/{config → .xtrm/config}/pi/extensions/compact-header/package.json +0 -0
  587. /package/{config → .xtrm/config}/pi/extensions/core/adapter.ts +0 -0
  588. /package/{config → .xtrm/config}/pi/extensions/core/guard-rules.ts +0 -0
  589. /package/{config → .xtrm/config}/pi/extensions/core/lib.ts +0 -0
  590. /package/{config → .xtrm/config}/pi/extensions/core/logger.ts +0 -0
  591. /package/{config → .xtrm/config}/pi/extensions/core/package.json +0 -0
  592. /package/{config → .xtrm/config}/pi/extensions/core/runner.ts +0 -0
  593. /package/{config → .xtrm/config}/pi/extensions/core/session-state.ts +0 -0
  594. /package/{config → .xtrm/config}/pi/extensions/custom-footer/package.json +0 -0
  595. /package/{config → .xtrm/config}/pi/extensions/custom-provider-qwen-cli/index.ts +0 -0
  596. /package/{config → .xtrm/config}/pi/extensions/custom-provider-qwen-cli/package.json +0 -0
  597. /package/{config → .xtrm/config}/pi/extensions/git-checkpoint/index.ts +0 -0
  598. /package/{config → .xtrm/config}/pi/extensions/git-checkpoint/package.json +0 -0
  599. /package/{config → .xtrm/config}/pi/extensions/lsp-bootstrap/index.ts +0 -0
  600. /package/{config → .xtrm/config}/pi/extensions/lsp-bootstrap/package.json +0 -0
  601. /package/{config → .xtrm/config}/pi/extensions/pi-serena-compact/index.ts +0 -0
  602. /package/{config → .xtrm/config}/pi/extensions/pi-serena-compact/package.json +0 -0
  603. /package/{config → .xtrm/config}/pi/extensions/quality-gates/index.ts +0 -0
  604. /package/{config → .xtrm/config}/pi/extensions/quality-gates/package.json +0 -0
  605. /package/{config → .xtrm/config}/pi/extensions/service-skills/index.ts +0 -0
  606. /package/{config → .xtrm/config}/pi/extensions/service-skills/package.json +0 -0
  607. /package/{config → .xtrm/config}/pi/extensions/session-flow/index.ts +0 -0
  608. /package/{config → .xtrm/config}/pi/extensions/session-flow/package.json +0 -0
  609. /package/{config → .xtrm/config}/pi/extensions/xtrm-loader/index.ts +0 -0
  610. /package/{config → .xtrm/config}/pi/extensions/xtrm-loader/package.json +0 -0
  611. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/format.ts +0 -0
  612. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/package.json +0 -0
  613. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/themes/pidex-dark.json +0 -0
  614. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/themes/pidex-light.json +0 -0
  615. /package/{config → .xtrm/config}/pi/models.json.template +0 -0
  616. /package/{config → .xtrm/config}/pi/pi-worktrees-settings.json +0 -0
  617. /package/{config → .xtrm/config}/pi/settings.json.template +0 -0
  618. /package/{hooks → .xtrm/hooks}/beads-claim-sync.mjs +0 -0
  619. /package/{hooks → .xtrm/hooks}/beads-compact-restore.mjs +0 -0
  620. /package/{hooks → .xtrm/hooks}/beads-compact-save.mjs +0 -0
  621. /package/{hooks → .xtrm/hooks}/beads-edit-gate.mjs +0 -0
  622. /package/{hooks → .xtrm/hooks}/beads-gate-core.mjs +0 -0
  623. /package/{hooks → .xtrm/hooks}/beads-gate-messages.mjs +0 -0
  624. /package/{hooks → .xtrm/hooks}/beads-gate-utils.mjs +0 -0
  625. /package/{hooks → .xtrm/hooks}/beads-stop-gate.mjs +0 -0
  626. /package/{hooks → .xtrm/hooks}/gitnexus/gitnexus-hook.cjs +0 -0
  627. /package/{hooks → .xtrm/hooks}/quality-check.cjs +0 -0
  628. /package/{hooks → .xtrm/hooks}/quality-check.py +0 -0
  629. /package/{hooks → .xtrm/hooks}/worktree-boundary.mjs +0 -0
  630. /package/{hooks → .xtrm/hooks}/xtrm-logger.mjs +0 -0
  631. /package/{hooks → .xtrm/hooks}/xtrm-session-logger.mjs +0 -0
  632. /package/{hooks → .xtrm/hooks}/xtrm-tool-logger.mjs +0 -0
@@ -1,297 +0,0 @@
1
- {
2
- "metadata": {
3
- "skill_name": "sync-docs",
4
- "skill_path": "<path/to/skill>",
5
- "executor_model": "<model-name>",
6
- "analyzer_model": "<model-name>",
7
- "timestamp": "2026-03-18T13:15:12Z",
8
- "evals_run": [
9
- 1,
10
- 2,
11
- 3
12
- ],
13
- "runs_per_configuration": 3
14
- },
15
- "runs": [
16
- {
17
- "eval_id": 3,
18
- "configuration": "with_skill",
19
- "run_number": 1,
20
- "result": {
21
- "pass_rate": 1.0,
22
- "passed": 4,
23
- "failed": 0,
24
- "total": 4,
25
- "time_seconds": 82.0,
26
- "tokens": 26000,
27
- "tool_calls": 0,
28
- "errors": 0
29
- },
30
- "expectations": [
31
- {
32
- "text": "Ran doc_structure_analyzer.py and cited its output",
33
- "passed": true,
34
- "evidence": "Phase 3 of the report cites specific script output: 'Line count: 192 / 200 threshold', 'Sections: 24', 'Extraction candidates flagged by script: None'. These metrics are consistent with structured script output rather than manual inspection, and the phrasing 'flagged by script' directly attributes them to an automated tool."
35
- },
36
- {
37
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
38
- "passed": true,
39
- "evidence": "The report names three sections with explicit docs/ destinations: 'Hooks Reference' (lines 114-141) -> docs/hooks.md, 'Policy System' (lines 66-87) -> docs/policies.md, 'MCP Servers' (lines 143-158) -> docs/mcp-servers.md. These appear both in the Phase 3 table and in the numbered summary under 'Three sections to replace with summary + link'."
40
- },
41
- {
42
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
43
- "passed": true,
44
- "evidence": "The report header states 'Mode: Audit only (Phase 1-3). No files were modified.' The 'Recommended Next Steps' section frames all actions as future work 'for explicit execution, not done here'. The 'What NOT to Do' section further reinforces restraint. No output files other than result.md are present in the outputs directory."
45
- },
46
- {
47
- "text": "Report is actionable with clear next steps",
48
- "passed": true,
49
- "evidence": "The 'Recommended Next Steps' section lists 4 numbered, specific, executable actions: (1) Fix CHANGELOG using add_entry.py, (2) Fix README version badge from 2.3.0 to 2.4.0, (3) Trim README duplicate sections using Serena tools, (4) Update stale Serena memories for hooks and installer architecture. Each step names the specific tool or method to use."
50
- }
51
- ],
52
- "notes": []
53
- },
54
- {
55
- "eval_id": 2,
56
- "configuration": "with_skill",
57
- "run_number": 1,
58
- "result": {
59
- "pass_rate": 1.0,
60
- "passed": 4,
61
- "failed": 0,
62
- "total": 4,
63
- "time_seconds": 120.0,
64
- "tokens": 0,
65
- "tool_calls": 0,
66
- "errors": 0
67
- },
68
- "expectations": [
69
- {
70
- "text": "Ran doc_structure_analyzer.py with --fix flag",
71
- "passed": true,
72
- "evidence": "result.md Command Executed section shows: `python3 /home/dawid/projects/xtrm-tools/skills/sync-docs/scripts/doc_structure_analyzer.py --fix --bd-remember --root=/home/dawid/projects/xtrm-tools/.claude/worktrees/agent-ad500878`"
73
- },
74
- {
75
- "text": "Handled both MISSING scaffolds AND INVALID_SCHEMA files (or correctly reported none found)",
76
- "passed": true,
77
- "evidence": "result.md shows 5 MISSING scaffold files created (hooks.md, pi-extensions.md, mcp-servers.md, policies.md, skills.md) and 7 INVALID_SCHEMA files fixed by injecting frontmatter (cleanup.md, delegation-architecture.md, hook-system-summary.md, mcp-servers-config.md, pi-extensions-migration.md, pre-install-cleanup.md, todo.md). Both categories were handled."
78
- },
79
- {
80
- "text": "Ran bd remember and reported the memory key",
81
- "passed": true,
82
- "evidence": "result.md bd Memory section reports key `sync-docs-fix-2026-03-18` and the full insight string. The script output JSON includes `bd_remember.key = 'sync-docs-fix-2026-03-18'`. Note: `stored: false` because no `.beads/` directory existed in the worktree, but the key was computed and reported, which satisfies the expectation."
83
- },
84
- {
85
- "text": "Ran validate_doc.py docs/ after fixing to confirm results",
86
- "passed": true,
87
- "evidence": "result.md validate_doc.py docs/ Result section shows all 12 files passed (12/12) with exit code 0, covering both the 5 newly created scaffolds and the 7 schema-fixed files."
88
- }
89
- ],
90
- "notes": []
91
- },
92
- {
93
- "eval_id": 1,
94
- "configuration": "with_skill",
95
- "run_number": 1,
96
- "result": {
97
- "pass_rate": 1.0,
98
- "passed": 4,
99
- "failed": 0,
100
- "total": 4,
101
- "time_seconds": 170.0,
102
- "tokens": 27000,
103
- "tool_calls": 0,
104
- "errors": 2
105
- },
106
- "expectations": [
107
- {
108
- "text": "Ran context_gatherer.py and reported bd closed issues or merged PRs with specific data",
109
- "passed": true,
110
- "evidence": "Phase 1 documents running 'skills/sync-docs/scripts/context_gatherer.py --since=30'. While the script returned empty arrays for bd_closed_issues due to a Dolt server connectivity issue from the worktree, the agent performed a manual fallback using 'bd list --state=closed --limit=10' and reported 8 specific named issues (jaggers-agent-tools-1lc, -7dwo, -8dhs, -9bl, -ihgz, -l1g, -p9wc, plus subtasks). Merged PRs were also reported with specific details: 10 PRs including PR #15 release/2.0.1, PR #14 chore/update-status-doc, PR #13 fix/agents-target, etc."
111
- },
112
- {
113
- "text": "Ran doc_structure_analyzer.py and cited its structured output (STALE, EXTRACTABLE, MISSING, etc.)",
114
- "passed": true,
115
- "evidence": "Phase 3 documents running 'skills/sync-docs/scripts/doc_structure_analyzer.py'. The result explicitly cites: README.md as EXTRACTABLE (192 lines, threshold 200) with 5 sections identified for extraction; CHANGELOG.md as STALE; 5 MISSING docs/ files (docs/hooks.md, docs/pi-extensions.md, docs/mcp-servers.md, docs/policies.md, docs/skills.md); and 7 existing docs/ files with INVALID_SCHEMA. The structured output vocabulary (STALE, EXTRACTABLE, MISSING, INVALID_SCHEMA) is used throughout."
116
- },
117
- {
118
- "text": "Detected the CHANGELOG version gap (package.json v2.4.0 vs CHANGELOG v2.0.0)",
119
- "passed": true,
120
- "evidence": "Phase 3 explicitly states: 'package.json version: 2.4.0', 'Latest CHANGELOG entry: v2.0.0', 'Gap: v2.1.0 through v2.4.0 are undocumented'. Outstanding Actions item 1 also calls out: 'Add entries for v2.1.0 through v2.4.0 using skills/documenting/scripts/changelog/add_entry.py'."
121
- },
122
- {
123
- "text": "Named at least one concrete next step with a specific file or action",
124
- "passed": true,
125
- "evidence": "The 'Outstanding Actions' section names 4 concrete next steps with specific files/tools: (1) 'Add entries for v2.1.0 through v2.4.0 using skills/documenting/scripts/changelog/add_entry.py'; (2) 'Use Serena to extract sections into their new docs/ files'; (3) 'Update 5 stale memories, especially ssot_cli_hooks_2026-02-03'; (4) 'Fill [5 scaffolded files] using Serena or by extracting from README'."
126
- }
127
- ],
128
- "notes": []
129
- },
130
- {
131
- "eval_id": 3,
132
- "configuration": "without_skill",
133
- "run_number": 1,
134
- "result": {
135
- "pass_rate": 0.75,
136
- "passed": 3,
137
- "failed": 1,
138
- "total": 4,
139
- "time_seconds": 75.0,
140
- "tokens": 15000,
141
- "tool_calls": 0,
142
- "errors": 0
143
- },
144
- "expectations": [
145
- {
146
- "text": "Ran doc_structure_analyzer.py and cited its output",
147
- "passed": false,
148
- "evidence": "No mention of doc_structure_analyzer.py anywhere in result.md. The audit was performed by directly reading files rather than running any script. No script output is quoted or referenced."
149
- },
150
- {
151
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
152
- "passed": true,
153
- "evidence": "result.md names six README sections with specific destinations: 'Hooks Reference' -> docs/hooks.md, 'Policy System' -> docs/policies.md, 'MCP Servers' -> docs/mcp.md, 'Plugin Structure' -> docs/plugin.md or XTRM-GUIDE.md, 'Skills table' -> docs/skills.md, 'Version History' -> CHANGELOG.md. The recommended moves table further enumerates these with priority levels."
154
- },
155
- {
156
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
157
- "passed": true,
158
- "evidence": "result.md is a read-only audit report. No --fix flag is mentioned, no files were edited, no docs/ files were created or modified. The report only analyzes and recommends."
159
- },
160
- {
161
- "text": "Report is actionable with clear next steps",
162
- "passed": true,
163
- "evidence": "result.md includes a 'Recommended Moves (Prioritized)' table with Priority (High/Medium/Low), README Section, Action (Move/Remove/Add), and Target columns. Each section also has a specific Verdict with a concrete instruction (e.g., 'Move this content to docs/policies.md', 'Remove this table from the README and rely on the CHANGELOG.md link')."
164
- }
165
- ],
166
- "notes": []
167
- },
168
- {
169
- "eval_id": 2,
170
- "configuration": "without_skill",
171
- "run_number": 1,
172
- "result": {
173
- "pass_rate": 1.0,
174
- "passed": 4,
175
- "failed": 0,
176
- "total": 4,
177
- "time_seconds": 129.8,
178
- "tokens": 5843,
179
- "tool_calls": 0,
180
- "errors": 1
181
- },
182
- "expectations": [
183
- {
184
- "text": "Ran doc_structure_analyzer.py with --fix flag",
185
- "passed": true,
186
- "evidence": "Step 2 of result.md shows the exact command run: 'python3 .../doc_structure_analyzer.py --root=... --fix' with stdout confirming 5 files created and 7 files fixed."
187
- },
188
- {
189
- "text": "Handled both MISSING scaffolds AND INVALID_SCHEMA files (or correctly reported none found)",
190
- "passed": true,
191
- "evidence": "Step 2 shows 5 MISSING scaffold files were created (hooks.md, pi-extensions.md, mcp-servers.md, policies.md, skills.md) and 7 INVALID_SCHEMA files had frontmatter injected (cleanup.md, delegation-architecture.md, hook-system-summary.md, mcp-servers-config.md, pi-extensions-migration.md, pre-install-cleanup.md, todo.md). Both categories were explicitly handled."
192
- },
193
- {
194
- "text": "Ran bd remember and reported the memory key",
195
- "passed": true,
196
- "evidence": "Step 4 shows bd remember was attempted with key 'sync-docs-fix-2026-03-18'. It failed with 'database jaggers_agent_tools not found on Dolt server at 127.0.0.1:13800', but the key was explicitly reported ('## bd Memory Key (intended): sync-docs-fix-2026-03-18') and the attempt was fully documented. Per grading note, attempt + reported key satisfies this assertion."
197
- },
198
- {
199
- "text": "Ran validate_doc.py docs/ after fixing to confirm results",
200
- "passed": true,
201
- "evidence": "Step 3 shows the command 'python3 .../validate_doc.py .../docs/' was run post-fix, with all 12 files showing [PASS] and final output 'Result: 12/12 files passed'."
202
- }
203
- ],
204
- "notes": [
205
- "README.md EXTRACTABLE \u2014 5 sections should move to docs/ but requires content judgment",
206
- "CHANGELOG.md STALE \u2014 v2.4.0 undocumented; requires add_entry.py and human input",
207
- "bd remember failed due to Dolt server database mismatch; key was reported manually in result.md"
208
- ]
209
- },
210
- {
211
- "eval_id": 1,
212
- "configuration": "without_skill",
213
- "run_number": 1,
214
- "result": {
215
- "pass_rate": 0.5,
216
- "passed": 2,
217
- "failed": 2,
218
- "total": 4,
219
- "time_seconds": 219.9,
220
- "tokens": 8123,
221
- "tool_calls": 0,
222
- "errors": 0
223
- },
224
- "expectations": [
225
- {
226
- "text": "Ran context_gatherer.py and reported bd closed issues or merged PRs with specific data",
227
- "passed": false,
228
- "evidence": "The result contains specific bd closed issue data (#38, #33 with dates) and merged PR data (#102\u2013#111 with titles and dates). However, the report header explicitly states 'Assessed by: Manual review (git log, gh issue/pr, file reads)' \u2014 context_gatherer.py was never invoked. The data is present but was gathered manually, not via the script. The expectation requires the script to have been run."
229
- },
230
- {
231
- "text": "Ran doc_structure_analyzer.py and cited its structured output (STALE, EXTRACTABLE, MISSING, etc.)",
232
- "passed": false,
233
- "evidence": "No mention of doc_structure_analyzer.py anywhere in the result. The documentation analysis uses informal labels like 'Drifted' and 'Stale' from the agent's own judgment, not the structured taxonomy (STALE, EXTRACTABLE, MISSING) that the script would emit. The script was not run."
234
- },
235
- {
236
- "text": "Detected the CHANGELOG version gap (package.json v2.4.0 vs CHANGELOG v2.0.0)",
237
- "passed": true,
238
- "evidence": "Section 2 of the result is titled 'CHANGELOG.md Has No v2.4.0 Entry' and is rated High severity and listed as the #1 recommended action: 'Write the [2.4.0] CHANGELOG entry \u2014 this is the most critical gap. The release shipped but has no record.' The result also references the package version as 2.4.1 (cli/package.json) and 2.4.0 (released via PR #110). The specific last CHANGELOG version is not named but the gap is clearly identified and substantiated."
239
- },
240
- {
241
- "text": "Named at least one concrete next step with a specific file or action",
242
- "passed": true,
243
- "evidence": "The 'Recommended Actions (Priority Order)' section lists 7 concrete steps, each referencing specific files: e.g., '1. Write the [2.4.0] CHANGELOG entry', '2. Update README.md version badge, example output, and version history table to 2.4.0', '4. Bump plugins/xtrm-tools/.claude-plugin/plugin.json version to 2.4.0'."
244
- }
245
- ],
246
- "notes": []
247
- }
248
- ],
249
- "run_summary": {
250
- "with_skill": {
251
- "pass_rate": {
252
- "mean": 1.0,
253
- "stddev": 0.0,
254
- "min": 1.0,
255
- "max": 1.0
256
- },
257
- "time_seconds": {
258
- "mean": 124.0,
259
- "stddev": 44.1362,
260
- "min": 82.0,
261
- "max": 170.0
262
- },
263
- "tokens": {
264
- "mean": 17666.6667,
265
- "stddev": 15307.95,
266
- "min": 0,
267
- "max": 27000
268
- }
269
- },
270
- "without_skill": {
271
- "pass_rate": {
272
- "mean": 0.75,
273
- "stddev": 0.25,
274
- "min": 0.5,
275
- "max": 1.0
276
- },
277
- "time_seconds": {
278
- "mean": 141.5667,
279
- "stddev": 73.1631,
280
- "min": 75.0,
281
- "max": 219.9
282
- },
283
- "tokens": {
284
- "mean": 9655.3333,
285
- "stddev": 4766.9378,
286
- "min": 5843,
287
- "max": 15000
288
- }
289
- },
290
- "delta": {
291
- "pass_rate": "+0.25",
292
- "time_seconds": "-17.6",
293
- "tokens": "+8011"
294
- }
295
- },
296
- "notes": []
297
- }
@@ -1,13 +0,0 @@
1
- # Skill Benchmark: sync-docs
2
-
3
- **Model**: <model-name>
4
- **Date**: 2026-03-18T13:15:12Z
5
- **Evals**: 1, 2, 3 (3 runs each per configuration)
6
-
7
- ## Summary
8
-
9
- | Metric | With Skill | Without Skill | Delta |
10
- |--------|------------|---------------|-------|
11
- | Pass Rate | 100% ± 0% | 75% ± 25% | +0.25 |
12
- | Time | 124.0s ± 44.1s | 141.6s ± 73.2s | -17.6s |
13
- | Tokens | 17667 ± 15308 | 9655 ± 4767 | +8011 |
@@ -1,27 +0,0 @@
1
- {
2
- "eval_id": 3,
3
- "eval_name": "doc-audit",
4
- "prompt": "Do a doc audit. I think the README has sections that should be in docs/ but I'm not sure which ones.",
5
- "assertions": [
6
- {
7
- "text": "Ran doc_structure_analyzer.py and cited its output",
8
- "passed": false,
9
- "evidence": ""
10
- },
11
- {
12
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
13
- "passed": false,
14
- "evidence": ""
15
- },
16
- {
17
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
18
- "passed": false,
19
- "evidence": ""
20
- },
21
- {
22
- "text": "Report is actionable with clear next steps",
23
- "passed": false,
24
- "evidence": ""
25
- }
26
- ]
27
- }
@@ -1,137 +0,0 @@
1
- # Doc Audit Report — xtrm-tools
2
-
3
- **Date:** 2026-03-18
4
- **Task:** Audit README for sections that should be in docs/
5
- **Mode:** Audit only (Phase 1–3). No files were modified.
6
-
7
- ---
8
-
9
- ## Phase 1: Context Summary
10
-
11
- ### Recent Activity
12
-
13
- **Merged PRs (last ~30 days):**
14
- - PR #15 — release/2.0.1 (2026-03-13)
15
- - PR #14 — chore/update-status-doc (2026-03-13)
16
- - PR #13 — fix/agents-target (2026-03-13)
17
- - PR #12 — feat/project-install-all (2026-03-13)
18
- - PR #8 — phase2-cli-refactor (2026-03-12)
19
-
20
- **Recent significant commits (today):**
21
- - Add Pi extension drift checks and guard-rules parity
22
- - Centralize guard tool rules and matcher expansion
23
- - Deprecate install project command in favor of xtrm init
24
- - Add global-first architecture regression tests
25
- - Add project detection and service registry scaffolding to xtrm init
26
-
27
- **Active epic:** `jaggers-agent-tools-4xr6` — Global-first plugin architecture (hooks, skills, Pi extensions all go global; `xtrm init` replaces `install project`)
28
-
29
- This is a significant structural change cycle. The CLI commands table in README already shows `project init` but also still lists `install project <name>` — these may be in conflict now that install-project is deprecated.
30
-
31
- ---
32
-
33
- ## Phase 2: SSOT Drift (Serena Memories)
34
-
35
- **5 stale memories detected:**
36
-
37
- | Memory | Last Updated | Modified Files |
38
- |---|---|---|
39
- | `ssot_cli_hooks_2026-02-03` | 2026-02-25 | hooks/guard-rules.mjs, hooks/hooks.json, hooks/main-guard.mjs |
40
- | `ssot_cli_universal_hub_2026-02-19` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
41
- | `ssot_cli_ux_improvements_2026-02-22` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/commands/install-project.ts |
42
- | `ssot_jaggers-agent-tools_installer_architecture_2026-02-03` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
43
- | `ssot_jaggers-agent-tools_migration_2026-02-01` | 2026-02-01 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
44
-
45
- The hooks memories are stale due to the guard-rules centralization work done today. The installer architecture memories are stale due to the global-first migration and deprecation of `install-project`. These need updating but are out of scope for this audit (they require Serena tools and explicit intent to fix).
46
-
47
- ---
48
-
49
- ## Phase 3: Document Structure Analysis
50
-
51
- ### README.md — Status: OK (borderline)
52
-
53
- - **Line count:** 192 / 200 threshold
54
- - **Sections:** 24
55
- - **Extraction candidates flagged by script:** None
56
-
57
- The script reports `OK` because README is 8 lines under the 200-line bloat threshold. However, manual review reveals several sections that are substantive enough to warrant dedicated docs/ files or already have them:
58
-
59
- #### Sections with candidate docs/ homes
60
-
61
- | README Section | Lines | Status | Recommended Action |
62
- |---|---|---|---|
63
- | **Hooks Reference** (lines 114–141) | ~28 lines | Has `docs/hooks.md` | README section should be a 1-line summary + link to `docs/hooks.md` |
64
- | **MCP Servers** (lines 143–158) | ~16 lines | Has `docs/mcp-servers.md` | README section is a partial duplicate of `docs/mcp-servers.md` |
65
- | **Policy System** (lines 66–87) | ~22 lines | Has `docs/policies.md` | README section should be a 1-line summary + link to `docs/policies.md` |
66
- | **CLI Commands** (lines 89–111) | ~23 lines | No `docs/cli-reference.md` | At 6 commands + 3 flags this is borderline; when CLI grows, extract |
67
- | **Version History** (lines 179–187) | ~9 lines | Has CHANGELOG.md | Already linked; table is a useful quick summary, keep |
68
- | **Issue Tracking (Beads)** (lines 161–168) | ~8 lines | No dedicated docs/ file | Short enough to keep in README |
69
-
70
- **Key finding:** README has three sections (Hooks Reference, MCP Servers, Policy System) that directly duplicate content already in dedicated docs/ files. These sections should be replaced with single-line summaries + links. This would bring README down to approximately 130–140 lines and eliminate the drift risk.
71
-
72
- ### CHANGELOG.md — Status: STALE (critical)
73
-
74
- - **package.json version:** 2.4.0
75
- - **Latest CHANGELOG entry:** 2.0.0 (2026-03-12)
76
- - **Gap:** v2.1.x, v2.2.0, v2.3.0, and v2.4.0 are all undocumented in CHANGELOG
77
- - **Note:** README header also still says "Version 2.3.0" — should be 2.4.0
78
-
79
- The CHANGELOG has not been updated across multiple release cycles. This is the most critical finding.
80
-
81
- ### docs/ Files — Status: All OK
82
-
83
- All 10 existing docs/ files pass schema validation (have YAML frontmatter, no structural issues):
84
-
85
- - docs/hooks.md (133 lines) — OK
86
- - docs/mcp-servers.md (25 lines) — OK
87
- - docs/mcp.md (110 lines) — OK
88
- - docs/pi-extensions.md (25 lines) — OK
89
- - docs/policies.md (25 lines) — OK
90
- - docs/pre-install-cleanup.md (128 lines) — OK
91
- - docs/project-skills.md (105 lines) — OK
92
- - docs/skills.md (114 lines) — OK
93
- - docs/testing.md (148 lines) — OK
94
- - docs/todo.md (14 lines) — OK
95
-
96
- **No missing docs/ gaps** were flagged by the script for existing subsystems.
97
-
98
- ---
99
-
100
- ## Summary of Findings
101
-
102
- ### README Duplication (answer to the user's question)
103
-
104
- The README does contain sections that belong in docs/ — but not because they're missing docs/ files. The docs/ files already exist. The problem is that README still carries full content in those sections instead of pointing to the dedicated files.
105
-
106
- **Three sections to replace with summary + link:**
107
-
108
- 1. **"Hooks Reference"** (lines 114–141, ~28 lines) → summarize in 2–3 lines + link to `docs/hooks.md`
109
- 2. **"Policy System"** (lines 66–87, ~22 lines) → summarize in 2–3 lines + link to `docs/policies.md`
110
- 3. **"MCP Servers"** (lines 143–158, ~16 lines) → summarize in 1–2 lines + link to `docs/mcp-servers.md`
111
-
112
- Doing this would remove ~60 lines from README (192 → ~132), well within the healthy range, and eliminate drift between README and its docs/ counterparts.
113
-
114
- ### CHANGELOG is critically stale
115
-
116
- Four release versions (2.1.x through 2.4.0) have no CHANGELOG entries. The README version badge is also one version behind (shows 2.3.0, package.json is 2.4.0).
117
-
118
- ### Stale Serena memories (5 total)
119
-
120
- All relate to hooks and installer architecture — both subsystems were modified today as part of the global-first migration. These need updating via the `/documenting` skill or Phase 4 of this skill.
121
-
122
- ---
123
-
124
- ## What NOT to Do
125
-
126
- - Do not extract Beads, CLI Commands, Version History, or Quick Start from README — these are appropriate for a README-level entry point.
127
- - Do not create new docs/ files — all expected subsystem files already exist.
128
- - Do not touch the docs/ files themselves — they all pass schema validation.
129
-
130
- ---
131
-
132
- ## Recommended Next Steps (for explicit execution, not done here)
133
-
134
- 1. **Fix CHANGELOG** — add entries for v2.1.x, v2.2.0, v2.3.0, v2.4.0 using `add_entry.py`
135
- 2. **Fix README version badge** — update "Version 2.3.0" to "Version 2.4.0"
136
- 3. **Trim README duplicate sections** — replace Hooks Reference, Policy System, MCP Servers with summary + link (use Serena tools, not direct Edit)
137
- 4. **Update stale Serena memories** — especially `ssot_cli_hooks_*` and `ssot_jaggers-agent-tools_installer_architecture_*` given today's guard-rules and global-first changes
@@ -1,92 +0,0 @@
1
- {
2
- "expectations": [
3
- {
4
- "text": "Ran doc_structure_analyzer.py and cited its output",
5
- "passed": true,
6
- "evidence": "Phase 3 of the report cites specific script output: 'Line count: 192 / 200 threshold', 'Sections: 24', 'Extraction candidates flagged by script: None'. These metrics are consistent with structured script output rather than manual inspection, and the phrasing 'flagged by script' directly attributes them to an automated tool."
7
- },
8
- {
9
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
10
- "passed": true,
11
- "evidence": "The report names three sections with explicit docs/ destinations: 'Hooks Reference' (lines 114-141) -> docs/hooks.md, 'Policy System' (lines 66-87) -> docs/policies.md, 'MCP Servers' (lines 143-158) -> docs/mcp-servers.md. These appear both in the Phase 3 table and in the numbered summary under 'Three sections to replace with summary + link'."
12
- },
13
- {
14
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
15
- "passed": true,
16
- "evidence": "The report header states 'Mode: Audit only (Phase 1-3). No files were modified.' The 'Recommended Next Steps' section frames all actions as future work 'for explicit execution, not done here'. The 'What NOT to Do' section further reinforces restraint. No output files other than result.md are present in the outputs directory."
17
- },
18
- {
19
- "text": "Report is actionable with clear next steps",
20
- "passed": true,
21
- "evidence": "The 'Recommended Next Steps' section lists 4 numbered, specific, executable actions: (1) Fix CHANGELOG using add_entry.py, (2) Fix README version badge from 2.3.0 to 2.4.0, (3) Trim README duplicate sections using Serena tools, (4) Update stale Serena memories for hooks and installer architecture. Each step names the specific tool or method to use."
22
- }
23
- ],
24
- "summary": {
25
- "passed": 4,
26
- "failed": 0,
27
- "total": 4,
28
- "pass_rate": 1.0
29
- },
30
- "execution_metrics": {
31
- "tool_calls": {},
32
- "total_tool_calls": 0,
33
- "total_steps": 0,
34
- "errors_encountered": 0,
35
- "output_chars": 3871,
36
- "transcript_chars": 0
37
- },
38
- "timing": {
39
- "executor_duration_seconds": 0.0,
40
- "grader_duration_seconds": 0.0,
41
- "total_duration_seconds": 0.0
42
- },
43
- "claims": [
44
- {
45
- "claim": "README is 192 lines, just under the 200-line threshold",
46
- "type": "factual",
47
- "verified": false,
48
- "evidence": "Reported as script output but the README was not independently verified in grading. The number is internally consistent with the report's conclusion that README is 'borderline'."
49
- },
50
- {
51
- "claim": "5 stale Serena memories were detected",
52
- "type": "factual",
53
- "verified": false,
54
- "evidence": "The report lists 5 specific memory entries with dates and associated files. Cannot verify without access to the Serena memory store, but the specificity (named files, timestamps) suggests genuine inspection rather than fabrication."
55
- },
56
- {
57
- "claim": "All 10 existing docs/ files pass schema validation",
58
- "type": "quality",
59
- "verified": false,
60
- "evidence": "10 docs/ files are listed with 'OK' status. The report attributes this to schema validation but no validator output or script name is cited for this check, making it less verifiable than the doc_structure_analyzer output."
61
- },
62
- {
63
- "claim": "CHANGELOG is missing entries for v2.1.x through v2.4.0",
64
- "type": "factual",
65
- "verified": false,
66
- "evidence": "Report states package.json shows 2.4.0 but CHANGELOG's latest entry is 2.0.0. Plausible given the stated active development cycle but not independently verified in grading."
67
- },
68
- {
69
- "claim": "No files were modified during the run",
70
- "type": "process",
71
- "verified": true,
72
- "evidence": "Only result.md is present in the outputs directory. No other files were created or edited as part of the run."
73
- }
74
- ],
75
- "user_notes_summary": {
76
- "uncertainties": [],
77
- "needs_review": [],
78
- "workarounds": []
79
- },
80
- "eval_feedback": {
81
- "suggestions": [
82
- {
83
- "assertion": "Ran doc_structure_analyzer.py and cited its output",
84
- "reason": "The assertion passes based on plausible script-attributed output in the report, but there is no transcript available to confirm the script was actually executed (e.g., a Bash tool call). A stronger assertion would require a transcript showing the actual tool invocation, or the raw script output as a separate artifact in outputs/. As written, a well-crafted fabrication would also pass this assertion."
85
- },
86
- {
87
- "reason": "No assertion checks the accuracy of the section-to-docs/ mapping. The report correctly identifies docs/hooks.md, docs/policies.md, and docs/mcp-servers.md as targets, but an eval that verifies those files actually exist in the repo would catch hallucinated destinations. Consider adding: 'All recommended docs/ destinations exist as actual files in the repository'."
88
- }
89
- ],
90
- "overall": "The four assertions are well-chosen and cover the key audit behaviors. The main gap is that expectation 1 (script was run) cannot be fully verified without a transcript or raw script output artifact. The eval would be stronger if it required evidence of actual execution rather than cited output alone."
91
- }
92
- }
@@ -1 +0,0 @@
1
- {"total_tokens": 26000, "duration_ms": 82000, "total_duration_seconds": 82.0}