xtrm-tools 0.7.0 → 0.7.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (633)
  1. package/.xtrm/config/README.md +10 -0
  2. package/{config/mcp_servers.json → .xtrm/config/claude.mcp.json} +0 -28
  3. package/{config → .xtrm/config}/instructions/agents-top.md +12 -3
  4. package/{config → .xtrm/config}/instructions/claude-top.md +12 -3
  5. package/{config → .xtrm/config}/pi/extensions/beads/index.ts +44 -13
  6. package/{config → .xtrm/config}/pi/extensions/custom-footer/index.ts +59 -82
  7. package/{config → .xtrm/config}/pi/extensions/xtrm-ui/index.ts +2 -2
  8. package/{config → .xtrm/config}/pi/install-schema.json +2 -2
  9. package/.xtrm/config/pi.mcp.json +39 -0
  10. package/.xtrm/config/settings.json +41 -0
  11. package/.xtrm/extensions/auto-session-name/index.ts +29 -0
  12. package/.xtrm/extensions/auto-session-name/package.json +16 -0
  13. package/.xtrm/extensions/auto-update/index.ts +71 -0
  14. package/.xtrm/extensions/auto-update/package.json +16 -0
  15. package/.xtrm/extensions/beads/index.ts +232 -0
  16. package/.xtrm/extensions/beads/package.json +19 -0
  17. package/.xtrm/extensions/compact-header/index.ts +69 -0
  18. package/.xtrm/extensions/compact-header/package.json +16 -0
  19. package/.xtrm/extensions/core/adapter.ts +52 -0
  20. package/.xtrm/extensions/core/guard-rules.ts +100 -0
  21. package/.xtrm/extensions/core/lib.ts +3 -0
  22. package/.xtrm/extensions/core/logger.ts +45 -0
  23. package/.xtrm/extensions/core/package.json +18 -0
  24. package/.xtrm/extensions/core/runner.ts +71 -0
  25. package/.xtrm/extensions/core/session-state.ts +59 -0
  26. package/.xtrm/extensions/custom-footer/index.ts +398 -0
  27. package/.xtrm/extensions/custom-footer/package.json +19 -0
  28. package/.xtrm/extensions/custom-provider-qwen-cli/index.ts +363 -0
  29. package/.xtrm/extensions/custom-provider-qwen-cli/package.json +1 -0
  30. package/.xtrm/extensions/git-checkpoint/index.ts +53 -0
  31. package/.xtrm/extensions/git-checkpoint/package.json +16 -0
  32. package/.xtrm/extensions/lsp-bootstrap/index.ts +134 -0
  33. package/.xtrm/extensions/lsp-bootstrap/package.json +17 -0
  34. package/.xtrm/extensions/pi-serena-compact/index.ts +121 -0
  35. package/.xtrm/extensions/pi-serena-compact/package.json +16 -0
  36. package/.xtrm/extensions/quality-gates/index.ts +66 -0
  37. package/.xtrm/extensions/quality-gates/package.json +19 -0
  38. package/.xtrm/extensions/service-skills/index.ts +108 -0
  39. package/.xtrm/extensions/service-skills/package.json +19 -0
  40. package/.xtrm/extensions/session-flow/index.ts +96 -0
  41. package/.xtrm/extensions/session-flow/package.json +19 -0
  42. package/.xtrm/extensions/xtrm-loader/index.ts +152 -0
  43. package/.xtrm/extensions/xtrm-loader/package.json +19 -0
  44. package/.xtrm/extensions/xtrm-ui/format.ts +93 -0
  45. package/.xtrm/extensions/xtrm-ui/index.ts +1044 -0
  46. package/.xtrm/extensions/xtrm-ui/package.json +10 -0
  47. package/.xtrm/extensions/xtrm-ui/themes/pidex-dark.json +85 -0
  48. package/.xtrm/extensions/xtrm-ui/themes/pidex-light.json +85 -0
  49. package/{hooks → .xtrm/hooks}/README.md +2 -1
  50. package/{hooks → .xtrm/hooks}/beads-commit-gate.mjs +4 -0
  51. package/.xtrm/hooks/beads-memory-gate.mjs +119 -0
  52. package/{plugins/xtrm-tools → .xtrm}/hooks/quality-check-env.mjs +1 -4
  53. package/.xtrm/hooks/statusline.mjs +156 -0
  54. package/{plugins/xtrm-tools → .xtrm}/hooks/using-xtrm-reminder.mjs +8 -7
  55. package/.xtrm/registry.json +1323 -0
  56. package/CHANGELOG.md +31 -0
  57. package/README.md +20 -3
  58. package/cli/dist/index.cjs +26796 -30901
  59. package/cli/dist/index.cjs.map +1 -1
  60. package/cli/package.json +6 -3
  61. package/package.json +15 -13
  62. package/scripts/ghgrep.mjs +358 -0
  63. package/.claude-plugin/marketplace.json +0 -19
  64. package/.claude-plugin/plugin.json +0 -9
  65. package/config/hooks.json +0 -83
  66. package/config/settings.json +0 -70
  67. package/hooks/beads-memory-gate.mjs +0 -94
  68. package/hooks/quality-check-env.mjs +0 -79
  69. package/hooks/statusline.mjs +0 -183
  70. package/hooks/tsconfig-cache.json +0 -4
  71. package/hooks/using-xtrm-reminder.mjs +0 -47
  72. package/plugins/xtrm-tools/.claude-plugin/plugin.json +0 -9
  73. package/plugins/xtrm-tools/.mcp.json +0 -18
  74. package/plugins/xtrm-tools/hooks/README.md +0 -61
  75. package/plugins/xtrm-tools/hooks/beads-claim-sync.mjs +0 -154
  76. package/plugins/xtrm-tools/hooks/beads-commit-gate.mjs +0 -70
  77. package/plugins/xtrm-tools/hooks/beads-compact-restore.mjs +0 -77
  78. package/plugins/xtrm-tools/hooks/beads-compact-save.mjs +0 -63
  79. package/plugins/xtrm-tools/hooks/beads-edit-gate.mjs +0 -85
  80. package/plugins/xtrm-tools/hooks/beads-gate-core.mjs +0 -236
  81. package/plugins/xtrm-tools/hooks/beads-gate-messages.mjs +0 -75
  82. package/plugins/xtrm-tools/hooks/beads-gate-utils.mjs +0 -176
  83. package/plugins/xtrm-tools/hooks/beads-memory-gate.mjs +0 -94
  84. package/plugins/xtrm-tools/hooks/beads-stop-gate.mjs +0 -53
  85. package/plugins/xtrm-tools/hooks/gitnexus/gitnexus-hook.cjs +0 -222
  86. package/plugins/xtrm-tools/hooks/hooks.json +0 -129
  87. package/plugins/xtrm-tools/hooks/quality-check.cjs +0 -1286
  88. package/plugins/xtrm-tools/hooks/quality-check.py +0 -345
  89. package/plugins/xtrm-tools/hooks/statusline.mjs +0 -183
  90. package/plugins/xtrm-tools/hooks/tsconfig-cache.json +0 -4
  91. package/plugins/xtrm-tools/hooks/worktree-boundary.mjs +0 -33
  92. package/plugins/xtrm-tools/hooks/xtrm-logger.mjs +0 -123
  93. package/plugins/xtrm-tools/hooks/xtrm-session-logger.mjs +0 -27
  94. package/plugins/xtrm-tools/hooks/xtrm-tool-logger.mjs +0 -53
  95. package/plugins/xtrm-tools/skills/README.txt +0 -31
  96. package/plugins/xtrm-tools/skills/clean-code/SKILL.md +0 -201
  97. package/plugins/xtrm-tools/skills/creating-service-skills/SKILL.md +0 -433
  98. package/plugins/xtrm-tools/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  99. package/plugins/xtrm-tools/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  100. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/bootstrap.py +0 -326
  101. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  102. package/plugins/xtrm-tools/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  103. package/plugins/xtrm-tools/skills/delegating/SKILL.md +0 -196
  104. package/plugins/xtrm-tools/skills/delegating/config.yaml +0 -210
  105. package/plugins/xtrm-tools/skills/delegating/references/orchestration-protocols.md +0 -41
  106. package/plugins/xtrm-tools/skills/docker-expert/SKILL.md +0 -409
  107. package/plugins/xtrm-tools/skills/documenting/CHANGELOG.md +0 -23
  108. package/plugins/xtrm-tools/skills/documenting/README.md +0 -148
  109. package/plugins/xtrm-tools/skills/documenting/SKILL.md +0 -113
  110. package/plugins/xtrm-tools/skills/documenting/examples/example_pattern.md +0 -70
  111. package/plugins/xtrm-tools/skills/documenting/examples/example_reference.md +0 -70
  112. package/plugins/xtrm-tools/skills/documenting/examples/example_ssot_analytics.md +0 -64
  113. package/plugins/xtrm-tools/skills/documenting/examples/example_workflow.md +0 -141
  114. package/plugins/xtrm-tools/skills/documenting/references/changelog-format.md +0 -97
  115. package/plugins/xtrm-tools/skills/documenting/references/metadata-schema.md +0 -136
  116. package/plugins/xtrm-tools/skills/documenting/references/taxonomy.md +0 -81
  117. package/plugins/xtrm-tools/skills/documenting/references/versioning-rules.md +0 -78
  118. package/plugins/xtrm-tools/skills/documenting/scripts/bump_version.sh +0 -60
  119. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/__init__.py +0 -0
  120. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/add_entry.py +0 -216
  121. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/bump_release.py +0 -117
  122. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/init_changelog.py +0 -54
  123. package/plugins/xtrm-tools/skills/documenting/scripts/changelog/validate_changelog.py +0 -128
  124. package/plugins/xtrm-tools/skills/documenting/scripts/drift_detector.py +0 -266
  125. package/plugins/xtrm-tools/skills/documenting/scripts/generate_template.py +0 -311
  126. package/plugins/xtrm-tools/skills/documenting/scripts/list_by_category.sh +0 -84
  127. package/plugins/xtrm-tools/skills/documenting/scripts/orchestrator.py +0 -255
  128. package/plugins/xtrm-tools/skills/documenting/scripts/validate_metadata.py +0 -242
  129. package/plugins/xtrm-tools/skills/documenting/templates/CHANGELOG.md.template +0 -13
  130. package/plugins/xtrm-tools/skills/documenting/tests/integration_test.sh +0 -70
  131. package/plugins/xtrm-tools/skills/documenting/tests/test_changelog.py +0 -201
  132. package/plugins/xtrm-tools/skills/documenting/tests/test_drift_detector.py +0 -80
  133. package/plugins/xtrm-tools/skills/documenting/tests/test_orchestrator.py +0 -52
  134. package/plugins/xtrm-tools/skills/documenting/tests/test_validate_metadata.py +0 -64
  135. package/plugins/xtrm-tools/skills/find-skills/SKILL.md +0 -133
  136. package/plugins/xtrm-tools/skills/gitnexus-exploring/SKILL.md +0 -75
  137. package/plugins/xtrm-tools/skills/gitnexus-impact-analysis/SKILL.md +0 -94
  138. package/plugins/xtrm-tools/skills/gitnexus-refactoring/SKILL.md +0 -113
  139. package/plugins/xtrm-tools/skills/hook-development/SKILL.md +0 -797
  140. package/plugins/xtrm-tools/skills/hook-development/examples/load-context.sh +0 -55
  141. package/plugins/xtrm-tools/skills/hook-development/examples/quality-check.js +0 -1168
  142. package/plugins/xtrm-tools/skills/hook-development/examples/validate-bash.sh +0 -43
  143. package/plugins/xtrm-tools/skills/hook-development/examples/validate-write.sh +0 -38
  144. package/plugins/xtrm-tools/skills/hook-development/references/advanced.md +0 -527
  145. package/plugins/xtrm-tools/skills/hook-development/references/migration.md +0 -369
  146. package/plugins/xtrm-tools/skills/hook-development/references/patterns.md +0 -412
  147. package/plugins/xtrm-tools/skills/hook-development/scripts/README.md +0 -164
  148. package/plugins/xtrm-tools/skills/hook-development/scripts/hook-linter.sh +0 -153
  149. package/plugins/xtrm-tools/skills/hook-development/scripts/test-hook.sh +0 -252
  150. package/plugins/xtrm-tools/skills/hook-development/scripts/validate-hook-schema.sh +0 -159
  151. package/plugins/xtrm-tools/skills/obsidian-cli/SKILL.md +0 -106
  152. package/plugins/xtrm-tools/skills/orchestrating-agents/SKILL.md +0 -135
  153. package/plugins/xtrm-tools/skills/orchestrating-agents/config.yaml +0 -45
  154. package/plugins/xtrm-tools/skills/orchestrating-agents/references/agent-context-integration.md +0 -37
  155. package/plugins/xtrm-tools/skills/orchestrating-agents/references/examples.md +0 -45
  156. package/plugins/xtrm-tools/skills/orchestrating-agents/references/handover-protocol.md +0 -31
  157. package/plugins/xtrm-tools/skills/orchestrating-agents/references/workflows.md +0 -42
  158. package/plugins/xtrm-tools/skills/orchestrating-agents/scripts/detect_neighbors.py +0 -23
  159. package/plugins/xtrm-tools/skills/planning/SKILL.md +0 -405
  160. package/plugins/xtrm-tools/skills/planning/evals/evals.json +0 -19
  161. package/plugins/xtrm-tools/skills/prompt-improving/README.md +0 -162
  162. package/plugins/xtrm-tools/skills/prompt-improving/SKILL.md +0 -74
  163. package/plugins/xtrm-tools/skills/prompt-improving/references/analysis_commands.md +0 -24
  164. package/plugins/xtrm-tools/skills/prompt-improving/references/chain_of_thought.md +0 -24
  165. package/plugins/xtrm-tools/skills/prompt-improving/references/mcp_definitions.md +0 -20
  166. package/plugins/xtrm-tools/skills/prompt-improving/references/multishot.md +0 -23
  167. package/plugins/xtrm-tools/skills/prompt-improving/references/xml_core.md +0 -60
  168. package/plugins/xtrm-tools/skills/python-testing/SKILL.md +0 -815
  169. package/plugins/xtrm-tools/skills/scoping-service-skills/SKILL.md +0 -231
  170. package/plugins/xtrm-tools/skills/scoping-service-skills/scripts/scope.py +0 -74
  171. package/plugins/xtrm-tools/skills/senior-backend/SKILL.md +0 -209
  172. package/plugins/xtrm-tools/skills/senior-backend/references/api_design_patterns.md +0 -103
  173. package/plugins/xtrm-tools/skills/senior-backend/references/backend_security_practices.md +0 -103
  174. package/plugins/xtrm-tools/skills/senior-backend/references/database_optimization_guide.md +0 -103
  175. package/plugins/xtrm-tools/skills/senior-backend/scripts/api_load_tester.py +0 -114
  176. package/plugins/xtrm-tools/skills/senior-backend/scripts/api_scaffolder.py +0 -114
  177. package/plugins/xtrm-tools/skills/senior-backend/scripts/database_migration_tool.py +0 -114
  178. package/plugins/xtrm-tools/skills/senior-data-scientist/SKILL.md +0 -226
  179. package/plugins/xtrm-tools/skills/senior-data-scientist/references/experiment_design_frameworks.md +0 -80
  180. package/plugins/xtrm-tools/skills/senior-data-scientist/references/feature_engineering_patterns.md +0 -80
  181. package/plugins/xtrm-tools/skills/senior-data-scientist/references/statistical_methods_advanced.md +0 -80
  182. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/experiment_designer.py +0 -100
  183. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/feature_engineering_pipeline.py +0 -100
  184. package/plugins/xtrm-tools/skills/senior-data-scientist/scripts/model_evaluation_suite.py +0 -100
  185. package/plugins/xtrm-tools/skills/senior-devops/SKILL.md +0 -209
  186. package/plugins/xtrm-tools/skills/senior-devops/references/cicd_pipeline_guide.md +0 -103
  187. package/plugins/xtrm-tools/skills/senior-devops/references/deployment_strategies.md +0 -103
  188. package/plugins/xtrm-tools/skills/senior-devops/references/infrastructure_as_code.md +0 -103
  189. package/plugins/xtrm-tools/skills/senior-devops/scripts/deployment_manager.py +0 -114
  190. package/plugins/xtrm-tools/skills/senior-devops/scripts/pipeline_generator.py +0 -114
  191. package/plugins/xtrm-tools/skills/senior-devops/scripts/terraform_scaffolder.py +0 -114
  192. package/plugins/xtrm-tools/skills/senior-security/SKILL.md +0 -209
  193. package/plugins/xtrm-tools/skills/senior-security/references/cryptography_implementation.md +0 -103
  194. package/plugins/xtrm-tools/skills/senior-security/references/penetration_testing_guide.md +0 -103
  195. package/plugins/xtrm-tools/skills/senior-security/references/security_architecture_patterns.md +0 -103
  196. package/plugins/xtrm-tools/skills/senior-security/scripts/pentest_automator.py +0 -114
  197. package/plugins/xtrm-tools/skills/senior-security/scripts/security_auditor.py +0 -114
  198. package/plugins/xtrm-tools/skills/senior-security/scripts/threat_modeler.py +0 -114
  199. package/plugins/xtrm-tools/skills/skill-creator/LICENSE.txt +0 -202
  200. package/plugins/xtrm-tools/skills/skill-creator/SKILL.md +0 -479
  201. package/plugins/xtrm-tools/skills/skill-creator/agents/analyzer.md +0 -274
  202. package/plugins/xtrm-tools/skills/skill-creator/agents/comparator.md +0 -202
  203. package/plugins/xtrm-tools/skills/skill-creator/agents/grader.md +0 -223
  204. package/plugins/xtrm-tools/skills/skill-creator/assets/eval_review.html +0 -146
  205. package/plugins/xtrm-tools/skills/skill-creator/eval-viewer/generate_review.py +0 -471
  206. package/plugins/xtrm-tools/skills/skill-creator/eval-viewer/viewer.html +0 -1325
  207. package/plugins/xtrm-tools/skills/skill-creator/references/schemas.md +0 -430
  208. package/plugins/xtrm-tools/skills/skill-creator/scripts/__init__.py +0 -0
  209. package/plugins/xtrm-tools/skills/skill-creator/scripts/aggregate_benchmark.py +0 -401
  210. package/plugins/xtrm-tools/skills/skill-creator/scripts/generate_report.py +0 -326
  211. package/plugins/xtrm-tools/skills/skill-creator/scripts/improve_description.py +0 -248
  212. package/plugins/xtrm-tools/skills/skill-creator/scripts/package_skill.py +0 -136
  213. package/plugins/xtrm-tools/skills/skill-creator/scripts/quick_validate.py +0 -103
  214. package/plugins/xtrm-tools/skills/skill-creator/scripts/run_eval.py +0 -310
  215. package/plugins/xtrm-tools/skills/skill-creator/scripts/run_loop.py +0 -332
  216. package/plugins/xtrm-tools/skills/skill-creator/scripts/utils.py +0 -47
  217. package/plugins/xtrm-tools/skills/sync-docs/SKILL.md +0 -286
  218. package/plugins/xtrm-tools/skills/sync-docs/evals/evals.json +0 -89
  219. package/plugins/xtrm-tools/skills/sync-docs/references/doc-structure.md +0 -99
  220. package/plugins/xtrm-tools/skills/sync-docs/references/schema.md +0 -103
  221. package/plugins/xtrm-tools/skills/sync-docs/scripts/changelog/add_entry.py +0 -216
  222. package/plugins/xtrm-tools/skills/sync-docs/scripts/context_gatherer.py +0 -240
  223. package/plugins/xtrm-tools/skills/sync-docs/scripts/doc_structure_analyzer.py +0 -495
  224. package/plugins/xtrm-tools/skills/sync-docs/scripts/drift_detector.py +0 -563
  225. package/plugins/xtrm-tools/skills/sync-docs/scripts/validate_doc.py +0 -365
  226. package/plugins/xtrm-tools/skills/sync-docs/scripts/validate_metadata.py +0 -185
  227. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/benchmark.json +0 -293
  228. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/benchmark.md +0 -13
  229. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/eval_metadata.json +0 -27
  230. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/outputs/result.md +0 -210
  231. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/grading.json +0 -28
  232. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  233. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/outputs/result.md +0 -101
  234. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/grading.json +0 -28
  235. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  236. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/timing.json +0 -5
  237. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/eval_metadata.json +0 -27
  238. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/outputs/result.md +0 -198
  239. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/grading.json +0 -28
  240. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  241. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/outputs/result.md +0 -94
  242. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/grading.json +0 -28
  243. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/timing.json +0 -1
  244. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/eval_metadata.json +0 -27
  245. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/outputs/result.md +0 -237
  246. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/grading.json +0 -28
  247. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  248. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/outputs/result.md +0 -134
  249. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/grading.json +0 -28
  250. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/timing.json +0 -1
  251. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/benchmark.json +0 -297
  252. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/benchmark.md +0 -13
  253. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/eval_metadata.json +0 -27
  254. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/outputs/result.md +0 -137
  255. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/grading.json +0 -92
  256. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  257. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/outputs/result.md +0 -134
  258. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/grading.json +0 -86
  259. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/timing.json +0 -1
  260. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/eval_metadata.json +0 -27
  261. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/outputs/result.md +0 -193
  262. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/grading.json +0 -72
  263. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  264. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/outputs/result.md +0 -211
  265. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/grading.json +0 -91
  266. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  267. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/eval_metadata.json +0 -27
  268. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/outputs/result.md +0 -182
  269. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  270. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  271. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/outputs/result.md +0 -222
  272. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/grading.json +0 -88
  273. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  274. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/benchmark.json +0 -298
  275. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/benchmark.md +0 -13
  276. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/eval_metadata.json +0 -27
  277. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/outputs/result.md +0 -125
  278. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/grading.json +0 -97
  279. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/timing.json +0 -5
  280. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/outputs/result.md +0 -144
  281. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/grading.json +0 -78
  282. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  283. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/eval_metadata.json +0 -27
  284. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/outputs/result.md +0 -104
  285. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/grading.json +0 -91
  286. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/timing.json +0 -5
  287. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/outputs/result.md +0 -79
  288. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/grading.json +0 -82
  289. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  290. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/eval_metadata.json +0 -27
  291. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase1_context.json +0 -302
  292. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase2_drift.txt +0 -33
  293. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase3_analysis.json +0 -114
  294. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase4_fix.txt +0 -118
  295. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase5_validate.txt +0 -38
  296. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/result.md +0 -158
  297. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  298. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/timing.json +0 -5
  299. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/outputs/result.md +0 -71
  300. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/grading.json +0 -90
  301. package/plugins/xtrm-tools/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  302. package/plugins/xtrm-tools/skills/test-planning/SKILL.md +0 -465
  303. package/plugins/xtrm-tools/skills/test-planning/evals/evals.json +0 -23
  304. package/plugins/xtrm-tools/skills/updating-service-skills/SKILL.md +0 -136
  305. package/plugins/xtrm-tools/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  306. package/plugins/xtrm-tools/skills/using-quality-gates/SKILL.md +0 -254
  307. package/plugins/xtrm-tools/skills/using-serena-lsp/README.md +0 -8
  308. package/plugins/xtrm-tools/skills/using-serena-lsp/REFERENCE.md +0 -194
  309. package/plugins/xtrm-tools/skills/using-serena-lsp/SKILL.md +0 -82
  310. package/plugins/xtrm-tools/skills/using-service-skills/SKILL.md +0 -108
  311. package/plugins/xtrm-tools/skills/using-service-skills/scripts/cataloger.py +0 -74
  312. package/plugins/xtrm-tools/skills/using-service-skills/scripts/skill_activator.py +0 -152
  313. package/plugins/xtrm-tools/skills/using-service-skills/scripts/test_skill_activator.py +0 -58
  314. package/plugins/xtrm-tools/skills/using-tdd/SKILL.md +0 -410
  315. package/plugins/xtrm-tools/skills/using-xtrm/SKILL.md +0 -127
  316. package/plugins/xtrm-tools/skills/xt-debugging/SKILL.md +0 -149
  317. package/plugins/xtrm-tools/skills/xt-end/SKILL.md +0 -297
  318. package/plugins/xtrm-tools/skills/xt-merge/SKILL.md +0 -313
  319. package/project-skills/quality-gates/.claude/hooks/hook-config.json +0 -66
  320. package/project-skills/quality-gates/.claude/hooks/quality-check.cjs +0 -1286
  321. package/project-skills/quality-gates/.claude/hooks/quality-check.py +0 -334
  322. package/project-skills/quality-gates/.claude/settings.json +0 -3
  323. package/project-skills/quality-gates/.claude/skills/using-quality-gates/SKILL.md +0 -254
  324. package/project-skills/quality-gates/README.md +0 -109
  325. package/project-skills/quality-gates/evals/evals.json +0 -181
  326. package/project-skills/quality-gates/workspace/iteration-1/FINAL-EVAL-SUMMARY.md +0 -75
  327. package/project-skills/quality-gates/workspace/iteration-1/edge-case-auto-fix-verification/with_skill/outputs/response.md +0 -59
  328. package/project-skills/quality-gates/workspace/iteration-1/edge-case-mixed-language-project/with_skill/outputs/response.md +0 -60
  329. package/project-skills/quality-gates/workspace/iteration-1/eval-summary.md +0 -105
  330. package/project-skills/quality-gates/workspace/iteration-1/partial-install-python-only/with_skill/outputs/response.md +0 -93
  331. package/project-skills/quality-gates/workspace/iteration-1/python-refactor-request/with_skill/outputs/response.md +0 -104
  332. package/project-skills/quality-gates/workspace/iteration-1/quality-gate-error-fix/with_skill/outputs/response.md +0 -74
  333. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-general-chat/with_skill/outputs/response.md +0 -18
  334. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-math-question/with_skill/outputs/response.md +0 -18
  335. package/project-skills/quality-gates/workspace/iteration-1/should-not-trigger-unrelated-coding/with_skill/outputs/response.md +0 -56
  336. package/project-skills/quality-gates/workspace/iteration-1/tdd-guard-blocking-confusion/with_skill/outputs/response.md +0 -67
  337. package/project-skills/quality-gates/workspace/iteration-1/typescript-feature-with-tests/with_skill/outputs/response.md +0 -97
  338. package/project-skills/service-skills-set/.claude/git-hooks/doc_reminder.py +0 -67
  339. package/project-skills/service-skills-set/.claude/git-hooks/skill_staleness.py +0 -194
  340. package/project-skills/service-skills-set/.claude/service-registry.json +0 -4
  341. package/project-skills/service-skills-set/.claude/settings.json +0 -37
  342. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/SKILL.md +0 -433
  343. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  344. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  345. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/bootstrap.py +0 -308
  346. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  347. package/project-skills/service-skills-set/.claude/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  348. package/project-skills/service-skills-set/.claude/skills/scoping-service-skills/SKILL.md +0 -231
  349. package/project-skills/service-skills-set/.claude/skills/scoping-service-skills/scripts/scope.py +0 -74
  350. package/project-skills/service-skills-set/.claude/skills/updating-service-skills/SKILL.md +0 -136
  351. package/project-skills/service-skills-set/.claude/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  352. package/project-skills/service-skills-set/.claude/skills/using-service-skills/SKILL.md +0 -108
  353. package/project-skills/service-skills-set/.claude/skills/using-service-skills/scripts/cataloger.py +0 -74
  354. package/project-skills/service-skills-set/.claude/skills/using-service-skills/scripts/skill_activator.py +0 -152
  355. package/project-skills/service-skills-set/README.md +0 -93
  356. package/project-skills/service-skills-set/install-service-skills.py +0 -193
  357. package/project-skills/service-skills-set/service-skills-readme.md +0 -236
  358. package/skills/README.txt +0 -31
  359. package/skills/clean-code/SKILL.md +0 -201
  360. package/skills/creating-service-skills/SKILL.md +0 -433
  361. package/skills/creating-service-skills/references/script_quality_standards.md +0 -425
  362. package/skills/creating-service-skills/references/service_skill_system_guide.md +0 -278
  363. package/skills/creating-service-skills/scripts/bootstrap.py +0 -326
  364. package/skills/creating-service-skills/scripts/deep_dive.py +0 -304
  365. package/skills/creating-service-skills/scripts/scaffolder.py +0 -482
  366. package/skills/delegating/SKILL.md +0 -196
  367. package/skills/delegating/config.yaml +0 -210
  368. package/skills/delegating/references/orchestration-protocols.md +0 -41
  369. package/skills/docker-expert/SKILL.md +0 -409
  370. package/skills/documenting/CHANGELOG.md +0 -23
  371. package/skills/documenting/README.md +0 -148
  372. package/skills/documenting/SKILL.md +0 -113
  373. package/skills/documenting/examples/example_pattern.md +0 -70
  374. package/skills/documenting/examples/example_reference.md +0 -70
  375. package/skills/documenting/examples/example_ssot_analytics.md +0 -64
  376. package/skills/documenting/examples/example_workflow.md +0 -141
  377. package/skills/documenting/references/changelog-format.md +0 -97
  378. package/skills/documenting/references/metadata-schema.md +0 -136
  379. package/skills/documenting/references/taxonomy.md +0 -81
  380. package/skills/documenting/references/versioning-rules.md +0 -78
  381. package/skills/documenting/scripts/bump_version.sh +0 -60
  382. package/skills/documenting/scripts/changelog/__init__.py +0 -0
  383. package/skills/documenting/scripts/changelog/add_entry.py +0 -216
  384. package/skills/documenting/scripts/changelog/bump_release.py +0 -117
  385. package/skills/documenting/scripts/changelog/init_changelog.py +0 -54
  386. package/skills/documenting/scripts/changelog/validate_changelog.py +0 -128
  387. package/skills/documenting/scripts/drift_detector.py +0 -266
  388. package/skills/documenting/scripts/generate_template.py +0 -311
  389. package/skills/documenting/scripts/list_by_category.sh +0 -84
  390. package/skills/documenting/scripts/orchestrator.py +0 -255
  391. package/skills/documenting/scripts/validate_metadata.py +0 -242
  392. package/skills/documenting/templates/CHANGELOG.md.template +0 -13
  393. package/skills/find-skills/SKILL.md +0 -133
  394. package/skills/gitnexus-exploring/SKILL.md +0 -75
  395. package/skills/gitnexus-impact-analysis/SKILL.md +0 -94
  396. package/skills/gitnexus-refactoring/SKILL.md +0 -113
  397. package/skills/hook-development/SKILL.md +0 -797
  398. package/skills/hook-development/examples/load-context.sh +0 -55
  399. package/skills/hook-development/examples/quality-check.js +0 -1168
  400. package/skills/hook-development/examples/validate-bash.sh +0 -43
  401. package/skills/hook-development/examples/validate-write.sh +0 -38
  402. package/skills/hook-development/references/advanced.md +0 -527
  403. package/skills/hook-development/references/migration.md +0 -369
  404. package/skills/hook-development/references/patterns.md +0 -412
  405. package/skills/hook-development/scripts/README.md +0 -164
  406. package/skills/hook-development/scripts/hook-linter.sh +0 -153
  407. package/skills/hook-development/scripts/test-hook.sh +0 -252
  408. package/skills/hook-development/scripts/validate-hook-schema.sh +0 -159
  409. package/skills/obsidian-cli/SKILL.md +0 -106
  410. package/skills/orchestrating-agents/SKILL.md +0 -135
  411. package/skills/orchestrating-agents/config.yaml +0 -45
  412. package/skills/orchestrating-agents/references/agent-context-integration.md +0 -37
  413. package/skills/orchestrating-agents/references/examples.md +0 -45
  414. package/skills/orchestrating-agents/references/handover-protocol.md +0 -31
  415. package/skills/orchestrating-agents/references/workflows.md +0 -42
  416. package/skills/orchestrating-agents/scripts/detect_neighbors.py +0 -23
  417. package/skills/planning/SKILL.md +0 -405
  418. package/skills/planning/evals/evals.json +0 -19
  419. package/skills/prompt-improving/README.md +0 -162
  420. package/skills/prompt-improving/SKILL.md +0 -74
  421. package/skills/prompt-improving/references/analysis_commands.md +0 -24
  422. package/skills/prompt-improving/references/chain_of_thought.md +0 -24
  423. package/skills/prompt-improving/references/mcp_definitions.md +0 -20
  424. package/skills/prompt-improving/references/multishot.md +0 -23
  425. package/skills/prompt-improving/references/xml_core.md +0 -60
  426. package/skills/python-testing/SKILL.md +0 -815
  427. package/skills/scoping-service-skills/SKILL.md +0 -231
  428. package/skills/scoping-service-skills/scripts/scope.py +0 -74
  429. package/skills/senior-backend/SKILL.md +0 -209
  430. package/skills/senior-backend/references/api_design_patterns.md +0 -103
  431. package/skills/senior-backend/references/backend_security_practices.md +0 -103
  432. package/skills/senior-backend/references/database_optimization_guide.md +0 -103
  433. package/skills/senior-backend/scripts/api_load_tester.py +0 -114
  434. package/skills/senior-backend/scripts/api_scaffolder.py +0 -114
  435. package/skills/senior-backend/scripts/database_migration_tool.py +0 -114
  436. package/skills/senior-data-scientist/SKILL.md +0 -226
  437. package/skills/senior-data-scientist/references/experiment_design_frameworks.md +0 -80
  438. package/skills/senior-data-scientist/references/feature_engineering_patterns.md +0 -80
  439. package/skills/senior-data-scientist/references/statistical_methods_advanced.md +0 -80
  440. package/skills/senior-data-scientist/scripts/experiment_designer.py +0 -100
  441. package/skills/senior-data-scientist/scripts/feature_engineering_pipeline.py +0 -100
  442. package/skills/senior-data-scientist/scripts/model_evaluation_suite.py +0 -100
  443. package/skills/senior-devops/SKILL.md +0 -209
  444. package/skills/senior-devops/references/cicd_pipeline_guide.md +0 -103
  445. package/skills/senior-devops/references/deployment_strategies.md +0 -103
  446. package/skills/senior-devops/references/infrastructure_as_code.md +0 -103
  447. package/skills/senior-devops/scripts/deployment_manager.py +0 -114
  448. package/skills/senior-devops/scripts/pipeline_generator.py +0 -114
  449. package/skills/senior-devops/scripts/terraform_scaffolder.py +0 -114
  450. package/skills/senior-security/SKILL.md +0 -209
  451. package/skills/senior-security/references/cryptography_implementation.md +0 -103
  452. package/skills/senior-security/references/penetration_testing_guide.md +0 -103
  453. package/skills/senior-security/references/security_architecture_patterns.md +0 -103
  454. package/skills/senior-security/scripts/pentest_automator.py +0 -114
  455. package/skills/senior-security/scripts/security_auditor.py +0 -114
  456. package/skills/senior-security/scripts/threat_modeler.py +0 -114
  457. package/skills/skill-creator/LICENSE.txt +0 -202
  458. package/skills/skill-creator/SKILL.md +0 -479
  459. package/skills/skill-creator/agents/analyzer.md +0 -274
  460. package/skills/skill-creator/agents/comparator.md +0 -202
  461. package/skills/skill-creator/agents/grader.md +0 -223
  462. package/skills/skill-creator/assets/eval_review.html +0 -146
  463. package/skills/skill-creator/eval-viewer/generate_review.py +0 -471
  464. package/skills/skill-creator/eval-viewer/viewer.html +0 -1325
  465. package/skills/skill-creator/references/schemas.md +0 -430
  466. package/skills/skill-creator/scripts/__init__.py +0 -0
  467. package/skills/skill-creator/scripts/aggregate_benchmark.py +0 -401
  468. package/skills/skill-creator/scripts/generate_report.py +0 -326
  469. package/skills/skill-creator/scripts/improve_description.py +0 -248
  470. package/skills/skill-creator/scripts/package_skill.py +0 -136
  471. package/skills/skill-creator/scripts/quick_validate.py +0 -103
  472. package/skills/skill-creator/scripts/run_eval.py +0 -310
  473. package/skills/skill-creator/scripts/run_loop.py +0 -332
  474. package/skills/skill-creator/scripts/utils.py +0 -47
  475. package/skills/sync-docs/SKILL.md +0 -286
  476. package/skills/sync-docs/evals/evals.json +0 -89
  477. package/skills/sync-docs/references/doc-structure.md +0 -99
  478. package/skills/sync-docs/references/schema.md +0 -103
  479. package/skills/sync-docs/scripts/changelog/add_entry.py +0 -216
  480. package/skills/sync-docs/scripts/context_gatherer.py +0 -240
  481. package/skills/sync-docs/scripts/doc_structure_analyzer.py +0 -495
  482. package/skills/sync-docs/scripts/drift_detector.py +0 -563
  483. package/skills/sync-docs/scripts/validate_doc.py +0 -365
  484. package/skills/sync-docs/scripts/validate_metadata.py +0 -185
  485. package/skills/sync-docs-workspace/iteration-1/benchmark.json +0 -293
  486. package/skills/sync-docs-workspace/iteration-1/benchmark.md +0 -13
  487. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/eval_metadata.json +0 -27
  488. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/outputs/result.md +0 -210
  489. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/grading.json +0 -28
  490. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  491. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/outputs/result.md +0 -101
  492. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/grading.json +0 -28
  493. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  494. package/skills/sync-docs-workspace/iteration-1/eval-doc-audit/without_skill/timing.json +0 -5
  495. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/eval_metadata.json +0 -27
  496. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/outputs/result.md +0 -198
  497. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/grading.json +0 -28
  498. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  499. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/outputs/result.md +0 -94
  500. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/grading.json +0 -28
  501. package/skills/sync-docs-workspace/iteration-1/eval-fix-mode/without_skill/run-1/timing.json +0 -1
  502. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/eval_metadata.json +0 -27
  503. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/outputs/result.md +0 -237
  504. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/grading.json +0 -28
  505. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  506. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/outputs/result.md +0 -134
  507. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/grading.json +0 -28
  508. package/skills/sync-docs-workspace/iteration-1/eval-sprint-closeout/without_skill/run-1/timing.json +0 -1
  509. package/skills/sync-docs-workspace/iteration-2/benchmark.json +0 -297
  510. package/skills/sync-docs-workspace/iteration-2/benchmark.md +0 -13
  511. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/eval_metadata.json +0 -27
  512. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/outputs/result.md +0 -137
  513. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/grading.json +0 -92
  514. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/with_skill/run-1/timing.json +0 -1
  515. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/outputs/result.md +0 -134
  516. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/grading.json +0 -86
  517. package/skills/sync-docs-workspace/iteration-2/eval-doc-audit/without_skill/run-1/timing.json +0 -1
  518. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/eval_metadata.json +0 -27
  519. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/outputs/result.md +0 -193
  520. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/grading.json +0 -72
  521. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/with_skill/run-1/timing.json +0 -1
  522. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/outputs/result.md +0 -211
  523. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/grading.json +0 -91
  524. package/skills/sync-docs-workspace/iteration-2/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  525. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/eval_metadata.json +0 -27
  526. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/outputs/result.md +0 -182
  527. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  528. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/with_skill/run-1/timing.json +0 -1
  529. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/outputs/result.md +0 -222
  530. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/grading.json +0 -88
  531. package/skills/sync-docs-workspace/iteration-2/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  532. package/skills/sync-docs-workspace/iteration-3/benchmark.json +0 -298
  533. package/skills/sync-docs-workspace/iteration-3/benchmark.md +0 -13
  534. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/eval_metadata.json +0 -27
  535. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/outputs/result.md +0 -125
  536. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/grading.json +0 -97
  537. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/with_skill/run-1/timing.json +0 -5
  538. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/outputs/result.md +0 -144
  539. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/grading.json +0 -78
  540. package/skills/sync-docs-workspace/iteration-3/eval-doc-audit/without_skill/run-1/timing.json +0 -5
  541. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/eval_metadata.json +0 -27
  542. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/outputs/result.md +0 -104
  543. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/grading.json +0 -91
  544. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/with_skill/run-1/timing.json +0 -5
  545. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/outputs/result.md +0 -79
  546. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/grading.json +0 -82
  547. package/skills/sync-docs-workspace/iteration-3/eval-fix-mode/without_skill/run-1/timing.json +0 -5
  548. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/eval_metadata.json +0 -27
  549. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase1_context.json +0 -302
  550. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase2_drift.txt +0 -33
  551. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase3_analysis.json +0 -114
  552. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase4_fix.txt +0 -118
  553. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/phase5_validate.txt +0 -38
  554. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/outputs/result.md +0 -158
  555. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/grading.json +0 -95
  556. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/with_skill/run-1/timing.json +0 -5
  557. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/outputs/result.md +0 -71
  558. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/grading.json +0 -90
  559. package/skills/sync-docs-workspace/iteration-3/eval-sprint-closeout/without_skill/run-1/timing.json +0 -5
  560. package/skills/test-planning/SKILL.md +0 -465
  561. package/skills/test-planning/evals/evals.json +0 -23
  562. package/skills/updating-service-skills/SKILL.md +0 -136
  563. package/skills/updating-service-skills/scripts/drift_detector.py +0 -222
  564. package/skills/using-quality-gates/SKILL.md +0 -254
  565. package/skills/using-serena-lsp/README.md +0 -8
  566. package/skills/using-serena-lsp/REFERENCE.md +0 -194
  567. package/skills/using-serena-lsp/SKILL.md +0 -82
  568. package/skills/using-service-skills/SKILL.md +0 -108
  569. package/skills/using-service-skills/scripts/cataloger.py +0 -74
  570. package/skills/using-service-skills/scripts/skill_activator.py +0 -152
  571. package/skills/using-service-skills/scripts/test_skill_activator.py +0 -58
  572. package/skills/using-tdd/SKILL.md +0 -410
  573. package/skills/using-xtrm/SKILL.md +0 -127
  574. package/skills/xt-debugging/SKILL.md +0 -149
  575. package/skills/xt-end/SKILL.md +0 -297
  576. package/skills/xt-merge/SKILL.md +0 -313
  577. /package/{config → .xtrm/config}/.env.example +0 -0
  578. /package/{config/mcp_servers_optional.json → .xtrm/config/claude.mcp.optional.json} +0 -0
  579. /package/{hooks → .xtrm/config}/hooks.json +0 -0
  580. /package/{config → .xtrm/config}/pi/auth.json.template +0 -0
  581. /package/{config → .xtrm/config}/pi/extensions/auto-session-name/index.ts +0 -0
  582. /package/{config → .xtrm/config}/pi/extensions/auto-session-name/package.json +0 -0
  583. /package/{config → .xtrm/config}/pi/extensions/auto-update/index.ts +0 -0
  584. /package/{config → .xtrm/config}/pi/extensions/auto-update/package.json +0 -0
  585. /package/{config → .xtrm/config}/pi/extensions/beads/package.json +0 -0
  586. /package/{config → .xtrm/config}/pi/extensions/compact-header/index.ts +0 -0
  587. /package/{config → .xtrm/config}/pi/extensions/compact-header/package.json +0 -0
  588. /package/{config → .xtrm/config}/pi/extensions/core/adapter.ts +0 -0
  589. /package/{config → .xtrm/config}/pi/extensions/core/guard-rules.ts +0 -0
  590. /package/{config → .xtrm/config}/pi/extensions/core/lib.ts +0 -0
  591. /package/{config → .xtrm/config}/pi/extensions/core/logger.ts +0 -0
  592. /package/{config → .xtrm/config}/pi/extensions/core/package.json +0 -0
  593. /package/{config → .xtrm/config}/pi/extensions/core/runner.ts +0 -0
  594. /package/{config → .xtrm/config}/pi/extensions/core/session-state.ts +0 -0
  595. /package/{config → .xtrm/config}/pi/extensions/custom-footer/package.json +0 -0
  596. /package/{config → .xtrm/config}/pi/extensions/custom-provider-qwen-cli/index.ts +0 -0
  597. /package/{config → .xtrm/config}/pi/extensions/custom-provider-qwen-cli/package.json +0 -0
  598. /package/{config → .xtrm/config}/pi/extensions/git-checkpoint/index.ts +0 -0
  599. /package/{config → .xtrm/config}/pi/extensions/git-checkpoint/package.json +0 -0
  600. /package/{config → .xtrm/config}/pi/extensions/lsp-bootstrap/index.ts +0 -0
  601. /package/{config → .xtrm/config}/pi/extensions/lsp-bootstrap/package.json +0 -0
  602. /package/{config → .xtrm/config}/pi/extensions/pi-serena-compact/index.ts +0 -0
  603. /package/{config → .xtrm/config}/pi/extensions/pi-serena-compact/package.json +0 -0
  604. /package/{config → .xtrm/config}/pi/extensions/quality-gates/index.ts +0 -0
  605. /package/{config → .xtrm/config}/pi/extensions/quality-gates/package.json +0 -0
  606. /package/{config → .xtrm/config}/pi/extensions/service-skills/index.ts +0 -0
  607. /package/{config → .xtrm/config}/pi/extensions/service-skills/package.json +0 -0
  608. /package/{config → .xtrm/config}/pi/extensions/session-flow/index.ts +0 -0
  609. /package/{config → .xtrm/config}/pi/extensions/session-flow/package.json +0 -0
  610. /package/{config → .xtrm/config}/pi/extensions/xtrm-loader/index.ts +0 -0
  611. /package/{config → .xtrm/config}/pi/extensions/xtrm-loader/package.json +0 -0
  612. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/format.ts +0 -0
  613. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/package.json +0 -0
  614. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/themes/pidex-dark.json +0 -0
  615. /package/{config → .xtrm/config}/pi/extensions/xtrm-ui/themes/pidex-light.json +0 -0
  616. /package/{config → .xtrm/config}/pi/models.json.template +0 -0
  617. /package/{config → .xtrm/config}/pi/pi-worktrees-settings.json +0 -0
  618. /package/{config → .xtrm/config}/pi/settings.json.template +0 -0
  619. /package/{hooks → .xtrm/hooks}/beads-claim-sync.mjs +0 -0
  620. /package/{hooks → .xtrm/hooks}/beads-compact-restore.mjs +0 -0
  621. /package/{hooks → .xtrm/hooks}/beads-compact-save.mjs +0 -0
  622. /package/{hooks → .xtrm/hooks}/beads-edit-gate.mjs +0 -0
  623. /package/{hooks → .xtrm/hooks}/beads-gate-core.mjs +0 -0
  624. /package/{hooks → .xtrm/hooks}/beads-gate-messages.mjs +0 -0
  625. /package/{hooks → .xtrm/hooks}/beads-gate-utils.mjs +0 -0
  626. /package/{hooks → .xtrm/hooks}/beads-stop-gate.mjs +0 -0
  627. /package/{hooks → .xtrm/hooks}/gitnexus/gitnexus-hook.cjs +0 -0
  628. /package/{hooks → .xtrm/hooks}/quality-check.cjs +0 -0
  629. /package/{hooks → .xtrm/hooks}/quality-check.py +0 -0
  630. /package/{hooks → .xtrm/hooks}/worktree-boundary.mjs +0 -0
  631. /package/{hooks → .xtrm/hooks}/xtrm-logger.mjs +0 -0
  632. /package/{hooks → .xtrm/hooks}/xtrm-session-logger.mjs +0 -0
  633. /package/{hooks → .xtrm/hooks}/xtrm-tool-logger.mjs +0 -0
@@ -1,297 +0,0 @@
1
- {
2
- "metadata": {
3
- "skill_name": "sync-docs",
4
- "skill_path": "<path/to/skill>",
5
- "executor_model": "<model-name>",
6
- "analyzer_model": "<model-name>",
7
- "timestamp": "2026-03-18T13:15:12Z",
8
- "evals_run": [
9
- 1,
10
- 2,
11
- 3
12
- ],
13
- "runs_per_configuration": 3
14
- },
15
- "runs": [
16
- {
17
- "eval_id": 3,
18
- "configuration": "with_skill",
19
- "run_number": 1,
20
- "result": {
21
- "pass_rate": 1.0,
22
- "passed": 4,
23
- "failed": 0,
24
- "total": 4,
25
- "time_seconds": 82.0,
26
- "tokens": 26000,
27
- "tool_calls": 0,
28
- "errors": 0
29
- },
30
- "expectations": [
31
- {
32
- "text": "Ran doc_structure_analyzer.py and cited its output",
33
- "passed": true,
34
- "evidence": "Phase 3 of the report cites specific script output: 'Line count: 192 / 200 threshold', 'Sections: 24', 'Extraction candidates flagged by script: None'. These metrics are consistent with structured script output rather than manual inspection, and the phrasing 'flagged by script' directly attributes them to an automated tool."
35
- },
36
- {
37
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
38
- "passed": true,
39
- "evidence": "The report names three sections with explicit docs/ destinations: 'Hooks Reference' (lines 114-141) -> docs/hooks.md, 'Policy System' (lines 66-87) -> docs/policies.md, 'MCP Servers' (lines 143-158) -> docs/mcp-servers.md. These appear both in the Phase 3 table and in the numbered summary under 'Three sections to replace with summary + link'."
40
- },
41
- {
42
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
43
- "passed": true,
44
- "evidence": "The report header states 'Mode: Audit only (Phase 1-3). No files were modified.' The 'Recommended Next Steps' section frames all actions as future work 'for explicit execution, not done here'. The 'What NOT to Do' section further reinforces restraint. No output files other than result.md are present in the outputs directory."
45
- },
46
- {
47
- "text": "Report is actionable with clear next steps",
48
- "passed": true,
49
- "evidence": "The 'Recommended Next Steps' section lists 4 numbered, specific, executable actions: (1) Fix CHANGELOG using add_entry.py, (2) Fix README version badge from 2.3.0 to 2.4.0, (3) Trim README duplicate sections using Serena tools, (4) Update stale Serena memories for hooks and installer architecture. Each step names the specific tool or method to use."
50
- }
51
- ],
52
- "notes": []
53
- },
54
- {
55
- "eval_id": 2,
56
- "configuration": "with_skill",
57
- "run_number": 1,
58
- "result": {
59
- "pass_rate": 1.0,
60
- "passed": 4,
61
- "failed": 0,
62
- "total": 4,
63
- "time_seconds": 120.0,
64
- "tokens": 0,
65
- "tool_calls": 0,
66
- "errors": 0
67
- },
68
- "expectations": [
69
- {
70
- "text": "Ran doc_structure_analyzer.py with --fix flag",
71
- "passed": true,
72
- "evidence": "result.md Command Executed section shows: `python3 /home/dawid/projects/xtrm-tools/skills/sync-docs/scripts/doc_structure_analyzer.py --fix --bd-remember --root=/home/dawid/projects/xtrm-tools/.claude/worktrees/agent-ad500878`"
73
- },
74
- {
75
- "text": "Handled both MISSING scaffolds AND INVALID_SCHEMA files (or correctly reported none found)",
76
- "passed": true,
77
- "evidence": "result.md shows 5 MISSING scaffold files created (hooks.md, pi-extensions.md, mcp-servers.md, policies.md, skills.md) and 7 INVALID_SCHEMA files fixed by injecting frontmatter (cleanup.md, delegation-architecture.md, hook-system-summary.md, mcp-servers-config.md, pi-extensions-migration.md, pre-install-cleanup.md, todo.md). Both categories were handled."
78
- },
79
- {
80
- "text": "Ran bd remember and reported the memory key",
81
- "passed": true,
82
- "evidence": "result.md bd Memory section reports key `sync-docs-fix-2026-03-18` and the full insight string. The script output JSON includes `bd_remember.key = 'sync-docs-fix-2026-03-18'`. Note: `stored: false` because no `.beads/` directory existed in the worktree, but the key was computed and reported, which satisfies the expectation."
83
- },
84
- {
85
- "text": "Ran validate_doc.py docs/ after fixing to confirm results",
86
- "passed": true,
87
- "evidence": "result.md validate_doc.py docs/ Result section shows all 12 files passed (12/12) with exit code 0, covering both the 5 newly created scaffolds and the 7 schema-fixed files."
88
- }
89
- ],
90
- "notes": []
91
- },
92
- {
93
- "eval_id": 1,
94
- "configuration": "with_skill",
95
- "run_number": 1,
96
- "result": {
97
- "pass_rate": 1.0,
98
- "passed": 4,
99
- "failed": 0,
100
- "total": 4,
101
- "time_seconds": 170.0,
102
- "tokens": 27000,
103
- "tool_calls": 0,
104
- "errors": 2
105
- },
106
- "expectations": [
107
- {
108
- "text": "Ran context_gatherer.py and reported bd closed issues or merged PRs with specific data",
109
- "passed": true,
110
- "evidence": "Phase 1 documents running 'skills/sync-docs/scripts/context_gatherer.py --since=30'. While the script returned empty arrays for bd_closed_issues due to a Dolt server connectivity issue from the worktree, the agent performed a manual fallback using 'bd list --state=closed --limit=10' and reported 8 specific named issues (jaggers-agent-tools-1lc, -7dwo, -8dhs, -9bl, -ihgz, -l1g, -p9wc, plus subtasks). Merged PRs were also reported with specific details: 10 PRs including PR #15 release/2.0.1, PR #14 chore/update-status-doc, PR #13 fix/agents-target, etc."
111
- },
112
- {
113
- "text": "Ran doc_structure_analyzer.py and cited its structured output (STALE, EXTRACTABLE, MISSING, etc.)",
114
- "passed": true,
115
- "evidence": "Phase 3 documents running 'skills/sync-docs/scripts/doc_structure_analyzer.py'. The result explicitly cites: README.md as EXTRACTABLE (192 lines, threshold 200) with 5 sections identified for extraction; CHANGELOG.md as STALE; 5 MISSING docs/ files (docs/hooks.md, docs/pi-extensions.md, docs/mcp-servers.md, docs/policies.md, docs/skills.md); and 7 existing docs/ files with INVALID_SCHEMA. The structured output vocabulary (STALE, EXTRACTABLE, MISSING, INVALID_SCHEMA) is used throughout."
116
- },
117
- {
118
- "text": "Detected the CHANGELOG version gap (package.json v2.4.0 vs CHANGELOG v2.0.0)",
119
- "passed": true,
120
- "evidence": "Phase 3 explicitly states: 'package.json version: 2.4.0', 'Latest CHANGELOG entry: v2.0.0', 'Gap: v2.1.0 through v2.4.0 are undocumented'. Outstanding Actions item 1 also calls out: 'Add entries for v2.1.0 through v2.4.0 using skills/documenting/scripts/changelog/add_entry.py'."
121
- },
122
- {
123
- "text": "Named at least one concrete next step with a specific file or action",
124
- "passed": true,
125
- "evidence": "The 'Outstanding Actions' section names 4 concrete next steps with specific files/tools: (1) 'Add entries for v2.1.0 through v2.4.0 using skills/documenting/scripts/changelog/add_entry.py'; (2) 'Use Serena to extract sections into their new docs/ files'; (3) 'Update 5 stale memories, especially ssot_cli_hooks_2026-02-03'; (4) 'Fill [5 scaffolded files] using Serena or by extracting from README'."
126
- }
127
- ],
128
- "notes": []
129
- },
130
- {
131
- "eval_id": 3,
132
- "configuration": "without_skill",
133
- "run_number": 1,
134
- "result": {
135
- "pass_rate": 0.75,
136
- "passed": 3,
137
- "failed": 1,
138
- "total": 4,
139
- "time_seconds": 75.0,
140
- "tokens": 15000,
141
- "tool_calls": 0,
142
- "errors": 0
143
- },
144
- "expectations": [
145
- {
146
- "text": "Ran doc_structure_analyzer.py and cited its output",
147
- "passed": false,
148
- "evidence": "No mention of doc_structure_analyzer.py anywhere in result.md. The audit was performed by directly reading files rather than running any script. No script output is quoted or referenced."
149
- },
150
- {
151
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
152
- "passed": true,
153
- "evidence": "result.md names six README sections with specific destinations: 'Hooks Reference' -> docs/hooks.md, 'Policy System' -> docs/policies.md, 'MCP Servers' -> docs/mcp.md, 'Plugin Structure' -> docs/plugin.md or XTRM-GUIDE.md, 'Skills table' -> docs/skills.md, 'Version History' -> CHANGELOG.md. The recommended moves table further enumerates these with priority levels."
154
- },
155
- {
156
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
157
- "passed": true,
158
- "evidence": "result.md is a read-only audit report. No --fix flag is mentioned, no files were edited, no docs/ files were created or modified. The report only analyzes and recommends."
159
- },
160
- {
161
- "text": "Report is actionable with clear next steps",
162
- "passed": true,
163
- "evidence": "result.md includes a 'Recommended Moves (Prioritized)' table with Priority (High/Medium/Low), README Section, Action (Move/Remove/Add), and Target columns. Each section also has a specific Verdict with a concrete instruction (e.g., 'Move this content to docs/policies.md', 'Remove this table from the README and rely on the CHANGELOG.md link')."
164
- }
165
- ],
166
- "notes": []
167
- },
168
- {
169
- "eval_id": 2,
170
- "configuration": "without_skill",
171
- "run_number": 1,
172
- "result": {
173
- "pass_rate": 1.0,
174
- "passed": 4,
175
- "failed": 0,
176
- "total": 4,
177
- "time_seconds": 129.8,
178
- "tokens": 5843,
179
- "tool_calls": 0,
180
- "errors": 1
181
- },
182
- "expectations": [
183
- {
184
- "text": "Ran doc_structure_analyzer.py with --fix flag",
185
- "passed": true,
186
- "evidence": "Step 2 of result.md shows the exact command run: 'python3 .../doc_structure_analyzer.py --root=... --fix' with stdout confirming 5 files created and 7 files fixed."
187
- },
188
- {
189
- "text": "Handled both MISSING scaffolds AND INVALID_SCHEMA files (or correctly reported none found)",
190
- "passed": true,
191
- "evidence": "Step 2 shows 5 MISSING scaffold files were created (hooks.md, pi-extensions.md, mcp-servers.md, policies.md, skills.md) and 7 INVALID_SCHEMA files had frontmatter injected (cleanup.md, delegation-architecture.md, hook-system-summary.md, mcp-servers-config.md, pi-extensions-migration.md, pre-install-cleanup.md, todo.md). Both categories were explicitly handled."
192
- },
193
- {
194
- "text": "Ran bd remember and reported the memory key",
195
- "passed": true,
196
- "evidence": "Step 4 shows bd remember was attempted with key 'sync-docs-fix-2026-03-18'. It failed with 'database jaggers_agent_tools not found on Dolt server at 127.0.0.1:13800', but the key was explicitly reported ('## bd Memory Key (intended): sync-docs-fix-2026-03-18') and the attempt was fully documented. Per grading note, attempt + reported key satisfies this assertion."
197
- },
198
- {
199
- "text": "Ran validate_doc.py docs/ after fixing to confirm results",
200
- "passed": true,
201
- "evidence": "Step 3 shows the command 'python3 .../validate_doc.py .../docs/' was run post-fix, with all 12 files showing [PASS] and final output 'Result: 12/12 files passed'."
202
- }
203
- ],
204
- "notes": [
205
- "README.md EXTRACTABLE \u2014 5 sections should move to docs/ but requires content judgment",
206
- "CHANGELOG.md STALE \u2014 v2.4.0 undocumented; requires add_entry.py and human input",
207
- "bd remember failed due to Dolt server database mismatch; key was reported manually in result.md"
208
- ]
209
- },
210
- {
211
- "eval_id": 1,
212
- "configuration": "without_skill",
213
- "run_number": 1,
214
- "result": {
215
- "pass_rate": 0.5,
216
- "passed": 2,
217
- "failed": 2,
218
- "total": 4,
219
- "time_seconds": 219.9,
220
- "tokens": 8123,
221
- "tool_calls": 0,
222
- "errors": 0
223
- },
224
- "expectations": [
225
- {
226
- "text": "Ran context_gatherer.py and reported bd closed issues or merged PRs with specific data",
227
- "passed": false,
228
- "evidence": "The result contains specific bd closed issue data (#38, #33 with dates) and merged PR data (#102\u2013#111 with titles and dates). However, the report header explicitly states 'Assessed by: Manual review (git log, gh issue/pr, file reads)' \u2014 context_gatherer.py was never invoked. The data is present but was gathered manually, not via the script. The expectation requires the script to have been run."
229
- },
230
- {
231
- "text": "Ran doc_structure_analyzer.py and cited its structured output (STALE, EXTRACTABLE, MISSING, etc.)",
232
- "passed": false,
233
- "evidence": "No mention of doc_structure_analyzer.py anywhere in the result. The documentation analysis uses informal labels like 'Drifted' and 'Stale' from the agent's own judgment, not the structured taxonomy (STALE, EXTRACTABLE, MISSING) that the script would emit. The script was not run."
234
- },
235
- {
236
- "text": "Detected the CHANGELOG version gap (package.json v2.4.0 vs CHANGELOG v2.0.0)",
237
- "passed": true,
238
- "evidence": "Section 2 of the result is titled 'CHANGELOG.md Has No v2.4.0 Entry' and is rated High severity and listed as the #1 recommended action: 'Write the [2.4.0] CHANGELOG entry \u2014 this is the most critical gap. The release shipped but has no record.' The result also references the package version as 2.4.1 (cli/package.json) and 2.4.0 (released via PR #110). The specific last CHANGELOG version is not named but the gap is clearly identified and substantiated."
239
- },
240
- {
241
- "text": "Named at least one concrete next step with a specific file or action",
242
- "passed": true,
243
- "evidence": "The 'Recommended Actions (Priority Order)' section lists 7 concrete steps, each referencing specific files: e.g., '1. Write the [2.4.0] CHANGELOG entry', '2. Update README.md version badge, example output, and version history table to 2.4.0', '4. Bump plugins/xtrm-tools/.claude-plugin/plugin.json version to 2.4.0'."
244
- }
245
- ],
246
- "notes": []
247
- }
248
- ],
249
- "run_summary": {
250
- "with_skill": {
251
- "pass_rate": {
252
- "mean": 1.0,
253
- "stddev": 0.0,
254
- "min": 1.0,
255
- "max": 1.0
256
- },
257
- "time_seconds": {
258
- "mean": 124.0,
259
- "stddev": 44.1362,
260
- "min": 82.0,
261
- "max": 170.0
262
- },
263
- "tokens": {
264
- "mean": 17666.6667,
265
- "stddev": 15307.95,
266
- "min": 0,
267
- "max": 27000
268
- }
269
- },
270
- "without_skill": {
271
- "pass_rate": {
272
- "mean": 0.75,
273
- "stddev": 0.25,
274
- "min": 0.5,
275
- "max": 1.0
276
- },
277
- "time_seconds": {
278
- "mean": 141.5667,
279
- "stddev": 73.1631,
280
- "min": 75.0,
281
- "max": 219.9
282
- },
283
- "tokens": {
284
- "mean": 9655.3333,
285
- "stddev": 4766.9378,
286
- "min": 5843,
287
- "max": 15000
288
- }
289
- },
290
- "delta": {
291
- "pass_rate": "+0.25",
292
- "time_seconds": "-17.6",
293
- "tokens": "+8011"
294
- }
295
- },
296
- "notes": []
297
- }
@@ -1,13 +0,0 @@
1
- # Skill Benchmark: sync-docs
2
-
3
- **Model**: <model-name>
4
- **Date**: 2026-03-18T13:15:12Z
5
- **Evals**: 1, 2, 3 (3 runs each per configuration)
6
-
7
- ## Summary
8
-
9
- | Metric | With Skill | Without Skill | Delta |
10
- |--------|------------|---------------|-------|
11
- | Pass Rate | 100% ± 0% | 75% ± 25% | +0.25 |
12
- | Time | 124.0s ± 44.1s | 141.6s ± 73.2s | -17.6s |
13
- | Tokens | 17667 ± 15308 | 9655 ± 4767 | +8011 |
@@ -1,27 +0,0 @@
1
- {
2
- "eval_id": 3,
3
- "eval_name": "doc-audit",
4
- "prompt": "Do a doc audit. I think the README has sections that should be in docs/ but I'm not sure which ones.",
5
- "assertions": [
6
- {
7
- "text": "Ran doc_structure_analyzer.py and cited its output",
8
- "passed": false,
9
- "evidence": ""
10
- },
11
- {
12
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
13
- "passed": false,
14
- "evidence": ""
15
- },
16
- {
17
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
18
- "passed": false,
19
- "evidence": ""
20
- },
21
- {
22
- "text": "Report is actionable with clear next steps",
23
- "passed": false,
24
- "evidence": ""
25
- }
26
- ]
27
- }
@@ -1,137 +0,0 @@
1
- # Doc Audit Report — xtrm-tools
2
-
3
- **Date:** 2026-03-18
4
- **Task:** Audit README for sections that should be in docs/
5
- **Mode:** Audit only (Phase 1–3). No files were modified.
6
-
7
- ---
8
-
9
- ## Phase 1: Context Summary
10
-
11
- ### Recent Activity
12
-
13
- **Merged PRs (last ~30 days):**
14
- - PR #15 — release/2.0.1 (2026-03-13)
15
- - PR #14 — chore/update-status-doc (2026-03-13)
16
- - PR #13 — fix/agents-target (2026-03-13)
17
- - PR #12 — feat/project-install-all (2026-03-13)
18
- - PR #8 — phase2-cli-refactor (2026-03-12)
19
-
20
- **Recent significant commits (today):**
21
- - Add Pi extension drift checks and guard-rules parity
22
- - Centralize guard tool rules and matcher expansion
23
- - Deprecate install project command in favor of xtrm init
24
- - Add global-first architecture regression tests
25
- - Add project detection and service registry scaffolding to xtrm init
26
-
27
- **Active epic:** `jaggers-agent-tools-4xr6` — Global-first plugin architecture (hooks, skills, Pi extensions all go global; `xtrm init` replaces `install project`)
28
-
29
- This is a significant structural change cycle. The CLI commands table in README already shows `project init` but also still lists `install project <name>` — these may be in conflict now that install-project is deprecated.
30
-
31
- ---
32
-
33
- ## Phase 2: SSOT Drift (Serena Memories)
34
-
35
- **5 stale memories detected:**
36
-
37
- | Memory | Last Updated | Modified Files |
38
- |---|---|---|
39
- | `ssot_cli_hooks_2026-02-03` | 2026-02-25 | hooks/guard-rules.mjs, hooks/hooks.json, hooks/main-guard.mjs |
40
- | `ssot_cli_universal_hub_2026-02-19` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
41
- | `ssot_cli_ux_improvements_2026-02-22` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/commands/install-project.ts |
42
- | `ssot_jaggers-agent-tools_installer_architecture_2026-02-03` | 2026-02-25 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
43
- | `ssot_jaggers-agent-tools_migration_2026-02-01` | 2026-02-01 | cli/src/commands/install-pi.ts, cli/src/tests/policy-parity.test.ts |
44
-
45
- The hooks memories are stale due to the guard-rules centralization work done today. The installer architecture memories are stale due to the global-first migration and deprecation of `install-project`. These need updating but are out of scope for this audit (they require Serena tools and explicit intent to fix).
46
-
47
- ---
48
-
49
- ## Phase 3: Document Structure Analysis
50
-
51
- ### README.md — Status: OK (borderline)
52
-
53
- - **Line count:** 192 / 200 threshold
54
- - **Sections:** 24
55
- - **Extraction candidates flagged by script:** None
56
-
57
- The script reports `OK` because README is 8 lines under the 200-line bloat threshold. However, manual review reveals several sections that are substantive enough to warrant dedicated docs/ files or already have them:
58
-
59
- #### Sections with candidate docs/ homes
60
-
61
- | README Section | Lines | Status | Recommended Action |
62
- |---|---|---|---|
63
- | **Hooks Reference** (lines 114–141) | ~28 lines | Has `docs/hooks.md` | README section should be a 1-line summary + link to `docs/hooks.md` |
64
- | **MCP Servers** (lines 143–158) | ~16 lines | Has `docs/mcp-servers.md` | README section is a partial duplicate of `docs/mcp-servers.md` |
65
- | **Policy System** (lines 66–87) | ~22 lines | Has `docs/policies.md` | README section should be a 1-line summary + link to `docs/policies.md` |
66
- | **CLI Commands** (lines 89–111) | ~23 lines | No `docs/cli-reference.md` | At 6 commands + 3 flags this is borderline; when CLI grows, extract |
67
- | **Version History** (lines 179–187) | ~9 lines | Has CHANGELOG.md | Already linked; table is a useful quick summary, keep |
68
- | **Issue Tracking (Beads)** (lines 161–168) | ~8 lines | No dedicated docs/ file | Short enough to keep in README |
69
-
70
- **Key finding:** README has three sections (Hooks Reference, MCP Servers, Policy System) that directly duplicate content already in dedicated docs/ files. These sections should be replaced with single-line summaries + links. This would bring README down to approximately 130–140 lines and eliminate the drift risk.
71
-
72
- ### CHANGELOG.md — Status: STALE (critical)
73
-
74
- - **package.json version:** 2.4.0
75
- - **Latest CHANGELOG entry:** 2.0.0 (2026-03-12)
76
- - **Gap:** v2.1.x, v2.2.0, v2.3.0, and v2.4.0 are all undocumented in CHANGELOG
77
- - **Note:** README header also still says "Version 2.3.0" — should be 2.4.0
78
-
79
- The CHANGELOG has not been updated across multiple release cycles. This is the most critical finding.
80
-
81
- ### docs/ Files — Status: All OK
82
-
83
- All 10 existing docs/ files pass schema validation (have YAML frontmatter, no structural issues):
84
-
85
- - docs/hooks.md (133 lines) — OK
86
- - docs/mcp-servers.md (25 lines) — OK
87
- - docs/mcp.md (110 lines) — OK
88
- - docs/pi-extensions.md (25 lines) — OK
89
- - docs/policies.md (25 lines) — OK
90
- - docs/pre-install-cleanup.md (128 lines) — OK
91
- - docs/project-skills.md (105 lines) — OK
92
- - docs/skills.md (114 lines) — OK
93
- - docs/testing.md (148 lines) — OK
94
- - docs/todo.md (14 lines) — OK
95
-
96
- **No missing docs/ gaps** were flagged by the script for existing subsystems.
97
-
98
- ---
99
-
100
- ## Summary of Findings
101
-
102
- ### README Duplication (answer to the user's question)
103
-
104
- The README does contain sections that belong in docs/ — but not because they're missing docs/ files. The docs/ files already exist. The problem is that README still carries full content in those sections instead of pointing to the dedicated files.
105
-
106
- **Three sections to replace with summary + link:**
107
-
108
- 1. **"Hooks Reference"** (lines 114–141, ~28 lines) → summarize in 2–3 lines + link to `docs/hooks.md`
109
- 2. **"Policy System"** (lines 66–87, ~22 lines) → summarize in 2–3 lines + link to `docs/policies.md`
110
- 3. **"MCP Servers"** (lines 143–158, ~16 lines) → summarize in 1–2 lines + link to `docs/mcp-servers.md`
111
-
112
- Doing this would remove ~60 lines from README (192 → ~132), well within the healthy range, and eliminate drift between README and its docs/ counterparts.
113
-
114
- ### CHANGELOG is critically stale
115
-
116
- Four release versions (2.1.x through 2.4.0) have no CHANGELOG entries. The README version badge is also one version behind (shows 2.3.0, package.json is 2.4.0).
117
-
118
- ### Stale Serena memories (5 total)
119
-
120
- All relate to hooks and installer architecture — both subsystems were modified today as part of the global-first migration. These need updating via the `/documenting` skill or Phase 4 of this skill.
121
-
122
- ---
123
-
124
- ## What NOT to Do
125
-
126
- - Do not extract Beads, CLI Commands, Version History, or Quick Start from README — these are appropriate for a README-level entry point.
127
- - Do not create new docs/ files — all expected subsystem files already exist.
128
- - Do not touch the docs/ files themselves — they all pass schema validation.
129
-
130
- ---
131
-
132
- ## Recommended Next Steps (for explicit execution, not done here)
133
-
134
- 1. **Fix CHANGELOG** — add entries for v2.1.x, v2.2.0, v2.3.0, v2.4.0 using `add_entry.py`
135
- 2. **Fix README version badge** — update "Version 2.3.0" to "Version 2.4.0"
136
- 3. **Trim README duplicate sections** — replace Hooks Reference, Policy System, MCP Servers with summary + link (use Serena tools, not direct Edit)
137
- 4. **Update stale Serena memories** — especially `ssot_cli_hooks_*` and `ssot_jaggers-agent-tools_installer_architecture_*` given today's guard-rules and global-first changes
@@ -1,92 +0,0 @@
1
- {
2
- "expectations": [
3
- {
4
- "text": "Ran doc_structure_analyzer.py and cited its output",
5
- "passed": true,
6
- "evidence": "Phase 3 of the report cites specific script output: 'Line count: 192 / 200 threshold', 'Sections: 24', 'Extraction candidates flagged by script: None'. These metrics are consistent with structured script output rather than manual inspection, and the phrasing 'flagged by script' directly attributes them to an automated tool."
7
- },
8
- {
9
- "text": "Named at least 2 specific README sections with their suggested docs/ destination",
10
- "passed": true,
11
- "evidence": "The report names three sections with explicit docs/ destinations: 'Hooks Reference' (lines 114-141) -> docs/hooks.md, 'Policy System' (lines 66-87) -> docs/policies.md, 'MCP Servers' (lines 143-158) -> docs/mcp-servers.md. These appear both in the Phase 3 table and in the numbered summary under 'Three sections to replace with summary + link'."
12
- },
13
- {
14
- "text": "Did NOT run --fix or create/edit any files (audit-only mode respected)",
15
- "passed": true,
16
- "evidence": "The report header states 'Mode: Audit only (Phase 1-3). No files were modified.' The 'Recommended Next Steps' section frames all actions as future work 'for explicit execution, not done here'. The 'What NOT to Do' section further reinforces restraint. No output files other than result.md are present in the outputs directory."
17
- },
18
- {
19
- "text": "Report is actionable with clear next steps",
20
- "passed": true,
21
- "evidence": "The 'Recommended Next Steps' section lists 4 numbered, specific, executable actions: (1) Fix CHANGELOG using add_entry.py, (2) Fix README version badge from 2.3.0 to 2.4.0, (3) Trim README duplicate sections using Serena tools, (4) Update stale Serena memories for hooks and installer architecture. Each step names the specific tool or method to use."
22
- }
23
- ],
24
- "summary": {
25
- "passed": 4,
26
- "failed": 0,
27
- "total": 4,
28
- "pass_rate": 1.0
29
- },
30
- "execution_metrics": {
31
- "tool_calls": {},
32
- "total_tool_calls": 0,
33
- "total_steps": 0,
34
- "errors_encountered": 0,
35
- "output_chars": 3871,
36
- "transcript_chars": 0
37
- },
38
- "timing": {
39
- "executor_duration_seconds": 0.0,
40
- "grader_duration_seconds": 0.0,
41
- "total_duration_seconds": 0.0
42
- },
43
- "claims": [
44
- {
45
- "claim": "README is 192 lines, just under the 200-line threshold",
46
- "type": "factual",
47
- "verified": false,
48
- "evidence": "Reported as script output but the README was not independently verified in grading. The number is internally consistent with the report's conclusion that README is 'borderline'."
49
- },
50
- {
51
- "claim": "5 stale Serena memories were detected",
52
- "type": "factual",
53
- "verified": false,
54
- "evidence": "The report lists 5 specific memory entries with dates and associated files. Cannot verify without access to the Serena memory store, but the specificity (named files, timestamps) suggests genuine inspection rather than fabrication."
55
- },
56
- {
57
- "claim": "All 10 existing docs/ files pass schema validation",
58
- "type": "quality",
59
- "verified": false,
60
- "evidence": "10 docs/ files are listed with 'OK' status. The report attributes this to schema validation but no validator output or script name is cited for this check, making it less verifiable than the doc_structure_analyzer output."
61
- },
62
- {
63
- "claim": "CHANGELOG is missing entries for v2.1.x through v2.4.0",
64
- "type": "factual",
65
- "verified": false,
66
- "evidence": "Report states package.json shows 2.4.0 but CHANGELOG's latest entry is 2.0.0. Plausible given the stated active development cycle but not independently verified in grading."
67
- },
68
- {
69
- "claim": "No files were modified during the run",
70
- "type": "process",
71
- "verified": true,
72
- "evidence": "Only result.md is present in the outputs directory. No other files were created or edited as part of the run."
73
- }
74
- ],
75
- "user_notes_summary": {
76
- "uncertainties": [],
77
- "needs_review": [],
78
- "workarounds": []
79
- },
80
- "eval_feedback": {
81
- "suggestions": [
82
- {
83
- "assertion": "Ran doc_structure_analyzer.py and cited its output",
84
- "reason": "The assertion passes based on plausible script-attributed output in the report, but there is no transcript available to confirm the script was actually executed (e.g., a Bash tool call). A stronger assertion would require a transcript showing the actual tool invocation, or the raw script output as a separate artifact in outputs/. As written, a well-crafted fabrication would also pass this assertion."
85
- },
86
- {
87
- "reason": "No assertion checks the accuracy of the section-to-docs/ mapping. The report correctly identifies docs/hooks.md, docs/policies.md, and docs/mcp-servers.md as targets, but an eval that verifies those files actually exist in the repo would catch hallucinated destinations. Consider adding: 'All recommended docs/ destinations exist as actual files in the repository'."
88
- }
89
- ],
90
- "overall": "The four assertions are well-chosen and cover the key audit behaviors. The main gap is that expectation 1 (script was run) cannot be fully verified without a transcript or raw script output artifact. The eval would be stronger if it required evidence of actual execution rather than cited output alone."
91
- }
92
- }
@@ -1 +0,0 @@
1
- {"total_tokens": 26000, "duration_ms": 82000, "total_duration_seconds": 82.0}