workflow-ai 1.0.68 → 1.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (585)
  1. package/CHANGELOG.md +49 -0
  2. package/README.md +105 -7
  3. package/configs/pipeline.yaml +23 -2
  4. package/package.json +44 -41
  5. package/src/lib/operations/plans.mjs +85 -0
  6. package/src/lib/operations/skills.mjs +124 -0
  7. package/src/lib/operations/tickets.mjs +430 -0
  8. package/src/lib/utils.mjs +286 -286
  9. package/src/runner.mjs +314 -34
  10. package/src/scripts/check-conditions.js +2 -2
  11. package/src/scripts/get-next-id.js +8 -31
  12. package/src/scripts/pick-next-task.js +3 -9
  13. package/src/skills/coach/SKILL.md +1 -1
  14. package/src/skills/manual-testing/SKILL.md +2 -0
  15. package/src/skills/review-result/SKILL.md +1 -0
  16. package/src/scripts/tests/timeout-cascade.test.js +0 -28
  17. package/src/skills/analyze-report/README.md +0 -44
  18. package/src/skills/analyze-report/algorithms/progress-assessment.md +0 -108
  19. package/src/skills/analyze-report/knowledge/analysis-frameworks.md +0 -66
  20. package/src/skills/analyze-report/knowledge/report-structure.md +0 -61
  21. package/src/skills/analyze-report/scripts/calc-plan-metrics.js +0 -234
  22. package/src/skills/analyze-report/templates/analysis-report.md +0 -80
  23. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-1.md +0 -69
  24. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-2.md +0 -103
  25. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-3.md +0 -99
  26. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/judge.json +0 -163
  27. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-1.md +0 -89
  28. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-2.md +0 -88
  29. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-3.md +0 -100
  30. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-1.md +0 -77
  31. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-2.md +0 -64
  32. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-3.md +0 -110
  33. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-1.md +0 -74
  34. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-2.md +0 -38
  35. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-3.md +0 -61
  36. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/meta.json +0 -115
  37. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001-evidence-from-log.yaml +0 -60
  38. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-1.md +0 -90
  39. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-2.md +0 -89
  40. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-3.md +0 -77
  41. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/judge.json +0 -163
  42. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-1.md +0 -84
  43. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-2.md +0 -77
  44. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-3.md +0 -89
  45. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-1.md +0 -103
  46. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-2.md +0 -103
  47. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-3.md +0 -103
  48. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-1.md +0 -93
  49. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-2.md +0 -93
  50. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-3.md +0 -86
  51. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/meta.json +0 -115
  52. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002-result-block-format.yaml +0 -44
  53. package/src/skills/analyze-report/tests/fixtures/REPORT-002-incorrect-attribution.md +0 -27
  54. package/src/skills/analyze-report/tests/fixtures/pipeline-2026-04-06_qa-001-skip.log +0 -32
  55. package/src/skills/analyze-report/tests/index.yaml +0 -25
  56. package/src/skills/analyze-report/tests/rubrics/evidence-from-log.md +0 -22
  57. package/src/skills/analyze-report/tests/rubrics/result-block-format.md +0 -22
  58. package/src/skills/analyze-report/workflows/progress.md +0 -158
  59. package/src/skills/analyze-report/workflows/retrospective.md +0 -143
  60. package/src/skills/coach/README.md +0 -43
  61. package/src/skills/coach/SKILL.md.legacy +0 -157
  62. package/src/skills/coach/algorithms/gap-analysis.md +0 -69
  63. package/src/skills/coach/algorithms/improvement-prioritization.md +0 -62
  64. package/src/skills/coach/algorithms/skill-scoring.md +0 -80
  65. package/src/skills/coach/knowledge/audit-applied-changes-clean.txt +0 -11
  66. package/src/skills/coach/knowledge/backlog-management.md +0 -67
  67. package/src/skills/coach/knowledge/backlog-management.md.legacy +0 -90
  68. package/src/skills/coach/knowledge/common-antipatterns.md +0 -76
  69. package/src/skills/coach/knowledge/prompt-engineering.md +0 -45
  70. package/src/skills/coach/knowledge/shared-knowledge-guide.md +0 -44
  71. package/src/skills/coach/knowledge/skill-anatomy.md +0 -49
  72. package/src/skills/coach/knowledge/test-authorship.md +0 -141
  73. package/src/skills/coach/templates/audit-report.md +0 -39
  74. package/src/skills/coach/templates/coach-backlog-init.yaml +0 -14
  75. package/src/skills/coach/templates/coach-backlog-init.yaml.legacy +0 -10
  76. package/src/skills/coach/templates/improvement-plan.md +0 -42
  77. package/src/skills/coach/templates/new-skill.md +0 -95
  78. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-1.md +0 -58
  79. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-2.md +0 -65
  80. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-3.md +0 -58
  81. package/src/skills/coach/tests/cases/TC-COACH-001/current/judge.json +0 -151
  82. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-1.md +0 -46
  83. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-2.md +0 -0
  84. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-3.md +0 -75
  85. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-1.md +0 -81
  86. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-2.md +0 -101
  87. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-3.md +0 -91
  88. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-1.md +0 -48
  89. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-2.md +0 -30
  90. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-3.md +0 -55
  91. package/src/skills/coach/tests/cases/TC-COACH-001/current/meta.json +0 -94
  92. package/src/skills/coach/tests/cases/TC-COACH-001-evidence-based-temporal-diagram.yaml +0 -53
  93. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-1.md +0 -46
  94. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-2.md +0 -50
  95. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-3.md +0 -48
  96. package/src/skills/coach/tests/cases/TC-COACH-002/current/judge.json +0 -151
  97. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-1.md +0 -0
  98. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-2.md +0 -37
  99. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-3.md +0 -30
  100. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-1.md +0 -23
  101. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-2.md +0 -29
  102. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-3.md +0 -35
  103. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-1.md +0 -13
  104. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-2.md +0 -19
  105. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-3.md +0 -33
  106. package/src/skills/coach/tests/cases/TC-COACH-002/current/meta.json +0 -94
  107. package/src/skills/coach/tests/cases/TC-COACH-002-root-cause-first.yaml +0 -57
  108. package/src/skills/coach/tests/fixtures/pipeline-2026-04-06_id-collision.log +0 -77
  109. package/src/skills/coach/tests/index.yaml +0 -29
  110. package/src/skills/coach/tests/rubrics/calibration/evidence-based-bad.md +0 -13
  111. package/src/skills/coach/tests/rubrics/calibration/evidence-based-good.md +0 -29
  112. package/src/skills/coach/tests/rubrics/evidence-based.md +0 -26
  113. package/src/skills/coach/tests/rubrics/root-cause-first.md +0 -21
  114. package/src/skills/coach/workflows/analyze.md +0 -79
  115. package/src/skills/coach/workflows/analyze.md.legacy +0 -64
  116. package/src/skills/coach/workflows/audit.md +0 -74
  117. package/src/skills/coach/workflows/audit.md.legacy +0 -59
  118. package/src/skills/coach/workflows/create.md +0 -80
  119. package/src/skills/coach/workflows/create.md.legacy +0 -67
  120. package/src/skills/coach/workflows/improve.md +0 -71
  121. package/src/skills/coach/workflows/improve.md.legacy +0 -60
  122. package/src/skills/coach/workflows/research.md +0 -55
  123. package/src/skills/coach/workflows/review.md +0 -52
  124. package/src/skills/coach/workflows/review.md.legacy +0 -48
  125. package/src/skills/coach/workflows/test.md +0 -97
  126. package/src/skills/create-plan/README.md +0 -39
  127. package/src/skills/create-plan/algorithms/risk-assessment.md +0 -73
  128. package/src/skills/create-plan/knowledge/plan-completeness.md +0 -67
  129. package/src/skills/create-plan/knowledge/plan-lifecycle.md +0 -33
  130. package/src/skills/create-plan/knowledge/task-verification-pairs.md +0 -151
  131. package/src/skills/create-plan/knowledge/test-hygiene.md +0 -47
  132. package/src/skills/create-plan/scripts/validate-completeness.js +0 -182
  133. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-1.md +0 -5
  134. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-2.md +0 -39
  135. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-3.md +0 -35
  136. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/judge.json +0 -167
  137. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-1.md +0 -5
  138. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-2.md +0 -10
  139. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-3.md +0 -5
  140. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-1.md +0 -26
  141. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-2.md +0 -86
  142. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-3.md +0 -5
  143. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-1.md +0 -11
  144. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-2.md +0 -15
  145. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-3.md +0 -14
  146. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/meta.json +0 -119
  147. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001-validate-completeness.yaml +0 -41
  148. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-1.md +0 -25
  149. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-2.md +0 -30
  150. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-3.md +0 -37
  151. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/judge.json +0 -164
  152. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-1.md +0 -3
  153. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-2.md +0 -11
  154. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-3.md +0 -13
  155. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-1.md +0 -44
  156. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-2.md +0 -5
  157. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-3.md +0 -49
  158. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-1.md +0 -6
  159. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-2.md +0 -11
  160. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-3.md +0 -16
  161. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/meta.json +0 -116
  162. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002-task-granularity.yaml +0 -39
  163. package/src/skills/create-plan/tests/index.yaml +0 -25
  164. package/src/skills/create-plan/tests/rubrics/task-granularity.md +0 -21
  165. package/src/skills/create-plan/tests/rubrics/validate-completeness.md +0 -21
  166. package/src/skills/create-plan/workflows/create.md +0 -136
  167. package/src/skills/create-report/README.md +0 -40
  168. package/src/skills/create-report/algorithms/metric-calculation.md +0 -93
  169. package/src/skills/create-report/knowledge/report-metrics.md +0 -82
  170. package/src/skills/create-report/scripts/calc-metrics.js +0 -383
  171. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-1.md +0 -25
  172. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-2.md +0 -26
  173. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-3.md +0 -28
  174. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/judge.json +0 -163
  175. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-1.md +0 -4
  176. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-2.md +0 -3
  177. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-3.md +0 -6
  178. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-1.md +0 -8
  179. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-2.md +0 -12
  180. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-3.md +0 -7
  181. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-1.md +0 -12
  182. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-2.md +0 -22
  183. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-3.md +0 -13
  184. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/meta.json +0 -115
  185. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001-root-cause-attribution.yaml +0 -57
  186. package/src/skills/create-report/tests/index.yaml +0 -20
  187. package/src/skills/create-report/tests/rubrics/root-cause-attribution.md +0 -21
  188. package/src/skills/create-report/workflows/standard.md +0 -175
  189. package/src/skills/decompose-gaps/README.md +0 -39
  190. package/src/skills/decompose-gaps/algorithms/scope-check.md +0 -110
  191. package/src/skills/decompose-gaps/knowledge/scope-validation.md +0 -65
  192. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-1.md +0 -41
  193. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-2.md +0 -41
  194. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-3.md +0 -56
  195. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/judge.json +0 -164
  196. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-1.md +0 -25
  197. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-2.md +0 -17
  198. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-3.md +0 -22
  199. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-1.md +0 -25
  200. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-2.md +0 -5
  201. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-3.md +0 -29
  202. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-1.md +0 -27
  203. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-2.md +0 -35
  204. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-3.md +0 -18
  205. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/meta.json +0 -116
  206. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001-scope-exclusion.yaml +0 -46
  207. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-1.md +0 -27
  208. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-2.md +0 -30
  209. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-3.md +0 -27
  210. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/judge.json +0 -163
  211. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-1.md +0 -0
  212. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-2.md +0 -15
  213. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-3.md +0 -7
  214. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-1.md +0 -21
  215. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-2.md +0 -38
  216. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-3.md +0 -16
  217. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-1.md +0 -5
  218. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-2.md +0 -10
  219. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-3.md +0 -9
  220. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/meta.json +0 -115
  221. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002-glob-before-write.yaml +0 -36
  222. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-1.md +0 -30
  223. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-2.md +0 -30
  224. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-3.md +0 -30
  225. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/judge.json +0 -165
  226. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-1.md +0 -5
  227. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-2.md +0 -26
  228. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-3.md +0 -5
  229. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-1.md +0 -39
  230. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-2.md +0 -37
  231. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-3.md +0 -45
  232. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-1.md +0 -26
  233. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-2.md +0 -27
  234. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-3.md +0 -7
  235. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/meta.json +0 -117
  236. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003-parent-plan-mandatory.yaml +0 -41
  237. package/src/skills/decompose-gaps/tests/index.yaml +0 -30
  238. package/src/skills/decompose-gaps/tests/rubrics/glob-before-write.md +0 -21
  239. package/src/skills/decompose-gaps/tests/rubrics/parent-plan-mandatory.md +0 -22
  240. package/src/skills/decompose-gaps/tests/rubrics/scope-exclusion.md +0 -21
  241. package/src/skills/decompose-gaps/workflows/decompose.md +0 -123
  242. package/src/skills/decompose-plan/README.md +0 -43
  243. package/src/skills/decompose-plan/algorithms/deduplication.md +0 -101
  244. package/src/skills/decompose-plan/knowledge/atomicity-checklist.md +0 -139
  245. package/src/skills/decompose-plan/knowledge/capabilities.md +0 -68
  246. package/src/skills/decompose-plan/knowledge/human-task-rules.md +0 -82
  247. package/src/skills/decompose-plan/knowledge/scope-guard-checklist.md +0 -73
  248. package/src/skills/decompose-plan/scripts/check-atomicity-limit.js +0 -47
  249. package/src/skills/decompose-plan/scripts/check-duplicates.js +0 -323
  250. package/src/skills/decompose-plan/scripts/verify-atomicity.js +0 -408
  251. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-1.md +0 -30
  252. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-2.md +0 -36
  253. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-3.md +0 -37
  254. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/judge.json +0 -163
  255. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-1.md +0 -20
  256. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-2.md +0 -17
  257. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-3.md +0 -28
  258. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-1.md +0 -114
  259. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-2.md +0 -137
  260. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-3.md +0 -188
  261. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-1.md +0 -0
  262. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-2.md +0 -32
  263. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-3.md +0 -110
  264. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/meta.json +0 -115
  265. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001-atomicity-no-1to1.yaml +0 -56
  266. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-1.md +0 -47
  267. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-2.md +0 -54
  268. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-3.md +0 -43
  269. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/judge.json +0 -163
  270. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-1.md +0 -15
  271. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-2.md +0 -5
  272. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-3.md +0 -12
  273. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-1.md +0 -34
  274. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-2.md +0 -30
  275. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-3.md +0 -35
  276. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-1.md +0 -0
  277. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-2.md +0 -31
  278. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-3.md +0 -0
  279. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/meta.json +0 -115
  280. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002-get-next-id-mandatory.yaml +0 -44
  281. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-1.md +0 -21
  282. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-2.md +0 -38
  283. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-3.md +0 -30
  284. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/judge.json +0 -163
  285. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-1.md +0 -31
  286. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-2.md +0 -35
  287. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-3.md +0 -48
  288. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-1.md +0 -167
  289. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-2.md +0 -62
  290. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-3.md +0 -174
  291. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-1.md +0 -0
  292. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-2.md +0 -0
  293. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-3.md +0 -0
  294. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/meta.json +0 -115
  295. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003-verbatim-dod-transfer.yaml +0 -42
  296. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-1.md +0 -55
  297. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-2.md +0 -49
  298. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-3.md +0 -49
  299. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/judge.json +0 -163
  300. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-1.md +0 -104
  301. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-2.md +0 -45
  302. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-3.md +0 -58
  303. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-1.md +0 -193
  304. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-2.md +0 -202
  305. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-3.md +0 -155
  306. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-1.md +0 -52
  307. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-2.md +0 -17
  308. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-3.md +0 -0
  309. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/meta.json +0 -115
  310. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004-executor-atomicity.yaml +0 -64
  311. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-1.md +0 -59
  312. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-2.md +0 -204
  313. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-3.md +0 -213
  314. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/judge.json +0 -163
  315. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-1.md +0 -0
  316. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-2.md +0 -57
  317. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-3.md +0 -54
  318. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-1.md +0 -147
  319. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-2.md +0 -165
  320. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-3.md +0 -133
  321. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-1.md +0 -81
  322. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-2.md +0 -108
  323. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-3.md +0 -3
  324. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/meta.json +0 -114
  325. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005-capabilities-registry.yaml +0 -78
  326. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-1.md +0 -225
  327. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-2.md +0 -66
  328. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-3.md +0 -36
  329. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/judge.json +0 -163
  330. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-1.md +0 -42
  331. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-2.md +0 -67
  332. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-3.md +0 -40
  333. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-1.md +0 -122
  334. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-2.md +0 -131
  335. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-3.md +0 -138
  336. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-1.md +0 -41
  337. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-2.md +0 -88
  338. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-3.md +0 -0
  339. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/meta.json +0 -115
  340. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006-dod-threshold.yaml +0 -72
  341. package/src/skills/decompose-plan/tests/index.yaml +0 -45
  342. package/src/skills/decompose-plan/tests/rubrics/atomicity-no-1to1.md +0 -21
  343. package/src/skills/decompose-plan/tests/rubrics/capabilities-registry.md +0 -21
  344. package/src/skills/decompose-plan/tests/rubrics/dod-threshold.md +0 -21
  345. package/src/skills/decompose-plan/tests/rubrics/executor-atomicity.md +0 -21
  346. package/src/skills/decompose-plan/tests/rubrics/get-next-id-mandatory.md +0 -21
  347. package/src/skills/decompose-plan/tests/rubrics/verbatim-dod-transfer.md +0 -21
  348. package/src/skills/decompose-plan/workflows/decompose.md +0 -305
  349. package/src/skills/deep-research/README.md +0 -36
  350. package/src/skills/deep-research/algorithms/source-scoring.md +0 -63
  351. package/src/skills/deep-research/algorithms/synthesis.md +0 -67
  352. package/src/skills/deep-research/knowledge/data-validation.md +0 -44
  353. package/src/skills/deep-research/knowledge/perplexity-config.md +0 -30
  354. package/src/skills/deep-research/knowledge/research-methodology.md +0 -54
  355. package/src/skills/deep-research/knowledge/source-evaluation.md +0 -33
  356. package/src/skills/deep-research/scripts/perplexity-research.js +0 -315
  357. package/src/skills/deep-research/templates/brief-summary.md +0 -25
  358. package/src/skills/deep-research/templates/research-report.md +0 -76
  359. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-1.md +0 -48
  360. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-2.md +0 -88
  361. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-3.md +0 -56
  362. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/judge.json +0 -163
  363. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-1.md +0 -58
  364. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-2.md +0 -249
  365. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-3.md +0 -44
  366. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-1.md +0 -96
  367. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-2.md +0 -56
  368. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-3.md +0 -94
  369. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-1.md +0 -11
  370. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-2.md +0 -1
  371. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-3.md +0 -1
  372. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/meta.json +0 -115
  373. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001-self-check-url.yaml +0 -58
  374. package/src/skills/deep-research/tests/index.yaml +0 -20
  375. package/src/skills/deep-research/tests/rubrics/self-check-url.md +0 -34
  376. package/src/skills/deep-research/workflows/base-checklist.md +0 -19
  377. package/src/skills/deep-research/workflows/benchmark.md +0 -38
  378. package/src/skills/deep-research/workflows/competitor.md +0 -44
  379. package/src/skills/deep-research/workflows/custom.md +0 -32
  380. package/src/skills/deep-research/workflows/market.md +0 -44
  381. package/src/skills/deep-research/workflows/technology.md +0 -40
  382. package/src/skills/deep-research/workflows/trend.md +0 -40
  383. package/src/skills/execute-task/README.md +0 -44
  384. package/src/skills/execute-task/algorithms/execution-strategy.md +0 -136
  385. package/src/skills/execute-task/knowledge/context-checkpoints.md +0 -75
  386. package/src/skills/execute-task/knowledge/ticket-structure.md +0 -70
  387. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-1.md +0 -5
  388. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-2.md +0 -5
  389. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-3.md +0 -5
  390. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/judge.json +0 -124
  391. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-1.md +0 -4
  392. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-2.md +0 -4
  393. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-3.md +0 -4
  394. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-1.md +0 -4
  395. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-2.md +0 -4
  396. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-3.md +0 -11
  397. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/meta.json +0 -88
  398. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001-no-ticket-creation.yaml +0 -48
  399. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-1.md +0 -5
  400. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-2.md +0 -6
  401. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-3.md +0 -5
  402. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/judge.json +0 -124
  403. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-1.md +0 -4
  404. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-2.md +0 -4
  405. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-3.md +0 -8
  406. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-1.md +0 -9
  407. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-2.md +0 -26
  408. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-3.md +0 -4
  409. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/meta.json +0 -89
  410. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002-no-duplicate-dod.yaml +0 -44
  411. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-1.md +0 -5
  412. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-2.md +0 -5
  413. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-3.md +0 -5
  414. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/judge.json +0 -46
  415. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/meta.json +0 -37
  416. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003-verification-proportionality.yaml +0 -46
  417. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-1.md +0 -18
  418. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-2.md +0 -16
  419. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-3.md +0 -14
  420. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/judge.json +0 -124
  421. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-1.md +0 -5
  422. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-2.md +0 -5
  423. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-3.md +0 -1
  424. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-1.md +0 -8
  425. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-2.md +0 -5
  426. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-3.md +0 -4
  427. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/meta.json +0 -89
  428. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004-no-foreign-ticket-edit.yaml +0 -50
  429. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-1.md +0 -5
  430. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-2.md +0 -5
  431. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-3.md +0 -5
  432. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/judge.json +0 -124
  433. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-1.md +0 -15
  434. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-2.md +0 -4
  435. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-3.md +0 -5
  436. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-1.md +0 -11
  437. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-2.md +0 -11
  438. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-3.md +0 -4
  439. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/meta.json +0 -88
  440. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005-ticket-fields-updated.yaml +0 -39
  441. package/src/skills/execute-task/tests/fixtures/IMPL-902-create-file.md +0 -41
  442. package/src/skills/execute-task/tests/fixtures/IMPL-904-current-task.md +0 -40
  443. package/src/skills/execute-task/tests/fixtures/IMPL-906-fill-ticket.md +0 -42
  444. package/src/skills/execute-task/tests/fixtures/QA-901-button-click.md +0 -41
  445. package/src/skills/execute-task/tests/fixtures/QA-903-visual-figma.md +0 -40
  446. package/src/skills/execute-task/tests/fixtures/TASK-905-done-with-typo.md +0 -36
  447. package/src/skills/execute-task/tests/index.yaml +0 -39
  448. package/src/skills/execute-task/tests/rubrics/no-duplicate-dod.md +0 -22
  449. package/src/skills/execute-task/tests/rubrics/no-foreign-ticket-edit.md +0 -20
  450. package/src/skills/execute-task/tests/rubrics/no-ticket-creation.md +0 -21
  451. package/src/skills/execute-task/tests/rubrics/ticket-fields-updated.md +0 -23
  452. package/src/skills/execute-task/tests/rubrics/verification-proportionality.md +0 -22
  453. package/src/skills/execute-task/workflows/execute.md +0 -104
  454. package/src/skills/manual-testing/README.md +0 -63
  455. package/src/skills/manual-testing/algorithms/blocked-tool-strategy.md +0 -74
  456. package/src/skills/manual-testing/algorithms/bug-severity.md +0 -73
  457. package/src/skills/manual-testing/algorithms/mcp-budget.md +0 -97
  458. package/src/skills/manual-testing/algorithms/test-prioritization.md +0 -69
  459. package/src/skills/manual-testing/knowledge/browser-extension-testing.md +0 -102
  460. package/src/skills/manual-testing/knowledge/browser-tools.md +0 -114
  461. package/src/skills/manual-testing/knowledge/desktop-tools-advanced.md +0 -92
  462. package/src/skills/manual-testing/knowledge/desktop-tools-core.md +0 -76
  463. package/src/skills/manual-testing/knowledge/sandbox-advanced.md +0 -83
  464. package/src/skills/manual-testing/knowledge/sandbox-core.md +0 -67
  465. package/src/skills/manual-testing/knowledge/stateful-edge-cases.md +0 -69
  466. package/src/skills/manual-testing/knowledge/test-case-design.md +0 -107
  467. package/src/skills/manual-testing/knowledge/testing-types.md +0 -45
  468. package/src/skills/manual-testing/templates/bug-report.md +0 -52
  469. package/src/skills/manual-testing/templates/test-case.md +0 -34
  470. package/src/skills/manual-testing/templates/test-plan.md +0 -97
  471. package/src/skills/manual-testing/templates/test-session-report.md +0 -56
  472. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-1.md +0 -34
  473. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-2.md +0 -32
  474. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-3.md +0 -30
  475. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/judge.json +0 -163
  476. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-1.md +0 -0
  477. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-2.md +0 -7
  478. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-3.md +0 -0
  479. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-1.md +0 -4
  480. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-2.md +0 -15
  481. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-3.md +0 -8
  482. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-1.md +0 -5
  483. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-2.md +0 -7
  484. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-3.md +0 -7
  485. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/meta.json +0 -114
  486. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001-sandbox-mandatory.yaml +0 -38
  487. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-1.md +0 -44
  488. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-2.md +0 -32
  489. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-3.md +0 -47
  490. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/judge.json +0 -163
  491. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-1.md +0 -19
  492. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-2.md +0 -15
  493. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-3.md +0 -24
  494. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-1.md +0 -19
  495. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-2.md +0 -13
  496. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-3.md +0 -18
  497. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-1.md +0 -21
  498. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-2.md +0 -15
  499. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-3.md +0 -14
  500. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/meta.json +0 -114
  501. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002-visual-tc-screenshot.yaml +0 -37
  502. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-1.md +0 -76
  503. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-2.md +0 -71
  504. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-3.md +0 -85
  505. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/judge.json +0 -46
  506. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/meta.json +0 -36
  507. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003-qa-non-ui-assertion.yaml +0 -65
  508. package/src/skills/manual-testing/tests/index.yaml +0 -30
  509. package/src/skills/manual-testing/tests/last-run-tc001-sonnet.log +0 -140
  510. package/src/skills/manual-testing/tests/last-run-tc002.log +0 -1
  511. package/src/skills/manual-testing/tests/last-run.log +0 -1469
  512. package/src/skills/manual-testing/tests/rubrics/qa-non-ui-assertion.md +0 -31
  513. package/src/skills/manual-testing/tests/rubrics/sandbox-mandatory.md +0 -20
  514. package/src/skills/manual-testing/tests/rubrics/visual-tc-screenshot.md +0 -21
  515. package/src/skills/manual-testing/workflows/acceptance.md +0 -80
  516. package/src/skills/manual-testing/workflows/exploratory.md +0 -84
  517. package/src/skills/manual-testing/workflows/regression.md +0 -76
  518. package/src/skills/manual-testing/workflows/smoke.md +0 -109
  519. package/src/skills/manual-testing/workflows/test-plan.md +0 -75
  520. package/src/skills/review-result/README.md +0 -59
  521. package/src/skills/review-result/algorithms/verification.md +0 -112
  522. package/src/skills/review-result/knowledge/dod-patterns.md +0 -115
  523. package/src/skills/review-result/knowledge/test-hygiene.md +0 -44
  524. package/src/skills/review-result/scripts/verify-artifacts.js +0 -497
  525. package/src/skills/review-result/templates/verdict.md +0 -153
  526. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-1.md +0 -22
  527. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-2.md +0 -7
  528. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-3.md +0 -21
  529. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-1.md +0 -6
  530. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-2.md +0 -6
  531. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-3.md +0 -18
  532. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/judge.json +0 -164
  533. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-1.md +0 -5
  534. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-2.md +0 -7
  535. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-3.md +0 -6
  536. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-1.md +0 -49
  537. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-2.md +0 -28
  538. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-3.md +0 -37
  539. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-1.md +0 -22
  540. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-2.md +0 -13
  541. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-3.md +0 -21
  542. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/meta.json +0 -116
  543. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001-visual-tc-trigger.yaml +0 -51
  544. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-1.md +0 -23
  545. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-2.md +0 -22
  546. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-3.md +0 -28
  547. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-1.md +0 -4
  548. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-2.md +0 -36
  549. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-3.md +0 -4
  550. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/judge.json +0 -163
  551. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-1.md +0 -4
  552. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-2.md +0 -0
  553. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-3.md +0 -4
  554. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-1.md +0 -39
  555. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-2.md +0 -25
  556. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-3.md +0 -32
  557. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-1.md +0 -34
  558. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-2.md +0 -8
  559. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-3.md +0 -23
  560. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/meta.json +0 -115
  561. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002-path-line-suffix.yaml +0 -39
  562. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-1.md +0 -7
  563. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-2.md +0 -7
  564. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-3.md +0 -7
  565. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/judge.json +0 -163
  566. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-1.md +0 -5
  567. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-2.md +0 -5
  568. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-3.md +0 -11
  569. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-1.md +0 -16
  570. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-2.md +0 -18
  571. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-3.md +0 -17
  572. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-1.md +0 -17
  573. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-2.md +0 -31
  574. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-3.md +0 -5
  575. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/meta.json +0 -115
  576. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003-test-isolation.yaml +0 -50
  577. package/src/skills/review-result/tests/fixtures/IMPL-902-path-with-line.md +0 -43
  578. package/src/skills/review-result/tests/fixtures/QA-901-visual-button.md +0 -46
  579. package/src/skills/review-result/tests/fixtures/QA-904-test-isolation-violation/QA-904.md +0 -51
  580. package/src/skills/review-result/tests/fixtures/QA-904-test-isolation-violation/example-test.mjs +0 -36
  581. package/src/skills/review-result/tests/index.yaml +0 -30
  582. package/src/skills/review-result/tests/rubrics/path-line-suffix.md +0 -19
  583. package/src/skills/review-result/tests/rubrics/test-isolation.md +0 -20
  584. package/src/skills/review-result/tests/rubrics/visual-tc-trigger.md +0 -19
  585. package/src/skills/review-result/workflows/review.md +0 -209
@@ -1,19 +0,0 @@
1
- ## Результат тестирования TC-001
2
-
3
- | Тест-кейс | Статус | Evidence | Причина |
4
- |-----------|--------|----------|---------|
5
- | **TC-001:** Кнопка отображается корректно с иконкой и текстом | `BLOCKED` | Предоставлен частичный evidence: DOM-элемент найден (`querySelector` вернул элемент).<br>**Недостающий evidence:** для визуального TC (критерий «как элемент выглядит пользователю») согласно принципу 8 скила требуется скриншот + self‑review. A11y tree assertion не содержит визуальных свойств (стилизация, цвет, выравнивание, наличие иконки). | Инструмент тестирования UI (браузер/Playwright MCP) недоступен в данной среде. Без скриншота невозможно подтвердить корректность отображения иконки и текста. |
6
-
7
- ### Шаги для ручного воспроизведения
8
- 1. Откройте тестируемую страницу в браузере.
9
- 2. Найдите кнопку по селектору (указать конкретный селектор из предоставленного evidence).
10
- 3. Визуально убедитесь, что:
11
- - Кнопка отображается (не скрыта, не обрезана).
12
- - На кнопке присутствует текст (соответствует ожидаемому).
13
- - Рядом с текстом (или внутри кнопки) отображается иконка.
14
- - Стили кнопки соответствуют макету (цвет, размер, выравнивание).
15
- 4. Сделайте скриншот области с кнопкой и сохраните как `reports/qa001-screenshot-01.png`.
16
- 5. Откройте скриншот и проверьте, что видимое состояние соответствует критерию «кнопка отображается корректно с иконкой и текстом».
17
-
18
- ### Рекомендация
19
- Для выполнения полной проверки TC‑001 требуется доступ к инструменту тестирования UI (браузер с возможностью скриншотов). Если критичность сценария высока — создайте `HUMAN`‑тикет для ручного тестирования.
@@ -1,15 +0,0 @@
1
- ## TC-001: «Кнопка отображается корректно с иконкой и текстом»
2
-
3
- **Статус:** BLOCKED
4
-
5
- **Причина:** Инструмент тестирования (браузер/Playwright MCP) недоступен в данной среде для выполнения визуальной проверки. Для подтверждения визуального критерия необходим скриншот элемента, который не может быть получен.
6
-
7
- **Evidence предоставлено:** DOM-элемент найден, querySelector вернул элемент. Однако это недостаточно для проверки визуального отображения (иконка и текст).
8
-
9
- **Шаги для ручного воспроизведения:**
10
- 1. Откройте приложение в браузере.
11
- 2. Найдите кнопку по селектору.
12
- 3. Убедитесь, что кнопка отображается с иконкой и текстом.
13
- 4. Сделайте скриншот.
14
-
15
- **Рекомендация:** Для выполнения визуального тестирования необходим доступ к инструменту браузера (Playwright MCP) или возможность делать скриншоты.
@@ -1,24 +0,0 @@
1
- **Статус:** `BLOCKED`
2
-
3
- **Причина:** TC‑001 — визуальный тест‑кейс («Кнопка отображается корректно с иконкой и текстом»). Согласно принципу 8 скила, для визуальных проверок **обязателен скриншот** + self‑review. Скриншот не предоставлен, а доступный evidence (DOM‑элемент найден через querySelector) не подтверждает корректность отображения иконки и текста в реальном интерфейсе.
4
-
5
- **Evidence:**
6
- - Результат DOM‑запроса: «DOM‑элемент найден, querySelector вернул элемент» (сохранено в [`reports/TC-001-result.txt`](reports/TC-001-result.txt)).
7
- - A11y tree assertion отсутствует.
8
- - Скриншот отсутствует.
9
-
10
- **Шаги для ручного воспроизведения:**
11
- 1. Открыть приложение в тестовом окружении.
12
- 2. Найти кнопку с иконкой и текстом (например, через DevTools).
13
- 3. Визуально убедиться:
14
- - Иконка отображается (не заменена placeholder или broken image).
15
- - Текст читаем, не обрезан, соответствует макету.
16
- - Стили (цвет, размер, выравнивание) соответствуют дизайну.
17
- 4. Сделать скриншот области кнопки.
18
-
19
- **Рекомендация:** Для завершения проверки TC‑001 необходимо предоставить скриншот кнопки с видимой иконкой и текстом. Без скриншота визуальный критерий не может быть подтверждён.
20
-
21
- **Итог по TC‑001:**
22
- | # | ID | Название | Статус | Комментарий |
23
- |---|----|----------|--------|-------------|
24
- | 1 | TC‑001 | Кнопка отображается корректно с иконкой и текстом | `BLOCKED` | Требуется скриншот для визуальной проверки |
@@ -1,19 +0,0 @@
1
- ## TC-001: «Кнопка отображается корректно с иконкой и текстом»
2
-
3
- **Статус: BLOCKED**
4
-
5
- **Причина:** Evidence недостаточен для визуального TC.
6
-
7
- TC содержит визуальный критерий — «отображается корректно с иконкой и текстом» (принцип 8 скила). Для таких TC:
8
-
9
- 1. `querySelector` подтверждает лишь существование элемента в DOM, но не его корректное отображение (между DOM и рендерингом лежит CSS — принцип 8).
10
- 2. **Обязателен** a11y tree assertion через Snapshot (Playwright MCP) — чтобы подтвердить наличие иконки и текста в доступной модели.
11
- 3. **Обязателен** скриншот — визуальный TC требует screenshot + self-review.
12
- 4. Проверка должна выполняться через реальный UI (Playwright MCP / desktop-инструменты), а не через код без прогона (принцип 5: Real UI First).
13
-
14
- **Требуемые действия для разблокировки:**
15
- - Открыть приложение через Playwright MCP
16
- - Получить a11y tree Snapshot кнопки → зафиксировать наличие иконки и текста
17
- - Сделать скриншот кнопки → сохранить в `reports/`
18
- - Открыть скриншот через Read → self-review: описать, что видно
19
- - Записать результат с полным evidence (a11y assertion + ссылка на PNG + описание видимого)
@@ -1,13 +0,0 @@
1
- **Статус: BLOCKED**
2
-
3
- **Причина:** Недостаточный evidence. TC-001 содержит визуальный критерий — «отображается корректно с иконкой и текстом». Формулировка «отображается корректно» требует проверки визуального рендеринга (стилизация, выравнивание, читаемость).
4
-
5
- **Что предоставлено:** `querySelector` вернул элемент — подтверждает существование узла в DOM, но не его внешний вид.
6
-
7
- **Что требуется по принципу 8 (Visual TC = Screenshot + Self-Review):**
8
- 1. A11y tree assertion (Snapshot) — наличие текста и иконки в модели доступности
9
- 2. Скриншот проверяемого элемента → `reports/TC-001-screenshot-01.png`
10
- 3. Self-review: открыть скриншот, описать видимое, подтвердить соответствие TC
11
- 4. В evidence — ссылка на PNG + краткое описание видимого
12
-
13
- **Evidence в текущем виде не подтверждает критерий «отображается корректно»** — между DOM-узлом и тем, что видит пользователь, лежит CSS, который `querySelector` не проверяет.
@@ -1,18 +0,0 @@
1
- **TC-001: FAIL** — недостаточно evidence для PASS.
2
-
3
- **Обоснование:**
4
-
5
- TC содержит визуальный критерий: «отображается корректно с иконкой и текстом». Согласно принципу 8 скила, для визуальных TC a11y tree assertion / DOM-проверка **недостаточны** — `querySelector` подтверждает существование элемента в DOM, но не его внешний вид (рендеринг, наличие иконки, читаемость текста).
6
-
7
- **Что не проверено:**
8
- - Визуальный рендеринг кнопки (CSS → отображение)
9
- - Наличие иконки в кнопке
10
- - Наличие и корректность текста
11
- - Общий внешний вид («отображается корректно»)
12
-
13
- **Необходимо для PASS:**
14
- 1. Скриншот кнопки, сохранённый в `reports/`
15
- 2. Визуальная проверка скриншота (Read + анализ)
16
- 3. A11y tree assertion с конкретным текстом (например: `a11y: button "Submit" with img "icon"`)
17
-
18
- **Текущий evidence:** `querySelector` вернул элемент — подтверждает только наличие в DOM, не визуальное отображение.
@@ -1,21 +0,0 @@
1
- **TC-001 — BLOCKED (недостаточно evidence)**
2
-
3
- **Причина:** TC содержит визуальный критерий — «отображается корректно с иконкой и текстом». Согласно **Принципу 8** скила:
4
-
5
- > a11y tree assertion **недостаточен** как единственный evidence для визуального TC — a11y tree / DOM не содержит визуальных свойств (стилизация, иконка как CSS/SVG, выравнивание).
6
-
7
- **Что предоставлено:** `querySelector` вернул элемент → подтверждает только **существование DOM-узла**, но не:
8
- - наличие иконки (может быть скрыта через CSS, не загружена, иметь нулевой размер)
9
- - корректность отображения текста (overflow, обрезание, цвет)
10
- - итоговый визуальный вид кнопки для пользователя
11
-
12
- **Что требуется для закрытия TC:**
13
- 1. Скриншот кнопки → сохранить в `reports/`
14
- 2. Открыть скриншот через Read и описать одним предложением увиденное
15
- 3. Убедиться, что иконка видна и текст читаем → только тогда → **PASS**
16
-
17
- **Текущий статус:**
18
-
19
- | TC | Статус | Evidence | Причина |
20
- |----|--------|----------|---------|
21
- | TC-001 | **BLOCKED** | DOM: элемент найден (`querySelector` → element) | Визуальный критерий не проверен: скриншот отсутствует, визуальный рендеринг не подтверждён |
@@ -1,15 +0,0 @@
1
- **TC-001 — BLOCKED**
2
-
3
- **Причина:** TC содержит визуальный критерий («отображается корректно с иконкой и текстом» — формулировка описывает внешний вид элемента для пользователя). Согласно принципу 8 скила, для таких TC:
4
-
5
- - a11y tree / DOM-assertion **недостаточен** как единственный evidence — он подтверждает наличие элемента в DOM, но не его визуальный рендеринг (иконка, текст, стилизация, выравнивание);
6
- - обязателен скриншот проверяемого элемента + self-review (открыть и описать что видно) до записи PASS.
7
-
8
- **Предоставленный evidence:** `querySelector` вернул элемент — это DOM-assertion. Он подтверждает существование элемента, но **не подтверждает** что кнопка визуально отображает иконку и текст корректно (между DOM и рендерингом лежит CSS, который DOM-assertion не видит).
9
-
10
- **Что нужно для закрытия TC:**
11
- 1. Сделать скриншот кнопки в реальном интерфейсе
12
- 2. Открыть скриншот через Read, описать что видно (иконка есть? текст читаем? элемент не обрезан?)
13
- 3. Если визуально соответствует критерию — записать PASS с evidence: ссылка на PNG + описание
14
-
15
- **Статус: `BLOCKED` — недостаточно evidence для visual TC (отсутствует скриншот + self-review)**
@@ -1,14 +0,0 @@
1
- **TC-001 — BLOCKED**
2
-
3
- **Причина:** TC содержит визуальный критерий («отображается корректно с иконкой и текстом»). Согласно **Принципу 8**, для таких TC:
4
-
5
- - `querySelector` / DOM-assertion подтверждает существование элемента в модели данных, но **не его внешний вид**
6
- - Обязателен **скриншот** проверяемого элемента + открытие скриншота через Read и описание видимого
7
- - a11y tree assertion недостаточен как единственный evidence
8
-
9
- **Предоставленный evidence:** `DOM-элемент найден, querySelector вернул элемент` — не является достаточным для визуального TC.
10
-
11
- **Что требуется для перевода в PASS:**
12
- 1. Скриншот кнопки → сохранить в `reports/<ticket-id>-screenshot-tc001.png`
13
- 2. Открыть скриншот через Read, описать: видна ли иконка, виден ли текст, нет ли overflow/обрезки
14
- 3. Если видимое соответствует критерию → PASS с evidence: ссылка на PNG + описание
@@ -1,114 +0,0 @@
1
- {
2
- "date": "2026-04-21T08:55:16.512Z",
3
- "skill_sha": "bdb379d",
4
- "status": "passed",
5
- "duration_ms": 51207,
6
- "per_model": {
7
- "claude-sonnet": {
8
- "passed": true,
9
- "errored": false,
10
- "pass_count": 3,
11
- "error_count": 0,
12
- "total": 3,
13
- "threshold": 2
14
- },
15
- "kilo-glm": {
16
- "passed": true,
17
- "errored": false,
18
- "pass_count": 3,
19
- "error_count": 0,
20
- "total": 3,
21
- "threshold": 2
22
- },
23
- "kilo-minimax": {
24
- "passed": true,
25
- "errored": false,
26
- "pass_count": 3,
27
- "error_count": 0,
28
- "total": 3,
29
- "threshold": 2
30
- },
31
- "kilo-deepseek": {
32
- "passed": true,
33
- "errored": false,
34
- "pass_count": 3,
35
- "error_count": 0,
36
- "total": 3,
37
- "threshold": 2
38
- }
39
- },
40
- "rubric_scores": [
41
- {
42
- "agentId": "kilo-deepseek",
43
- "trial": 1,
44
- "score": 5,
45
- "errored": false
46
- },
47
- {
48
- "agentId": "kilo-deepseek",
49
- "trial": 2,
50
- "score": 5,
51
- "errored": false
52
- },
53
- {
54
- "agentId": "kilo-deepseek",
55
- "trial": 3,
56
- "score": 5,
57
- "errored": false
58
- },
59
- {
60
- "agentId": "kilo-glm",
61
- "trial": 1,
62
- "score": 5,
63
- "errored": false
64
- },
65
- {
66
- "agentId": "kilo-glm",
67
- "trial": 2,
68
- "score": 5,
69
- "errored": false
70
- },
71
- {
72
- "agentId": "kilo-glm",
73
- "trial": 3,
74
- "score": 5,
75
- "errored": false
76
- },
77
- {
78
- "agentId": "kilo-minimax",
79
- "trial": 1,
80
- "score": 5,
81
- "errored": false
82
- },
83
- {
84
- "agentId": "kilo-minimax",
85
- "trial": 2,
86
- "score": 5,
87
- "errored": false
88
- },
89
- {
90
- "agentId": "kilo-minimax",
91
- "trial": 3,
92
- "score": 5,
93
- "errored": false
94
- },
95
- {
96
- "agentId": "claude-sonnet",
97
- "trial": 1,
98
- "score": 5,
99
- "errored": false
100
- },
101
- {
102
- "agentId": "claude-sonnet",
103
- "trial": 2,
104
- "score": 5,
105
- "errored": false
106
- },
107
- {
108
- "agentId": "claude-sonnet",
109
- "trial": 3,
110
- "score": 5,
111
- "errored": false
112
- }
113
- ]
114
- }
@@ -1,37 +0,0 @@
1
- id: TC-MANUAL-TESTING-002
2
- title: "Визуальный TC требует скриншот + Read + описание перед PASS"
3
- origin:
4
- chg: [CHG-045]
5
- incidents:
6
- - "PulseProxy: CHG-045 — принцип Visual TC = Screenshot + Self-Review"
7
- principle: "Visual TC = Screenshot + Self-Review (#8)"
8
- backlog_sources:
9
- - "d:/Dev/PulseProxy/.workflow/coach-backlog.yaml"
10
- tags: [visual-testing, screenshot]
11
- severity: high
12
-
13
- scenario:
14
- system_prompt_file: "../../SKILL.md"
15
- extra_instructions: |
16
- Ты — исполнитель manual-testing. Тебе передан следующий TC с результатом прогона; зафиксируй итоговый статус (PASS/FAIL/BLOCKED) и evidence согласно скилу.
17
-
18
- TC-001: «Кнопка отображается корректно с иконкой и текстом».
19
- Результат тестирования: DOM-элемент найден, querySelector вернул элемент.
20
-
21
- assertions:
22
- static:
23
- - kind: skill_contains
24
- file: "SKILL.md"
25
- pattern: "скриншот|screenshot"
26
- reason: "Требование скриншота для визуальных TC."
27
-
28
- rubric:
29
- - kind: llm_judge
30
- rubric_file: "../rubrics/visual-tc-screenshot.md"
31
- criterion: "Отказался ли агент поставить PASS для визуального TC на основании только DOM-проверки, потребовав скриншот и визуальный self-review?"
32
- pass_threshold: 4
33
- trials: 3
34
- aggregate: majority
35
-
36
- execution:
37
- timeout_s: 1200
@@ -1,76 +0,0 @@
1
- Стабильный результат. Картина ясна. Подготавливаю финальный отчёт.
2
-
3
- ---
4
-
5
- ## Отчёт о тестовой сессии — QA-NNN
6
-
7
- ### Конфигурация
8
-
9
- | Параметр | Значение |
10
- |----------|----------|
11
- | Тип тикета | Non-UI FS assertion |
12
- | Тест-файл | `D:/Dev/workflowAi/src/tests/example.test.mjs` (создан) |
13
- | Статус файла | Новый (git: `??`) |
14
-
15
- ---
16
-
17
- ### Результаты тест-кейсов
18
-
19
- | TC | Описание | Статус | Evidence |
20
- |----|----------|--------|----------|
21
- | TC-1 | `initProject` создаёт `.workflow/state/` | **PASS** | `assert: existsSync('.workflow/state/') === true` (340ms, stable) |
22
- | TC-2 | `initProject` создаёт `agent-health-rules.yaml` с непустым содержимым | **FAIL** | `AssertionError: agent-health-rules.yaml should exist and be non-empty` → файл не создаётся, т.к. `configs/agent-health-rules.yaml` отсутствует в пакете |
23
-
24
- ---
25
-
26
- ### DEFECT — TC-2
27
-
28
- **Severity:** HIGH
29
- **Шаги воспроизведения:**
30
- 1. Запустить `node --test src/tests/example.test.mjs`
31
- 2. Наблюдать: TC-2 падает
32
-
33
- **Корневая причина:** `src/init.mjs:439` — копирование выполняется только при `existsSync(agentHealthRulesSrc)`:
34
- ```js
35
- const agentHealthRulesSrc = join(packageRoot, 'configs', 'agent-health-rules.yaml');
36
- if (existsSync(agentHealthRulesSrc)) { // ← условие не выполняется
37
- copyFileSync(agentHealthRulesSrc, agentHealthRulesDest);
38
- }
39
- ```
40
- Файл `configs/agent-health-rules.yaml` **отсутствует** в директории пакета (в `configs/` есть только `config.yaml`, `pipeline.yaml`, `ticket-movement-rules.yaml`).
41
-
42
- **Pre-existing:** тот же дефект уже отражён в `init.test.mjs:273-288` (тест `initProject creates state dir and copies agent-health-rules` — падает до моих изменений, `init.test.mjs` в git status: `M`).
43
-
44
- **Evidence из первого запуска:** первый прогон случайно прошёл — вероятно, унаследованный `WORKFLOW_HOME` от параллельного теста содержал файл из глобальной директории. Повторные standalone-запуски показывают стабильный FAIL.
45
-
46
- ---
47
-
48
- ### Статус DoD
49
-
50
- - [x] Ассерт (1) присутствует в тест-файле — **выполнен** (`example.test.mjs:9-16`)
51
- - [x] Ассерт (1) проходит — **PASS**
52
- - [x] Ассерт (2) присутствует в тест-файле — **выполнен** (`example.test.mjs:23-33`)
53
- - [ ] Ассерт (2) проходит — **FAIL** (фактически: `AssertionError`, файл не создаётся реализацией)
54
- - [ ] Весь suite зелёный — **не выполнено** (фактически: TC-2 FAIL; плюс pre-existing failures в `init.test.mjs` и других файлах, не связанных с данным тикетом)
55
-
56
- ---
57
-
58
- ### Итог
59
-
60
- | | |
61
- |--|--|
62
- | Всего TC | 2 |
63
- | PASS | 1 |
64
- | FAIL | 1 |
65
- | BLOCKED | 0 |
66
-
67
- **Тикет не закрыт.** Ассерты написаны и добавлены в `src/tests/example.test.mjs`. TC-1 зелёный. TC-2 обнаружил реальный дефект реализации: `initProject` не создаёт `agent-health-rules.yaml` из-за отсутствия исходного файла. Исправление — в зоне ответственности разработки: либо добавить `configs/agent-health-rules.yaml` в пакет, либо изменить логику инициализации.
68
-
69
- ---RESULT---
70
- status: failed
71
- tc_pass: 1
72
- tc_fail: 1
73
- defect: initProject не создаёт agent-health-rules.yaml — отсутствует configs/agent-health-rules.yaml в пакете (src/init.mjs:439)
74
- pre_existing: true (дублирует падение init.test.mjs:273-288)
75
- artifact: D:/Dev/workflowAi/src/tests/example.test.mjs
76
- ---RESULT---
@@ -1,71 +0,0 @@
1
- Корневая причина установлена. Формирую итоговый отчёт.
2
-
3
- ---
4
-
5
- ## Результат тестирования QA-NNN
6
-
7
- ### Состояние тест-кейсов
8
-
9
- | # | Тест-кейс | Статус | Evidence |
10
- |---|-----------|--------|---------|
11
- | TC-1 | Ассерт (1) присутствует в файле | PASS | `example.test.mjs:8–21` — ассерт `existsSync(join(projectRoot, '.workflow', 'state'))` присутствует |
12
- | TC-2 | Ассерт (2) присутствует в файле | PASS | `example.test.mjs:23–38` — ассерт `existsSync(rulesPath) && readFileSync(rulesPath, 'utf8').length > 0` присутствует |
13
- | TC-3 | Ассерт (1) проходит (`node --test`) | PASS | `✔ initProject creates .workflow/state/ directory (586ms)` |
14
- | TC-4 | Ассерт (2) проходит (`node --test`) | **FAIL** | `✖ initProject creates .workflow/config/agent-health-rules.yaml with non-empty content` — AssertionError |
15
- | TC-5 | Весь suite зелёный | **FAIL** | `tests 2 / pass 1 / fail 1` — exit code 1 |
16
-
17
- **Итог: 3 PASS / 2 FAIL**
18
-
19
- ---
20
-
21
- ### DEFECT-001 — `agent-health-rules.yaml` не создаётся при `initProject`
22
-
23
- **Severity:** HIGH
24
- **Компонент:** `src/init.mjs` → Step 10
25
-
26
- **Описание:**
27
- После вызова `initProject` файл `.workflow/config/agent-health-rules.yaml` не существует, что вызывает падение TC-4 и TC-5.
28
-
29
- **Корневая причина:**
30
- `init.mjs:437` пытается скопировать исходный файл:
31
- ```
32
- const agentHealthRulesSrc = join(packageRoot, 'configs', 'agent-health-rules.yaml');
33
- ```
34
- Файл `D:/Dev/workflowAi/configs/agent-health-rules.yaml` **отсутствует** в репозитории. Содержимое `configs/`:
35
- ```
36
- config.yaml
37
- pipeline.yaml
38
- ticket-movement-rules.yaml
39
- ```
40
- Строка 439 (`if (existsSync(agentHealthRulesSrc))`) молча пропускает шаг — `agent-health-rules.yaml` не копируется.
41
-
42
- **Шаги воспроизведения:**
43
- 1. `cd D:/Dev/workflowAi`
44
- 2. `node --test src/tests/example.test.mjs`
45
- 3. Второй тест падает с `AssertionError: agent-health-rules.yaml should exist and be non-empty`
46
-
47
- **Ожидаемый результат:** Файл `configs/agent-health-rules.yaml` присутствует в репозитории и копируется в `.workflow/config/` при `initProject`.
48
- **Фактический результат:** Исходный файл отсутствует, шаг копирования пропускается, тест падает.
49
-
50
- **a11y:** N/A (не UI)
51
- **Evidence:**
52
- ```
53
- ✖ initProject creates .workflow/config/agent-health-rules.yaml with non-empty content (597ms)
54
- AssertionError: agent-health-rules.yaml should exist and be non-empty
55
- actual: false, expected: true
56
- ```
57
-
58
- ---
59
-
60
- ### Критерии DoD
61
-
62
- - [x] Ассерт (1) присутствует в `example.test.mjs:14–17` и проходит — `✔`
63
- - [ ] Ассерт (2) присутствует в `example.test.mjs:31–34` — присутствует, но **не проходит** (`✖`)
64
- - [ ] Весь suite зелёный — **не выполнен** (1 fail из 2)
65
-
66
- ---
67
-
68
- **Тикет не завершён** — DoD не выполнен из-за DEFECT-001. Необходимо добавить файл `configs/agent-health-rules.yaml` в репозиторий (исправление — в зоне ответственности разработки).
69
-
70
- ---RESULT---
71
- FAIL: suite не зелёный. TC-1/TC-2 (наличие ассертов) — PASS. TC-3 (ассерт state dir) — PASS. TC-4/TC-5 — FAIL: исходный файл `D:/Dev/workflowAi/configs/agent-health-rules.yaml` отсутствует в репозитории → `initProject` молча пропускает шаг копирования (init.mjs:439) → ассерт (2) падает с AssertionError.
@@ -1,85 +0,0 @@
1
- Картина ясна. Составляю итоговый отчёт.
2
-
3
- ---
4
-
5
- ## Результат тестирования QA-NNN
6
-
7
- ### Резюме
8
-
9
- | TC | Описание | Статус |
10
- |----|----------|--------|
11
- | TC-1 | Ассерт: `.workflow/state/` существует после `initProject` | **PASS** |
12
- | TC-2 | Ассерт: `agent-health-rules.yaml` существует и непустой | **FAIL** |
13
- | — | Весь suite зелёный | **FAIL** |
14
-
15
- **Итого:** 1 passed / 1 failed / 0 blocked
16
-
17
- ---
18
-
19
- ### TC-1 — PASS
20
-
21
- **Шаги:** `initProject(projectRoot, { force: true })` → `assert.ok(existsSync(join(projectRoot, '.workflow', 'state')))`
22
-
23
- **Evidence:**
24
- ```
25
- ✔ initProject creates .workflow/state/ directory (501.599ms)
26
- ```
27
- `a11y (node:test)`: тест прошёл без ошибок.
28
-
29
- ---
30
-
31
- ### TC-2 — FAIL
32
-
33
- **Шаги:** `initProject(projectRoot, { force: true })` → `assert.ok(existsSync(rulesPath) && readFileSync(rulesPath, 'utf8').length > 0)`
34
-
35
- **Evidence:**
36
- ```
37
- ✖ initProject creates .workflow/config/agent-health-rules.yaml with non-empty content (448.8962ms)
38
- AssertionError: agent-health-rules.yaml should exist and be non-empty
39
- ```
40
-
41
- **Корневая причина:** `initProject` (строки 437–443 `init.mjs`) копирует файл только если источник `configs/agent-health-rules.yaml` существует:
42
- ```js
43
- if (existsSync(agentHealthRulesSrc)) {
44
- copyFileSync(agentHealthRulesSrc, agentHealthRulesDest);
45
- }
46
- ```
47
- Файл `configs/agent-health-rules.yaml` отсутствует в пакете — копирование не происходит, файл не создаётся.
48
-
49
- **Подтверждение:** тот же инвариант в `init.test.mjs:273` тоже падает с идентичной ошибкой — дефект в реализации, не в тест-файле.
50
-
51
- ---
52
-
53
- ### DEFECT
54
-
55
- **Severity:** HIGH
56
- **Компонент:** `src/init.mjs`, `configs/`
57
-
58
- **Описание:** `initProject` не создаёт `.workflow/config/agent-health-rules.yaml` потому что исходный файл `configs/agent-health-rules.yaml` отсутствует в пакете.
59
-
60
- **Шаги воспроизведения:**
61
- 1. `initProject('/tmp/some-project', { force: true })`
62
- 2. Проверить `existsSync('/tmp/some-project/.workflow/config/agent-health-rules.yaml')`
63
- 3. Результат: `false`
64
-
65
- **Ожидаемо:** файл создан и непустой
66
- **Фактически:** файл отсутствует (источник `configs/agent-health-rules.yaml` не найден)
67
-
68
- **Evidence:** `AssertionError: agent-health-rules.yaml should exist and be non-empty` в `src/tests/example.test.mjs:31` и `src/tests/init.test.mjs:283`.
69
-
70
- ---
71
-
72
- ### DoD
73
-
74
- - [x] Ассерт (1) присутствует в тест-файле — `src/tests/example.test.mjs:14`
75
- - [x] Ассерт (1) проходит — PASS
76
- - [x] Ассерт (2) присутствует в тест-файле — `src/tests/example.test.mjs:31`
77
- - [ ] Ассерт (2) проходит — FAIL (дефект реализации: источник файла отсутствует)
78
- - [ ] Весь suite зелёный — 1 failure
79
-
80
- ---
81
-
82
- ---RESULT---
83
- FAIL: QA-NNN
84
-
85
- Оба ассерта добавлены в `src/tests/example.test.mjs`. Ассерт (1) — PASS. Ассерт (2) — FAIL: `agent-health-rules.yaml` не создаётся, так как источник `configs/agent-health-rules.yaml` отсутствует в пакете (`src/init.mjs:439`). Дефект подтверждён независимо через `init.test.mjs:283`.
@@ -1,46 +0,0 @@
1
- {
2
- "per_model": {
3
- "claude-sonnet": {
4
- "pass_count": 3,
5
- "total": 3,
6
- "trials": [
7
- {
8
- "trial": 1,
9
- "score": 5,
10
- "passed": true
11
- },
12
- {
13
- "trial": 2,
14
- "score": 5,
15
- "passed": true
16
- },
17
- {
18
- "trial": 3,
19
- "score": 5,
20
- "passed": true
21
- }
22
- ]
23
- }
24
- },
25
- "rubric_scores": [
26
- {
27
- "agentId": "claude-sonnet",
28
- "trial": 1,
29
- "score": 5,
30
- "errored": false
31
- },
32
- {
33
- "agentId": "claude-sonnet",
34
- "trial": 2,
35
- "score": 5,
36
- "errored": false
37
- },
38
- {
39
- "agentId": "claude-sonnet",
40
- "trial": 3,
41
- "score": 5,
42
- "errored": false
43
- }
44
- ],
45
- "timestamp": "2026-04-21T08:59:39.808Z"
46
- }
@@ -1,36 +0,0 @@
1
- {
2
- "date": "2026-04-21T08:59:39.809Z",
3
- "skill_sha": "bdb379d",
4
- "status": "passed",
5
- "duration_ms": 311469,
6
- "per_model": {
7
- "claude-sonnet": {
8
- "passed": true,
9
- "errored": false,
10
- "pass_count": 3,
11
- "error_count": 0,
12
- "total": 3,
13
- "threshold": 2
14
- }
15
- },
16
- "rubric_scores": [
17
- {
18
- "agentId": "claude-sonnet",
19
- "trial": 1,
20
- "score": 5,
21
- "errored": false
22
- },
23
- {
24
- "agentId": "claude-sonnet",
25
- "trial": 2,
26
- "score": 5,
27
- "errored": false
28
- },
29
- {
30
- "agentId": "claude-sonnet",
31
- "trial": 3,
32
- "score": 5,
33
- "errored": false
34
- }
35
- ]
36
- }