workflow-ai 1.0.68 → 1.2.1

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (585)
  1. package/CHANGELOG.md +49 -0
  2. package/README.md +105 -7
  3. package/configs/pipeline.yaml +23 -2
  4. package/package.json +44 -41
  5. package/src/lib/operations/plans.mjs +85 -0
  6. package/src/lib/operations/skills.mjs +124 -0
  7. package/src/lib/operations/tickets.mjs +430 -0
  8. package/src/lib/utils.mjs +286 -286
  9. package/src/runner.mjs +314 -34
  10. package/src/scripts/check-conditions.js +2 -2
  11. package/src/scripts/get-next-id.js +8 -31
  12. package/src/scripts/pick-next-task.js +3 -9
  13. package/src/skills/coach/SKILL.md +1 -1
  14. package/src/skills/manual-testing/SKILL.md +2 -0
  15. package/src/skills/review-result/SKILL.md +1 -0
  16. package/src/scripts/tests/timeout-cascade.test.js +0 -28
  17. package/src/skills/analyze-report/README.md +0 -44
  18. package/src/skills/analyze-report/algorithms/progress-assessment.md +0 -108
  19. package/src/skills/analyze-report/knowledge/analysis-frameworks.md +0 -66
  20. package/src/skills/analyze-report/knowledge/report-structure.md +0 -61
  21. package/src/skills/analyze-report/scripts/calc-plan-metrics.js +0 -234
  22. package/src/skills/analyze-report/templates/analysis-report.md +0 -80
  23. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-1.md +0 -69
  24. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-2.md +0 -103
  25. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/claude-sonnet/trial-3.md +0 -99
  26. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/judge.json +0 -163
  27. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-1.md +0 -89
  28. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-2.md +0 -88
  29. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-deepseek/trial-3.md +0 -100
  30. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-1.md +0 -77
  31. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-2.md +0 -64
  32. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-glm/trial-3.md +0 -110
  33. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-1.md +0 -74
  34. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-2.md +0 -38
  35. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/kilo-minimax/trial-3.md +0 -61
  36. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001/current/meta.json +0 -115
  37. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-001-evidence-from-log.yaml +0 -60
  38. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-1.md +0 -90
  39. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-2.md +0 -89
  40. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/claude-sonnet/trial-3.md +0 -77
  41. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/judge.json +0 -163
  42. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-1.md +0 -84
  43. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-2.md +0 -77
  44. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-deepseek/trial-3.md +0 -89
  45. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-1.md +0 -103
  46. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-2.md +0 -103
  47. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-glm/trial-3.md +0 -103
  48. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-1.md +0 -93
  49. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-2.md +0 -93
  50. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/kilo-minimax/trial-3.md +0 -86
  51. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002/current/meta.json +0 -115
  52. package/src/skills/analyze-report/tests/cases/TC-ANALYZE-REPORT-002-result-block-format.yaml +0 -44
  53. package/src/skills/analyze-report/tests/fixtures/REPORT-002-incorrect-attribution.md +0 -27
  54. package/src/skills/analyze-report/tests/fixtures/pipeline-2026-04-06_qa-001-skip.log +0 -32
  55. package/src/skills/analyze-report/tests/index.yaml +0 -25
  56. package/src/skills/analyze-report/tests/rubrics/evidence-from-log.md +0 -22
  57. package/src/skills/analyze-report/tests/rubrics/result-block-format.md +0 -22
  58. package/src/skills/analyze-report/workflows/progress.md +0 -158
  59. package/src/skills/analyze-report/workflows/retrospective.md +0 -143
  60. package/src/skills/coach/README.md +0 -43
  61. package/src/skills/coach/SKILL.md.legacy +0 -157
  62. package/src/skills/coach/algorithms/gap-analysis.md +0 -69
  63. package/src/skills/coach/algorithms/improvement-prioritization.md +0 -62
  64. package/src/skills/coach/algorithms/skill-scoring.md +0 -80
  65. package/src/skills/coach/knowledge/audit-applied-changes-clean.txt +0 -11
  66. package/src/skills/coach/knowledge/backlog-management.md +0 -67
  67. package/src/skills/coach/knowledge/backlog-management.md.legacy +0 -90
  68. package/src/skills/coach/knowledge/common-antipatterns.md +0 -76
  69. package/src/skills/coach/knowledge/prompt-engineering.md +0 -45
  70. package/src/skills/coach/knowledge/shared-knowledge-guide.md +0 -44
  71. package/src/skills/coach/knowledge/skill-anatomy.md +0 -49
  72. package/src/skills/coach/knowledge/test-authorship.md +0 -141
  73. package/src/skills/coach/templates/audit-report.md +0 -39
  74. package/src/skills/coach/templates/coach-backlog-init.yaml +0 -14
  75. package/src/skills/coach/templates/coach-backlog-init.yaml.legacy +0 -10
  76. package/src/skills/coach/templates/improvement-plan.md +0 -42
  77. package/src/skills/coach/templates/new-skill.md +0 -95
  78. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-1.md +0 -58
  79. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-2.md +0 -65
  80. package/src/skills/coach/tests/cases/TC-COACH-001/current/claude-sonnet/trial-3.md +0 -58
  81. package/src/skills/coach/tests/cases/TC-COACH-001/current/judge.json +0 -151
  82. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-1.md +0 -46
  83. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-2.md +0 -0
  84. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-deepseek/trial-3.md +0 -75
  85. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-1.md +0 -81
  86. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-2.md +0 -101
  87. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-glm/trial-3.md +0 -91
  88. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-1.md +0 -48
  89. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-2.md +0 -30
  90. package/src/skills/coach/tests/cases/TC-COACH-001/current/kilo-minimax/trial-3.md +0 -55
  91. package/src/skills/coach/tests/cases/TC-COACH-001/current/meta.json +0 -94
  92. package/src/skills/coach/tests/cases/TC-COACH-001-evidence-based-temporal-diagram.yaml +0 -53
  93. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-1.md +0 -46
  94. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-2.md +0 -50
  95. package/src/skills/coach/tests/cases/TC-COACH-002/current/claude-sonnet/trial-3.md +0 -48
  96. package/src/skills/coach/tests/cases/TC-COACH-002/current/judge.json +0 -151
  97. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-1.md +0 -0
  98. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-2.md +0 -37
  99. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-deepseek/trial-3.md +0 -30
  100. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-1.md +0 -23
  101. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-2.md +0 -29
  102. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-glm/trial-3.md +0 -35
  103. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-1.md +0 -13
  104. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-2.md +0 -19
  105. package/src/skills/coach/tests/cases/TC-COACH-002/current/kilo-minimax/trial-3.md +0 -33
  106. package/src/skills/coach/tests/cases/TC-COACH-002/current/meta.json +0 -94
  107. package/src/skills/coach/tests/cases/TC-COACH-002-root-cause-first.yaml +0 -57
  108. package/src/skills/coach/tests/fixtures/pipeline-2026-04-06_id-collision.log +0 -77
  109. package/src/skills/coach/tests/index.yaml +0 -29
  110. package/src/skills/coach/tests/rubrics/calibration/evidence-based-bad.md +0 -13
  111. package/src/skills/coach/tests/rubrics/calibration/evidence-based-good.md +0 -29
  112. package/src/skills/coach/tests/rubrics/evidence-based.md +0 -26
  113. package/src/skills/coach/tests/rubrics/root-cause-first.md +0 -21
  114. package/src/skills/coach/workflows/analyze.md +0 -79
  115. package/src/skills/coach/workflows/analyze.md.legacy +0 -64
  116. package/src/skills/coach/workflows/audit.md +0 -74
  117. package/src/skills/coach/workflows/audit.md.legacy +0 -59
  118. package/src/skills/coach/workflows/create.md +0 -80
  119. package/src/skills/coach/workflows/create.md.legacy +0 -67
  120. package/src/skills/coach/workflows/improve.md +0 -71
  121. package/src/skills/coach/workflows/improve.md.legacy +0 -60
  122. package/src/skills/coach/workflows/research.md +0 -55
  123. package/src/skills/coach/workflows/review.md +0 -52
  124. package/src/skills/coach/workflows/review.md.legacy +0 -48
  125. package/src/skills/coach/workflows/test.md +0 -97
  126. package/src/skills/create-plan/README.md +0 -39
  127. package/src/skills/create-plan/algorithms/risk-assessment.md +0 -73
  128. package/src/skills/create-plan/knowledge/plan-completeness.md +0 -67
  129. package/src/skills/create-plan/knowledge/plan-lifecycle.md +0 -33
  130. package/src/skills/create-plan/knowledge/task-verification-pairs.md +0 -151
  131. package/src/skills/create-plan/knowledge/test-hygiene.md +0 -47
  132. package/src/skills/create-plan/scripts/validate-completeness.js +0 -182
  133. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-1.md +0 -5
  134. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-2.md +0 -39
  135. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/claude-sonnet/trial-3.md +0 -35
  136. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/judge.json +0 -167
  137. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-1.md +0 -5
  138. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-2.md +0 -10
  139. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-deepseek/trial-3.md +0 -5
  140. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-1.md +0 -26
  141. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-2.md +0 -86
  142. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-glm/trial-3.md +0 -5
  143. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-1.md +0 -11
  144. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-2.md +0 -15
  145. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/kilo-minimax/trial-3.md +0 -14
  146. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001/current/meta.json +0 -119
  147. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-001-validate-completeness.yaml +0 -41
  148. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-1.md +0 -25
  149. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-2.md +0 -30
  150. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/claude-sonnet/trial-3.md +0 -37
  151. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/judge.json +0 -164
  152. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-1.md +0 -3
  153. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-2.md +0 -11
  154. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-deepseek/trial-3.md +0 -13
  155. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-1.md +0 -44
  156. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-2.md +0 -5
  157. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-glm/trial-3.md +0 -49
  158. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-1.md +0 -6
  159. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-2.md +0 -11
  160. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/kilo-minimax/trial-3.md +0 -16
  161. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002/current/meta.json +0 -116
  162. package/src/skills/create-plan/tests/cases/TC-CREATE-PLAN-002-task-granularity.yaml +0 -39
  163. package/src/skills/create-plan/tests/index.yaml +0 -25
  164. package/src/skills/create-plan/tests/rubrics/task-granularity.md +0 -21
  165. package/src/skills/create-plan/tests/rubrics/validate-completeness.md +0 -21
  166. package/src/skills/create-plan/workflows/create.md +0 -136
  167. package/src/skills/create-report/README.md +0 -40
  168. package/src/skills/create-report/algorithms/metric-calculation.md +0 -93
  169. package/src/skills/create-report/knowledge/report-metrics.md +0 -82
  170. package/src/skills/create-report/scripts/calc-metrics.js +0 -383
  171. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-1.md +0 -25
  172. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-2.md +0 -26
  173. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/claude-sonnet/trial-3.md +0 -28
  174. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/judge.json +0 -163
  175. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-1.md +0 -4
  176. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-2.md +0 -3
  177. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-deepseek/trial-3.md +0 -6
  178. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-1.md +0 -8
  179. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-2.md +0 -12
  180. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-glm/trial-3.md +0 -7
  181. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-1.md +0 -12
  182. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-2.md +0 -22
  183. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/kilo-minimax/trial-3.md +0 -13
  184. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001/current/meta.json +0 -115
  185. package/src/skills/create-report/tests/cases/TC-CREATE-REPORT-001-root-cause-attribution.yaml +0 -57
  186. package/src/skills/create-report/tests/index.yaml +0 -20
  187. package/src/skills/create-report/tests/rubrics/root-cause-attribution.md +0 -21
  188. package/src/skills/create-report/workflows/standard.md +0 -175
  189. package/src/skills/decompose-gaps/README.md +0 -39
  190. package/src/skills/decompose-gaps/algorithms/scope-check.md +0 -110
  191. package/src/skills/decompose-gaps/knowledge/scope-validation.md +0 -65
  192. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-1.md +0 -41
  193. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-2.md +0 -41
  194. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/claude-sonnet/trial-3.md +0 -56
  195. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/judge.json +0 -164
  196. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-1.md +0 -25
  197. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-2.md +0 -17
  198. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-deepseek/trial-3.md +0 -22
  199. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-1.md +0 -25
  200. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-2.md +0 -5
  201. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-glm/trial-3.md +0 -29
  202. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-1.md +0 -27
  203. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-2.md +0 -35
  204. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/kilo-minimax/trial-3.md +0 -18
  205. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001/current/meta.json +0 -116
  206. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-001-scope-exclusion.yaml +0 -46
  207. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-1.md +0 -27
  208. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-2.md +0 -30
  209. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/claude-sonnet/trial-3.md +0 -27
  210. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/judge.json +0 -163
  211. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-1.md +0 -0
  212. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-2.md +0 -15
  213. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-deepseek/trial-3.md +0 -7
  214. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-1.md +0 -21
  215. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-2.md +0 -38
  216. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-glm/trial-3.md +0 -16
  217. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-1.md +0 -5
  218. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-2.md +0 -10
  219. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/kilo-minimax/trial-3.md +0 -9
  220. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002/current/meta.json +0 -115
  221. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-002-glob-before-write.yaml +0 -36
  222. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-1.md +0 -30
  223. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-2.md +0 -30
  224. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/claude-sonnet/trial-3.md +0 -30
  225. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/judge.json +0 -165
  226. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-1.md +0 -5
  227. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-2.md +0 -26
  228. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-deepseek/trial-3.md +0 -5
  229. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-1.md +0 -39
  230. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-2.md +0 -37
  231. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-glm/trial-3.md +0 -45
  232. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-1.md +0 -26
  233. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-2.md +0 -27
  234. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/kilo-minimax/trial-3.md +0 -7
  235. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003/current/meta.json +0 -117
  236. package/src/skills/decompose-gaps/tests/cases/TC-DECOMPOSE-GAPS-003-parent-plan-mandatory.yaml +0 -41
  237. package/src/skills/decompose-gaps/tests/index.yaml +0 -30
  238. package/src/skills/decompose-gaps/tests/rubrics/glob-before-write.md +0 -21
  239. package/src/skills/decompose-gaps/tests/rubrics/parent-plan-mandatory.md +0 -22
  240. package/src/skills/decompose-gaps/tests/rubrics/scope-exclusion.md +0 -21
  241. package/src/skills/decompose-gaps/workflows/decompose.md +0 -123
  242. package/src/skills/decompose-plan/README.md +0 -43
  243. package/src/skills/decompose-plan/algorithms/deduplication.md +0 -101
  244. package/src/skills/decompose-plan/knowledge/atomicity-checklist.md +0 -139
  245. package/src/skills/decompose-plan/knowledge/capabilities.md +0 -68
  246. package/src/skills/decompose-plan/knowledge/human-task-rules.md +0 -82
  247. package/src/skills/decompose-plan/knowledge/scope-guard-checklist.md +0 -73
  248. package/src/skills/decompose-plan/scripts/check-atomicity-limit.js +0 -47
  249. package/src/skills/decompose-plan/scripts/check-duplicates.js +0 -323
  250. package/src/skills/decompose-plan/scripts/verify-atomicity.js +0 -408
  251. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-1.md +0 -30
  252. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-2.md +0 -36
  253. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/claude-sonnet/trial-3.md +0 -37
  254. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/judge.json +0 -163
  255. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-1.md +0 -20
  256. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-2.md +0 -17
  257. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-deepseek/trial-3.md +0 -28
  258. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-1.md +0 -114
  259. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-2.md +0 -137
  260. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-glm/trial-3.md +0 -188
  261. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-1.md +0 -0
  262. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-2.md +0 -32
  263. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/kilo-minimax/trial-3.md +0 -110
  264. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001/current/meta.json +0 -115
  265. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-001-atomicity-no-1to1.yaml +0 -56
  266. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-1.md +0 -47
  267. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-2.md +0 -54
  268. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/claude-sonnet/trial-3.md +0 -43
  269. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/judge.json +0 -163
  270. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-1.md +0 -15
  271. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-2.md +0 -5
  272. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-deepseek/trial-3.md +0 -12
  273. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-1.md +0 -34
  274. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-2.md +0 -30
  275. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-glm/trial-3.md +0 -35
  276. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-1.md +0 -0
  277. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-2.md +0 -31
  278. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/kilo-minimax/trial-3.md +0 -0
  279. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002/current/meta.json +0 -115
  280. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-002-get-next-id-mandatory.yaml +0 -44
  281. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-1.md +0 -21
  282. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-2.md +0 -38
  283. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/claude-sonnet/trial-3.md +0 -30
  284. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/judge.json +0 -163
  285. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-1.md +0 -31
  286. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-2.md +0 -35
  287. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-deepseek/trial-3.md +0 -48
  288. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-1.md +0 -167
  289. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-2.md +0 -62
  290. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-glm/trial-3.md +0 -174
  291. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-1.md +0 -0
  292. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-2.md +0 -0
  293. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/kilo-minimax/trial-3.md +0 -0
  294. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003/current/meta.json +0 -115
  295. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-003-verbatim-dod-transfer.yaml +0 -42
  296. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-1.md +0 -55
  297. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-2.md +0 -49
  298. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/claude-sonnet/trial-3.md +0 -49
  299. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/judge.json +0 -163
  300. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-1.md +0 -104
  301. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-2.md +0 -45
  302. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-deepseek/trial-3.md +0 -58
  303. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-1.md +0 -193
  304. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-2.md +0 -202
  305. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-glm/trial-3.md +0 -155
  306. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-1.md +0 -52
  307. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-2.md +0 -17
  308. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/kilo-minimax/trial-3.md +0 -0
  309. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004/current/meta.json +0 -115
  310. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-004-executor-atomicity.yaml +0 -64
  311. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-1.md +0 -59
  312. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-2.md +0 -204
  313. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/claude-sonnet/trial-3.md +0 -213
  314. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/judge.json +0 -163
  315. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-1.md +0 -0
  316. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-2.md +0 -57
  317. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-deepseek/trial-3.md +0 -54
  318. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-1.md +0 -147
  319. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-2.md +0 -165
  320. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-glm/trial-3.md +0 -133
  321. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-1.md +0 -81
  322. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-2.md +0 -108
  323. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/kilo-minimax/trial-3.md +0 -3
  324. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005/current/meta.json +0 -114
  325. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-005-capabilities-registry.yaml +0 -78
  326. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-1.md +0 -225
  327. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-2.md +0 -66
  328. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/claude-sonnet/trial-3.md +0 -36
  329. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/judge.json +0 -163
  330. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-1.md +0 -42
  331. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-2.md +0 -67
  332. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-deepseek/trial-3.md +0 -40
  333. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-1.md +0 -122
  334. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-2.md +0 -131
  335. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-glm/trial-3.md +0 -138
  336. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-1.md +0 -41
  337. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-2.md +0 -88
  338. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/kilo-minimax/trial-3.md +0 -0
  339. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006/current/meta.json +0 -115
  340. package/src/skills/decompose-plan/tests/cases/TC-DECOMPOSE-PLAN-006-dod-threshold.yaml +0 -72
  341. package/src/skills/decompose-plan/tests/index.yaml +0 -45
  342. package/src/skills/decompose-plan/tests/rubrics/atomicity-no-1to1.md +0 -21
  343. package/src/skills/decompose-plan/tests/rubrics/capabilities-registry.md +0 -21
  344. package/src/skills/decompose-plan/tests/rubrics/dod-threshold.md +0 -21
  345. package/src/skills/decompose-plan/tests/rubrics/executor-atomicity.md +0 -21
  346. package/src/skills/decompose-plan/tests/rubrics/get-next-id-mandatory.md +0 -21
  347. package/src/skills/decompose-plan/tests/rubrics/verbatim-dod-transfer.md +0 -21
  348. package/src/skills/decompose-plan/workflows/decompose.md +0 -305
  349. package/src/skills/deep-research/README.md +0 -36
  350. package/src/skills/deep-research/algorithms/source-scoring.md +0 -63
  351. package/src/skills/deep-research/algorithms/synthesis.md +0 -67
  352. package/src/skills/deep-research/knowledge/data-validation.md +0 -44
  353. package/src/skills/deep-research/knowledge/perplexity-config.md +0 -30
  354. package/src/skills/deep-research/knowledge/research-methodology.md +0 -54
  355. package/src/skills/deep-research/knowledge/source-evaluation.md +0 -33
  356. package/src/skills/deep-research/scripts/perplexity-research.js +0 -315
  357. package/src/skills/deep-research/templates/brief-summary.md +0 -25
  358. package/src/skills/deep-research/templates/research-report.md +0 -76
  359. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-1.md +0 -48
  360. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-2.md +0 -88
  361. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/claude-haiku/trial-3.md +0 -56
  362. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/judge.json +0 -163
  363. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-1.md +0 -58
  364. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-2.md +0 -249
  365. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-free/trial-3.md +0 -44
  366. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-1.md +0 -96
  367. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-2.md +0 -56
  368. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm/trial-3.md +0 -94
  369. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-1.md +0 -11
  370. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-2.md +0 -1
  371. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/kilo-glm-air/trial-3.md +0 -1
  372. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001/current/meta.json +0 -115
  373. package/src/skills/deep-research/tests/cases/TC-DEEP-RESEARCH-001-self-check-url.yaml +0 -58
  374. package/src/skills/deep-research/tests/index.yaml +0 -20
  375. package/src/skills/deep-research/tests/rubrics/self-check-url.md +0 -34
  376. package/src/skills/deep-research/workflows/base-checklist.md +0 -19
  377. package/src/skills/deep-research/workflows/benchmark.md +0 -38
  378. package/src/skills/deep-research/workflows/competitor.md +0 -44
  379. package/src/skills/deep-research/workflows/custom.md +0 -32
  380. package/src/skills/deep-research/workflows/market.md +0 -44
  381. package/src/skills/deep-research/workflows/technology.md +0 -40
  382. package/src/skills/deep-research/workflows/trend.md +0 -40
  383. package/src/skills/execute-task/README.md +0 -44
  384. package/src/skills/execute-task/algorithms/execution-strategy.md +0 -136
  385. package/src/skills/execute-task/knowledge/context-checkpoints.md +0 -75
  386. package/src/skills/execute-task/knowledge/ticket-structure.md +0 -70
  387. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-1.md +0 -5
  388. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-2.md +0 -5
  389. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/claude-haiku/trial-3.md +0 -5
  390. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/judge.json +0 -124
  391. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-1.md +0 -4
  392. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-2.md +0 -4
  393. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-free/trial-3.md +0 -4
  394. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-1.md +0 -4
  395. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-2.md +0 -4
  396. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/kilo-glm-air/trial-3.md +0 -11
  397. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001/current/meta.json +0 -88
  398. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-001-no-ticket-creation.yaml +0 -48
  399. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-1.md +0 -5
  400. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-2.md +0 -6
  401. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/claude-haiku/trial-3.md +0 -5
  402. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/judge.json +0 -124
  403. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-1.md +0 -4
  404. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-2.md +0 -4
  405. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-free/trial-3.md +0 -8
  406. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-1.md +0 -9
  407. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-2.md +0 -26
  408. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/kilo-glm-air/trial-3.md +0 -4
  409. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002/current/meta.json +0 -89
  410. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-002-no-duplicate-dod.yaml +0 -44
  411. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-1.md +0 -5
  412. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-2.md +0 -5
  413. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/claude-haiku/trial-3.md +0 -5
  414. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/judge.json +0 -46
  415. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003/current/meta.json +0 -37
  416. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-003-verification-proportionality.yaml +0 -46
  417. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-1.md +0 -18
  418. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-2.md +0 -16
  419. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/claude-haiku/trial-3.md +0 -14
  420. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/judge.json +0 -124
  421. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-1.md +0 -5
  422. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-2.md +0 -5
  423. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-free/trial-3.md +0 -1
  424. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-1.md +0 -8
  425. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-2.md +0 -5
  426. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/kilo-glm-air/trial-3.md +0 -4
  427. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004/current/meta.json +0 -89
  428. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-004-no-foreign-ticket-edit.yaml +0 -50
  429. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-1.md +0 -5
  430. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-2.md +0 -5
  431. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/claude-haiku/trial-3.md +0 -5
  432. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/judge.json +0 -124
  433. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-1.md +0 -15
  434. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-2.md +0 -4
  435. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-free/trial-3.md +0 -5
  436. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-1.md +0 -11
  437. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-2.md +0 -11
  438. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/kilo-glm-air/trial-3.md +0 -4
  439. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005/current/meta.json +0 -88
  440. package/src/skills/execute-task/tests/cases/TC-EXECUTE-TASK-005-ticket-fields-updated.yaml +0 -39
  441. package/src/skills/execute-task/tests/fixtures/IMPL-902-create-file.md +0 -41
  442. package/src/skills/execute-task/tests/fixtures/IMPL-904-current-task.md +0 -40
  443. package/src/skills/execute-task/tests/fixtures/IMPL-906-fill-ticket.md +0 -42
  444. package/src/skills/execute-task/tests/fixtures/QA-901-button-click.md +0 -41
  445. package/src/skills/execute-task/tests/fixtures/QA-903-visual-figma.md +0 -40
  446. package/src/skills/execute-task/tests/fixtures/TASK-905-done-with-typo.md +0 -36
  447. package/src/skills/execute-task/tests/index.yaml +0 -39
  448. package/src/skills/execute-task/tests/rubrics/no-duplicate-dod.md +0 -22
  449. package/src/skills/execute-task/tests/rubrics/no-foreign-ticket-edit.md +0 -20
  450. package/src/skills/execute-task/tests/rubrics/no-ticket-creation.md +0 -21
  451. package/src/skills/execute-task/tests/rubrics/ticket-fields-updated.md +0 -23
  452. package/src/skills/execute-task/tests/rubrics/verification-proportionality.md +0 -22
  453. package/src/skills/execute-task/workflows/execute.md +0 -104
  454. package/src/skills/manual-testing/README.md +0 -63
  455. package/src/skills/manual-testing/algorithms/blocked-tool-strategy.md +0 -74
  456. package/src/skills/manual-testing/algorithms/bug-severity.md +0 -73
  457. package/src/skills/manual-testing/algorithms/mcp-budget.md +0 -97
  458. package/src/skills/manual-testing/algorithms/test-prioritization.md +0 -69
  459. package/src/skills/manual-testing/knowledge/browser-extension-testing.md +0 -102
  460. package/src/skills/manual-testing/knowledge/browser-tools.md +0 -114
  461. package/src/skills/manual-testing/knowledge/desktop-tools-advanced.md +0 -92
  462. package/src/skills/manual-testing/knowledge/desktop-tools-core.md +0 -76
  463. package/src/skills/manual-testing/knowledge/sandbox-advanced.md +0 -83
  464. package/src/skills/manual-testing/knowledge/sandbox-core.md +0 -67
  465. package/src/skills/manual-testing/knowledge/stateful-edge-cases.md +0 -69
  466. package/src/skills/manual-testing/knowledge/test-case-design.md +0 -107
  467. package/src/skills/manual-testing/knowledge/testing-types.md +0 -45
  468. package/src/skills/manual-testing/templates/bug-report.md +0 -52
  469. package/src/skills/manual-testing/templates/test-case.md +0 -34
  470. package/src/skills/manual-testing/templates/test-plan.md +0 -97
  471. package/src/skills/manual-testing/templates/test-session-report.md +0 -56
  472. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-1.md +0 -34
  473. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-2.md +0 -32
  474. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/claude-sonnet/trial-3.md +0 -30
  475. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/judge.json +0 -163
  476. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-1.md +0 -0
  477. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-2.md +0 -7
  478. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-deepseek/trial-3.md +0 -0
  479. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-1.md +0 -4
  480. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-2.md +0 -15
  481. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-glm/trial-3.md +0 -8
  482. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-1.md +0 -5
  483. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-2.md +0 -7
  484. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/kilo-minimax/trial-3.md +0 -7
  485. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001/current/meta.json +0 -114
  486. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-001-sandbox-mandatory.yaml +0 -38
  487. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-1.md +0 -44
  488. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-2.md +0 -32
  489. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/claude-sonnet/trial-3.md +0 -47
  490. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/judge.json +0 -163
  491. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-1.md +0 -19
  492. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-2.md +0 -15
  493. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-deepseek/trial-3.md +0 -24
  494. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-1.md +0 -19
  495. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-2.md +0 -13
  496. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-glm/trial-3.md +0 -18
  497. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-1.md +0 -21
  498. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-2.md +0 -15
  499. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/kilo-minimax/trial-3.md +0 -14
  500. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002/current/meta.json +0 -114
  501. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-002-visual-tc-screenshot.yaml +0 -37
  502. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-1.md +0 -76
  503. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-2.md +0 -71
  504. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/claude-sonnet/trial-3.md +0 -85
  505. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/judge.json +0 -46
  506. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003/current/meta.json +0 -36
  507. package/src/skills/manual-testing/tests/cases/TC-MANUAL-TESTING-003-qa-non-ui-assertion.yaml +0 -65
  508. package/src/skills/manual-testing/tests/index.yaml +0 -30
  509. package/src/skills/manual-testing/tests/last-run-tc001-sonnet.log +0 -140
  510. package/src/skills/manual-testing/tests/last-run-tc002.log +0 -1
  511. package/src/skills/manual-testing/tests/last-run.log +0 -1469
  512. package/src/skills/manual-testing/tests/rubrics/qa-non-ui-assertion.md +0 -31
  513. package/src/skills/manual-testing/tests/rubrics/sandbox-mandatory.md +0 -20
  514. package/src/skills/manual-testing/tests/rubrics/visual-tc-screenshot.md +0 -21
  515. package/src/skills/manual-testing/workflows/acceptance.md +0 -80
  516. package/src/skills/manual-testing/workflows/exploratory.md +0 -84
  517. package/src/skills/manual-testing/workflows/regression.md +0 -76
  518. package/src/skills/manual-testing/workflows/smoke.md +0 -109
  519. package/src/skills/manual-testing/workflows/test-plan.md +0 -75
  520. package/src/skills/review-result/README.md +0 -59
  521. package/src/skills/review-result/algorithms/verification.md +0 -112
  522. package/src/skills/review-result/knowledge/dod-patterns.md +0 -115
  523. package/src/skills/review-result/knowledge/test-hygiene.md +0 -44
  524. package/src/skills/review-result/scripts/verify-artifacts.js +0 -497
  525. package/src/skills/review-result/templates/verdict.md +0 -153
  526. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-1.md +0 -22
  527. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-2.md +0 -7
  528. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-haiku/trial-3.md +0 -21
  529. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-1.md +0 -6
  530. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-2.md +0 -6
  531. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/claude-sonnet/trial-3.md +0 -18
  532. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/judge.json +0 -164
  533. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-1.md +0 -5
  534. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-2.md +0 -7
  535. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-deepseek/trial-3.md +0 -6
  536. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-1.md +0 -49
  537. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-2.md +0 -28
  538. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-glm/trial-3.md +0 -37
  539. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-1.md +0 -22
  540. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-2.md +0 -13
  541. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/kilo-minimax/trial-3.md +0 -21
  542. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001/current/meta.json +0 -116
  543. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-001-visual-tc-trigger.yaml +0 -51
  544. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-1.md +0 -23
  545. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-2.md +0 -22
  546. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-haiku/trial-3.md +0 -28
  547. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-1.md +0 -4
  548. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-2.md +0 -36
  549. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/claude-sonnet/trial-3.md +0 -4
  550. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/judge.json +0 -163
  551. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-1.md +0 -4
  552. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-2.md +0 -0
  553. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-deepseek/trial-3.md +0 -4
  554. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-1.md +0 -39
  555. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-2.md +0 -25
  556. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-glm/trial-3.md +0 -32
  557. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-1.md +0 -34
  558. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-2.md +0 -8
  559. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/kilo-minimax/trial-3.md +0 -23
  560. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002/current/meta.json +0 -115
  561. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-002-path-line-suffix.yaml +0 -39
  562. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-1.md +0 -7
  563. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-2.md +0 -7
  564. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/claude-sonnet/trial-3.md +0 -7
  565. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/judge.json +0 -163
  566. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-1.md +0 -5
  567. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-2.md +0 -5
  568. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-deepseek/trial-3.md +0 -11
  569. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-1.md +0 -16
  570. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-2.md +0 -18
  571. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-glm/trial-3.md +0 -17
  572. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-1.md +0 -17
  573. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-2.md +0 -31
  574. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/kilo-minimax/trial-3.md +0 -5
  575. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003/current/meta.json +0 -115
  576. package/src/skills/review-result/tests/cases/TC-REVIEW-RESULT-003-test-isolation.yaml +0 -50
  577. package/src/skills/review-result/tests/fixtures/IMPL-902-path-with-line.md +0 -43
  578. package/src/skills/review-result/tests/fixtures/QA-901-visual-button.md +0 -46
  579. package/src/skills/review-result/tests/fixtures/QA-904-test-isolation-violation/QA-904.md +0 -51
  580. package/src/skills/review-result/tests/fixtures/QA-904-test-isolation-violation/example-test.mjs +0 -36
  581. package/src/skills/review-result/tests/index.yaml +0 -30
  582. package/src/skills/review-result/tests/rubrics/path-line-suffix.md +0 -19
  583. package/src/skills/review-result/tests/rubrics/test-isolation.md +0 -20
  584. package/src/skills/review-result/tests/rubrics/visual-tc-trigger.md +0 -19
  585. package/src/skills/review-result/workflows/review.md +0 -209
@@ -1,77 +0,0 @@
1
- Now I have all the context. Let me produce the analysis.
2
-
3
- ---
4
-
5
- # Анализ: Прогресс PLAN-001
6
-
7
- **Дата анализа:** 2026-04-20
8
- **Анализируемый план:** PLAN-001
9
- **Анализируемый отчёт:** REPORT-002
10
- **Тип анализа:** PROGRESS
11
-
12
- ---
13
-
14
- ## Executive Summary
15
-
16
- При верификации REPORT-002 по логу пайплайна обнаружена **некорректная атрибуция** root cause пропуска тикета QA-001. Предыдущий отчёт возложил вину на стейдж проверки условий, однако лог однозначно показывает, что решение о пропуске принял стейдж `check-relevance` (строка 26 лога: `status="irrelevant"`, `reason="dependencies_inactive"`). Требуется исправление логики релевантности и корректировка отчёта.
17
-
18
- ---
19
-
20
- ## Ключевые находки
21
-
22
- ### 1. Некорректная атрибуция root cause в REPORT-002
23
- **Уверенность:** [HIGH]
24
- **Данные из лога:**
25
-
26
- | Шаг | Стейдж | Скрипт | Результат | Строка лога |
27
- |-----|--------|--------|-----------|-------------|
28
- | 313 | `check-conditions` | `check-conditions.js` | `conditions_ok` (dependencies.resolved=true, prerequisites.met=true, blocking_tickets=[]) | 16–17 |
29
- | **314** | **`check-relevance`** | **`check-relevance.js`** | **`irrelevant` (dependencies.status=inactive, reason=dependencies_inactive)** | **26** |
30
- | 315 | `skip-ticket` | `script-skip` | `skipped` (reason from check-relevance: dependencies_inactive) | 31 |
31
-
32
- Стейдж проверки условий **успешно передал** тикет дальше (result=`conditions_ok`). Итоговое решение `irrelevant` принял стейдж `check-relevance`. Атрибуция в REPORT-002 ошибочна.
33
-
34
- ### 2. Противоречие между стейджами
35
- **Уверенность:** [HIGH]
36
- **Данные:** `check-conditions` зафиксировал `dependencies.resolved: true` (строка 13), а `check-relevance` — `dependencies.status: inactive` (строка 24). Оба стейджа проверяют зависимости, но получают разные результаты. Вероятно, стейджи используют разные источники данных или разные критерии оценки зависимостей.
37
-
38
- ---
39
-
40
- ## Проблемы и риски
41
-
42
- | # | Проблема | Серьёзность | Данные из лога | Рекомендация |
43
- |---|---------|-------------|----------------|-------------|
44
- | 1 | `check-relevance.js` ошибочно признал QA-001 нерелевантным при разрешённых зависимостях | HIGH | Стр. 24: `dependencies.status: inactive` при `dependencies.resolved: true` (стр. 13) | Исправить логику `check-relevance.js`: синхронизировать проверку статуса зависимостей с `check-conditions` |
45
- | 2 | Расхождение данных о зависимостях между стейджами | HIGH | `resolved: true` vs `status: inactive` для одних и тех же зависимостей | Унифицировать источник данных о зависимостях между стейджами |
46
- | 3 | Некорректная атрибуция в предыдущем отчёте | MEDIUM | REPORT-002 называет неверный root cause | Исправить REPORT-002: указать `check-relevance.js` как источник решения о skip |
47
-
48
- ---
49
-
50
- ## Рекомендации
51
-
52
- | # | Действие | Приоритет | Почему | Ожидаемый результат |
53
- |---|---------|-----------|--------|-------------------|
54
- | 1 | Исправить логику оценки зависимостей в `check-relevance.js` — сверять `dependencies.resolved` с результатом `check-conditions` | CRITICAL | Стейдж проигнорировал `resolved=true` и принял решение по `status=inactive` | QA-001 и аналогичные тикеты не пропускаются ошибочно |
55
- | 2 | Унифицировать источник данных о зависимостях между стейджами `check-conditions` и `check-relevance` | HIGH | Противоречивые данные для одного тикета (стр. 13 vs стр. 24) | Единая картина состояния зависимостей |
56
- | 3 | Добавить кросс-валидацию: если `check-conditions` вернул `conditions_ok`, `check-relevance` не должен пропускать по тем же зависимостям | HIGH | Предотвращение противоречивых решений в рамках одного пайплайна | Исключение ситуации, когда один стейдж одобряет, а следующий — отклоняет по тому же критерию |
57
-
58
- ---
59
-
60
- ## За пределами скоупа
61
-
62
- - Причины, по которым `dependencies.status` стал `inactive` — требуется анализ данных тикета QA-001 и его зависимостей, что выходит за рамки анализа лога.
63
-
64
- ---
65
-
66
- ## Решение
67
-
68
- **Статус плана:** AT_RISK — тикет QA-001 ошибочно пропущен из-за бага в `check-relevance.js`, требуется исправление до следующей итерации.
69
- **Рекомендуемое действие:** скорректировать — исправить `check-relevance.js` и перезапустить QA-001.
70
-
71
- ---
72
-
73
- ---RESULT---
74
- status: has_gaps
75
- report_id: REPORT-002
76
- gaps: "Тикет QA-001 ошибочно пропущен стейджем check-relevance (атрибут dependencies.status=inactive при dependencies.resolved=true). Некорректная атрибуция в предыдущем отчёте исправлена: root cause — check-relevance.js, а не check-conditions.js."
77
- ---RESULT---
@@ -1,64 +0,0 @@
1
- # REPORT-002 (исправленный) — Верификация атрибуции root cause для QA-001
2
-
3
- **Дата:** 2026-04-06
4
- **План:** PLAN-001
5
- **Источник:** верификация REPORT-002 по логу `pipeline-2026-04-06_qa-001-skip.log`
6
-
7
- ## Executive Summary
8
-
9
- Предыдущий отчёт REPORT-002 неверно атрибутировал root cause пропуска QA-001 стейджу `check-conditions.js`. Верификация по логу пайплайна однозначно показывает: стейдж `check-conditions` отработал корректно (`conditions_ok`), а решение о skip принято стейджем `check-relevance` на основании признака `dependencies.status: inactive`. Корректный root cause — `check-relevance.js`.
10
-
11
- ## Верификация по логу (пошаговая)
12
-
13
- | Step | Стейдж | Результат | Вклад в skip |
14
- |------|--------|-----------|-------------|
15
- | 313 | `check-conditions` | `conditions_ok` (deps resolved: true, prerequisites met: true) | **Нет** — передал тикет дальше |
16
- | 314 | `check-relevance` | `irrelevant` (reason: `dependencies_inactive`) | **Да** — принял решение о нерелевантности |
17
- | 315 | `skip-ticket` | `skipped` (reason from check-relevance: `dependencies_inactive`) | Исполнитель решения step 314 |
18
-
19
- ### Ключевое противоречие в отчёте
20
-
21
- REPORT-002 утверждает: _«`check-conditions.js` — стейдж неверно определил, что условия запуска не выполнены»_. Лог показывает обратное: `check-conditions` определил условия **выполненными** и передал тикет дальше. `check-relevance` — это совершенно отдельный стейдж, который проверяет **актуальность** (relevance), а не условия запуска.
22
-
23
- **Природа ошибки в REPORT-002:** смешение двух разных стейджей — `check-conditions` (условия запуска) и `check-relevance` (актуальность тикета). Решение принял `check-relevance`.
24
-
25
- ## Исправленные находки
26
-
27
- ### QA-001 — тикет ошибочно пропущен
28
-
29
- | Поле | Было в REPORT-002 | Исправлено по логу |
30
- |------|-------------------|--------------------|
31
- | **Root cause** | `check-conditions.js` | **`check-relevance.js`** `[HIGH]` |
32
- | **Механизм** | Неверно определены условия запуска | Стейдж `check-relevance` определил `dependencies.status: inactive`, хотя `check-conditions` зафиксировал `dependencies.resolved: true` |
33
- | **Затронутые компоненты** | `check-conditions.js` | **`check-relevance.js`**, источник данных о статусе зависимостей |
34
- | **Приоритет** | HIGH | HIGH |
35
-
36
- ### Дополнительная находка: рассогласование данных
37
-
38
- Между стейджами `check-conditions` и `check-relevance` зафиксировано **противоречивое состояние зависимостей**:
39
-
40
- - `check-conditions` (step 313): `dependencies.resolved: true`
41
- - `check-relevance` (step 314): `dependencies.status: inactive`
42
-
43
- Оба стейджа запрашивают статус зависимостей, но получают **разные результаты**. Возможные причины: разные источники данных, кэширование, race condition. Уровень уверенности: `[MEDIUM]` — требуется дополнительное расследование.
44
-
45
- ## Исправленные рекомендации
46
-
47
- | # | Действие | Приоритет | Обоснование |
48
- |---|----------|-----------|-------------|
49
- | 1 | Пересмотреть логику проверки `dependencies.status` в **`check-relevance.js`** и выяснить, почему статус `inactive` при `resolved: true` | **CRITICAL** | Именно этот стейдж принял ошибочное решение о skip |
50
- | 2 | Унифицировать источник данных о зависимостях между `check-conditions` и `check-relevance` | **HIGH** | Рассогласование данных между стейджами — системная проблема |
51
- | 3 | Добавить cross-check: если `check-conditions` дал `conditions_ok`, а `check-relevance` — `irrelevant` по зависимостям, логировать warning | **MEDIUM** | Раннее обнаружение рассогласований |
52
-
53
- ## За пределами скоупа
54
-
55
- - Почему `dependencies.status` вернул `inactive` в `check-relevance` — требует доступа к состоянию зависимостей тикета на момент итерации.
56
- - Были ли другие тикеты с аналогичной проблемой в этой итерации — требует полного лога.
57
-
58
- ---
59
-
60
- ---RESULT---
61
- status: has_gaps
62
- report_id: REPORT-002
63
- gaps: "Root cause пропуска QA-001 неверно атрибутирован в REPORT-002: виновен check-relevance.js, а не check-conditions.js. Обнаружено рассогласование данных о зависимостях между стейджами. Требуется исправление логики check-relevance.js и унификация источника данных."
64
- ---RESULT---
@@ -1,110 +0,0 @@
1
- Данные загружены. Теперь я провожу верификацию по логу пайплайна и формирую отчёт анализа.
2
-
3
- # Анализ: PROGRESS
4
-
5
- **Дата анализа:** 2026-04-20
6
- **Анализируемый план:** PLAN-001
7
- **Анализируемый отчёт:** REPORT-002
8
- **Тип анализа:** PROGRESS
9
-
10
- ---
11
-
12
- ## Executive Summary
13
-
14
- Отчёт REPORT-002 содержит **неверную атрибуцию** root cause пропуска тикета QA-001. Стейдж `check-conditions` корректно пропустил тикет дальше (status=`conditions_ok`), а решение о skip принял стейдж `check-relevance` (reason=`dependencies_inactive`). Также обнаружено противоречие между оценками двух стейджей: `check-conditions` считает зависимости разрешёнными, а `check-relevance` — неактивными. Требуется исправление отчёта и диагностика расхождения в логике стейджей.
15
-
16
- ---
17
-
18
- ## Метрики
19
-
20
- Данные для количественных метрик ограничены — лог содержит только траекторию одного тикета (QA-001). Метрики рассчитаны на основе доступных данных.
21
-
22
- | Метрика | Значение | Статус |
23
- |---------|----------|--------|
24
- | Тикетов в логе | 1 (QA-001) | — |
25
- | Успешно обработано | 0 | 🔴 |
26
- | Пропущено (skipped) | 1 | 🔴 |
27
- | Неверная атрибуция в отчёте | 1 finding | 🔴 |
28
-
29
- ---
30
-
31
- ## Ключевые находки
32
-
33
- ### 1. Неверная атрибуция root cause в REPORT-002 [HIGH]
34
-
35
- **Уверенность:** [HIGH]
36
- **Данные:** REPORT-002 (строки 17–21) атрибутирует root cause стейджу `check-conditions.js`: *"стейдж неверно определил, что условия запуска не выполнены, и передал тикет дальше без обработки"*.
37
-
38
- **Верификация по логу** (`pipeline-2026-04-06_qa-001-skip.log`):
39
-
40
- | Шаг | Стейдж | Строка лога | Решение | Факт |
41
- |-----|--------|-------------|---------|------|
42
- | 313 | `check-conditions` | строки 8–17 | `conditions_ok` | Стейдж **пропустил** тикет дальше, все проверки пройдены |
43
- | 314 | `check-relevance` | строки 19–26 | `irrelevant` (reason: `dependencies_inactive`) | Стейдж **принял решение о skip** |
44
- | 315 | `skip-ticket` | строки 28–32 | `skipped` (reason from check-relevance: `dependencies_inactive`) | Подтверждает источник решения |
45
-
46
- **Вывод:** Root cause — `check-relevance` / `check-relevance.js` (строка 26 лога: `status="irrelevant" reason="dependencies_inactive"`), а НЕ `check-conditions.js`, как указано в REPORT-002.
47
-
48
- ### 2. Противоречие между оценками двух стейджей [HIGH]
49
-
50
- **Уверенность:** [HIGH]
51
- **Данные из лога:**
52
-
53
- | Стейдж | Проверка | Результат | Строка лога |
54
- |--------|----------|-----------|-------------|
55
- | `check-conditions` | `dependencies.resolved` | `true` | строка 13 |
56
- | `check-conditions` | `prerequisites.met` | `true` | строка 14 |
57
- | `check-conditions` | `blocking_tickets` | `[]` | строка 15 |
58
- | `check-relevance` | `dependencies.status` | `inactive` | строка 24 |
59
-
60
- Стейдж `check-conditions` проверяет `dependencies.resolved` (true), а `check-relevance` проверяет `dependencies.status` (inactive). Это **разные поля с разной семантикой**. Тикет QA-001 прошёл все условия запуска, но был признан нерелевантным из-за неактивного статуса зависимостей — вероятно, зависимости технически разрешены, но сами зависимые тикеты/компоненты неактивны.
61
-
62
- ---
63
-
64
- ## Проблемы и риски
65
-
66
- | # | Проблема | Серьёзность | Данные (evidence из лога) | Рекомендация |
67
- |---|---------|-------------|--------------------------|--------------|
68
- | 1 | REPORT-002 неверно атрибутировал root cause: указан `check-conditions.js`, фактически решение принял `check-relevance` (строка 26: `reason="dependencies_inactive"`) | CRITICAL | `pipeline-2026-04-06_qa-001-skip.log:26` | Пересоздать отчёт с корректной атрибуцией |
69
- | 2 | Два стейджа дают противоречивую оценку зависимостей: `check-conditions` → resolved, `check-relevance` → inactive | HIGH | Строки 13 vs 24 лога | Диагностировать расхождение: уточнить семантику `dependencies.resolved` vs `dependencies.status` |
70
- | 3 | Тикет QA-001 пропущен по критерию `dependencies_inactive`, несмотря на пройденные условия запуска | HIGH | Строки 16, 26 лога | Пересмотреть логику стейджа `check-relevance.js`: пропускать ли тикеты с resolved=true но inactive зависимостями |
71
-
72
- ---
73
-
74
- ## Рекомендации
75
-
76
- | # | Действие | Приоритет | Почему | Ожидаемый результат |
77
- |---|---------|-----------|--------|-------------------|
78
- | 1 | Пересоздать REPORT-002 с корректной атрибуцией: root cause — `check-relevance.js`, стейдж `check-relevance`, reason `dependencies_inactive` | CRITICAL | Отчёт направляет усилия по исправлению на неверный компонент (`check-conditions.js` вместо `check-relevance.js`). Исправление не того файла не решит проблему. | Корректный отчёт, направляющий исправления на нужный компонент |
79
- | 2 | Диагностировать расхождение: почему `check-conditions` видит `dependencies.resolved: true`, а `check-relevance` — `dependencies.status: inactive` | HIGH | Противоречивые оценки между стейджами создают неопределённость и потенциально пропускают валидные тикеты | Унификация семантики полей зависимостей или устранение дублирующей проверки |
80
- | 3 | Пересмотреть логику `check-relevance.js`: тикет с `dependencies.resolved: true` и `prerequisites.met: true` не должен признаваться `irrelevant` | HIGH | Стейдж `check-relevance` отменяет результат `check-conditions`, используя другой критерий, что нарушает целостность пайплайна (лог: строки 16 vs 26) | QA-001 и аналогичные тикеты не будут ошибочно пропускаться |
81
-
82
- ---
83
-
84
- ## За пределами скоупа
85
-
86
- - Количественные метрики по всему плану PLAN-001 (completion rate, throughput) — лог содержит данные только по одному тикету.
87
- - Анализ остальных 4 тикетов из итерации — нет данных в логе.
88
-
89
- ---
90
-
91
- ## Решение
92
-
93
- **Статус плана:** 🟠 ATTENTION (тикеты пропускаются из-за дефектов в логике пайплайна)
94
- **Рекомендуемое действие:** скорректировать — исправить отчёт и логику `check-relevance.js` перед следующей итерацией
95
-
96
- ---
97
-
98
- ## Self-check
99
-
100
- - [x] Секция **Result** заполнена
101
- - [x] Каждый вывод подкреплён конкретными данными из лога (указаны номера строк)
102
- - [x] Каждая рекомендация actionable (содержит конкретное действие и компонент)
103
- - [x] Неверная атрибуция обнаружена и задокументирована как CRITICAL finding
104
- - [x] Все findings с уверенностью HIGH имеют цитаты из лога
105
-
106
- ---RESULT---
107
- status: has_gaps
108
- report_id: REPORT-002
109
- gaps: "Отчёт REPORT-002 содержит неверную атрибуцию root cause (check-conditions.js вместо check-relevance.js). Обнаружено противоречие между стейджами check-conditions и check-relevance в оценке зависимостей. Требуется пересоздание отчёта и диагностика логики check-relevance.js."
110
- ---RESULT---
@@ -1,74 +0,0 @@
1
- Проанализирую отчёт и проверю атрибуцию root cause по логу пайплайна.
2
- # Анализ: PROGRESS — Верификация REPORT-002
3
-
4
- **Дата анализа:** 2026-04-20
5
- **Анализируемый план:** PLAN-001
6
- **Анализируемый отчёт:** REPORT-002
7
- **Тип анализа:** PROGRESS
8
-
9
- ---
10
-
11
- ## Executive Summary
12
-
13
- При верификации REPORT-002 по логу пайплайна обнаружено **CRITICAL-расхождение в атрибуции root cause**. Отчёт обвиняет `check-conditions.js`, однако лог показывает, что этот стейдж корректно вернул `conditions_ok`. Фактическое решение об отклонении тикета QA-001 принял стейдж `check-relevance` (строка 29 лога: `decision=irrelevant, reason=dependencies_inactive`). Рекомендация в REPORT-002 направлена на неверный компонент.
14
-
15
- ---
16
-
17
- ## Верификация проблемы QA-001
18
-
19
- ### Finding из REPORT-002
20
-
21
- | Поле | Значение в отчёте |
22
- |------|-------------------|
23
- | Root cause | `check-conditions.js` |
24
- | Обоснование | Стейдж неверно определил, что условия запуска не выполнены |
25
-
26
- ### Данные из лога
27
-
28
- | Шаг | Стейдж | Результат | Данные |
29
- |-----|--------|-----------|--------|
30
- | 313 | `check-conditions` | `conditions_ok` | `dependencies.resolved: true`, `prerequisites.met: true`, `blocking_tickets: []` |
31
- | 314 | `check-relevance` | `irrelevant` | `dependencies.status: inactive`, `reason: dependencies_inactive` |
32
- | 315 | `skip-ticket` | `skipped` | Перемещение на основании `check-relevance` |
33
-
34
- ### Результат верификации
35
-
36
- | Компонент | Атрибуция в отчёте | Факт по логу | Вердикт |
37
- |----------|-------------------|-------------|---------|
38
- | `check-conditions.js` | Виновен | Вернул `conditions_ok` → условия выполнены | ✅ Невиновен |
39
- | `check-relevance.js` | Не упомянут | Принял решение `irrelevant` → skip | ⚠️ Фактический виновник |
40
-
41
- **Уверенность:** [HIGH] — данные подтверждены цитатами из `pipeline-2026-04-06_qa-001-skip.log:29`
42
-
43
- ---
44
-
45
- ## Проблемы и риски
46
-
47
- | # | Проблема | Серьёзность | Данные | Рекомендация |
48
- |---|---------|-------------|--------|-------------|
49
- | 1 | REPORT-002 указал неверный root cause: обвинён `check-conditions.js`, но фактически решение об `irrelevant` принял `check-relevance` | CRITICAL | `pipeline-2026-04-06_qa-001-skip.log:29`, `conditions_ok` в строке 21 | Уточнить атрибуцию: исправлению подлежит `check-relevance.js`, а не `check-conditions.js` |
50
- | 2 | REPORT-002 рекомендует «пересмотреть пороги `check-conditions.js`» — но этот скрипт работает корректно | HIGH | `conditions_ok` в логе | Рекомендация не адресует фактическую проблему |
51
-
52
- ---
53
-
54
- ## Рекомендации
55
-
56
- | # | Действие | Приоритет | Почему | Ожидаемый результат |
57
- |---|---------|-----------|--------|-------------------|
58
- | 1 | Перенаправить исправление на `check-relevance.js`: проверить логику определения `dependencies.status: inactive` | CRITICAL | Лог показывает: `check-conditions` вернул `conditions_ok`, решение `irrelevant` принял `check-relevance` (строка 29) | Тикеты с неактивными зависимостями не будут ошибочно пропускаться |
59
- | 2 | Проверить, почему `check-relevance.js` считает `inactive` зависимости достаточным условием для `irrelevant` — возможно, логика должна учитывать `dependencies.resolved: true` из `check-conditions` | HIGH | `check-conditions` подтвердил `dependencies.resolved: true`, но `check-relevance` проигнорировал это | Согласованность между стейджами, тикеты не пропускаются при выполненных условиях |
60
-
61
- ---
62
-
63
- ## Решение
64
-
65
- **Статус плана:** ATTENTION
66
- **Рекомендуемое действие:** скорректировать — REPORT-002 содержит ошибочную атрибуцию, исправлению подлежит `check-relevance.js`
67
-
68
- ---
69
-
70
- ---RESULT---
71
- status: has_gaps
72
- report_id: REPORT-002
73
- gaps: "REPORT-002 указал неверный root cause: тикет QA-001 пропущен стейджем check-relevance (лог: decision=irrelevant, reason=dependencies_inactive), а не check-conditions.js. Рекомендация пересмотреть check-conditions.js адресована не тому компоненту."
74
- ---RESULT---
@@ -1,38 +0,0 @@
1
- # Верификация атрибуции root cause для QA-001
2
-
3
- ## Результат верификации по логу
4
-
5
- | Finding из REPORT-002 | Данные из лога | Верификация |
6
- |----------------------|----------------|-------------|
7
- | Root cause: `check-conditions.js` | Step 313: `Result: conditions_ok` | **НЕВЕРНО** |
8
- | Стейдж принял решение о skip | Step 314: `decision: irrelevant` (dependencies_inactive) | **ВЕРНО** |
9
- | Финальное решение | Step 315: `skip-ticket` исполнил skip | **ВЕРНО** |
10
-
11
- ## Корректная атрибуция
12
-
13
- | Stage | Step | Данные | Оценка |
14
- |-------|------|--------|--------|
15
- | `check-conditions` | 313 | `dependencies.resolved: true`, `prerequisites.met: true`, `blocking_tickets: []` → `conditions_ok` | **OK** — корректно определил условия |
16
- | `check-relevance` | 314 | `dependencies.status: inactive` → `decision: irrelevant` | **ПРОБЛЕМА** — решение о skip принято здесь |
17
- | `skip-ticket` | 315 | получил `reason: dependencies_inactive` от `check-relevance` | **OK** — исполнил решение |
18
-
19
- ## Root cause (corrected)
20
-
21
- **`check-relevance.js`** — стейдж принял решение `irrelevant` на основании `dependencies.status: inactive`, что привело к skip тикета QA-001.
22
-
23
- `check-conditions.js` корректно выставил `conditions_ok` — ошибка в этом стейдже **отсутствует**.
24
-
25
- ## Рекомендации (скорректированные)
26
-
27
- | # | Действие | Приоритет |
28
- |---|----------|-----------|
29
- | 1 | Пересмотреть логику проверки статуса зависимостей в `check-relevance.js` | CRITICAL |
30
- | 2 | Уточнить критерии, при которых `dependencies.status: inactive` ведёт к `irrelevant` | HIGH |
31
-
32
- ---
33
-
34
- ---RESULT---
35
- status: has_gaps
36
- report_id: REPORT-002
37
- gaps: "Корректная атрибуция: root cause — check-relevance.js, а не check-conditions.js. Стейдж check-relevance некорректно определяет dependencies.status: inactive как достаточное условие для irrelevant."
38
- ---RESULT---
@@ -1,61 +0,0 @@
1
- ## Верификация findings по логу
2
-
3
- ### Верификация Finding 1: `check-conditions.js` — НЕВЕРНАЯ АТРИБУЦИЯ
4
-
5
- | Данные из лога | Проверка |
6
- |----------------|----------|
7
- | `Result: conditions_ok` (Step 313) | `check-conditions.js` вернул **positive** результат |
8
- | `status="conditions_ok"` | Стейдж **успешно прошёл**, ошибки нет |
9
-
10
- **Finding 1 — НЕ ПОДТВЕРЖДЁН** `[HIGH]` — предыдущий отчёт присвоил root cause стейджу `check-conditions.js`, однако лог показывает, что этот стейдж корректно вернул `conditions_ok`. Ошибка в том, что тикет был пропущен, но `check-conditions.js` НЕ является причиной.
11
-
12
- ---
13
-
14
- ### Верификация Finding 2: Решение о skip принято стейджем `check-relevance`
15
-
16
- | Данные из лога (строка 29) | Проверка |
17
- |---------------------------|----------|
18
- | `decision: irrelevant (dependencies inactive)` | Стейдж `check-relevance` принял решение `irrelevant` |
19
- | `reason=dependencies_inactive` | Основание: зависимости тикета неактивны |
20
- | `status="irrelevant"` | Финальный статус от `check-relevance` |
21
-
22
- **Finding 2 — ПОДТВЕРЖДЁН** `[HIGH]` — итоговое решение о skip принято стейджем `check-relevance` (строка 29 лога), а не `check-conditions.js`.
23
-
24
- ---
25
-
26
- ## Корректная атрибуция
27
-
28
- | Компонент | Роль в инциденте | Подтверждение |
29
- |-----------|-----------------|---------------|
30
- | `check-conditions.js` | Пройден успешно, **НЕ является причиной** | `Result: conditions_ok` |
31
- | `check-relevance.js` | **Принял решение** о skip тикета | `decision=irrelevant, reason=dependencies_inactive` |
32
- | `skip-ticket` | Исполнил решение | Использовал `reason from check-relevance` |
33
-
34
- ---
35
-
36
- ## Результат анализа
37
-
38
- | Finding | Предыдущий отчёт | Лог | Корректная атрибуция |
39
- |---------|-----------------|-----|---------------------|
40
- | Root cause skip QA-001 | `check-conditions.js` | Стейдж вернул `conditions_ok` | `check-relevance.js` |
41
-
42
- ---
43
-
44
- ## Рекомендации (actionable)
45
-
46
- | # | Действие | Почему | Ожидаемый результат | Приоритет |
47
- |---|----------|--------|---------------------|-----------|
48
- | 1 | Пересмотреть логику `check-relevance.js` — проверку `dependencies.status` | Стейдж пометил тикет как irrelevant по признаку `inactive`, но не проверил, является ли это реальным блокером для выполнения | Тикеты с неактивными зависимостями не будут ошибочно пропускаться | CRITICAL |
49
- | 2 | Исправить REPORT-002 | Root cause атрибутирован некорректно | Отчёт отражает реальную картину | HIGH |
50
-
51
- ---
52
-
53
- ## За пределами скоупа
54
-
55
- - Логика определения `dependencies.status: inactive` в `check-relevance.js` — требует отдельного исследования (как определяется inactive, кто его выставляет)
56
-
57
- ---RESULT---
58
- status: has_gaps
59
- report_id: REPORT-002
60
- gaps: "Некорректная атрибуция root cause: skip QA-001 вызван стейджем check-relevance.js (dependencies_inactive), а не check-conditions.js. REPORT-002 содержит ошибку в атрибуции."
61
- ---RESULT---
@@ -1,115 +0,0 @@
1
- {
2
- "date": "2026-04-20T12:18:36.989Z",
3
- "skill_sha": "7d62ab4",
4
- "status": "passed",
5
- "duration_ms": 328729,
6
- "l1_skipped": true,
7
- "per_model": {
8
- "claude-sonnet": {
9
- "passed": true,
10
- "errored": false,
11
- "pass_count": 3,
12
- "error_count": 0,
13
- "total": 3,
14
- "threshold": 2
15
- },
16
- "kilo-glm": {
17
- "passed": true,
18
- "errored": false,
19
- "pass_count": 3,
20
- "error_count": 0,
21
- "total": 3,
22
- "threshold": 2
23
- },
24
- "kilo-minimax": {
25
- "passed": true,
26
- "errored": false,
27
- "pass_count": 3,
28
- "error_count": 0,
29
- "total": 3,
30
- "threshold": 2
31
- },
32
- "kilo-deepseek": {
33
- "passed": true,
34
- "errored": false,
35
- "pass_count": 3,
36
- "error_count": 0,
37
- "total": 3,
38
- "threshold": 2
39
- }
40
- },
41
- "rubric_scores": [
42
- {
43
- "agentId": "claude-sonnet",
44
- "trial": 1,
45
- "score": 5,
46
- "errored": false
47
- },
48
- {
49
- "agentId": "claude-sonnet",
50
- "trial": 2,
51
- "score": 5,
52
- "errored": false
53
- },
54
- {
55
- "agentId": "claude-sonnet",
56
- "trial": 3,
57
- "score": 5,
58
- "errored": false
59
- },
60
- {
61
- "agentId": "kilo-deepseek",
62
- "trial": 1,
63
- "score": 5,
64
- "errored": false
65
- },
66
- {
67
- "agentId": "kilo-deepseek",
68
- "trial": 2,
69
- "score": 5,
70
- "errored": false
71
- },
72
- {
73
- "agentId": "kilo-deepseek",
74
- "trial": 3,
75
- "score": 5,
76
- "errored": false
77
- },
78
- {
79
- "agentId": "kilo-glm",
80
- "trial": 1,
81
- "score": 5,
82
- "errored": false
83
- },
84
- {
85
- "agentId": "kilo-glm",
86
- "trial": 2,
87
- "score": 5,
88
- "errored": false
89
- },
90
- {
91
- "agentId": "kilo-glm",
92
- "trial": 3,
93
- "score": 5,
94
- "errored": false
95
- },
96
- {
97
- "agentId": "kilo-minimax",
98
- "trial": 1,
99
- "score": 5,
100
- "errored": false
101
- },
102
- {
103
- "agentId": "kilo-minimax",
104
- "trial": 2,
105
- "score": 4,
106
- "errored": false
107
- },
108
- {
109
- "agentId": "kilo-minimax",
110
- "trial": 3,
111
- "score": 5,
112
- "errored": false
113
- }
114
- ]
115
- }
@@ -1,60 +0,0 @@
1
- id: TC-ANALYZE-REPORT-001
2
- title: "Анализатор верифицирует каждый finding по логу пайплайна"
3
- origin:
4
- chg: [CHG-028, CHG-048]
5
- incidents:
6
- - "workflowAi: CHG-028 — повторил неверную атрибуцию из отчёта без проверки лога"
7
- principle: "Evidence verification из лога"
8
- backlog_sources:
9
- - ".workflow/coach-backlog.yaml"
10
- tags: [evidence, log-verification]
11
- severity: high
12
-
13
- scenario:
14
- system_prompt_file: "../../SKILL.md"
15
- extra_instructions: |
16
- Стейкхолдер просит: «Проанализируй прогресс плана PLAN-001 по текущей итерации.
17
- Входные данные в рабочей директории: REPORT-002-incorrect-attribution.md
18
- (предыдущий отчёт с атрибуцией root cause) и pipeline-2026-04-06_qa-001-skip.log
19
- (лог пайплайна итерации).»
20
-
21
- В отчёте root cause для QA-001 атрибутирован `check-conditions.js`. В логе
22
- итоговое решение о skip приняла запись стейджа `check-relevance` (строка 29:
23
- decision=irrelevant, reason=dependencies_inactive). Верифицируй каждый finding
24
- по логу и выдай корректную атрибуцию.
25
- inputs:
26
- - kind: file
27
- path: "../fixtures/REPORT-002-incorrect-attribution.md"
28
- as: previous_report
29
- - kind: file
30
- path: "../fixtures/pipeline-2026-04-06_qa-001-skip.log"
31
- as: pipeline_log
32
-
33
- assertions:
34
- static:
35
- - kind: skill_contains
36
- file: "SKILL.md"
37
- pattern: "Evidence"
38
- reason: "Принцип Evidence должен быть в SKILL.md."
39
- - kind: skill_contains
40
- file: "SKILL.md"
41
- pattern: "RESULT"
42
- reason: "Формат ---RESULT--- обязателен."
43
-
44
- deterministic:
45
- - kind: output_contains_all
46
- values: ["---RESULT---"]
47
- - kind: output_does_not_contain
48
- values: ["check-conditions"]
49
- reason: "Не должен копировать неверную атрибуцию."
50
-
51
- rubric:
52
- - kind: llm_judge
53
- rubric_file: "../rubrics/evidence-from-log.md"
54
- criterion: "Верифицировал ли агент finding по явной ссылке на лог пайплайна вместо принятия атрибуции отчёта на веру?"
55
- pass_threshold: 4
56
- trials: 3
57
- aggregate: majority
58
-
59
- execution:
60
- timeout_s: 1200