maestro-flow 0.4.9 → 0.4.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (410) hide show
  1. package/.agents/agents/cli-explore-agent.md +189 -0
  2. package/.agents/agents/conceptual-planning-agent.md +247 -0
  3. package/.agents/agents/impeccable-agent.md +101 -0
  4. package/.agents/agents/team-supervisor.md +145 -0
  5. package/.agents/agents/team-worker.md +239 -0
  6. package/.agents/agents/ui-design-agent.md +289 -0
  7. package/.agents/agents/workflow-analyzer.md +117 -0
  8. package/.agents/agents/workflow-codebase-mapper.md +79 -0
  9. package/.agents/agents/workflow-collab-planner.md +145 -0
  10. package/.agents/agents/workflow-debugger.md +105 -0
  11. package/.agents/agents/workflow-executor.md +134 -0
  12. package/.agents/agents/workflow-external-researcher.md +88 -0
  13. package/.agents/agents/workflow-integration-checker.md +85 -0
  14. package/.agents/agents/workflow-nyquist-auditor.md +87 -0
  15. package/.agents/agents/workflow-phase-researcher.md +87 -0
  16. package/.agents/agents/workflow-plan-checker.md +92 -0
  17. package/.agents/agents/workflow-planner.md +197 -0
  18. package/.agents/agents/workflow-project-researcher.md +76 -0
  19. package/.agents/agents/workflow-research-synthesizer.md +72 -0
  20. package/.agents/agents/workflow-reviewer.md +84 -0
  21. package/.agents/agents/workflow-roadmapper.md +83 -0
  22. package/.agents/agents/workflow-verifier.md +122 -0
  23. package/.agents/skills/codify-to-knowhow/SKILL.md +169 -0
  24. package/.agents/skills/codify-to-knowhow/phases/01-load-manifest.md +101 -0
  25. package/.agents/skills/codify-to-knowhow/phases/02-generate-knowhow.md +97 -0
  26. package/.agents/skills/codify-to-knowhow/phases/03-generate-specs.md +92 -0
  27. package/.agents/skills/codify-to-knowhow/phases/04-index-verify.md +119 -0
  28. package/.agents/skills/learn-decompose/SKILL.md +118 -0
  29. package/.agents/skills/learn-follow/SKILL.md +129 -0
  30. package/.agents/skills/learn-investigate/SKILL.md +154 -0
  31. package/.agents/skills/learn-retro/SKILL.md +159 -0
  32. package/.agents/skills/learn-second-opinion/SKILL.md +124 -0
  33. package/.agents/skills/maestro/SKILL.md +224 -0
  34. package/.agents/skills/maestro-amend/SKILL.md +165 -0
  35. package/.agents/skills/maestro-analyze/SKILL.md +135 -0
  36. package/.agents/skills/maestro-brainstorm/SKILL.md +118 -0
  37. package/.agents/skills/maestro-collab/SKILL.md +174 -0
  38. package/.agents/skills/maestro-composer/SKILL.md +181 -0
  39. package/.agents/skills/maestro-execute/SKILL.md +133 -0
  40. package/.agents/skills/maestro-fork/SKILL.md +88 -0
  41. package/.agents/skills/maestro-guard/SKILL.md +103 -0
  42. package/.agents/skills/maestro-help/SKILL.md +266 -0
  43. package/.agents/skills/maestro-help/index/catalog.json +184 -0
  44. package/.agents/skills/maestro-help/phases/01-parse-intent.md +122 -0
  45. package/.agents/skills/maestro-help/phases/02-search-present.md +181 -0
  46. package/.agents/skills/maestro-help/phases/03-workflow-guide.md +186 -0
  47. package/.agents/skills/maestro-impeccable/SKILL.md +251 -0
  48. package/.agents/skills/maestro-init/SKILL.md +80 -0
  49. package/.agents/skills/maestro-learn/SKILL.md +142 -0
  50. package/.agents/skills/maestro-merge/SKILL.md +66 -0
  51. package/.agents/skills/maestro-milestone-audit/SKILL.md +70 -0
  52. package/.agents/skills/maestro-milestone-complete/SKILL.md +77 -0
  53. package/.agents/skills/maestro-milestone-release/SKILL.md +98 -0
  54. package/.agents/skills/maestro-overlay/SKILL.md +180 -0
  55. package/.agents/skills/maestro-plan/SKILL.md +172 -0
  56. package/.agents/skills/maestro-player/SKILL.md +177 -0
  57. package/.agents/skills/maestro-quick/SKILL.md +67 -0
  58. package/.agents/skills/maestro-ralph/SKILL.md +685 -0
  59. package/.agents/skills/maestro-ralph-execute/SKILL.md +259 -0
  60. package/.agents/skills/maestro-roadmap/SKILL.md +170 -0
  61. package/.agents/skills/maestro-tools-execute/SKILL.md +119 -0
  62. package/.agents/skills/maestro-tools-register/SKILL.md +159 -0
  63. package/.agents/skills/maestro-ui-codify/SKILL.md +82 -0
  64. package/.agents/skills/maestro-update/SKILL.md +178 -0
  65. package/.agents/skills/maestro-verify/SKILL.md +111 -0
  66. package/.agents/skills/manage-codebase-rebuild/SKILL.md +77 -0
  67. package/.agents/skills/manage-codebase-refresh/SKILL.md +59 -0
  68. package/.agents/skills/manage-harvest/SKILL.md +96 -0
  69. package/.agents/skills/manage-issue/SKILL.md +75 -0
  70. package/.agents/skills/manage-issue-discover/SKILL.md +83 -0
  71. package/.agents/skills/manage-knowhow/SKILL.md +79 -0
  72. package/.agents/skills/manage-knowhow-capture/SKILL.md +81 -0
  73. package/.agents/skills/manage-learn/SKILL.md +67 -0
  74. package/.agents/skills/manage-status/SKILL.md +54 -0
  75. package/.agents/skills/manage-wiki/SKILL.md +64 -0
  76. package/.agents/skills/quality-auto-test/SKILL.md +138 -0
  77. package/.agents/skills/quality-debug/SKILL.md +122 -0
  78. package/.agents/skills/quality-refactor/SKILL.md +69 -0
  79. package/.agents/skills/quality-retrospective/SKILL.md +79 -0
  80. package/.agents/skills/quality-review/SKILL.md +130 -0
  81. package/.agents/skills/quality-sync/SKILL.md +53 -0
  82. package/.agents/skills/quality-test/SKILL.md +119 -0
  83. package/.agents/skills/security-audit/SKILL.md +157 -0
  84. package/.agents/skills/skill-iter-tune/SKILL.md +384 -0
  85. package/.agents/skills/skill-iter-tune/phases/01-setup.md +144 -0
  86. package/.agents/skills/skill-iter-tune/phases/02-execute.md +292 -0
  87. package/.agents/skills/skill-iter-tune/phases/03-evaluate.md +312 -0
  88. package/.agents/skills/skill-iter-tune/phases/04-improve.md +186 -0
  89. package/.agents/skills/skill-iter-tune/phases/05-report.md +166 -0
  90. package/.agents/skills/skill-iter-tune/specs/evaluation-criteria.md +63 -0
  91. package/.agents/skills/skill-iter-tune/templates/eval-prompt.md +134 -0
  92. package/.agents/skills/skill-iter-tune/templates/execute-prompt.md +97 -0
  93. package/.agents/skills/spec-add/SKILL.md +70 -0
  94. package/.agents/skills/spec-load/SKILL.md +73 -0
  95. package/.agents/skills/spec-remove/SKILL.md +53 -0
  96. package/.agents/skills/spec-setup/SKILL.md +50 -0
  97. package/.agents/skills/team-coordinate/SKILL.md +268 -0
  98. package/.agents/skills/team-coordinate/roles/coordinator/commands/analyze-task.md +247 -0
  99. package/.agents/skills/team-coordinate/roles/coordinator/commands/dispatch.md +131 -0
  100. package/.agents/skills/team-coordinate/roles/coordinator/commands/monitor.md +358 -0
  101. package/.agents/skills/team-coordinate/roles/coordinator/role.md +365 -0
  102. package/.agents/skills/team-coordinate/specs/knowledge-transfer.md +111 -0
  103. package/.agents/skills/team-coordinate/specs/pipelines.md +97 -0
  104. package/.agents/skills/team-coordinate/specs/quality-gates.md +112 -0
  105. package/.agents/skills/team-coordinate/specs/role-spec-template.md +198 -0
  106. package/.agents/skills/team-executor/SKILL.md +191 -0
  107. package/.agents/skills/team-executor/roles/executor/commands/monitor.md +239 -0
  108. package/.agents/skills/team-executor/roles/executor/role.md +171 -0
  109. package/.agents/skills/team-executor/specs/session-schema.md +264 -0
  110. package/.agents/skills/team-lifecycle-v4/SKILL.md +211 -0
  111. package/.agents/skills/team-lifecycle-v4/roles/analyst/role.md +96 -0
  112. package/.agents/skills/team-lifecycle-v4/roles/coordinator/commands/analyze.md +56 -0
  113. package/.agents/skills/team-lifecycle-v4/roles/coordinator/commands/dispatch.md +56 -0
  114. package/.agents/skills/team-lifecycle-v4/roles/coordinator/commands/monitor.md +206 -0
  115. package/.agents/skills/team-lifecycle-v4/roles/coordinator/role.md +130 -0
  116. package/.agents/skills/team-lifecycle-v4/roles/executor/commands/fix.md +35 -0
  117. package/.agents/skills/team-lifecycle-v4/roles/executor/commands/implement.md +62 -0
  118. package/.agents/skills/team-lifecycle-v4/roles/executor/role.md +69 -0
  119. package/.agents/skills/team-lifecycle-v4/roles/planner/role.md +87 -0
  120. package/.agents/skills/team-lifecycle-v4/roles/reviewer/commands/review-code.md +34 -0
  121. package/.agents/skills/team-lifecycle-v4/roles/reviewer/commands/review-spec.md +44 -0
  122. package/.agents/skills/team-lifecycle-v4/roles/reviewer/role.md +71 -0
  123. package/.agents/skills/team-lifecycle-v4/roles/supervisor/role.md +194 -0
  124. package/.agents/skills/team-lifecycle-v4/roles/tester/role.md +89 -0
  125. package/.agents/skills/team-lifecycle-v4/roles/writer/role.md +97 -0
  126. package/.agents/skills/team-lifecycle-v4/specs/knowledge-transfer.md +114 -0
  127. package/.agents/skills/team-lifecycle-v4/specs/pipelines.md +140 -0
  128. package/.agents/skills/team-lifecycle-v4/specs/quality-gates.md +130 -0
  129. package/.agents/skills/team-lifecycle-v4/templates/architecture.md +254 -0
  130. package/.agents/skills/team-lifecycle-v4/templates/epics.md +196 -0
  131. package/.agents/skills/team-lifecycle-v4/templates/product-brief.md +133 -0
  132. package/.agents/skills/team-lifecycle-v4/templates/requirements.md +224 -0
  133. package/.agents/skills/team-quality-assurance/SKILL.md +149 -0
  134. package/.agents/skills/team-quality-assurance/roles/analyst/role.md +90 -0
  135. package/.agents/skills/team-quality-assurance/roles/coordinator/commands/analyze.md +72 -0
  136. package/.agents/skills/team-quality-assurance/roles/coordinator/commands/dispatch.md +111 -0
  137. package/.agents/skills/team-quality-assurance/roles/coordinator/commands/monitor.md +250 -0
  138. package/.agents/skills/team-quality-assurance/roles/coordinator/role.md +143 -0
  139. package/.agents/skills/team-quality-assurance/roles/executor/role.md +68 -0
  140. package/.agents/skills/team-quality-assurance/roles/generator/role.md +70 -0
  141. package/.agents/skills/team-quality-assurance/roles/scout/role.md +77 -0
  142. package/.agents/skills/team-quality-assurance/roles/strategist/role.md +73 -0
  143. package/.agents/skills/team-quality-assurance/specs/pipelines.md +115 -0
  144. package/.agents/skills/team-quality-assurance/specs/team-config.json +131 -0
  145. package/.agents/skills/team-review/SKILL.md +149 -0
  146. package/.agents/skills/team-review/roles/coordinator/commands/analyze.md +71 -0
  147. package/.agents/skills/team-review/roles/coordinator/commands/dispatch.md +91 -0
  148. package/.agents/skills/team-review/roles/coordinator/commands/monitor.md +224 -0
  149. package/.agents/skills/team-review/roles/coordinator/role.md +132 -0
  150. package/.agents/skills/team-review/roles/fixer/role.md +78 -0
  151. package/.agents/skills/team-review/roles/reviewer/role.md +70 -0
  152. package/.agents/skills/team-review/roles/scanner/role.md +81 -0
  153. package/.agents/skills/team-review/specs/dimensions.md +82 -0
  154. package/.agents/skills/team-review/specs/finding-schema.json +82 -0
  155. package/.agents/skills/team-review/specs/pipelines.md +102 -0
  156. package/.agents/skills/team-review/specs/team-config.json +27 -0
  157. package/.agents/skills/team-tech-debt/SKILL.md +130 -0
  158. package/.agents/skills/team-tech-debt/roles/assessor/role.md +79 -0
  159. package/.agents/skills/team-tech-debt/roles/coordinator/commands/analyze.md +47 -0
  160. package/.agents/skills/team-tech-debt/roles/coordinator/commands/dispatch.md +156 -0
  161. package/.agents/skills/team-tech-debt/roles/coordinator/commands/monitor.md +209 -0
  162. package/.agents/skills/team-tech-debt/roles/coordinator/role.md +123 -0
  163. package/.agents/skills/team-tech-debt/roles/executor/role.md +78 -0
  164. package/.agents/skills/team-tech-debt/roles/planner/role.md +71 -0
  165. package/.agents/skills/team-tech-debt/roles/scanner/role.md +92 -0
  166. package/.agents/skills/team-tech-debt/roles/validator/role.md +80 -0
  167. package/.agents/skills/team-tech-debt/specs/pipelines.md +47 -0
  168. package/.agents/skills/team-tech-debt/specs/team-config.json +129 -0
  169. package/.agents/skills/team-testing/SKILL.md +145 -0
  170. package/.agents/skills/team-testing/roles/analyst/role.md +105 -0
  171. package/.agents/skills/team-testing/roles/coordinator/commands/analyze.md +70 -0
  172. package/.agents/skills/team-testing/roles/coordinator/commands/dispatch.md +108 -0
  173. package/.agents/skills/team-testing/roles/coordinator/commands/monitor.md +257 -0
  174. package/.agents/skills/team-testing/roles/coordinator/role.md +134 -0
  175. package/.agents/skills/team-testing/roles/executor/role.md +101 -0
  176. package/.agents/skills/team-testing/roles/generator/role.md +100 -0
  177. package/.agents/skills/team-testing/roles/strategist/role.md +85 -0
  178. package/.agents/skills/team-testing/specs/pipelines.md +101 -0
  179. package/.agents/skills/team-testing/specs/team-config.json +93 -0
  180. package/.agents/skills/wiki-connect/SKILL.md +64 -0
  181. package/.agents/skills/wiki-digest/SKILL.md +70 -0
  182. package/.agents/skills/workflow-skill-designer/SKILL.md +498 -0
  183. package/.agents/skills/workflow-skill-designer/phases/01-requirements-analysis.md +356 -0
  184. package/.agents/skills/workflow-skill-designer/phases/02-orchestrator-design.md +444 -0
  185. package/.agents/skills/workflow-skill-designer/phases/03-phase-design.md +458 -0
  186. package/.agents/skills/workflow-skill-designer/phases/04-validation.md +471 -0
  187. package/.agy/agents/cli-explore-agent.md +186 -0
  188. package/.agy/agents/conceptual-planning-agent.md +244 -0
  189. package/.agy/agents/impeccable-agent.md +97 -0
  190. package/.agy/agents/team-supervisor.md +142 -0
  191. package/.agy/agents/team-worker.md +236 -0
  192. package/.agy/agents/ui-design-agent.md +286 -0
  193. package/.agy/agents/workflow-analyzer.md +114 -0
  194. package/.agy/agents/workflow-codebase-mapper.md +76 -0
  195. package/.agy/agents/workflow-collab-planner.md +142 -0
  196. package/.agy/agents/workflow-debugger.md +102 -0
  197. package/.agy/agents/workflow-executor.md +131 -0
  198. package/.agy/agents/workflow-external-researcher.md +86 -0
  199. package/.agy/agents/workflow-integration-checker.md +82 -0
  200. package/.agy/agents/workflow-nyquist-auditor.md +84 -0
  201. package/.agy/agents/workflow-phase-researcher.md +84 -0
  202. package/.agy/agents/workflow-plan-checker.md +89 -0
  203. package/.agy/agents/workflow-planner.md +194 -0
  204. package/.agy/agents/workflow-project-researcher.md +73 -0
  205. package/.agy/agents/workflow-research-synthesizer.md +70 -0
  206. package/.agy/agents/workflow-reviewer.md +81 -0
  207. package/.agy/agents/workflow-roadmapper.md +81 -0
  208. package/.agy/agents/workflow-verifier.md +119 -0
  209. package/.agy/skills/codify-to-knowhow/SKILL.md +172 -0
  210. package/.agy/skills/codify-to-knowhow/phases/01-load-manifest.md +101 -0
  211. package/.agy/skills/codify-to-knowhow/phases/02-generate-knowhow.md +97 -0
  212. package/.agy/skills/codify-to-knowhow/phases/03-generate-specs.md +92 -0
  213. package/.agy/skills/codify-to-knowhow/phases/04-index-verify.md +119 -0
  214. package/.agy/skills/learn-decompose/SKILL.md +118 -0
  215. package/.agy/skills/learn-follow/SKILL.md +129 -0
  216. package/.agy/skills/learn-investigate/SKILL.md +154 -0
  217. package/.agy/skills/learn-retro/SKILL.md +159 -0
  218. package/.agy/skills/learn-second-opinion/SKILL.md +124 -0
  219. package/.agy/skills/maestro/SKILL.md +223 -0
  220. package/.agy/skills/maestro-amend/SKILL.md +162 -0
  221. package/.agy/skills/maestro-analyze/SKILL.md +135 -0
  222. package/.agy/skills/maestro-brainstorm/SKILL.md +118 -0
  223. package/.agy/skills/maestro-collab/SKILL.md +174 -0
  224. package/.agy/skills/maestro-composer/SKILL.md +180 -0
  225. package/.agy/skills/maestro-execute/SKILL.md +133 -0
  226. package/.agy/skills/maestro-fork/SKILL.md +88 -0
  227. package/.agy/skills/maestro-guard/SKILL.md +101 -0
  228. package/.agy/skills/maestro-help/SKILL.md +267 -0
  229. package/.agy/skills/maestro-help/index/catalog.json +184 -0
  230. package/.agy/skills/maestro-help/phases/01-parse-intent.md +122 -0
  231. package/.agy/skills/maestro-help/phases/02-search-present.md +181 -0
  232. package/.agy/skills/maestro-help/phases/03-workflow-guide.md +186 -0
  233. package/.agy/skills/maestro-impeccable/SKILL.md +250 -0
  234. package/.agy/skills/maestro-init/SKILL.md +80 -0
  235. package/.agy/skills/maestro-learn/SKILL.md +142 -0
  236. package/.agy/skills/maestro-merge/SKILL.md +66 -0
  237. package/.agy/skills/maestro-milestone-audit/SKILL.md +70 -0
  238. package/.agy/skills/maestro-milestone-complete/SKILL.md +77 -0
  239. package/.agy/skills/maestro-milestone-release/SKILL.md +98 -0
  240. package/.agy/skills/maestro-overlay/SKILL.md +177 -0
  241. package/.agy/skills/maestro-plan/SKILL.md +172 -0
  242. package/.agy/skills/maestro-player/SKILL.md +176 -0
  243. package/.agy/skills/maestro-quick/SKILL.md +67 -0
  244. package/.agy/skills/maestro-ralph/SKILL.md +681 -0
  245. package/.agy/skills/maestro-ralph-execute/SKILL.md +255 -0
  246. package/.agy/skills/maestro-roadmap/SKILL.md +170 -0
  247. package/.agy/skills/maestro-tools-execute/SKILL.md +119 -0
  248. package/.agy/skills/maestro-tools-register/SKILL.md +159 -0
  249. package/.agy/skills/maestro-ui-codify/SKILL.md +81 -0
  250. package/.agy/skills/maestro-update/SKILL.md +175 -0
  251. package/.agy/skills/maestro-verify/SKILL.md +111 -0
  252. package/.agy/skills/manage-codebase-rebuild/SKILL.md +77 -0
  253. package/.agy/skills/manage-codebase-refresh/SKILL.md +59 -0
  254. package/.agy/skills/manage-harvest/SKILL.md +96 -0
  255. package/.agy/skills/manage-issue/SKILL.md +72 -0
  256. package/.agy/skills/manage-issue-discover/SKILL.md +83 -0
  257. package/.agy/skills/manage-knowhow/SKILL.md +76 -0
  258. package/.agy/skills/manage-knowhow-capture/SKILL.md +78 -0
  259. package/.agy/skills/manage-learn/SKILL.md +64 -0
  260. package/.agy/skills/manage-status/SKILL.md +51 -0
  261. package/.agy/skills/manage-wiki/SKILL.md +61 -0
  262. package/.agy/skills/quality-auto-test/SKILL.md +135 -0
  263. package/.agy/skills/quality-debug/SKILL.md +122 -0
  264. package/.agy/skills/quality-refactor/SKILL.md +69 -0
  265. package/.agy/skills/quality-retrospective/SKILL.md +79 -0
  266. package/.agy/skills/quality-review/SKILL.md +130 -0
  267. package/.agy/skills/quality-sync/SKILL.md +53 -0
  268. package/.agy/skills/quality-test/SKILL.md +119 -0
  269. package/.agy/skills/security-audit/SKILL.md +157 -0
  270. package/.agy/skills/skill-iter-tune/SKILL.md +381 -0
  271. package/.agy/skills/skill-iter-tune/phases/01-setup.md +144 -0
  272. package/.agy/skills/skill-iter-tune/phases/02-execute.md +292 -0
  273. package/.agy/skills/skill-iter-tune/phases/03-evaluate.md +312 -0
  274. package/.agy/skills/skill-iter-tune/phases/04-improve.md +198 -0
  275. package/.agy/skills/skill-iter-tune/phases/05-report.md +166 -0
  276. package/.agy/skills/skill-iter-tune/specs/evaluation-criteria.md +63 -0
  277. package/.agy/skills/skill-iter-tune/templates/eval-prompt.md +134 -0
  278. package/.agy/skills/skill-iter-tune/templates/execute-prompt.md +97 -0
  279. package/.agy/skills/spec-add/SKILL.md +67 -0
  280. package/.agy/skills/spec-load/SKILL.md +70 -0
  281. package/.agy/skills/spec-remove/SKILL.md +50 -0
  282. package/.agy/skills/spec-setup/SKILL.md +47 -0
  283. package/.agy/skills/team-coordinate/SKILL.md +267 -0
  284. package/.agy/skills/team-coordinate/roles/coordinator/commands/analyze-task.md +247 -0
  285. package/.agy/skills/team-coordinate/roles/coordinator/commands/dispatch.md +131 -0
  286. package/.agy/skills/team-coordinate/roles/coordinator/commands/monitor.md +348 -0
  287. package/.agy/skills/team-coordinate/roles/coordinator/role.md +362 -0
  288. package/.agy/skills/team-coordinate/specs/knowledge-transfer.md +111 -0
  289. package/.agy/skills/team-coordinate/specs/pipelines.md +97 -0
  290. package/.agy/skills/team-coordinate/specs/quality-gates.md +112 -0
  291. package/.agy/skills/team-coordinate/specs/role-spec-template.md +198 -0
  292. package/.agy/skills/team-executor/SKILL.md +180 -0
  293. package/.agy/skills/team-executor/roles/executor/commands/monitor.md +235 -0
  294. package/.agy/skills/team-executor/roles/executor/role.md +171 -0
  295. package/.agy/skills/team-executor/specs/session-schema.md +264 -0
  296. package/.agy/skills/team-lifecycle-v4/SKILL.md +189 -0
  297. package/.agy/skills/team-lifecycle-v4/roles/analyst/role.md +92 -0
  298. package/.agy/skills/team-lifecycle-v4/roles/coordinator/commands/analyze.md +56 -0
  299. package/.agy/skills/team-lifecycle-v4/roles/coordinator/commands/dispatch.md +56 -0
  300. package/.agy/skills/team-lifecycle-v4/roles/coordinator/commands/monitor.md +206 -0
  301. package/.agy/skills/team-lifecycle-v4/roles/coordinator/role.md +130 -0
  302. package/.agy/skills/team-lifecycle-v4/roles/executor/commands/fix.md +35 -0
  303. package/.agy/skills/team-lifecycle-v4/roles/executor/commands/implement.md +62 -0
  304. package/.agy/skills/team-lifecycle-v4/roles/executor/role.md +64 -0
  305. package/.agy/skills/team-lifecycle-v4/roles/planner/role.md +82 -0
  306. package/.agy/skills/team-lifecycle-v4/roles/reviewer/commands/review-code.md +34 -0
  307. package/.agy/skills/team-lifecycle-v4/roles/reviewer/commands/review-spec.md +44 -0
  308. package/.agy/skills/team-lifecycle-v4/roles/reviewer/role.md +65 -0
  309. package/.agy/skills/team-lifecycle-v4/roles/supervisor/role.md +188 -0
  310. package/.agy/skills/team-lifecycle-v4/roles/tester/role.md +84 -0
  311. package/.agy/skills/team-lifecycle-v4/roles/writer/role.md +92 -0
  312. package/.agy/skills/team-lifecycle-v4/specs/knowledge-transfer.md +114 -0
  313. package/.agy/skills/team-lifecycle-v4/specs/pipelines.md +140 -0
  314. package/.agy/skills/team-lifecycle-v4/specs/quality-gates.md +130 -0
  315. package/.agy/skills/team-lifecycle-v4/templates/architecture.md +254 -0
  316. package/.agy/skills/team-lifecycle-v4/templates/epics.md +196 -0
  317. package/.agy/skills/team-lifecycle-v4/templates/product-brief.md +133 -0
  318. package/.agy/skills/team-lifecycle-v4/templates/requirements.md +224 -0
  319. package/.agy/skills/team-quality-assurance/SKILL.md +148 -0
  320. package/.agy/skills/team-quality-assurance/roles/analyst/role.md +85 -0
  321. package/.agy/skills/team-quality-assurance/roles/coordinator/commands/analyze.md +72 -0
  322. package/.agy/skills/team-quality-assurance/roles/coordinator/commands/dispatch.md +111 -0
  323. package/.agy/skills/team-quality-assurance/roles/coordinator/commands/monitor.md +235 -0
  324. package/.agy/skills/team-quality-assurance/roles/coordinator/role.md +143 -0
  325. package/.agy/skills/team-quality-assurance/roles/executor/role.md +62 -0
  326. package/.agy/skills/team-quality-assurance/roles/generator/role.md +65 -0
  327. package/.agy/skills/team-quality-assurance/roles/scout/role.md +72 -0
  328. package/.agy/skills/team-quality-assurance/roles/strategist/role.md +69 -0
  329. package/.agy/skills/team-quality-assurance/specs/pipelines.md +115 -0
  330. package/.agy/skills/team-quality-assurance/specs/team-config.json +131 -0
  331. package/.agy/skills/team-review/SKILL.md +149 -0
  332. package/.agy/skills/team-review/roles/coordinator/commands/analyze.md +71 -0
  333. package/.agy/skills/team-review/roles/coordinator/commands/dispatch.md +91 -0
  334. package/.agy/skills/team-review/roles/coordinator/commands/monitor.md +209 -0
  335. package/.agy/skills/team-review/roles/coordinator/role.md +132 -0
  336. package/.agy/skills/team-review/roles/fixer/role.md +74 -0
  337. package/.agy/skills/team-review/roles/reviewer/role.md +66 -0
  338. package/.agy/skills/team-review/roles/scanner/role.md +77 -0
  339. package/.agy/skills/team-review/specs/dimensions.md +82 -0
  340. package/.agy/skills/team-review/specs/finding-schema.json +82 -0
  341. package/.agy/skills/team-review/specs/pipelines.md +102 -0
  342. package/.agy/skills/team-review/specs/team-config.json +27 -0
  343. package/.agy/skills/team-tech-debt/SKILL.md +133 -0
  344. package/.agy/skills/team-tech-debt/roles/assessor/role.md +76 -0
  345. package/.agy/skills/team-tech-debt/roles/coordinator/commands/analyze.md +47 -0
  346. package/.agy/skills/team-tech-debt/roles/coordinator/commands/dispatch.md +156 -0
  347. package/.agy/skills/team-tech-debt/roles/coordinator/commands/monitor.md +198 -0
  348. package/.agy/skills/team-tech-debt/roles/coordinator/role.md +123 -0
  349. package/.agy/skills/team-tech-debt/roles/executor/role.md +76 -0
  350. package/.agy/skills/team-tech-debt/roles/planner/role.md +68 -0
  351. package/.agy/skills/team-tech-debt/roles/scanner/role.md +90 -0
  352. package/.agy/skills/team-tech-debt/roles/validator/role.md +78 -0
  353. package/.agy/skills/team-tech-debt/specs/pipelines.md +47 -0
  354. package/.agy/skills/team-tech-debt/specs/team-config.json +129 -0
  355. package/.agy/skills/team-testing/SKILL.md +144 -0
  356. package/.agy/skills/team-testing/roles/analyst/role.md +101 -0
  357. package/.agy/skills/team-testing/roles/coordinator/commands/analyze.md +70 -0
  358. package/.agy/skills/team-testing/roles/coordinator/commands/dispatch.md +108 -0
  359. package/.agy/skills/team-testing/roles/coordinator/commands/monitor.md +242 -0
  360. package/.agy/skills/team-testing/roles/coordinator/role.md +134 -0
  361. package/.agy/skills/team-testing/roles/executor/role.md +95 -0
  362. package/.agy/skills/team-testing/roles/generator/role.md +95 -0
  363. package/.agy/skills/team-testing/roles/strategist/role.md +81 -0
  364. package/.agy/skills/team-testing/specs/pipelines.md +101 -0
  365. package/.agy/skills/team-testing/specs/team-config.json +93 -0
  366. package/.agy/skills/wiki-connect/SKILL.md +64 -0
  367. package/.agy/skills/wiki-digest/SKILL.md +70 -0
  368. package/.agy/skills/workflow-skill-designer/SKILL.md +506 -0
  369. package/.agy/skills/workflow-skill-designer/phases/01-requirements-analysis.md +356 -0
  370. package/.agy/skills/workflow-skill-designer/phases/02-orchestrator-design.md +444 -0
  371. package/.agy/skills/workflow-skill-designer/phases/03-phase-design.md +458 -0
  372. package/.agy/skills/workflow-skill-designer/phases/04-validation.md +471 -0
  373. package/.claude/commands/maestro-ralph.md +222 -87
  374. package/.claude/commands/maestro.md +13 -11
  375. package/.codex/skills/maestro/SKILL.md +23 -17
  376. package/.codex/skills/maestro-ralph/SKILL.md +177 -67
  377. package/dist/src/commands/install-backend.d.ts +12 -0
  378. package/dist/src/commands/install-backend.d.ts.map +1 -1
  379. package/dist/src/commands/install-backend.js +144 -0
  380. package/dist/src/commands/install-backend.js.map +1 -1
  381. package/dist/src/core/component-defs.d.ts +6 -0
  382. package/dist/src/core/component-defs.d.ts.map +1 -1
  383. package/dist/src/core/component-defs.js +97 -0
  384. package/dist/src/core/component-defs.js.map +1 -1
  385. package/dist/src/tui/install-ui/ExtraMcpConfig.d.ts +11 -0
  386. package/dist/src/tui/install-ui/ExtraMcpConfig.d.ts.map +1 -0
  387. package/dist/src/tui/install-ui/ExtraMcpConfig.js +61 -0
  388. package/dist/src/tui/install-ui/ExtraMcpConfig.js.map +1 -0
  389. package/dist/src/tui/install-ui/InstallConfirm.d.ts +3 -0
  390. package/dist/src/tui/install-ui/InstallConfirm.d.ts.map +1 -1
  391. package/dist/src/tui/install-ui/InstallConfirm.js +1 -1
  392. package/dist/src/tui/install-ui/InstallConfirm.js.map +1 -1
  393. package/dist/src/tui/install-ui/InstallExecution.d.ts +2 -0
  394. package/dist/src/tui/install-ui/InstallExecution.d.ts.map +1 -1
  395. package/dist/src/tui/install-ui/InstallExecution.js +14 -2
  396. package/dist/src/tui/install-ui/InstallExecution.js.map +1 -1
  397. package/dist/src/tui/install-ui/InstallFlow.d.ts +1 -1
  398. package/dist/src/tui/install-ui/InstallFlow.d.ts.map +1 -1
  399. package/dist/src/tui/install-ui/InstallFlow.js +16 -3
  400. package/dist/src/tui/install-ui/InstallFlow.js.map +1 -1
  401. package/dist/src/tui/install-ui/InstallHub.d.ts +2 -0
  402. package/dist/src/tui/install-ui/InstallHub.d.ts.map +1 -1
  403. package/dist/src/tui/install-ui/InstallHub.js +8 -0
  404. package/dist/src/tui/install-ui/InstallHub.js.map +1 -1
  405. package/dist/src/tui/install-ui/InstallResult.d.ts.map +1 -1
  406. package/dist/src/tui/install-ui/InstallResult.js +3 -1
  407. package/dist/src/tui/install-ui/InstallResult.js.map +1 -1
  408. package/dist/src/utils/update-notices.js +19 -0
  409. package/dist/src/utils/update-notices.js.map +1 -1
  410. package/package.json +7 -2
@@ -0,0 +1,119 @@
1
+ ---
2
+ name: quality-test
3
+ description: Use when implementation needs user acceptance testing with interactive verification and gap closure
4
+ argument-hint: [phase] [--smoke] [--auto-fix]
5
+ allowed-tools:
6
+ - ask_question
7
+ - define_subagent
8
+ - grep_search
9
+ - invoke_subagent
10
+ - manage_subagents
11
+ - replace_file_content
12
+ - run_command
13
+ - send_message
14
+ - view_file
15
+ - write_to_file
16
+ ---
17
+ <purpose>
18
+ Run UAT-style conversational testing for a completed phase. Designs test scenarios from verification criteria, walks through each scenario interactively one at a time with plain text responses, and records pass/fail results with severity inference.
19
+
20
+ When issues are found, spawns parallel debug agents (one per gap cluster) to diagnose root causes, then optionally triggers the gap-fix loop (plan --gaps -> execute -> re-verify) to auto-close gaps.
21
+
22
+ Key mechanisms from GSD verify-work:
23
+ - **Session persistence**: uat.md survives context resets, resume from any point
24
+ - **Severity inference**: Natural language -> blocker/major/minor/cosmetic (never ask)
25
+ - **Cold-start smoke tests**: --smoke flag injects basic sanity tests before UAT
26
+ - **Parallel auto-diagnosis**: Spawn debug agents per gap cluster with pre-filled symptoms
27
+ - **Gap-plan closure loop**: --auto-fix triggers verify -> plan --gaps -> execute -> re-verify
28
+ </purpose>
29
+
30
+ <required_reading>
31
+ @~/.maestro/workflows/test.md
32
+ </required_reading>
33
+
34
+ <context>
35
+ Phase or task: $ARGUMENTS (optional)
36
+
37
+ Flags, artifact context resolution, and the output directory format are defined in the workflow file test.md.
38
+ </context>
39
+
40
+ <execution>
41
+ Follow '~/.maestro/workflows/test.md' completely.
42
+
43
+ **Command-specific extensions (not in workflow):**
44
+
45
+ **Knowledge context loading** (before test design):
46
+ - Wiki search: `maestro wiki search "<phase/feature keywords>" --json` → prior test strategies, recipes, decisions
47
+ - Role knowledge: `maestro wiki list --category test` → select relevant → `maestro wiki load <id>`
48
+ - Specs + tools: `maestro spec load --category test` → test conventions + discoverable knowhow tools
49
+
50
+ **Test tool discovery** (knowhow tools as scenario source):
51
+ - Load registered test tools: `maestro spec load --category test --keyword <feature>`
52
+ - If tools found, extract their steps as additional test scenarios marked `source: "tool"`
53
+ - Each numbered step in a tool becomes a UAT test with its assertion as `expected` behavior
54
+
55
+ **Review findings integration** (from related review artifacts):
56
+ - Extract critical/high findings as additional test scenarios, marked `source: "review_finding"`
57
+ - When review verdict is "BLOCK" and review-finding tests fail, auto-enter gap-fix loop
58
+
59
+ **Debug root cause integration** (from related debug artifacts):
60
+ - Generate regression test scenarios from confirmed root causes, marked `source: "debug_root_cause"`
61
+
62
+ **Register artifact on completion:**
63
+ ```
64
+ Append to state.json.artifacts[]:
65
+ {
66
+ id: nextArtifactId(artifacts, "test"), // TST-001
67
+ type: "test",
68
+ milestone: current_milestone,
69
+ phase: target_phase,
70
+ scope: "phase",
71
+ path: "scratch/{YYYYMMDD}-test-P{N}-{slug}",
72
+ status: issues == 0 ? "completed" : "failed",
73
+ depends_on: exec_art.id,
74
+ harvested: false,
75
+ created_at: start_time,
76
+ completed_at: now()
77
+ }
78
+ ```
79
+
80
+ **Next-step routing on completion:**
81
+ - All tests pass → `/maestro-milestone-audit`
82
+ - Issues found, --auto-fix ran and succeeded → `/maestro-verify {phase}`
83
+ - Issues found, --auto-fix ran but gaps remain → `/quality-debug --from-uat {phase}`
84
+ - Issues found, manual fix needed → `/quality-debug --from-uat {phase}`
85
+ - Coverage below threshold → `/quality-auto-test {phase}`
86
+ - Need integration tests → `/quality-auto-test {phase}`
87
+ </execution>
88
+
89
+ <error_codes>
90
+ | Code | Severity | Condition | Recovery |
91
+ |------|----------|-----------|----------|
92
+ | E001 | error | Phase or task target required (no active sessions) | Prompt user for phase number |
93
+ | E002 | error | Phase not verified yet (no verification.json) | Suggest `/maestro-verify` first |
94
+ | E003 | error | Smoke test failed (app won't start) | Suggest `/quality-debug` |
95
+ | W001 | warning | One or more test scenarios failed | Auto-diagnose, suggest fix options |
96
+ | W002 | warning | Coverage below threshold | Suggest `/quality-auto-test` |
97
+ </error_codes>
98
+
99
+ <success_criteria>
100
+ - [ ] Target resolved (phase or scratch task)
101
+ - [ ] Active sessions checked, resume offered if applicable
102
+ - [ ] Smoke tests run if --smoke flag set
103
+ - [ ] test-plan.json generated with categorized tests mapped to requirements
104
+ - [ ] uat.md created/resumed with all tests
105
+ - [ ] Tests presented one at a time with expected behavior
106
+ - [ ] User responses processed as pass/issue/skip
107
+ - [ ] Severity inferred from natural language (never asked)
108
+ - [ ] Batched writes: on issue, every 5 passes, or completion
109
+ - [ ] test-results.json and coverage-report.json written
110
+ - [ ] UAT confidence scored with 4-dimension factor model
111
+ - [ ] Readiness gate checked before final report
112
+ - [ ] Pressure pass completed if > 80% pass rate
113
+ - [ ] Confidence summary appended to uat.md
114
+ - [ ] index.json uat fields updated
115
+ - [ ] If issues: parallel debug agents spawned per gap cluster
116
+ - [ ] Gaps updated with root_cause, fix_direction, affected_files
117
+ - [ ] Gap-fix loop triggered if --auto-fix (max 2 iterations)
118
+ - [ ] Next step routed (`/maestro-milestone-audit` if all tests pass, `/maestro-verify` if auto-fix succeeded, `/quality-debug --from-uat` if issues remain, `/quality-auto-test` if coverage is low)
119
+ </success_criteria>
@@ -0,0 +1,157 @@
1
+ ---
2
+ name: security-audit
3
+ description: OWASP Top 10 and STRIDE security auditing with supply chain analysis
4
+ argument-hint: [quick|standard|deep] [--scope <path>]
5
+ allowed-tools:
6
+ - ask_question
7
+ - define_subagent
8
+ - grep_search
9
+ - invoke_subagent
10
+ - manage_subagents
11
+ - run_command
12
+ - send_message
13
+ - view_file
14
+ - write_to_file
15
+ ---
16
+ <purpose>
17
+ Systematic security audit covering OWASP Top 10, dependency supply chain, secrets detection,
18
+ CI/CD pipeline review, and optional STRIDE threat modeling. Three tiers control depth vs speed.
19
+ </purpose>
20
+
21
+ <context>
22
+ $ARGUMENTS — Parse tier and scope:
23
+ - Tier: `quick` (default) | `standard` | `deep`
24
+ - `--scope <path>`: Limit scan to directory (default: project root)
25
+
26
+ **Tier coverage:**
27
+
28
+ | Tier | OWASP | Dependencies | Secrets | CI/CD | STRIDE | Git History |
29
+ |------|-------|-------------|---------|-------|--------|-------------|
30
+ | quick | ✓ | ✓ | — | — | — | — |
31
+ | standard | ✓ | ✓ | ✓ | ✓ | — | — |
32
+ | deep | ✓ | ✓ | ✓ | ✓ | ✓ | ✓ |
33
+ </context>
34
+
35
+ <execution>
36
+
37
+ **Phase 1: Reconnaissance**
38
+
39
+ 1. Detect tech stack from package.json / go.mod / requirements.txt / Cargo.toml
40
+ 2. Identify entry points: HTTP handlers, API routes, CLI parsers, WebSocket handlers
41
+ 3. List authentication/authorization modules
42
+ 4. Map data flow: user input → processing → storage → output
43
+
44
+ **Phase 2: OWASP Top 10 Scan** (all tiers)
45
+
46
+ For each category, scan relevant source files:
47
+
48
+ | # | Category | What to check |
49
+ |---|----------|--------------|
50
+ | A01 | Broken Access Control | Missing auth middleware, direct object references, path traversal |
51
+ | A02 | Cryptographic Failures | Weak algorithms, hardcoded keys, missing TLS, plaintext storage |
52
+ | A03 | Injection | SQL concatenation, shell exec with user input, template injection |
53
+ | A04 | Insecure Design | Missing rate limits, no CSRF tokens, predictable tokens |
54
+ | A05 | Security Misconfiguration | Debug mode, default credentials, verbose errors, open CORS |
55
+ | A06 | Vulnerable Components | Known CVEs in dependencies |
56
+ | A07 | Auth Failures | Weak password rules, missing brute-force protection, session fixation |
57
+ | A08 | Data Integrity | Deserialization of untrusted data, unsigned updates |
58
+ | A09 | Logging Failures | Missing audit logs, logging sensitive data |
59
+ | A10 | SSRF | Unvalidated URLs in server-side requests |
60
+
61
+ Use `grep_search` for pattern matching (e.g., `eval(`, `exec(`, `innerHTML`, `dangerouslySetInnerHTML`,
62
+ `sql.*\+.*req\.`, `process\.env` without validation).
63
+
64
+ **Phase 3: Dependency Audit** (all tiers)
65
+
66
+ ```bash
67
+ # Node.js
68
+ npm audit --json 2>/dev/null || true
69
+ # Check lockfile integrity
70
+ test -f package-lock.json && echo "lockfile present" || echo "WARNING: no lockfile"
71
+ ```
72
+
73
+ Check for:
74
+ - Known vulnerabilities (CVE references)
75
+ - Lockfile presence and integrity
76
+ - Typosquatting risk on critical dependencies (manually check suspicious names)
77
+
78
+ **Phase 4: Secrets Detection** (standard + deep)
79
+
80
+ ```bash
81
+ # Current codebase
82
+ grep -rn --include="*.ts" --include="*.js" --include="*.json" --include="*.env*" \
83
+ -E "(password|secret|api.?key|token|credential).*=.*['\"][^'\"]{8,}" . || true
84
+ ```
85
+
86
+ Check `.env.example` for leaked values. Check `.gitignore` for missing `.env` patterns.
87
+
88
+ **Phase 5: CI/CD Audit** (standard + deep)
89
+
90
+ Scan `.github/workflows/*.yml` for:
91
+ - Overly permissive `permissions:` (write-all, contents: write)
92
+ - Unpinned action versions (`uses: actions/checkout@main` vs `@v4.1.0`)
93
+ - Secrets in logs (derived or dynamic secret values echoed without the `::add-mask::` workflow command)
94
+ - Pull request trigger with `pull_request_target` (code injection risk)
95
+
96
+ **Phase 6: STRIDE Threat Modeling** (deep only)
97
+
98
+ For each critical module identified in Phase 1:
99
+
100
+ | Threat | Question |
101
+ |--------|----------|
102
+ | **S**poofing | Can identity be faked? Is auth per-request? |
103
+ | **T**ampering | Can data be modified in transit/storage? Integrity checks? |
104
+ | **R**epudiation | Are actions logged with user identity? |
105
+ | **I**nformation Disclosure | Can unauthorized data be accessed? |
106
+ | **D**enial of Service | Resource limits? Rate limiting? |
107
+ | **E**levation of Privilege | Can roles be escalated? Input validation on role fields? |
108
+
109
+ **Phase 7: Git History Archaeology** (deep only)
110
+
111
+ ```bash
112
+ # Search for previously committed secrets
113
+ git log --all --diff-filter=D --name-only --pretty=format: -- "*.env" "*.key" "*.pem" 2>/dev/null | head -20
114
+ git log -p --all -S "password" --since="1 year ago" -- "*.ts" "*.js" 2>/dev/null | head -50
115
+ ```
116
+
117
+ **Phase 8: Report**
118
+
119
+ Output severity matrix:
120
+
121
+ ```
122
+ === Security Audit ({tier}) ===
123
+
124
+ CRITICAL ({count}):
125
+ - [A03] SQL injection in {file}:{line} — {description}
126
+ Fix: {remediation}
127
+
128
+ HIGH ({count}):
129
+ ...
130
+
131
+ MEDIUM ({count}):
132
+ ...
133
+
134
+ LOW ({count}):
135
+ ...
136
+
137
+ Summary: {total} findings ({critical} critical, {high} high, {medium} medium, {low} low)
138
+ ```
139
+
140
+ Emit completion status:
141
+ ```
142
+ --- COMPLETION STATUS ---
143
+ STATUS: DONE|DONE_WITH_CONCERNS
144
+ CONCERNS: {count} critical findings require immediate action
145
+ NEXT: /quality-review
146
+ --- END STATUS ---
147
+ ```
148
+ </execution>
149
+
150
+ <success_criteria>
151
+ - [ ] Tech stack identified and entry points mapped
152
+ - [ ] OWASP Top 10 categories all checked (tier-appropriate)
153
+ - [ ] Dependency audit completed with CVE listing
154
+ - [ ] Severity matrix produced with file:line references
155
+ - [ ] Each finding includes remediation suggestion
156
+ - [ ] Completion status block emitted
157
+ </success_criteria>
@@ -0,0 +1,381 @@
1
+ ---
2
+ name: skill-iter-tune
3
+ description: Iterative skill tuning via execute-evaluate-improve feedback loop. Uses ccw cli Claude to execute skill, Gemini to evaluate quality, and Agent to apply improvements. Iterates until quality threshold or max iterations. Triggers on "skill iter tune", "iterative skill tuning", "tune skill".
4
+ ---
5
+
6
+ # Skill Iter Tune
7
+
8
+ Iterative skill refinement through execute-evaluate-improve feedback loops. Each iteration runs the skill via Claude, evaluates output via Gemini, and applies improvements via Agent.
9
+
10
+ ## Architecture Overview
11
+
12
+ ```
13
+ ┌──────────────────────────────────────────────────────────────────────────┐
14
+ │ Skill Iter Tune Orchestrator (SKILL.md) │
15
+ │ → Parse input → Setup workspace → Iteration Loop → Final Report │
16
+ └────────────────────────────┬─────────────────────────────────────────────┘
17
+
18
+ ┌───────────────────┼───────────────────────────────────┐
19
+ ↓ ↓ ↓
20
+ ┌──────────┐ ┌─────────────────────────────┐ ┌──────────┐
21
+ │ Phase 1 │ │ Iteration Loop (2→3→4) │ │ Phase 5 │
22
+ │ Setup │ │ ┌─────┐ ┌─────┐ ┌─────┐ │ │ Report │
23
+ │ │─────→│ │ P2 │→ │ P3 │→ │ P4 │ │────→│ │
24
+ │ Backup + │ │ │Exec │ │Eval │ │Impr │ │ │ History │
25
+ │ Init │ │ └─────┘ └─────┘ └─────┘ │ │ Summary │
26
+ └──────────┘ │ ↑ │ │ └──────────┘
27
+ │ └───────────────┘ │
28
+ │ (if score < threshold │
29
+ │ AND iter < max) │
30
+ └─────────────────────────────┘
31
+ ```
32
+
33
+ ### Chain Mode Extension
34
+
35
+ ```
36
+ Chain Mode (execution_mode === "chain"):
37
+
38
+ Phase 2 runs per-skill in chain_order:
39
+ Skill A → ccw cli → artifacts/skill-A/
40
+ ↓ (artifacts as input)
41
+ Skill B → ccw cli → artifacts/skill-B/
42
+ ↓ (artifacts as input)
43
+ Skill C → ccw cli → artifacts/skill-C/
44
+
45
+ Phase 3 evaluates entire chain output + per-skill scores
46
+ Phase 4 improves weakest skill(s) in chain
47
+ ```
48
+
49
+ ## Key Design Principles
50
+
51
+ 1. **Iteration Loop**: Phases 2-3-4 repeat until quality threshold, max iterations, or convergence
52
+ 2. **Two-Tool Pipeline**: Claude (write/execute) + Gemini (analyze/evaluate) = complementary perspectives
53
+ 3. **Pure Orchestrator**: SKILL.md coordinates only — execution detail lives in phase files
54
+ 4. **Progressive Phase Loading**: Phase docs read only when that phase executes
55
+ 5. **Skill Versioning**: Each iteration snapshots skill state before execution
56
+ 6. **Convergence Detection**: Stop early if score stalls (≤2 points of total improvement across the last 2 iterations)
57
+
58
+ ## Interactive Preference Collection
59
+
60
+ ```javascript
61
+ // ★ Auto mode detection
62
+ const autoYes = /(?:^|\s)(?:-y|--yes)(?=\s|$)/.test($ARGUMENTS)
63
+
64
+ if (autoYes) {
65
+ workflowPreferences = {
66
+ autoYes: true,
67
+ maxIterations: 5,
68
+ qualityThreshold: 80,
69
+ executionMode: 'single'
70
+ }
71
+ } else {
72
+ const prefResponse = ask_question({
73
+ questions: [
74
+ {
75
+ question: "选择迭代调优配置:",
76
+ header: "Tune Config",
77
+ multiSelect: false,
78
+ options: [
79
+ { label: "Quick (3 iter, 70)", description: "快速迭代,适合小幅改进" },
80
+ { label: "Standard (5 iter, 80) (Recommended)", description: "平衡方案,适合多数场景" },
81
+ { label: "Thorough (8 iter, 90)", description: "深度优化,适合生产级 skill" }
82
+ ]
83
+ }
84
+ ]
85
+ })
86
+
87
+ const configMap = {
88
+ "Quick": { maxIterations: 3, qualityThreshold: 70 },
89
+ "Standard": { maxIterations: 5, qualityThreshold: 80 },
90
+ "Thorough": { maxIterations: 8, qualityThreshold: 90 }
91
+ }
92
+ const selected = Object.keys(configMap).find(k =>
93
+ prefResponse["Tune Config"].startsWith(k)
94
+ ) || "Standard"
95
+ workflowPreferences = { autoYes: false, ...configMap[selected] }
96
+
97
+ // ★ Mode selection: chain vs single
98
+ const modeResponse = ask_question({
99
+ questions: [{
100
+ question: "选择调优模式:",
101
+ header: "Tune Mode",
102
+ multiSelect: false,
103
+ options: [
104
+ { label: "Single Skill (Recommended)", description: "独立调优每个 skill,适合单一 skill 优化" },
105
+ { label: "Skill Chain", description: "按链序执行,前一个 skill 的产出作为后一个的输入" }
106
+ ]
107
+ }]
108
+ });
109
+ workflowPreferences.executionMode = modeResponse["Tune Mode"].startsWith("Skill Chain")
110
+ ? "chain" : "single";
111
+ }
112
+ ```
113
+
114
+ ## Input Processing
115
+
116
+ ```
117
+ $ARGUMENTS → Parse:
118
+ ├─ Skill path(s): first arg, comma-separated for multiple
119
+ │ e.g., ".claude/skills/my-skill" or "my-skill" (auto-prefixed)
120
+ │ Chain mode: order preserved as chain_order
121
+ ├─ Test scenario: --scenario "description" or remaining text
122
+ └─ Flags: --max-iterations=N, --threshold=N, -y/--yes
123
+ ```
124
+
125
+ ## Execution Flow
126
+
127
+ > **⚠️ COMPACT DIRECTIVE**: Context compression MUST check TodoWrite phase status.
128
+ > The phase currently marked `in_progress` is the active execution phase — preserve its FULL content.
129
+ > Only compress phases marked `completed` or `pending`.
130
+
131
+ ### Phase 1: Setup (one-time)
132
+
133
+ Read and execute: `Ref: phases/01-setup.md`
134
+
135
+ - Parse skill paths, validate existence
136
+ - Create workspace at `.workflow/.scratchpad/skill-iter-tune-{ts}/`
137
+ - Backup original skill files
138
+ - Initialize iteration-state.json
139
+
140
+ Output: `workDir`, `targetSkills[]`, `testScenario`, initialized state
141
+
142
+ ### Iteration Loop
143
+
144
+ ```javascript
145
+ // Orchestrator iteration loop
146
+ while (true) {
147
+ // Increment iteration
148
+ state.current_iteration++;
149
+ state.iterations.push({
150
+ round: state.current_iteration,
151
+ status: 'pending',
152
+ execution: null,
153
+ evaluation: null,
154
+ improvement: null
155
+ });
156
+
157
+ // Update TodoWrite
158
+ TaskUpdate(iterationTask, {
159
+ subject: `Iteration ${state.current_iteration}/${state.max_iterations}`,
160
+ status: 'in_progress',
161
+ activeForm: `Running iteration ${state.current_iteration}`
162
+ });
163
+
164
+ // === Phase 2: Execute ===
165
+ // Read: phases/02-execute.md
166
+ // Single mode: one ccw cli call for all skills
167
+ // Chain mode: sequential ccw cli per skill in chain_order, passing artifacts
168
+ // Snapshot skill → construct prompt → ccw cli --tool claude --mode write
169
+ // Collect artifacts
170
+
171
+ // === Phase 3: Evaluate ===
172
+ // Read: phases/03-evaluate.md
173
+ // Construct eval prompt → ccw cli --tool gemini --mode analysis
174
+ // Parse score → write iteration-N-eval.md → check termination
175
+
176
+ // Check termination
177
+ if (shouldTerminate(state).terminate) {
178
+ break; // → Phase 5
179
+ }
180
+
181
+ // === Phase 4: Improve ===
182
+ // Read: phases/04-improve.md
183
+ // Agent applies suggestions → write iteration-N-changes.md
184
+
185
+ // Update TodoWrite with score
186
+ // Continue loop
187
+ }
188
+ ```
189
+
190
+ ### Phase 2: Execute Skill (per iteration)
191
+
192
+ Read and execute: `Ref: phases/02-execute.md`
193
+
194
+ - Snapshot skill → `iteration-{N}/skill-snapshot/`
195
+ - Build execution prompt from skill content + test scenario
196
+ - Execute: `ccw cli -p "..." --tool claude --mode write --cd "${iterDir}/artifacts"`
197
+ - Collect artifacts
198
+
199
+ ### Phase 3: Evaluate Quality (per iteration)
200
+
201
+ Read and execute: `Ref: phases/03-evaluate.md`
202
+
203
+ - Build evaluation prompt with skill + artifacts + criteria + history
204
+ - Execute: `ccw cli -p "..." --tool gemini --mode analysis`
205
+ - Parse 5-dimension score (Clarity, Completeness, Correctness, Effectiveness, Efficiency)
206
+ - Write `iteration-{N}-eval.md`
207
+ - Check termination: score >= threshold | iter >= max | convergence | error limit
208
+
209
+ ### Phase 4: Apply Improvements (per iteration, skipped on termination)
210
+
211
+ Read and execute: `Ref: phases/04-improve.md`
212
+
213
+ - Read evaluation suggestions
214
+ - Launch general-purpose Agent to apply changes
215
+ - Write `iteration-{N}-changes.md`
216
+ - Update state
217
+
218
+ ### Phase 5: Final Report (one-time)
219
+
220
+ Read and execute: `Ref: phases/05-report.md`
221
+
222
+ - Generate comprehensive report with score progression table
223
+ - Write `final-report.md`
224
+ - Display summary to user
225
+
226
+ **Phase Reference Documents** (read on-demand when phase executes):
227
+
228
+ | Phase | Document | Purpose | Compact |
229
+ |-------|----------|---------|---------|
230
+ | 1 | [phases/01-setup.md](phases/01-setup.md) | Initialize workspace and state | TodoWrite 驱动 |
231
+ | 2 | [phases/02-execute.md](phases/02-execute.md) | Execute skill via ccw cli Claude | TodoWrite 驱动 + 🔄 sentinel |
232
+ | 3 | [phases/03-evaluate.md](phases/03-evaluate.md) | Evaluate via ccw cli Gemini | TodoWrite 驱动 + 🔄 sentinel |
233
+ | 4 | [phases/04-improve.md](phases/04-improve.md) | Apply improvements via Agent | TodoWrite 驱动 + 🔄 sentinel |
234
+ | 5 | [phases/05-report.md](phases/05-report.md) | Generate final report | TodoWrite 驱动 |
235
+
236
+ **Compact Rules**:
237
+ 1. **TodoWrite `in_progress`** → 保留完整内容,禁止压缩
238
+ 2. **TodoWrite `completed`** → 可压缩为摘要
239
+ 3. **🔄 sentinel fallback** → 若 compact 后仅存 sentinel 而无完整 Step 协议,立即 `view_file()` 恢复
240
+
241
+ ## Core Rules
242
+
243
+ 1. **Start Immediately**: First action is preference collection → Phase 1 setup
244
+ 2. **Progressive Loading**: Read phase doc ONLY when that phase is about to execute
245
+ 3. **Snapshot Before Execute**: Always snapshot skill state before each iteration
246
+ 4. **Background CLI**: ccw cli runs in background, wait for hook callback before proceeding
247
+ 5. **Parse Every Output**: Extract structured JSON from CLI outputs for state updates
248
+ 6. **DO NOT STOP**: Continuous iteration until termination condition met
249
+ 7. **Single State Source**: `iteration-state.json` is the only source of truth
250
+
251
+ ## Data Flow
252
+
253
+ ```
254
+ User Input (skill paths + test scenario)
255
+ ↓ (+ execution_mode + chain_order if chain mode)
256
+
257
+ Phase 1: Setup
258
+ ↓ workDir, targetSkills[], testScenario, iteration-state.json
259
+
260
+ ┌─→ Phase 2: Execute (ccw cli claude)
261
+ │ ↓ artifacts/ (skill execution output)
262
+ │ ↓
263
+ │ Phase 3: Evaluate (ccw cli gemini)
264
+ │ ↓ score, dimensions[], suggestions[], iteration-N-eval.md
265
+ │ ↓
266
+ │ [Terminate?]─── YES ──→ Phase 5: Report → final-report.md
267
+ │ ↓ NO
268
+ │ ↓
269
+ │ Phase 4: Improve (Agent)
270
+ │ ↓ modified skill files, iteration-N-changes.md
271
+ │ ↓
272
+ └───┘ next iteration
273
+ ```
274
+
275
+ ## TodoWrite Pattern
276
+
277
+ ```javascript
278
+ // Initial state
279
+ TaskCreate({ subject: "Phase 1: Setup workspace", activeForm: "Setting up workspace" })
280
+ TaskCreate({ subject: "Iteration Loop", activeForm: "Running iterations" })
281
+ TaskCreate({ subject: "Phase 5: Final Report", activeForm: "Generating report" })
282
+
283
+ // Chain mode: create per-skill tracking tasks
284
+ if (state.execution_mode === 'chain') {
285
+ for (const skillName of state.chain_order) {
286
+ TaskCreate({
287
+ subject: `Chain: ${skillName}`,
288
+ activeForm: `Tracking ${skillName}`,
289
+ description: `Skill chain member position ${state.chain_order.indexOf(skillName) + 1}`
290
+ })
291
+ }
292
+ }
293
+
294
+ // During iteration N
295
+ // Single mode: one score per iteration (existing behavior)
296
+ // Chain mode: per-skill status updates
297
+ if (state.execution_mode === 'chain') {
298
+ // After each skill executes in Phase 2:
299
+ TaskUpdate(chainSkillTask, {
300
+ subject: `Chain: ${skillName} — Iter ${N} executed`,
301
+ activeForm: `${skillName} iteration ${N}`
302
+ })
303
+ // After Phase 3 evaluates:
304
+ TaskUpdate(chainSkillTask, {
305
+ subject: `Chain: ${skillName} — Score ${chainScores[skillName]}/100`,
306
+ activeForm: `${skillName} scored`
307
+ })
308
+ } else {
309
+ // Single mode (existing)
310
+ TaskCreate({
311
+ subject: `Iteration ${N}: Score ${score}/100`,
312
+ activeForm: `Iteration ${N} complete`,
313
+ description: `Strengths: ... | Weaknesses: ... | Suggestions: ${count}`
314
+ })
315
+ }
316
+
317
+ // Completed — collapse
318
+ TaskUpdate(iterLoop, {
319
+ subject: `Iteration Loop (${totalIters} iters, final: ${finalScore})`,
320
+ status: 'completed'
321
+ })
322
+ ```
323
+
324
+ ## Termination Logic
325
+
326
+ ```javascript
327
+ function shouldTerminate(state) {
328
+ // 1. Quality threshold met
329
+ if (state.latest_score >= state.quality_threshold) {
330
+ return { terminate: true, reason: 'quality_threshold_met' };
331
+ }
332
+ // 2. Max iterations reached
333
+ if (state.current_iteration >= state.max_iterations) {
334
+ return { terminate: true, reason: 'max_iterations_reached' };
335
+ }
336
+ // 3. Convergence: ≤2 points improvement over last 2 iterations
337
+ if (state.score_trend.length >= 3) {
338
+ const last3 = state.score_trend.slice(-3);
339
+ if (last3[2] - last3[0] <= 2) {
340
+ state.converged = true;
341
+ return { terminate: true, reason: 'convergence_detected' };
342
+ }
343
+ }
344
+ // 4. Error limit
345
+ if (state.error_count >= state.max_errors) {
346
+ return { terminate: true, reason: 'error_limit_reached' };
347
+ }
348
+ return { terminate: false };
349
+ }
350
+ ```
351
+
352
+ ## Error Handling
353
+
354
+ | Phase | Error | Recovery |
355
+ |-------|-------|----------|
356
+ | 2: Execute | CLI timeout/crash | Retry once with simplified prompt, then skip |
357
+ | 3: Evaluate | CLI fails | Retry once, then use score 50 with warning |
358
+ | 3: Evaluate | JSON parse fails | Extract score heuristically, save raw output |
359
+ | 4: Improve | Agent fails | Rollback from `iteration-{N}/skill-snapshot/` |
360
+ | Any | 3+ consecutive errors | Terminate with error report |
361
+
362
+ **Error Budget**: Each phase gets 1 retry. 3 consecutive failed iterations trigger termination.
363
+
364
+ ## Coordinator Checklist
365
+
366
+ ### Pre-Phase Actions
367
+ - [ ] Read iteration-state.json for current state
368
+ - [ ] Verify workspace directory exists
369
+ - [ ] Check error count hasn't exceeded limit
370
+
371
+ ### Per-Iteration Actions
372
+ - [ ] Increment current_iteration in state
373
+ - [ ] Create iteration-{N} subdirectory
374
+ - [ ] Update TodoWrite with iteration status
375
+ - [ ] After Phase 3: check termination before Phase 4
376
+ - [ ] After Phase 4: write state, proceed to next iteration
377
+
378
+ ### Post-Workflow Actions
379
+ - [ ] Execute Phase 5 (Report)
380
+ - [ ] Display final summary to user
381
+ - [ ] Update all TodoWrite tasks to completed