aiox-core 5.0.3 → 5.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (468) hide show
  1. package/.aiox-core/core/execution/predictive-pipeline.js +1283 -0
  2. package/.aiox-core/core/memory/decision-memory.js +564 -0
  3. package/.aiox-core/data/entity-registry.yaml +1068 -1028
  4. package/.aiox-core/data/registry-update-log.jsonl +2 -2
  5. package/.aiox-core/development/templates/service-template/README.md.hbs +158 -158
  6. package/.aiox-core/development/templates/service-template/__tests__/index.test.ts.hbs +237 -237
  7. package/.aiox-core/development/templates/service-template/client.ts.hbs +403 -403
  8. package/.aiox-core/development/templates/service-template/errors.ts.hbs +182 -182
  9. package/.aiox-core/development/templates/service-template/index.ts.hbs +120 -120
  10. package/.aiox-core/development/templates/service-template/package.json.hbs +87 -87
  11. package/.aiox-core/development/templates/service-template/types.ts.hbs +145 -145
  12. package/.aiox-core/development/templates/squad-template/LICENSE +21 -21
  13. package/.aiox-core/infrastructure/templates/aiox-sync.yaml.template +182 -182
  14. package/.aiox-core/infrastructure/templates/coderabbit.yaml.template +279 -279
  15. package/.aiox-core/infrastructure/templates/github-workflows/ci.yml.template +169 -169
  16. package/.aiox-core/infrastructure/templates/github-workflows/pr-automation.yml.template +330 -330
  17. package/.aiox-core/infrastructure/templates/github-workflows/release.yml.template +196 -196
  18. package/.aiox-core/infrastructure/templates/gitignore/gitignore-aiox-base.tmpl +63 -63
  19. package/.aiox-core/infrastructure/templates/gitignore/gitignore-brownfield-merge.tmpl +18 -18
  20. package/.aiox-core/infrastructure/templates/gitignore/gitignore-node.tmpl +85 -85
  21. package/.aiox-core/infrastructure/templates/gitignore/gitignore-python.tmpl +145 -145
  22. package/.aiox-core/install-manifest.yaml +63 -55
  23. package/.aiox-core/local-config.yaml.template +71 -71
  24. package/.aiox-core/monitor/hooks/lib/__init__.py +1 -1
  25. package/.aiox-core/monitor/hooks/lib/enrich.py +58 -58
  26. package/.aiox-core/monitor/hooks/lib/send_event.py +47 -47
  27. package/.aiox-core/monitor/hooks/notification.py +29 -29
  28. package/.aiox-core/monitor/hooks/post_tool_use.py +45 -45
  29. package/.aiox-core/monitor/hooks/pre_compact.py +29 -29
  30. package/.aiox-core/monitor/hooks/pre_tool_use.py +40 -40
  31. package/.aiox-core/monitor/hooks/stop.py +29 -29
  32. package/.aiox-core/monitor/hooks/subagent_stop.py +29 -29
  33. package/.aiox-core/monitor/hooks/user_prompt_submit.py +38 -38
  34. package/.aiox-core/product/templates/adr.hbs +125 -125
  35. package/.aiox-core/product/templates/dbdr.hbs +241 -241
  36. package/.aiox-core/product/templates/epic.hbs +212 -212
  37. package/.aiox-core/product/templates/pmdr.hbs +186 -186
  38. package/.aiox-core/product/templates/prd-v2.0.hbs +216 -216
  39. package/.aiox-core/product/templates/prd.hbs +201 -201
  40. package/.aiox-core/product/templates/story.hbs +263 -263
  41. package/.aiox-core/product/templates/task.hbs +170 -170
  42. package/.aiox-core/product/templates/tmpl-comment-on-examples.sql +158 -158
  43. package/.aiox-core/product/templates/tmpl-migration-script.sql +91 -91
  44. package/.aiox-core/product/templates/tmpl-rls-granular-policies.sql +104 -104
  45. package/.aiox-core/product/templates/tmpl-rls-kiss-policy.sql +10 -10
  46. package/.aiox-core/product/templates/tmpl-rls-roles.sql +135 -135
  47. package/.aiox-core/product/templates/tmpl-rls-simple.sql +77 -77
  48. package/.aiox-core/product/templates/tmpl-rls-tenant.sql +152 -152
  49. package/.aiox-core/product/templates/tmpl-rollback-script.sql +77 -77
  50. package/.aiox-core/product/templates/tmpl-seed-data.sql +140 -140
  51. package/.aiox-core/product/templates/tmpl-smoke-test.sql +16 -16
  52. package/.aiox-core/product/templates/tmpl-staging-copy-merge.sql +139 -139
  53. package/.aiox-core/product/templates/tmpl-stored-proc.sql +140 -140
  54. package/.aiox-core/product/templates/tmpl-trigger.sql +152 -152
  55. package/.aiox-core/product/templates/tmpl-view-materialized.sql +133 -133
  56. package/.aiox-core/product/templates/tmpl-view.sql +177 -177
  57. package/.aiox-core/scripts/pm.sh +0 -0
  58. package/.claude/hooks/enforce-architecture-first.py +196 -196
  59. package/.claude/hooks/mind-clone-governance.py +192 -192
  60. package/.claude/hooks/read-protection.py +151 -151
  61. package/.claude/hooks/slug-validation.py +176 -176
  62. package/.claude/hooks/sql-governance.py +182 -182
  63. package/.claude/hooks/write-path-validation.py +194 -194
  64. package/LICENSE +33 -33
  65. package/bin/aiox-graph.js +0 -0
  66. package/bin/aiox-minimal.js +0 -0
  67. package/bin/aiox.js +0 -0
  68. package/package.json +1 -1
  69. package/packages/aiox-install/bin/aiox-install.js +0 -0
  70. package/packages/aiox-install/bin/edmcp.js +0 -0
  71. package/packages/aiox-pro-cli/bin/aiox-pro.js +0 -0
  72. package/packages/installer/src/wizard/pro-setup.js +28 -0
  73. package/pro/README.md +66 -66
  74. package/pro/feature-registry.yaml +225 -223
  75. package/pro/license/license-api.js +701 -679
  76. package/pro/package.json +39 -39
  77. package/pro/pro-config.yaml +63 -63
  78. package/pro/squads/README.md +24 -24
  79. package/pro/squads/design/HEADLINE.md +3 -3
  80. package/pro/squads/design/README.md +109 -109
  81. package/pro/squads/design/agents/brad-frost.md +1097 -1097
  82. package/pro/squads/design/agents/dan-mall.md +857 -857
  83. package/pro/squads/design/agents/dave-malouf.md +2272 -2272
  84. package/pro/squads/design/agents/design-chief.md +114 -114
  85. package/pro/squads/design/agents/ds-foundations-lead.md +194 -194
  86. package/pro/squads/design/agents/ds-token-architect.md +361 -361
  87. package/pro/squads/design/agents/nano-banana-generator.md +162 -162
  88. package/pro/squads/design/agents/storybook-expert.md +809 -809
  89. package/pro/squads/design/checklists/atomic-refactor-checklist.md +299 -299
  90. package/pro/squads/design/checklists/component-adaptation-checklist.md +81 -81
  91. package/pro/squads/design/checklists/design-fidelity-checklist.md +283 -283
  92. package/pro/squads/design/checklists/design-handoff-checklist.md +55 -55
  93. package/pro/squads/design/checklists/design-team-health-checklist.md +454 -454
  94. package/pro/squads/design/checklists/designops-maturity-checklist.md +518 -518
  95. package/pro/squads/design/checklists/ds-a11y-release-gate-checklist.md +45 -45
  96. package/pro/squads/design/checklists/ds-accessibility-wcag-checklist.md +147 -147
  97. package/pro/squads/design/checklists/ds-component-quality-checklist.md +150 -150
  98. package/pro/squads/design/checklists/ds-critical-eye-review-checklist.md +147 -147
  99. package/pro/squads/design/checklists/ds-migration-readiness-checklist.md +99 -99
  100. package/pro/squads/design/checklists/ds-pattern-audit-checklist.md +164 -164
  101. package/pro/squads/design/checklists/reading-accessibility-checklist.md +275 -275
  102. package/pro/squads/design/checklists/token-mapping-checklist.md +107 -107
  103. package/pro/squads/design/config/coding-standards.md +286 -286
  104. package/pro/squads/design/config/source-tree.md +59 -59
  105. package/pro/squads/design/config/tech-stack.md +48 -48
  106. package/pro/squads/design/config.yaml +204 -204
  107. package/pro/squads/design/data/agentic-design-systems-guide.md +46 -46
  108. package/pro/squads/design/data/agentic-ds-principles.md +100 -100
  109. package/pro/squads/design/data/atomic-design-principles.md +108 -108
  110. package/pro/squads/design/data/atomic-refactor-rules.md +582 -582
  111. package/pro/squads/design/data/base-component-specs.md +972 -972
  112. package/pro/squads/design/data/brad-frost-analysis-extract-implicit.yaml +270 -270
  113. package/pro/squads/design/data/brad-frost-analysis-find-0.8.yaml +176 -176
  114. package/pro/squads/design/data/brad-frost-analysis-qa-report.yaml +168 -168
  115. package/pro/squads/design/data/brad-frost-dna.yaml +713 -713
  116. package/pro/squads/design/data/capability-tools.yaml +124 -124
  117. package/pro/squads/design/data/component-adaptation-changelog.md +318 -318
  118. package/pro/squads/design/data/consolidation-algorithms.md +168 -168
  119. package/pro/squads/design/data/critical-eye-scoring-rules.yaml +240 -240
  120. package/pro/squads/design/data/design-token-best-practices.md +107 -107
  121. package/pro/squads/design/data/design-tokens-spec.yaml +418 -418
  122. package/pro/squads/design/data/ds-reference-architectures.md +93 -93
  123. package/pro/squads/design/data/f2-qa-report.md +168 -168
  124. package/pro/squads/design/data/f3-derived-components-changelog.md +100 -100
  125. package/pro/squads/design/data/f3-qa-report.md +208 -208
  126. package/pro/squads/design/data/figma-base-components-raw.md +101 -101
  127. package/pro/squads/design/data/figma-tokens-raw.md +1548 -1548
  128. package/pro/squads/design/data/fluent2-design-principles.md +114 -114
  129. package/pro/squads/design/data/high-retention-reading-guide.md +349 -349
  130. package/pro/squads/design/data/integration-patterns.md +207 -207
  131. package/pro/squads/design/data/internal-quality-chain.yaml +48 -48
  132. package/pro/squads/design/data/motion-tokens-guide.md +202 -202
  133. package/pro/squads/design/data/roi-calculation-guide.md +142 -142
  134. package/pro/squads/design/data/token-mapping-reference.md +213 -213
  135. package/pro/squads/design/data/w3c-dtcg-spec-reference.md +149 -149
  136. package/pro/squads/design/data/wcag-compliance-guide.md +267 -267
  137. package/pro/squads/design/docs/AUDIT_REPORT.md +97 -97
  138. package/pro/squads/design/docs/DS-CURATION-PIPELINE-PROPOSAL.md +577 -577
  139. package/pro/squads/design/docs/UPGRADE_PLAN.md +618 -618
  140. package/pro/squads/design/docs/brad-frost-research-validation.md +372 -372
  141. package/pro/squads/design/docs/dave-malouf-research-validation.md +391 -391
  142. package/pro/squads/design/docs/tool-discovery-report.md +87 -87
  143. package/pro/squads/design/docs/tool-integration-plan.md +44 -44
  144. package/pro/squads/design/protocols/ai-first-governance.md +56 -56
  145. package/pro/squads/design/protocols/governance-execution-boundary.md +59 -59
  146. package/pro/squads/design/protocols/handoff.md +60 -60
  147. package/pro/squads/design/rules/.claude-rules.md +88 -88
  148. package/pro/squads/design/scripts/design-system/curate_colors.cjs +447 -447
  149. package/pro/squads/design/scripts/design-system/curate_components.cjs +217 -217
  150. package/pro/squads/design/scripts/design-system/curate_radius.cjs +190 -190
  151. package/pro/squads/design/scripts/design-system/curate_shadows.cjs +208 -208
  152. package/pro/squads/design/scripts/design-system/curate_spacing.cjs +243 -243
  153. package/pro/squads/design/scripts/design-system/curate_typography.cjs +404 -404
  154. package/pro/squads/design/scripts/design-system/design-system-metadata.test.js +49 -49
  155. package/pro/squads/design/scripts/design-system/design_manifest_lib.cjs +142 -142
  156. package/pro/squads/design/scripts/design-system/fetch_page_images.cjs +195 -195
  157. package/pro/squads/design/scripts/design-system/generate_components_metadata.cjs +114 -114
  158. package/pro/squads/design/scripts/design-system/generate_curation_report.cjs +258 -258
  159. package/pro/squads/design/scripts/design-system/generate_tokens.cjs +342 -342
  160. package/pro/squads/design/scripts/design-system/sync_design_manifest.cjs +27 -27
  161. package/pro/squads/design/scripts/design-system/test_mcp_tools.cjs +232 -232
  162. package/pro/squads/design/scripts/design-system/validate_components_metadata.cjs +96 -96
  163. package/pro/squads/design/scripts/design-system/validate_curation.cjs +226 -226
  164. package/pro/squads/design/scripts/design-system/validate_design_manifest_drift.cjs +72 -72
  165. package/pro/squads/design/scripts/design-system/validate_mcp_skeleton.cjs +38 -38
  166. package/pro/squads/design/scripts/design-system/validate_registry.cjs +186 -186
  167. package/pro/squads/design/scripts/design-system/validate_task_checklist_bindings.cjs +78 -78
  168. package/pro/squads/design/scripts/dissect-artifact.cjs +806 -806
  169. package/pro/squads/design/scripts/validate-a11y-integration.cjs +40 -40
  170. package/pro/squads/design/scripts/validate-design-squad.py +411 -411
  171. package/pro/squads/design/squad.yaml +714 -714
  172. package/pro/squads/design/tasks/a11y-audit.md +340 -340
  173. package/pro/squads/design/tasks/aria-audit.md +525 -525
  174. package/pro/squads/design/tasks/atomic-refactor-execute.md +391 -391
  175. package/pro/squads/design/tasks/atomic-refactor-plan.md +262 -262
  176. package/pro/squads/design/tasks/audit-reading-experience.md +350 -350
  177. package/pro/squads/design/tasks/audit-tailwind-config.md +101 -101
  178. package/pro/squads/design/tasks/bootstrap-shadcn-library.md +96 -96
  179. package/pro/squads/design/tasks/bundle-audit.md +245 -245
  180. package/pro/squads/design/tasks/contrast-matrix.md +373 -373
  181. package/pro/squads/design/tasks/create-doc.md +135 -135
  182. package/pro/squads/design/tasks/dead-code-detection.md +329 -329
  183. package/pro/squads/design/tasks/design-compare.md +414 -414
  184. package/pro/squads/design/tasks/design-process-optimization.md +407 -407
  185. package/pro/squads/design/tasks/design-review-orchestration.md +99 -99
  186. package/pro/squads/design/tasks/design-team-scaling.md +407 -407
  187. package/pro/squads/design/tasks/design-tooling-audit.md +404 -404
  188. package/pro/squads/design/tasks/design-triage.md +89 -89
  189. package/pro/squads/design/tasks/designops-maturity-assessment.md +364 -364
  190. package/pro/squads/design/tasks/designops-metrics-setup.md +465 -465
  191. package/pro/squads/design/tasks/ds-agentic-audit.md +100 -100
  192. package/pro/squads/design/tasks/ds-agentic-setup.md +103 -103
  193. package/pro/squads/design/tasks/ds-audit-codebase.md +273 -273
  194. package/pro/squads/design/tasks/ds-build-component.md +349 -349
  195. package/pro/squads/design/tasks/ds-build-mcp-server.md +84 -84
  196. package/pro/squads/design/tasks/ds-calculate-roi.md +282 -282
  197. package/pro/squads/design/tasks/ds-compose-molecule.md +106 -106
  198. package/pro/squads/design/tasks/ds-consolidate-patterns.md +253 -253
  199. package/pro/squads/design/tasks/ds-context-contract.md +194 -194
  200. package/pro/squads/design/tasks/ds-critical-eye-compare.md +130 -130
  201. package/pro/squads/design/tasks/ds-critical-eye-decide.md +139 -139
  202. package/pro/squads/design/tasks/ds-critical-eye-inventory.md +111 -111
  203. package/pro/squads/design/tasks/ds-critical-eye-report.md +101 -101
  204. package/pro/squads/design/tasks/ds-critical-eye-score.md +109 -109
  205. package/pro/squads/design/tasks/ds-designops.md +99 -99
  206. package/pro/squads/design/tasks/ds-extend-pattern.md +91 -91
  207. package/pro/squads/design/tasks/ds-extract-tokens.md +312 -312
  208. package/pro/squads/design/tasks/ds-figma-pipeline.md +95 -95
  209. package/pro/squads/design/tasks/ds-fluent-audit.md +105 -105
  210. package/pro/squads/design/tasks/ds-fluent-build.md +110 -110
  211. package/pro/squads/design/tasks/ds-generate-ai-metadata.md +81 -81
  212. package/pro/squads/design/tasks/ds-generate-cursor-rules.md +74 -74
  213. package/pro/squads/design/tasks/ds-generate-documentation.md +101 -101
  214. package/pro/squads/design/tasks/ds-generate-migration-strategy.md +331 -331
  215. package/pro/squads/design/tasks/ds-generate-shock-report.md +323 -323
  216. package/pro/squads/design/tasks/ds-govern-a11y-compliance.md +93 -93
  217. package/pro/squads/design/tasks/ds-governance.md +187 -187
  218. package/pro/squads/design/tasks/ds-health-metrics.md +278 -278
  219. package/pro/squads/design/tasks/ds-integrate-squad.md +130 -130
  220. package/pro/squads/design/tasks/ds-integrate-workspace.md +100 -100
  221. package/pro/squads/design/tasks/ds-legacy-modernization.md +302 -302
  222. package/pro/squads/design/tasks/ds-mcp-status.md +65 -65
  223. package/pro/squads/design/tasks/ds-motion-audit.md +118 -118
  224. package/pro/squads/design/tasks/ds-multi-framework.md +96 -96
  225. package/pro/squads/design/tasks/ds-parallelization-gate.md +246 -246
  226. package/pro/squads/design/tasks/ds-query.md +90 -90
  227. package/pro/squads/design/tasks/ds-rebuild-artifact.md +369 -369
  228. package/pro/squads/design/tasks/ds-reverse-engineer.md +194 -194
  229. package/pro/squads/design/tasks/ds-scan-artifact.md +131 -131
  230. package/pro/squads/design/tasks/ds-setup-design-system.md +297 -297
  231. package/pro/squads/design/tasks/ds-sync-registry.md +287 -287
  232. package/pro/squads/design/tasks/ds-theme-multi-brand.md +90 -90
  233. package/pro/squads/design/tasks/ds-token-modes.md +108 -108
  234. package/pro/squads/design/tasks/ds-token-w3c-extract.md +105 -105
  235. package/pro/squads/design/tasks/ds-validate-ai-readiness.md +69 -69
  236. package/pro/squads/design/tasks/ds-visual-regression.md +130 -130
  237. package/pro/squads/design/tasks/execute-checklist.md +141 -141
  238. package/pro/squads/design/tasks/export-design-tokens-dtcg.md +97 -97
  239. package/pro/squads/design/tasks/f1-apply-foundations.md +154 -154
  240. package/pro/squads/design/tasks/f1-ingest-figma-tokens.md +130 -130
  241. package/pro/squads/design/tasks/f1-map-tokens-to-shadcn.md +145 -145
  242. package/pro/squads/design/tasks/f1-qa-foundations.md +95 -95
  243. package/pro/squads/design/tasks/f2-adapt-shadcn-components.md +155 -155
  244. package/pro/squads/design/tasks/f2-ingest-base-components.md +148 -148
  245. package/pro/squads/design/tasks/f2-qa-base-components.md +98 -98
  246. package/pro/squads/design/tasks/f3-derive-components.md +145 -145
  247. package/pro/squads/design/tasks/f3-qa-derived-components.md +101 -101
  248. package/pro/squads/design/tasks/focus-order-audit.md +450 -450
  249. package/pro/squads/design/tasks/sb-brownfield-migrate.md +367 -367
  250. package/pro/squads/design/tasks/sb-brownfield-scan.md +318 -318
  251. package/pro/squads/design/tasks/sb-configure.md +230 -230
  252. package/pro/squads/design/tasks/sb-expand-shadcn.md +213 -213
  253. package/pro/squads/design/tasks/sb-generate-all-stories.md +288 -288
  254. package/pro/squads/design/tasks/sb-install.md +152 -152
  255. package/pro/squads/design/tasks/sb-sync-workspace.md +239 -239
  256. package/pro/squads/design/tasks/sb-verify.md +203 -203
  257. package/pro/squads/design/tasks/tailwind-upgrade.md +117 -117
  258. package/pro/squads/design/tasks/token-usage-analytics.md +262 -262
  259. package/pro/squads/design/tasks/ux-rewrite-sixth-grade.md +82 -82
  260. package/pro/squads/design/tasks/validate-design-fidelity.md +222 -222
  261. package/pro/squads/design/templates/agent-template.yaml +46 -46
  262. package/pro/squads/design/templates/clone-mind-template.md +352 -352
  263. package/pro/squads/design/templates/component-prompt-injection-tmpl.md +236 -236
  264. package/pro/squads/design/templates/component-visual-spec-tmpl.md +378 -378
  265. package/pro/squads/design/templates/critical-eye-cycle-report-tmpl.md +165 -165
  266. package/pro/squads/design/templates/design-fidelity-report-tmpl.md +155 -155
  267. package/pro/squads/design/templates/ds-ai-component-metadata-schema-tmpl.json +138 -138
  268. package/pro/squads/design/templates/ds-artifact-analysis.md +70 -70
  269. package/pro/squads/design/templates/ds-health-report-tmpl.md +236 -236
  270. package/pro/squads/design/templates/ds-migration-strategy-tmpl.md +524 -524
  271. package/pro/squads/design/templates/ds-state-persistence-tmpl.yaml +194 -194
  272. package/pro/squads/design/templates/ds-tokens-schema-tmpl.yaml +139 -139
  273. package/pro/squads/design/templates/migration-strategy-tmpl.md +524 -524
  274. package/pro/squads/design/templates/reading-design-tokens.css +26 -26
  275. package/pro/squads/design/templates/state-persistence-tmpl.yaml +219 -219
  276. package/pro/squads/design/templates/tokens-schema-tmpl.yaml +305 -305
  277. package/pro/squads/design/workflows/agentic-readiness.yaml +83 -83
  278. package/pro/squads/design/workflows/audit-only.yaml +198 -198
  279. package/pro/squads/design/workflows/brownfield-complete.yaml +257 -257
  280. package/pro/squads/design/workflows/critical-eye.yaml +184 -184
  281. package/pro/squads/design/workflows/dtcg-tokens-governance.yaml +64 -64
  282. package/pro/squads/design/workflows/foundations-pipeline.yaml +192 -192
  283. package/pro/squads/design/workflows/greenfield-new.yaml +192 -192
  284. package/pro/squads/design/workflows/motion-quality.yaml +65 -65
  285. package/pro/squads/design/workflows/self-healing-workflow.yaml +237 -237
  286. package/pro/squads/design/workflows/storybook-brownfield-migration.yaml +400 -400
  287. package/pro/squads/design/workflows/storybook-full-setup.yaml +280 -280
  288. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/ARQUITETURA_COGNITIVA_DE_ALEX_HORMOZI_EXTRA/303/207/303/203O_COMPLETA.md +215 -0
  289. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/A_Rotina_de_Alta_Performance_de_Alex_Hormozi_Arquitetura,_Motiva/303/247/303/265es_e_Replica/303/247/303/243o.md +309 -0
  290. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/O_sistema_completo_de_cria/303/247/303/243o_de_conte/303/272do_de_Alex_Hormozi.md +416 -0
  291. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/Processo_Cria/303/247/303/243o_Conte/303/272do_Hormozi.md +0 -0
  292. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/DECIS/303/225ES_ESTRAT/303/211GICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
  293. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_ATOMIC_DESIGN.md +797 -0
  294. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/O_Cemit/303/251rio_de_Design_Systems.md +447 -0
  295. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/PRINC/303/215PIOS_DE_RACIOC/303/215NIO.md +190 -0
  296. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/DECIS/303/225ES_ESTRAT/303/211GICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
  297. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_ATOMIC_DESIGN.md +797 -0
  298. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/O_Cemit/303/251rio_de_Design_Systems.md +447 -0
  299. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/PRINC/303/215PIOS_DE_RACIOC/303/215NIO.md +190 -0
  300. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_ELON_MUSK.md +291 -0
  301. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/ASSINATURA_LINGU/303/215STICA_ELON_MUSK.md +485 -0
  302. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/A_Arquitetura_Mental_de_Elon_Musk_Uma_An/303/241lise_Sistem/303/241tica_dos_Frameworks_de_Pensamento.md +907 -0
  303. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Dossi/303/252_Estrat/303/251gico_A_Arquitetura_Psicol/303/263gica_de_Elon_Musk.md +252 -0
  304. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Os_Padr/303/265es_de_Leitura_de_Elon_Musk_e_Sua_Influ/303/252ncia_Sistem/303/241tica.md +287 -0
  305. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Uma_an/303/241lise_psicol/303/263gica_abrangente.md +187 -0
  306. package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_EUGENE_M._SCHWARTZ.md +790 -0
  307. package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/An/303/241lise_Completa_Eugene_Schwartz_Arquitetura_Cognitiva_DEEP.md +210 -0
  308. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/5H_EXTRA/303/207/303/203O_COGNITIVA_COMPLETA_PEDRO_VAL/303/211RIO_LOPEZ.md +226 -0
  309. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_COMPARATIVA_REVISADA_PEDRO_VAL/303/211RIO_LOPEZ.md +246 -0
  310. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_LINGU/303/215STICA_CARIOCA_PEDRO_VAL/303/211RIO_LOPEZ.md +274 -0
  311. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_PSICOM/303/211TRICA_DEFINITIVA_PEDRO_VAL/303/211RIO_LOPEZ.md +821 -0
  312. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_PEDRO_VAL/303/211RIO.md +1844 -0
  313. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/C/303/201LCULO_DE_RARIDADE_ESTAT/303/215STICA_PEDRO_VAL/303/211RIO_LOPEZ.md +154 -0
  314. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/EXTRA/303/207/303/203O_PEDRO_VAL/303/211RIO.md +237 -0
  315. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/MAPEAMENTO_LINGU/303/215STICO_PROFUNDO.md +161 -0
  316. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/META_AXIOMAS_DE_PEDRO_VAL/303/211RIO.md +256 -0
  317. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOL/303/223GICO_COGNITIVO_PEDRO_VAL/303/211RIO_LOPEZ.md +586 -0
  318. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOL/303/223GICO_COGNITIVO_V2_/342/200/224_CLONE_IA.md +452 -0
  319. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/TABELA_COMPARATIVA_AN/303/201LISE_COMPLETA_DOS_CLONES_IA.md +102 -0
  320. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/WHATSAPP_PADR/303/225ES_LINGU/303/215STICOS_PEDRO_VAL/303/211RIO_LOPEZ.md +286 -0
  321. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/heur/303/255sticas_de_decis/303/243o_e_algoritmos_mentais_/303/272nicos.md +268 -0
  322. package/pro/squads/mmos-squad/minds/ray_kurzweil/sources/books/PROTOCOLO_COMPLETO_DE_INTERROGA/303/207/303/203O_-_NAVAL_RAVIKANT.md +3624 -0
  323. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_JOBS.md +488 -0
  324. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Framework_Cabe/303/247a_Steve.md +257 -0
  325. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Relat/303/263rio_Abrangente_sobre_Steve_Jobs_para_Cria/303/247/303/243o_de_Clone_de_IA.md +370 -0
  326. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Steve_Jobs_An/303/241lise_Psicol/303/263gica_Profunda_e_Valida/303/247/303/243o_Comportamental.md +65 -0
  327. package/pro/squads/squad-creator-pro/HEADLINE.md +3 -3
  328. package/pro/squads/squad-creator-pro/agents/oalanicolas.md +438 -438
  329. package/pro/squads/squad-creator-pro/agents/squad-chief.md +1651 -1651
  330. package/pro/squads/squad-creator-pro/agents/thiago_finch.md +976 -976
  331. package/pro/squads/squad-creator-pro/assessments/axioma-assessment-wf-create-squad.yaml +325 -325
  332. package/pro/squads/squad-creator-pro/checklists/create-agent-checklist.md +184 -184
  333. package/pro/squads/squad-creator-pro/checklists/create-squad-checklist.md +219 -219
  334. package/pro/squads/squad-creator-pro/checklists/create-workflow-checklist.md +224 -224
  335. package/pro/squads/squad-creator-pro/checklists/mental-model-integration-checklist.md +95 -95
  336. package/pro/squads/squad-creator-pro/checklists/squad-overview-checklist.md +393 -393
  337. package/pro/squads/squad-creator-pro/config/model-routing.yaml +693 -693
  338. package/pro/squads/squad-creator-pro/config/scoring-rubric.yaml +199 -199
  339. package/pro/squads/squad-creator-pro/config.yaml +35 -35
  340. package/pro/squads/squad-creator-pro/data/internal-infrastructure-library.yaml +99 -99
  341. package/pro/squads/squad-creator-pro/data/mental-model-task-matrix.yaml +692 -692
  342. package/pro/squads/squad-creator-pro/docs/ADR-001-model-tier-qualification.md +344 -344
  343. package/pro/squads/squad-creator-pro/docs/AGENT-COLLABORATION.md +609 -609
  344. package/pro/squads/squad-creator-pro/docs/MIGRATION-PLAN-AGENT-CONFORMITY.md +861 -861
  345. package/pro/squads/squad-creator-pro/docs/MODEL-TIER-QUALIFICATION.md +337 -337
  346. package/pro/squads/squad-creator-pro/docs/optimize-v4-proposal.md +354 -354
  347. package/pro/squads/squad-creator-pro/docs/task-optimization-framework.md +229 -229
  348. package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_010.md +240 -240
  349. package/pro/squads/squad-creator-pro/protocols/ai-first-governance.md +63 -63
  350. package/pro/squads/squad-creator-pro/scripts/assess-sources.sh +443 -443
  351. package/pro/squads/squad-creator-pro/scripts/clone-review.sh +394 -394
  352. package/pro/squads/squad-creator-pro/scripts/create-agent-preflight.py +243 -243
  353. package/pro/squads/squad-creator-pro/scripts/cross-provider/compare-results.js +281 -281
  354. package/pro/squads/squad-creator-pro/scripts/cross-provider/cross-provider-runner.js +462 -462
  355. package/pro/squads/squad-creator-pro/scripts/fidelity-score.sh +519 -519
  356. package/pro/squads/squad-creator-pro/scripts/generate-squad-guide.js +558 -558
  357. package/pro/squads/squad-creator-pro/scripts/lib/config-loader.js +151 -151
  358. package/pro/squads/squad-creator-pro/scripts/model-tier-validator.cjs +369 -369
  359. package/pro/squads/squad-creator-pro/scripts/model-usage-logger.cjs +245 -245
  360. package/pro/squads/squad-creator-pro/scripts/modernization-score.sh +308 -308
  361. package/pro/squads/squad-creator-pro/scripts/scaffold-squad.cjs +281 -281
  362. package/pro/squads/squad-creator-pro/scripts/security_scanner.py +378 -378
  363. package/pro/squads/squad-creator-pro/scripts/squad-context-loader.cjs +205 -205
  364. package/pro/squads/squad-creator-pro/scripts/squad-state-manager.cjs +451 -451
  365. package/pro/squads/squad-creator-pro/scripts/squad-workflow-runner.cjs +471 -471
  366. package/pro/squads/squad-creator-pro/scripts/squad_utils.py +261 -261
  367. package/pro/squads/squad-creator-pro/scripts/tests/run_bash_tests.sh +29 -29
  368. package/pro/squads/squad-creator-pro/scripts/tests/test_assess_sources.sh +216 -216
  369. package/pro/squads/squad-creator-pro/scripts/tests/test_clone_review.sh +239 -239
  370. package/pro/squads/squad-creator-pro/scripts/tests/test_coherence_validator.py +212 -212
  371. package/pro/squads/squad-creator-pro/scripts/tests/test_fidelity_score.sh +298 -298
  372. package/pro/squads/squad-creator-pro/scripts/tests/test_modernization_score.sh +211 -211
  373. package/pro/squads/squad-creator-pro/scripts/tests/test_security_scanner.py +354 -354
  374. package/pro/squads/squad-creator-pro/scripts/tests/test_validate_clone.sh +252 -252
  375. package/pro/squads/squad-creator-pro/squad.yaml +36 -36
  376. package/pro/squads/squad-creator-pro/tasks/an-compare-outputs.md +354 -354
  377. package/pro/squads/squad-creator-pro/tasks/create-squad.md +933 -933
  378. package/pro/squads/squad-creator-pro/tasks/detect-squad-context.md +81 -81
  379. package/pro/squads/squad-creator-pro/tasks/lookup-model.md +78 -78
  380. package/pro/squads/squad-creator-pro/tasks/next-squad.md +487 -487
  381. package/pro/squads/squad-creator-pro/tasks/optimize-workflow.md +851 -851
  382. package/pro/squads/squad-creator-pro/tasks/parallel-discovery.md +58 -58
  383. package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment-wf-clone-mind.yaml +256 -256
  384. package/pro/squads/squad-creator-pro/tasks/qualify-task.md +265 -265
  385. package/pro/squads/squad-creator-pro/tasks/reexecute-squad-phase.md +64 -64
  386. package/pro/squads/squad-creator-pro/tasks/smoke-test-model-routing.md +167 -167
  387. package/pro/squads/squad-creator-pro/tasks/squad-overview.md +683 -683
  388. package/pro/squads/squad-creator-pro/tasks/validate-final-artifacts.md +80 -80
  389. package/pro/squads/squad-creator-pro/templates/orchestrator-tmpl.md +74 -74
  390. package/pro/squads/squad-creator-pro/test-cases/BATCH-PROGRESS.md +268 -268
  391. package/pro/squads/squad-creator-pro/test-cases/QUALIFICATION-DASHBOARD.yaml +13 -13
  392. package/pro/squads/squad-creator-pro/test-cases/_template.yaml +147 -147
  393. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT-SUMMARY.md +275 -275
  394. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT_SUMMARY.md +140 -140
  395. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/CHECKPOINT_MATRIX.md +202 -202
  396. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION-REPORT.md +413 -413
  397. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION_NOTES.md +358 -358
  398. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README-v2.2.2.md +299 -299
  399. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README.md +320 -320
  400. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/TEST-REPORT-v2.1.md +351 -351
  401. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/VERIFICATION-CHECKLIST.txt +247 -247
  402. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/formal-qualification-report.yaml +389 -389
  403. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-output.yaml +366 -366
  404. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.1-output.yaml +452 -452
  405. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml +281 -281
  406. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.2-output.yaml +332 -332
  407. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml +517 -517
  408. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/qualification-report.yaml +213 -213
  409. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/test-case.yaml +69 -69
  410. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/haiku-round-1.yaml +213 -213
  411. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/opus-baseline.yaml +566 -566
  412. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/qualification-report.yaml +82 -82
  413. package/pro/squads/squad-creator-pro/test-cases/an-design-clone/test-case.yaml +102 -102
  414. package/pro/squads/squad-creator-pro/test-cases/an-extract-dna/test-case.yaml +105 -105
  415. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/haiku-round-1.yaml +262 -262
  416. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/opus-baseline.yaml +266 -266
  417. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/qualification-report.yaml +94 -94
  418. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/haiku-round-1.yaml +282 -282
  419. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/opus-baseline.yaml +470 -470
  420. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/qualification-report.yaml +106 -106
  421. package/pro/squads/squad-creator-pro/test-cases/collect-sources/test-case.yaml +105 -105
  422. package/pro/squads/squad-creator-pro/test-cases/create-task/test-case.yaml +104 -104
  423. package/pro/squads/squad-creator-pro/test-cases/cross-provider/DASHBOARD.yaml +11 -11
  424. package/pro/squads/squad-creator-pro/test-cases/pv-audit/test-case.yaml +106 -106
  425. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/haiku-output.yaml +209 -209
  426. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/opus-baseline.yaml +96 -96
  427. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/sonnet-output.yaml +30 -30
  428. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/test-case.yaml +129 -129
  429. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/comparison-round-1.yaml +242 -242
  430. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/haiku-round-1.yaml +393 -393
  431. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/opus-baseline.yaml +488 -488
  432. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/qualification-report.yaml +74 -74
  433. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/haiku-round-1.yaml +292 -292
  434. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/opus-baseline.yaml +603 -603
  435. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/qualification-report.yaml +97 -97
  436. package/pro/squads/squad-creator-pro/test-cases/smoke-test-model-routing/test-case.yaml +100 -100
  437. package/pro/squads/squad-creator-pro/test-cases/upgrade-squad/test-case.yaml +106 -106
  438. package/pro/squads/squad-creator-pro/test-cases/validate-squad/comparison-round-1.yaml +223 -223
  439. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1-MINE.yaml +36 -36
  440. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1.yaml +193 -193
  441. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-2.yaml +303 -303
  442. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-3-v4-task.yaml +149 -149
  443. package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-baseline.yaml +529 -529
  444. package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-round-3-v4-task.yaml +132 -132
  445. package/pro/squads/squad-creator-pro/test-cases/validate-squad/qualification-report.yaml +104 -104
  446. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output-v2-calibrated.yaml +200 -200
  447. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output.yaml +183 -183
  448. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/opus-baseline.yaml +112 -112
  449. package/pro/squads/squad-creator-pro/workflows/create-squad.yaml +348 -348
  450. package/pro/squads/squad-creator-pro/workflows/modules/module-discovery.yaml +16 -16
  451. package/pro/squads/squad-creator-pro/workflows/modules/module-integration.yaml +16 -16
  452. package/pro/squads/squad-creator-pro/workflows/modules/module-quality-gates.yaml +15 -15
  453. package/pro/squads/squad-creator-pro/workflows/wf-brownfield-upgrade-squad.yaml +46 -46
  454. package/pro/squads/squad-creator-pro/workflows/wf-context-aware-create-squad.yaml +47 -47
  455. package/pro/squads/squad-creator-pro/workflows/wf-create-squad.yaml +1619 -1619
  456. package/pro/squads/squad-creator-pro/workflows/wf-cross-provider-qualification.yaml +711 -711
  457. package/pro/squads/squad-creator-pro/workflows/wf-model-tier-qualification.yaml +800 -800
  458. package/pro/squads/squad-creator-pro/workflows/wf-optimize-squad.yaml +684 -684
  459. package/scripts/check-markdown-links.py +352 -352
  460. package/scripts/dashboard-parallel-dev.sh +0 -0
  461. package/scripts/dashboard-parallel-phase3.sh +0 -0
  462. package/scripts/dashboard-parallel-phase4.sh +0 -0
  463. package/scripts/install-monitor-hooks.sh +0 -0
  464. package/.claude/hooks/code-intel-pretool.cjs +0 -107
  465. package/docs/guides/aios-workflows/README.md +0 -247
  466. package/docs/guides/aios-workflows/bob-orchestrator-workflow.md +0 -1536
  467. package/scripts/glue/README.md +0 -355
  468. package/scripts/glue/compose-agent-prompt.cjs +0 -362
@@ -1,693 +1,693 @@
1
- # ============================================================================
2
- # Squad Creator Model Routing Configuration
3
- # ============================================================================
4
- # Self-contained config for task-to-model routing.
5
- # Squad Chief consults this before executing tasks to optimize token costs.
6
- #
7
- # PHILOSOPHY: "Use the cheapest model that maintains quality"
8
- # - Haiku: Deterministic tasks (validation, scoring, admin)
9
- # - Sonnet: Moderate analysis (documentation, templates)
10
- # - Opus: Complex reasoning (DNA extraction, agent creation)
11
- #
12
- # Based on empirical analysis: docs/enhance/squad_creator_token_economy/
13
- # Expected savings: 60-70% of token consumption (validated)
14
- # ============================================================================
15
-
16
- version: "2.4.0"
17
- updated: "2026-02-13"
18
-
19
- # ============================================================================
20
- # ROUTING TIERS
21
- # ============================================================================
22
-
23
- tiers:
24
- haiku:
25
- description: "Fast, cheap. For deterministic tasks with clear patterns."
26
- model_id: "haiku" # Maps to Task tool model parameter
27
- cost_per_mtok:
28
- input: 1.00
29
- output: 5.00
30
- best_for:
31
- - "Checklist validation"
32
- - "Formula-based scoring"
33
- - "File operations"
34
- - "Registry updates"
35
- - "Pattern matching"
36
-
37
- sonnet:
38
- description: "Balanced. For moderate analysis and generation."
39
- model_id: "sonnet"
40
- cost_per_mtok:
41
- input: 3.00
42
- output: 15.00
43
- best_for:
44
- - "Documentation generation"
45
- - "Template creation"
46
- - "Source collection"
47
- - "Workflow design"
48
-
49
- opus:
50
- description: "Most capable. For complex reasoning and synthesis."
51
- model_id: "opus"
52
- cost_per_mtok:
53
- input: 5.00
54
- output: 25.00
55
- best_for:
56
- - "DNA extraction"
57
- - "Agent creation"
58
- - "Deep research"
59
- - "Creative synthesis"
60
- - "Multi-source analysis"
61
-
62
- # ============================================================================
63
- # EXTERNAL PROVIDERS (v2.0 - Cross-Provider Support)
64
- # ============================================================================
65
- # External models via OpenRouter that can substitute for Opus for cost savings.
66
- # These require LLM Router or direct API calls (not Task tool).
67
-
68
- external_providers:
69
- glm5:
70
- display_name: "GLM-5"
71
- provider: "openrouter"
72
- model_id: "z-ai/glm-5"
73
- cost_per_mtok:
74
- input: 0.80
75
- output: 3.20
76
- context_window: 200000
77
- qualified_date: "2026-02-13"
78
- validation_report: "test-cases/cross-provider/extract-voice-dna/glm5/qualification-report.yaml"
79
- quality_vs_opus: "85-98% (task/runner dependent)"
80
- latency_vs_opus: "25x faster"
81
- savings_vs_opus: "97.7%"
82
- pt_br_quality: "9/10"
83
- privacy_risk: "moderate" # Singapore entity, China parent
84
- best_for:
85
- - "Voice DNA extraction (production-ready with v1.4.0 task + v2.0 runner)"
86
- - "Batch processing"
87
- - "All DNA extraction tasks"
88
- not_for:
89
- - "Tasks using runner v1 (quality drops to 85%)"
90
- notes: |
91
- Empirically tested 2026-02-12, quality upgraded 2026-02-13.
92
- Record-low hallucination rate.
93
- MIT license enables self-hosting.
94
- CRITICAL: Quality depends on runner passing FULL task content.
95
- Runner v2.0 required for 95%+ quality.
96
-
97
- kimi:
98
- display_name: "Kimi K2.5"
99
- provider: "openrouter"
100
- model_id: "moonshotai/kimi-k2.5"
101
- cost_per_mtok:
102
- input: 0.50
103
- output: 2.80
104
- context_window: 256000
105
- qualified_date: null # Not yet tested
106
- validation_report: "infrastructure/services/llm-router/docs/model-discovery/scans/2026-02-08/validation-kimi-k2-5.md"
107
- verdict: "MONITOR"
108
- privacy_risk: "high" # China, trains on prompts
109
- latency_warning: "HIGH (15-200s per request)"
110
- notes: |
111
- Validation report exists but not empirically tested on squad-creator tasks.
112
- Agent Swarm capability may excel on research tasks.
113
- High latency is a concern.
114
-
115
- # ============================================================================
116
- # TASK ROUTING MAP
117
- # ============================================================================
118
- # Format: task_file -> tier
119
- # Squad Chief looks up task here before spawning agent
120
- # ============================================================================
121
-
122
- tasks:
123
- # --------------------------------------------------------------------------
124
- # HAIKU TIER - Immediate candidates (validated)
125
- # --------------------------------------------------------------------------
126
- # These tasks are deterministic and can safely use Haiku
127
-
128
- ## Validation Tasks
129
- qa-after-creation.md:
130
- tier: haiku
131
- confidence: high
132
- reason: "Checklist validation, gatekeeper task (pass/fail)"
133
- validated: true
134
- test_date: "2026-02-11"
135
- test_result: "QUALIFIED (Opus 8.32 APPROVED, Haiku 9.9 APPROVED - same decision)"
136
- caveat: "Haiku score inflation +19%, but pass/fail matches"
137
-
138
- validate-squad.md:
139
- tier: haiku # QUALIFIED after re-test with expert_override fix
140
- confidence: high
141
- reason: "91% voice_dna signal triggers expert override"
142
- validated: true
143
- test_date: "2026-02-11"
144
- test_result: "HAIKU QUALIFIED (expert_override 91% dominant signal)"
145
- fix_applied: "Already had dominant signals in v2.0"
146
-
147
- validate-extraction.md:
148
- tier: haiku
149
- confidence: high
150
- reason: "7-item checklist validation, threshold checking"
151
- validated: false
152
-
153
- ## Scoring Tasks
154
- pv-axioma-assessment.md:
155
- tier: haiku
156
- confidence: high
157
- reason: "12-dimension scoring with scoring calibration"
158
- validated: true
159
- test_date: "2026-02-11"
160
- test_result: "QUALIFIED (Opus 7.85, Haiku 7.77 = 95.5% quality)"
161
- note: "Added Scoring Calibration section in v1.1.0"
162
-
163
- pv-modernization-score.md:
164
- tier: script # UPGRADED - 100% deterministic scoring
165
- confidence: high
166
- reason: "Binary pass/fail checkpoints, no interpretation needed"
167
- validated: true
168
- test_date: "2026-02-11"
169
- test_result: "SCRIPT QUALIFIED (100% deterministic, 0 tokens)"
170
- note: "Converted to script-first architecture"
171
-
172
- an-fidelity-score.md:
173
- tier: script # UPGRADED from haiku - can be 100% deterministic
174
- confidence: high
175
- reason: "8-layer × 5 binary checkpoints - fully scriptable"
176
- validated: true
177
- test_date: "2026-02-11"
178
- test_result: "SCRIPT ELIGIBLE (0 tokens, <1s, 100% deterministic)"
179
- script_path: "scripts/fidelity-score.sh"
180
- note: "95% of task can be bash script. LLM only for gap recommendations."
181
-
182
- an-clone-review.md:
183
- tier: haiku # QUALIFIED v2.2.0 after scope fix
184
- confidence: high
185
- reason: "SCOPE DEFINITION added - explicit wrapper + delegated scope"
186
- validated: true
187
- test_date: "2026-02-11"
188
- test_result: "HAIKU QUALIFIED v2.2.0 (Trinity 93.3% SOLID - same as Opus)"
189
- fix_applied: "v2.2.0 SCOPE DEFINITION: Review wrapper AND referenced persona files"
190
- script_path: "scripts/clone-review.sh"
191
- note: "Script handles 90% deterministic checks. Scope fix enabled Haiku for final verdict."
192
-
193
- an-diagnose-clone.md:
194
- tier: opus # CONFIRMED after formal test
195
- confidence: high
196
- reason: "Requires accurate file content analysis - Haiku simulates instead of reads"
197
- validated: true
198
- test_date: "2026-02-11"
199
- test_result: "OPUS REQUIRED (Haiku 30% vs Opus 85% - wrong file analysis)"
200
- fix_attempted: "v2.0.0 with CHECKPOINT CLARIFICATIONS"
201
- fix_result: "FAILED - Haiku simulated grep counts incorrectly"
202
- note: "Task value is in nuanced LLM analysis, not scriptable"
203
-
204
- an-validate-clone.md:
205
- tier: haiku # QUALIFIED v2.2.0 after strict rules fix
206
- confidence: high
207
- reason: "CHECKPOINT CLARIFICATIONS added - strict rules, no inference"
208
- validated: true
209
- test_date: "2026-02-11"
210
- test_result: "HAIKU QUALIFIED v2.2.0 (90% AUTH with strict rules)"
211
- fix_applied: "v2.2.0 CHECKPOINT CLARIFICATIONS: Explicit SE/ENTÃO, no inference allowed"
212
- note: "Strict scoring rules eliminated Haiku generous bias."
213
-
214
- an-assess-sources.md:
215
- tier: haiku # CHANGED back to haiku after v2.2.1 iterative refinement
216
- confidence: high
217
- reason: "Binary Checkpoints + Scope Definition + No Override Rule = 100% tier match"
218
- validated: true
219
- test_date: "2026-02-11"
220
- test_result: "HAIKU QUALIFIED v2.2.1 (Opus 3 CJ, Haiku 3 CJ - 100% tier match)"
221
- iterations_to_qualify: 3
222
- fixes_applied:
223
- - "v2.0: Binary Checkpoints (25% match)"
224
- - "v2.1: Scope Definition (75% match)"
225
- - "v2.2.1: No Override Rule (100% match)"
226
- note: "Demonstrates iterative task refinement pattern for Haiku qualification."
227
-
228
- ## Admin Tasks
229
- refresh-registry.md:
230
- tier: haiku
231
- confidence: high
232
- reason: "Script-based extraction, LLM just formats output"
233
-
234
- squad-analytics.md:
235
- tier: haiku
236
- confidence: high
237
- reason: "Count files, compute metrics - deterministic"
238
-
239
- migrate-workflows-to-yaml.md:
240
- tier: haiku
241
- confidence: high
242
- reason: "Format conversion with clear rules"
243
-
244
- install-commands.md:
245
- tier: haiku
246
- confidence: high
247
- reason: "Script execution, deterministic file operations"
248
-
249
- sync-ide-command.md:
250
- tier: haiku
251
- confidence: high
252
- reason: "File sync operation, no reasoning needed"
253
-
254
- # --------------------------------------------------------------------------
255
- # SONNET TIER - Test candidates (moderate confidence)
256
- # --------------------------------------------------------------------------
257
- # These tasks might work with Haiku but need validation
258
-
259
- ## Documentation Tasks
260
- create-documentation.md:
261
- tier: sonnet
262
- confidence: medium
263
- reason: "Template-based but needs some coherence"
264
- test_with_haiku: true
265
-
266
- create-template.md:
267
- tier: sonnet
268
- confidence: medium
269
- reason: "Structure design with moderate creativity"
270
- test_with_haiku: true
271
-
272
- ## Source Tasks
273
- collect-sources.md:
274
- tier: sonnet
275
- confidence: medium
276
- reason: "Web search + validation, some judgment needed"
277
- test_with_haiku: true
278
-
279
- auto-acquire-sources.md:
280
- tier: sonnet
281
- confidence: medium
282
- reason: "Tool orchestration, content extraction"
283
- test_with_haiku: true
284
-
285
- ## Workflow/Task Creation
286
- create-workflow.md:
287
- tier: sonnet
288
- confidence: medium
289
- reason: "Multi-phase design, needs logical coherence"
290
-
291
- create-task.md:
292
- tier: sonnet
293
- confidence: medium
294
- reason: "Task Anatomy compliance, some complexity"
295
-
296
- create-pipeline.md:
297
- tier: sonnet
298
- confidence: medium
299
- reason: "Pipeline design with dependencies"
300
-
301
- ## Analysis Tasks
302
- pv-audit.md:
303
- tier: sonnet
304
- confidence: medium
305
- reason: "Process audit requires some reasoning"
306
-
307
- find-0.8.md:
308
- tier: sonnet
309
- confidence: medium
310
- reason: "Pareto analysis needs judgment"
311
-
312
- deconstruct.md:
313
- tier: sonnet
314
- confidence: medium
315
- reason: "Structural analysis, moderate depth"
316
-
317
- optimize.md:
318
- tier: sonnet
319
- confidence: medium
320
- reason: "Q1-Q6 decision tree evaluation"
321
-
322
- update-mind.md:
323
- tier: sonnet
324
- confidence: medium
325
- reason: "Brownfield updates need context awareness"
326
-
327
- upgrade-squad.md:
328
- tier: sonnet
329
- confidence: medium
330
- reason: "Squad upgrade analysis"
331
-
332
- squad-fusion.md:
333
- tier: sonnet
334
- confidence: medium
335
- reason: "Merge logic, moderate complexity"
336
-
337
- next-squad.md:
338
- tier: sonnet
339
- confidence: high
340
- reason: "Registry analysis + multi-dimensional scoring + synthesis. Structured data in, ranked recommendation out."
341
-
342
- # --------------------------------------------------------------------------
343
- # OPUS TIER - Keep on Opus (non-negotiable)
344
- # --------------------------------------------------------------------------
345
- # These tasks require deep reasoning and cannot be downgraded
346
-
347
- ## DNA Extraction (Core Value)
348
- extract-voice-dna.md:
349
- tier: opus
350
- confidence: high
351
- reason: "Multi-layer pattern recognition, nuance detection"
352
- downgrade_risk: "Quality degradation in voice capture"
353
-
354
- extract-thinking-dna.md:
355
- tier: opus
356
- confidence: high
357
- reason: "Framework synthesis, decision architecture mapping"
358
- downgrade_risk: "Missing mental models and heuristics"
359
-
360
- extract-knowledge.md:
361
- tier: opus
362
- confidence: high
363
- reason: "Anti-invention gates need sophisticated reasoning"
364
- downgrade_risk: "Hallucinated frameworks"
365
-
366
- extract-sop.md:
367
- tier: opus
368
- confidence: high
369
- reason: "Process extraction from unstructured sources"
370
- downgrade_risk: "Incomplete procedures"
371
-
372
- extract-implicit.md:
373
- tier: opus
374
- confidence: high
375
- reason: "Inference of unstated knowledge"
376
- downgrade_risk: "Missing implicit patterns"
377
-
378
- ## Agent Creation
379
- create-agent.md:
380
- tier: opus
381
- confidence: high
382
- reason: "Creative persona synthesis with voice consistency"
383
- downgrade_risk: "Generic agent without depth"
384
-
385
- an-design-clone.md:
386
- tier: opus
387
- confidence: high
388
- reason: "Clone architecture requires holistic design"
389
- downgrade_risk: "Incomplete clone structure"
390
-
391
- an-extract-dna.md:
392
- tier: opus
393
- confidence: high
394
- reason: "Specialized DNA extraction"
395
- downgrade_risk: "Missing DNA layers"
396
-
397
- an-extract-framework.md:
398
- tier: opus
399
- confidence: high
400
- reason: "Framework identification from sources"
401
- downgrade_risk: "Shallow framework extraction"
402
-
403
- ## Research Tasks
404
- deep-research-pre-agent.md:
405
- tier: opus
406
- confidence: high
407
- reason: "Web research synthesis, source triangulation"
408
- downgrade_risk: "Superficial research"
409
-
410
- discover-tools.md:
411
- tier: opus
412
- confidence: high
413
- reason: "Multi-source tool discovery, scoring"
414
- downgrade_risk: "Missing relevant tools"
415
-
416
- ## Squad Creation
417
- create-squad.md:
418
- tier: opus
419
- confidence: high
420
- reason: "Full squad orchestration, multi-phase"
421
- downgrade_risk: "Incomplete squad structure"
422
-
423
- # ============================================================================
424
- # FALLBACK CONFIGURATION
425
- # ============================================================================
426
- # If a model fails, try the next tier up
427
-
428
- fallback:
429
- haiku:
430
- on_failure: sonnet
431
- on_quality_below: 0.85
432
-
433
- sonnet:
434
- on_failure: opus
435
- on_quality_below: 0.80
436
-
437
- # ============================================================================
438
- # USAGE BY SQUAD CHIEF
439
- # ============================================================================
440
- #
441
- # Before executing a task, Squad Chief should:
442
- #
443
- # 1. Look up task in this config:
444
- # task_config = model_routing.tasks[task_name]
445
- #
446
- # 2. Get the tier:
447
- # tier = task_config.tier # haiku, sonnet, opus, or script
448
- #
449
- # 3. Spawn agent with model:
450
- # Task(
451
- # subagent_type: "appropriate-agent",
452
- # model: tier, # "haiku", "sonnet", or "opus"
453
- # prompt: "..."
454
- # )
455
- #
456
- # 4. If quality check fails, use fallback:
457
- # if quality < fallback[tier].on_quality_below:
458
- # retry with fallback[tier].on_failure
459
- #
460
- # ============================================================================
461
-
462
- # ============================================================================
463
- # METRICS TRACKING
464
- # ============================================================================
465
- # Track these metrics to validate routing decisions
466
-
467
- metrics:
468
- track:
469
- - task_name
470
- - model_used
471
- - tokens_in
472
- - tokens_out
473
- - latency_ms
474
- - quality_score # If available
475
- - fallback_triggered
476
-
477
- report_location: "outputs/metrics/model-routing-{date}.yaml"
478
-
479
- # ============================================================================
480
- # EXTERNAL ALTERNATIVES (Opus Tasks with Qualified External Options)
481
- # ============================================================================
482
- # Tasks that can use external models as cost-effective alternatives to Opus.
483
- # Squad Chief can route to these when cost optimization is prioritized.
484
-
485
- external_alternatives:
486
- extract-voice-dna.md:
487
- primary_tier: opus
488
- external_option:
489
- model: glm5
490
- qualified: true
491
- quality_vs_opus: "95-98%" # UPGRADED 2026-02-13 after task v1.4.0 + runner v2.0
492
- savings: "97.7%"
493
- pt_br_qualified: true
494
- tested_date: "2026-02-13"
495
- runner_version: "v2.0" # Requires runner v2.0 (full task content)
496
- task_version: "v1.4.0" # Requires task v1.4.0 (explicit quality requirements)
497
- use_when:
498
- - "Batch processing multiple minds"
499
- - "Cost-sensitive workflows"
500
- - "Production clones (with v1.4.0 task)"
501
- avoid_when:
502
- - "Runner v1 still in use"
503
- evidence: "test-cases/cross-provider/extract-voice-dna/glm5/"
504
- notes: |
505
- Quality improved from 85% to 95-98% after:
506
- 1. Task v1.4.0: Added explicit source requirements, example_usage, example_wrong/correct
507
- 2. Runner v2.0: Passes FULL task content (including QUALITY CHECK section)
508
- Key insight: Model follows instructions when they actually reach the prompt.
509
-
510
- extract-knowledge.md:
511
- primary_tier: opus
512
- external_option:
513
- model: glm5
514
- qualified: true
515
- quality_vs_opus: "95%"
516
- savings: "96.8%"
517
- tested_date: "2026-02-12"
518
- use_when:
519
- - "Zero-invention extraction"
520
- - "Batch processing sources"
521
- - "Cost-sensitive workflows"
522
- avoid_when:
523
- - "Gap analysis required"
524
- - "Verbose examples needed"
525
- evidence: "test-cases/cross-provider/extract-knowledge/glm5/"
526
- notes: "GLM-5 confirms the record-low hallucination claim. Zero invented content."
527
-
528
- extract-thinking-dna.md:
529
- primary_tier: opus
530
- external_option:
531
- model: glm5
532
- qualified: true
533
- quality_vs_opus: "100%"
534
- savings: "99%"
535
- tested_date: "2026-02-12"
536
- use_when:
537
- - "Framework extraction"
538
- - "Heuristic mapping"
539
- - "Decision pattern extraction"
540
- - "Batch processing minds"
541
- avoid_when:
542
- - "Need attention_triggers detail"
543
- evidence: "outputs/llm-tests/extract-thinking-dna/glm5/"
544
- notes: "GLM-5 matched Opus exactly. 19s vs 66s latency. $0.007 vs $0.50 cost."
545
-
546
- # Former candidates for future testing (now tested and qualified; see tested_date)
547
-
548
- deep-research-pre-agent.md:
549
- primary_tier: opus
550
- external_option:
551
- model: glm5
552
- qualified: true
553
- quality_vs_opus: "95%"
554
- savings: "97.8%"
555
- tested_date: "2026-02-13"
556
- use_when:
557
- - "Research prompt generation"
558
- - "7-component meta-framework"
559
- - "Cost-sensitive research pipelines"
560
- avoid_when:
561
- - "Need GOLD/SILVER/BRONZE confidence naming"
562
- evidence: "outputs/llm-tests/deep-research-pre-agent/glm5/"
563
- notes: "GLM-5 produced identical 7-component structure. 45.5s latency. $0.0098 cost."
564
-
565
- create-agent.md:
566
- primary_tier: opus
567
- external_option:
568
- model: glm5
569
- qualified: true
570
- quality_vs_opus: "98%"
571
- savings: "99.1%"
572
- tested_date: "2026-02-13"
573
- runner_version: "v2.0"
574
- use_when:
575
- - "Agent creation from pre-extracted DNA"
576
- - "Batch agent generation"
577
- - "Production agents"
578
- avoid_when:
579
- - "Runner v1 still in use"
580
- evidence: "outputs/llm-tests/create-agent/glm5/"
581
- notes: |
582
- GLM-5 QUALIFIED after runner v2.0 (full task content).
583
- Output: 718 lines, all sections complete.
584
- Key improvements: 6 heuristics (was 3), 4 objection algorithms,
585
- SCOPE with boundary_conditions, veto_conditions, handoff_triggers.
586
- $0.02 vs ~$2.50 Opus = 99.1% savings.
587
-
588
- # ============================================================================
589
- # CHANGELOG
590
- # ============================================================================
591
-
592
- changelog:
593
- - version: "2.4.0"
594
- date: "2026-02-13"
595
- changes:
596
- - "GLM-5 QUALIFIED for create-agent (98% quality, 99.1% savings)"
597
- - "Output: 718 lines with ALL sections complete"
598
- - "Key wins: 6 heuristics, 4 objection algorithms, SCOPE with veto conditions"
599
- - "$0.02 vs ~$2.50 Opus"
600
- - "5 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna, deep-research-pre-agent, create-agent"
601
-
602
- - version: "2.3.0"
603
- date: "2026-02-13"
604
- changes:
605
- - "QUALITY IMPROVEMENT: extract-voice-dna GLM-5 quality upgraded 85% → 95-98%"
606
- - "Task v1.4.0: Added explicit quality requirements (source:, example_usage:, example_wrong/correct)"
607
- - "Runner v2.0: Now passes FULL task content (was passing only ~10% of task)"
608
- - "Key insight: QUALITY CHECK section was never reaching the model - fixed"
609
- - "Trade-off: +$0.01 cost, +174s latency for +10-13% quality"
610
- - "GLM-5 now production-ready for voice DNA extraction"
611
-
612
- - version: "2.2.0"
613
- date: "2026-02-13"
614
- changes:
615
- - "GLM-5 QUALIFIED for deep-research-pre-agent (95% quality, 97.8% savings)"
616
- - "GLM-5 produced identical 7-component meta-framework structure"
617
- - "45.5s latency, $0.0098 cost"
618
- - "4 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna, deep-research-pre-agent"
619
-
620
- - version: "2.1.0"
621
- date: "2026-02-12"
622
- changes:
623
- - "GLM-5 QUALIFIED for extract-thinking-dna (100% quality, 99% savings)"
624
- - "GLM-5 matched Opus exactly on all categories"
625
- - "19s latency vs 66s Opus (3.5x faster)"
626
- - "$0.007 cost vs ~$0.50 Opus"
627
- - "3 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna"
628
-
629
- - version: "2.0.0"
630
- date: "2026-02-12"
631
- changes:
632
- - "MAJOR: Added external_providers section (GLM-5, Kimi K2.5)"
633
- - "MAJOR: Added external_alternatives for Opus tasks with cheaper options"
634
- - "GLM-5 QUALIFIED for extract-voice-dna (85% quality, 97.7% savings)"
635
- - "GLM-5 tested: 1.9s latency (25x faster than Opus)"
636
- - "GLM-5 PT-BR quality: 9/10 (QUALIFIED)"
637
- - "Created wf-cross-provider-qualification.yaml workflow"
638
- - "Created validation-glm-5.md report"
639
- - "4 tasks marked as candidates for GLM-5 testing"
640
-
641
- - version: "1.3.0"
642
- date: "2026-02-11"
643
- changes:
644
- - "FORMAL TEST: an-diagnose-clone tested Opus vs Haiku"
645
- - "an-diagnose-clone: OPUS REQUIRED (Haiku 30% vs Opus 85%)"
646
- - "Fix v2.0.0 attempted with CHECKPOINT CLARIFICATIONS - FAILED"
647
- - "Root cause: Haiku simulates file reads instead of accurate analysis"
648
- - "Decision: Keep Opus - LLM analysis value > script automation"
649
- - "Final stats: 12/14 Haiku/Script (86%), 1/14 Opus (7%), 1/14 deprecated"
650
-
651
- - version: "1.2.0"
652
- date: "2026-02-11"
653
- changes:
654
- - "SYNC WITH BATCH-PROGRESS: 4 tasks re-qualified after fixes"
655
- - "validate-squad: HAIKU QUALIFIED (expert_override 91% dominant signal)"
656
- - "pv-modernization-score: SCRIPT QUALIFIED (100% deterministic)"
657
- - "an-clone-review: HAIKU QUALIFIED v2.2.0 (SCOPE DEFINITION fix)"
658
- - "an-validate-clone: HAIKU QUALIFIED v2.2.0 (CHECKPOINT CLARIFICATIONS fix)"
659
- - "Total qualified: 12/14 (86%) - matches BATCH-PROGRESS.md"
660
- - "Estimated savings: 60-70% token cost reduction"
661
-
662
- - version: "1.1.0"
663
- date: "2026-02-11"
664
- changes:
665
- - "EMPIRICAL VALIDATION: 4 tasks tested with Opus vs Haiku"
666
- - "pv-axioma-assessment: HAIKU QUALIFIED (95.5% quality)"
667
- - "qa-after-creation: HAIKU QUALIFIED (same pass/fail decision)"
668
- - "pv-modernization-score: MOVED TO OPUS (wrong judgment)"
669
- - "validate-squad: MOVED TO OPUS (wrong type detection)"
670
- - "an-fidelity-score: Task updated to v2.0 Haiku-compatible (pending validation)"
671
- - "New haiku count: 13 validated candidates"
672
- - "New opus count: 14 (includes 2 moved from haiku)"
673
-
674
- - version: "1.0.2"
675
- date: "2026-02-11"
676
- changes:
677
- - "Corrected task counts: 15 haiku + 14 sonnet + 12 opus = 41 total"
678
-
679
- - version: "1.0.1"
680
- date: "2026-02-11"
681
- changes:
682
- - "Added install-commands.md (haiku)"
683
- - "Added sync-ide-command.md (haiku)"
684
- - "Total haiku tasks: 15 (was 13)"
685
-
686
- - version: "1.0.0"
687
- date: "2026-02-11"
688
- changes:
689
- - "Initial release based on enhance-workflow discovery"
690
- - "13 tasks classified as Haiku-eligible"
691
- - "14 tasks classified as Sonnet (test candidates)"
692
- - "12 tasks must stay on Opus"
693
- - "Expected savings: 25-40%"
1
+ # ============================================================================
2
+ # Squad Creator Model Routing Configuration
3
+ # ============================================================================
4
+ # Self-contained config for task-to-model routing.
5
+ # Squad Chief consults this before executing tasks to optimize token costs.
6
+ #
7
+ # PHILOSOPHY: "Use the cheapest model that maintains quality"
8
+ # - Haiku: Deterministic tasks (validation, scoring, admin)
9
+ # - Sonnet: Moderate analysis (documentation, templates)
10
+ # - Opus: Complex reasoning (DNA extraction, agent creation)
11
+ #
12
+ # Based on empirical analysis: docs/enhance/squad_creator_token_economy/
13
+ # Expected savings: 60-70% of token consumption (validated)
14
+ # ============================================================================
15
+
16
+ version: "2.4.0"
17
+ updated: "2026-02-13"
18
+
19
+ # ============================================================================
20
+ # ROUTING TIERS
21
+ # ============================================================================
22
+
23
+ tiers:
24
+ haiku:
25
+ description: "Fast, cheap. For deterministic tasks with clear patterns."
26
+ model_id: "haiku" # Maps to Task tool model parameter
27
+ cost_per_mtok:
28
+ input: 1.00
29
+ output: 5.00
30
+ best_for:
31
+ - "Checklist validation"
32
+ - "Formula-based scoring"
33
+ - "File operations"
34
+ - "Registry updates"
35
+ - "Pattern matching"
36
+
37
+ sonnet:
38
+ description: "Balanced. For moderate analysis and generation."
39
+ model_id: "sonnet"
40
+ cost_per_mtok:
41
+ input: 3.00
42
+ output: 15.00
43
+ best_for:
44
+ - "Documentation generation"
45
+ - "Template creation"
46
+ - "Source collection"
47
+ - "Workflow design"
48
+
49
+ opus:
50
+ description: "Most capable. For complex reasoning and synthesis."
51
+ model_id: "opus"
52
+ cost_per_mtok:
53
+ input: 5.00
54
+ output: 25.00
55
+ best_for:
56
+ - "DNA extraction"
57
+ - "Agent creation"
58
+ - "Deep research"
59
+ - "Creative synthesis"
60
+ - "Multi-source analysis"
61
+
62
+ # ============================================================================
63
+ # EXTERNAL PROVIDERS (v2.0 - Cross-Provider Support)
64
+ # ============================================================================
65
+ # External models via OpenRouter that can substitute Opus for cost savings.
66
+ # These require LLM Router or direct API calls (not Task tool).
67
+
68
+ external_providers:
69
+ glm5:
70
+ display_name: "GLM-5"
71
+ provider: "openrouter"
72
+ model_id: "z-ai/glm-5"
73
+ cost_per_mtok:
74
+ input: 0.80
75
+ output: 3.20
76
+ context_window: 200000
77
+ qualified_date: "2026-02-13"
78
+ validation_report: "test-cases/cross-provider/extract-voice-dna/glm5/qualification-report.yaml"
79
+ quality_vs_opus: "85-98% (task/runner dependent)"
80
+ latency_vs_opus: "25x faster"
81
+ savings_vs_opus: "97.7%"
82
+ pt_br_quality: "9/10"
83
+ privacy_risk: "moderate" # Singapore entity, China parent
84
+ best_for:
85
+ - "Voice DNA extraction (production-ready with v1.4.0 task + v2.0 runner)"
86
+ - "Batch processing"
87
+ - "All DNA extraction tasks"
88
+ not_for:
89
+ - "Tasks using runner v1 (quality drops to 85%)"
90
+ notes: |
91
+ Empirically tested 2026-02-12, quality upgraded 2026-02-13.
92
+ Record-low hallucination rate.
93
+ MIT license enables self-hosting.
94
+ CRITICAL: Quality depends on runner passing FULL task content.
95
+ Runner v2.0 required for 95%+ quality.
96
+
97
+ kimi:
98
+ display_name: "Kimi K2.5"
99
+ provider: "openrouter"
100
+ model_id: "moonshotai/kimi-k2.5"
101
+ cost_per_mtok:
102
+ input: 0.50
103
+ output: 2.80
104
+ context_window: 256000
105
+ qualified_date: null # Not yet tested
106
+ validation_report: "infrastructure/services/llm-router/docs/model-discovery/scans/2026-02-08/validation-kimi-k2-5.md"
107
+ verdict: "MONITOR"
108
+ privacy_risk: "high" # China, trains on prompts
109
+ latency_warning: "HIGH (15-200s per request)"
110
+ notes: |
111
+ Validation report exists but not empirically tested on squad-creator tasks.
112
+ Agent Swarm capability may excel on research tasks.
113
+ High latency is a concern.
114
+
115
+ # ============================================================================
116
+ # TASK ROUTING MAP
117
+ # ============================================================================
118
+ # Format: task_file -> tier
119
+ # Squad Chief looks up task here before spawning agent
120
+ # ============================================================================
121
+
122
+ tasks:
123
+ # --------------------------------------------------------------------------
124
+ # HAIKU TIER - Immediate candidates (validated)
125
+ # --------------------------------------------------------------------------
126
+ # These tasks are deterministic and can safely use Haiku
127
+
128
+ ## Validation Tasks
129
+ qa-after-creation.md:
130
+ tier: haiku
131
+ confidence: high
132
+ reason: "Checklist validation, gatekeeper task (pass/fail)"
133
+ validated: true
134
+ test_date: "2026-02-11"
135
+ test_result: "QUALIFIED (Opus 8.32 APPROVED, Haiku 9.9 APPROVED - same decision)"
136
+ caveat: "Haiku score inflation +19%, but pass/fail matches"
137
+
138
+ validate-squad.md:
139
+ tier: haiku # QUALIFIED after re-test with expert_override fix
140
+ confidence: high
141
+ reason: "91% voice_dna signal triggers expert override"
142
+ validated: true
143
+ test_date: "2026-02-11"
144
+ test_result: "HAIKU QUALIFIED (expert_override 91% dominant signal)"
145
+ fix_applied: "Already had dominant signals in v2.0"
146
+
147
+ validate-extraction.md:
148
+ tier: haiku
149
+ confidence: high
150
+ reason: "7-item checklist validation, threshold checking"
151
+ validated: false
152
+
153
+ ## Scoring Tasks
154
+ pv-axioma-assessment.md:
155
+ tier: haiku
156
+ confidence: high
157
+ reason: "12-dimension scoring with scoring calibration"
158
+ validated: true
159
+ test_date: "2026-02-11"
160
+ test_result: "QUALIFIED (Opus 7.85, Haiku 7.77 = 95.5% quality)"
161
+ note: "Added Scoring Calibration section in v1.1.0"
162
+
163
+ pv-modernization-score.md:
164
+ tier: script # UPGRADED - 100% deterministic scoring
165
+ confidence: high
166
+ reason: "Binary pass/fail checkpoints, no interpretation needed"
167
+ validated: true
168
+ test_date: "2026-02-11"
169
+ test_result: "SCRIPT QUALIFIED (100% deterministic, 0 tokens)"
170
+ note: "Converted to script-first architecture"
171
+
172
+ an-fidelity-score.md:
173
+ tier: script # UPGRADED from haiku - can be 100% deterministic
174
+ confidence: high
175
+ reason: "8-layer × 5 binary checkpoints - fully scriptable"
176
+ validated: true
177
+ test_date: "2026-02-11"
178
+ test_result: "SCRIPT ELIGIBLE (0 tokens, <1s, 100% deterministic)"
179
+ script_path: "scripts/fidelity-score.sh"
180
+ note: "95% of task can be bash script. LLM only for gap recommendations."
181
+
182
+ an-clone-review.md:
183
+ tier: haiku # QUALIFIED v2.2.0 after scope fix
184
+ confidence: high
185
+ reason: "SCOPE DEFINITION added - explicit wrapper + delegated scope"
186
+ validated: true
187
+ test_date: "2026-02-11"
188
+ test_result: "HAIKU QUALIFIED v2.2.0 (Trinity 93.3% SOLID - same as Opus)"
189
+ fix_applied: "v2.2.0 SCOPE DEFINITION: Review wrapper AND referenced persona files"
190
+ script_path: "scripts/clone-review.sh"
191
+ note: "Script handles 90% deterministic checks. Scope fix enabled Haiku for final verdict."
192
+
193
+ an-diagnose-clone.md:
194
+ tier: opus # CONFIRMED after formal test
195
+ confidence: high
196
+ reason: "Requires accurate file content analysis - Haiku simulates instead of reads"
197
+ validated: true
198
+ test_date: "2026-02-11"
199
+ test_result: "OPUS REQUIRED (Haiku 30% vs Opus 85% - wrong file analysis)"
200
+ fix_attempted: "v2.0.0 with CHECKPOINT CLARIFICATIONS"
201
+ fix_result: "FAILED - Haiku simulated grep counts incorrectly"
202
+ note: "Task value is in nuanced LLM analysis, not scriptable"
203
+
204
+ an-validate-clone.md:
205
+ tier: haiku # QUALIFIED v2.2.0 after strict rules fix
206
+ confidence: high
207
+ reason: "CHECKPOINT CLARIFICATIONS added - strict rules, no inference"
208
+ validated: true
209
+ test_date: "2026-02-11"
210
+ test_result: "HAIKU QUALIFIED v2.2.0 (90% AUTH with strict rules)"
211
+ fix_applied: "v2.2.0 CHECKPOINT CLARIFICATIONS: Explicit SE/ENTÃO, no inference allowed"
212
+ note: "Strict scoring rules eliminated Haiku generous bias."
213
+
214
+ an-assess-sources.md:
215
+ tier: haiku # CHANGED back to haiku after v2.2.1 iterative refinement
216
+ confidence: high
217
+ reason: "Binary Checkpoints + Scope Definition + No Override Rule = 100% tier match"
218
+ validated: true
219
+ test_date: "2026-02-11"
220
+ test_result: "HAIKU QUALIFIED v2.2.1 (Opus 3 CJ, Haiku 3 CJ - 100% tier match)"
221
+ iterations_to_qualify: 3
222
+ fixes_applied:
223
+ - "v2.0: Binary Checkpoints (25% match)"
224
+ - "v2.1: Scope Definition (75% match)"
225
+ - "v2.2.1: No Override Rule (100% match)"
226
+ note: "Demonstrates iterative task refinement pattern for Haiku qualification."
227
+
228
+ ## Admin Tasks
229
+ refresh-registry.md:
230
+ tier: haiku
231
+ confidence: high
232
+ reason: "Script-based extraction, LLM just formats output"
233
+
234
+ squad-analytics.md:
235
+ tier: haiku
236
+ confidence: high
237
+ reason: "Count files, compute metrics - deterministic"
238
+
239
+ migrate-workflows-to-yaml.md:
240
+ tier: haiku
241
+ confidence: high
242
+ reason: "Format conversion with clear rules"
243
+
244
+ install-commands.md:
245
+ tier: haiku
246
+ confidence: high
247
+ reason: "Script execution, deterministic file operations"
248
+
249
+ sync-ide-command.md:
250
+ tier: haiku
251
+ confidence: high
252
+ reason: "File sync operation, no reasoning needed"
253
+
254
+ # --------------------------------------------------------------------------
255
+ # SONNET TIER - Test candidates (moderate confidence)
256
+ # --------------------------------------------------------------------------
257
+ # These tasks might work with Haiku but need validation
258
+
259
+ ## Documentation Tasks
260
+ create-documentation.md:
261
+ tier: sonnet
262
+ confidence: medium
263
+ reason: "Template-based but needs some coherence"
264
+ test_with_haiku: true
265
+
266
+ create-template.md:
267
+ tier: sonnet
268
+ confidence: medium
269
+ reason: "Structure design with moderate creativity"
270
+ test_with_haiku: true
271
+
272
+ ## Source Tasks
273
+ collect-sources.md:
274
+ tier: sonnet
275
+ confidence: medium
276
+ reason: "Web search + validation, some judgment needed"
277
+ test_with_haiku: true
278
+
279
+ auto-acquire-sources.md:
280
+ tier: sonnet
281
+ confidence: medium
282
+ reason: "Tool orchestration, content extraction"
283
+ test_with_haiku: true
284
+
285
+ ## Workflow/Task Creation
286
+ create-workflow.md:
287
+ tier: sonnet
288
+ confidence: medium
289
+ reason: "Multi-phase design, needs logical coherence"
290
+
291
+ create-task.md:
292
+ tier: sonnet
293
+ confidence: medium
294
+ reason: "Task Anatomy compliance, some complexity"
295
+
296
+ create-pipeline.md:
297
+ tier: sonnet
298
+ confidence: medium
299
+ reason: "Pipeline design with dependencies"
300
+
301
+ ## Analysis Tasks
302
+ pv-audit.md:
303
+ tier: sonnet
304
+ confidence: medium
305
+ reason: "Process audit requires some reasoning"
306
+
307
+ find-0.8.md:
308
+ tier: sonnet
309
+ confidence: medium
310
+ reason: "Pareto analysis needs judgment"
311
+
312
+ deconstruct.md:
313
+ tier: sonnet
314
+ confidence: medium
315
+ reason: "Structural analysis, moderate depth"
316
+
317
+ optimize.md:
318
+ tier: sonnet
319
+ confidence: medium
320
+ reason: "Q1-Q6 decision tree evaluation"
321
+
322
+ update-mind.md:
323
+ tier: sonnet
324
+ confidence: medium
325
+ reason: "Brownfield updates need context awareness"
326
+
327
+ upgrade-squad.md:
328
+ tier: sonnet
329
+ confidence: medium
330
+ reason: "Squad upgrade analysis"
331
+
332
+ squad-fusion.md:
333
+ tier: sonnet
334
+ confidence: medium
335
+ reason: "Merge logic, moderate complexity"
336
+
337
+ next-squad.md:
338
+ tier: sonnet
339
+ confidence: high
340
+ reason: "Registry analysis + multi-dimensional scoring + synthesis. Structured data in, ranked recommendation out."
341
+
342
+ # --------------------------------------------------------------------------
343
+ # OPUS TIER - Keep on Opus (non-negotiable)
344
+ # --------------------------------------------------------------------------
345
+ # These tasks require deep reasoning and cannot be downgraded to Haiku or Sonnet (qualified external options are listed under external_alternatives)
346
+
347
+ ## DNA Extraction (Core Value)
348
+ extract-voice-dna.md:
349
+ tier: opus
350
+ confidence: high
351
+ reason: "Multi-layer pattern recognition, nuance detection"
352
+ downgrade_risk: "Quality degradation in voice capture"
353
+
354
+ extract-thinking-dna.md:
355
+ tier: opus
356
+ confidence: high
357
+ reason: "Framework synthesis, decision architecture mapping"
358
+ downgrade_risk: "Missing mental models and heuristics"
359
+
360
+ extract-knowledge.md:
361
+ tier: opus
362
+ confidence: high
363
+ reason: "Anti-invention gates need sophisticated reasoning"
364
+ downgrade_risk: "Hallucinated frameworks"
365
+
366
+ extract-sop.md:
367
+ tier: opus
368
+ confidence: high
369
+ reason: "Process extraction from unstructured sources"
370
+ downgrade_risk: "Incomplete procedures"
371
+
372
+ extract-implicit.md:
373
+ tier: opus
374
+ confidence: high
375
+ reason: "Inference of unstated knowledge"
376
+ downgrade_risk: "Missing implicit patterns"
377
+
378
+ ## Agent Creation
379
+ create-agent.md:
380
+ tier: opus
381
+ confidence: high
382
+ reason: "Creative persona synthesis with voice consistency"
383
+ downgrade_risk: "Generic agent without depth"
384
+
385
+ an-design-clone.md:
386
+ tier: opus
387
+ confidence: high
388
+ reason: "Clone architecture requires holistic design"
389
+ downgrade_risk: "Incomplete clone structure"
390
+
391
+ an-extract-dna.md:
392
+ tier: opus
393
+ confidence: high
394
+ reason: "Specialized DNA extraction"
395
+ downgrade_risk: "Missing DNA layers"
396
+
397
+ an-extract-framework.md:
398
+ tier: opus
399
+ confidence: high
400
+ reason: "Framework identification from sources"
401
+ downgrade_risk: "Shallow framework extraction"
402
+
403
+ ## Research Tasks
404
+ deep-research-pre-agent.md:
405
+ tier: opus
406
+ confidence: high
407
+ reason: "Web research synthesis, source triangulation"
408
+ downgrade_risk: "Superficial research"
409
+
410
+ discover-tools.md:
411
+ tier: opus
412
+ confidence: high
413
+ reason: "Multi-source tool discovery, scoring"
414
+ downgrade_risk: "Missing relevant tools"
415
+
416
+ ## Squad Creation
417
+ create-squad.md:
418
+ tier: opus
419
+ confidence: high
420
+ reason: "Full squad orchestration, multi-phase"
421
+ downgrade_risk: "Incomplete squad structure"
422
+
423
+ # ============================================================================
424
+ # FALLBACK CONFIGURATION
425
+ # ============================================================================
426
+ # If a model fails, try the next tier up
427
+
428
+ fallback:
429
+ haiku:
430
+ on_failure: sonnet
431
+ on_quality_below: 0.85
432
+
433
+ sonnet:
434
+ on_failure: opus
435
+ on_quality_below: 0.80
436
+
437
+ # ============================================================================
438
+ # USAGE BY SQUAD CHIEF
439
+ # ============================================================================
440
+ #
441
+ # Before executing a task, Squad Chief should:
442
+ #
443
+ # 1. Look up task in this config:
444
+ # task_config = model_routing.tasks[task_name]
445
+ #
446
+ # 2. Get the tier:
447
+ # tier = task_config.tier # haiku, sonnet, opus, or script
448
+ #
449
+ # 3. Spawn agent with model:
450
+ # Task(
451
+ # subagent_type: "appropriate-agent",
452
+ # model: tier, # "haiku", "sonnet", or "opus"
453
+ # prompt: "..."
454
+ # )
455
+ #
456
+ # 4. If quality check fails, use fallback:
457
+ # if quality < fallback[tier].on_quality_below:
458
+ # retry with fallback[tier].on_failure
459
+ #
460
+ # ============================================================================
461
+
462
+ # ============================================================================
463
+ # METRICS TRACKING
464
+ # ============================================================================
465
+ # Track these metrics to validate routing decisions
466
+
467
+ metrics:
468
+ track:
469
+ - task_name
470
+ - model_used
471
+ - tokens_in
472
+ - tokens_out
473
+ - latency_ms
474
+ - quality_score # If available
475
+ - fallback_triggered
476
+
477
+ report_location: "outputs/metrics/model-routing-{date}.yaml"
478
+
479
+ # ============================================================================
480
+ # EXTERNAL ALTERNATIVES (Opus Tasks with Qualified External Options)
481
+ # ============================================================================
482
+ # Tasks that can use external models as cost-effective alternatives to Opus.
483
+ # Squad Chief can route to these when cost optimization is prioritized.
484
+
485
+ external_alternatives:
486
+ extract-voice-dna.md:
487
+ primary_tier: opus
488
+ external_option:
489
+ model: glm5
490
+ qualified: true
491
+ quality_vs_opus: "95-98%" # UPGRADED 2026-02-13 after task v1.4.0 + runner v2.0
492
+ savings: "97.7%"
493
+ pt_br_qualified: true
494
+ tested_date: "2026-02-13"
495
+ runner_version: "v2.0" # Requires runner v2.0 (full task content)
496
+ task_version: "v1.4.0" # Requires task v1.4.0 (explicit quality requirements)
497
+ use_when:
498
+ - "Batch processing multiple minds"
499
+ - "Cost-sensitive workflows"
500
+ - "Production clones (with v1.4.0 task)"
501
+ avoid_when:
502
+ - "Runner v1 still in use"
503
+ evidence: "test-cases/cross-provider/extract-voice-dna/glm5/"
504
+ notes: |
505
+ Quality improved from 85% to 95-98% after:
506
+ 1. Task v1.4.0: Added explicit source requirements, example_usage, example_wrong/correct
507
+ 2. Runner v2.0: Passes FULL task content (including QUALITY CHECK section)
508
+ Key insight: Model follows instructions when they actually reach the prompt.
509
+
510
+ extract-knowledge.md:
511
+ primary_tier: opus
512
+ external_option:
513
+ model: glm5
514
+ qualified: true
515
+ quality_vs_opus: "95%"
516
+ savings: "96.8%"
517
+ tested_date: "2026-02-12"
518
+ use_when:
519
+ - "Zero-invention extraction"
520
+ - "Batch processing sources"
521
+ - "Cost-sensitive workflows"
522
+ avoid_when:
523
+ - "Gap analysis required"
524
+ - "Verbose examples needed"
525
+ evidence: "test-cases/cross-provider/extract-knowledge/glm5/"
526
+ notes: "GLM-5 confirms record-low hallucination claim. Zero invented content."
527
+
528
+ extract-thinking-dna.md:
529
+ primary_tier: opus
530
+ external_option:
531
+ model: glm5
532
+ qualified: true
533
+ quality_vs_opus: "100%"
534
+ savings: "99%"
535
+ tested_date: "2026-02-12"
536
+ use_when:
537
+ - "Framework extraction"
538
+ - "Heuristic mapping"
539
+ - "Decision pattern extraction"
540
+ - "Batch processing minds"
541
+ avoid_when:
542
+ - "Need attention_triggers detail"
543
+ evidence: "outputs/llm-tests/extract-thinking-dna/glm5/"
544
+ notes: "GLM-5 matched Opus exactly. 19s vs 66s latency. $0.007 vs $0.50 cost."
545
+
546
+ # Former candidates for testing, now qualified (tested 2026-02-13)
547
+
548
+ deep-research-pre-agent.md:
549
+ primary_tier: opus
550
+ external_option:
551
+ model: glm5
552
+ qualified: true
553
+ quality_vs_opus: "95%"
554
+ savings: "97.8%"
555
+ tested_date: "2026-02-13"
556
+ use_when:
557
+ - "Research prompt generation"
558
+ - "7-component meta-framework"
559
+ - "Cost-sensitive research pipelines"
560
+ avoid_when:
561
+ - "Need GOLD/SILVER/BRONZE confidence naming"
562
+ evidence: "outputs/llm-tests/deep-research-pre-agent/glm5/"
563
+ notes: "GLM-5 produced identical 7-component structure. 45.5s latency. $0.0098 cost."
564
+
565
+ create-agent.md:
566
+ primary_tier: opus
567
+ external_option:
568
+ model: glm5
569
+ qualified: true
570
+ quality_vs_opus: "98%"
571
+ savings: "99.1%"
572
+ tested_date: "2026-02-13"
573
+ runner_version: "v2.0"
574
+ use_when:
575
+ - "Agent creation from pre-extracted DNA"
576
+ - "Batch agent generation"
577
+ - "Production agents"
578
+ avoid_when:
579
+ - "Runner v1 still in use"
580
+ evidence: "outputs/llm-tests/create-agent/glm5/"
581
+ notes: |
582
+ GLM-5 QUALIFIED after runner v2.0 (full task content).
583
+ Output: 718 lines, all sections complete.
584
+ Key improvements: 6 heuristics (was 3), 4 objection algorithms,
585
+ SCOPE with boundary_conditions, veto_conditions, handoff_triggers.
586
+ $0.02 vs ~$2.50 Opus = 99.1% savings.
587
+
588
+ # ============================================================================
589
+ # CHANGELOG
590
+ # ============================================================================
591
+
592
+ changelog:
593
+ - version: "2.4.0"
594
+ date: "2026-02-13"
595
+ changes:
596
+ - "GLM-5 QUALIFIED for create-agent (98% quality, 99.1% savings)"
597
+ - "Output: 718 lines with ALL sections complete"
598
+ - "Key wins: 6 heuristics, 4 objection algorithms, SCOPE with veto conditions"
599
+ - "$0.02 vs ~$2.50 Opus"
600
+ - "5 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna, deep-research-pre-agent, create-agent"
601
+
602
+ - version: "2.3.0"
603
+ date: "2026-02-13"
604
+ changes:
605
+ - "QUALITY IMPROVEMENT: extract-voice-dna GLM-5 quality upgraded 85% → 95-98%"
606
+ - "Task v1.4.0: Added explicit quality requirements (source:, example_usage:, example_wrong/correct)"
607
+ - "Runner v2.0: Now passes FULL task content (was passing only ~10% of task)"
608
+ - "Key insight: QUALITY CHECK section was never reaching the model - fixed"
609
+ - "Trade-off: +$0.01 cost, +174s latency for +10-13% quality"
610
+ - "GLM-5 now production-ready for voice DNA extraction"
611
+
612
+ - version: "2.2.0"
613
+ date: "2026-02-13"
614
+ changes:
615
+ - "GLM-5 QUALIFIED for deep-research-pre-agent (95% quality, 97.8% savings)"
616
+ - "GLM-5 produced identical 7-component meta-framework structure"
617
+ - "45.5s latency, $0.0098 cost"
618
+ - "4 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna, deep-research-pre-agent"
619
+
620
+ - version: "2.1.0"
621
+ date: "2026-02-12"
622
+ changes:
623
+ - "GLM-5 QUALIFIED for extract-thinking-dna (100% quality, 99% savings)"
624
+ - "GLM-5 matched Opus exactly on all categories"
625
+ - "19s latency vs 66s Opus (3.5x faster)"
626
+ - "$0.007 cost vs ~$0.50 Opus"
627
+ - "3 tasks now qualified: extract-voice-dna, extract-knowledge, extract-thinking-dna"
628
+
629
+ - version: "2.0.0"
630
+ date: "2026-02-12"
631
+ changes:
632
+ - "MAJOR: Added external_providers section (GLM-5, Kimi K2.5)"
633
+ - "MAJOR: Added external_alternatives for Opus tasks with cheaper options"
634
+ - "GLM-5 QUALIFIED for extract-voice-dna (85% quality, 97.7% savings)"
635
+ - "GLM-5 tested: 1.9s latency (25x faster than Opus)"
636
+ - "GLM-5 PT-BR quality: 9/10 (QUALIFIED)"
637
+ - "Created wf-cross-provider-qualification.yaml workflow"
638
+ - "Created validation-glm-5.md report"
639
+ - "4 tasks marked as candidates for GLM-5 testing"
640
+
641
+ - version: "1.3.0"
642
+ date: "2026-02-11"
643
+ changes:
644
+ - "FORMAL TEST: an-diagnose-clone tested Opus vs Haiku"
645
+ - "an-diagnose-clone: OPUS REQUIRED (Haiku 30% vs Opus 85%)"
646
+ - "Fix v2.0.0 attempted with CHECKPOINT CLARIFICATIONS - FAILED"
647
+ - "Root cause: Haiku simulates file reads instead of accurate analysis"
648
+ - "Decision: Keep Opus - LLM analysis value > script automation"
649
+ - "Final stats: 12/14 Haiku/Script (86%), 1/14 Opus (7%), 1/14 deprecated"
650
+
651
+ - version: "1.2.0"
652
+ date: "2026-02-11"
653
+ changes:
654
+ - "SYNC WITH BATCH-PROGRESS: 4 tasks re-qualified after fixes"
655
+ - "validate-squad: HAIKU QUALIFIED (expert_override 91% dominant signal)"
656
+ - "pv-modernization-score: SCRIPT QUALIFIED (100% deterministic)"
657
+ - "an-clone-review: HAIKU QUALIFIED v2.2.0 (SCOPE DEFINITION fix)"
658
+ - "an-validate-clone: HAIKU QUALIFIED v2.2.0 (CHECKPOINT CLARIFICATIONS fix)"
659
+ - "Total qualified: 12/14 (86%) - matches BATCH-PROGRESS.md"
660
+ - "Estimated savings: 60-70% token cost reduction"
661
+
662
+ - version: "1.1.0"
663
+ date: "2026-02-11"
664
+ changes:
665
+ - "EMPIRICAL VALIDATION: 4 tasks tested with Opus vs Haiku"
666
+ - "pv-axioma-assessment: HAIKU QUALIFIED (95.5% quality)"
667
+ - "qa-after-creation: HAIKU QUALIFIED (same pass/fail decision)"
668
+ - "pv-modernization-score: MOVED TO OPUS (wrong judgment)"
669
+ - "validate-squad: MOVED TO OPUS (wrong type detection)"
670
+ - "an-fidelity-score: Task updated to v2.0 Haiku-compatible (pending validation)"
671
+ - "New haiku count: 13 validated candidates"
672
+ - "New opus count: 14 (includes 2 moved from haiku)"
673
+
674
+ - version: "1.0.2"
675
+ date: "2026-02-11"
676
+ changes:
677
+ - "Corrected task counts: 15 haiku + 14 sonnet + 12 opus = 41 total"
678
+
679
+ - version: "1.0.1"
680
+ date: "2026-02-11"
681
+ changes:
682
+ - "Added install-commands.md (haiku)"
683
+ - "Added sync-ide-command.md (haiku)"
684
+ - "Total haiku tasks: 15 (was 13)"
685
+
686
+ - version: "1.0.0"
687
+ date: "2026-02-11"
688
+ changes:
689
+ - "Initial release based on enhance-workflow discovery"
690
+ - "13 tasks classified as Haiku-eligible"
691
+ - "14 tasks classified as Sonnet (test candidates)"
692
+ - "12 tasks must stay on Opus"
693
+ - "Expected savings: 25-40%"