aiox-core 5.0.3 → 5.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (468) hide show
  1. package/.aiox-core/core/execution/predictive-pipeline.js +1283 -0
  2. package/.aiox-core/core/memory/decision-memory.js +564 -0
  3. package/.aiox-core/data/entity-registry.yaml +1068 -1028
  4. package/.aiox-core/data/registry-update-log.jsonl +2 -2
  5. package/.aiox-core/development/templates/service-template/README.md.hbs +158 -158
  6. package/.aiox-core/development/templates/service-template/__tests__/index.test.ts.hbs +237 -237
  7. package/.aiox-core/development/templates/service-template/client.ts.hbs +403 -403
  8. package/.aiox-core/development/templates/service-template/errors.ts.hbs +182 -182
  9. package/.aiox-core/development/templates/service-template/index.ts.hbs +120 -120
  10. package/.aiox-core/development/templates/service-template/package.json.hbs +87 -87
  11. package/.aiox-core/development/templates/service-template/types.ts.hbs +145 -145
  12. package/.aiox-core/development/templates/squad-template/LICENSE +21 -21
  13. package/.aiox-core/infrastructure/templates/aiox-sync.yaml.template +182 -182
  14. package/.aiox-core/infrastructure/templates/coderabbit.yaml.template +279 -279
  15. package/.aiox-core/infrastructure/templates/github-workflows/ci.yml.template +169 -169
  16. package/.aiox-core/infrastructure/templates/github-workflows/pr-automation.yml.template +330 -330
  17. package/.aiox-core/infrastructure/templates/github-workflows/release.yml.template +196 -196
  18. package/.aiox-core/infrastructure/templates/gitignore/gitignore-aiox-base.tmpl +63 -63
  19. package/.aiox-core/infrastructure/templates/gitignore/gitignore-brownfield-merge.tmpl +18 -18
  20. package/.aiox-core/infrastructure/templates/gitignore/gitignore-node.tmpl +85 -85
  21. package/.aiox-core/infrastructure/templates/gitignore/gitignore-python.tmpl +145 -145
  22. package/.aiox-core/install-manifest.yaml +63 -55
  23. package/.aiox-core/local-config.yaml.template +71 -71
  24. package/.aiox-core/monitor/hooks/lib/__init__.py +1 -1
  25. package/.aiox-core/monitor/hooks/lib/enrich.py +58 -58
  26. package/.aiox-core/monitor/hooks/lib/send_event.py +47 -47
  27. package/.aiox-core/monitor/hooks/notification.py +29 -29
  28. package/.aiox-core/monitor/hooks/post_tool_use.py +45 -45
  29. package/.aiox-core/monitor/hooks/pre_compact.py +29 -29
  30. package/.aiox-core/monitor/hooks/pre_tool_use.py +40 -40
  31. package/.aiox-core/monitor/hooks/stop.py +29 -29
  32. package/.aiox-core/monitor/hooks/subagent_stop.py +29 -29
  33. package/.aiox-core/monitor/hooks/user_prompt_submit.py +38 -38
  34. package/.aiox-core/product/templates/adr.hbs +125 -125
  35. package/.aiox-core/product/templates/dbdr.hbs +241 -241
  36. package/.aiox-core/product/templates/epic.hbs +212 -212
  37. package/.aiox-core/product/templates/pmdr.hbs +186 -186
  38. package/.aiox-core/product/templates/prd-v2.0.hbs +216 -216
  39. package/.aiox-core/product/templates/prd.hbs +201 -201
  40. package/.aiox-core/product/templates/story.hbs +263 -263
  41. package/.aiox-core/product/templates/task.hbs +170 -170
  42. package/.aiox-core/product/templates/tmpl-comment-on-examples.sql +158 -158
  43. package/.aiox-core/product/templates/tmpl-migration-script.sql +91 -91
  44. package/.aiox-core/product/templates/tmpl-rls-granular-policies.sql +104 -104
  45. package/.aiox-core/product/templates/tmpl-rls-kiss-policy.sql +10 -10
  46. package/.aiox-core/product/templates/tmpl-rls-roles.sql +135 -135
  47. package/.aiox-core/product/templates/tmpl-rls-simple.sql +77 -77
  48. package/.aiox-core/product/templates/tmpl-rls-tenant.sql +152 -152
  49. package/.aiox-core/product/templates/tmpl-rollback-script.sql +77 -77
  50. package/.aiox-core/product/templates/tmpl-seed-data.sql +140 -140
  51. package/.aiox-core/product/templates/tmpl-smoke-test.sql +16 -16
  52. package/.aiox-core/product/templates/tmpl-staging-copy-merge.sql +139 -139
  53. package/.aiox-core/product/templates/tmpl-stored-proc.sql +140 -140
  54. package/.aiox-core/product/templates/tmpl-trigger.sql +152 -152
  55. package/.aiox-core/product/templates/tmpl-view-materialized.sql +133 -133
  56. package/.aiox-core/product/templates/tmpl-view.sql +177 -177
  57. package/.aiox-core/scripts/pm.sh +0 -0
  58. package/.claude/hooks/enforce-architecture-first.py +196 -196
  59. package/.claude/hooks/mind-clone-governance.py +192 -192
  60. package/.claude/hooks/read-protection.py +151 -151
  61. package/.claude/hooks/slug-validation.py +176 -176
  62. package/.claude/hooks/sql-governance.py +182 -182
  63. package/.claude/hooks/write-path-validation.py +194 -194
  64. package/LICENSE +33 -33
  65. package/bin/aiox-graph.js +0 -0
  66. package/bin/aiox-minimal.js +0 -0
  67. package/bin/aiox.js +0 -0
  68. package/package.json +1 -1
  69. package/packages/aiox-install/bin/aiox-install.js +0 -0
  70. package/packages/aiox-install/bin/edmcp.js +0 -0
  71. package/packages/aiox-pro-cli/bin/aiox-pro.js +0 -0
  72. package/packages/installer/src/wizard/pro-setup.js +28 -0
  73. package/pro/README.md +66 -66
  74. package/pro/feature-registry.yaml +225 -223
  75. package/pro/license/license-api.js +701 -679
  76. package/pro/package.json +39 -39
  77. package/pro/pro-config.yaml +63 -63
  78. package/pro/squads/README.md +24 -24
  79. package/pro/squads/design/HEADLINE.md +3 -3
  80. package/pro/squads/design/README.md +109 -109
  81. package/pro/squads/design/agents/brad-frost.md +1097 -1097
  82. package/pro/squads/design/agents/dan-mall.md +857 -857
  83. package/pro/squads/design/agents/dave-malouf.md +2272 -2272
  84. package/pro/squads/design/agents/design-chief.md +114 -114
  85. package/pro/squads/design/agents/ds-foundations-lead.md +194 -194
  86. package/pro/squads/design/agents/ds-token-architect.md +361 -361
  87. package/pro/squads/design/agents/nano-banana-generator.md +162 -162
  88. package/pro/squads/design/agents/storybook-expert.md +809 -809
  89. package/pro/squads/design/checklists/atomic-refactor-checklist.md +299 -299
  90. package/pro/squads/design/checklists/component-adaptation-checklist.md +81 -81
  91. package/pro/squads/design/checklists/design-fidelity-checklist.md +283 -283
  92. package/pro/squads/design/checklists/design-handoff-checklist.md +55 -55
  93. package/pro/squads/design/checklists/design-team-health-checklist.md +454 -454
  94. package/pro/squads/design/checklists/designops-maturity-checklist.md +518 -518
  95. package/pro/squads/design/checklists/ds-a11y-release-gate-checklist.md +45 -45
  96. package/pro/squads/design/checklists/ds-accessibility-wcag-checklist.md +147 -147
  97. package/pro/squads/design/checklists/ds-component-quality-checklist.md +150 -150
  98. package/pro/squads/design/checklists/ds-critical-eye-review-checklist.md +147 -147
  99. package/pro/squads/design/checklists/ds-migration-readiness-checklist.md +99 -99
  100. package/pro/squads/design/checklists/ds-pattern-audit-checklist.md +164 -164
  101. package/pro/squads/design/checklists/reading-accessibility-checklist.md +275 -275
  102. package/pro/squads/design/checklists/token-mapping-checklist.md +107 -107
  103. package/pro/squads/design/config/coding-standards.md +286 -286
  104. package/pro/squads/design/config/source-tree.md +59 -59
  105. package/pro/squads/design/config/tech-stack.md +48 -48
  106. package/pro/squads/design/config.yaml +204 -204
  107. package/pro/squads/design/data/agentic-design-systems-guide.md +46 -46
  108. package/pro/squads/design/data/agentic-ds-principles.md +100 -100
  109. package/pro/squads/design/data/atomic-design-principles.md +108 -108
  110. package/pro/squads/design/data/atomic-refactor-rules.md +582 -582
  111. package/pro/squads/design/data/base-component-specs.md +972 -972
  112. package/pro/squads/design/data/brad-frost-analysis-extract-implicit.yaml +270 -270
  113. package/pro/squads/design/data/brad-frost-analysis-find-0.8.yaml +176 -176
  114. package/pro/squads/design/data/brad-frost-analysis-qa-report.yaml +168 -168
  115. package/pro/squads/design/data/brad-frost-dna.yaml +713 -713
  116. package/pro/squads/design/data/capability-tools.yaml +124 -124
  117. package/pro/squads/design/data/component-adaptation-changelog.md +318 -318
  118. package/pro/squads/design/data/consolidation-algorithms.md +168 -168
  119. package/pro/squads/design/data/critical-eye-scoring-rules.yaml +240 -240
  120. package/pro/squads/design/data/design-token-best-practices.md +107 -107
  121. package/pro/squads/design/data/design-tokens-spec.yaml +418 -418
  122. package/pro/squads/design/data/ds-reference-architectures.md +93 -93
  123. package/pro/squads/design/data/f2-qa-report.md +168 -168
  124. package/pro/squads/design/data/f3-derived-components-changelog.md +100 -100
  125. package/pro/squads/design/data/f3-qa-report.md +208 -208
  126. package/pro/squads/design/data/figma-base-components-raw.md +101 -101
  127. package/pro/squads/design/data/figma-tokens-raw.md +1548 -1548
  128. package/pro/squads/design/data/fluent2-design-principles.md +114 -114
  129. package/pro/squads/design/data/high-retention-reading-guide.md +349 -349
  130. package/pro/squads/design/data/integration-patterns.md +207 -207
  131. package/pro/squads/design/data/internal-quality-chain.yaml +48 -48
  132. package/pro/squads/design/data/motion-tokens-guide.md +202 -202
  133. package/pro/squads/design/data/roi-calculation-guide.md +142 -142
  134. package/pro/squads/design/data/token-mapping-reference.md +213 -213
  135. package/pro/squads/design/data/w3c-dtcg-spec-reference.md +149 -149
  136. package/pro/squads/design/data/wcag-compliance-guide.md +267 -267
  137. package/pro/squads/design/docs/AUDIT_REPORT.md +97 -97
  138. package/pro/squads/design/docs/DS-CURATION-PIPELINE-PROPOSAL.md +577 -577
  139. package/pro/squads/design/docs/UPGRADE_PLAN.md +618 -618
  140. package/pro/squads/design/docs/brad-frost-research-validation.md +372 -372
  141. package/pro/squads/design/docs/dave-malouf-research-validation.md +391 -391
  142. package/pro/squads/design/docs/tool-discovery-report.md +87 -87
  143. package/pro/squads/design/docs/tool-integration-plan.md +44 -44
  144. package/pro/squads/design/protocols/ai-first-governance.md +56 -56
  145. package/pro/squads/design/protocols/governance-execution-boundary.md +59 -59
  146. package/pro/squads/design/protocols/handoff.md +60 -60
  147. package/pro/squads/design/rules/.claude-rules.md +88 -88
  148. package/pro/squads/design/scripts/design-system/curate_colors.cjs +447 -447
  149. package/pro/squads/design/scripts/design-system/curate_components.cjs +217 -217
  150. package/pro/squads/design/scripts/design-system/curate_radius.cjs +190 -190
  151. package/pro/squads/design/scripts/design-system/curate_shadows.cjs +208 -208
  152. package/pro/squads/design/scripts/design-system/curate_spacing.cjs +243 -243
  153. package/pro/squads/design/scripts/design-system/curate_typography.cjs +404 -404
  154. package/pro/squads/design/scripts/design-system/design-system-metadata.test.js +49 -49
  155. package/pro/squads/design/scripts/design-system/design_manifest_lib.cjs +142 -142
  156. package/pro/squads/design/scripts/design-system/fetch_page_images.cjs +195 -195
  157. package/pro/squads/design/scripts/design-system/generate_components_metadata.cjs +114 -114
  158. package/pro/squads/design/scripts/design-system/generate_curation_report.cjs +258 -258
  159. package/pro/squads/design/scripts/design-system/generate_tokens.cjs +342 -342
  160. package/pro/squads/design/scripts/design-system/sync_design_manifest.cjs +27 -27
  161. package/pro/squads/design/scripts/design-system/test_mcp_tools.cjs +232 -232
  162. package/pro/squads/design/scripts/design-system/validate_components_metadata.cjs +96 -96
  163. package/pro/squads/design/scripts/design-system/validate_curation.cjs +226 -226
  164. package/pro/squads/design/scripts/design-system/validate_design_manifest_drift.cjs +72 -72
  165. package/pro/squads/design/scripts/design-system/validate_mcp_skeleton.cjs +38 -38
  166. package/pro/squads/design/scripts/design-system/validate_registry.cjs +186 -186
  167. package/pro/squads/design/scripts/design-system/validate_task_checklist_bindings.cjs +78 -78
  168. package/pro/squads/design/scripts/dissect-artifact.cjs +806 -806
  169. package/pro/squads/design/scripts/validate-a11y-integration.cjs +40 -40
  170. package/pro/squads/design/scripts/validate-design-squad.py +411 -411
  171. package/pro/squads/design/squad.yaml +714 -714
  172. package/pro/squads/design/tasks/a11y-audit.md +340 -340
  173. package/pro/squads/design/tasks/aria-audit.md +525 -525
  174. package/pro/squads/design/tasks/atomic-refactor-execute.md +391 -391
  175. package/pro/squads/design/tasks/atomic-refactor-plan.md +262 -262
  176. package/pro/squads/design/tasks/audit-reading-experience.md +350 -350
  177. package/pro/squads/design/tasks/audit-tailwind-config.md +101 -101
  178. package/pro/squads/design/tasks/bootstrap-shadcn-library.md +96 -96
  179. package/pro/squads/design/tasks/bundle-audit.md +245 -245
  180. package/pro/squads/design/tasks/contrast-matrix.md +373 -373
  181. package/pro/squads/design/tasks/create-doc.md +135 -135
  182. package/pro/squads/design/tasks/dead-code-detection.md +329 -329
  183. package/pro/squads/design/tasks/design-compare.md +414 -414
  184. package/pro/squads/design/tasks/design-process-optimization.md +407 -407
  185. package/pro/squads/design/tasks/design-review-orchestration.md +99 -99
  186. package/pro/squads/design/tasks/design-team-scaling.md +407 -407
  187. package/pro/squads/design/tasks/design-tooling-audit.md +404 -404
  188. package/pro/squads/design/tasks/design-triage.md +89 -89
  189. package/pro/squads/design/tasks/designops-maturity-assessment.md +364 -364
  190. package/pro/squads/design/tasks/designops-metrics-setup.md +465 -465
  191. package/pro/squads/design/tasks/ds-agentic-audit.md +100 -100
  192. package/pro/squads/design/tasks/ds-agentic-setup.md +103 -103
  193. package/pro/squads/design/tasks/ds-audit-codebase.md +273 -273
  194. package/pro/squads/design/tasks/ds-build-component.md +349 -349
  195. package/pro/squads/design/tasks/ds-build-mcp-server.md +84 -84
  196. package/pro/squads/design/tasks/ds-calculate-roi.md +282 -282
  197. package/pro/squads/design/tasks/ds-compose-molecule.md +106 -106
  198. package/pro/squads/design/tasks/ds-consolidate-patterns.md +253 -253
  199. package/pro/squads/design/tasks/ds-context-contract.md +194 -194
  200. package/pro/squads/design/tasks/ds-critical-eye-compare.md +130 -130
  201. package/pro/squads/design/tasks/ds-critical-eye-decide.md +139 -139
  202. package/pro/squads/design/tasks/ds-critical-eye-inventory.md +111 -111
  203. package/pro/squads/design/tasks/ds-critical-eye-report.md +101 -101
  204. package/pro/squads/design/tasks/ds-critical-eye-score.md +109 -109
  205. package/pro/squads/design/tasks/ds-designops.md +99 -99
  206. package/pro/squads/design/tasks/ds-extend-pattern.md +91 -91
  207. package/pro/squads/design/tasks/ds-extract-tokens.md +312 -312
  208. package/pro/squads/design/tasks/ds-figma-pipeline.md +95 -95
  209. package/pro/squads/design/tasks/ds-fluent-audit.md +105 -105
  210. package/pro/squads/design/tasks/ds-fluent-build.md +110 -110
  211. package/pro/squads/design/tasks/ds-generate-ai-metadata.md +81 -81
  212. package/pro/squads/design/tasks/ds-generate-cursor-rules.md +74 -74
  213. package/pro/squads/design/tasks/ds-generate-documentation.md +101 -101
  214. package/pro/squads/design/tasks/ds-generate-migration-strategy.md +331 -331
  215. package/pro/squads/design/tasks/ds-generate-shock-report.md +323 -323
  216. package/pro/squads/design/tasks/ds-govern-a11y-compliance.md +93 -93
  217. package/pro/squads/design/tasks/ds-governance.md +187 -187
  218. package/pro/squads/design/tasks/ds-health-metrics.md +278 -278
  219. package/pro/squads/design/tasks/ds-integrate-squad.md +130 -130
  220. package/pro/squads/design/tasks/ds-integrate-workspace.md +100 -100
  221. package/pro/squads/design/tasks/ds-legacy-modernization.md +302 -302
  222. package/pro/squads/design/tasks/ds-mcp-status.md +65 -65
  223. package/pro/squads/design/tasks/ds-motion-audit.md +118 -118
  224. package/pro/squads/design/tasks/ds-multi-framework.md +96 -96
  225. package/pro/squads/design/tasks/ds-parallelization-gate.md +246 -246
  226. package/pro/squads/design/tasks/ds-query.md +90 -90
  227. package/pro/squads/design/tasks/ds-rebuild-artifact.md +369 -369
  228. package/pro/squads/design/tasks/ds-reverse-engineer.md +194 -194
  229. package/pro/squads/design/tasks/ds-scan-artifact.md +131 -131
  230. package/pro/squads/design/tasks/ds-setup-design-system.md +297 -297
  231. package/pro/squads/design/tasks/ds-sync-registry.md +287 -287
  232. package/pro/squads/design/tasks/ds-theme-multi-brand.md +90 -90
  233. package/pro/squads/design/tasks/ds-token-modes.md +108 -108
  234. package/pro/squads/design/tasks/ds-token-w3c-extract.md +105 -105
  235. package/pro/squads/design/tasks/ds-validate-ai-readiness.md +69 -69
  236. package/pro/squads/design/tasks/ds-visual-regression.md +130 -130
  237. package/pro/squads/design/tasks/execute-checklist.md +141 -141
  238. package/pro/squads/design/tasks/export-design-tokens-dtcg.md +97 -97
  239. package/pro/squads/design/tasks/f1-apply-foundations.md +154 -154
  240. package/pro/squads/design/tasks/f1-ingest-figma-tokens.md +130 -130
  241. package/pro/squads/design/tasks/f1-map-tokens-to-shadcn.md +145 -145
  242. package/pro/squads/design/tasks/f1-qa-foundations.md +95 -95
  243. package/pro/squads/design/tasks/f2-adapt-shadcn-components.md +155 -155
  244. package/pro/squads/design/tasks/f2-ingest-base-components.md +148 -148
  245. package/pro/squads/design/tasks/f2-qa-base-components.md +98 -98
  246. package/pro/squads/design/tasks/f3-derive-components.md +145 -145
  247. package/pro/squads/design/tasks/f3-qa-derived-components.md +101 -101
  248. package/pro/squads/design/tasks/focus-order-audit.md +450 -450
  249. package/pro/squads/design/tasks/sb-brownfield-migrate.md +367 -367
  250. package/pro/squads/design/tasks/sb-brownfield-scan.md +318 -318
  251. package/pro/squads/design/tasks/sb-configure.md +230 -230
  252. package/pro/squads/design/tasks/sb-expand-shadcn.md +213 -213
  253. package/pro/squads/design/tasks/sb-generate-all-stories.md +288 -288
  254. package/pro/squads/design/tasks/sb-install.md +152 -152
  255. package/pro/squads/design/tasks/sb-sync-workspace.md +239 -239
  256. package/pro/squads/design/tasks/sb-verify.md +203 -203
  257. package/pro/squads/design/tasks/tailwind-upgrade.md +117 -117
  258. package/pro/squads/design/tasks/token-usage-analytics.md +262 -262
  259. package/pro/squads/design/tasks/ux-rewrite-sixth-grade.md +82 -82
  260. package/pro/squads/design/tasks/validate-design-fidelity.md +222 -222
  261. package/pro/squads/design/templates/agent-template.yaml +46 -46
  262. package/pro/squads/design/templates/clone-mind-template.md +352 -352
  263. package/pro/squads/design/templates/component-prompt-injection-tmpl.md +236 -236
  264. package/pro/squads/design/templates/component-visual-spec-tmpl.md +378 -378
  265. package/pro/squads/design/templates/critical-eye-cycle-report-tmpl.md +165 -165
  266. package/pro/squads/design/templates/design-fidelity-report-tmpl.md +155 -155
  267. package/pro/squads/design/templates/ds-ai-component-metadata-schema-tmpl.json +138 -138
  268. package/pro/squads/design/templates/ds-artifact-analysis.md +70 -70
  269. package/pro/squads/design/templates/ds-health-report-tmpl.md +236 -236
  270. package/pro/squads/design/templates/ds-migration-strategy-tmpl.md +524 -524
  271. package/pro/squads/design/templates/ds-state-persistence-tmpl.yaml +194 -194
  272. package/pro/squads/design/templates/ds-tokens-schema-tmpl.yaml +139 -139
  273. package/pro/squads/design/templates/migration-strategy-tmpl.md +524 -524
  274. package/pro/squads/design/templates/reading-design-tokens.css +26 -26
  275. package/pro/squads/design/templates/state-persistence-tmpl.yaml +219 -219
  276. package/pro/squads/design/templates/tokens-schema-tmpl.yaml +305 -305
  277. package/pro/squads/design/workflows/agentic-readiness.yaml +83 -83
  278. package/pro/squads/design/workflows/audit-only.yaml +198 -198
  279. package/pro/squads/design/workflows/brownfield-complete.yaml +257 -257
  280. package/pro/squads/design/workflows/critical-eye.yaml +184 -184
  281. package/pro/squads/design/workflows/dtcg-tokens-governance.yaml +64 -64
  282. package/pro/squads/design/workflows/foundations-pipeline.yaml +192 -192
  283. package/pro/squads/design/workflows/greenfield-new.yaml +192 -192
  284. package/pro/squads/design/workflows/motion-quality.yaml +65 -65
  285. package/pro/squads/design/workflows/self-healing-workflow.yaml +237 -237
  286. package/pro/squads/design/workflows/storybook-brownfield-migration.yaml +400 -400
  287. package/pro/squads/design/workflows/storybook-full-setup.yaml +280 -280
  288. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/ARQUITETURA_COGNITIVA_DE_ALEX_HORMOZI_EXTRA/303/207/303/203O_COMPLETA.md +215 -0
  289. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/A_Rotina_de_Alta_Performance_de_Alex_Hormozi_Arquitetura,_Motiva/303/247/303/265es_e_Replica/303/247/303/243o.md +309 -0
  290. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/O_sistema_completo_de_cria/303/247/303/243o_de_conte/303/272do_de_Alex_Hormozi.md +416 -0
  291. package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/Processo_Cria/303/247/303/243o_Conte/303/272do_Hormozi.md +0 -0
  292. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/DECIS/303/225ES_ESTRAT/303/211GICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
  293. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_ATOMIC_DESIGN.md +797 -0
  294. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/O_Cemit/303/251rio_de_Design_Systems.md +447 -0
  295. package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/PRINC/303/215PIOS_DE_RACIOC/303/215NIO.md +190 -0
  296. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/DECIS/303/225ES_ESTRAT/303/211GICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
  297. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_ATOMIC_DESIGN.md +797 -0
  298. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/O_Cemit/303/251rio_de_Design_Systems.md +447 -0
  299. package/pro/squads/mmos-squad/minds/brad_frost/artifacts/PRINC/303/215PIOS_DE_RACIOC/303/215NIO.md +190 -0
  300. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_ELON_MUSK.md +291 -0
  301. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/ASSINATURA_LINGU/303/215STICA_ELON_MUSK.md +485 -0
  302. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/A_Arquitetura_Mental_de_Elon_Musk_Uma_An/303/241lise_Sistem/303/241tica_dos_Frameworks_de_Pensamento.md +907 -0
  303. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Dossi/303/252_Estrat/303/251gico_A_Arquitetura_Psicol/303/263gica_de_Elon_Musk.md +252 -0
  304. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Os_Padr/303/265es_de_Leitura_de_Elon_Musk_e_Sua_Influ/303/252ncia_Sistem/303/241tica.md +287 -0
  305. package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Uma_an/303/241lise_psicol/303/263gica_abrangente.md +187 -0
  306. package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_EUGENE_M._SCHWARTZ.md +790 -0
  307. package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/An/303/241lise_Completa_Eugene_Schwartz_Arquitetura_Cognitiva_DEEP.md +210 -0
  308. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/5H_EXTRA/303/207/303/203O_COGNITIVA_COMPLETA_PEDRO_VAL/303/211RIO_LOPEZ.md +226 -0
  309. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_COMPARATIVA_REVISADA_PEDRO_VAL/303/211RIO_LOPEZ.md +246 -0
  310. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_LINGU/303/215STICA_CARIOCA_PEDRO_VAL/303/211RIO_LOPEZ.md +274 -0
  311. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_PSICOM/303/211TRICA_DEFINITIVA_PEDRO_VAL/303/211RIO_LOPEZ.md +821 -0
  312. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/AN/303/201LISE_PSICOM/303/211TRICA_PROFUNDA_PEDRO_VAL/303/211RIO.md +1844 -0
  313. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/C/303/201LCULO_DE_RARIDADE_ESTAT/303/215STICA_PEDRO_VAL/303/211RIO_LOPEZ.md +154 -0
  314. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/EXTRA/303/207/303/203O_PEDRO_VAL/303/211RIO.md +237 -0
  315. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/MAPEAMENTO_LINGU/303/215STICO_PROFUNDO.md +161 -0
  316. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/META_AXIOMAS_DE_PEDRO_VAL/303/211RIO.md +256 -0
  317. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOL/303/223GICO_COGNITIVO_PEDRO_VAL/303/211RIO_LOPEZ.md +586 -0
  318. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOL/303/223GICO_COGNITIVO_V2_/342/200/224_CLONE_IA.md +452 -0
  319. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/TABELA_COMPARATIVA_AN/303/201LISE_COMPLETA_DOS_CLONES_IA.md +102 -0
  320. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/WHATSAPP_PADR/303/225ES_LINGU/303/215STICOS_PEDRO_VAL/303/211RIO_LOPEZ.md +286 -0
  321. package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/heur/303/255sticas_de_decis/303/243o_e_algoritmos_mentais_/303/272nicos.md +268 -0
  322. package/pro/squads/mmos-squad/minds/ray_kurzweil/sources/books/PROTOCOLO_COMPLETO_DE_INTERROGA/303/207/303/203O_-_NAVAL_RAVIKANT.md +3624 -0
  323. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTA/303/207/303/203O_JOBS.md +488 -0
  324. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Framework_Cabe/303/247a_Steve.md +257 -0
  325. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Relat/303/263rio_Abrangente_sobre_Steve_Jobs_para_Cria/303/247/303/243o_de_Clone_de_IA.md +370 -0
  326. package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Steve_Jobs_An/303/241lise_Psicol/303/263gica_Profunda_e_Valida/303/247/303/243o_Comportamental.md +65 -0
  327. package/pro/squads/squad-creator-pro/HEADLINE.md +3 -3
  328. package/pro/squads/squad-creator-pro/agents/oalanicolas.md +438 -438
  329. package/pro/squads/squad-creator-pro/agents/squad-chief.md +1651 -1651
  330. package/pro/squads/squad-creator-pro/agents/thiago_finch.md +976 -976
  331. package/pro/squads/squad-creator-pro/assessments/axioma-assessment-wf-create-squad.yaml +325 -325
  332. package/pro/squads/squad-creator-pro/checklists/create-agent-checklist.md +184 -184
  333. package/pro/squads/squad-creator-pro/checklists/create-squad-checklist.md +219 -219
  334. package/pro/squads/squad-creator-pro/checklists/create-workflow-checklist.md +224 -224
  335. package/pro/squads/squad-creator-pro/checklists/mental-model-integration-checklist.md +95 -95
  336. package/pro/squads/squad-creator-pro/checklists/squad-overview-checklist.md +393 -393
  337. package/pro/squads/squad-creator-pro/config/model-routing.yaml +693 -693
  338. package/pro/squads/squad-creator-pro/config/scoring-rubric.yaml +199 -199
  339. package/pro/squads/squad-creator-pro/config.yaml +35 -35
  340. package/pro/squads/squad-creator-pro/data/internal-infrastructure-library.yaml +99 -99
  341. package/pro/squads/squad-creator-pro/data/mental-model-task-matrix.yaml +692 -692
  342. package/pro/squads/squad-creator-pro/docs/ADR-001-model-tier-qualification.md +344 -344
  343. package/pro/squads/squad-creator-pro/docs/AGENT-COLLABORATION.md +609 -609
  344. package/pro/squads/squad-creator-pro/docs/MIGRATION-PLAN-AGENT-CONFORMITY.md +861 -861
  345. package/pro/squads/squad-creator-pro/docs/MODEL-TIER-QUALIFICATION.md +337 -337
  346. package/pro/squads/squad-creator-pro/docs/optimize-v4-proposal.md +354 -354
  347. package/pro/squads/squad-creator-pro/docs/task-optimization-framework.md +229 -229
  348. package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_010.md +240 -240
  349. package/pro/squads/squad-creator-pro/protocols/ai-first-governance.md +63 -63
  350. package/pro/squads/squad-creator-pro/scripts/assess-sources.sh +443 -443
  351. package/pro/squads/squad-creator-pro/scripts/clone-review.sh +394 -394
  352. package/pro/squads/squad-creator-pro/scripts/create-agent-preflight.py +243 -243
  353. package/pro/squads/squad-creator-pro/scripts/cross-provider/compare-results.js +281 -281
  354. package/pro/squads/squad-creator-pro/scripts/cross-provider/cross-provider-runner.js +462 -462
  355. package/pro/squads/squad-creator-pro/scripts/fidelity-score.sh +519 -519
  356. package/pro/squads/squad-creator-pro/scripts/generate-squad-guide.js +558 -558
  357. package/pro/squads/squad-creator-pro/scripts/lib/config-loader.js +151 -151
  358. package/pro/squads/squad-creator-pro/scripts/model-tier-validator.cjs +369 -369
  359. package/pro/squads/squad-creator-pro/scripts/model-usage-logger.cjs +245 -245
  360. package/pro/squads/squad-creator-pro/scripts/modernization-score.sh +308 -308
  361. package/pro/squads/squad-creator-pro/scripts/scaffold-squad.cjs +281 -281
  362. package/pro/squads/squad-creator-pro/scripts/security_scanner.py +378 -378
  363. package/pro/squads/squad-creator-pro/scripts/squad-context-loader.cjs +205 -205
  364. package/pro/squads/squad-creator-pro/scripts/squad-state-manager.cjs +451 -451
  365. package/pro/squads/squad-creator-pro/scripts/squad-workflow-runner.cjs +471 -471
  366. package/pro/squads/squad-creator-pro/scripts/squad_utils.py +261 -261
  367. package/pro/squads/squad-creator-pro/scripts/tests/run_bash_tests.sh +29 -29
  368. package/pro/squads/squad-creator-pro/scripts/tests/test_assess_sources.sh +216 -216
  369. package/pro/squads/squad-creator-pro/scripts/tests/test_clone_review.sh +239 -239
  370. package/pro/squads/squad-creator-pro/scripts/tests/test_coherence_validator.py +212 -212
  371. package/pro/squads/squad-creator-pro/scripts/tests/test_fidelity_score.sh +298 -298
  372. package/pro/squads/squad-creator-pro/scripts/tests/test_modernization_score.sh +211 -211
  373. package/pro/squads/squad-creator-pro/scripts/tests/test_security_scanner.py +354 -354
  374. package/pro/squads/squad-creator-pro/scripts/tests/test_validate_clone.sh +252 -252
  375. package/pro/squads/squad-creator-pro/squad.yaml +36 -36
  376. package/pro/squads/squad-creator-pro/tasks/an-compare-outputs.md +354 -354
  377. package/pro/squads/squad-creator-pro/tasks/create-squad.md +933 -933
  378. package/pro/squads/squad-creator-pro/tasks/detect-squad-context.md +81 -81
  379. package/pro/squads/squad-creator-pro/tasks/lookup-model.md +78 -78
  380. package/pro/squads/squad-creator-pro/tasks/next-squad.md +487 -487
  381. package/pro/squads/squad-creator-pro/tasks/optimize-workflow.md +851 -851
  382. package/pro/squads/squad-creator-pro/tasks/parallel-discovery.md +58 -58
  383. package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment-wf-clone-mind.yaml +256 -256
  384. package/pro/squads/squad-creator-pro/tasks/qualify-task.md +265 -265
  385. package/pro/squads/squad-creator-pro/tasks/reexecute-squad-phase.md +64 -64
  386. package/pro/squads/squad-creator-pro/tasks/smoke-test-model-routing.md +167 -167
  387. package/pro/squads/squad-creator-pro/tasks/squad-overview.md +683 -683
  388. package/pro/squads/squad-creator-pro/tasks/validate-final-artifacts.md +80 -80
  389. package/pro/squads/squad-creator-pro/templates/orchestrator-tmpl.md +74 -74
  390. package/pro/squads/squad-creator-pro/test-cases/BATCH-PROGRESS.md +268 -268
  391. package/pro/squads/squad-creator-pro/test-cases/QUALIFICATION-DASHBOARD.yaml +13 -13
  392. package/pro/squads/squad-creator-pro/test-cases/_template.yaml +147 -147
  393. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT-SUMMARY.md +275 -275
  394. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT_SUMMARY.md +140 -140
  395. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/CHECKPOINT_MATRIX.md +202 -202
  396. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION-REPORT.md +413 -413
  397. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION_NOTES.md +358 -358
  398. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README-v2.2.2.md +299 -299
  399. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README.md +320 -320
  400. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/TEST-REPORT-v2.1.md +351 -351
  401. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/VERIFICATION-CHECKLIST.txt +247 -247
  402. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/formal-qualification-report.yaml +389 -389
  403. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-output.yaml +366 -366
  404. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.1-output.yaml +452 -452
  405. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml +281 -281
  406. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.2-output.yaml +332 -332
  407. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml +517 -517
  408. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/qualification-report.yaml +213 -213
  409. package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/test-case.yaml +69 -69
  410. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/haiku-round-1.yaml +213 -213
  411. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/opus-baseline.yaml +566 -566
  412. package/pro/squads/squad-creator-pro/test-cases/an-clone-review/qualification-report.yaml +82 -82
  413. package/pro/squads/squad-creator-pro/test-cases/an-design-clone/test-case.yaml +102 -102
  414. package/pro/squads/squad-creator-pro/test-cases/an-extract-dna/test-case.yaml +105 -105
  415. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/haiku-round-1.yaml +262 -262
  416. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/opus-baseline.yaml +266 -266
  417. package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/qualification-report.yaml +94 -94
  418. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/haiku-round-1.yaml +282 -282
  419. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/opus-baseline.yaml +470 -470
  420. package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/qualification-report.yaml +106 -106
  421. package/pro/squads/squad-creator-pro/test-cases/collect-sources/test-case.yaml +105 -105
  422. package/pro/squads/squad-creator-pro/test-cases/create-task/test-case.yaml +104 -104
  423. package/pro/squads/squad-creator-pro/test-cases/cross-provider/DASHBOARD.yaml +11 -11
  424. package/pro/squads/squad-creator-pro/test-cases/pv-audit/test-case.yaml +106 -106
  425. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/haiku-output.yaml +209 -209
  426. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/opus-baseline.yaml +96 -96
  427. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/sonnet-output.yaml +30 -30
  428. package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/test-case.yaml +129 -129
  429. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/comparison-round-1.yaml +242 -242
  430. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/haiku-round-1.yaml +393 -393
  431. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/opus-baseline.yaml +488 -488
  432. package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/qualification-report.yaml +74 -74
  433. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/haiku-round-1.yaml +292 -292
  434. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/opus-baseline.yaml +603 -603
  435. package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/qualification-report.yaml +97 -97
  436. package/pro/squads/squad-creator-pro/test-cases/smoke-test-model-routing/test-case.yaml +100 -100
  437. package/pro/squads/squad-creator-pro/test-cases/upgrade-squad/test-case.yaml +106 -106
  438. package/pro/squads/squad-creator-pro/test-cases/validate-squad/comparison-round-1.yaml +223 -223
  439. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1-MINE.yaml +36 -36
  440. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1.yaml +193 -193
  441. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-2.yaml +303 -303
  442. package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-3-v4-task.yaml +149 -149
  443. package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-baseline.yaml +529 -529
  444. package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-round-3-v4-task.yaml +132 -132
  445. package/pro/squads/squad-creator-pro/test-cases/validate-squad/qualification-report.yaml +104 -104
  446. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output-v2-calibrated.yaml +200 -200
  447. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output.yaml +183 -183
  448. package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/opus-baseline.yaml +112 -112
  449. package/pro/squads/squad-creator-pro/workflows/create-squad.yaml +348 -348
  450. package/pro/squads/squad-creator-pro/workflows/modules/module-discovery.yaml +16 -16
  451. package/pro/squads/squad-creator-pro/workflows/modules/module-integration.yaml +16 -16
  452. package/pro/squads/squad-creator-pro/workflows/modules/module-quality-gates.yaml +15 -15
  453. package/pro/squads/squad-creator-pro/workflows/wf-brownfield-upgrade-squad.yaml +46 -46
  454. package/pro/squads/squad-creator-pro/workflows/wf-context-aware-create-squad.yaml +47 -47
  455. package/pro/squads/squad-creator-pro/workflows/wf-create-squad.yaml +1619 -1619
  456. package/pro/squads/squad-creator-pro/workflows/wf-cross-provider-qualification.yaml +711 -711
  457. package/pro/squads/squad-creator-pro/workflows/wf-model-tier-qualification.yaml +800 -800
  458. package/pro/squads/squad-creator-pro/workflows/wf-optimize-squad.yaml +684 -684
  459. package/scripts/check-markdown-links.py +352 -352
  460. package/scripts/dashboard-parallel-dev.sh +0 -0
  461. package/scripts/dashboard-parallel-phase3.sh +0 -0
  462. package/scripts/dashboard-parallel-phase4.sh +0 -0
  463. package/scripts/install-monitor-hooks.sh +0 -0
  464. package/.claude/hooks/code-intel-pretool.cjs +0 -107
  465. package/docs/guides/aios-workflows/README.md +0 -247
  466. package/docs/guides/aios-workflows/bob-orchestrator-workflow.md +0 -1536
  467. package/scripts/glue/README.md +0 -355
  468. package/scripts/glue/compose-agent-prompt.cjs +0 -362
@@ -1,354 +1,354 @@
1
- # Task: Compare Model Outputs
2
-
3
- **Command:** `*compare-outputs`
4
- **Version:** 1.0.0
5
- **Execution Type:** Agent (Opus ONLY - evaluator must be most capable model)
6
- **Model:** `Opus` (REQUIRED - evaluator cannot be same tier as test subject)
7
- **Purpose:** Systematic comparison of Opus baseline vs Haiku test outputs for Model Tier Qualification
8
-
9
- ---
10
-
11
- ## CRITICAL: Evaluator Independence
12
-
13
- ```yaml
14
- evaluator_rules:
15
- model: "opus" # NEVER use Haiku to evaluate Haiku
16
- blind_mode: false # We know which is which (baseline vs test)
17
- bias_mitigation:
18
- - "Score WHAT IS WRITTEN, not what you expect"
19
- - "Do NOT assume Opus is better - measure objectively"
20
- - "If outputs are equivalent, say so (don't force differences)"
21
- ```
22
-
23
- ---
24
-
25
- ## Inputs
26
-
27
- | Parameter | Type | Required | Description |
28
- |-----------|------|----------|-------------|
29
- | `task_name` | string | Yes | Task being evaluated (e.g., "an-assess-sources") |
30
- | `opus_baseline` | file | Yes | Path to Opus output file |
31
- | `haiku_output` | file | Yes | Path to Haiku output file |
32
- | `task_file` | file | Yes | Original task definition (for reference) |
33
-
34
- ---
35
-
36
- ## Evaluation Rubric (100 points)
37
-
38
- ### Dimension 1: TIER MATCH (40 points)
39
-
40
- ```yaml
41
- tier_match:
42
- weight: 40
43
- description: "Do both outputs classify items into the same tiers?"
44
-
45
- scoring:
46
- perfect_match: 40 # 100% of items have same tier
47
- high_match: 32 # 90-99% same tier
48
- moderate_match: 24 # 75-89% same tier
49
- low_match: 16 # 50-74% same tier
50
- poor_match: 0 # <50% same tier
51
-
52
- calculation: |
53
- match_rate = count(opus_tier == haiku_tier) / total_items
54
-
55
- IF match_rate == 1.0 → 40 points
56
- IF match_rate >= 0.9 → 32 points
57
- IF match_rate >= 0.75 → 24 points
58
- IF match_rate >= 0.5 → 16 points
59
- ELSE → 0 points
60
-
61
- veto_condition: |
62
- IF match_rate < 0.75 → VETO (different tier = different user action)
63
- Rationale: User decides based on tier, not score details
64
- ```
65
-
66
- ### Dimension 2: SCORE VARIANCE (30 points)
67
-
68
- ```yaml
69
- score_variance:
70
- weight: 30
71
- description: "Are numerical scores within acceptable variance?"
72
-
73
- thresholds:
74
- excellent: 5% # Scores within 5%
75
- good: 10% # Scores within 10%
76
- acceptable: 15% # Scores within 15%
77
- poor: 20% # Scores within 20%
78
- unacceptable: ">20%"
79
-
80
- scoring:
81
- within_5pct: 30
82
- within_10pct: 24
83
- within_15pct: 18
84
- within_20pct: 12
85
- beyond_20pct: 0
86
-
87
- calculation: |
88
- FOR each scored item:
89
- variance = abs(opus_score - haiku_score) / opus_score * 100
90
-
91
- avg_variance = mean(all variances)
92
- max_variance = max(all variances)
93
-
94
- # Use WORST case (max) for scoring, not average
95
- IF max_variance <= 5% → 30 points
96
- IF max_variance <= 10% → 24 points
97
- IF max_variance <= 15% → 18 points
98
- IF max_variance <= 20% → 12 points
99
- ELSE → 0 points
100
-
101
- veto_condition: |
102
- IF max_variance > 15% → REVIEW (significant scoring difference)
103
- IF max_variance > 25% → VETO (unreliable scoring)
104
- ```
105
-
106
- ### Dimension 3: CHECKPOINT MATCH (20 points)
107
-
108
- ```yaml
109
- checkpoint_match:
110
- weight: 20
111
- description: "Do binary checkpoints (true/false) match?"
112
-
113
- applies_to: "Tasks with binary checkpoint scoring"
114
-
115
- scoring:
116
- perfect_match: 20 # 100% checkpoints match
117
- high_match: 16 # 95-99% match
118
- moderate_match: 12 # 90-94% match
119
- low_match: 8 # 80-89% match
120
- poor_match: 0 # <80% match
121
-
122
- calculation: |
123
- FOR each item with checkpoints:
124
- FOR each checkpoint:
125
- match = (opus_checkpoint == haiku_checkpoint)
126
-
127
- match_rate = count(matches) / total_checkpoints
128
-
129
- IF match_rate == 1.0 → 20 points
130
- IF match_rate >= 0.95 → 16 points
131
- IF match_rate >= 0.90 → 12 points
132
- IF match_rate >= 0.80 → 8 points
133
- ELSE → 0 points
134
-
135
- note: |
136
- If task doesn't use binary checkpoints, award 20 points
137
- (dimension not applicable)
138
- ```
139
-
140
- ### Dimension 4: RECOMMENDATION QUALITY (10 points)
141
-
142
- ```yaml
143
- recommendation_quality:
144
- weight: 10
145
- description: "Do recommendations lead to same user actions?"
146
-
147
- scoring:
148
- same_actions: 10 # Same recommended actions
149
- similar_actions: 7 # Same direction, different specifics
150
- different_actions: 3 # Different recommendations
151
- contradictory: 0 # Opposite recommendations
152
-
153
- evaluation_criteria:
154
- - "Would user take same action based on each output?"
155
- - "Are priorities the same (what to do first)?"
156
- - "Are gaps/issues identified the same?"
157
-
158
- note: |
159
- This is the most subjective dimension.
160
- Focus on ACTIONABLE outcomes, not wording.
161
- ```
162
-
163
- ---
164
-
165
- ## Qualification Thresholds
166
-
167
- ```yaml
168
- qualification_decision:
169
- thresholds:
170
- QUALIFIED: ">= 85 points AND no veto triggered"
171
- CONDITIONAL: "70-84 points OR veto with mitigation possible"
172
- NOT_QUALIFIED: "< 70 points OR hard veto"
173
-
174
- veto_conditions:
175
- - id: "MTQ_VC_001"
176
- name: "Score Variance >15%"
177
- severity: "review"
178
-
179
- - id: "MTQ_VC_002"
180
- name: "Score Variance >25%"
181
- severity: "veto"
182
-
183
- - id: "MTQ_VC_003"
184
- name: "Tier Match <90%"
185
- severity: "review"
186
-
187
- - id: "MTQ_VC_004"
188
- name: "Tier Match <75%"
189
- severity: "veto"
190
-
191
- - id: "MTQ_VC_005"
192
- name: "Contradictory Recommendations"
193
- severity: "veto"
194
- ```
195
-
196
- ---
197
-
198
- ## Workflow
199
-
200
- ### Step 1: Load Inputs
201
-
202
- ```yaml
203
- step_1:
204
- action: "Read both output files and task definition"
205
- inputs:
206
- - opus_baseline
207
- - haiku_output
208
- - task_file
209
- validation:
210
- - "Both files exist and are valid YAML"
211
- - "Both files have same structure"
212
- - "Task file provides context for evaluation"
213
- ```
214
-
215
- ### Step 2: Extract Comparable Items
216
-
217
- ```yaml
218
- step_2:
219
- action: "Identify all items to compare"
220
- extract:
221
- - items: "List of scored items (sources, dimensions, etc.)"
222
- - scores: "Numerical scores per item"
223
- - tiers: "Classification tiers per item"
224
- - checkpoints: "Binary checkpoints if applicable"
225
- - recommendations: "Action items and priorities"
226
- ```
227
-
228
- ### Step 3: Calculate Dimension Scores
229
-
230
- ```yaml
231
- step_3:
232
- action: "Score each dimension using rubric"
233
-
234
- tier_match:
235
- calculate: "match_rate = matching_tiers / total_items"
236
- score: "Apply scoring table"
237
- check_veto: "match_rate < 0.75?"
238
-
239
- score_variance:
240
- calculate: "variance per item, take max"
241
- score: "Apply scoring table"
242
- check_veto: "max_variance > 25%?"
243
-
244
- checkpoint_match:
245
- calculate: "matching_checkpoints / total_checkpoints"
246
- score: "Apply scoring table"
247
-
248
- recommendation_quality:
249
- evaluate: "Would user take same action?"
250
- score: "Apply scoring table"
251
- check_veto: "Contradictory?"
252
- ```
253
-
254
- ### Step 4: Generate Report
255
-
256
- ```yaml
257
- step_4:
258
- action: "Generate qualification report"
259
-
260
- output_format: |
261
- qualification_report:
262
- task: "{task_name}"
263
- evaluation_date: "{ISO date}"
264
- evaluator: "opus"
265
-
266
- inputs:
267
- opus_baseline: "{path}"
268
- haiku_output: "{path}"
269
-
270
- dimension_scores:
271
- tier_match:
272
- score: X/40
273
- match_rate: X%
274
- details: [...]
275
-
276
- score_variance:
277
- score: X/30
278
- avg_variance: X%
279
- max_variance: X%
280
- details: [...]
281
-
282
- checkpoint_match:
283
- score: X/20
284
- match_rate: X%
285
- details: [...]
286
-
287
- recommendation_quality:
288
- score: X/10
289
- assessment: "same|similar|different|contradictory"
290
- details: [...]
291
-
292
- total_score: X/100
293
-
294
- veto_conditions:
295
- triggered: [...]
296
- not_triggered: [...]
297
-
298
- decision: "QUALIFIED | CONDITIONAL | NOT_QUALIFIED"
299
-
300
- rationale: |
301
- {Explanation of decision}
302
-
303
- recommendations:
304
- if_qualified: |
305
- - Update model-routing.yaml: tier = haiku
306
- - Add validated: true with test_date
307
- if_conditional: |
308
- - {Specific fixes needed}
309
- - Re-test after fixes
310
- if_not_qualified: |
311
- - Keep tier = opus
312
- - Document root cause
313
- ```
314
-
315
- ---
316
-
317
- ## Output
318
-
319
- Save qualification report to:
320
- ```
321
- squads/squad-creator-pro/test-cases/{task_name}/qualification-report.yaml
322
- ```
323
-
324
- ---
325
-
326
- ## Usage Example
327
-
328
- ```bash
329
- *compare-outputs \
330
- --task an-assess-sources \
331
- --opus squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml \
332
- --haiku squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml \
333
- --task-file squads/squad-creator-pro/tasks/an-assess-sources.md
334
- ```
335
-
336
- ---
337
-
338
- ## Completion Criteria
339
-
340
- - [ ] Both output files loaded and parsed
341
- - [ ] All 4 dimensions scored using rubric
342
- - [ ] Veto conditions checked
343
- - [ ] Total score calculated
344
- - [ ] Decision determined (QUALIFIED/CONDITIONAL/NOT_QUALIFIED)
345
- - [ ] Qualification report generated with full details
346
- - [ ] Report saved to test-cases/{task}/qualification-report.yaml
347
-
348
- ---
349
-
350
- ## Changelog
351
-
352
- | Version | Date | Changes |
353
- |---------|------|---------|
354
- | 1.0.0 | 2026-02-11 | Initial version with 4-dimension rubric |
1
+ # Task: Compare Model Outputs
2
+
3
+ **Command:** `*compare-outputs`
4
+ **Version:** 1.0.0
5
+ **Execution Type:** Agent (Opus ONLY - evaluator must be most capable model)
6
+ **Model:** `Opus` (REQUIRED - evaluator cannot be same tier as test subject)
7
+ **Purpose:** Systematic comparison of Opus baseline vs Haiku test outputs for Model Tier Qualification
8
+
9
+ ---
10
+
11
+ ## CRITICAL: Evaluator Independence
12
+
13
+ ```yaml
14
+ evaluator_rules:
15
+ model: "opus" # NEVER use Haiku to evaluate Haiku
16
+ blind_mode: false # We know which is which (baseline vs test)
17
+ bias_mitigation:
18
+ - "Score WHAT IS WRITTEN, not what you expect"
19
+ - "Do NOT assume Opus is better - measure objectively"
20
+ - "If outputs are equivalent, say so (don't force differences)"
21
+ ```
22
+
23
+ ---
24
+
25
+ ## Inputs
26
+
27
+ | Parameter | Type | Required | Description |
28
+ |-----------|------|----------|-------------|
29
+ | `task_name` | string | Yes | Task being evaluated (e.g., "an-assess-sources") |
30
+ | `opus_baseline` | file | Yes | Path to Opus output file |
31
+ | `haiku_output` | file | Yes | Path to Haiku output file |
32
+ | `task_file` | file | Yes | Original task definition (for reference) |
33
+
34
+ ---
35
+
36
+ ## Evaluation Rubric (100 points)
37
+
38
+ ### Dimension 1: TIER MATCH (40 points)
39
+
40
+ ```yaml
41
+ tier_match:
42
+ weight: 40
43
+ description: "Do both outputs classify items into the same tiers?"
44
+
45
+ scoring:
46
+ perfect_match: 40 # 100% of items have same tier
47
+ high_match: 32 # 90-99% same tier
48
+ moderate_match: 24 # 75-89% same tier
49
+ low_match: 16 # 50-74% same tier
50
+ poor_match: 0 # <50% same tier
51
+
52
+ calculation: |
53
+ match_rate = count(opus_tier == haiku_tier) / total_items
54
+
55
+ IF match_rate == 1.0 → 40 points
56
+ IF match_rate >= 0.9 → 32 points
57
+ IF match_rate >= 0.75 → 24 points
58
+ IF match_rate >= 0.5 → 16 points
59
+ ELSE → 0 points
60
+
61
+ veto_condition: |
62
+ IF match_rate < 0.75 → VETO (different tier = different user action)
63
+ Rationale: User decides based on tier, not score details
64
+ ```
65
+
66
+ ### Dimension 2: SCORE VARIANCE (30 points)
67
+
68
+ ```yaml
69
+ score_variance:
70
+ weight: 30
71
+ description: "Are numerical scores within acceptable variance?"
72
+
73
+ thresholds:
74
+ excellent: 5% # Scores within 5%
75
+ good: 10% # Scores within 10%
76
+ acceptable: 15% # Scores within 15%
77
+ poor: 20% # Scores within 20%
78
+ unacceptable: ">20%"
79
+
80
+ scoring:
81
+ within_5pct: 30
82
+ within_10pct: 24
83
+ within_15pct: 18
84
+ within_20pct: 12
85
+ beyond_20pct: 0
86
+
87
+ calculation: |
88
+ FOR each scored item:
89
+ variance = abs(opus_score - haiku_score) / opus_score * 100
90
+
91
+ avg_variance = mean(all variances)
92
+ max_variance = max(all variances)
93
+
94
+ # Use WORST case (max) for scoring, not average
95
+ IF max_variance <= 5% → 30 points
96
+ IF max_variance <= 10% → 24 points
97
+ IF max_variance <= 15% → 18 points
98
+ IF max_variance <= 20% → 12 points
99
+ ELSE → 0 points
100
+
101
+ veto_condition: |
102
+ IF max_variance > 15% → REVIEW (significant scoring difference)
103
+ IF max_variance > 25% → VETO (unreliable scoring)
104
+ ```
105
+
106
+ ### Dimension 3: CHECKPOINT MATCH (20 points)
107
+
108
+ ```yaml
109
+ checkpoint_match:
110
+ weight: 20
111
+ description: "Do binary checkpoints (true/false) match?"
112
+
113
+ applies_to: "Tasks with binary checkpoint scoring"
114
+
115
+ scoring:
116
+ perfect_match: 20 # 100% checkpoints match
117
+ high_match: 16 # 95-99% match
118
+ moderate_match: 12 # 90-94% match
119
+ low_match: 8 # 80-89% match
120
+ poor_match: 0 # <80% match
121
+
122
+ calculation: |
123
+ FOR each item with checkpoints:
124
+ FOR each checkpoint:
125
+ match = (opus_checkpoint == haiku_checkpoint)
126
+
127
+ match_rate = count(matches) / total_checkpoints
128
+
129
+ IF match_rate == 1.0 → 20 points
130
+ IF match_rate >= 0.95 → 16 points
131
+ IF match_rate >= 0.90 → 12 points
132
+ IF match_rate >= 0.80 → 8 points
133
+ ELSE → 0 points
134
+
135
+ note: |
136
+ If task doesn't use binary checkpoints, award 20 points
137
+ (dimension not applicable)
138
+ ```
139
+
140
+ ### Dimension 4: RECOMMENDATION QUALITY (10 points)
141
+
142
+ ```yaml
143
+ recommendation_quality:
144
+ weight: 10
145
+ description: "Do recommendations lead to same user actions?"
146
+
147
+ scoring:
148
+ same_actions: 10 # Same recommended actions
149
+ similar_actions: 7 # Same direction, different specifics
150
+ different_actions: 3 # Different recommendations
151
+ contradictory: 0 # Opposite recommendations
152
+
153
+ evaluation_criteria:
154
+ - "Would user take same action based on each output?"
155
+ - "Are priorities the same (what to do first)?"
156
+ - "Are gaps/issues identified the same?"
157
+
158
+ note: |
159
+ This is the most subjective dimension.
160
+ Focus on ACTIONABLE outcomes, not wording.
161
+ ```
162
+
163
+ ---
164
+
165
+ ## Qualification Thresholds
166
+
167
+ ```yaml
168
+ qualification_decision:
169
+ thresholds:
170
+ QUALIFIED: ">= 85 points AND no veto triggered"
171
+ CONDITIONAL: "70-84 points OR veto with mitigation possible"
172
+ NOT_QUALIFIED: "< 70 points OR hard veto"
173
+
174
+ veto_conditions:
175
+ - id: "MTQ_VC_001"
176
+ name: "Score Variance >15%"
177
+ severity: "review"
178
+
179
+ - id: "MTQ_VC_002"
180
+ name: "Score Variance >25%"
181
+ severity: "veto"
182
+
183
+ - id: "MTQ_VC_003"
184
+ name: "Tier Match <90%"
185
+ severity: "review"
186
+
187
+ - id: "MTQ_VC_004"
188
+ name: "Tier Match <75%"
189
+ severity: "veto"
190
+
191
+ - id: "MTQ_VC_005"
192
+ name: "Contradictory Recommendations"
193
+ severity: "veto"
194
+ ```
195
+
196
+ ---
197
+
198
+ ## Workflow
199
+
200
+ ### Step 1: Load Inputs
201
+
202
+ ```yaml
203
+ step_1:
204
+ action: "Read both output files and task definition"
205
+ inputs:
206
+ - opus_baseline
207
+ - haiku_output
208
+ - task_file
209
+ validation:
210
+ - "Both files exist and are valid YAML"
211
+ - "Both files have same structure"
212
+ - "Task file provides context for evaluation"
213
+ ```
214
+
215
+ ### Step 2: Extract Comparable Items
216
+
217
+ ```yaml
218
+ step_2:
219
+ action: "Identify all items to compare"
220
+ extract:
221
+ - items: "List of scored items (sources, dimensions, etc.)"
222
+ - scores: "Numerical scores per item"
223
+ - tiers: "Classification tiers per item"
224
+ - checkpoints: "Binary checkpoints if applicable"
225
+ - recommendations: "Action items and priorities"
226
+ ```
227
+
228
+ ### Step 3: Calculate Dimension Scores
229
+
230
+ ```yaml
231
+ step_3:
232
+ action: "Score each dimension using rubric"
233
+
234
+ tier_match:
235
+ calculate: "match_rate = matching_tiers / total_items"
236
+ score: "Apply scoring table"
237
+ check_veto: "match_rate < 0.75?"
238
+
239
+ score_variance:
240
+ calculate: "variance per item, take max"
241
+ score: "Apply scoring table"
242
+ check_veto: "max_variance > 25%?"
243
+
244
+ checkpoint_match:
245
+ calculate: "matching_checkpoints / total_checkpoints"
246
+ score: "Apply scoring table"
247
+
248
+ recommendation_quality:
249
+ evaluate: "Would user take same action?"
250
+ score: "Apply scoring table"
251
+ check_veto: "Contradictory?"
252
+ ```
253
+
254
+ ### Step 4: Generate Report
255
+
256
+ ```yaml
257
+ step_4:
258
+ action: "Generate qualification report"
259
+
260
+ output_format: |
261
+ qualification_report:
262
+ task: "{task_name}"
263
+ evaluation_date: "{ISO date}"
264
+ evaluator: "opus"
265
+
266
+ inputs:
267
+ opus_baseline: "{path}"
268
+ haiku_output: "{path}"
269
+
270
+ dimension_scores:
271
+ tier_match:
272
+ score: X/40
273
+ match_rate: X%
274
+ details: [...]
275
+
276
+ score_variance:
277
+ score: X/30
278
+ avg_variance: X%
279
+ max_variance: X%
280
+ details: [...]
281
+
282
+ checkpoint_match:
283
+ score: X/20
284
+ match_rate: X%
285
+ details: [...]
286
+
287
+ recommendation_quality:
288
+ score: X/10
289
+ assessment: "same|similar|different|contradictory"
290
+ details: [...]
291
+
292
+ total_score: X/100
293
+
294
+ veto_conditions:
295
+ triggered: [...]
296
+ not_triggered: [...]
297
+
298
+ decision: "QUALIFIED | CONDITIONAL | NOT_QUALIFIED"
299
+
300
+ rationale: |
301
+ {Explanation of decision}
302
+
303
+ recommendations:
304
+ if_qualified: |
305
+ - Update model-routing.yaml: tier = haiku
306
+ - Add validated: true with test_date
307
+ if_conditional: |
308
+ - {Specific fixes needed}
309
+ - Re-test after fixes
310
+ if_not_qualified: |
311
+ - Keep tier = opus
312
+ - Document root cause
313
+ ```
314
+
315
+ ---
316
+
317
+ ## Output
318
+
319
+ Save qualification report to:
320
+ ```
321
+ squads/squad-creator-pro/test-cases/{task_name}/qualification-report.yaml
322
+ ```
323
+
324
+ ---
325
+
326
+ ## Usage Example
327
+
328
+ ```bash
329
+ *compare-outputs \
330
+ --task an-assess-sources \
331
+ --opus squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml \
332
+ --haiku squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml \
333
+ --task-file squads/squad-creator-pro/tasks/an-assess-sources.md
334
+ ```
335
+
336
+ ---
337
+
338
+ ## Completion Criteria
339
+
340
+ - [ ] Both output files loaded and parsed
341
+ - [ ] All 4 dimensions scored using rubric
342
+ - [ ] Veto conditions checked
343
+ - [ ] Total score calculated
344
+ - [ ] Decision determined (QUALIFIED/CONDITIONAL/NOT_QUALIFIED)
345
+ - [ ] Qualification report generated with full details
346
+ - [ ] Report saved to test-cases/{task}/qualification-report.yaml
347
+
348
+ ---
349
+
350
+ ## Changelog
351
+
352
+ | Version | Date | Changes |
353
+ |---------|------|---------|
354
+ | 1.0.0 | 2026-02-11 | Initial version with 4-dimension rubric |