aiox-core 5.0.2 → 5.0.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.aiox-core/core/execution/predictive-pipeline.js +1283 -0
- package/.aiox-core/core/memory/decision-memory.js +564 -0
- package/.aiox-core/data/entity-registry.yaml +1068 -1043
- package/.aiox-core/data/registry-update-log.jsonl +2 -2
- package/.aiox-core/development/templates/service-template/README.md.hbs +158 -158
- package/.aiox-core/development/templates/service-template/__tests__/index.test.ts.hbs +237 -237
- package/.aiox-core/development/templates/service-template/client.ts.hbs +403 -403
- package/.aiox-core/development/templates/service-template/errors.ts.hbs +182 -182
- package/.aiox-core/development/templates/service-template/index.ts.hbs +120 -120
- package/.aiox-core/development/templates/service-template/package.json.hbs +87 -87
- package/.aiox-core/development/templates/service-template/types.ts.hbs +145 -145
- package/.aiox-core/development/templates/squad-template/LICENSE +21 -21
- package/.aiox-core/infrastructure/templates/aiox-sync.yaml.template +182 -182
- package/.aiox-core/infrastructure/templates/coderabbit.yaml.template +279 -279
- package/.aiox-core/infrastructure/templates/github-workflows/ci.yml.template +169 -169
- package/.aiox-core/infrastructure/templates/github-workflows/pr-automation.yml.template +330 -330
- package/.aiox-core/infrastructure/templates/github-workflows/release.yml.template +196 -196
- package/.aiox-core/infrastructure/templates/gitignore/gitignore-aiox-base.tmpl +63 -63
- package/.aiox-core/infrastructure/templates/gitignore/gitignore-brownfield-merge.tmpl +18 -18
- package/.aiox-core/infrastructure/templates/gitignore/gitignore-node.tmpl +85 -85
- package/.aiox-core/infrastructure/templates/gitignore/gitignore-python.tmpl +145 -145
- package/.aiox-core/install-manifest.yaml +63 -55
- package/.aiox-core/local-config.yaml.template +71 -71
- package/.aiox-core/monitor/hooks/lib/__init__.py +1 -1
- package/.aiox-core/monitor/hooks/lib/enrich.py +58 -58
- package/.aiox-core/monitor/hooks/lib/send_event.py +47 -47
- package/.aiox-core/monitor/hooks/notification.py +29 -29
- package/.aiox-core/monitor/hooks/post_tool_use.py +45 -45
- package/.aiox-core/monitor/hooks/pre_compact.py +29 -29
- package/.aiox-core/monitor/hooks/pre_tool_use.py +40 -40
- package/.aiox-core/monitor/hooks/stop.py +29 -29
- package/.aiox-core/monitor/hooks/subagent_stop.py +29 -29
- package/.aiox-core/monitor/hooks/user_prompt_submit.py +38 -38
- package/.aiox-core/product/templates/adr.hbs +125 -125
- package/.aiox-core/product/templates/dbdr.hbs +241 -241
- package/.aiox-core/product/templates/epic.hbs +212 -212
- package/.aiox-core/product/templates/pmdr.hbs +186 -186
- package/.aiox-core/product/templates/prd-v2.0.hbs +216 -216
- package/.aiox-core/product/templates/prd.hbs +201 -201
- package/.aiox-core/product/templates/story.hbs +263 -263
- package/.aiox-core/product/templates/task.hbs +170 -170
- package/.aiox-core/product/templates/tmpl-comment-on-examples.sql +158 -158
- package/.aiox-core/product/templates/tmpl-migration-script.sql +91 -91
- package/.aiox-core/product/templates/tmpl-rls-granular-policies.sql +104 -104
- package/.aiox-core/product/templates/tmpl-rls-kiss-policy.sql +10 -10
- package/.aiox-core/product/templates/tmpl-rls-roles.sql +135 -135
- package/.aiox-core/product/templates/tmpl-rls-simple.sql +77 -77
- package/.aiox-core/product/templates/tmpl-rls-tenant.sql +152 -152
- package/.aiox-core/product/templates/tmpl-rollback-script.sql +77 -77
- package/.aiox-core/product/templates/tmpl-seed-data.sql +140 -140
- package/.aiox-core/product/templates/tmpl-smoke-test.sql +16 -16
- package/.aiox-core/product/templates/tmpl-staging-copy-merge.sql +139 -139
- package/.aiox-core/product/templates/tmpl-stored-proc.sql +140 -140
- package/.aiox-core/product/templates/tmpl-trigger.sql +152 -152
- package/.aiox-core/product/templates/tmpl-view-materialized.sql +133 -133
- package/.aiox-core/product/templates/tmpl-view.sql +177 -177
- package/.aiox-core/scripts/pm.sh +0 -0
- package/.claude/hooks/enforce-architecture-first.py +196 -196
- package/.claude/hooks/mind-clone-governance.py +192 -192
- package/.claude/hooks/read-protection.py +151 -151
- package/.claude/hooks/slug-validation.py +176 -176
- package/.claude/hooks/sql-governance.py +182 -182
- package/.claude/hooks/write-path-validation.py +194 -194
- package/LICENSE +33 -33
- package/bin/aiox-graph.js +0 -0
- package/bin/aiox-minimal.js +0 -0
- package/bin/aiox.js +0 -0
- package/package.json +6 -1
- package/packages/aiox-install/bin/aiox-install.js +0 -0
- package/packages/aiox-install/bin/edmcp.js +0 -0
- package/packages/aiox-pro-cli/bin/aiox-pro.js +0 -0
- package/packages/installer/src/wizard/pro-setup.js +28 -0
- package/pro/README.md +66 -66
- package/pro/feature-registry.yaml +225 -0
- package/pro/license/license-api.js +701 -679
- package/pro/package.json +39 -0
- package/pro/pro-config.yaml +63 -0
- package/pro/squads/README.md +24 -0
- package/pro/squads/design/HEADLINE.md +3 -0
- package/pro/squads/design/README.md +109 -0
- package/pro/squads/design/agents/brad-frost.md +1097 -0
- package/pro/squads/design/agents/dan-mall.md +857 -0
- package/pro/squads/design/agents/dave-malouf.md +2272 -0
- package/pro/squads/design/agents/design-chief.md +114 -0
- package/pro/squads/design/agents/ds-foundations-lead.md +194 -0
- package/pro/squads/design/agents/ds-token-architect.md +361 -0
- package/pro/squads/design/agents/nano-banana-generator.md +162 -0
- package/pro/squads/design/agents/storybook-expert.md +809 -0
- package/pro/squads/design/checklists/atomic-refactor-checklist.md +299 -0
- package/pro/squads/design/checklists/component-adaptation-checklist.md +81 -0
- package/pro/squads/design/checklists/design-fidelity-checklist.md +283 -0
- package/pro/squads/design/checklists/design-handoff-checklist.md +55 -0
- package/pro/squads/design/checklists/design-team-health-checklist.md +454 -0
- package/pro/squads/design/checklists/designops-maturity-checklist.md +518 -0
- package/pro/squads/design/checklists/ds-a11y-release-gate-checklist.md +45 -0
- package/pro/squads/design/checklists/ds-accessibility-wcag-checklist.md +147 -0
- package/pro/squads/design/checklists/ds-component-quality-checklist.md +150 -0
- package/pro/squads/design/checklists/ds-critical-eye-review-checklist.md +147 -0
- package/pro/squads/design/checklists/ds-migration-readiness-checklist.md +99 -0
- package/pro/squads/design/checklists/ds-pattern-audit-checklist.md +164 -0
- package/pro/squads/design/checklists/reading-accessibility-checklist.md +275 -0
- package/pro/squads/design/checklists/token-mapping-checklist.md +107 -0
- package/pro/squads/design/config/coding-standards.md +286 -0
- package/pro/squads/design/config/source-tree.md +59 -0
- package/pro/squads/design/config/tech-stack.md +48 -0
- package/pro/squads/design/config.yaml +204 -0
- package/pro/squads/design/data/agentic-design-systems-guide.md +46 -0
- package/pro/squads/design/data/agentic-ds-principles.md +100 -0
- package/pro/squads/design/data/atomic-design-principles.md +108 -0
- package/pro/squads/design/data/atomic-refactor-rules.md +582 -0
- package/pro/squads/design/data/base-component-specs.md +972 -0
- package/pro/squads/design/data/brad-frost-analysis-extract-implicit.yaml +270 -0
- package/pro/squads/design/data/brad-frost-analysis-find-0.8.yaml +176 -0
- package/pro/squads/design/data/brad-frost-analysis-qa-report.yaml +168 -0
- package/pro/squads/design/data/brad-frost-dna.yaml +713 -0
- package/pro/squads/design/data/capability-tools.yaml +124 -0
- package/pro/squads/design/data/component-adaptation-changelog.md +318 -0
- package/pro/squads/design/data/consolidation-algorithms.md +168 -0
- package/pro/squads/design/data/critical-eye-scoring-rules.yaml +240 -0
- package/pro/squads/design/data/design-token-best-practices.md +107 -0
- package/pro/squads/design/data/design-tokens-spec.yaml +418 -0
- package/pro/squads/design/data/ds-reference-architectures.md +93 -0
- package/pro/squads/design/data/f2-qa-report.md +168 -0
- package/pro/squads/design/data/f3-derived-components-changelog.md +100 -0
- package/pro/squads/design/data/f3-qa-report.md +208 -0
- package/pro/squads/design/data/figma-base-components-raw.md +102 -0
- package/pro/squads/design/data/figma-tokens-raw.md +1549 -0
- package/pro/squads/design/data/fluent2-design-principles.md +114 -0
- package/pro/squads/design/data/high-retention-reading-guide.md +349 -0
- package/pro/squads/design/data/integration-patterns.md +207 -0
- package/pro/squads/design/data/internal-quality-chain.yaml +48 -0
- package/pro/squads/design/data/motion-tokens-guide.md +202 -0
- package/pro/squads/design/data/roi-calculation-guide.md +142 -0
- package/pro/squads/design/data/token-mapping-reference.md +213 -0
- package/pro/squads/design/data/w3c-dtcg-spec-reference.md +149 -0
- package/pro/squads/design/data/wcag-compliance-guide.md +267 -0
- package/pro/squads/design/docs/AUDIT_REPORT.md +97 -0
- package/pro/squads/design/docs/DS-CURATION-PIPELINE-PROPOSAL.md +577 -0
- package/pro/squads/design/docs/UPGRADE_PLAN.md +618 -0
- package/pro/squads/design/docs/brad-frost-research-validation.md +372 -0
- package/pro/squads/design/docs/dave-malouf-research-validation.md +391 -0
- package/pro/squads/design/docs/tool-discovery-report.md +87 -0
- package/pro/squads/design/docs/tool-integration-plan.md +44 -0
- package/pro/squads/design/protocols/ai-first-governance.md +56 -0
- package/pro/squads/design/protocols/governance-execution-boundary.md +59 -0
- package/pro/squads/design/protocols/handoff.md +60 -0
- package/pro/squads/design/rules/.claude-rules.md +88 -0
- package/pro/squads/design/scripts/design-system/curate_colors.cjs +447 -0
- package/pro/squads/design/scripts/design-system/curate_components.cjs +217 -0
- package/pro/squads/design/scripts/design-system/curate_radius.cjs +190 -0
- package/pro/squads/design/scripts/design-system/curate_shadows.cjs +208 -0
- package/pro/squads/design/scripts/design-system/curate_spacing.cjs +243 -0
- package/pro/squads/design/scripts/design-system/curate_typography.cjs +404 -0
- package/pro/squads/design/scripts/design-system/design-system-metadata.test.js +49 -0
- package/pro/squads/design/scripts/design-system/design_manifest_lib.cjs +142 -0
- package/pro/squads/design/scripts/design-system/fetch_page_images.cjs +195 -0
- package/pro/squads/design/scripts/design-system/generate_components_metadata.cjs +114 -0
- package/pro/squads/design/scripts/design-system/generate_curation_report.cjs +258 -0
- package/pro/squads/design/scripts/design-system/generate_tokens.cjs +342 -0
- package/pro/squads/design/scripts/design-system/sync_design_manifest.cjs +27 -0
- package/pro/squads/design/scripts/design-system/test_mcp_tools.cjs +232 -0
- package/pro/squads/design/scripts/design-system/validate_components_metadata.cjs +96 -0
- package/pro/squads/design/scripts/design-system/validate_curation.cjs +226 -0
- package/pro/squads/design/scripts/design-system/validate_design_manifest_drift.cjs +72 -0
- package/pro/squads/design/scripts/design-system/validate_mcp_skeleton.cjs +38 -0
- package/pro/squads/design/scripts/design-system/validate_registry.cjs +186 -0
- package/pro/squads/design/scripts/design-system/validate_task_checklist_bindings.cjs +78 -0
- package/pro/squads/design/scripts/dissect-artifact.cjs +806 -0
- package/pro/squads/design/scripts/validate-a11y-integration.cjs +40 -0
- package/pro/squads/design/scripts/validate-design-squad.py +411 -0
- package/pro/squads/design/squad.yaml +714 -0
- package/pro/squads/design/tasks/a11y-audit.md +340 -0
- package/pro/squads/design/tasks/aria-audit.md +525 -0
- package/pro/squads/design/tasks/atomic-refactor-execute.md +391 -0
- package/pro/squads/design/tasks/atomic-refactor-plan.md +262 -0
- package/pro/squads/design/tasks/audit-reading-experience.md +350 -0
- package/pro/squads/design/tasks/audit-tailwind-config.md +101 -0
- package/pro/squads/design/tasks/bootstrap-shadcn-library.md +96 -0
- package/pro/squads/design/tasks/bundle-audit.md +245 -0
- package/pro/squads/design/tasks/contrast-matrix.md +373 -0
- package/pro/squads/design/tasks/create-doc.md +135 -0
- package/pro/squads/design/tasks/dead-code-detection.md +329 -0
- package/pro/squads/design/tasks/design-compare.md +414 -0
- package/pro/squads/design/tasks/design-process-optimization.md +407 -0
- package/pro/squads/design/tasks/design-review-orchestration.md +99 -0
- package/pro/squads/design/tasks/design-team-scaling.md +407 -0
- package/pro/squads/design/tasks/design-tooling-audit.md +404 -0
- package/pro/squads/design/tasks/design-triage.md +89 -0
- package/pro/squads/design/tasks/designops-maturity-assessment.md +364 -0
- package/pro/squads/design/tasks/designops-metrics-setup.md +465 -0
- package/pro/squads/design/tasks/ds-agentic-audit.md +100 -0
- package/pro/squads/design/tasks/ds-agentic-setup.md +103 -0
- package/pro/squads/design/tasks/ds-audit-codebase.md +273 -0
- package/pro/squads/design/tasks/ds-build-component.md +349 -0
- package/pro/squads/design/tasks/ds-build-mcp-server.md +84 -0
- package/pro/squads/design/tasks/ds-calculate-roi.md +282 -0
- package/pro/squads/design/tasks/ds-compose-molecule.md +106 -0
- package/pro/squads/design/tasks/ds-consolidate-patterns.md +253 -0
- package/pro/squads/design/tasks/ds-context-contract.md +194 -0
- package/pro/squads/design/tasks/ds-critical-eye-compare.md +130 -0
- package/pro/squads/design/tasks/ds-critical-eye-decide.md +139 -0
- package/pro/squads/design/tasks/ds-critical-eye-inventory.md +111 -0
- package/pro/squads/design/tasks/ds-critical-eye-report.md +101 -0
- package/pro/squads/design/tasks/ds-critical-eye-score.md +109 -0
- package/pro/squads/design/tasks/ds-designops.md +99 -0
- package/pro/squads/design/tasks/ds-extend-pattern.md +91 -0
- package/pro/squads/design/tasks/ds-extract-tokens.md +312 -0
- package/pro/squads/design/tasks/ds-figma-pipeline.md +95 -0
- package/pro/squads/design/tasks/ds-fluent-audit.md +105 -0
- package/pro/squads/design/tasks/ds-fluent-build.md +110 -0
- package/pro/squads/design/tasks/ds-generate-ai-metadata.md +81 -0
- package/pro/squads/design/tasks/ds-generate-cursor-rules.md +74 -0
- package/pro/squads/design/tasks/ds-generate-documentation.md +101 -0
- package/pro/squads/design/tasks/ds-generate-migration-strategy.md +331 -0
- package/pro/squads/design/tasks/ds-generate-shock-report.md +323 -0
- package/pro/squads/design/tasks/ds-govern-a11y-compliance.md +93 -0
- package/pro/squads/design/tasks/ds-governance.md +187 -0
- package/pro/squads/design/tasks/ds-health-metrics.md +278 -0
- package/pro/squads/design/tasks/ds-integrate-squad.md +130 -0
- package/pro/squads/design/tasks/ds-integrate-workspace.md +100 -0
- package/pro/squads/design/tasks/ds-legacy-modernization.md +302 -0
- package/pro/squads/design/tasks/ds-mcp-status.md +65 -0
- package/pro/squads/design/tasks/ds-motion-audit.md +118 -0
- package/pro/squads/design/tasks/ds-multi-framework.md +96 -0
- package/pro/squads/design/tasks/ds-parallelization-gate.md +246 -0
- package/pro/squads/design/tasks/ds-query.md +90 -0
- package/pro/squads/design/tasks/ds-rebuild-artifact.md +369 -0
- package/pro/squads/design/tasks/ds-reverse-engineer.md +194 -0
- package/pro/squads/design/tasks/ds-scan-artifact.md +131 -0
- package/pro/squads/design/tasks/ds-setup-design-system.md +297 -0
- package/pro/squads/design/tasks/ds-sync-registry.md +287 -0
- package/pro/squads/design/tasks/ds-theme-multi-brand.md +90 -0
- package/pro/squads/design/tasks/ds-token-modes.md +108 -0
- package/pro/squads/design/tasks/ds-token-w3c-extract.md +105 -0
- package/pro/squads/design/tasks/ds-validate-ai-readiness.md +69 -0
- package/pro/squads/design/tasks/ds-visual-regression.md +130 -0
- package/pro/squads/design/tasks/execute-checklist.md +141 -0
- package/pro/squads/design/tasks/export-design-tokens-dtcg.md +97 -0
- package/pro/squads/design/tasks/f1-apply-foundations.md +154 -0
- package/pro/squads/design/tasks/f1-ingest-figma-tokens.md +130 -0
- package/pro/squads/design/tasks/f1-map-tokens-to-shadcn.md +145 -0
- package/pro/squads/design/tasks/f1-qa-foundations.md +95 -0
- package/pro/squads/design/tasks/f2-adapt-shadcn-components.md +155 -0
- package/pro/squads/design/tasks/f2-ingest-base-components.md +148 -0
- package/pro/squads/design/tasks/f2-qa-base-components.md +98 -0
- package/pro/squads/design/tasks/f3-derive-components.md +145 -0
- package/pro/squads/design/tasks/f3-qa-derived-components.md +101 -0
- package/pro/squads/design/tasks/focus-order-audit.md +450 -0
- package/pro/squads/design/tasks/sb-brownfield-migrate.md +367 -0
- package/pro/squads/design/tasks/sb-brownfield-scan.md +318 -0
- package/pro/squads/design/tasks/sb-configure.md +230 -0
- package/pro/squads/design/tasks/sb-expand-shadcn.md +213 -0
- package/pro/squads/design/tasks/sb-generate-all-stories.md +288 -0
- package/pro/squads/design/tasks/sb-install.md +152 -0
- package/pro/squads/design/tasks/sb-sync-workspace.md +239 -0
- package/pro/squads/design/tasks/sb-verify.md +203 -0
- package/pro/squads/design/tasks/tailwind-upgrade.md +117 -0
- package/pro/squads/design/tasks/token-usage-analytics.md +262 -0
- package/pro/squads/design/tasks/ux-rewrite-sixth-grade.md +82 -0
- package/pro/squads/design/tasks/validate-design-fidelity.md +222 -0
- package/pro/squads/design/templates/agent-template.yaml +46 -0
- package/pro/squads/design/templates/clone-mind-template.md +352 -0
- package/pro/squads/design/templates/component-prompt-injection-tmpl.md +236 -0
- package/pro/squads/design/templates/component-visual-spec-tmpl.md +378 -0
- package/pro/squads/design/templates/critical-eye-cycle-report-tmpl.md +165 -0
- package/pro/squads/design/templates/design-fidelity-report-tmpl.md +155 -0
- package/pro/squads/design/templates/ds-ai-component-metadata-schema-tmpl.json +138 -0
- package/pro/squads/design/templates/ds-artifact-analysis.md +70 -0
- package/pro/squads/design/templates/ds-health-report-tmpl.md +236 -0
- package/pro/squads/design/templates/ds-migration-strategy-tmpl.md +524 -0
- package/pro/squads/design/templates/ds-state-persistence-tmpl.yaml +194 -0
- package/pro/squads/design/templates/ds-tokens-schema-tmpl.yaml +139 -0
- package/pro/squads/design/templates/migration-strategy-tmpl.md +524 -0
- package/pro/squads/design/templates/reading-design-tokens.css +26 -0
- package/pro/squads/design/templates/state-persistence-tmpl.yaml +219 -0
- package/pro/squads/design/templates/tokens-schema-tmpl.yaml +305 -0
- package/pro/squads/design/workflows/agentic-readiness.yaml +83 -0
- package/pro/squads/design/workflows/audit-only.yaml +198 -0
- package/pro/squads/design/workflows/brownfield-complete.yaml +257 -0
- package/pro/squads/design/workflows/critical-eye.yaml +184 -0
- package/pro/squads/design/workflows/dtcg-tokens-governance.yaml +64 -0
- package/pro/squads/design/workflows/foundations-pipeline.yaml +192 -0
- package/pro/squads/design/workflows/greenfield-new.yaml +192 -0
- package/pro/squads/design/workflows/motion-quality.yaml +65 -0
- package/pro/squads/design/workflows/self-healing-workflow.yaml +237 -0
- package/pro/squads/design/workflows/storybook-brownfield-migration.yaml +400 -0
- package/pro/squads/design/workflows/storybook-full-setup.yaml +280 -0
- package/pro/squads/index.js +145 -0
- package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/ARQUITETURA_COGNITIVA_DE_ALEX_HORMOZI_EXTRAÇÃO_COMPLETA.md +215 -0
- package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/A_Rotina_de_Alta_Performance_de_Alex_Hormozi_Arquitetura,_Motivações_e_Replicação.md +309 -0
- package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/O_sistema_completo_de_criação_de_conteúdo_de_Alex_Hormozi.md +416 -0
- package/pro/squads/mmos-squad/minds/alex_hormozi/artifacts/Processo_Criação_Conteúdo_Hormozi.md +0 -0
- package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/DECISÕES_ESTRATÉGICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
- package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTAÇÃO_ATOMIC_DESIGN.md +797 -0
- package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/O_Cemitério_de_Design_Systems.md +447 -0
- package/pro/squads/mmos-squad/minds/brad_frost/.backup/2026-01-13/artifacts/PRINCÍPIOS_DE_RACIOCÍNIO.md +190 -0
- package/pro/squads/mmos-squad/minds/brad_frost/artifacts/DECISÕES_ESTRATÉGICAS_DE_DESIGN_SYSTEMS_(2022_2025).md +1038 -0
- package/pro/squads/mmos-squad/minds/brad_frost/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTAÇÃO_ATOMIC_DESIGN.md +797 -0
- package/pro/squads/mmos-squad/minds/brad_frost/artifacts/O_Cemitério_de_Design_Systems.md +447 -0
- package/pro/squads/mmos-squad/minds/brad_frost/artifacts/PRINCÍPIOS_DE_RACIOCÍNIO.md +190 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/ANÁLISE_PSICOMÉTRICA_PROFUNDA_ELON_MUSK.md +291 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/ASSINATURA_LINGUÍSTICA_ELON_MUSK.md +485 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/A_Arquitetura_Mental_de_Elon_Musk_Uma_Análise_Sistemática_dos_Frameworks_de_Pensamento.md +907 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Dossiê_Estratégico_A_Arquitetura_Psicológica_de_Elon_Musk.md +252 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Os_Padrões_de_Leitura_de_Elon_Musk_e_Sua_Influência_Sistemática.md +287 -0
- package/pro/squads/mmos-squad/minds/elon_musk/artifacts/Uma_análise_psicológica_abrangente.md +187 -0
- package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/ANÁLISE_PSICOMÉTRICA_PROFUNDA_EUGENE_M._SCHWARTZ.md +790 -0
- package/pro/squads/mmos-squad/minds/eugene_schwartz/artifacts/Análise_Completa_Eugene_Schwartz_Arquitetura_Cognitiva_DEEP.md +210 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/5H_EXTRAÇÃO_COGNITIVA_COMPLETA_PEDRO_VALÉRIO_LOPEZ.md +226 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/ANÁLISE_COMPARATIVA_REVISADA_PEDRO_VALÉRIO_LOPEZ.md +246 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/ANÁLISE_LINGUÍSTICA_CARIOCA_PEDRO_VALÉRIO_LOPEZ.md +274 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/ANÁLISE_PSICOMÉTRICA_DEFINITIVA_PEDRO_VALÉRIO_LOPEZ.md +821 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/ANÁLISE_PSICOMÉTRICA_PROFUNDA_PEDRO_VALÉRIO.md +1844 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/CÁLCULO_DE_RARIDADE_ESTATÍSTICA_PEDRO_VALÉRIO_LOPEZ.md +154 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/EXTRAÇÃO_PEDRO_VALÉRIO.md +237 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/MAPEAMENTO_LINGUÍSTICO_PROFUNDO.md +161 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/META_AXIOMAS_DE_PEDRO_VALÉRIO.md +256 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOLÓGICO_COGNITIVO_PEDRO_VALÉRIO_LOPEZ.md +586 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/SISTEMA_IMUNOLÓGICO_COGNITIVO_V2_—_CLONE_IA.md +452 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/TABELA_COMPARATIVA_ANÁLISE_COMPLETA_DOS_CLONES_IA.md +102 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/WHATSAPP_PADRÕES_LINGUÍSTICOS_PEDRO_VALÉRIO_LOPEZ.md +286 -0
- package/pro/squads/mmos-squad/minds/pedro_valerio/sources/artifacts_v1.6/heurísticas_de_decisão_e_algoritmos_mentais_únicos.md +268 -0
- package/pro/squads/mmos-squad/minds/ray_kurzweil/sources/books/PROTOCOLO_COMPLETO_DE_INTERROGAÇÃO_-_NAVAL_RAVIKANT.md +3624 -0
- package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/FRAMEWORK_COMPLETO_DE_IMPLEMENTAÇÃO_JOBS.md +488 -0
- package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Framework_Cabeça_Steve.md +257 -0
- package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Relatório_Abrangente_sobre_Steve_Jobs_para_Criação_de_Clone_de_IA.md +370 -0
- package/pro/squads/mmos-squad/minds/steve_jobs/artifacts/Steve_Jobs_Análise_Psicológica_Profunda_e_Validação_Comportamental.md +65 -0
- package/pro/squads/squad-creator-pro/.state.json +32 -0
- package/pro/squads/squad-creator-pro/CHANGELOG.md +275 -0
- package/pro/squads/squad-creator-pro/HEADLINE.md +3 -0
- package/pro/squads/squad-creator-pro/README.md +1059 -0
- package/pro/squads/squad-creator-pro/agents/oalanicolas.md +438 -0
- package/pro/squads/squad-creator-pro/agents/pedro-valerio.md +449 -0
- package/pro/squads/squad-creator-pro/agents/squad-chief.md +1651 -0
- package/pro/squads/squad-creator-pro/agents/thiago_finch.md +976 -0
- package/pro/squads/squad-creator-pro/assessments/axioma-assessment-wf-create-squad.yaml +325 -0
- package/pro/squads/squad-creator-pro/checklists/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/checklists/agent-depth-checklist.md +244 -0
- package/pro/squads/squad-creator-pro/checklists/agent-quality-gate.md +434 -0
- package/pro/squads/squad-creator-pro/checklists/create-agent-checklist.md +184 -0
- package/pro/squads/squad-creator-pro/checklists/create-squad-checklist.md +219 -0
- package/pro/squads/squad-creator-pro/checklists/create-workflow-checklist.md +224 -0
- package/pro/squads/squad-creator-pro/checklists/deep-research-quality.md +506 -0
- package/pro/squads/squad-creator-pro/checklists/executor-matrix-checklist.md +260 -0
- package/pro/squads/squad-creator-pro/checklists/mental-model-integration-checklist.md +95 -0
- package/pro/squads/squad-creator-pro/checklists/mind-validation.md +374 -0
- package/pro/squads/squad-creator-pro/checklists/quality-gate-checklist.md +385 -0
- package/pro/squads/squad-creator-pro/checklists/smoke-test-agent.md +313 -0
- package/pro/squads/squad-creator-pro/checklists/sop-validation.md +250 -0
- package/pro/squads/squad-creator-pro/checklists/squad-checklist.md +1014 -0
- package/pro/squads/squad-creator-pro/checklists/squad-overview-checklist.md +393 -0
- package/pro/squads/squad-creator-pro/checklists/task-anatomy-checklist.md +626 -0
- package/pro/squads/squad-creator-pro/config/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/config/axioma-validator.yaml +371 -0
- package/pro/squads/squad-creator-pro/config/heuristics.yaml +753 -0
- package/pro/squads/squad-creator-pro/config/model-routing.yaml +693 -0
- package/pro/squads/squad-creator-pro/config/quality-gates.yaml +415 -0
- package/pro/squads/squad-creator-pro/config/scoring-rubric.yaml +199 -0
- package/pro/squads/squad-creator-pro/config/squad-config.yaml +165 -0
- package/pro/squads/squad-creator-pro/config/task-anatomy.yaml +263 -0
- package/pro/squads/squad-creator-pro/config/veto-conditions.yaml +455 -0
- package/pro/squads/squad-creator-pro/config.yaml +35 -0
- package/pro/squads/squad-creator-pro/data/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/data/an-anchor-words.yaml +78 -0
- package/pro/squads/squad-creator-pro/data/an-clone-anti-patterns.yaml +148 -0
- package/pro/squads/squad-creator-pro/data/an-clone-validation.yaml +190 -0
- package/pro/squads/squad-creator-pro/data/an-diagnostic-framework.yaml +164 -0
- package/pro/squads/squad-creator-pro/data/an-output-examples.yaml +102 -0
- package/pro/squads/squad-creator-pro/data/an-source-signals.yaml +98 -0
- package/pro/squads/squad-creator-pro/data/an-source-tiers.yaml +119 -0
- package/pro/squads/squad-creator-pro/data/best-practices.md +986 -0
- package/pro/squads/squad-creator-pro/data/core-heuristics.md +510 -0
- package/pro/squads/squad-creator-pro/data/decision-heuristics-framework.md +620 -0
- package/pro/squads/squad-creator-pro/data/executor-decision-tree.md +774 -0
- package/pro/squads/squad-creator-pro/data/executor-matrix-framework.md +441 -0
- package/pro/squads/squad-creator-pro/data/fusion-decision-points-analysis.md +397 -0
- package/pro/squads/squad-creator-pro/data/fusion-executor-analysis.md +677 -0
- package/pro/squads/squad-creator-pro/data/hybridops-patterns.md +1351 -0
- package/pro/squads/squad-creator-pro/data/internal-infrastructure-library.yaml +99 -0
- package/pro/squads/squad-creator-pro/data/mental-model-task-matrix.yaml +692 -0
- package/pro/squads/squad-creator-pro/data/pipeline-patterns.md +352 -0
- package/pro/squads/squad-creator-pro/data/pm-best-practices.md +440 -0
- package/pro/squads/squad-creator-pro/data/pv-anchor-words.yaml +64 -0
- package/pro/squads/squad-creator-pro/data/pv-authenticity-markers.yaml +200 -0
- package/pro/squads/squad-creator-pro/data/pv-meta-axiomas.yaml +162 -0
- package/pro/squads/squad-creator-pro/data/pv-output-examples.yaml +342 -0
- package/pro/squads/squad-creator-pro/data/pv-workflow-validation.yaml +318 -0
- package/pro/squads/squad-creator-pro/data/quality-dimensions-framework.md +405 -0
- package/pro/squads/squad-creator-pro/data/squad-analytics-guide.md +252 -0
- package/pro/squads/squad-creator-pro/data/squad-kb.md +987 -0
- package/pro/squads/squad-creator-pro/data/squad-registry.yaml +841 -0
- package/pro/squads/squad-creator-pro/data/squad-type-definitions.yaml +578 -0
- package/pro/squads/squad-creator-pro/data/tier-system-framework.md +475 -0
- package/pro/squads/squad-creator-pro/data/tool-evaluation-framework.md +847 -0
- package/pro/squads/squad-creator-pro/data/tool-registry.yaml +700 -0
- package/pro/squads/squad-creator-pro/docs/ADR-001-model-tier-qualification.md +344 -0
- package/pro/squads/squad-creator-pro/docs/AGENT-COLLABORATION.md +609 -0
- package/pro/squads/squad-creator-pro/docs/ARCHITECTURE-DIAGRAMS.md +1466 -0
- package/pro/squads/squad-creator-pro/docs/COMMANDS.md +544 -0
- package/pro/squads/squad-creator-pro/docs/CONCEPTS.md +584 -0
- package/pro/squads/squad-creator-pro/docs/FAQ.md +731 -0
- package/pro/squads/squad-creator-pro/docs/HITL-FLOW.md +255 -0
- package/pro/squads/squad-creator-pro/docs/MIGRATION-PLAN-AGENT-CONFORMITY.md +861 -0
- package/pro/squads/squad-creator-pro/docs/MIGRATION-ROADMAP-HYBRIDOPS.md +1161 -0
- package/pro/squads/squad-creator-pro/docs/MODEL-TIER-QUALIFICATION.md +337 -0
- package/pro/squads/squad-creator-pro/docs/PATTERN-LIBRARY.md +333 -0
- package/pro/squads/squad-creator-pro/docs/PEDRO-VALERIO-ARCHITECTURE.md +456 -0
- package/pro/squads/squad-creator-pro/docs/POR-ONDE-COMECAR.md +210 -0
- package/pro/squads/squad-creator-pro/docs/QUICK-START.md +205 -0
- package/pro/squads/squad-creator-pro/docs/RFC-001-deterministic-refactoring.md +463 -0
- package/pro/squads/squad-creator-pro/docs/TOOL-RECOMMENDATIONS.md +379 -0
- package/pro/squads/squad-creator-pro/docs/TROUBLESHOOTING.md +412 -0
- package/pro/squads/squad-creator-pro/docs/TUTORIAL-COMPLETO.md +458 -0
- package/pro/squads/squad-creator-pro/docs/optimize-v4-proposal.md +354 -0
- package/pro/squads/squad-creator-pro/docs/session-report-2026-02-01.md +411 -0
- package/pro/squads/squad-creator-pro/docs/sop-extraction-process.md +674 -0
- package/pro/squads/squad-creator-pro/docs/squad-chief-agent-flow.md +981 -0
- package/pro/squads/squad-creator-pro/docs/squad-creation-pipeline-workflow.md +937 -0
- package/pro/squads/squad-creator-pro/docs/task-optimization-framework.md +229 -0
- package/pro/squads/squad-creator-pro/docs/validation-report-2026-02-01.md +439 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/artifacts/HANDOFF_PROTOCOL.md +269 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/artifacts/SOURCE_CLASSIFICATION.md +258 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_001.md +166 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_002.md +206 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_003.md +239 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_004.md +153 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_005.md +161 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_006.md +166 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_007.md +190 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_008.md +191 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_009.md +234 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_010.md +240 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/artifacts/Assinatura_Linguistica.md +355 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/artifacts/META_AXIOMAS.md +277 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_BS_001.md +144 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_PA_001.md +174 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_PM_001.md +191 -0
- package/pro/squads/squad-creator-pro/package.json +26 -0
- package/pro/squads/squad-creator-pro/protocols/ai-first-governance.md +63 -0
- package/pro/squads/squad-creator-pro/scripts/README.md +246 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/dependency_check.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/inventory.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/naming_validator.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/quality_gate.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/scoring.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/yaml_validator.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/assess-sources.sh +443 -0
- package/pro/squads/squad-creator-pro/scripts/checklist_validator.py +451 -0
- package/pro/squads/squad-creator-pro/scripts/clone-review.sh +394 -0
- package/pro/squads/squad-creator-pro/scripts/coherence-validator.py +836 -0
- package/pro/squads/squad-creator-pro/scripts/create-agent-preflight.py +243 -0
- package/pro/squads/squad-creator-pro/scripts/cross-provider/compare-results.js +281 -0
- package/pro/squads/squad-creator-pro/scripts/cross-provider/cross-provider-runner.js +462 -0
- package/pro/squads/squad-creator-pro/scripts/dependency_check.py +333 -0
- package/pro/squads/squad-creator-pro/scripts/fidelity-score.sh +519 -0
- package/pro/squads/squad-creator-pro/scripts/generate-squad-greeting.js +426 -0
- package/pro/squads/squad-creator-pro/scripts/generate-squad-guide.js +558 -0
- package/pro/squads/squad-creator-pro/scripts/inventory.py +269 -0
- package/pro/squads/squad-creator-pro/scripts/lib/config-loader.js +151 -0
- package/pro/squads/squad-creator-pro/scripts/model-tier-validator.cjs +369 -0
- package/pro/squads/squad-creator-pro/scripts/model-usage-logger.cjs +245 -0
- package/pro/squads/squad-creator-pro/scripts/modernization-score.sh +308 -0
- package/pro/squads/squad-creator-pro/scripts/naming_validator.py +299 -0
- package/pro/squads/squad-creator-pro/scripts/on-specialist-complete.py +98 -0
- package/pro/squads/squad-creator-pro/scripts/quality_gate.py +413 -0
- package/pro/squads/squad-creator-pro/scripts/refresh-registry.py +270 -0
- package/pro/squads/squad-creator-pro/scripts/save-session-metrics.py +136 -0
- package/pro/squads/squad-creator-pro/scripts/scaffold-squad.cjs +281 -0
- package/pro/squads/squad-creator-pro/scripts/scoring.py +395 -0
- package/pro/squads/squad-creator-pro/scripts/security_scanner.py +378 -0
- package/pro/squads/squad-creator-pro/scripts/squad-analytics.py +585 -0
- package/pro/squads/squad-creator-pro/scripts/squad-context-loader.cjs +205 -0
- package/pro/squads/squad-creator-pro/scripts/squad-state-manager.cjs +451 -0
- package/pro/squads/squad-creator-pro/scripts/squad-workflow-runner.cjs +471 -0
- package/pro/squads/squad-creator-pro/scripts/squad_utils.py +261 -0
- package/pro/squads/squad-creator-pro/scripts/sync-ide-command.py +590 -0
- package/pro/squads/squad-creator-pro/scripts/tests/__init__.py +1 -0
- package/pro/squads/squad-creator-pro/scripts/tests/conftest.py +309 -0
- package/pro/squads/squad-creator-pro/scripts/tests/run_bash_tests.sh +29 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_assess_sources.sh +216 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_checklist_validator.py +396 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_clone_review.sh +239 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_coherence_validator.py +212 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_dependency_check.py +361 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_fidelity_score.sh +298 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_inventory.py +307 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_modernization_score.sh +211 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_naming_validator.py +373 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_quality_gate.py +280 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_refresh_registry.py +338 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_scoring.py +366 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_security_scanner.py +354 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_squad_analytics.py +450 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_validate_clone.sh +252 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_yaml_validator.py +412 -0
- package/pro/squads/squad-creator-pro/scripts/validate-agent-output.py +115 -0
- package/pro/squads/squad-creator-pro/scripts/validate-all.sh +49 -0
- package/pro/squads/squad-creator-pro/scripts/validate-squad-structure.py +535 -0
- package/pro/squads/squad-creator-pro/scripts/validate-squad.sh +944 -0
- package/pro/squads/squad-creator-pro/scripts/yaml_validator.py +528 -0
- package/pro/squads/squad-creator-pro/skills/squad.md +301 -0
- package/pro/squads/squad-creator-pro/squad.yaml +36 -0
- package/pro/squads/squad-creator-pro/tasks/CHANGELOG.md +80 -0
- package/pro/squads/squad-creator-pro/tasks/an-assess-sources.md +78 -0
- package/pro/squads/squad-creator-pro/tasks/an-clone-review.md +104 -0
- package/pro/squads/squad-creator-pro/tasks/an-compare-outputs.md +354 -0
- package/pro/squads/squad-creator-pro/tasks/an-design-clone.md +79 -0
- package/pro/squads/squad-creator-pro/tasks/an-diagnose-clone.md +87 -0
- package/pro/squads/squad-creator-pro/tasks/an-extract-dna.md +90 -0
- package/pro/squads/squad-creator-pro/tasks/an-extract-framework.md +100 -0
- package/pro/squads/squad-creator-pro/tasks/an-fidelity-score.md +108 -0
- package/pro/squads/squad-creator-pro/tasks/an-validate-clone.md +96 -0
- package/pro/squads/squad-creator-pro/tasks/auto-acquire-sources.md +349 -0
- package/pro/squads/squad-creator-pro/tasks/collect-sources.md +533 -0
- package/pro/squads/squad-creator-pro/tasks/create-agent.md +768 -0
- package/pro/squads/squad-creator-pro/tasks/create-documentation.md +258 -0
- package/pro/squads/squad-creator-pro/tasks/create-pipeline.md +296 -0
- package/pro/squads/squad-creator-pro/tasks/create-squad.md +933 -0
- package/pro/squads/squad-creator-pro/tasks/create-task.md +1148 -0
- package/pro/squads/squad-creator-pro/tasks/create-template.md +474 -0
- package/pro/squads/squad-creator-pro/tasks/create-workflow.md +720 -0
- package/pro/squads/squad-creator-pro/tasks/deconstruct.md +167 -0
- package/pro/squads/squad-creator-pro/tasks/deep-research-pre-agent.md +566 -0
- package/pro/squads/squad-creator-pro/tasks/detect-squad-context.md +81 -0
- package/pro/squads/squad-creator-pro/tasks/discover-tools.md +944 -0
- package/pro/squads/squad-creator-pro/tasks/extract-implicit.md +352 -0
- package/pro/squads/squad-creator-pro/tasks/extract-knowledge.md +577 -0
- package/pro/squads/squad-creator-pro/tasks/extract-sop.md +320 -0
- package/pro/squads/squad-creator-pro/tasks/extract-thinking-dna.md +653 -0
- package/pro/squads/squad-creator-pro/tasks/extract-voice-dna.md +619 -0
- package/pro/squads/squad-creator-pro/tasks/find-0.8.md +222 -0
- package/pro/squads/squad-creator-pro/tasks/install-commands.md +373 -0
- package/pro/squads/squad-creator-pro/tasks/lookup-model.md +78 -0
- package/pro/squads/squad-creator-pro/tasks/migrate-workflows-to-yaml.md +259 -0
- package/pro/squads/squad-creator-pro/tasks/next-squad.md +487 -0
- package/pro/squads/squad-creator-pro/tasks/optimize-workflow.md +851 -0
- package/pro/squads/squad-creator-pro/tasks/optimize.md +1082 -0
- package/pro/squads/squad-creator-pro/tasks/parallel-discovery.md +58 -0
- package/pro/squads/squad-creator-pro/tasks/pv-audit.md +244 -0
- package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment-wf-clone-mind.yaml +256 -0
- package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment.md +83 -0
- package/pro/squads/squad-creator-pro/tasks/pv-modernization-score.md +83 -0
- package/pro/squads/squad-creator-pro/tasks/qa-after-creation.md +475 -0
- package/pro/squads/squad-creator-pro/tasks/qualify-task.md +265 -0
- package/pro/squads/squad-creator-pro/tasks/reexecute-squad-phase.md +64 -0
- package/pro/squads/squad-creator-pro/tasks/refresh-registry.md +403 -0
- package/pro/squads/squad-creator-pro/tasks/smoke-test-model-routing.md +167 -0
- package/pro/squads/squad-creator-pro/tasks/squad-analytics.md +265 -0
- package/pro/squads/squad-creator-pro/tasks/squad-fusion.md +817 -0
- package/pro/squads/squad-creator-pro/tasks/squad-overview.md +683 -0
- package/pro/squads/squad-creator-pro/tasks/sync-ide-command.md +392 -0
- package/pro/squads/squad-creator-pro/tasks/update-mind.md +428 -0
- package/pro/squads/squad-creator-pro/tasks/upgrade-squad.md +919 -0
- package/pro/squads/squad-creator-pro/tasks/validate-extraction.md +209 -0
- package/pro/squads/squad-creator-pro/tasks/validate-final-artifacts.md +80 -0
- package/pro/squads/squad-creator-pro/tasks/validate-squad.md +1385 -0
- package/pro/squads/squad-creator-pro/templates/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/templates/agent-flow-doc-tmpl.md +512 -0
- package/pro/squads/squad-creator-pro/templates/agent-tmpl.md +697 -0
- package/pro/squads/squad-creator-pro/templates/config-tmpl.yaml +352 -0
- package/pro/squads/squad-creator-pro/templates/handoff-insumos-tmpl.yaml +112 -0
- package/pro/squads/squad-creator-pro/templates/orchestrator-tmpl.md +74 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-progress-tmpl.py +373 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-runner-tmpl.py +444 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-state-tmpl.py +413 -0
- package/pro/squads/squad-creator-pro/templates/pop-extractor-prompt.md +549 -0
- package/pro/squads/squad-creator-pro/templates/quality-dashboard-tmpl.md +286 -0
- package/pro/squads/squad-creator-pro/templates/quality-gate-tmpl.yaml +589 -0
- package/pro/squads/squad-creator-pro/templates/readme-tmpl.md +231 -0
- package/pro/squads/squad-creator-pro/templates/research-output-tmpl.md +625 -0
- package/pro/squads/squad-creator-pro/templates/research-prompt-tmpl.md +479 -0
- package/pro/squads/squad-creator-pro/templates/squad-prd-tmpl.md +464 -0
- package/pro/squads/squad-creator-pro/templates/squad-readme-tmpl.md +170 -0
- package/pro/squads/squad-creator-pro/templates/story-create-agent-tmpl.md +284 -0
- package/pro/squads/squad-creator-pro/templates/task-tmpl.md +461 -0
- package/pro/squads/squad-creator-pro/templates/template-tmpl.yaml +227 -0
- package/pro/squads/squad-creator-pro/templates/workflow-doc-tmpl.md +860 -0
- package/pro/squads/squad-creator-pro/templates/workflow-tmpl.yaml +394 -0
- package/pro/squads/squad-creator-pro/test-cases/BATCH-PROGRESS.md +268 -0
- package/pro/squads/squad-creator-pro/test-cases/QUALIFICATION-DASHBOARD.yaml +13 -0
- package/pro/squads/squad-creator-pro/test-cases/_template.yaml +147 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT-SUMMARY.md +275 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT_SUMMARY.md +140 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/CHECKPOINT_MATRIX.md +202 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION-REPORT.md +413 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION_NOTES.md +358 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README-v2.2.2.md +299 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README.md +320 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/TEST-REPORT-v2.1.md +351 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/VERIFICATION-CHECKLIST.txt +247 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/formal-qualification-report.yaml +389 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-output.yaml +366 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.1-output.yaml +452 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml +281 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.2-output.yaml +332 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml +517 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/qualification-report.yaml +213 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/test-case.yaml +69 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/haiku-round-1.yaml +213 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/opus-baseline.yaml +566 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/qualification-report.yaml +82 -0
- package/pro/squads/squad-creator-pro/test-cases/an-design-clone/test-case.yaml +102 -0
- package/pro/squads/squad-creator-pro/test-cases/an-extract-dna/test-case.yaml +105 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/haiku-round-1.yaml +262 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/opus-baseline.yaml +266 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/qualification-report.yaml +94 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/haiku-round-1.yaml +282 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/opus-baseline.yaml +470 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/qualification-report.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/collect-sources/test-case.yaml +105 -0
- package/pro/squads/squad-creator-pro/test-cases/create-task/test-case.yaml +104 -0
- package/pro/squads/squad-creator-pro/test-cases/cross-provider/DASHBOARD.yaml +11 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-audit/test-case.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/haiku-output.yaml +209 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/opus-baseline.yaml +96 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/sonnet-output.yaml +30 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/test-case.yaml +129 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/comparison-round-1.yaml +242 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/haiku-round-1.yaml +393 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/opus-baseline.yaml +488 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/qualification-report.yaml +74 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/haiku-round-1.yaml +292 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/opus-baseline.yaml +603 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/qualification-report.yaml +97 -0
- package/pro/squads/squad-creator-pro/test-cases/smoke-test-model-routing/test-case.yaml +100 -0
- package/pro/squads/squad-creator-pro/test-cases/upgrade-squad/test-case.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/comparison-round-1.yaml +223 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1-MINE.yaml +36 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1.yaml +193 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-2.yaml +303 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-3-v4-task.yaml +149 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-baseline.yaml +529 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-round-3-v4-task.yaml +132 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/qualification-report.yaml +104 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output-v2-calibrated.yaml +200 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output.yaml +183 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/opus-baseline.yaml +112 -0
- package/pro/squads/squad-creator-pro/utils/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/workflows/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/workflows/create-squad.yaml +348 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-discovery.yaml +16 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-integration.yaml +16 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-quality-gates.yaml +15 -0
- package/pro/squads/squad-creator-pro/workflows/validate-squad.yaml +582 -0
- package/pro/squads/squad-creator-pro/workflows/wf-auto-acquire-sources.yaml +518 -0
- package/pro/squads/squad-creator-pro/workflows/wf-brownfield-upgrade-squad.yaml +46 -0
- package/pro/squads/squad-creator-pro/workflows/wf-clone-mind.yaml +521 -0
- package/pro/squads/squad-creator-pro/workflows/wf-context-aware-create-squad.yaml +47 -0
- package/pro/squads/squad-creator-pro/workflows/wf-create-squad.yaml +1619 -0
- package/pro/squads/squad-creator-pro/workflows/wf-cross-provider-qualification.yaml +711 -0
- package/pro/squads/squad-creator-pro/workflows/wf-discover-tools.yaml +1439 -0
- package/pro/squads/squad-creator-pro/workflows/wf-extraction-pipeline.yaml +486 -0
- package/pro/squads/squad-creator-pro/workflows/wf-mind-research-loop.yaml +668 -0
- package/pro/squads/squad-creator-pro/workflows/wf-model-tier-qualification.yaml +800 -0
- package/pro/squads/squad-creator-pro/workflows/wf-optimize-squad.yaml +684 -0
- package/pro/squads/squad-creator-pro/workflows/wf-research-then-create-agent.yaml +921 -0
- package/pro/squads/squad-creator-pro/workflows/wf-squad-fusion.yaml +1684 -0
- package/scripts/check-markdown-links.py +352 -352
- package/scripts/dashboard-parallel-dev.sh +0 -0
- package/scripts/dashboard-parallel-phase3.sh +0 -0
- package/scripts/dashboard-parallel-phase4.sh +0 -0
- package/scripts/install-monitor-hooks.sh +0 -0
- package/.claude/hooks/code-intel-pretool.cjs +0 -107
- package/docs/guides/aios-workflows/README.md +0 -247
- package/docs/guides/aios-workflows/bob-orchestrator-workflow.md +0 -1536
- package/scripts/glue/README.md +0 -355
- package/scripts/glue/compose-agent-prompt.cjs +0 -362
|
@@ -0,0 +1,711 @@
|
|
|
1
|
+
# wf-cross-provider-qualification.yaml
|
|
2
|
+
# Workflow para qualificar modelos EXTERNOS (Kimi K2.5, GLM-5, etc) vs Opus
|
|
3
|
+
# Version: 1.0
|
|
4
|
+
# Created: 2026-02-12
|
|
5
|
+
# Author: @architect (Aria)
|
|
6
|
+
|
|
7
|
+
workflow:
|
|
8
|
+
id: wf-cross-provider-qualification
|
|
9
|
+
name: "Cross-Provider Model Qualification"
|
|
10
|
+
version: "1.0"
|
|
11
|
+
purpose: "Testar se modelos externos (via OpenRouter) podem substituir Opus em tasks específicas"
|
|
12
|
+
orchestrator: "@pedro-valerio"
|
|
13
|
+
mode: "autonomous"
|
|
14
|
+
|
|
15
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
16
|
+
# PHILOSOPHY
|
|
17
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
18
|
+
|
|
19
|
+
philosophy:
|
|
20
|
+
core: |
|
|
21
|
+
"Não assumir. Provar com dados."
|
|
22
|
+
"Custo importa, mas qualidade é inegociável."
|
|
23
|
+
"PT-BR é obrigatório para nosso pipeline."
|
|
24
|
+
"Latência conta — modelo lento é modelo inútil."
|
|
25
|
+
|
|
26
|
+
key_differences_from_tier_qualification:
|
|
27
|
+
- "Modelos externos via LLM Router/OpenRouter (não Task tool)"
|
|
28
|
+
- "Latência tracking obrigatório"
|
|
29
|
+
- "Múltiplos runs para medir reliability"
|
|
30
|
+
- "Fase específica para PT-BR quality"
|
|
31
|
+
- "Privacy risk flag obrigatório"
|
|
32
|
+
|
|
33
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
34
|
+
# EXTERNAL MODELS REGISTRY
|
|
35
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
36
|
+
|
|
37
|
+
external_models:
|
|
38
|
+
glm5:
|
|
39
|
+
provider: openrouter
|
|
40
|
+
model_id: "z-ai/glm-5"
|
|
41
|
+
display_name: "GLM-5"
|
|
42
|
+
cost_per_mtok:
|
|
43
|
+
input: 0.80
|
|
44
|
+
output: 3.20
|
|
45
|
+
context_window: 200000
|
|
46
|
+
validation_report: "docs/model-discovery/scans/2026-02-12/validation-glm-5.md"
|
|
47
|
+
verdict: "ADD_CONDITIONAL"
|
|
48
|
+
privacy_risk: "moderate" # Singapore entity, China parent
|
|
49
|
+
pt_br_status: "unknown"
|
|
50
|
+
|
|
51
|
+
kimi:
|
|
52
|
+
provider: openrouter
|
|
53
|
+
model_id: "moonshotai/kimi-k2.5"
|
|
54
|
+
display_name: "Kimi K2.5"
|
|
55
|
+
cost_per_mtok:
|
|
56
|
+
input: 0.50
|
|
57
|
+
output: 2.80
|
|
58
|
+
context_window: 256000
|
|
59
|
+
validation_report: "docs/model-discovery/scans/2026-02-08/validation-kimi-k2-5.md"
|
|
60
|
+
verdict: "MONITOR"
|
|
61
|
+
privacy_risk: "high" # China, trains on prompts
|
|
62
|
+
pt_br_status: "unknown"
|
|
63
|
+
latency_warning: "HIGH (15-200s per request)"
|
|
64
|
+
|
|
65
|
+
# Baseline para comparação
|
|
66
|
+
opus:
|
|
67
|
+
provider: anthropic
|
|
68
|
+
model_id: "claude-opus-4-6"
|
|
69
|
+
display_name: "Claude Opus 4.6"
|
|
70
|
+
cost_per_mtok:
|
|
71
|
+
input: 5.00
|
|
72
|
+
output: 25.00
|
|
73
|
+
context_window: 1000000
|
|
74
|
+
privacy_risk: "low"
|
|
75
|
+
pt_br_status: "excellent"
|
|
76
|
+
|
|
77
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
78
|
+
# VETO CONDITIONS
|
|
79
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
80
|
+
|
|
81
|
+
veto_conditions:
|
|
82
|
+
- id: CPQ_VC_001
|
|
83
|
+
trigger: "Task não está no registry cross_provider_candidates"
|
|
84
|
+
action: "BLOCK - Adicionar input ao registry primeiro"
|
|
85
|
+
|
|
86
|
+
- id: CPQ_VC_002
|
|
87
|
+
trigger: "Opus baseline falha ou output vazio"
|
|
88
|
+
action: "BLOCK - Não há baseline para comparar"
|
|
89
|
+
|
|
90
|
+
- id: CPQ_VC_003
|
|
91
|
+
trigger: "Modelo externo retorna erro em >50% dos runs"
|
|
92
|
+
action: "BLOCK - Modelo não é confiável para esta task"
|
|
93
|
+
|
|
94
|
+
- id: CPQ_VC_004
|
|
95
|
+
trigger: "Decisão oposta ao Opus (PASS vs FAIL)"
|
|
96
|
+
action: "BLOCK - Modelo não qualificado (decisão errada)"
|
|
97
|
+
|
|
98
|
+
- id: CPQ_VC_005
|
|
99
|
+
trigger: "PT-BR quality score < 7.0/10"
|
|
100
|
+
action: "BLOCK - Modelo não qualificado para PT-BR"
|
|
101
|
+
|
|
102
|
+
- id: CPQ_VC_006
|
|
103
|
+
trigger: "Latência média > 60s"
|
|
104
|
+
action: "FLAG - Só usar para batch/async jobs"
|
|
105
|
+
|
|
106
|
+
- id: CPQ_VC_007
|
|
107
|
+
trigger: "Privacy risk = high AND task envolve dados sensíveis"
|
|
108
|
+
action: "BLOCK - Usar self-hosted ou escolher outro modelo"
|
|
109
|
+
|
|
110
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
111
|
+
# TEST INPUT REGISTRY (Cross-Provider Candidates)
|
|
112
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
113
|
+
# Tasks Opus-tier que podem ser testadas com modelos externos
|
|
114
|
+
|
|
115
|
+
cross_provider_candidates:
|
|
116
|
+
# === DNA EXTRACTION (High Value, High Cost) ===
|
|
117
|
+
extract-voice-dna:
|
|
118
|
+
current_tier: opus
|
|
119
|
+
test_with: [glm5, kimi]
|
|
120
|
+
expected_savings: "80-90%"
|
|
121
|
+
risk: "Quality degradation in voice capture"
|
|
122
|
+
test_input:
|
|
123
|
+
target: "outputs/minds/pedro_valerio/sources/"
|
|
124
|
+
type: "sources_directory"
|
|
125
|
+
pt_br_critical: true
|
|
126
|
+
|
|
127
|
+
extract-thinking-dna:
|
|
128
|
+
current_tier: opus
|
|
129
|
+
test_with: [glm5, kimi]
|
|
130
|
+
expected_savings: "80-90%"
|
|
131
|
+
risk: "Missing mental models"
|
|
132
|
+
test_input:
|
|
133
|
+
target: "outputs/minds/pedro_valerio/sources/"
|
|
134
|
+
type: "sources_directory"
|
|
135
|
+
pt_br_critical: true
|
|
136
|
+
|
|
137
|
+
# === RESEARCH (Good Candidate) ===
|
|
138
|
+
deep-research-pre-agent:
|
|
139
|
+
current_tier: opus
|
|
140
|
+
test_with: [glm5, kimi]
|
|
141
|
+
expected_savings: "80-90%"
|
|
142
|
+
risk: "Superficial research"
|
|
143
|
+
test_input:
|
|
144
|
+
target: "Pedro Valério"
|
|
145
|
+
type: "person_name"
|
|
146
|
+
pt_br_critical: false
|
|
147
|
+
note: "Kimi Agent Swarm could excel here"
|
|
148
|
+
|
|
149
|
+
# === AGENT CREATION ===
|
|
150
|
+
create-agent:
|
|
151
|
+
current_tier: opus
|
|
152
|
+
test_with: [glm5] # GLM-5 has lower hallucination
|
|
153
|
+
expected_savings: "80%"
|
|
154
|
+
risk: "Generic agent without depth"
|
|
155
|
+
test_input:
|
|
156
|
+
target: "outputs/minds/pedro_valerio/"
|
|
157
|
+
type: "mind_directory"
|
|
158
|
+
pt_br_critical: true
|
|
159
|
+
|
|
160
|
+
an-design-clone:
|
|
161
|
+
current_tier: opus
|
|
162
|
+
test_with: [glm5]
|
|
163
|
+
expected_savings: "80%"
|
|
164
|
+
risk: "Incomplete clone structure"
|
|
165
|
+
test_input:
|
|
166
|
+
target: "outputs/minds/pedro_valerio/"
|
|
167
|
+
type: "mind_directory"
|
|
168
|
+
pt_br_critical: true
|
|
169
|
+
|
|
170
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
171
|
+
# INPUTS
|
|
172
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
173
|
+
|
|
174
|
+
inputs:
|
|
175
|
+
required:
|
|
176
|
+
- name: task_name
|
|
177
|
+
type: string
|
|
178
|
+
description: "Nome da task (sem .md)"
|
|
179
|
+
example: "extract-voice-dna"
|
|
180
|
+
validation: "Must exist in cross_provider_candidates"
|
|
181
|
+
|
|
182
|
+
- name: candidate_model
|
|
183
|
+
type: enum
|
|
184
|
+
values: ["glm5", "kimi"]
|
|
185
|
+
description: "Modelo externo a testar"
|
|
186
|
+
|
|
187
|
+
optional:
|
|
188
|
+
- name: threshold
|
|
189
|
+
type: number
|
|
190
|
+
default: 0.85
|
|
191
|
+
description: "Threshold mínimo de qualidade vs Opus"
|
|
192
|
+
|
|
193
|
+
- name: reliability_runs
|
|
194
|
+
type: number
|
|
195
|
+
default: 3
|
|
196
|
+
description: "Número de runs para medir reliability"
|
|
197
|
+
|
|
198
|
+
- name: skip_pt_br
|
|
199
|
+
type: boolean
|
|
200
|
+
default: false
|
|
201
|
+
description: "Pular teste PT-BR (não recomendado)"
|
|
202
|
+
|
|
203
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
204
|
+
# PHASES
|
|
205
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
206
|
+
|
|
207
|
+
phases:
|
|
208
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
209
|
+
# PHASE 0: PRE-FLIGHT VALIDATION
|
|
210
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
211
|
+
- id: phase_0
|
|
212
|
+
name: "PRE-FLIGHT"
|
|
213
|
+
purpose: "Validar inputs, verificar modelo disponível, criar diretório"
|
|
214
|
+
duration: "< 1 min"
|
|
215
|
+
|
|
216
|
+
steps:
|
|
217
|
+
- id: step_0_1
|
|
218
|
+
name: "Check cross_provider_candidates"
|
|
219
|
+
action: "Lookup task_name in cross_provider_candidates"
|
|
220
|
+
veto_if: "task_name not in registry → CPQ_VC_001"
|
|
221
|
+
|
|
222
|
+
- id: step_0_2
|
|
223
|
+
name: "Check model in test_with list"
|
|
224
|
+
action: "Verify candidate_model is in task's test_with array"
|
|
225
|
+
veto_if: "Model not allowed for this task"
|
|
226
|
+
|
|
227
|
+
- id: step_0_3
|
|
228
|
+
name: "Check model availability"
|
|
229
|
+
action: |
|
|
230
|
+
Bash: node infrastructure/services/llm-router/bin/check-model.js {candidate_model}
|
|
231
|
+
Verify model responds to ping
|
|
232
|
+
veto_if: "Model unavailable or API error"
|
|
233
|
+
|
|
234
|
+
- id: step_0_4
|
|
235
|
+
name: "Read task file"
|
|
236
|
+
action: "Read squads/squad-creator-pro/tasks/{task_name}.md completely"
|
|
237
|
+
output:
|
|
238
|
+
task_prompt: "Full task content"
|
|
239
|
+
|
|
240
|
+
- id: step_0_5
|
|
241
|
+
name: "Create test directory"
|
|
242
|
+
action: "mkdir -p squads/squad-creator-pro/test-cases/cross-provider/{task_name}/{candidate_model}/"
|
|
243
|
+
|
|
244
|
+
checkpoint:
|
|
245
|
+
id: CP_PREFLIGHT
|
|
246
|
+
blocking: true
|
|
247
|
+
|
|
248
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
249
|
+
# PHASE 1: BASELINE EXECUTION (Opus)
|
|
250
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
251
|
+
- id: phase_1
|
|
252
|
+
name: "OPUS BASELINE"
|
|
253
|
+
purpose: "Executar task em Opus para estabelecer baseline de qualidade"
|
|
254
|
+
duration: "2-5 min"
|
|
255
|
+
|
|
256
|
+
steps:
|
|
257
|
+
- id: step_1_1
|
|
258
|
+
name: "Execute in Opus"
|
|
259
|
+
action: |
|
|
260
|
+
Task(
|
|
261
|
+
subagent_type: "general-purpose",
|
|
262
|
+
model: "opus",
|
|
263
|
+
prompt: "Read squads/squad-creator-pro/tasks/{task_name}.md completely.
|
|
264
|
+
Execute the task with input: {test_input.target}
|
|
265
|
+
Save output as YAML to squads/squad-creator-pro/test-cases/cross-provider/{task_name}/{candidate_model}/opus-baseline.yaml
|
|
266
|
+
Include metadata: tokens used, duration_ms."
|
|
267
|
+
)
|
|
268
|
+
output:
|
|
269
|
+
opus_result: "Full output saved to file"
|
|
270
|
+
opus_tokens: { input: 0, output: 0 }
|
|
271
|
+
opus_latency_ms: 0
|
|
272
|
+
opus_cost_usd: 0
|
|
273
|
+
|
|
274
|
+
checkpoint:
|
|
275
|
+
id: CP_BASELINE
|
|
276
|
+
blocking: true
|
|
277
|
+
veto_if: "Output empty or error → CPQ_VC_002"
|
|
278
|
+
|
|
279
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
280
|
+
# PHASE 2: CANDIDATE EXECUTION (Multiple Runs for Reliability)
|
|
281
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
282
|
+
- id: phase_2
|
|
283
|
+
name: "CANDIDATE RELIABILITY TEST"
|
|
284
|
+
purpose: "Executar modelo externo N vezes para medir reliability e variance"
|
|
285
|
+
duration: "5-15 min (depends on model latency)"
|
|
286
|
+
|
|
287
|
+
steps:
|
|
288
|
+
- id: step_2_1
|
|
289
|
+
name: "Execute reliability runs"
|
|
290
|
+
action: |
|
|
291
|
+
FOR i in 1..{reliability_runs}:
|
|
292
|
+
|
|
293
|
+
start_time = now()
|
|
294
|
+
|
|
295
|
+
# Call via LLM Router
|
|
296
|
+
result = Bash(
|
|
297
|
+
node infrastructure/services/llm-router/index.js \
|
|
298
|
+
--task "{task_name}" \
|
|
299
|
+
--model "{candidate_model}" \
|
|
300
|
+
--input "{test_input.target}" \
|
|
301
|
+
--output "test-cases/cross-provider/{task_name}/{candidate_model}/run-{i}.yaml"
|
|
302
|
+
)
|
|
303
|
+
|
|
304
|
+
end_time = now()
|
|
305
|
+
|
|
306
|
+
Record:
|
|
307
|
+
- run_number: i
|
|
308
|
+
- success: true/false
|
|
309
|
+
- latency_ms: end_time - start_time
|
|
310
|
+
- tokens: { input, output }
|
|
311
|
+
- error: null or error_message
|
|
312
|
+
|
|
313
|
+
output:
|
|
314
|
+
runs: "Array of run results"
|
|
315
|
+
success_rate: "N successful / N total"
|
|
316
|
+
avg_latency_ms: "Average latency"
|
|
317
|
+
latency_variance: "Min/max/stddev"
|
|
318
|
+
total_cost_usd: "Sum of all runs"
|
|
319
|
+
|
|
320
|
+
- id: step_2_2
|
|
321
|
+
name: "Check reliability threshold"
|
|
322
|
+
action: |
|
|
323
|
+
IF success_rate < 0.5:
|
|
324
|
+
→ VETO (CPQ_VC_003)
|
|
325
|
+
|
|
326
|
+
IF avg_latency_ms > 60000:
|
|
327
|
+
→ FLAG as "batch-only" (CPQ_VC_006)
|
|
328
|
+
output:
|
|
329
|
+
reliability_verdict: "PASS | BATCH_ONLY | FAIL"
|
|
330
|
+
|
|
331
|
+
checkpoint:
|
|
332
|
+
id: CP_RELIABILITY
|
|
333
|
+
blocking: true
|
|
334
|
+
|
|
335
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
336
|
+
# PHASE 3: QUALITY COMPARISON
|
|
337
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
338
|
+
- id: phase_3
|
|
339
|
+
name: "QUALITY COMPARISON"
|
|
340
|
+
purpose: "Comparar output do melhor run com Opus baseline"
|
|
341
|
+
duration: "2-3 min"
|
|
342
|
+
|
|
343
|
+
steps:
|
|
344
|
+
- id: step_3_1
|
|
345
|
+
name: "Select best run"
|
|
346
|
+
action: |
|
|
347
|
+
Select the successful run with:
|
|
348
|
+
1. Lowest latency (if all similar quality)
|
|
349
|
+
2. Most complete output (section count)
|
|
350
|
+
output:
|
|
351
|
+
best_run_file: "run-{N}.yaml"
|
|
352
|
+
|
|
353
|
+
- id: step_3_2
|
|
354
|
+
name: "Compare across 5 dimensions"
|
|
355
|
+
action: |
|
|
356
|
+
Same comparison as wf-model-tier-qualification:
|
|
357
|
+
|
|
358
|
+
1. COMPLETENESS (weight: 0.30)
|
|
359
|
+
- Section count: candidate vs opus
|
|
360
|
+
|
|
361
|
+
2. ACCURACY (weight: 0.30)
|
|
362
|
+
- Key decisions match (PASS/FAIL, scores)
|
|
363
|
+
- VETO CHECK: opposite decision → CPQ_VC_004
|
|
364
|
+
|
|
365
|
+
3. REASONING (weight: 0.20)
|
|
366
|
+
- Evidence depth and specificity
|
|
367
|
+
|
|
368
|
+
4. FORMAT (weight: 0.10)
|
|
369
|
+
- YAML valid, structure matches
|
|
370
|
+
|
|
371
|
+
5. ACTIONABILITY (weight: 0.10)
|
|
372
|
+
- Recommendations count and quality
|
|
373
|
+
|
|
374
|
+
output:
|
|
375
|
+
dimension_scores: "Per-dimension breakdown"
|
|
376
|
+
quality_score: "Weighted percentage (0-100%)"
|
|
377
|
+
gaps: "List of gap types"
|
|
378
|
+
|
|
379
|
+
- id: step_3_3
|
|
380
|
+
name: "Calculate cost savings"
|
|
381
|
+
action: |
|
|
382
|
+
opus_cost = (opus_tokens.input * 5.00 / 1_000_000) + (opus_tokens.output * 25.00 / 1_000_000)
|
|
383
|
+
candidate_cost = (candidate_tokens.input * model.cost.input / 1_000_000) + (candidate_tokens.output * model.cost.output / 1_000_000)
|
|
384
|
+
|
|
385
|
+
# Adjust for reliability (cost of retries)
|
|
386
|
+
effective_candidate_cost = candidate_cost / success_rate
|
|
387
|
+
|
|
388
|
+
savings_pct = (1 - effective_candidate_cost / opus_cost) * 100
|
|
389
|
+
output:
|
|
390
|
+
opus_cost_usd: 0
|
|
391
|
+
candidate_cost_usd: 0
|
|
392
|
+
effective_cost_usd: 0
|
|
393
|
+
savings_percentage: 0
|
|
394
|
+
|
|
395
|
+
checkpoint:
|
|
396
|
+
id: CP_QUALITY
|
|
397
|
+
blocking: true
|
|
398
|
+
output:
|
|
399
|
+
saved_to: "test-cases/cross-provider/{task_name}/{candidate_model}/quality-comparison.yaml"
|
|
400
|
+
|
|
401
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
402
|
+
# PHASE 4: PT-BR QUALITY TEST
|
|
403
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
404
|
+
- id: phase_4
|
|
405
|
+
name: "PT-BR QUALITY TEST"
|
|
406
|
+
purpose: "Testar qualidade do modelo em português brasileiro"
|
|
407
|
+
duration: "3-5 min"
|
|
408
|
+
condition: "NOT skip_pt_br AND task.pt_br_critical"
|
|
409
|
+
|
|
410
|
+
pt_br_test_prompts:
|
|
411
|
+
- id: ptbr_1
|
|
412
|
+
name: "Technical Writing"
|
|
413
|
+
prompt: |
|
|
414
|
+
Escreva uma documentação técnica de 500 palavras sobre arquitetura de microsserviços.
|
|
415
|
+
Inclua: definição, benefícios, desafios, e quando usar.
|
|
416
|
+
Use linguagem técnica mas acessível.
|
|
417
|
+
eval_criteria:
|
|
418
|
+
- fluency: "Português natural, não traduzido"
|
|
419
|
+
- accuracy: "Termos técnicos corretos"
|
|
420
|
+
- completeness: "Todos os pontos cobertos"
|
|
421
|
+
|
|
422
|
+
- id: ptbr_2
|
|
423
|
+
name: "Framework Extraction"
|
|
424
|
+
prompt: |
|
|
425
|
+
Dado o seguinte texto sobre metodologia de vendas:
|
|
426
|
+
|
|
427
|
+
"O fechamento acontece quando você elimina todas as objeções do cliente.
|
|
428
|
+
Primeiro, identifique a objeção real. Depois, concorde parcialmente.
|
|
429
|
+
Por fim, apresente uma perspectiva diferente que resolve a objeção."
|
|
430
|
+
|
|
431
|
+
Extraia o framework em formato YAML com: nome, etapas, e quando aplicar.
|
|
432
|
+
eval_criteria:
|
|
433
|
+
- understanding: "Captou a essência do método"
|
|
434
|
+
- structure: "YAML válido e bem organizado"
|
|
435
|
+
- no_hallucination: "Não inventou etapas extras"
|
|
436
|
+
|
|
437
|
+
- id: ptbr_3
|
|
438
|
+
name: "Voice Consistency"
|
|
439
|
+
prompt: |
|
|
440
|
+
Você é Pedro Valério, especialista em processos e automação.
|
|
441
|
+
Sua filosofia é: "Se o executor consegue errar, o processo está errado."
|
|
442
|
+
|
|
443
|
+
Responda à pergunta: "Como você abordaria a criação de um novo workflow?"
|
|
444
|
+
|
|
445
|
+
Mantenha sua voz e perspectiva consistentes.
|
|
446
|
+
eval_criteria:
|
|
447
|
+
- voice_match: "Soa como o personagem"
|
|
448
|
+
- philosophy_applied: "Usa os princípios mencionados"
|
|
449
|
+
- natural_pt_br: "Português fluente"
|
|
450
|
+
|
|
451
|
+
steps:
|
|
452
|
+
- id: step_4_1
|
|
453
|
+
name: "Execute PT-BR prompts"
|
|
454
|
+
action: |
|
|
455
|
+
FOR each prompt in pt_br_test_prompts:
|
|
456
|
+
result = Bash(
|
|
457
|
+
node infrastructure/services/llm-router/index.js \
|
|
458
|
+
--model "{candidate_model}" \
|
|
459
|
+
--prompt "{prompt.prompt}" \
|
|
460
|
+
--output "test-cases/cross-provider/{task_name}/{candidate_model}/ptbr-{prompt.id}.yaml"
|
|
461
|
+
)
|
|
462
|
+
|
|
463
|
+
- id: step_4_2
|
|
464
|
+
name: "Evaluate PT-BR quality"
|
|
465
|
+
action: |
|
|
466
|
+
Task(
|
|
467
|
+
subagent_type: "general-purpose",
|
|
468
|
+
model: "opus", # Opus avalia PT-BR quality
|
|
469
|
+
prompt: "Avalie a qualidade do português brasileiro nos outputs anexados.
|
|
470
|
+
|
|
471
|
+
Para cada output, score de 1-10:
|
|
472
|
+
- Fluência (português natural, não traduzido)
|
|
473
|
+
- Precisão (termos técnicos corretos)
|
|
474
|
+
- Completude (resposta completa)
|
|
475
|
+
|
|
476
|
+
Overall PT-BR Score = média dos scores.
|
|
477
|
+
|
|
478
|
+
VETO se overall < 7.0"
|
|
479
|
+
)
|
|
480
|
+
output:
|
|
481
|
+
ptbr_scores: "Per-prompt breakdown"
|
|
482
|
+
ptbr_overall: "Overall score (0-10)"
|
|
483
|
+
|
|
484
|
+
- id: step_4_3
|
|
485
|
+
name: "PT-BR verdict"
|
|
486
|
+
action: |
|
|
487
|
+
IF ptbr_overall < 7.0:
|
|
488
|
+
→ VETO (CPQ_VC_005)
|
|
489
|
+
verdict = "PT-BR NOT QUALIFIED"
|
|
490
|
+
ELSE IF ptbr_overall < 8.0:
|
|
491
|
+
verdict = "PT-BR ACCEPTABLE (with caveats)"
|
|
492
|
+
ELSE:
|
|
493
|
+
verdict = "PT-BR QUALIFIED"
|
|
494
|
+
output:
|
|
495
|
+
ptbr_verdict: "QUALIFIED | ACCEPTABLE | NOT_QUALIFIED"
|
|
496
|
+
|
|
497
|
+
checkpoint:
|
|
498
|
+
id: CP_PTBR
|
|
499
|
+
blocking: true
|
|
500
|
+
veto_if: "ptbr_overall < 7.0 → CPQ_VC_005"
|
|
501
|
+
|
|
502
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
503
|
+
# PHASE 5: GENERATE REPORT
|
|
504
|
+
# ─────────────────────────────────────────────────────────────────────────────
|
|
505
|
+
- id: phase_5
|
|
506
|
+
name: "GENERATE REPORT"
|
|
507
|
+
purpose: "Criar relatório final com toda evidência"
|
|
508
|
+
duration: "1-2 min"
|
|
509
|
+
|
|
510
|
+
steps:
|
|
511
|
+
- id: step_5_1
|
|
512
|
+
name: "Generate qualification report"
|
|
513
|
+
action: |
|
|
514
|
+
Create test-cases/cross-provider/{task_name}/{candidate_model}/qualification-report.yaml:
|
|
515
|
+
|
|
516
|
+
cross_provider_qualification_report:
|
|
517
|
+
task_name: "{task_name}"
|
|
518
|
+
candidate_model: "{candidate_model}"
|
|
519
|
+
test_date: "{today}"
|
|
520
|
+
workflow_version: "1.0"
|
|
521
|
+
|
|
522
|
+
baseline:
|
|
523
|
+
model: "opus"
|
|
524
|
+
cost_usd: "{opus_cost}"
|
|
525
|
+
tokens: { input: X, output: Y }
|
|
526
|
+
latency_ms: Z
|
|
527
|
+
file: "opus-baseline.yaml"
|
|
528
|
+
|
|
529
|
+
candidate:
|
|
530
|
+
model: "{candidate_model}"
|
|
531
|
+
provider: "{model.provider}"
|
|
532
|
+
|
|
533
|
+
reliability:
|
|
534
|
+
runs: {reliability_runs}
|
|
535
|
+
success_rate: "{success_rate}%"
|
|
536
|
+
avg_latency_ms: {avg_latency}
|
|
537
|
+
latency_range: "{min_ms}-{max_ms}ms"
|
|
538
|
+
verdict: "{reliability_verdict}"
|
|
539
|
+
|
|
540
|
+
quality:
|
|
541
|
+
overall_score: "{quality_score}%"
|
|
542
|
+
dimension_scores: {dimension_scores}
|
|
543
|
+
gaps: [{gaps}]
|
|
544
|
+
|
|
545
|
+
cost:
|
|
546
|
+
per_run_usd: "{candidate_cost}"
|
|
547
|
+
effective_usd: "{effective_candidate_cost}" # adjusted for retries
|
|
548
|
+
vs_opus_savings: "{savings_pct}%"
|
|
549
|
+
|
|
550
|
+
pt_br:
|
|
551
|
+
tested: true/false
|
|
552
|
+
overall_score: "{ptbr_overall}/10"
|
|
553
|
+
verdict: "{ptbr_verdict}"
|
|
554
|
+
|
|
555
|
+
decision:
|
|
556
|
+
final: "{QUALIFIED | QUALIFIED_BATCH_ONLY | NOT_QUALIFIED}"
|
|
557
|
+
recommended_use: "{task types}"
|
|
558
|
+
caveats: ["{list of caveats}"]
|
|
559
|
+
|
|
560
|
+
privacy_assessment:
|
|
561
|
+
risk_level: "{model.privacy_risk}"
|
|
562
|
+
recommendation: "{self-host | api | do-not-use}"
|
|
563
|
+
|
|
564
|
+
evidence_files:
|
|
565
|
+
- "opus-baseline.yaml"
|
|
566
|
+
- "run-1.yaml"
|
|
567
|
+
- "run-2.yaml"
|
|
568
|
+
- "run-3.yaml"
|
|
569
|
+
- "quality-comparison.yaml"
|
|
570
|
+
- "ptbr-*.yaml"
|
|
571
|
+
- "qualification-report.yaml"
|
|
572
|
+
|
|
573
|
+
- id: step_5_2
|
|
574
|
+
name: "Update model-routing.yaml"
|
|
575
|
+
condition: "decision is QUALIFIED or QUALIFIED_BATCH_ONLY"
|
|
576
|
+
action: |
|
|
577
|
+
Add to model-routing.yaml under external_alternatives:
|
|
578
|
+
|
|
579
|
+
{task_name}:
|
|
580
|
+
external_alternative:
|
|
581
|
+
model: "{candidate_model}"
|
|
582
|
+
qualified: true
|
|
583
|
+
quality_vs_opus: "{quality_score}%"
|
|
584
|
+
savings: "{savings_pct}%"
|
|
585
|
+
batch_only: true/false
|
|
586
|
+
pt_br_qualified: true/false
|
|
587
|
+
tested_date: "{today}"
|
|
588
|
+
|
|
589
|
+
- id: step_5_3
|
|
590
|
+
name: "Display summary"
|
|
591
|
+
action: |
|
|
592
|
+
╔══════════════════════════════════════════════════════════════════════════╗
|
|
593
|
+
║ CROSS-PROVIDER QUALIFICATION RESULT ║
|
|
594
|
+
╠══════════════════════════════════════════════════════════════════════════╣
|
|
595
|
+
║ Task: {task_name} ║
|
|
596
|
+
║ Candidate: {candidate_model} ({model.display_name}) ║
|
|
597
|
+
║ ║
|
|
598
|
+
║ RELIABILITY ║
|
|
599
|
+
║ ├─ Success Rate: {success_rate}% ║
|
|
600
|
+
║ ├─ Avg Latency: {avg_latency}ms ║
|
|
601
|
+
║ └─ Verdict: {reliability_verdict} ║
|
|
602
|
+
║ ║
|
|
603
|
+
║ QUALITY ║
|
|
604
|
+
║ ├─ vs Opus: {quality_score}% ║
|
|
605
|
+
║ └─ Gaps: {gaps_count} ║
|
|
606
|
+
║ ║
|
|
607
|
+
║ PT-BR ║
|
|
608
|
+
║ ├─ Score: {ptbr_overall}/10 ║
|
|
609
|
+
║ └─ Verdict: {ptbr_verdict} ║
|
|
610
|
+
║ ║
|
|
611
|
+
║ COST ║
|
|
612
|
+
║ ├─ Opus: ${opus_cost}/run ║
|
|
613
|
+
║ ├─ {candidate_model}: ${candidate_cost}/run ║
|
|
614
|
+
║ └─ SAVINGS: {savings_pct}% ║
|
|
615
|
+
║ ║
|
|
616
|
+
║ ══════════════════════════════════════════════════════════════════════ ║
|
|
617
|
+
║ DECISION: {final_decision} ║
|
|
618
|
+
║ PRIVACY: {privacy_risk} → {privacy_recommendation} ║
|
|
619
|
+
╚══════════════════════════════════════════════════════════════════════════╝
|
|
620
|
+
|
|
621
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
622
|
+
# BATCH EXECUTION
|
|
623
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
624
|
+
|
|
625
|
+
batch_mode:
|
|
626
|
+
description: "Testar múltiplas tasks com múltiplos modelos"
|
|
627
|
+
|
|
628
|
+
execution_strategy:
|
|
629
|
+
# Wave 1: GLM-5 (melhor candidato baseado em validation reports)
|
|
630
|
+
wave_1_glm5:
|
|
631
|
+
model: glm5
|
|
632
|
+
tasks:
|
|
633
|
+
- extract-voice-dna
|
|
634
|
+
- extract-thinking-dna
|
|
635
|
+
- create-agent
|
|
636
|
+
- deep-research-pre-agent
|
|
637
|
+
|
|
638
|
+
# Wave 2: Kimi K2.5 (se GLM-5 não qualificar)
|
|
639
|
+
wave_2_kimi:
|
|
640
|
+
model: kimi
|
|
641
|
+
tasks:
|
|
642
|
+
- deep-research-pre-agent # Kimi Swarm pode se destacar aqui
|
|
643
|
+
condition: "Only if GLM-5 not qualified for task"
|
|
644
|
+
|
|
645
|
+
consolidated_report:
|
|
646
|
+
output: "squads/squad-creator-pro/test-cases/cross-provider/DASHBOARD.yaml"
|
|
647
|
+
|
|
648
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
649
|
+
# FAILURE PATHS
|
|
650
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
651
|
+
|
|
652
|
+
failure_paths:
|
|
653
|
+
- scenario: "Model API unavailable"
|
|
654
|
+
action: "Skip model, try next in wave. Log error."
|
|
655
|
+
|
|
656
|
+
- scenario: ">50% runs fail"
|
|
657
|
+
action: "Mark as NOT_QUALIFIED. Model unreliable."
|
|
658
|
+
|
|
659
|
+
- scenario: "Opposite decision (PASS vs FAIL)"
|
|
660
|
+
action: "Mark as NOT_QUALIFIED. Quality unacceptable."
|
|
661
|
+
|
|
662
|
+
- scenario: "PT-BR score < 7.0"
|
|
663
|
+
action: "Mark as NOT_QUALIFIED for PT-BR tasks. May still qualify for EN-only."
|
|
664
|
+
|
|
665
|
+
- scenario: "Latency > 60s avg"
|
|
666
|
+
action: "Mark as QUALIFIED_BATCH_ONLY. Not for sync use."
|
|
667
|
+
|
|
668
|
+
- scenario: "Privacy risk = high AND sensitive task"
|
|
669
|
+
action: "Recommend self-hosting. Do not use API for sensitive data."
|
|
670
|
+
|
|
671
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
672
|
+
# OUTPUTS
|
|
673
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
674
|
+
|
|
675
|
+
outputs:
|
|
676
|
+
per_task:
|
|
677
|
+
- "test-cases/cross-provider/{task_name}/{model}/opus-baseline.yaml"
|
|
678
|
+
- "test-cases/cross-provider/{task_name}/{model}/run-{N}.yaml"
|
|
679
|
+
- "test-cases/cross-provider/{task_name}/{model}/quality-comparison.yaml"
|
|
680
|
+
- "test-cases/cross-provider/{task_name}/{model}/ptbr-{id}.yaml"
|
|
681
|
+
- "test-cases/cross-provider/{task_name}/{model}/qualification-report.yaml"
|
|
682
|
+
|
|
683
|
+
batch:
|
|
684
|
+
- "test-cases/cross-provider/DASHBOARD.yaml"
|
|
685
|
+
|
|
686
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
687
|
+
# METADATA
|
|
688
|
+
# ═══════════════════════════════════════════════════════════════════════════════
|
|
689
|
+
|
|
690
|
+
metadata:
|
|
691
|
+
version: "1.0"
|
|
692
|
+
created: "2026-02-12"
|
|
693
|
+
author: "@architect"
|
|
694
|
+
|
|
695
|
+
dependencies:
|
|
696
|
+
- "infrastructure/services/llm-router/" # Para chamar modelos externos
|
|
697
|
+
- "wf-model-tier-qualification.yaml" # Comparison logic
|
|
698
|
+
- "validation-glm-5.md" # GLM-5 validation report
|
|
699
|
+
- "validation-kimi-k2-5.md" # Kimi validation report
|
|
700
|
+
|
|
701
|
+
changelog:
|
|
702
|
+
- version: "1.0"
|
|
703
|
+
date: "2026-02-12"
|
|
704
|
+
changes:
|
|
705
|
+
- "Initial workflow based on tier-qualification pattern"
|
|
706
|
+
- "Added external_models registry (GLM-5, Kimi K2.5)"
|
|
707
|
+
- "Added Phase 2: Reliability test (multiple runs)"
|
|
708
|
+
- "Added Phase 4: PT-BR quality test"
|
|
709
|
+
- "Added privacy risk assessment"
|
|
710
|
+
- "Added latency tracking and batch-only verdict"
|
|
711
|
+
- "5 cross_provider_candidates defined"
|