aiox-core 5.0.2 → 5.0.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.aiox-core/data/entity-registry.yaml +748 -763
- package/.aiox-core/install-manifest.yaml +4 -4
- package/package.json +6 -1
- package/pro/feature-registry.yaml +223 -0
- package/pro/package.json +39 -0
- package/pro/pro-config.yaml +63 -0
- package/pro/squads/README.md +24 -0
- package/pro/squads/design/HEADLINE.md +3 -0
- package/pro/squads/design/README.md +109 -0
- package/pro/squads/design/agents/brad-frost.md +1097 -0
- package/pro/squads/design/agents/dan-mall.md +857 -0
- package/pro/squads/design/agents/dave-malouf.md +2272 -0
- package/pro/squads/design/agents/design-chief.md +114 -0
- package/pro/squads/design/agents/ds-foundations-lead.md +194 -0
- package/pro/squads/design/agents/ds-token-architect.md +361 -0
- package/pro/squads/design/agents/nano-banana-generator.md +162 -0
- package/pro/squads/design/agents/storybook-expert.md +809 -0
- package/pro/squads/design/checklists/atomic-refactor-checklist.md +299 -0
- package/pro/squads/design/checklists/component-adaptation-checklist.md +81 -0
- package/pro/squads/design/checklists/design-fidelity-checklist.md +283 -0
- package/pro/squads/design/checklists/design-handoff-checklist.md +55 -0
- package/pro/squads/design/checklists/design-team-health-checklist.md +454 -0
- package/pro/squads/design/checklists/designops-maturity-checklist.md +518 -0
- package/pro/squads/design/checklists/ds-a11y-release-gate-checklist.md +45 -0
- package/pro/squads/design/checklists/ds-accessibility-wcag-checklist.md +147 -0
- package/pro/squads/design/checklists/ds-component-quality-checklist.md +150 -0
- package/pro/squads/design/checklists/ds-critical-eye-review-checklist.md +147 -0
- package/pro/squads/design/checklists/ds-migration-readiness-checklist.md +99 -0
- package/pro/squads/design/checklists/ds-pattern-audit-checklist.md +164 -0
- package/pro/squads/design/checklists/reading-accessibility-checklist.md +275 -0
- package/pro/squads/design/checklists/token-mapping-checklist.md +107 -0
- package/pro/squads/design/config/coding-standards.md +286 -0
- package/pro/squads/design/config/source-tree.md +59 -0
- package/pro/squads/design/config/tech-stack.md +48 -0
- package/pro/squads/design/config.yaml +204 -0
- package/pro/squads/design/data/agentic-design-systems-guide.md +46 -0
- package/pro/squads/design/data/agentic-ds-principles.md +100 -0
- package/pro/squads/design/data/atomic-design-principles.md +108 -0
- package/pro/squads/design/data/atomic-refactor-rules.md +582 -0
- package/pro/squads/design/data/base-component-specs.md +972 -0
- package/pro/squads/design/data/brad-frost-analysis-extract-implicit.yaml +270 -0
- package/pro/squads/design/data/brad-frost-analysis-find-0.8.yaml +176 -0
- package/pro/squads/design/data/brad-frost-analysis-qa-report.yaml +168 -0
- package/pro/squads/design/data/brad-frost-dna.yaml +713 -0
- package/pro/squads/design/data/capability-tools.yaml +124 -0
- package/pro/squads/design/data/component-adaptation-changelog.md +318 -0
- package/pro/squads/design/data/consolidation-algorithms.md +168 -0
- package/pro/squads/design/data/critical-eye-scoring-rules.yaml +240 -0
- package/pro/squads/design/data/design-token-best-practices.md +107 -0
- package/pro/squads/design/data/design-tokens-spec.yaml +418 -0
- package/pro/squads/design/data/ds-reference-architectures.md +93 -0
- package/pro/squads/design/data/f2-qa-report.md +168 -0
- package/pro/squads/design/data/f3-derived-components-changelog.md +100 -0
- package/pro/squads/design/data/f3-qa-report.md +208 -0
- package/pro/squads/design/data/figma-base-components-raw.md +102 -0
- package/pro/squads/design/data/figma-tokens-raw.md +1549 -0
- package/pro/squads/design/data/fluent2-design-principles.md +114 -0
- package/pro/squads/design/data/high-retention-reading-guide.md +349 -0
- package/pro/squads/design/data/integration-patterns.md +207 -0
- package/pro/squads/design/data/internal-quality-chain.yaml +48 -0
- package/pro/squads/design/data/motion-tokens-guide.md +202 -0
- package/pro/squads/design/data/roi-calculation-guide.md +142 -0
- package/pro/squads/design/data/token-mapping-reference.md +213 -0
- package/pro/squads/design/data/w3c-dtcg-spec-reference.md +149 -0
- package/pro/squads/design/data/wcag-compliance-guide.md +267 -0
- package/pro/squads/design/docs/AUDIT_REPORT.md +97 -0
- package/pro/squads/design/docs/DS-CURATION-PIPELINE-PROPOSAL.md +577 -0
- package/pro/squads/design/docs/UPGRADE_PLAN.md +618 -0
- package/pro/squads/design/docs/brad-frost-research-validation.md +372 -0
- package/pro/squads/design/docs/dave-malouf-research-validation.md +391 -0
- package/pro/squads/design/docs/tool-discovery-report.md +87 -0
- package/pro/squads/design/docs/tool-integration-plan.md +44 -0
- package/pro/squads/design/protocols/ai-first-governance.md +56 -0
- package/pro/squads/design/protocols/governance-execution-boundary.md +59 -0
- package/pro/squads/design/protocols/handoff.md +60 -0
- package/pro/squads/design/rules/.claude-rules.md +88 -0
- package/pro/squads/design/scripts/design-system/curate_colors.cjs +447 -0
- package/pro/squads/design/scripts/design-system/curate_components.cjs +217 -0
- package/pro/squads/design/scripts/design-system/curate_radius.cjs +190 -0
- package/pro/squads/design/scripts/design-system/curate_shadows.cjs +208 -0
- package/pro/squads/design/scripts/design-system/curate_spacing.cjs +243 -0
- package/pro/squads/design/scripts/design-system/curate_typography.cjs +404 -0
- package/pro/squads/design/scripts/design-system/design-system-metadata.test.js +49 -0
- package/pro/squads/design/scripts/design-system/design_manifest_lib.cjs +142 -0
- package/pro/squads/design/scripts/design-system/fetch_page_images.cjs +195 -0
- package/pro/squads/design/scripts/design-system/generate_components_metadata.cjs +114 -0
- package/pro/squads/design/scripts/design-system/generate_curation_report.cjs +258 -0
- package/pro/squads/design/scripts/design-system/generate_tokens.cjs +342 -0
- package/pro/squads/design/scripts/design-system/sync_design_manifest.cjs +27 -0
- package/pro/squads/design/scripts/design-system/test_mcp_tools.cjs +232 -0
- package/pro/squads/design/scripts/design-system/validate_components_metadata.cjs +96 -0
- package/pro/squads/design/scripts/design-system/validate_curation.cjs +226 -0
- package/pro/squads/design/scripts/design-system/validate_design_manifest_drift.cjs +72 -0
- package/pro/squads/design/scripts/design-system/validate_mcp_skeleton.cjs +38 -0
- package/pro/squads/design/scripts/design-system/validate_registry.cjs +186 -0
- package/pro/squads/design/scripts/design-system/validate_task_checklist_bindings.cjs +78 -0
- package/pro/squads/design/scripts/dissect-artifact.cjs +806 -0
- package/pro/squads/design/scripts/validate-a11y-integration.cjs +40 -0
- package/pro/squads/design/scripts/validate-design-squad.py +411 -0
- package/pro/squads/design/squad.yaml +714 -0
- package/pro/squads/design/tasks/a11y-audit.md +340 -0
- package/pro/squads/design/tasks/aria-audit.md +525 -0
- package/pro/squads/design/tasks/atomic-refactor-execute.md +391 -0
- package/pro/squads/design/tasks/atomic-refactor-plan.md +262 -0
- package/pro/squads/design/tasks/audit-reading-experience.md +350 -0
- package/pro/squads/design/tasks/audit-tailwind-config.md +101 -0
- package/pro/squads/design/tasks/bootstrap-shadcn-library.md +96 -0
- package/pro/squads/design/tasks/bundle-audit.md +245 -0
- package/pro/squads/design/tasks/contrast-matrix.md +373 -0
- package/pro/squads/design/tasks/create-doc.md +135 -0
- package/pro/squads/design/tasks/dead-code-detection.md +329 -0
- package/pro/squads/design/tasks/design-compare.md +414 -0
- package/pro/squads/design/tasks/design-process-optimization.md +407 -0
- package/pro/squads/design/tasks/design-review-orchestration.md +99 -0
- package/pro/squads/design/tasks/design-team-scaling.md +407 -0
- package/pro/squads/design/tasks/design-tooling-audit.md +404 -0
- package/pro/squads/design/tasks/design-triage.md +89 -0
- package/pro/squads/design/tasks/designops-maturity-assessment.md +364 -0
- package/pro/squads/design/tasks/designops-metrics-setup.md +465 -0
- package/pro/squads/design/tasks/ds-agentic-audit.md +100 -0
- package/pro/squads/design/tasks/ds-agentic-setup.md +103 -0
- package/pro/squads/design/tasks/ds-audit-codebase.md +273 -0
- package/pro/squads/design/tasks/ds-build-component.md +349 -0
- package/pro/squads/design/tasks/ds-build-mcp-server.md +84 -0
- package/pro/squads/design/tasks/ds-calculate-roi.md +282 -0
- package/pro/squads/design/tasks/ds-compose-molecule.md +106 -0
- package/pro/squads/design/tasks/ds-consolidate-patterns.md +253 -0
- package/pro/squads/design/tasks/ds-context-contract.md +194 -0
- package/pro/squads/design/tasks/ds-critical-eye-compare.md +130 -0
- package/pro/squads/design/tasks/ds-critical-eye-decide.md +139 -0
- package/pro/squads/design/tasks/ds-critical-eye-inventory.md +111 -0
- package/pro/squads/design/tasks/ds-critical-eye-report.md +101 -0
- package/pro/squads/design/tasks/ds-critical-eye-score.md +109 -0
- package/pro/squads/design/tasks/ds-designops.md +99 -0
- package/pro/squads/design/tasks/ds-extend-pattern.md +91 -0
- package/pro/squads/design/tasks/ds-extract-tokens.md +312 -0
- package/pro/squads/design/tasks/ds-figma-pipeline.md +95 -0
- package/pro/squads/design/tasks/ds-fluent-audit.md +105 -0
- package/pro/squads/design/tasks/ds-fluent-build.md +110 -0
- package/pro/squads/design/tasks/ds-generate-ai-metadata.md +81 -0
- package/pro/squads/design/tasks/ds-generate-cursor-rules.md +74 -0
- package/pro/squads/design/tasks/ds-generate-documentation.md +101 -0
- package/pro/squads/design/tasks/ds-generate-migration-strategy.md +331 -0
- package/pro/squads/design/tasks/ds-generate-shock-report.md +323 -0
- package/pro/squads/design/tasks/ds-govern-a11y-compliance.md +93 -0
- package/pro/squads/design/tasks/ds-governance.md +187 -0
- package/pro/squads/design/tasks/ds-health-metrics.md +278 -0
- package/pro/squads/design/tasks/ds-integrate-squad.md +130 -0
- package/pro/squads/design/tasks/ds-integrate-workspace.md +100 -0
- package/pro/squads/design/tasks/ds-legacy-modernization.md +302 -0
- package/pro/squads/design/tasks/ds-mcp-status.md +65 -0
- package/pro/squads/design/tasks/ds-motion-audit.md +118 -0
- package/pro/squads/design/tasks/ds-multi-framework.md +96 -0
- package/pro/squads/design/tasks/ds-parallelization-gate.md +246 -0
- package/pro/squads/design/tasks/ds-query.md +90 -0
- package/pro/squads/design/tasks/ds-rebuild-artifact.md +369 -0
- package/pro/squads/design/tasks/ds-reverse-engineer.md +194 -0
- package/pro/squads/design/tasks/ds-scan-artifact.md +131 -0
- package/pro/squads/design/tasks/ds-setup-design-system.md +297 -0
- package/pro/squads/design/tasks/ds-sync-registry.md +287 -0
- package/pro/squads/design/tasks/ds-theme-multi-brand.md +90 -0
- package/pro/squads/design/tasks/ds-token-modes.md +108 -0
- package/pro/squads/design/tasks/ds-token-w3c-extract.md +105 -0
- package/pro/squads/design/tasks/ds-validate-ai-readiness.md +69 -0
- package/pro/squads/design/tasks/ds-visual-regression.md +130 -0
- package/pro/squads/design/tasks/execute-checklist.md +141 -0
- package/pro/squads/design/tasks/export-design-tokens-dtcg.md +97 -0
- package/pro/squads/design/tasks/f1-apply-foundations.md +154 -0
- package/pro/squads/design/tasks/f1-ingest-figma-tokens.md +130 -0
- package/pro/squads/design/tasks/f1-map-tokens-to-shadcn.md +145 -0
- package/pro/squads/design/tasks/f1-qa-foundations.md +95 -0
- package/pro/squads/design/tasks/f2-adapt-shadcn-components.md +155 -0
- package/pro/squads/design/tasks/f2-ingest-base-components.md +148 -0
- package/pro/squads/design/tasks/f2-qa-base-components.md +98 -0
- package/pro/squads/design/tasks/f3-derive-components.md +145 -0
- package/pro/squads/design/tasks/f3-qa-derived-components.md +101 -0
- package/pro/squads/design/tasks/focus-order-audit.md +450 -0
- package/pro/squads/design/tasks/sb-brownfield-migrate.md +367 -0
- package/pro/squads/design/tasks/sb-brownfield-scan.md +318 -0
- package/pro/squads/design/tasks/sb-configure.md +230 -0
- package/pro/squads/design/tasks/sb-expand-shadcn.md +213 -0
- package/pro/squads/design/tasks/sb-generate-all-stories.md +288 -0
- package/pro/squads/design/tasks/sb-install.md +152 -0
- package/pro/squads/design/tasks/sb-sync-workspace.md +239 -0
- package/pro/squads/design/tasks/sb-verify.md +203 -0
- package/pro/squads/design/tasks/tailwind-upgrade.md +117 -0
- package/pro/squads/design/tasks/token-usage-analytics.md +262 -0
- package/pro/squads/design/tasks/ux-rewrite-sixth-grade.md +82 -0
- package/pro/squads/design/tasks/validate-design-fidelity.md +222 -0
- package/pro/squads/design/templates/agent-template.yaml +46 -0
- package/pro/squads/design/templates/clone-mind-template.md +352 -0
- package/pro/squads/design/templates/component-prompt-injection-tmpl.md +236 -0
- package/pro/squads/design/templates/component-visual-spec-tmpl.md +378 -0
- package/pro/squads/design/templates/critical-eye-cycle-report-tmpl.md +165 -0
- package/pro/squads/design/templates/design-fidelity-report-tmpl.md +155 -0
- package/pro/squads/design/templates/ds-ai-component-metadata-schema-tmpl.json +138 -0
- package/pro/squads/design/templates/ds-artifact-analysis.md +70 -0
- package/pro/squads/design/templates/ds-health-report-tmpl.md +236 -0
- package/pro/squads/design/templates/ds-migration-strategy-tmpl.md +524 -0
- package/pro/squads/design/templates/ds-state-persistence-tmpl.yaml +194 -0
- package/pro/squads/design/templates/ds-tokens-schema-tmpl.yaml +139 -0
- package/pro/squads/design/templates/migration-strategy-tmpl.md +524 -0
- package/pro/squads/design/templates/reading-design-tokens.css +26 -0
- package/pro/squads/design/templates/state-persistence-tmpl.yaml +219 -0
- package/pro/squads/design/templates/tokens-schema-tmpl.yaml +305 -0
- package/pro/squads/design/workflows/agentic-readiness.yaml +83 -0
- package/pro/squads/design/workflows/audit-only.yaml +198 -0
- package/pro/squads/design/workflows/brownfield-complete.yaml +257 -0
- package/pro/squads/design/workflows/critical-eye.yaml +184 -0
- package/pro/squads/design/workflows/dtcg-tokens-governance.yaml +64 -0
- package/pro/squads/design/workflows/foundations-pipeline.yaml +192 -0
- package/pro/squads/design/workflows/greenfield-new.yaml +192 -0
- package/pro/squads/design/workflows/motion-quality.yaml +65 -0
- package/pro/squads/design/workflows/self-healing-workflow.yaml +237 -0
- package/pro/squads/design/workflows/storybook-brownfield-migration.yaml +400 -0
- package/pro/squads/design/workflows/storybook-full-setup.yaml +280 -0
- package/pro/squads/index.js +145 -0
- package/pro/squads/squad-creator-pro/.state.json +32 -0
- package/pro/squads/squad-creator-pro/CHANGELOG.md +275 -0
- package/pro/squads/squad-creator-pro/HEADLINE.md +3 -0
- package/pro/squads/squad-creator-pro/README.md +1059 -0
- package/pro/squads/squad-creator-pro/agents/oalanicolas.md +438 -0
- package/pro/squads/squad-creator-pro/agents/pedro-valerio.md +449 -0
- package/pro/squads/squad-creator-pro/agents/squad-chief.md +1651 -0
- package/pro/squads/squad-creator-pro/agents/thiago_finch.md +976 -0
- package/pro/squads/squad-creator-pro/assessments/axioma-assessment-wf-create-squad.yaml +325 -0
- package/pro/squads/squad-creator-pro/checklists/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/checklists/agent-depth-checklist.md +244 -0
- package/pro/squads/squad-creator-pro/checklists/agent-quality-gate.md +434 -0
- package/pro/squads/squad-creator-pro/checklists/create-agent-checklist.md +184 -0
- package/pro/squads/squad-creator-pro/checklists/create-squad-checklist.md +219 -0
- package/pro/squads/squad-creator-pro/checklists/create-workflow-checklist.md +224 -0
- package/pro/squads/squad-creator-pro/checklists/deep-research-quality.md +506 -0
- package/pro/squads/squad-creator-pro/checklists/executor-matrix-checklist.md +260 -0
- package/pro/squads/squad-creator-pro/checklists/mental-model-integration-checklist.md +95 -0
- package/pro/squads/squad-creator-pro/checklists/mind-validation.md +374 -0
- package/pro/squads/squad-creator-pro/checklists/quality-gate-checklist.md +385 -0
- package/pro/squads/squad-creator-pro/checklists/smoke-test-agent.md +313 -0
- package/pro/squads/squad-creator-pro/checklists/sop-validation.md +250 -0
- package/pro/squads/squad-creator-pro/checklists/squad-checklist.md +1014 -0
- package/pro/squads/squad-creator-pro/checklists/squad-overview-checklist.md +393 -0
- package/pro/squads/squad-creator-pro/checklists/task-anatomy-checklist.md +626 -0
- package/pro/squads/squad-creator-pro/config/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/config/axioma-validator.yaml +371 -0
- package/pro/squads/squad-creator-pro/config/heuristics.yaml +753 -0
- package/pro/squads/squad-creator-pro/config/model-routing.yaml +693 -0
- package/pro/squads/squad-creator-pro/config/quality-gates.yaml +415 -0
- package/pro/squads/squad-creator-pro/config/scoring-rubric.yaml +199 -0
- package/pro/squads/squad-creator-pro/config/squad-config.yaml +165 -0
- package/pro/squads/squad-creator-pro/config/task-anatomy.yaml +263 -0
- package/pro/squads/squad-creator-pro/config/veto-conditions.yaml +455 -0
- package/pro/squads/squad-creator-pro/config.yaml +35 -0
- package/pro/squads/squad-creator-pro/data/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/data/an-anchor-words.yaml +78 -0
- package/pro/squads/squad-creator-pro/data/an-clone-anti-patterns.yaml +148 -0
- package/pro/squads/squad-creator-pro/data/an-clone-validation.yaml +190 -0
- package/pro/squads/squad-creator-pro/data/an-diagnostic-framework.yaml +164 -0
- package/pro/squads/squad-creator-pro/data/an-output-examples.yaml +102 -0
- package/pro/squads/squad-creator-pro/data/an-source-signals.yaml +98 -0
- package/pro/squads/squad-creator-pro/data/an-source-tiers.yaml +119 -0
- package/pro/squads/squad-creator-pro/data/best-practices.md +986 -0
- package/pro/squads/squad-creator-pro/data/core-heuristics.md +510 -0
- package/pro/squads/squad-creator-pro/data/decision-heuristics-framework.md +620 -0
- package/pro/squads/squad-creator-pro/data/executor-decision-tree.md +774 -0
- package/pro/squads/squad-creator-pro/data/executor-matrix-framework.md +441 -0
- package/pro/squads/squad-creator-pro/data/fusion-decision-points-analysis.md +397 -0
- package/pro/squads/squad-creator-pro/data/fusion-executor-analysis.md +677 -0
- package/pro/squads/squad-creator-pro/data/hybridops-patterns.md +1351 -0
- package/pro/squads/squad-creator-pro/data/internal-infrastructure-library.yaml +99 -0
- package/pro/squads/squad-creator-pro/data/mental-model-task-matrix.yaml +692 -0
- package/pro/squads/squad-creator-pro/data/pipeline-patterns.md +352 -0
- package/pro/squads/squad-creator-pro/data/pm-best-practices.md +440 -0
- package/pro/squads/squad-creator-pro/data/pv-anchor-words.yaml +64 -0
- package/pro/squads/squad-creator-pro/data/pv-authenticity-markers.yaml +200 -0
- package/pro/squads/squad-creator-pro/data/pv-meta-axiomas.yaml +162 -0
- package/pro/squads/squad-creator-pro/data/pv-output-examples.yaml +342 -0
- package/pro/squads/squad-creator-pro/data/pv-workflow-validation.yaml +318 -0
- package/pro/squads/squad-creator-pro/data/quality-dimensions-framework.md +405 -0
- package/pro/squads/squad-creator-pro/data/squad-analytics-guide.md +252 -0
- package/pro/squads/squad-creator-pro/data/squad-kb.md +987 -0
- package/pro/squads/squad-creator-pro/data/squad-registry.yaml +841 -0
- package/pro/squads/squad-creator-pro/data/squad-type-definitions.yaml +578 -0
- package/pro/squads/squad-creator-pro/data/tier-system-framework.md +475 -0
- package/pro/squads/squad-creator-pro/data/tool-evaluation-framework.md +847 -0
- package/pro/squads/squad-creator-pro/data/tool-registry.yaml +700 -0
- package/pro/squads/squad-creator-pro/docs/ADR-001-model-tier-qualification.md +344 -0
- package/pro/squads/squad-creator-pro/docs/AGENT-COLLABORATION.md +609 -0
- package/pro/squads/squad-creator-pro/docs/ARCHITECTURE-DIAGRAMS.md +1466 -0
- package/pro/squads/squad-creator-pro/docs/COMMANDS.md +544 -0
- package/pro/squads/squad-creator-pro/docs/CONCEPTS.md +584 -0
- package/pro/squads/squad-creator-pro/docs/FAQ.md +731 -0
- package/pro/squads/squad-creator-pro/docs/HITL-FLOW.md +255 -0
- package/pro/squads/squad-creator-pro/docs/MIGRATION-PLAN-AGENT-CONFORMITY.md +861 -0
- package/pro/squads/squad-creator-pro/docs/MIGRATION-ROADMAP-HYBRIDOPS.md +1161 -0
- package/pro/squads/squad-creator-pro/docs/MODEL-TIER-QUALIFICATION.md +337 -0
- package/pro/squads/squad-creator-pro/docs/PATTERN-LIBRARY.md +333 -0
- package/pro/squads/squad-creator-pro/docs/PEDRO-VALERIO-ARCHITECTURE.md +456 -0
- package/pro/squads/squad-creator-pro/docs/POR-ONDE-COMECAR.md +210 -0
- package/pro/squads/squad-creator-pro/docs/QUICK-START.md +205 -0
- package/pro/squads/squad-creator-pro/docs/RFC-001-deterministic-refactoring.md +463 -0
- package/pro/squads/squad-creator-pro/docs/TOOL-RECOMMENDATIONS.md +379 -0
- package/pro/squads/squad-creator-pro/docs/TROUBLESHOOTING.md +412 -0
- package/pro/squads/squad-creator-pro/docs/TUTORIAL-COMPLETO.md +458 -0
- package/pro/squads/squad-creator-pro/docs/optimize-v4-proposal.md +354 -0
- package/pro/squads/squad-creator-pro/docs/session-report-2026-02-01.md +411 -0
- package/pro/squads/squad-creator-pro/docs/sop-extraction-process.md +674 -0
- package/pro/squads/squad-creator-pro/docs/squad-chief-agent-flow.md +981 -0
- package/pro/squads/squad-creator-pro/docs/squad-creation-pipeline-workflow.md +937 -0
- package/pro/squads/squad-creator-pro/docs/task-optimization-framework.md +229 -0
- package/pro/squads/squad-creator-pro/docs/validation-report-2026-02-01.md +439 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/artifacts/HANDOFF_PROTOCOL.md +269 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/artifacts/SOURCE_CLASSIFICATION.md +258 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_001.md +166 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_002.md +206 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_003.md +239 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_004.md +153 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_005.md +161 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_006.md +166 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_007.md +190 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_008.md +191 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_009.md +234 -0
- package/pro/squads/squad-creator-pro/minds/oalanicolas/heuristics/AN_KE_010.md +240 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/artifacts/Assinatura_Linguistica.md +355 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/artifacts/META_AXIOMAS.md +277 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_BS_001.md +144 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_PA_001.md +174 -0
- package/pro/squads/squad-creator-pro/minds/pedro_valerio/heuristics/PV_PM_001.md +191 -0
- package/pro/squads/squad-creator-pro/package.json +26 -0
- package/pro/squads/squad-creator-pro/protocols/ai-first-governance.md +63 -0
- package/pro/squads/squad-creator-pro/scripts/README.md +246 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/dependency_check.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/inventory.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/naming_validator.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/quality_gate.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/scoring.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/__pycache__/yaml_validator.cpython-314.pyc +0 -0
- package/pro/squads/squad-creator-pro/scripts/assess-sources.sh +443 -0
- package/pro/squads/squad-creator-pro/scripts/checklist_validator.py +451 -0
- package/pro/squads/squad-creator-pro/scripts/clone-review.sh +394 -0
- package/pro/squads/squad-creator-pro/scripts/coherence-validator.py +836 -0
- package/pro/squads/squad-creator-pro/scripts/create-agent-preflight.py +243 -0
- package/pro/squads/squad-creator-pro/scripts/cross-provider/compare-results.js +281 -0
- package/pro/squads/squad-creator-pro/scripts/cross-provider/cross-provider-runner.js +462 -0
- package/pro/squads/squad-creator-pro/scripts/dependency_check.py +333 -0
- package/pro/squads/squad-creator-pro/scripts/fidelity-score.sh +519 -0
- package/pro/squads/squad-creator-pro/scripts/generate-squad-greeting.js +426 -0
- package/pro/squads/squad-creator-pro/scripts/generate-squad-guide.js +558 -0
- package/pro/squads/squad-creator-pro/scripts/inventory.py +269 -0
- package/pro/squads/squad-creator-pro/scripts/lib/config-loader.js +151 -0
- package/pro/squads/squad-creator-pro/scripts/model-tier-validator.cjs +369 -0
- package/pro/squads/squad-creator-pro/scripts/model-usage-logger.cjs +245 -0
- package/pro/squads/squad-creator-pro/scripts/modernization-score.sh +308 -0
- package/pro/squads/squad-creator-pro/scripts/naming_validator.py +299 -0
- package/pro/squads/squad-creator-pro/scripts/on-specialist-complete.py +98 -0
- package/pro/squads/squad-creator-pro/scripts/quality_gate.py +413 -0
- package/pro/squads/squad-creator-pro/scripts/refresh-registry.py +270 -0
- package/pro/squads/squad-creator-pro/scripts/save-session-metrics.py +136 -0
- package/pro/squads/squad-creator-pro/scripts/scaffold-squad.cjs +281 -0
- package/pro/squads/squad-creator-pro/scripts/scoring.py +395 -0
- package/pro/squads/squad-creator-pro/scripts/security_scanner.py +378 -0
- package/pro/squads/squad-creator-pro/scripts/squad-analytics.py +585 -0
- package/pro/squads/squad-creator-pro/scripts/squad-context-loader.cjs +205 -0
- package/pro/squads/squad-creator-pro/scripts/squad-state-manager.cjs +451 -0
- package/pro/squads/squad-creator-pro/scripts/squad-workflow-runner.cjs +471 -0
- package/pro/squads/squad-creator-pro/scripts/squad_utils.py +261 -0
- package/pro/squads/squad-creator-pro/scripts/sync-ide-command.py +590 -0
- package/pro/squads/squad-creator-pro/scripts/tests/__init__.py +1 -0
- package/pro/squads/squad-creator-pro/scripts/tests/conftest.py +309 -0
- package/pro/squads/squad-creator-pro/scripts/tests/run_bash_tests.sh +29 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_assess_sources.sh +216 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_checklist_validator.py +396 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_clone_review.sh +239 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_coherence_validator.py +212 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_dependency_check.py +361 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_fidelity_score.sh +298 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_inventory.py +307 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_modernization_score.sh +211 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_naming_validator.py +373 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_quality_gate.py +280 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_refresh_registry.py +338 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_scoring.py +366 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_security_scanner.py +354 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_squad_analytics.py +450 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_validate_clone.sh +252 -0
- package/pro/squads/squad-creator-pro/scripts/tests/test_yaml_validator.py +412 -0
- package/pro/squads/squad-creator-pro/scripts/validate-agent-output.py +115 -0
- package/pro/squads/squad-creator-pro/scripts/validate-all.sh +49 -0
- package/pro/squads/squad-creator-pro/scripts/validate-squad-structure.py +535 -0
- package/pro/squads/squad-creator-pro/scripts/validate-squad.sh +944 -0
- package/pro/squads/squad-creator-pro/scripts/yaml_validator.py +528 -0
- package/pro/squads/squad-creator-pro/skills/squad.md +301 -0
- package/pro/squads/squad-creator-pro/squad.yaml +36 -0
- package/pro/squads/squad-creator-pro/tasks/CHANGELOG.md +80 -0
- package/pro/squads/squad-creator-pro/tasks/an-assess-sources.md +78 -0
- package/pro/squads/squad-creator-pro/tasks/an-clone-review.md +104 -0
- package/pro/squads/squad-creator-pro/tasks/an-compare-outputs.md +354 -0
- package/pro/squads/squad-creator-pro/tasks/an-design-clone.md +79 -0
- package/pro/squads/squad-creator-pro/tasks/an-diagnose-clone.md +87 -0
- package/pro/squads/squad-creator-pro/tasks/an-extract-dna.md +90 -0
- package/pro/squads/squad-creator-pro/tasks/an-extract-framework.md +100 -0
- package/pro/squads/squad-creator-pro/tasks/an-fidelity-score.md +108 -0
- package/pro/squads/squad-creator-pro/tasks/an-validate-clone.md +96 -0
- package/pro/squads/squad-creator-pro/tasks/auto-acquire-sources.md +349 -0
- package/pro/squads/squad-creator-pro/tasks/collect-sources.md +533 -0
- package/pro/squads/squad-creator-pro/tasks/create-agent.md +768 -0
- package/pro/squads/squad-creator-pro/tasks/create-documentation.md +258 -0
- package/pro/squads/squad-creator-pro/tasks/create-pipeline.md +296 -0
- package/pro/squads/squad-creator-pro/tasks/create-squad.md +933 -0
- package/pro/squads/squad-creator-pro/tasks/create-task.md +1148 -0
- package/pro/squads/squad-creator-pro/tasks/create-template.md +474 -0
- package/pro/squads/squad-creator-pro/tasks/create-workflow.md +720 -0
- package/pro/squads/squad-creator-pro/tasks/deconstruct.md +167 -0
- package/pro/squads/squad-creator-pro/tasks/deep-research-pre-agent.md +566 -0
- package/pro/squads/squad-creator-pro/tasks/detect-squad-context.md +81 -0
- package/pro/squads/squad-creator-pro/tasks/discover-tools.md +944 -0
- package/pro/squads/squad-creator-pro/tasks/extract-implicit.md +352 -0
- package/pro/squads/squad-creator-pro/tasks/extract-knowledge.md +577 -0
- package/pro/squads/squad-creator-pro/tasks/extract-sop.md +320 -0
- package/pro/squads/squad-creator-pro/tasks/extract-thinking-dna.md +653 -0
- package/pro/squads/squad-creator-pro/tasks/extract-voice-dna.md +619 -0
- package/pro/squads/squad-creator-pro/tasks/find-0.8.md +222 -0
- package/pro/squads/squad-creator-pro/tasks/install-commands.md +373 -0
- package/pro/squads/squad-creator-pro/tasks/lookup-model.md +78 -0
- package/pro/squads/squad-creator-pro/tasks/migrate-workflows-to-yaml.md +259 -0
- package/pro/squads/squad-creator-pro/tasks/next-squad.md +487 -0
- package/pro/squads/squad-creator-pro/tasks/optimize-workflow.md +851 -0
- package/pro/squads/squad-creator-pro/tasks/optimize.md +1082 -0
- package/pro/squads/squad-creator-pro/tasks/parallel-discovery.md +58 -0
- package/pro/squads/squad-creator-pro/tasks/pv-audit.md +244 -0
- package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment-wf-clone-mind.yaml +256 -0
- package/pro/squads/squad-creator-pro/tasks/pv-axioma-assessment.md +83 -0
- package/pro/squads/squad-creator-pro/tasks/pv-modernization-score.md +83 -0
- package/pro/squads/squad-creator-pro/tasks/qa-after-creation.md +475 -0
- package/pro/squads/squad-creator-pro/tasks/qualify-task.md +265 -0
- package/pro/squads/squad-creator-pro/tasks/reexecute-squad-phase.md +64 -0
- package/pro/squads/squad-creator-pro/tasks/refresh-registry.md +403 -0
- package/pro/squads/squad-creator-pro/tasks/smoke-test-model-routing.md +167 -0
- package/pro/squads/squad-creator-pro/tasks/squad-analytics.md +265 -0
- package/pro/squads/squad-creator-pro/tasks/squad-fusion.md +817 -0
- package/pro/squads/squad-creator-pro/tasks/squad-overview.md +683 -0
- package/pro/squads/squad-creator-pro/tasks/sync-ide-command.md +392 -0
- package/pro/squads/squad-creator-pro/tasks/update-mind.md +428 -0
- package/pro/squads/squad-creator-pro/tasks/upgrade-squad.md +919 -0
- package/pro/squads/squad-creator-pro/tasks/validate-extraction.md +209 -0
- package/pro/squads/squad-creator-pro/tasks/validate-final-artifacts.md +80 -0
- package/pro/squads/squad-creator-pro/tasks/validate-squad.md +1385 -0
- package/pro/squads/squad-creator-pro/templates/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/templates/agent-flow-doc-tmpl.md +512 -0
- package/pro/squads/squad-creator-pro/templates/agent-tmpl.md +697 -0
- package/pro/squads/squad-creator-pro/templates/config-tmpl.yaml +352 -0
- package/pro/squads/squad-creator-pro/templates/handoff-insumos-tmpl.yaml +112 -0
- package/pro/squads/squad-creator-pro/templates/orchestrator-tmpl.md +74 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-progress-tmpl.py +373 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-runner-tmpl.py +444 -0
- package/pro/squads/squad-creator-pro/templates/pipeline-state-tmpl.py +413 -0
- package/pro/squads/squad-creator-pro/templates/pop-extractor-prompt.md +549 -0
- package/pro/squads/squad-creator-pro/templates/quality-dashboard-tmpl.md +286 -0
- package/pro/squads/squad-creator-pro/templates/quality-gate-tmpl.yaml +589 -0
- package/pro/squads/squad-creator-pro/templates/readme-tmpl.md +231 -0
- package/pro/squads/squad-creator-pro/templates/research-output-tmpl.md +625 -0
- package/pro/squads/squad-creator-pro/templates/research-prompt-tmpl.md +479 -0
- package/pro/squads/squad-creator-pro/templates/squad-prd-tmpl.md +464 -0
- package/pro/squads/squad-creator-pro/templates/squad-readme-tmpl.md +170 -0
- package/pro/squads/squad-creator-pro/templates/story-create-agent-tmpl.md +284 -0
- package/pro/squads/squad-creator-pro/templates/task-tmpl.md +461 -0
- package/pro/squads/squad-creator-pro/templates/template-tmpl.yaml +227 -0
- package/pro/squads/squad-creator-pro/templates/workflow-doc-tmpl.md +860 -0
- package/pro/squads/squad-creator-pro/templates/workflow-tmpl.yaml +394 -0
- package/pro/squads/squad-creator-pro/test-cases/BATCH-PROGRESS.md +268 -0
- package/pro/squads/squad-creator-pro/test-cases/QUALIFICATION-DASHBOARD.yaml +13 -0
- package/pro/squads/squad-creator-pro/test-cases/_template.yaml +147 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT-SUMMARY.md +275 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/ASSESSMENT_SUMMARY.md +140 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/CHECKPOINT_MATRIX.md +202 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION-REPORT.md +413 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/EXECUTION_NOTES.md +358 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README-v2.2.2.md +299 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/README.md +320 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/TEST-REPORT-v2.1.md +351 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/VERIFICATION-CHECKLIST.txt +247 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/formal-qualification-report.yaml +389 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-output.yaml +366 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.1-output.yaml +452 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.1-output.yaml +281 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/haiku-v2.2.2-output.yaml +332 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/opus-baseline.yaml +517 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/qualification-report.yaml +213 -0
- package/pro/squads/squad-creator-pro/test-cases/an-assess-sources/test-case.yaml +69 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/haiku-round-1.yaml +213 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/opus-baseline.yaml +566 -0
- package/pro/squads/squad-creator-pro/test-cases/an-clone-review/qualification-report.yaml +82 -0
- package/pro/squads/squad-creator-pro/test-cases/an-design-clone/test-case.yaml +102 -0
- package/pro/squads/squad-creator-pro/test-cases/an-extract-dna/test-case.yaml +105 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/haiku-round-1.yaml +262 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/opus-baseline.yaml +266 -0
- package/pro/squads/squad-creator-pro/test-cases/an-fidelity-score/qualification-report.yaml +94 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/haiku-round-1.yaml +282 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/opus-baseline.yaml +470 -0
- package/pro/squads/squad-creator-pro/test-cases/an-validate-clone/qualification-report.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/collect-sources/test-case.yaml +105 -0
- package/pro/squads/squad-creator-pro/test-cases/create-task/test-case.yaml +104 -0
- package/pro/squads/squad-creator-pro/test-cases/cross-provider/DASHBOARD.yaml +11 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-audit/test-case.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/haiku-output.yaml +209 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/opus-baseline.yaml +96 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/sonnet-output.yaml +30 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-axioma-assessment/test-case.yaml +129 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/comparison-round-1.yaml +242 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/haiku-round-1.yaml +393 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/opus-baseline.yaml +488 -0
- package/pro/squads/squad-creator-pro/test-cases/pv-modernization-score/qualification-report.yaml +74 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/haiku-round-1.yaml +292 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/opus-baseline.yaml +603 -0
- package/pro/squads/squad-creator-pro/test-cases/qa-after-creation/qualification-report.yaml +97 -0
- package/pro/squads/squad-creator-pro/test-cases/smoke-test-model-routing/test-case.yaml +100 -0
- package/pro/squads/squad-creator-pro/test-cases/upgrade-squad/test-case.yaml +106 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/comparison-round-1.yaml +223 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1-MINE.yaml +36 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-1.yaml +193 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-2.yaml +303 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/haiku-round-3-v4-task.yaml +149 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-baseline.yaml +529 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/opus-round-3-v4-task.yaml +132 -0
- package/pro/squads/squad-creator-pro/test-cases/validate-squad/qualification-report.yaml +104 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output-v2-calibrated.yaml +200 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/haiku-output.yaml +183 -0
- package/pro/squads/squad-creator-pro/test-cases/wf-clone-mind/opus-baseline.yaml +112 -0
- package/pro/squads/squad-creator-pro/utils/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/workflows/.gitkeep +1 -0
- package/pro/squads/squad-creator-pro/workflows/create-squad.yaml +348 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-discovery.yaml +16 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-integration.yaml +16 -0
- package/pro/squads/squad-creator-pro/workflows/modules/module-quality-gates.yaml +15 -0
- package/pro/squads/squad-creator-pro/workflows/validate-squad.yaml +582 -0
- package/pro/squads/squad-creator-pro/workflows/wf-auto-acquire-sources.yaml +518 -0
- package/pro/squads/squad-creator-pro/workflows/wf-brownfield-upgrade-squad.yaml +46 -0
- package/pro/squads/squad-creator-pro/workflows/wf-clone-mind.yaml +521 -0
- package/pro/squads/squad-creator-pro/workflows/wf-context-aware-create-squad.yaml +47 -0
- package/pro/squads/squad-creator-pro/workflows/wf-create-squad.yaml +1619 -0
- package/pro/squads/squad-creator-pro/workflows/wf-cross-provider-qualification.yaml +711 -0
- package/pro/squads/squad-creator-pro/workflows/wf-discover-tools.yaml +1439 -0
- package/pro/squads/squad-creator-pro/workflows/wf-extraction-pipeline.yaml +486 -0
- package/pro/squads/squad-creator-pro/workflows/wf-mind-research-loop.yaml +668 -0
- package/pro/squads/squad-creator-pro/workflows/wf-model-tier-qualification.yaml +800 -0
- package/pro/squads/squad-creator-pro/workflows/wf-optimize-squad.yaml +684 -0
- package/pro/squads/squad-creator-pro/workflows/wf-research-then-create-agent.yaml +921 -0
- package/pro/squads/squad-creator-pro/workflows/wf-squad-fusion.yaml +1684 -0
|
@@ -0,0 +1,243 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
create-agent-preflight.py - Deterministic preflight checks for create-agent task
|
|
4
|
+
|
|
5
|
+
Purpose: Execute all deterministic validations BEFORE LLM engagement
|
|
6
|
+
Usage: python3 create-agent-preflight.py --squad <squad_name> [--specialist <slug>] [--sources <path>] [--agent-name <name>] [--squads-path <dir>] [--format json|text]
|
|
7
|
+
|
|
8
|
+
Output: JSON with validation results
|
|
9
|
+
|
|
10
|
+
Deterministic checks (no LLM needed):
|
|
11
|
+
1. Squad exists at squads/{squad_name}/
|
|
12
|
+
2. Squad has config.yaml
|
|
13
|
+
3. Squad has agents/ directory
|
|
14
|
+
4. If specialist: check local sources exist
|
|
15
|
+
5. Count source files and lines
|
|
16
|
+
6. Validate naming conventions
|
|
17
|
+
"""
|
|
18
|
+
|
|
19
|
+
import argparse
|
|
20
|
+
import json
|
|
21
|
+
import os
|
|
22
|
+
import sys
|
|
23
|
+
from pathlib import Path
|
|
24
|
+
from datetime import datetime
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
def count_lines(file_path: Path) -> int:
    """Return the number of lines in ``file_path``.

    The file is read as UTF-8 with undecodable bytes ignored. Counting is
    best-effort: any error while opening or reading (missing file,
    directory, permission problem, ...) yields 0 instead of raising.
    """
    try:
        with open(file_path, 'r', encoding='utf-8', errors='ignore') as stream:
            line_total = 0
            for _line in stream:
                line_total += 1
            return line_total
    except Exception:
        # Deliberate best-effort: an unreadable source simply contributes nothing.
        return 0
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
def validate_squad(squad_name: str, squads_path: str = "squads") -> dict:
    """Validate that a squad exists and has the expected structure.

    Args:
        squad_name: Directory name of the squad under ``squads_path``.
        squads_path: Directory that contains all squads.

    Returns:
        dict with keys ``squad_name``, ``squad_path``, ``exists``,
        ``has_config``, ``has_agents_dir``, ``has_readme``, ``agent_count``
        and ``existing_agents`` (stems of ``agents/*.md``, sorted).
    """
    squad_path = Path(squads_path) / squad_name
    agents_dir = squad_path / "agents"

    result = {
        "squad_name": squad_name,
        "squad_path": str(squad_path),
        # A squad (and its agents/ folder) must be a directory; a stray file
        # with the same name must not pass the check.
        "exists": squad_path.is_dir(),
        "has_config": (squad_path / "config.yaml").exists(),
        "has_agents_dir": agents_dir.is_dir(),
        "has_readme": (squad_path / "README.md").exists(),
        "agent_count": 0,
        "existing_agents": []
    }

    if result["has_agents_dir"]:
        # glob() order depends on the filesystem; sort so the report is
        # reproducible between runs and machines.
        agents = sorted(agents_dir.glob("*.md"))
        result["agent_count"] = len(agents)
        result["existing_agents"] = [a.stem for a in agents]

    return result
|
|
57
|
+
|
|
58
|
+
|
|
59
|
+
def check_local_sources(specialist_slug: str, sources_path: str = None) -> dict:
    """Check local knowledge sources for a specialist.

    Searches ``sources_path`` (when given) followed by the default locations
    ``outputs/minds/<slug>/sources``, ``outputs/minds/<slug>/analysis`` and
    ``squads/*/minds/<slug>``, all relative to the current working directory,
    and counts the ``.md``/``.txt``/``.yaml``/``.json`` files found below them.

    Args:
        specialist_slug: Slug of the specialist whose sources are looked up.
        sources_path: Optional extra directory (or glob pattern) searched first.

    Returns:
        dict with ``specialist_slug``, ``sources_found``, ``total_files``,
        ``total_lines``, ``coverage_estimate`` (0/20/40/70/90, derived only
        from the total line count), ``paths_checked`` and ``files``.
    """
    from glob import glob

    # Default paths to search
    search_paths = [
        f"outputs/minds/{specialist_slug}/sources",
        f"outputs/minds/{specialist_slug}/analysis",
        f"squads/*/minds/{specialist_slug}",
    ]

    if sources_path:
        search_paths.insert(0, sources_path)

    result = {
        "specialist_slug": specialist_slug,
        "sources_found": False,
        "total_files": 0,
        "total_lines": 0,
        "coverage_estimate": 0,
        "paths_checked": [],
        "files": []
    }

    # Search paths may overlap (e.g. --sources pointing at a default location
    # or at a parent of one); remember what was counted so no file is
    # counted twice and the coverage estimate is not inflated.
    seen_files = set()

    for search_pattern in search_paths:
        # Handle glob patterns
        if "*" in search_pattern:
            paths_to_check = [Path(m) for m in sorted(glob(search_pattern))]
        else:
            paths_to_check = [Path(search_pattern)]

        for path in paths_to_check:
            result["paths_checked"].append(str(path))

            if not path.is_dir():
                continue

            result["sources_found"] = True

            for ext in ["*.md", "*.txt", "*.yaml", "*.json"]:
                # Sorted so the file list is stable across filesystems.
                for file in sorted(path.rglob(ext)):
                    # rglob also yields directories whose name matches.
                    if not file.is_file():
                        continue

                    identity = file.resolve()
                    if identity in seen_files:
                        continue
                    seen_files.add(identity)

                    lines = count_lines(file)
                    result["files"].append({
                        "path": str(file),
                        "lines": lines
                    })
                    result["total_files"] += 1
                    result["total_lines"] += lines

    # Estimate coverage based on lines
    if result["total_lines"] >= 5000:
        result["coverage_estimate"] = 90
    elif result["total_lines"] >= 2000:
        result["coverage_estimate"] = 70
    elif result["total_lines"] >= 500:
        result["coverage_estimate"] = 40
    elif result["total_lines"] > 0:
        result["coverage_estimate"] = 20

    return result
|
|
118
|
+
|
|
119
|
+
|
|
120
|
+
def validate_agent_name(name: str) -> dict:
    """Validate agent naming conventions.

    A name is valid when it is kebab-case (``my-agent``) or snake_case
    (``my_agent``): lowercase ASCII, starting with a letter.

    Args:
        name: Proposed agent name.

    Returns:
        dict with ``name``, ``is_kebab_case``, ``is_snake_case``, ``valid``
        and ``suggested``. ``suggested`` is a kebab-case alternative when the
        name is invalid and one can be derived, otherwise ``None``.
    """
    import re

    # kebab-case pattern
    kebab_pattern = r'[a-z][a-z0-9]*(-[a-z0-9]+)*'
    # snake_case pattern
    snake_pattern = r'[a-z][a-z0-9]*(_[a-z0-9]+)*'

    # fullmatch (not match + "$"): "$" also matches just before a trailing
    # newline, which would let "my-agent\n" through as a valid name.
    result = {
        "name": name,
        "is_kebab_case": bool(re.fullmatch(kebab_pattern, name)),
        "is_snake_case": bool(re.fullmatch(snake_pattern, name)),
        "valid": False,
        "suggested": None
    }

    result["valid"] = result["is_kebab_case"] or result["is_snake_case"]

    if not result["valid"]:
        # Try to generate a valid name
        candidate = re.sub(r'[^a-z0-9]+', '-', name.lower()).strip('-')
        # Only offer the candidate if it passes the same rule; inputs such as
        # "123" or "!!!" have no sensible kebab-case form.
        if re.fullmatch(kebab_pattern, candidate):
            result["suggested"] = candidate

    return result
|
|
147
|
+
|
|
148
|
+
|
|
149
|
+
def main():
    """CLI entry point: run the preflight checks and print a report.

    Parses the command line, runs the squad, source and agent-name
    validations, prints the result as JSON (default) or plain text, and
    exits with status 0 when the overall status is READY, 1 otherwise.
    A missing squad is the only blocker; everything else is reported as a
    warning plus, where applicable, a recommendation.
    """
    parser = argparse.ArgumentParser(description="Preflight checks for create-agent")
    parser.add_argument("--squad", help="Target squad name")
    parser.add_argument("--pack", dest="legacy_pack", help="Legacy alias for --squad")
    parser.add_argument("--specialist", help="Specialist slug (optional)")
    parser.add_argument("--sources", help="Custom sources path")
    parser.add_argument("--agent-name", help="Proposed agent name to validate")
    parser.add_argument("--squads-path", default="squads", help="Path to squads directory")
    parser.add_argument("--format", choices=["json", "text"], default="json")

    args = parser.parse_args()
    squad_name = args.squad or args.legacy_pack
    if not squad_name:
        parser.error("Missing required argument: --squad (or legacy --pack)")

    # Run validations
    squad_validation = validate_squad(squad_name, args.squads_path)
    result = {
        "timestamp": datetime.now().isoformat(),
        "squad_validation": squad_validation,
        # Legacy key kept as an alias of squad_validation for compatibility.
        "pack_validation": squad_validation,
        "sources_validation": None,
        "name_validation": None,
        "overall_status": "READY",
        "blockers": [],
        "warnings": [],
        "recommendations": []
    }

    # Check squad
    if not squad_validation["exists"]:
        # Report the path that was actually checked so the message stays
        # correct when --squads-path is not the default.
        result["blockers"].append(
            f"Squad '{squad_name}' does not exist at {squad_validation['squad_path']}/"
        )
        result["overall_status"] = "BLOCKED"
    else:
        if not squad_validation["has_config"]:
            result["warnings"].append("Squad missing config.yaml")
        if not squad_validation["has_agents_dir"]:
            result["warnings"].append("Squad missing agents/ directory")

    # Check sources if specialist provided
    if args.specialist:
        sources = check_local_sources(args.specialist, args.sources)
        result["sources_validation"] = sources

        if not sources["sources_found"]:
            result["warnings"].append(f"No local sources found for '{args.specialist}'")
            result["recommendations"].append("Run *auto-acquire-sources or provide sources manually")
        elif sources["coverage_estimate"] < 50:
            result["warnings"].append(f"Low source coverage ({sources['coverage_estimate']}%)")
            result["recommendations"].append("Consider gathering more sources before extraction")

    # Validate agent name if provided
    if args.agent_name:
        name_check = validate_agent_name(args.agent_name)
        result["name_validation"] = name_check

        if not name_check["valid"]:
            result["warnings"].append(f"Agent name '{args.agent_name}' doesn't follow conventions")
            if name_check["suggested"]:
                result["recommendations"].append(f"Suggested name: {name_check['suggested']}")
            else:
                # No usable suggestion could be derived (empty or None).
                result["recommendations"].append(
                    "Use a lowercase kebab-case name starting with a letter (e.g. my-agent)"
                )

    # Output
    if args.format == "json":
        print(json.dumps(result, indent=2))
    else:
        print("=== CREATE-AGENT PREFLIGHT ===")
        print(f"Status: {result['overall_status']}")
        print(f"\nSquad: {squad_name}")
        print(f" Exists: {'Yes' if squad_validation['exists'] else 'No'}")
        print(f" Agents: {squad_validation['agent_count']}")

        if result["sources_validation"]:
            print(f"\nSources for {args.specialist}:")
            print(f" Found: {'Yes' if result['sources_validation']['sources_found'] else 'No'}")
            print(f" Files: {result['sources_validation']['total_files']}")
            print(f" Lines: {result['sources_validation']['total_lines']}")
            print(f" Coverage: {result['sources_validation']['coverage_estimate']}%")

        if result["blockers"]:
            print("\nBLOCKERS:")
            for b in result["blockers"]:
                print(f" - {b}")

        if result["warnings"]:
            print("\nWARNINGS:")
            for w in result["warnings"]:
                print(f" - {w}")

        if result["recommendations"]:
            print("\nRECOMMENDATIONS:")
            for r in result["recommendations"]:
                print(f" - {r}")

    # Exit code based on status
    sys.exit(0 if result["overall_status"] == "READY" else 1)


if __name__ == "__main__":
    main()
|
|
@@ -0,0 +1,281 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
/**
|
|
3
|
+
* Cross-Provider Results Comparator
|
|
4
|
+
*
|
|
5
|
+
* Compara resultados de Opus (baseline) vs modelo candidato.
|
|
6
|
+
* Gera relatório de qualificação automático.
|
|
7
|
+
* Usa paths do squad-config.yaml (zero hardcoded paths).
|
|
8
|
+
*
|
|
9
|
+
* Usage:
|
|
10
|
+
* node compare-results.js --task extract-knowledge --baseline opus --candidate glm5
|
|
11
|
+
*/
|
|
12
|
+
|
|
13
|
+
const fs = require('fs');
|
|
14
|
+
const path = require('path');
|
|
15
|
+
|
|
16
|
+
// Load config (auto-detects project root)
|
|
17
|
+
const config = require('../lib/config-loader');
|
|
18
|
+
|
|
19
|
+
// Directories used by this script; values come from the loaded squad config.
const PATHS = { outputDir: config.paths.llmTests };
|
|
22
|
+
|
|
23
|
+
// ============================================================================
|
|
24
|
+
// RESULT LOADER
|
|
25
|
+
// ============================================================================
|
|
26
|
+
|
|
27
|
+
/**
 * Load the most recent run file for a task/model pair.
 *
 * Looks in `<outputDir>/<taskName>/<modelName>` for files named
 * `run-*.yaml` and picks the one that sorts last by file name.
 *
 * @param {string} taskName - Task directory name.
 * @param {string} modelName - Model directory name.
 * @returns {{file: string, content: string, parsed: object}|null}
 *   The chosen file name, its raw text and the parsed fields, or null when
 *   the directory does not exist or contains no run files.
 */
function loadLatestResult(taskName, modelName) {
  const resultDir = path.join(PATHS.outputDir, taskName, modelName);
  if (!fs.existsSync(resultDir)) {
    return null;
  }

  const runFiles = fs
    .readdirSync(resultDir)
    .filter((name) => name.startsWith('run-') && name.endsWith('.yaml'))
    .sort();
  if (runFiles.length === 0) {
    return null;
  }

  // Ascending sort: the last entry is the latest run.
  const latest = runFiles[runFiles.length - 1];
  const content = fs.readFileSync(path.join(resultDir, latest), 'utf-8');
  return { file: latest, content, parsed: parseYaml(content) };
}
|
|
44
|
+
|
|
45
|
+
/**
 * Extract the fields this tool needs from a run-result YAML document.
 *
 * This is a regex-based field extractor, not a YAML parser: it reads the
 * quoted `task`, `model` and `task_hash` values, the numeric
 * `latency_seconds`, `cost_usd`, `prompt` and `completion` values, and the
 * `output: |` block scalar, which is taken to run to the end of the document.
 *
 * @param {string} content - Raw text of the run file (LF or CRLF).
 * @returns {{task: (string|undefined), model: (string|undefined),
 *   task_hash: (string|undefined), latency: (number|null),
 *   cost: (number|null), tokens: {prompt: (number|null),
 *   completion: (number|null)}, output: (string|null)}}
 */
function parseYaml(content) {
  // Normalize line endings so the block-scalar match and the later line
  // counts also work for files written with CRLF.
  const text = content.replace(/\r\n/g, '\n');
  const result = {};

  result.task = text.match(/task: "([^"]+)"/)?.[1];
  result.model = text.match(/model: "([^"]+)"/)?.[1];
  result.task_hash = text.match(/task_hash: "([^"]+)"/)?.[1];

  const latencyMatch = text.match(/latency_seconds: ([\d.]+)/);
  const costMatch = text.match(/cost_usd: ([\d.]+)/);
  const promptTokens = text.match(/prompt: (\d+)/);
  const completionTokens = text.match(/completion: (\d+)/);

  result.latency = latencyMatch ? Number.parseFloat(latencyMatch[1]) : null;
  result.cost = costMatch ? Number.parseFloat(costMatch[1]) : null;
  result.tokens = {
    prompt: promptTokens ? Number.parseInt(promptTokens[1], 10) : null,
    completion: completionTokens ? Number.parseInt(completionTokens[1], 10) : null,
  };

  const outputMatch = text.match(/output: \|\n([\s\S]+)$/);
  if (outputMatch) {
    const block = outputMatch[1];
    // De-indent by the indentation of the first non-empty line, so nested
    // indentation inside the block is preserved whatever the writer's width.
    const indent = block.match(/^( *)\S/m)?.[1].length ?? 0;
    const dedented =
      indent > 0 ? block.replace(new RegExp(`^ {${indent}}`, 'gm'), '') : block;
    result.output = dedented.trim();
  } else {
    result.output = null;
  }

  return result;
}
|
|
73
|
+
|
|
74
|
+
// ============================================================================
|
|
75
|
+
// COMPARISON METRICS
|
|
76
|
+
// ============================================================================
|
|
77
|
+
|
|
78
|
+
/**
 * Ratio of candidate to baseline, or NaN when it cannot be computed.
 * NaN (rather than 0 or Infinity) makes every downstream threshold check
 * fail instead of silently passing on missing data.
 */
function safeRatio(candidateValue, baselineValue) {
  const usable =
    typeof candidateValue === 'number' &&
    typeof baselineValue === 'number' &&
    Number.isFinite(candidateValue) &&
    Number.isFinite(baselineValue) &&
    baselineValue > 0;
  return usable ? candidateValue / baselineValue : NaN;
}

/** Human-readable delta for a candidate/baseline ratio where lower is better. */
function describeDelta(ratio, betterLabel, worseLabel) {
  if (!Number.isFinite(ratio)) {
    return 'N/A';
  }
  const percent = (1 - ratio) * 100;
  return percent >= 0
    ? `${percent.toFixed(1)}% ${betterLabel}`
    : `${Math.abs(percent).toFixed(1)}% ${worseLabel}`;
}

/**
 * Compare the parsed results of a baseline and a candidate run.
 *
 * @param {object} baseline - Parsed baseline result (latency, cost, tokens, output).
 * @param {object} candidate - Parsed candidate result, same shape.
 * @returns {{latency: object, cost: object, tokens: object, content: object}}
 *   `latency` and `cost` carry both raw values, the candidate/baseline
 *   `ratio` (NaN when not computable) and a label (`improvement` / `savings`)
 *   such as "20.0% faster", "20.0% slower" or "N/A". `content` compares the
 *   number of output lines.
 */
function compare(baseline, candidate) {
  const latencyRatio = safeRatio(candidate.latency, baseline.latency);
  const costRatio = safeRatio(candidate.cost, baseline.cost);

  const metrics = {
    latency: {
      baseline: baseline.latency,
      candidate: candidate.latency,
      ratio: latencyRatio,
      improvement: describeDelta(latencyRatio, 'faster', 'slower'),
    },
    cost: {
      baseline: baseline.cost,
      candidate: candidate.cost,
      ratio: costRatio,
      savings: describeDelta(costRatio, 'cheaper', 'more expensive'),
    },
    tokens: {
      baseline: baseline.tokens,
      candidate: candidate.tokens,
    },
  };

  // A missing output counts as zero lines.
  const baselineLines = baseline.output?.split('\n').length || 0;
  const candidateLines = candidate.output?.split('\n').length || 0;

  metrics.content = {
    baseline_lines: baselineLines,
    candidate_lines: candidateLines,
    ratio: safeRatio(candidateLines, baselineLines),
  };

  return metrics;
}
|
|
109
|
+
|
|
110
|
+
// ============================================================================
|
|
111
|
+
// REPORT GENERATOR
|
|
112
|
+
// ============================================================================
|
|
113
|
+
|
|
114
|
+
/**
 * Render the Markdown qualification report for one baseline/candidate pair.
 *
 * @param {string} taskName - Task the runs belong to.
 * @param {object} baseline - Parsed baseline result (model, task_hash, latency, cost, output).
 * @param {object} candidate - Parsed candidate result, same shape.
 * @param {object} comparison - Metrics object with `latency`, `cost` and `content` entries.
 * @returns {string} Markdown report. Missing numbers are rendered as "N/A";
 *   raw outputs are truncated to 2000 characters each.
 */
function generateReport(taskName, baseline, candidate, comparison) {
  const timestamp = new Date().toISOString();

  // NOTE(review): the per-metric check mark uses 0.8 while the overall
  // recommendation uses 0.7 for output volume, so a ratio in between shows
  // a failing check mark yet can still be "LIKELY QUALIFIED". Confirm intent.
  const VOLUME_DISPLAY_THRESHOLD = 0.8;
  const VOLUME_QUALIFY_THRESHOLD = 0.7;

  const formatSeconds = (value) =>
    typeof value === 'number' ? `${value.toFixed(1)}s` : 'N/A';
  const formatUsd = (value) =>
    typeof value === 'number' ? `$${value.toFixed(4)}` : 'N/A';
  const formatPercent = (ratio) =>
    Number.isFinite(ratio) ? `${(ratio * 100).toFixed(0)}%` : 'N/A';
  const clip = (text) =>
    `${text?.slice(0, 2000) || 'N/A'}${text?.length > 2000 ? '\n... (truncated)' : ''}`;

  const volume = formatPercent(comparison.content.ratio);

  // Comparisons against NaN are false, so missing data never qualifies.
  const speedOK = comparison.latency.ratio < 1;
  const costOK = comparison.cost.ratio < 0.5;
  const sizeOK = comparison.content.ratio > VOLUME_QUALIFY_THRESHOLD;

  let report = `# Cross-Provider Qualification Report

**Task:** ${taskName}
**Baseline:** ${baseline.model} (hash: ${baseline.task_hash})
**Candidate:** ${candidate.model}
**Date:** ${timestamp.split('T')[0]}

---

## Performance Comparison

| Metric | ${baseline.model} | ${candidate.model} | Delta |
|--------|----------|-----------|-------|
| Latency | ${formatSeconds(baseline.latency)} | ${formatSeconds(candidate.latency)} | ${comparison.latency.improvement} |
| Cost | ${formatUsd(baseline.cost)} | ${formatUsd(candidate.cost)} | ${comparison.cost.savings} |
| Output Lines | ${comparison.content.baseline_lines} | ${comparison.content.candidate_lines} | ${volume} |

---

## Qualification Metrics

### Speed
- **${speedOK ? '✅' : '❌'} Latency:** ${comparison.latency.improvement}

### Cost
- **${costOK ? '✅' : '⚠️'} Savings:** ${comparison.cost.savings}

### Content Completeness
- **${comparison.content.ratio > VOLUME_DISPLAY_THRESHOLD ? '✅' : '❌'} Output Volume:** ${volume} of baseline

---

## Manual Review Required

- [ ] **Anti-Invention:** Zero unsourced claims?
- [ ] **Accuracy:** Citations correct?
- [ ] **Completeness:** All key items extracted?
- [ ] **Format:** Valid YAML/MD structure?
- [ ] **PT-BR Quality:** Natural Portuguese?

---

## Recommendation

`;

  if (speedOK && costOK && sizeOK) {
    report += `**LIKELY QUALIFIED** ✅

Candidate shows:
- ${comparison.latency.improvement}
- ${comparison.cost.savings}
- ${volume} output completeness

Proceed with manual quality review.`;
  } else {
    report += `**NEEDS REVIEW** ⚠️

Potential issues:
${!speedOK ? '- Slower than baseline\n' : ''}${!costOK ? '- Limited cost savings\n' : ''}${!sizeOK ? '- Significantly less output\n' : ''}
Review output quality before qualifying.`;
  }

  report += `

---

## Raw Outputs

### ${baseline.model} Output

\`\`\`yaml
${clip(baseline.output)}
\`\`\`

### ${candidate.model} Output

\`\`\`yaml
${clip(candidate.output)}
\`\`\`
`;

  return report;
}
|
|
205
|
+
|
|
206
|
+
// ============================================================================
|
|
207
|
+
// CLI
|
|
208
|
+
// ============================================================================
|
|
209
|
+
|
|
210
|
+
/**
 * CLI entry point.
 *
 * Reads `--task`, `--baseline` (default "opus") and `--candidate` from the
 * command line, loads the latest run of each model, writes
 * `qualification-report.md` into the candidate's result directory and
 * prints a short summary. Exits with status 1 on missing arguments or
 * missing results.
 */
async function main() {
  const args = process.argv.slice(2);

  if (args.includes('--help') || args.length === 0) {
    console.log(`
Cross-Provider Results Comparator

Usage:
node compare-results.js --task <name> --baseline <model> --candidate <model>

Options:
--task Task name
--baseline Baseline model (default: opus)
--candidate Candidate model (e.g., glm5)

Paths (from squad-config.yaml):
Output: ${PATHS.outputDir}

Example:
node compare-results.js --task extract-knowledge --candidate glm5
`);
    process.exit(0);
  }

  const getArg = (name, defaultValue = null) => {
    const idx = args.indexOf(`--${name}`);
    if (idx === -1) {
      return defaultValue;
    }
    const value = args[idx + 1];
    // A flag at the end of the line, or directly followed by another flag,
    // has no value; fail clearly instead of treating the next flag as one.
    if (value === undefined || value.startsWith('--')) {
      console.error(`❌ Missing value for --${name}. Use --help for usage.`);
      process.exit(1);
    }
    return value;
  };

  const taskName = getArg('task');
  const baselineModel = getArg('baseline', 'opus');
  const candidateModel = getArg('candidate');

  if (!taskName || !candidateModel) {
    console.error('❌ Missing required arguments. Use --help for usage.');
    process.exit(1);
  }

  console.log(`\n📊 Comparing ${taskName}: ${baselineModel} vs ${candidateModel}\n`);

  const baseline = loadLatestResult(taskName, baselineModel);
  const candidate = loadLatestResult(taskName, candidateModel);

  if (!baseline) {
    console.error(`❌ No baseline results found for ${taskName}/${baselineModel}`);
    process.exit(1);
  }

  if (!candidate) {
    console.error(`❌ No candidate results found for ${taskName}/${candidateModel}`);
    process.exit(1);
  }

  console.log(`✓ Loaded baseline: ${baseline.file}`);
  console.log(`✓ Loaded candidate: ${candidate.file}`);

  const comparison = compare(baseline.parsed, candidate.parsed);
  const report = generateReport(taskName, baseline.parsed, candidate.parsed, comparison);

  // The candidate directory exists at this point: a run file was just read from it.
  const reportPath = path.join(PATHS.outputDir, taskName, candidateModel, 'qualification-report.md');
  fs.writeFileSync(reportPath, report);

  const rule = '='.repeat(50);
  console.log(`\n📄 Report saved: ${reportPath}`);
  console.log(`\n${rule}`);
  console.log('Quick Summary:');
  console.log(rule);
  console.log(`Latency: ${comparison.latency.improvement}`);
  console.log(`Cost: ${comparison.cost.savings}`);
  console.log(`Output: ${(comparison.content.ratio * 100).toFixed(0)}% of baseline`);
}

// Surface unexpected failures (unreadable file, write error) with a clear
// message and a non-zero exit code instead of an unhandled rejection.
main().catch((err) => {
  console.error(`❌ ${err?.message ?? err}`);
  process.exit(1);
});
|