@event4u/agent-config 6.1.0 → 7.0.0
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/marketplace.json +35 -3
- package/AGENTS.md +8 -7
- package/CHANGELOG.md +408 -0
- package/CONTRIBUTING.md +1 -1
- package/README.md +17 -15
- package/dist/agent-src/commands/agent-status.md +2 -2
- package/dist/agent-src/commands/agents/audit.md +3 -3
- package/dist/agent-src/commands/agents/init.md +1 -1
- package/dist/agent-src/commands/agents/optimize.md +4 -4
- package/dist/agent-src/commands/analyze/decision.md +108 -0
- package/dist/agent-src/commands/analyze/incident.md +120 -0
- package/dist/agent-src/commands/analyze/near-miss.md +113 -0
- package/dist/agent-src/commands/analyze/postmortem.md +130 -0
- package/dist/agent-src/commands/analyze/premortem.md +104 -0
- package/dist/agent-src/commands/analyze.md +124 -0
- package/dist/agent-src/commands/brand/identity.md +27 -0
- package/dist/agent-src/commands/brand/review.md +27 -0
- package/dist/agent-src/commands/brand/strategy.md +27 -0
- package/dist/agent-src/commands/brand/tokens.md +28 -0
- package/dist/agent-src/commands/brand/voice.md +27 -0
- package/dist/agent-src/commands/brand.md +58 -0
- package/dist/agent-src/commands/check-current-md.md +3 -3
- package/dist/agent-src/commands/condense.md +2 -2
- package/dist/agent-src/commands/council/debate.md +2 -2
- package/dist/agent-src/commands/council/default.md +45 -18
- package/dist/agent-src/commands/fix/portability.md +3 -3
- package/dist/agent-src/commands/fix/refs.md +3 -3
- package/dist/agent-src/commands/implement-ticket.md +36 -6
- package/dist/agent-src/commands/knowledge/cross-repo.md +1 -1
- package/dist/agent-src/commands/memory/add.md +1 -1
- package/dist/agent-src/commands/mission/upgrade.md +182 -0
- package/dist/agent-src/commands/optimize/skills.md +2 -2
- package/dist/agent-src/commands/orchestrate.md +1 -1
- package/dist/agent-src/commands/pr/create.md +6 -4
- package/dist/agent-src/commands/review-changes.md +8 -0
- package/dist/agent-src/commands/roadmap/materialize.md +73 -0
- package/dist/agent-src/commands/skill/preview.md +1 -1
- package/dist/agent-src/commands/skills/discover.md +1 -1
- package/dist/agent-src/commands/threat-model.md +4 -4
- package/dist/agent-src/commands/upstream-contribute.md +3 -3
- package/dist/agent-src/commands/video/from-script.md +2 -2
- package/dist/agent-src/commands/video/from-song.md +3 -3
- package/dist/agent-src/commands/video/scene.md +1 -1
- package/dist/agent-src/commands/video/storyboard.md +1 -1
- package/dist/agent-src/commands/video.md +3 -3
- package/dist/agent-src/contexts/communication/rules-auto/source-of-truth-mechanics.md +3 -3
- package/dist/agent-src/contexts/communication/rules-auto/user-interaction-mechanics.md +1 -1
- package/dist/agent-src/contexts/execution/evidence-discipline.md +153 -0
- package/dist/agent-src/contexts/execution/project-intelligence.md +264 -0
- package/dist/agent-src/contexts/execution/roadmap-process-loop.md +2 -1
- package/dist/agent-src/personas/ai-video-technical-director.md +1 -1
- package/dist/agent-src/personas/brand-strategist.md +74 -0
- package/dist/agent-src/personas/design-director.md +74 -0
- package/dist/agent-src/rules/brand-consistency.md +77 -0
- package/dist/agent-src/rules/brand-source-of-truth.md +57 -0
- package/dist/agent-src/rules/direct-answers.md +2 -0
- package/dist/agent-src/rules/domain-safety-disclaimer.md +2 -0
- package/dist/agent-src/rules/git-history-discipline.md +1 -0
- package/dist/agent-src/rules/icon-consistency.md +53 -0
- package/dist/agent-src/rules/image-likeness-and-rights.md +67 -0
- package/dist/agent-src/rules/lethal-trifecta-guard.md +1 -1
- package/dist/agent-src/rules/persona-governance.md +2 -2
- package/dist/agent-src/rules/provider-lifecycle-discipline.md +3 -1
- package/dist/agent-src/rules/roadmap-progress-sync.md +10 -0
- package/dist/agent-src/rules/security-sensitive-stop.md +9 -3
- package/dist/agent-src/rules/size-enforcement.md +1 -1
- package/dist/agent-src/rules/source-confidentiality.md +3 -3
- package/dist/agent-src/rules/source-discovery-gate.md +98 -0
- package/dist/agent-src/rules/think-before-action.md +1 -0
- package/dist/agent-src/rules/ui-audit-gate.md +2 -0
- package/dist/agent-src/rules/untrusted-input-defense.md +1 -1
- package/dist/agent-src/rules/user-interaction.md +1 -1
- package/dist/agent-src/scripts/archive_completed_roadmaps.ts +392 -0
- package/dist/agent-src/scripts/update_roadmap_progress.ts +824 -0
- package/dist/agent-src/skills/adr-create/SKILL.md +5 -5
- package/dist/agent-src/skills/agent-security-review/evals/triggers.json +1 -0
- package/dist/agent-src/skills/agents-md-thin-root/SKILL.md +1 -1
- package/dist/agent-src/skills/ai-council/SKILL.md +1 -1
- package/dist/agent-src/skills/analysis-autonomous-mode/SKILL.md +9 -13
- package/dist/agent-src/skills/blade-ui/SKILL.md +12 -5
- package/dist/agent-src/skills/blameless-post-mortem/SKILL.md +199 -0
- package/dist/agent-src/skills/brand/ATTRIBUTION.md +38 -0
- package/dist/agent-src/skills/brand/SKILL.md +115 -0
- package/dist/agent-src/skills/brand/data/archetypes.csv +13 -0
- package/dist/agent-src/skills/brand/data/color-psychology.csv +14 -0
- package/dist/agent-src/skills/brand/data/logo-style-fit.csv +13 -0
- package/dist/agent-src/skills/brand/data/manifest.json +226 -0
- package/dist/agent-src/skills/brand/data/messaging-frameworks.csv +13 -0
- package/dist/agent-src/skills/brand/data/naming-patterns.csv +13 -0
- package/dist/agent-src/skills/brand/data/typography-principles.csv +13 -0
- package/dist/agent-src/skills/brand/data/voice-tone.csv +13 -0
- package/dist/agent-src/skills/brand/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-asset-generation/SKILL.md +89 -0
- package/dist/agent-src/skills/brand-asset-generation/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-audit/SKILL.md +67 -0
- package/dist/agent-src/skills/brand-audit/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-identity/SKILL.md +101 -0
- package/dist/agent-src/skills/brand-identity/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-strategy/SKILL.md +83 -0
- package/dist/agent-src/skills/brand-strategy/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-to-tokens/SKILL.md +102 -0
- package/dist/agent-src/skills/brand-to-tokens/evals/triggers.json +17 -0
- package/dist/agent-src/skills/brand-to-tokens/templates/marp-brand-deck.md.example +46 -0
- package/dist/agent-src/skills/brand-to-tokens/templates/reveal-brand-deck.yaml +32 -0
- package/dist/agent-src/skills/canvas-design/evals/triggers.json +1 -0
- package/dist/agent-src/skills/check-refs/SKILL.md +5 -5
- package/dist/agent-src/skills/code-review/SKILL.md +6 -15
- package/dist/agent-src/skills/command-writing/SKILL.md +2 -2
- package/dist/agent-src/skills/complexity-first-planning/evals/triggers.json +1 -0
- package/dist/agent-src/skills/context-authoring/SKILL.md +2 -2
- package/dist/agent-src/skills/context-document/SKILL.md +35 -2
- package/dist/agent-src/skills/corpus-grounding/evals/triggers.json +1 -0
- package/dist/agent-src/skills/corpus-grounding/scripts/bm25_search.ts +482 -0
- package/dist/agent-src/skills/corpus-grounding/scripts/decision_engine.ts +803 -0
- package/dist/agent-src/skills/corpus-grounding/scripts/ground.ts +541 -0
- package/dist/agent-src/skills/corpus-grounding/scripts/schema_validator.ts +309 -0
- package/dist/agent-src/skills/database/SKILL.md +26 -4
- package/dist/agent-src/skills/decision-record/SKILL.md +1 -1
- package/dist/agent-src/skills/decision-record/evals/triggers.json +17 -0
- package/dist/agent-src/skills/decision-review/SKILL.md +179 -0
- package/dist/agent-src/skills/description-assist/SKILL.md +1 -1
- package/dist/agent-src/skills/design-intelligence/SKILL.md +1 -1
- package/dist/agent-src/skills/design-intelligence/data/manifest.json +23 -6
- package/dist/agent-src/skills/design-intelligence/evals/triggers.json +1 -0
- package/dist/agent-src/skills/design-tokens/evals/triggers.json +1 -0
- package/dist/agent-src/skills/design-tokens/scripts/tokens.ts +888 -0
- package/dist/agent-src/skills/doc-coauthoring/evals/triggers.json +1 -0
- package/dist/agent-src/skills/eloquent/evals/triggers.json +1 -0
- package/dist/agent-src/skills/emit-tickets/SKILL.md +198 -0
- package/dist/agent-src/skills/estimate-ticket/evals/triggers.json +1 -0
- package/dist/agent-src/skills/git-workflow/SKILL.md +33 -0
- package/dist/agent-src/skills/guideline-writing/SKILL.md +2 -2
- package/dist/agent-src/skills/iconography/SKILL.md +88 -0
- package/dist/agent-src/skills/iconography/evals/triggers.json +17 -0
- package/dist/agent-src/skills/image-analyser/evals/triggers.json +1 -0
- package/dist/agent-src/skills/image-creator/evals/triggers.json +1 -0
- package/dist/agent-src/skills/image-editing/SKILL.md +100 -0
- package/dist/agent-src/skills/image-editing/evals/triggers.json +17 -0
- package/dist/agent-src/skills/image-generation/SKILL.md +95 -0
- package/dist/agent-src/skills/image-generation/evals/triggers.json +17 -0
- package/dist/agent-src/skills/image-provider-routing/SKILL.md +96 -0
- package/dist/agent-src/skills/image-provider-routing/evals/triggers.json +17 -0
- package/dist/agent-src/skills/launch-readiness/SKILL.md +21 -0
- package/dist/agent-src/skills/learning-to-rule-or-skill/SKILL.md +12 -8
- package/dist/agent-src/skills/lint-skills/SKILL.md +5 -5
- package/dist/agent-src/skills/logo-generation/SKILL.md +98 -0
- package/dist/agent-src/skills/logo-generation/evals/triggers.json +17 -0
- package/dist/agent-src/skills/markitdown/SKILL.md +1 -1
- package/dist/agent-src/skills/md-language-check/SKILL.md +1 -1
- package/dist/agent-src/skills/motion-choreographer/SKILL.md +1 -1
- package/dist/agent-src/skills/php-coder/evals/triggers.json +1 -0
- package/dist/agent-src/skills/prediction-pool-optimizer/evals/triggers.json +1 -0
- package/dist/agent-src/skills/premortem/SKILL.md +137 -0
- package/dist/agent-src/skills/prompt-engineering-image/SKILL.md +115 -0
- package/dist/agent-src/skills/prompt-engineering-image/evals/triggers.json +17 -0
- package/dist/agent-src/skills/prompt-validator/evals/triggers.json +1 -0
- package/dist/agent-src/skills/react-shadcn-ui/SKILL.md +12 -5
- package/dist/agent-src/skills/react-shadcn-ui/scripts/shadcn_add.ts +388 -0
- package/dist/agent-src/skills/reasoning-orchestrator/SKILL.md +1 -1
- package/dist/agent-src/skills/reasoning-orchestrator/evals/triggers.json +1 -0
- package/dist/agent-src/skills/refine-ticket/evals/triggers.json +1 -0
- package/dist/agent-src/skills/roadmap-management/SKILL.md +16 -3
- package/dist/agent-src/skills/roadmap-writing/SKILL.md +76 -0
- package/dist/agent-src/skills/root-cause-frameworks/SKILL.md +146 -0
- package/dist/agent-src/skills/rule-refactor/SKILL.md +9 -9
- package/dist/agent-src/skills/rule-writing/SKILL.md +7 -7
- package/dist/agent-src/skills/script-writing/SKILL.md +2 -2
- package/dist/agent-src/skills/security-audit/SKILL.md +5 -0
- package/dist/agent-src/skills/skill-improvement-pipeline/SKILL.md +19 -3
- package/dist/agent-src/skills/skill-management/SKILL.md +3 -3
- package/dist/agent-src/skills/skill-reviewer/SKILL.md +1 -1
- package/dist/agent-src/skills/skill-writing/SKILL.md +5 -5
- package/dist/agent-src/skills/skill-writing/evals/triggers.json +1 -0
- package/dist/agent-src/skills/source-discovery/SKILL.md +182 -0
- package/dist/agent-src/skills/standards-from-config/SKILL.md +93 -0
- package/dist/agent-src/skills/systematic-debugging/SKILL.md +7 -0
- package/dist/agent-src/skills/tailwind-engineer/scripts/tailwind_config_gen.ts +561 -0
- package/dist/agent-src/skills/threat-modeling/SKILL.md +1 -0
- package/dist/agent-src/skills/typography-system/SKILL.md +138 -0
- package/dist/agent-src/skills/typography-system/evals/triggers.json +17 -0
- package/dist/agent-src/skills/upstream-contribute/SKILL.md +3 -3
- package/dist/agent-src/skills/verify-repair-loop/SKILL.md +209 -0
- package/dist/agent-src/skills/verify-repair-loop/evals/output-schema.yml +20 -0
- package/dist/agent-src/skills/verify-repair-loop/evals/triggers.json +17 -0
- package/dist/agent-src/templates/agent-settings.md +7 -0
- package/dist/agent-src/templates/contexts/knowledge-card.md +69 -0
- package/dist/agent-src/templates/contexts/lesson-card.md +73 -0
- package/dist/agent-src/templates/roadmaps.md +29 -1
- package/dist/agent-src/templates/scripts/README.md +6 -6
- package/dist/agent-src/templates/scripts/check_memory.ts +640 -0
- package/dist/agent-src/templates/scripts/check_memory_proposal.ts +351 -0
- package/dist/agent-src/templates/scripts/implement_ticket/__main__.ts +27 -0
- package/dist/agent-src/templates/scripts/memory_hash.ts +333 -0
- package/dist/agent-src/templates/scripts/memory_lookup.ts +1067 -0
- package/dist/agent-src/templates/scripts/memory_report.ts +846 -0
- package/dist/agent-src/templates/scripts/memory_signal.ts +422 -0
- package/dist/agent-src/templates/scripts/memory_status.ts +191 -0
- package/dist/agent-src/templates/scripts/pr_review_routing.ts +523 -0
- package/dist/agent-src/templates/scripts/pr_risk_review.ts +0 -0
- package/dist/agent-src/templates/scripts/telemetry/aggregator.ts +0 -0
- package/dist/agent-src/templates/scripts/telemetry/boundary.ts +164 -0
- package/dist/agent-src/templates/scripts/telemetry/engagement.ts +479 -0
- package/dist/agent-src/templates/scripts/telemetry/report_renderer.ts +394 -0
- package/dist/agent-src/templates/scripts/telemetry/settings.ts +210 -0
- package/dist/agent-src/templates/scripts/telemetry_record.ts +255 -0
- package/dist/agent-src/templates/scripts/telemetry_report.ts +189 -0
- package/dist/agent-src/templates/scripts/telemetry_status.ts +312 -0
- package/dist/agent-src/templates/scripts/tier_usage_report.ts +597 -0
- package/dist/agent-src/templates/scripts/work_engine/__main__.ts +14 -0
- package/dist/agent-src/templates/scripts/work_engine/_lib/agent_settings.ts +1118 -0
- package/dist/agent-src/templates/scripts/work_engine/_lib/user_global_paths.ts +329 -0
- package/dist/agent-src/templates/scripts/work_engine/cli.ts +206 -0
- package/dist/agent-src/templates/scripts/work_engine/cli_args.ts +249 -0
- package/dist/agent-src/templates/scripts/work_engine/delivery_state.ts +225 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/analyze.ts +125 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/implement.ts +189 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/index.ts +94 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/memory.ts +193 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/plan.ts +267 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/refine.ts +518 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/report.ts +379 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/test.ts +268 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/verify.ts +258 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/index.ts +32 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/contract.ts +243 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/index.ts +108 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/stitch.ts +259 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/ui.ts +216 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/_passthrough.ts +40 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/app_spec.ts +241 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/apply.ts +216 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/audit.ts +506 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/design.ts +325 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/index.ts +102 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/polish.ts +462 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/review.ts +474 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/scaffold.ts +352 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/_skipped.ts +33 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/apply.ts +213 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/index.ts +111 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/refine.ts +126 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/report.ts +112 -0
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/test.ts +164 -0
- package/dist/agent-src/templates/scripts/work_engine/dispatcher.ts +515 -0
- package/dist/agent-src/templates/scripts/work_engine/emitters.ts +119 -0
- package/dist/agent-src/templates/scripts/work_engine/errors.ts +24 -0
- package/dist/agent-src/templates/scripts/work_engine/hook_bootstrap.ts +104 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/_chat_history_base.ts +176 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/chat_history_append.ts +41 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/chat_history_halt_append.ts +89 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/decision_gate.ts +193 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/decision_trace.ts +304 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/directive_set_guard.ts +110 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/halt_surface_audit.ts +118 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/index.ts +17 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/memory_visibility.ts +161 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/state_shape_validation.ts +45 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/trace.ts +134 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/context.ts +94 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/events.ts +58 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/exceptions.ts +85 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/index.ts +27 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/registry.ts +66 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/runner.ts +90 -0
- package/dist/agent-src/templates/scripts/work_engine/hooks/settings.ts +260 -0
- package/dist/agent-src/templates/scripts/work_engine/input_builders.ts +260 -0
- package/dist/agent-src/templates/scripts/work_engine/intent/classify.ts +466 -0
- package/dist/agent-src/templates/scripts/work_engine/migration/v0_to_v1.ts +531 -0
- package/dist/agent-src/templates/scripts/work_engine/orchestration.ts +366 -0
- package/dist/agent-src/templates/scripts/work_engine/persona_policy.ts +97 -0
- package/dist/agent-src/templates/scripts/work_engine/resolvers/diff.ts +135 -0
- package/dist/agent-src/templates/scripts/work_engine/resolvers/file.ts +175 -0
- package/dist/agent-src/templates/scripts/work_engine/resolvers/prompt.ts +115 -0
- package/dist/agent-src/templates/scripts/work_engine/scoring/confidence.ts +415 -0
- package/dist/agent-src/templates/scripts/work_engine/scoring/decision_engine.ts +466 -0
- package/dist/agent-src/templates/scripts/work_engine/scoring/decision_trace.ts +298 -0
- package/dist/agent-src/templates/scripts/work_engine/scoring/memory_visibility.ts +444 -0
- package/dist/agent-src/templates/scripts/work_engine/stack/detect.ts +252 -0
- package/dist/agent-src/templates/scripts/work_engine/stack/runner.ts +745 -0
- package/dist/agent-src/templates/scripts/work_engine/state.ts +1151 -0
- package/dist/agent-src/templates/scripts/work_engine/state_io.ts +413 -0
- package/dist/agent-src/templates/tickets.md +120 -0
- package/dist/cli/commands/commands.js +2 -2
- package/dist/cli/commands/commands.js.map +1 -1
- package/dist/cli/commands/doctorShell.js +4 -22
- package/dist/cli/commands/doctorShell.js.map +1 -1
- package/dist/cli/commands/packs.js +1 -1
- package/dist/cli/commands/packs.js.map +1 -1
- package/dist/cli/commands/recordTriggerEval.js +179 -0
- package/dist/cli/commands/recordTriggerEval.js.map +1 -0
- package/dist/cli/commands/recordTriggerEval.test.js +113 -0
- package/dist/cli/commands/recordTriggerEval.test.js.map +1 -0
- package/dist/cli/commands/workspaces.js +1 -1
- package/dist/cli/commands/workspaces.js.map +1 -1
- package/dist/cli/main.js +22 -1
- package/dist/cli/main.js.map +1 -1
- package/dist/cli/python/knowledge_ingest.js +1048 -0
- package/dist/cli/python/knowledge_ingest.js.map +1 -0
- package/dist/cli/python/workspace_analytics.js +1085 -0
- package/dist/cli/python/workspace_analytics.js.map +1 -0
- package/dist/cli/python/workspace_crypto.js +544 -0
- package/dist/cli/python/workspace_crypto.js.map +1 -0
- package/dist/cli/python/workspace_documents.js +1216 -0
- package/dist/cli/python/workspace_documents.js.map +1 -0
- package/dist/cli/python/workspace_drive.js +574 -0
- package/dist/cli/python/workspace_drive.js.map +1 -0
- package/dist/cli/python/workspace_drive_health.js +628 -0
- package/dist/cli/python/workspace_drive_health.js.map +1 -0
- package/dist/cli/python/workspace_explain.js +765 -0
- package/dist/cli/python/workspace_explain.js.map +1 -0
- package/dist/cli/python/workspace_hosts.js +349 -0
- package/dist/cli/python/workspace_hosts.js.map +1 -0
- package/dist/cli/python/workspace_inbox.js +692 -0
- package/dist/cli/python/workspace_inbox.js.map +1 -0
- package/dist/cli/python/workspace_render.js +816 -0
- package/dist/cli/python/workspace_render.js.map +1 -0
- package/dist/cli/python/workspace_roles.js +487 -0
- package/dist/cli/python/workspace_roles.js.map +1 -0
- package/dist/cli/python/workspace_secrets.js +180 -0
- package/dist/cli/python/workspace_secrets.js.map +1 -0
- package/dist/cli/python/workspace_sessions.js +1079 -0
- package/dist/cli/python/workspace_sessions.js.map +1 -0
- package/dist/cli/python/workspace_skills.js +417 -0
- package/dist/cli/python/workspace_skills.js.map +1 -0
- package/dist/cli/registry.js +2 -0
- package/dist/cli/registry.js.map +1 -1
- package/dist/discovery/deprecation-report.md +1 -1
- package/dist/discovery/discovery-manifest.json +1174 -123
- package/dist/discovery/discovery-manifest.json.sha256 +1 -1
- package/dist/discovery/discovery-manifest.summary.md +9 -6
- package/dist/discovery/orphan-report.md +1 -1
- package/dist/discovery/packs.json +163 -15
- package/dist/discovery/trust-report.md +4 -4
- package/dist/discovery/workspaces.json +73 -12
- package/dist/install/install.mjs +13934 -0
- package/dist/mcp/registry-manifest.json +4 -4
- package/dist/router.json +1 -1
- package/dist/server/routes/wizard.js +50 -21
- package/dist/server/routes/wizard.js.map +1 -1
- package/dist/server/routes/workspace.js +44 -25
- package/dist/server/routes/workspace.js.map +1 -1
- package/dist/server/schemas/settings.js +15 -0
- package/dist/server/schemas/settings.js.map +1 -1
- package/docs/SKILL_CENSUS.md +344 -0
- package/docs/architecture/augment-projection.md +1 -1
- package/docs/architecture/multi-tool-projection.md +3 -3
- package/docs/architecture.md +37 -6
- package/docs/benchmark.md +24 -27
- package/docs/capability-matrix.md +32 -0
- package/docs/catalog.md +50 -9
- package/docs/command-naming-audit.md +60 -0
- package/docs/contracts/STABILITY.md +32 -0
- package/docs/contracts/agents-md-tech-stack.md +1 -1
- package/docs/contracts/ai-council-config.md +22 -22
- package/docs/contracts/analysis-memory-loop.md +149 -0
- package/docs/contracts/benchmark-ab-contract.md +3 -3
- package/docs/contracts/branch-protection-policy.md +27 -0
- package/docs/contracts/brand-token-consumption.md +69 -0
- package/docs/contracts/command-clusters.md +2 -1
- package/docs/contracts/command-surface-tiers.md +13 -0
- package/docs/contracts/discovery-manifest.schema.json +24 -5
- package/docs/contracts/implement-ticket-flow.md +9 -9
- package/docs/contracts/install-layout.md +249 -0
- package/docs/contracts/kernel-membership.md +1 -1
- package/docs/contracts/linear-ai-rules-inclusion.md +2 -2
- package/docs/contracts/linter-structural-model.md +1 -1
- package/docs/contracts/mcp-discovery-phase-notice.md +1 -1
- package/docs/contracts/multi-tool-projection-fidelity.md +1 -1
- package/docs/contracts/namespace.md +2 -2
- package/docs/contracts/no-runtime-boundary.md +56 -0
- package/docs/contracts/package-self-orientation.md +24 -0
- package/docs/contracts/provider-lifecycle.md +3 -3
- package/docs/contracts/reasoning-discipline-protocol.md +83 -0
- package/docs/contracts/rule-classification.md +3 -3
- package/docs/contracts/skill-domains.md +1 -1
- package/docs/contracts/smoke-contracts.md +1 -1
- package/docs/contracts/surface-tiers.md +81 -0
- package/docs/contracts/ticket-bundle-format.md +228 -0
- package/docs/cookbook.md +152 -0
- package/docs/customization.md +12 -1
- package/docs/decisions/ADR-013-discovery-frontmatter-contract.md +16 -0
- package/docs/decisions/ADR-056-unvalidated-video-adapters-disposition.md +1 -1
- package/docs/decisions/ADR-059-render-resume-filesystem-as-state.md +1 -1
- package/docs/decisions/ADR-060-comfyui-sandbox-model.md +1 -1
- package/docs/decisions/ADR-061-corpus-grounding-layer.md +48 -1
- package/docs/decisions/ADR-096-analysis-workbench.md +110 -0
- package/docs/decisions/ADR-097-mission-recipe-privilege-boundary.md +121 -0
- package/docs/decisions/ADR-098-evidence-first-structure-discovery.md +154 -0
- package/docs/decisions/ADR-099-file-first-pattern-library.md +87 -0
- package/docs/decisions/ADR-100-global-knowledge-card-sharing.md +133 -0
- package/docs/decisions/ADR-101-ticket-bundle-emission.md +109 -0
- package/docs/decisions/ADR-102-ticket-handoff-paste-and-mcp.md +72 -0
- package/docs/decisions/ADR-103-global-knowledge-default-off-until-measured.md +92 -0
- package/docs/decisions/ADR-200-python-to-typescript-migration.md +193 -0
- package/docs/decisions/INDEX.md +9 -0
- package/docs/distribution/mcp-submission-checklist.md +3 -3
- package/docs/featured-commands.md +1 -1
- package/docs/featured-skills.md +1 -1
- package/docs/getting-started-by-role.md +2 -0
- package/docs/getting-started.md +2 -2
- package/docs/guidelines/agent-infra/failure-signatures.md +35 -0
- package/docs/guidelines/agent-infra/frontier-reasoning-operating-profile.md +5 -0
- package/docs/guidelines/agent-infra/size-and-scope.md +17 -0
- package/docs/guidelines/agent-infra/skill-quality-checklist.md +2 -2
- package/docs/guides/frontend-design-corpus-refresh.md +83 -0
- package/docs/guides/skill-preview.md +1 -1
- package/docs/hook-payload-capture.md +4 -4
- package/docs/mcp.md +1 -1
- package/docs/migration/consumer-template-consumption-model.md +145 -0
- package/docs/migration/divergences/README.md +55 -0
- package/docs/migration/divergences/_template.md +50 -0
- package/docs/migration/divergences/bench-stats-float-precision.md +72 -0
- package/docs/migration/divergences/mcp-telemetry-node-sqlite.md +61 -0
- package/docs/migration/divergences/pack-mcp-content-gzip-body.md +53 -0
- package/docs/migration/divergences/src-scripts-build_cloud_bundle.md +63 -0
- package/docs/migration/divergences/src-scripts-check_memory.md +91 -0
- package/docs/migration/divergences/src-scripts-inventory_abstraction_budget.md +65 -0
- package/docs/migration/divergences/src-scripts-lint_marketplace.md +57 -0
- package/docs/migration/divergences/src-scripts-lint_mcp_registry_manifest.md +70 -0
- package/docs/migration/divergences/src-scripts-spotcheck_thin_root.md +60 -0
- package/docs/migration/divergences/src-scripts-validate_agent_settings.md +58 -0
- package/docs/migration/node-floor.md +86 -0
- package/docs/migration/yaml-roundtrip-spike.md +163 -0
- package/docs/personas.md +6 -1
- package/docs/role-experiences.md +19 -0
- package/docs/setup/per-ide/windsurf.md +1 -1
- package/docs/skills-catalog.md +24 -3
- package/docs/threat-model.md +28 -0
- package/llms.txt +23 -2
- package/package.json +10 -15
- package/src/config/agent-settings.template.yml +64 -1
- package/src/config/discovery/packs.yml +31 -0
- package/src/config/discovery/unassigned-artefacts.yml +6 -0
- package/src/config/discovery/workspaces.yml +2 -2
- package/src/config/gitignore-block.txt +7 -0
- package/src/scripts/_cli/cmd_doctor.ts +2306 -0
- package/src/scripts/_cli/cmd_explain.ts +748 -0
- package/src/scripts/_cli/cmd_export.ts +375 -0
- package/src/scripts/_cli/cmd_migrate.ts +951 -0
- package/src/scripts/_cli/cmd_prune.ts +610 -0
- package/src/scripts/_cli/cmd_refresh.ts +530 -0
- package/src/scripts/_cli/cmd_settings_check.ts +407 -0
- package/src/scripts/_cli/cmd_settings_migrate.ts +344 -0
- package/src/scripts/_cli/cmd_sync.ts +381 -0
- package/src/scripts/_cli/cmd_uninstall.ts +833 -0
- package/src/scripts/_cli/cmd_update.ts +585 -0
- package/src/scripts/_cli/cmd_upgrade.ts +390 -0
- package/src/scripts/_cli/cmd_validate.ts +394 -0
- package/src/scripts/_cli/cmd_versions.ts +492 -0
- package/src/scripts/_cli/explain_last/assumptions.ts +114 -0
- package/src/scripts/_cli/explain_last/council.ts +197 -0
- package/src/scripts/_cli/explain_last/halt.ts +73 -0
- package/src/scripts/_cli/explain_last/index.ts +155 -0
- package/src/scripts/_cli/explain_last/inputs.ts +211 -0
- package/src/scripts/_cli/explain_last/memory.ts +231 -0
- package/src/scripts/_cli/explain_last/provider.ts +82 -0
- package/src/scripts/_cli/explain_last/render.ts +54 -0
- package/src/scripts/_cli/explain_last/route.ts +70 -0
- package/src/scripts/_cli/explain_last/scrubber.ts +138 -0
- package/src/scripts/_cli/explain_last/sections/assumptions.ts +51 -0
- package/src/scripts/_cli/explain_last/sections/council.ts +56 -0
- package/src/scripts/_cli/explain_last/sections/halt.ts +60 -0
- package/src/scripts/_cli/explain_last/sections/header.ts +50 -0
- package/src/scripts/_cli/explain_last/sections/index.ts +21 -0
- package/src/scripts/_cli/explain_last/sections/inputs.ts +63 -0
- package/src/scripts/_cli/explain_last/sections/memory.ts +124 -0
- package/src/scripts/_cli/explain_last/sections/pack.ts +42 -0
- package/src/scripts/_cli/explain_last/sections/provider.ts +51 -0
- package/src/scripts/_cli/explain_last/sections/route.ts +48 -0
- package/src/scripts/_cli/explain_last/state_loader.ts +119 -0
- package/src/scripts/_dispatch.bash +179 -163
- package/src/scripts/_lib/agent_settings.ts +1123 -0
- package/src/scripts/_lib/agent_src.ts +654 -0
- package/src/scripts/_lib/agents_overlay.ts +183 -0
- package/src/scripts/_lib/bench_ab_cache.ts +399 -0
- package/src/scripts/_lib/bench_ab_scoring.ts +352 -0
- package/src/scripts/_lib/bench_ab_scoring_v2.ts +751 -0
- package/src/scripts/_lib/bench_cost.ts +396 -0
- package/src/scripts/_lib/bench_quality.ts +237 -0
- package/src/scripts/_lib/bench_report.ts +255 -0
- package/src/scripts/_lib/bench_telegraph.ts +516 -0
- package/src/scripts/_lib/bench_telegraph_report.ts +272 -0
- package/src/scripts/_lib/changelog_eras.ts +398 -0
- package/src/scripts/_lib/claude_desktop_bundler.ts +324 -0
- package/src/scripts/_lib/cli_wrapper.ts +89 -0
- package/src/scripts/_lib/fs_atomic.ts +172 -0
- package/src/scripts/_lib/global_deploy_inventory.ts +639 -0
- package/src/scripts/_lib/install_layout.ts +87 -0
- package/src/scripts/_lib/install_regenerator.ts +157 -0
- package/src/scripts/_lib/installed_lock.ts +451 -0
- package/src/scripts/_lib/installed_tools.ts +518 -0
- package/src/scripts/_lib/json_pointers.ts +388 -0
- package/src/scripts/_lib/knowledge_global.ts +770 -0
- package/src/scripts/_lib/knowledge_global_promote.ts +453 -0
- package/src/scripts/_lib/knowledge_global_redaction.ts +448 -0
- package/src/scripts/_lib/link_crypto.ts +325 -0
- package/src/scripts/_lib/linked_projects.ts +613 -0
- package/src/scripts/_lib/model_tier.ts +65 -0
- package/src/scripts/_lib/module_detection.ts +275 -0
- package/src/scripts/_lib/node_sqlite.d.ts +32 -0
- package/src/scripts/_lib/pin_resolver.ts +264 -0
- package/src/scripts/_lib/py_random.ts +212 -0
- package/src/scripts/_lib/script_output.ts +147 -0
- package/src/scripts/_lib/security_lint.ts +623 -0
- package/src/scripts/_lib/surface_tiers.ts +127 -0
- package/src/scripts/_lib/token_count.ts +126 -0
- package/src/scripts/_lib/update_check.ts +297 -0
- package/src/scripts/_lib/user_global_paths.ts +329 -0
- package/src/scripts/_lib/value_ladder.ts +882 -0
- package/src/scripts/_lib/value_report.ts +617 -0
- package/src/scripts/_lib/zip_min.ts +175 -0
- package/src/scripts/adoption_report.ts +357 -0
- package/src/scripts/adoption_snapshot.ts +392 -0
- package/src/scripts/adoption_status.ts +424 -0
- package/src/scripts/adr/regenerate_index.ts +257 -0
- package/src/scripts/ai-image/adapters/flux.sh +45 -0
- package/src/scripts/ai-image/adapters/gemini-image.sh +45 -0
- package/src/scripts/ai-image/adapters/ideogram.sh +45 -0
- package/src/scripts/ai-image/adapters/recraft.sh +47 -0
- package/src/scripts/ai-video/adapters/comfyui.sh +3 -3
- package/src/scripts/ai-video/adapters/fal.sh +3 -3
- package/src/scripts/ai-video/adapters/gemini-veo.sh +3 -3
- package/src/scripts/ai-video/adapters/higgsfield.sh +3 -3
- package/src/scripts/ai-video/adapters/kling.sh +3 -3
- package/src/scripts/ai-video/adapters/musetalk.sh +2 -2
- package/src/scripts/ai-video/adapters/openai-images.sh +3 -3
- package/src/scripts/ai-video/adapters/replicate.sh +3 -3
- package/src/scripts/ai-video/adapters/sora.sh +3 -3
- package/src/scripts/ai-video/adapters/syncso.sh +3 -3
- package/src/scripts/ai-video/audio-adapters/allin1.sh +2 -2
- package/src/scripts/ai-video/audio-adapters/whisperx.sh +2 -2
- package/src/scripts/ai-video/lib/audio-adapter-contract.md +1 -1
- package/src/scripts/ai-video/lib/embed-provenance.sh +2 -2
- package/src/scripts/ai-video/lib/ingest-song.sh +2 -2
- package/src/scripts/ai-video/lib/parse-blueprint.sh +1 -1
- package/src/scripts/ai-video/lib/resume-scan.sh +2 -2
- package/src/scripts/ai-video/smoke-trace.sh +16 -7
- package/src/scripts/ai-video/stitch.sh +2 -2
- package/src/scripts/ai_council/_default_prices.ts +73 -0
- package/src/scripts/ai_council/advisors.ts +244 -0
- package/src/scripts/ai_council/airgap.ts +249 -0
- package/src/scripts/ai_council/budget_guard.ts +492 -0
- package/src/scripts/ai_council/bundler.ts +376 -0
- package/src/scripts/ai_council/cli_hints.ts +120 -0
- package/src/scripts/ai_council/clients.ts +2214 -0
- package/src/scripts/ai_council/compile_corpus.ts +681 -0
- package/src/scripts/ai_council/confidence_gate.ts +230 -0
- package/src/scripts/ai_council/config.ts +1729 -0
- package/src/scripts/ai_council/consensus.ts +551 -0
- package/src/scripts/ai_council/events_log.ts +327 -0
- package/src/scripts/ai_council/learn_low_impact_preview.ts +317 -0
- package/src/scripts/ai_council/low_impact.ts +1069 -0
- package/src/scripts/ai_council/low_impact_corpus.ts +662 -0
- package/src/scripts/ai_council/low_impact_intake.ts +222 -0
- package/src/scripts/ai_council/modes.ts +169 -0
- package/src/scripts/ai_council/necessity.ts +933 -0
- package/src/scripts/ai_council/orchestrator.ts +1689 -0
- package/src/scripts/ai_council/pricing.ts +267 -0
- package/src/scripts/ai_council/probation_gate.ts +282 -0
- package/src/scripts/ai_council/project_context.ts +308 -0
- package/src/scripts/ai_council/prompts.ts +600 -0
- package/src/scripts/ai_council/redact_low_impact_entry.ts +291 -0
- package/src/scripts/ai_council/replay.ts +314 -0
- package/src/scripts/ai_council/session.ts +558 -0
- package/src/scripts/ai_council/shadow_dispatch.ts +509 -0
- package/src/scripts/ai_council/solo_dispatch.ts +281 -0
- package/src/scripts/analysis_freshness.ts +343 -0
- package/src/scripts/annotate_discovery.ts +288 -0
- package/src/scripts/apply_modules_config.ts +537 -0
- package/src/scripts/audit_adr_coverage.ts +357 -0
- package/src/scripts/audit_auto_rules.ts +415 -0
- package/src/scripts/audit_cloud_compatibility.ts +608 -0
- package/src/scripts/audit_command_surface.ts +1227 -0
- package/src/scripts/audit_initial_context.ts +694 -0
- package/src/scripts/audit_likelihood.ts +434 -0
- package/src/scripts/audit_mcp_tools.ts +252 -0
- package/src/scripts/audit_overlap.ts +421 -0
- package/src/scripts/audit_skill_descriptions.ts +402 -0
- package/src/scripts/audit_skill_overlap.ts +576 -0
- package/src/scripts/audit_user_type_axis.ts +264 -0
- package/src/scripts/backfill_model_tier.ts +349 -0
- package/src/scripts/bench_ab_cache_dispatch.ts +126 -0
- package/src/scripts/bench_ab_clone.ts +610 -0
- package/src/scripts/bench_ab_diff.ts +609 -0
- package/src/scripts/bench_ab_integrity.ts +261 -0
- package/src/scripts/bench_ab_run.ts +417 -0
- package/src/scripts/bench_ab_task_runner.ts +1382 -0
- package/src/scripts/bench_ab_tracka_run.ts +436 -0
- package/src/scripts/bench_ab_v2_run.ts +585 -0
- package/src/scripts/bench_ab_v2_stats.ts +1018 -0
- package/src/scripts/bench_baseline_ready.ts +326 -0
- package/src/scripts/bench_condense_memory.ts +479 -0
- package/src/scripts/bench_drift_check.ts +503 -0
- package/src/scripts/bench_per_tool.ts +591 -0
- package/src/scripts/bench_rtk_savings.ts +710 -0
- package/src/scripts/bench_run.ts +509 -0
- package/src/scripts/bench_runner.ts +519 -0
- package/src/scripts/build_cloud_bundle.ts +692 -0
- package/src/scripts/build_discovery_manifest.ts +1371 -0
- package/src/scripts/build_linear_digest.ts +368 -0
- package/src/scripts/build_mcp_registry_manifest.ts +351 -0
- package/src/scripts/build_rule_trigger_matrix.ts +469 -0
- package/src/scripts/capture_showcase_session.ts +735 -0
- package/src/scripts/chat_history.ts +2301 -0
- package/src/scripts/check_always_budget.ts +694 -0
- package/src/scripts/check_artefact_checksums.ts +281 -0
- package/src/scripts/check_augment_description_cap.ts +133 -0
- package/src/scripts/check_augmentignore.ts +108 -0
- package/src/scripts/check_beta_review_markers.ts +234 -0
- package/src/scripts/check_bite_sized_granularity.ts +116 -0
- package/src/scripts/check_cluster_patterns.ts +285 -0
- package/src/scripts/check_command_count_messaging.ts +224 -0
- package/src/scripts/check_condensation.ts +900 -0
- package/src/scripts/check_condensed_paths.ts +414 -0
- package/src/scripts/check_context_paths.ts +388 -0
- package/src/scripts/check_council_config_location.ts +260 -0
- package/src/scripts/check_council_layout.ts +180 -0
- package/src/scripts/check_council_references.ts +345 -0
- package/src/scripts/check_discovery_determinism.ts +124 -0
- package/src/scripts/check_gate_paths.ts +230 -0
- package/src/scripts/check_iron_law_prominence.ts +298 -0
- package/src/scripts/check_kernel_rule_bundle.ts +242 -0
- package/src/scripts/check_knowledge_cards.ts +759 -0
- package/src/scripts/check_md_language.ts +291 -0
- package/src/scripts/check_memory.ts +845 -0
- package/src/scripts/check_memory_proposal.ts +351 -0
- package/src/scripts/check_module_management_neutral.ts +238 -0
- package/src/scripts/check_no_conflict_markers.ts +298 -0
- package/src/scripts/check_no_conflict_markers_allowlist.json +4 -0
- package/src/scripts/check_no_external_sources.ts +351 -0
- package/src/scripts/check_no_local_settings_committed.ts +69 -0
- package/src/scripts/check_no_new_legacy_path.ts +188 -0
- package/src/scripts/check_no_roadmap_refs.ts +304 -0
- package/src/scripts/check_one_off_location.ts +165 -0
- package/src/scripts/check_overlay_cascade_subdirs.ts +188 -0
- package/src/scripts/check_portability.ts +860 -0
- package/src/scripts/check_proposal.ts +0 -0
- package/src/scripts/check_public_catalog_links.ts +204 -0
- package/src/scripts/check_public_links.ts +357 -0
- package/src/scripts/check_references.ts +963 -0
- package/src/scripts/check_release_includes_discovery.ts +94 -0
- package/src/scripts/check_release_pr_shape.ts +222 -0
- package/src/scripts/check_release_published.ts +235 -0
- package/src/scripts/check_release_trunk_sync.ts +203 -0
- package/src/scripts/check_reply_consistency.ts +359 -0
- package/src/scripts/check_roadmap_trackable.ts +268 -0
- package/src/scripts/check_role_doc_links.ts +187 -0
- package/src/scripts/check_safety_floor_untouched.ts +160 -0
- package/src/scripts/check_skill_requires.ts +205 -0
- package/src/scripts/check_structural_breaking.ts +170 -0
- package/src/scripts/check_surface_tiers.ts +567 -0
- package/src/scripts/check_template_pin_drift.ts +222 -0
- package/src/scripts/check_test_coverage_diff.ts +235 -0
- package/src/scripts/check_token_optimizer_freshness.ts +183 -0
- package/src/scripts/check_trigger_evals.ts +375 -0
- package/src/scripts/check_update_banner.ts +143 -0
- package/src/scripts/ci_status.ts +0 -0
- package/src/scripts/ci_summary.ts +235 -0
- package/src/scripts/ci_time_ratio.ts +526 -0
- package/src/scripts/command_suggester/cooldown.ts +176 -0
- package/src/scripts/command_suggester/index.ts +41 -0
- package/src/scripts/command_suggester/loader.ts +205 -0
- package/src/scripts/command_suggester/match.ts +294 -0
- package/src/scripts/command_suggester/rank.ts +201 -0
- package/src/scripts/command_suggester/render.ts +122 -0
- package/src/scripts/command_suggester/sanitize.ts +114 -0
- package/src/scripts/command_suggester/settings.ts +186 -0
- package/src/scripts/command_suggester/types.ts +0 -0
- package/src/scripts/compile_router.ts +297 -0
- package/src/scripts/condense.sh +7 -1
- package/src/scripts/condense.ts +2035 -0
- package/src/scripts/condense_memory.ts +334 -0
- package/src/scripts/config/index.ts +15 -0
- package/src/scripts/config/packs.ts +310 -0
- package/src/scripts/config/presets.ts +369 -0
- package/src/scripts/config/profile_explain.ts +114 -0
- package/src/scripts/config/profiles.ts +277 -0
- package/src/scripts/config/session_profiles.ts +1064 -0
- package/src/scripts/context_hygiene_hook.ts +272 -0
- package/src/scripts/cost_by_conversation.ts +444 -0
- package/src/scripts/cost_summary.ts +407 -0
- package/src/scripts/council_cli.ts +2827 -0
- package/src/scripts/council_prune.ts +153 -0
- package/src/scripts/cross_repo_retrieve.ts +694 -0
- package/src/scripts/discovery_stats.ts +218 -0
- package/src/scripts/evidence_report.ts +580 -0
- package/src/scripts/external_sources_denylist.json +1 -0
- package/src/scripts/extract_audit_patterns.ts +394 -0
- package/src/scripts/first_run_gate_hook.ts +246 -0
- package/src/scripts/gen_discovery_baseline.ts +297 -0
- package/src/scripts/generate_capabilities_index.ts +496 -0
- package/src/scripts/generate_capability_matrix.ts +430 -0
- package/src/scripts/generate_catalog.ts +178 -0
- package/src/scripts/generate_command_flows.ts +316 -0
- package/src/scripts/generate_cookbook.ts +302 -0
- package/src/scripts/generate_index.ts +500 -0
- package/src/scripts/generate_ownership_matrix.ts +646 -0
- package/src/scripts/generate_pack_manifests.ts +1025 -0
- package/src/scripts/generate_role_experiences_catalog.ts +265 -0
- package/src/scripts/hermetic-install.sh +22 -11
- package/src/scripts/hook_manifest.yaml +24 -10
- package/src/scripts/hooks/augment-chat-history.sh +3 -10
- package/src/scripts/hooks/augment-context-hygiene.sh +3 -10
- package/src/scripts/hooks/augment-dispatcher.sh +3 -10
- package/src/scripts/hooks/augment-onboarding-gate.sh +3 -10
- package/src/scripts/hooks/augment-roadmap-progress.sh +3 -10
- package/src/scripts/hooks/block_no_verify.ts +413 -0
- package/src/scripts/hooks/cline-dispatcher.sh +3 -10
- package/src/scripts/hooks/cowork-dispatcher.sh +3 -14
- package/src/scripts/hooks/cursor-dispatcher.sh +3 -10
- package/src/scripts/hooks/dispatch_hook.ts +851 -0
- package/src/scripts/hooks/dispatch_issues.ts +226 -0
- package/src/scripts/hooks/envelope.ts +140 -0
- package/src/scripts/hooks/gemini-dispatcher.sh +3 -8
- package/src/scripts/hooks/replay_hook.ts +364 -0
- package/src/scripts/hooks/state_io.ts +293 -0
- package/src/scripts/hooks/windsurf-dispatcher.sh +3 -9
- package/src/scripts/hooks_doctor.ts +418 -0
- package/src/scripts/hooks_status.ts +292 -0
- package/src/scripts/injection_scan_hook.ts +285 -0
- package/src/scripts/install +36 -22
- package/src/scripts/install-hooks.sh +20 -14
- package/src/scripts/install.sh +38 -14
- package/src/scripts/install.ts +4515 -0
- package/src/scripts/inventory_abstraction_budget.ts +1104 -0
- package/src/scripts/inventory_frontmatter.ts +320 -0
- package/src/scripts/inventory_meta_layers.ts +516 -0
- package/src/scripts/iron_law_sha.ts +233 -0
- package/src/scripts/knowledge_global_cli.ts +1105 -0
- package/src/scripts/linked_projects_list.ts +310 -0
- package/src/scripts/lint_agent_security.ts +224 -0
- package/src/scripts/lint_agent_skill_names.ts +241 -0
- package/src/scripts/lint_agents_layout.ts +205 -0
- package/src/scripts/lint_agents_md.ts +294 -0
- package/src/scripts/lint_archived_skills.ts +309 -0
- package/src/scripts/lint_artefact_frontmatter.ts +359 -0
- package/src/scripts/lint_bench_ab.ts +319 -0
- package/src/scripts/lint_bench_corpus.ts +421 -0
- package/src/scripts/lint_command_flow_coverage.ts +231 -0
- package/src/scripts/lint_command_routing.ts +377 -0
- package/src/scripts/lint_command_tiers.ts +345 -0
- package/src/scripts/lint_command_verbs.ts +379 -0
- package/src/scripts/lint_commit_subjects.ts +243 -0
- package/src/scripts/lint_context_spine_usage.ts +198 -0
- package/src/scripts/lint_discovery_manifest.ts +540 -0
- package/src/scripts/lint_discovery_vocabulary.ts +393 -0
- package/src/scripts/lint_empty_roadmaps.ts +147 -0
- package/src/scripts/lint_eval_freshness.ts +335 -0
- package/src/scripts/lint_examples.ts +183 -0
- package/src/scripts/lint_explain_trace.ts +381 -0
- package/src/scripts/lint_featured_skills.ts +0 -0
- package/src/scripts/lint_flows.ts +701 -0
- package/src/scripts/lint_framework_leakage.ts +497 -0
- package/src/scripts/lint_framework_leakage_allowlist.json +8 -1
- package/src/scripts/lint_frontmatter_boilerplate.ts +356 -0
- package/src/scripts/lint_ghostwriter_source.ts +389 -0
- package/src/scripts/lint_global_paths.ts +420 -0
- package/src/scripts/lint_handoffs.ts +362 -0
- package/src/scripts/lint_hidden_unicode.ts +350 -0
- package/src/scripts/lint_hook_concern_budget.ts +319 -0
- package/src/scripts/lint_hook_manifest.ts +354 -0
- package/src/scripts/lint_instruction_smuggling.ts +173 -0
- package/src/scripts/lint_load_context.ts +371 -0
- package/src/scripts/lint_marketplace.ts +286 -0
- package/src/scripts/lint_marketplace_install_completeness.ts +309 -0
- package/src/scripts/lint_mcp_config_security.ts +225 -0
- package/src/scripts/lint_mcp_registry_manifest.ts +350 -0
- package/src/scripts/lint_media_policy_linkage.ts +224 -0
- package/src/scripts/lint_missions.ts +774 -0
- package/src/scripts/lint_model_tier_coverage.ts +151 -0
- package/src/scripts/lint_namespace.ts +295 -0
- package/src/scripts/lint_namespace_collisions.ts +203 -0
- package/src/scripts/lint_new_skill_gate.ts +462 -0
- package/src/scripts/lint_no_new_atomic_commands.ts +342 -0
- package/src/scripts/lint_one_off_age.ts +348 -0
- package/src/scripts/lint_orchestration_dsl.ts +377 -0
- package/src/scripts/lint_orchestrator_auto_detect.ts +177 -0
- package/src/scripts/lint_pack_boundaries.ts +366 -0
- package/src/scripts/lint_pack_dependencies.ts +541 -0
- package/src/scripts/lint_pack_first_win.ts +202 -0
- package/src/scripts/lint_persona_governance.ts +292 -0
- package/src/scripts/lint_positioning.ts +257 -0
- package/src/scripts/lint_profile_overlay_set_only.ts +324 -0
- package/src/scripts/lint_readme_jargon.ts +189 -0
- package/src/scripts/lint_readme_size.ts +73 -0
- package/src/scripts/lint_regression.ts +497 -0
- package/src/scripts/lint_roadmap_ci_steps.ts +252 -0
- package/src/scripts/lint_roadmap_complexity.ts +295 -0
- package/src/scripts/lint_roadmap_later_disposition.ts +357 -0
- package/src/scripts/lint_role_experiences.ts +410 -0
- package/src/scripts/lint_rule_interactions.ts +281 -0
- package/src/scripts/lint_rule_tiers.ts +169 -0
- package/src/scripts/lint_showcase_sessions.ts +254 -0
- package/src/scripts/lint_skill_frontmatter_safety.ts +279 -0
- package/src/scripts/lint_skill_originality.ts +586 -0
- package/src/scripts/lint_skill_originality_allowlist.json +20 -0
- package/src/scripts/lint_skill_tools.ts +320 -0
- package/src/scripts/lint_ticket_buildable.ts +1027 -0
- package/src/scripts/lint_topics_yaml.ts +203 -0
- package/src/scripts/lint_trust_coherence.ts +377 -0
- package/src/scripts/lint_value_dashboard.ts +314 -0
- package/src/scripts/lint_workflow_security.ts +637 -0
- package/src/scripts/lint_workflow_security_allowlist.json +20 -0
- package/src/scripts/lint_workspace_boundary.ts +248 -0
- package/src/scripts/mcp_parity_smoke.ts +638 -0
- package/src/scripts/mcp_render.ts +346 -0
- package/src/scripts/mcp_server/__main__.ts +28 -0
- package/src/scripts/mcp_server/catalog.ts +154 -0
- package/src/scripts/mcp_server/index.ts +24 -0
- package/src/scripts/mcp_server/metadata.ts +83 -0
- package/src/scripts/mcp_server/prompts.ts +711 -0
- package/src/scripts/mcp_server/resources.ts +343 -0
- package/src/scripts/mcp_server/server.ts +439 -0
- package/src/scripts/mcp_server/telemetry.ts +154 -0
- package/src/scripts/mcp_server/tools.ts +1031 -0
- package/src/scripts/mcp_setup.sh +25 -52
- package/src/scripts/mcp_telemetry_health.ts +362 -0
- package/src/scripts/mcp_telemetry_query.ts +371 -0
- package/src/scripts/mcp_telemetry_store.ts +422 -0
- package/src/scripts/measure_augment_budget.ts +453 -0
- package/src/scripts/measure_density.ts +618 -0
- package/src/scripts/measure_frugality_savings.ts +353 -0
- package/src/scripts/measure_markitdown_lift.ts +299 -0
- package/src/scripts/measure_patterns.ts +682 -0
- package/src/scripts/measure_projection_bytes.ts +425 -0
- package/src/scripts/measure_rule_budget.ts +627 -0
- package/src/scripts/measure_skill_reduction.ts +442 -0
- package/src/scripts/media/lib/adapter-common.sh +247 -0
- package/src/scripts/media/lib/adapter-contract.md +329 -0
- package/src/scripts/media/lib/fixtures/comfyui/result.json +1 -0
- package/src/scripts/media/lib/fixtures/fal/result.json +1 -0
- package/src/scripts/media/lib/fixtures/flux/asset-0001.png +0 -0
- package/src/scripts/media/lib/fixtures/flux/result.json +1 -0
- package/src/scripts/media/lib/fixtures/gemini-image/asset-0001.png +0 -0
- package/src/scripts/media/lib/fixtures/gemini-image/result.json +1 -0
- package/src/scripts/media/lib/fixtures/gemini-veo/result.json +1 -0
- package/src/scripts/media/lib/fixtures/higgsfield/result.json +1 -0
- package/src/scripts/media/lib/fixtures/ideogram/asset-0001.png +0 -0
- package/src/scripts/media/lib/fixtures/ideogram/result.json +1 -0
- package/src/scripts/media/lib/fixtures/kling/result.json +1 -0
- package/src/scripts/media/lib/fixtures/musetalk/result.json +1 -0
- package/src/scripts/media/lib/fixtures/openai-images/result.json +1 -0
- package/src/scripts/media/lib/fixtures/recraft/asset-0001.svg +1 -0
- package/src/scripts/media/lib/fixtures/recraft/result.json +1 -0
- package/src/scripts/media/lib/fixtures/replicate/result.json +1 -0
- package/src/scripts/media/lib/fixtures/sora/result.json +1 -0
- package/src/scripts/media/lib/fixtures/syncso/result.json +1 -0
- package/src/scripts/media/lib/load-config.sh +180 -0
- package/src/scripts/media/lib/redact.sh +85 -0
- package/src/scripts/memory_hash.ts +331 -0
- package/src/scripts/memory_lookup.ts +1278 -0
- package/src/scripts/memory_report.ts +845 -0
- package/src/scripts/memory_signal.ts +417 -0
- package/src/scripts/memory_status.ts +189 -0
- package/src/scripts/migrate_command_suggestions.ts +341 -0
- package/src/scripts/migrate_frontmatter_defaults.ts +539 -0
- package/src/scripts/migration_status.ts +301 -0
- package/src/scripts/mine_session.ts +645 -0
- package/src/scripts/minimal_safe_diff_hook.ts +355 -0
- package/src/scripts/move_artefact.ts +869 -0
- package/src/scripts/new_skill.ts +404 -0
- package/src/scripts/onboarding_gate_hook.ts +224 -0
- package/src/scripts/pack_dependency_allowlist.json +1 -1
- package/src/scripts/pack_mcp_content.ts +552 -0
- package/src/scripts/parity/README.md +140 -0
- package/src/scripts/parity/compare.ts +189 -0
- package/src/scripts/parity/coverage_diff.ts +199 -0
- package/src/scripts/parity/phase-manifest.json +93 -0
- package/src/scripts/parity/phase_gate.ts +270 -0
- package/src/scripts/parity/replay.ts +320 -0
- package/src/scripts/pattern_share.ts +363 -0
- package/src/scripts/plan_physical_move.ts +605 -0
- package/src/scripts/prediction-pool/poisson_sim.ts +537 -0
- package/src/scripts/prediction-pool/pool_winsim.ts +677 -0
- package/src/scripts/prediction-pool/score_ev.ts +546 -0
- package/src/scripts/print_required_checks.ts +249 -0
- package/src/scripts/probe_projection_fidelity.ts +468 -0
- package/src/scripts/probe_skill_registration.ts +787 -0
- package/src/scripts/profile_staleness_hook.ts +169 -0
- package/src/scripts/profile_use.ts +227 -0
- package/src/scripts/project_thin_rules.ts +387 -0
- package/src/scripts/propose_modules_config.ts +311 -0
- package/src/scripts/prototype_lint_contradictions.ts +414 -0
- package/src/scripts/prove_pack_extractable.ts +388 -0
- package/src/scripts/readme_linter.ts +913 -0
- package/src/scripts/redact_hook_capture.ts +325 -0
- package/src/scripts/refine_ticket_detect.ts +703 -0
- package/src/scripts/release.ts +1697 -0
- package/src/scripts/render_benchmark_md.ts +664 -0
- package/src/scripts/render_value_md.ts +506 -0
- package/src/scripts/repro/repro_marketplace_install_gap.sh +1 -1
- package/src/scripts/roadmap_progress_hook.ts +410 -0
- package/src/scripts/router_telemetry.ts +972 -0
- package/src/scripts/run.ts +98 -0
- package/src/scripts/run_skill_evals.ts +477 -0
- package/src/scripts/runtime_dispatcher.ts +586 -0
- package/src/scripts/runtime_handler.ts +231 -0
- package/src/scripts/runtime_registry.ts +394 -0
- package/src/scripts/schemas/command.schema.json +3 -2
- package/src/scripts/schemas/mission-catalog.schema.json +112 -0
- package/src/scripts/schemas/mission.schema.json +87 -0
- package/src/scripts/schemas/pack.schema.json +6 -0
- package/src/scripts/schemas/rule.schema.json +1 -0
- package/src/scripts/schemas/skill.schema.json +1 -0
- package/src/scripts/schemas/ticket-manifest.schema.json +35 -0
- package/src/scripts/schemas/ticket.schema.json +60 -0
- package/src/scripts/score_skill_selection.ts +570 -0
- package/src/scripts/security_audit_config.ts +423 -0
- package/src/scripts/skill_collision_clusters.ts +448 -0
- package/src/scripts/skill_discovery.ts +690 -0
- package/src/scripts/skill_linter.ts +4276 -0
- package/src/scripts/skill_overlap.ts +414 -0
- package/src/scripts/skill_preview.ts +548 -0
- package/src/scripts/skill_tools/audit_persona_coverage.ts +427 -0
- package/src/scripts/skill_tools/audit_user_type_coverage.ts +507 -0
- package/src/scripts/skill_tools/index.ts +28 -0
- package/src/scripts/skill_tools/run_block_d_eval.ts +373 -0
- package/src/scripts/skill_tools/score_skill_relevance.ts +475 -0
- package/src/scripts/skill_tools/suggest_skill_for_task.ts +288 -0
- package/src/scripts/skill_trigger_eval.ts +1046 -0
- package/src/scripts/skill_usage_collect.ts +465 -0
- package/src/scripts/skill_usage_report.ts +364 -0
- package/src/scripts/smoke/kernel.sh +4 -5
- package/src/scripts/smoke/router.sh +76 -76
- package/src/scripts/smoke/schema.sh +2 -2
- package/src/scripts/smoke/skills.sh +73 -52
- package/src/scripts/smoke_path_resolution.ts +194 -0
- package/src/scripts/smoke_quickstart.ts +224 -0
- package/src/scripts/snapshot_agent_outputs.ts +375 -0
- package/src/scripts/spotcheck_thin_root.ts +247 -0
- package/src/scripts/surface-tiers.yml +68 -0
- package/src/scripts/sync_agent_settings.ts +763 -0
- package/src/scripts/sync_github_metadata.ts +550 -0
- package/src/scripts/sync_gitignore.ts +630 -0
- package/src/scripts/sync_yaml_rt.ts +910 -0
- package/src/scripts/telegraph_stats.ts +447 -0
- package/src/scripts/tool_registry.ts +330 -0
- package/src/scripts/tools/adapter_errors.ts +93 -0
- package/src/scripts/tools/base_adapter.ts +147 -0
- package/src/scripts/tools/github_adapter.ts +229 -0
- package/src/scripts/tools/jira_adapter.ts +196 -0
- package/src/scripts/trigger_coverage.ts +251 -0
- package/src/scripts/update_counts.ts +284 -0
- package/src/scripts/update_prices.ts +219 -0
- package/src/scripts/validate_agent_settings.ts +265 -0
- package/src/scripts/validate_decision_engine.ts +366 -0
- package/src/scripts/validate_discovery_manifest.ts +160 -0
- package/src/scripts/validate_frontmatter.ts +1030 -0
- package/src/scripts/validate_pack_yaml.ts +0 -0
- package/src/scripts/validate_safe_paths.ts +164 -0
- package/src/scripts/validate_telegraph_carveouts.ts +485 -0
- package/src/scripts/verify_before_complete_hook.ts +306 -0
- package/src/scripts/verify_physical_move.ts +411 -0
- package/src/scripts/wrapper_freshness_hook.ts +179 -0
- package/dist/agent-src/scripts/archive_completed_roadmaps.py +0 -171
- package/dist/agent-src/scripts/update_roadmap_progress.py +0 -537
- package/dist/agent-src/skills/corpus-grounding/scripts/bm25_search.py +0 -212
- package/dist/agent-src/skills/corpus-grounding/scripts/decision_engine.py +0 -438
- package/dist/agent-src/skills/corpus-grounding/scripts/ground.py +0 -166
- package/dist/agent-src/skills/corpus-grounding/scripts/schema_validator.py +0 -160
- package/dist/agent-src/skills/design-tokens/scripts/tokens.py +0 -296
- package/dist/agent-src/skills/react-shadcn-ui/scripts/shadcn_add.py +0 -299
- package/dist/agent-src/skills/tailwind-engineer/scripts/tailwind_config_gen.py +0 -463
- package/dist/agent-src/templates/scripts/check_memory.py +0 -282
- package/dist/agent-src/templates/scripts/check_memory_proposal.py +0 -180
- package/dist/agent-src/templates/scripts/implement_ticket/__init__.py +0 -94
- package/dist/agent-src/templates/scripts/implement_ticket/__main__.py +0 -15
- package/dist/agent-src/templates/scripts/memory_hash.py +0 -75
- package/dist/agent-src/templates/scripts/memory_lookup.py +0 -436
- package/dist/agent-src/templates/scripts/memory_report.py +0 -314
- package/dist/agent-src/templates/scripts/memory_signal.py +0 -165
- package/dist/agent-src/templates/scripts/memory_status.py +0 -76
- package/dist/agent-src/templates/scripts/pr_review_routing.py +0 -340
- package/dist/agent-src/templates/scripts/pr_risk_review.py +0 -211
- package/dist/agent-src/templates/scripts/telemetry/__init__.py +0 -42
- package/dist/agent-src/templates/scripts/telemetry/aggregator.py +0 -169
- package/dist/agent-src/templates/scripts/telemetry/boundary.py +0 -171
- package/dist/agent-src/templates/scripts/telemetry/engagement.py +0 -297
- package/dist/agent-src/templates/scripts/telemetry/report_renderer.py +0 -197
- package/dist/agent-src/templates/scripts/telemetry/settings.py +0 -177
- package/dist/agent-src/templates/scripts/telemetry_record.py +0 -179
- package/dist/agent-src/templates/scripts/telemetry_report.py +0 -161
- package/dist/agent-src/templates/scripts/telemetry_status.py +0 -142
- package/dist/agent-src/templates/scripts/tier_usage_report.py +0 -183
- package/dist/agent-src/templates/scripts/work_engine/__init__.py +0 -58
- package/dist/agent-src/templates/scripts/work_engine/__main__.py +0 -9
- package/dist/agent-src/templates/scripts/work_engine/_lib/__init__.py +0 -7
- package/dist/agent-src/templates/scripts/work_engine/_lib/agent_settings.py +0 -840
- package/dist/agent-src/templates/scripts/work_engine/_lib/user_global_paths.py +0 -249
- package/dist/agent-src/templates/scripts/work_engine/cli.py +0 -195
- package/dist/agent-src/templates/scripts/work_engine/cli_args.py +0 -116
- package/dist/agent-src/templates/scripts/work_engine/delivery_state.py +0 -137
- package/dist/agent-src/templates/scripts/work_engine/directives/__init__.py +0 -33
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/__init__.py +0 -98
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/analyze.py +0 -98
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/implement.py +0 -145
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/memory.py +0 -136
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/plan.py +0 -175
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/refine.py +0 -396
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/report.py +0 -227
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/test.py +0 -180
- package/dist/agent-src/templates/scripts/work_engine/directives/backend/verify.py +0 -170
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/__init__.py +0 -116
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/contract.py +0 -254
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/stitch.py +0 -229
- package/dist/agent-src/templates/scripts/work_engine/directives/mixed/ui.py +0 -231
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/__init__.py +0 -113
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/_passthrough.py +0 -44
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/apply.py +0 -241
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/audit.py +0 -414
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/design.py +0 -335
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/polish.py +0 -513
- package/dist/agent-src/templates/scripts/work_engine/directives/ui/review.py +0 -471
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/__init__.py +0 -119
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/_skipped.py +0 -37
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/apply.py +0 -165
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/refine.py +0 -66
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/report.py +0 -62
- package/dist/agent-src/templates/scripts/work_engine/directives/ui_trivial/test.py +0 -115
- package/dist/agent-src/templates/scripts/work_engine/dispatcher.py +0 -331
- package/dist/agent-src/templates/scripts/work_engine/emitters.py +0 -68
- package/dist/agent-src/templates/scripts/work_engine/errors.py +0 -19
- package/dist/agent-src/templates/scripts/work_engine/hook_bootstrap.py +0 -91
- package/dist/agent-src/templates/scripts/work_engine/hooks/__init__.py +0 -54
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/__init__.py +0 -35
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/_chat_history_base.py +0 -59
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/chat_history_append.py +0 -43
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/chat_history_halt_append.py +0 -41
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/decision_gate.py +0 -162
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/decision_trace.py +0 -163
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/directive_set_guard.py +0 -53
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/halt_surface_audit.py +0 -50
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/memory_visibility.py +0 -141
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/state_shape_validation.py +0 -52
- package/dist/agent-src/templates/scripts/work_engine/hooks/builtin/trace.py +0 -84
- package/dist/agent-src/templates/scripts/work_engine/hooks/context.py +0 -66
- package/dist/agent-src/templates/scripts/work_engine/hooks/events.py +0 -44
- package/dist/agent-src/templates/scripts/work_engine/hooks/exceptions.py +0 -79
- package/dist/agent-src/templates/scripts/work_engine/hooks/registry.py +0 -60
- package/dist/agent-src/templates/scripts/work_engine/hooks/runner.py +0 -73
- package/dist/agent-src/templates/scripts/work_engine/hooks/settings.py +0 -196
- package/dist/agent-src/templates/scripts/work_engine/input_builders.py +0 -163
- package/dist/agent-src/templates/scripts/work_engine/intent/__init__.py +0 -47
- package/dist/agent-src/templates/scripts/work_engine/intent/classify.py +0 -280
- package/dist/agent-src/templates/scripts/work_engine/migration/__init__.py +0 -8
- package/dist/agent-src/templates/scripts/work_engine/migration/v0_to_v1.py +0 -231
- package/dist/agent-src/templates/scripts/work_engine/orchestration.py +0 -193
- package/dist/agent-src/templates/scripts/work_engine/persona_policy.py +0 -85
- package/dist/agent-src/templates/scripts/work_engine/resolvers/__init__.py +0 -22
- package/dist/agent-src/templates/scripts/work_engine/resolvers/diff.py +0 -106
- package/dist/agent-src/templates/scripts/work_engine/resolvers/file.py +0 -113
- package/dist/agent-src/templates/scripts/work_engine/resolvers/prompt.py +0 -90
- package/dist/agent-src/templates/scripts/work_engine/scoring/__init__.py +0 -14
- package/dist/agent-src/templates/scripts/work_engine/scoring/confidence.py +0 -300
- package/dist/agent-src/templates/scripts/work_engine/scoring/decision_engine.py +0 -351
- package/dist/agent-src/templates/scripts/work_engine/scoring/decision_trace.py +0 -141
- package/dist/agent-src/templates/scripts/work_engine/scoring/memory_visibility.py +0 -283
- package/dist/agent-src/templates/scripts/work_engine/stack/__init__.py +0 -31
- package/dist/agent-src/templates/scripts/work_engine/stack/detect.py +0 -187
- package/dist/agent-src/templates/scripts/work_engine/stack/runner.py +0 -481
- package/dist/agent-src/templates/scripts/work_engine/state.py +0 -694
- package/dist/agent-src/templates/scripts/work_engine/state_io.py +0 -202
- package/dist/cli/python/resolvePython.js +0 -38
- package/dist/cli/python/resolvePython.js.map +0 -1
- package/src/scripts/__pycache__/validate_frontmatter.cpython-312.pyc +0 -0
- package/src/scripts/_archive/_backfill_skill_domains.py +0 -140
- package/src/scripts/_archive/_bootstrap_tier_frontmatter.py +0 -151
- package/src/scripts/_archive/_p43_bodies.py +0 -235
- package/src/scripts/_archive/_p43_condense.py +0 -118
- package/src/scripts/_archive/_p4_migrate.py +0 -199
- package/src/scripts/_archive/_phase2_shim_helper.py +0 -109
- package/src/scripts/_archive/_pilot_council_question.py +0 -57
- package/src/scripts/_cli/__init__.py +0 -0
- package/src/scripts/_cli/cmd_doctor.py +0 -1669
- package/src/scripts/_cli/cmd_explain.py +0 -355
- package/src/scripts/_cli/cmd_export.py +0 -157
- package/src/scripts/_cli/cmd_migrate.py +0 -524
- package/src/scripts/_cli/cmd_prune.py +0 -322
- package/src/scripts/_cli/cmd_refresh.py +0 -179
- package/src/scripts/_cli/cmd_settings_check.py +0 -171
- package/src/scripts/_cli/cmd_settings_migrate.py +0 -147
- package/src/scripts/_cli/cmd_sync.py +0 -166
- package/src/scripts/_cli/cmd_uninstall.py +0 -476
- package/src/scripts/_cli/cmd_update.py +0 -279
- package/src/scripts/_cli/cmd_upgrade.py +0 -172
- package/src/scripts/_cli/cmd_validate.py +0 -177
- package/src/scripts/_cli/cmd_versions.py +0 -160
- package/src/scripts/_cli/explain_last/__init__.py +0 -122
- package/src/scripts/_cli/explain_last/assumptions.py +0 -59
- package/src/scripts/_cli/explain_last/council.py +0 -105
- package/src/scripts/_cli/explain_last/halt.py +0 -44
- package/src/scripts/_cli/explain_last/inputs.py +0 -128
- package/src/scripts/_cli/explain_last/memory.py +0 -94
- package/src/scripts/_cli/explain_last/provider.py +0 -52
- package/src/scripts/_cli/explain_last/render.py +0 -52
- package/src/scripts/_cli/explain_last/route.py +0 -59
- package/src/scripts/_cli/explain_last/scrubber.py +0 -105
- package/src/scripts/_cli/explain_last/sections/__init__.py +0 -35
- package/src/scripts/_cli/explain_last/sections/assumptions.py +0 -21
- package/src/scripts/_cli/explain_last/sections/council.py +0 -27
- package/src/scripts/_cli/explain_last/sections/halt.py +0 -31
- package/src/scripts/_cli/explain_last/sections/header.py +0 -24
- package/src/scripts/_cli/explain_last/sections/inputs.py +0 -27
- package/src/scripts/_cli/explain_last/sections/memory.py +0 -21
- package/src/scripts/_cli/explain_last/sections/pack.py +0 -16
- package/src/scripts/_cli/explain_last/sections/provider.py +0 -26
- package/src/scripts/_cli/explain_last/sections/route.py +0 -22
- package/src/scripts/_cli/explain_last/state_loader.py +0 -76
- package/src/scripts/_emit_domain_table.py +0 -35
- package/src/scripts/_lib/__init__.py +0 -5
- package/src/scripts/_lib/__pycache__/__init__.cpython-312.pyc +0 -0
- package/src/scripts/_lib/__pycache__/agent_src.cpython-312.pyc +0 -0
- package/src/scripts/_lib/agent_settings.py +0 -840
- package/src/scripts/_lib/agent_src.py +0 -491
- package/src/scripts/_lib/agents_overlay.py +0 -120
- package/src/scripts/_lib/bench_ab_cache.py +0 -162
- package/src/scripts/_lib/bench_ab_scoring.py +0 -209
- package/src/scripts/_lib/bench_ab_scoring_v2.py +0 -227
- package/src/scripts/_lib/bench_cost.py +0 -138
- package/src/scripts/_lib/bench_quality.py +0 -118
- package/src/scripts/_lib/bench_report.py +0 -149
- package/src/scripts/_lib/bench_telegraph.py +0 -273
- package/src/scripts/_lib/bench_telegraph_report.py +0 -151
- package/src/scripts/_lib/changelog_eras.py +0 -330
- package/src/scripts/_lib/claude_desktop_bundler.py +0 -238
- package/src/scripts/_lib/cli_wrapper.py +0 -64
- package/src/scripts/_lib/fs_atomic.py +0 -116
- package/src/scripts/_lib/global_deploy_inventory.py +0 -312
- package/src/scripts/_lib/install_regenerator.py +0 -134
- package/src/scripts/_lib/installed_lock.py +0 -256
- package/src/scripts/_lib/installed_tools.py +0 -381
- package/src/scripts/_lib/json_pointers.py +0 -260
- package/src/scripts/_lib/link_crypto.py +0 -206
- package/src/scripts/_lib/linked_projects.py +0 -238
- package/src/scripts/_lib/model_tier.py +0 -52
- package/src/scripts/_lib/module_detection.py +0 -223
- package/src/scripts/_lib/pin_resolver.py +0 -152
- package/src/scripts/_lib/script_output.py +0 -144
- package/src/scripts/_lib/security_lint.py +0 -228
- package/src/scripts/_lib/token_count.py +0 -95
- package/src/scripts/_lib/update_check.py +0 -207
- package/src/scripts/_lib/user_global_paths.py +0 -249
- package/src/scripts/_lib/value_ladder.py +0 -696
- package/src/scripts/_lib/value_report.py +0 -455
- package/src/scripts/_phase4_bucket.py +0 -210
- package/src/scripts/_pilot_measure.py +0 -53
- package/src/scripts/_tmp_scan_framework_leakage.py +0 -119
- package/src/scripts/adoption_report.py +0 -195
- package/src/scripts/adoption_snapshot.py +0 -219
- package/src/scripts/adoption_status.py +0 -166
- package/src/scripts/adr/regenerate_index.py +0 -79
- package/src/scripts/ai-video/lib/adapter-common.sh +0 -231
- package/src/scripts/ai-video/lib/adapter-contract.md +0 -329
- package/src/scripts/ai-video/lib/fixtures/comfyui/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/fal/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/gemini-veo/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/higgsfield/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/kling/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/musetalk/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/openai-images/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/replicate/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/sora/result.json +0 -1
- package/src/scripts/ai-video/lib/fixtures/syncso/result.json +0 -1
- package/src/scripts/ai-video/lib/load-config.sh +0 -180
- package/src/scripts/ai-video/lib/redact.sh +0 -85
- package/src/scripts/ai_council/__init__.py +0 -40
- package/src/scripts/ai_council/_default_prices.py +0 -50
- package/src/scripts/ai_council/advisors.py +0 -148
- package/src/scripts/ai_council/airgap.py +0 -165
- package/src/scripts/ai_council/budget_guard.py +0 -202
- package/src/scripts/ai_council/bundler.py +0 -263
- package/src/scripts/ai_council/cli_hints.py +0 -123
- package/src/scripts/ai_council/clients.py +0 -1385
- package/src/scripts/ai_council/compile_corpus.py +0 -179
- package/src/scripts/ai_council/confidence_gate.py +0 -156
- package/src/scripts/ai_council/config.py +0 -1419
- package/src/scripts/ai_council/consensus.py +0 -329
- package/src/scripts/ai_council/events_log.py +0 -141
- package/src/scripts/ai_council/learn_low_impact_preview.py +0 -252
- package/src/scripts/ai_council/low_impact.py +0 -714
- package/src/scripts/ai_council/low_impact_corpus.py +0 -466
- package/src/scripts/ai_council/low_impact_intake.py +0 -163
- package/src/scripts/ai_council/modes.py +0 -131
- package/src/scripts/ai_council/necessity.py +0 -782
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_2a4_acceptance.py +0 -208
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_add_quiet.py +0 -149
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_budget_v2_audit.py +0 -206
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_context_layer_v1_estimate.py +0 -67
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_context_layer_v1_review.py +0 -292
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_followups_review.py +0 -259
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_inject_quiet_flag.py +0 -33
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_measure_v2.sh +0 -36
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_measure_verbosity.sh +0 -26
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_nondestructive_inline_audit.py +0 -209
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_per_task.sh +0 -41
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_phase4_dispatch_latency.py +0 -108
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_phase6_trigger_jaccard.py +0 -92
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_phase_2a_budget_rebalance.py +0 -257
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_phase_2a_post_revert.py +0 -197
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_rebalancing_audit.py +0 -149
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_roundtrip.py +0 -111
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_rule_hardening_v1.py +0 -251
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_silent_taskfiles.py +0 -98
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_structural_open_questions.py +0 -232
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_structural_optimization.py +0 -144
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_structural_v3_gaps.py +0 -252
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_structural_v3_review.py +0 -240
- package/src/scripts/ai_council/one_off_archive/2026-05/_one_off_tier_retrofit.py +0 -180
- package/src/scripts/ai_council/orchestrator.py +0 -1206
- package/src/scripts/ai_council/pricing.py +0 -215
- package/src/scripts/ai_council/probation_gate.py +0 -152
- package/src/scripts/ai_council/project_context.py +0 -159
- package/src/scripts/ai_council/prompts.py +0 -567
- package/src/scripts/ai_council/redact_low_impact_entry.py +0 -155
- package/src/scripts/ai_council/replay.py +0 -155
- package/src/scripts/ai_council/session.py +0 -366
- package/src/scripts/ai_council/shadow_dispatch.py +0 -235
- package/src/scripts/ai_council/solo_dispatch.py +0 -226
- package/src/scripts/annotate_discovery.py +0 -149
- package/src/scripts/apply_modules_config.py +0 -290
- package/src/scripts/audit_adr_coverage.py +0 -173
- package/src/scripts/audit_auto_rules.py +0 -175
- package/src/scripts/audit_cloud_compatibility.py +0 -362
- package/src/scripts/audit_command_surface.py +0 -682
- package/src/scripts/audit_initial_context.py +0 -237
- package/src/scripts/audit_likelihood.py +0 -148
- package/src/scripts/audit_mcp_tools.py +0 -146
- package/src/scripts/audit_overlap.py +0 -145
- package/src/scripts/audit_skill_descriptions.py +0 -180
- package/src/scripts/audit_skill_overlap.py +0 -207
- package/src/scripts/audit_user_type_axis.py +0 -140
- package/src/scripts/backfill_model_tier.py +0 -184
- package/src/scripts/bench_ab_cache_dispatch.py +0 -68
- package/src/scripts/bench_ab_clone.py +0 -220
- package/src/scripts/bench_ab_diff.py +0 -220
- package/src/scripts/bench_ab_integrity.py +0 -143
- package/src/scripts/bench_ab_run.py +0 -235
- package/src/scripts/bench_ab_task_runner.py +0 -814
- package/src/scripts/bench_ab_tracka_run.py +0 -202
- package/src/scripts/bench_ab_v2_run.py +0 -247
- package/src/scripts/bench_ab_v2_stats.py +0 -347
- package/src/scripts/bench_baseline_ready.py +0 -108
- package/src/scripts/bench_condense_memory.py +0 -168
- package/src/scripts/bench_drift_check.py +0 -151
- package/src/scripts/bench_per_tool.py +0 -216
- package/src/scripts/bench_rtk_savings.py +0 -320
- package/src/scripts/bench_run.py +0 -272
- package/src/scripts/bench_runner.py +0 -158
- package/src/scripts/build_cloud_bundle.py +0 -458
- package/src/scripts/build_discovery_manifest.py +0 -757
- package/src/scripts/build_linear_digest.py +0 -260
- package/src/scripts/build_mcp_registry_manifest.py +0 -181
- package/src/scripts/build_rule_trigger_matrix.py +0 -350
- package/src/scripts/capture_showcase_session.py +0 -361
- package/src/scripts/chat_history.py +0 -1799
- package/src/scripts/check_always_budget.py +0 -532
- package/src/scripts/check_artefact_checksums.py +0 -111
- package/src/scripts/check_augment_description_cap.py +0 -79
- package/src/scripts/check_augmentignore.py +0 -72
- package/src/scripts/check_beta_review_markers.py +0 -127
- package/src/scripts/check_bite_sized_granularity.py +0 -98
- package/src/scripts/check_cluster_patterns.py +0 -206
- package/src/scripts/check_command_count_messaging.py +0 -152
- package/src/scripts/check_condensation.py +0 -375
- package/src/scripts/check_condensed_paths.py +0 -231
- package/src/scripts/check_context_paths.py +0 -202
- package/src/scripts/check_council_layout.py +0 -125
- package/src/scripts/check_council_references.py +0 -228
- package/src/scripts/check_discovery_determinism.py +0 -70
- package/src/scripts/check_gate_paths.py +0 -128
- package/src/scripts/check_iron_law_prominence.py +0 -145
- package/src/scripts/check_kernel_rule_bundle.py +0 -151
- package/src/scripts/check_md_language.py +0 -161
- package/src/scripts/check_memory.py +0 -429
- package/src/scripts/check_memory_proposal.py +0 -182
- package/src/scripts/check_module_management_neutral.py +0 -147
- package/src/scripts/check_no_external_sources.py +0 -101
- package/src/scripts/check_no_local_settings_committed.py +0 -51
- package/src/scripts/check_no_new_legacy_path.py +0 -100
- package/src/scripts/check_no_roadmap_refs.py +0 -155
- package/src/scripts/check_one_off_location.py +0 -81
- package/src/scripts/check_overlay_cascade_subdirs.py +0 -129
- package/src/scripts/check_portability.py +0 -574
- package/src/scripts/check_proposal.py +0 -269
- package/src/scripts/check_public_catalog_links.py +0 -125
- package/src/scripts/check_public_links.py +0 -185
- package/src/scripts/check_references.py +0 -559
- package/src/scripts/check_release_includes_discovery.py +0 -61
- package/src/scripts/check_release_pr_shape.py +0 -123
- package/src/scripts/check_release_published.py +0 -145
- package/src/scripts/check_release_trunk_sync.py +0 -152
- package/src/scripts/check_reply_consistency.py +0 -169
- package/src/scripts/check_roadmap_trackable.py +0 -114
- package/src/scripts/check_role_doc_links.py +0 -110
- package/src/scripts/check_safety_floor_untouched.py +0 -125
- package/src/scripts/check_skill_requires.py +0 -147
- package/src/scripts/check_template_pin_drift.py +0 -129
- package/src/scripts/check_test_coverage_diff.py +0 -180
- package/src/scripts/check_token_optimizer_freshness.py +0 -146
- package/src/scripts/check_update_banner.py +0 -86
- package/src/scripts/ci_status.py +0 -301
- package/src/scripts/ci_summary.py +0 -131
- package/src/scripts/ci_time_ratio.py +0 -168
- package/src/scripts/command_suggester/__init__.py +0 -51
- package/src/scripts/command_suggester/cooldown.py +0 -132
- package/src/scripts/command_suggester/loader.py +0 -73
- package/src/scripts/command_suggester/match.py +0 -180
- package/src/scripts/command_suggester/rank.py +0 -120
- package/src/scripts/command_suggester/render.py +0 -86
- package/src/scripts/command_suggester/sanitize.py +0 -113
- package/src/scripts/command_suggester/settings.py +0 -127
- package/src/scripts/command_suggester/types.py +0 -78
- package/src/scripts/compile_router.py +0 -232
- package/src/scripts/condense.py +0 -1919
- package/src/scripts/condense_memory.py +0 -178
- package/src/scripts/config/__init__.py +0 -9
- package/src/scripts/config/packs.py +0 -157
- package/src/scripts/config/presets.py +0 -224
- package/src/scripts/config/profile_explain.py +0 -89
- package/src/scripts/config/profiles.py +0 -191
- package/src/scripts/config/session_profiles.py +0 -542
- package/src/scripts/context_hygiene_hook.py +0 -181
- package/src/scripts/cost_by_conversation.py +0 -78
- package/src/scripts/cost_summary.py +0 -97
- package/src/scripts/council_cli.py +0 -2571
- package/src/scripts/council_prune.py +0 -81
- package/src/scripts/cross_repo_retrieve.py +0 -172
- package/src/scripts/discovery_stats.py +0 -70
- package/src/scripts/extract_audit_patterns.py +0 -202
- package/src/scripts/first_run_gate_hook.py +0 -179
- package/src/scripts/gen_discovery_baseline.py +0 -127
- package/src/scripts/generate_catalog.py +0 -116
- package/src/scripts/generate_command_flows.py +0 -191
- package/src/scripts/generate_index.py +0 -303
- package/src/scripts/generate_ownership_matrix.py +0 -378
- package/src/scripts/generate_pack_manifests.py +0 -340
- package/src/scripts/hooks/__init__.py +0 -1
- package/src/scripts/hooks/dispatch_hook.py +0 -461
- package/src/scripts/hooks/dispatch_issues.py +0 -136
- package/src/scripts/hooks/envelope.py +0 -98
- package/src/scripts/hooks/replay_hook.py +0 -144
- package/src/scripts/hooks/state_io.py +0 -145
- package/src/scripts/hooks_doctor.py +0 -223
- package/src/scripts/hooks_status.py +0 -157
- package/src/scripts/injection_scan_hook.py +0 -145
- package/src/scripts/install.py +0 -5258
- package/src/scripts/inventory_abstraction_budget.py +0 -622
- package/src/scripts/inventory_frontmatter.py +0 -164
- package/src/scripts/inventory_meta_layers.py +0 -288
- package/src/scripts/iron_law_sha.py +0 -107
- package/src/scripts/linked_projects_list.py +0 -91
- package/src/scripts/lint_agent_security.py +0 -112
- package/src/scripts/lint_agent_skill_names.py +0 -150
- package/src/scripts/lint_agents_layout.py +0 -197
- package/src/scripts/lint_agents_md.py +0 -210
- package/src/scripts/lint_archived_skills.py +0 -159
- package/src/scripts/lint_artefact_frontmatter.py +0 -188
- package/src/scripts/lint_bench_ab.py +0 -173
- package/src/scripts/lint_bench_corpus.py +0 -255
- package/src/scripts/lint_command_flow_coverage.py +0 -132
- package/src/scripts/lint_command_routing.py +0 -160
- package/src/scripts/lint_command_tiers.py +0 -216
- package/src/scripts/lint_command_verbs.py +0 -206
- package/src/scripts/lint_commit_subjects.py +0 -139
- package/src/scripts/lint_context_spine_usage.py +0 -137
- package/src/scripts/lint_discovery_manifest.py +0 -176
- package/src/scripts/lint_discovery_vocabulary.py +0 -222
- package/src/scripts/lint_empty_roadmaps.py +0 -80
- package/src/scripts/lint_examples.py +0 -102
- package/src/scripts/lint_explain_trace.py +0 -80
- package/src/scripts/lint_featured_skills.py +0 -144
- package/src/scripts/lint_flows.py +0 -215
- package/src/scripts/lint_framework_leakage.py +0 -375
- package/src/scripts/lint_frontmatter_boilerplate.py +0 -77
- package/src/scripts/lint_ghostwriter_source.py +0 -242
- package/src/scripts/lint_global_paths.py +0 -148
- package/src/scripts/lint_handoffs.py +0 -217
- package/src/scripts/lint_hidden_unicode.py +0 -132
- package/src/scripts/lint_hook_concern_budget.py +0 -207
- package/src/scripts/lint_hook_manifest.py +0 -217
- package/src/scripts/lint_instruction_smuggling.py +0 -107
- package/src/scripts/lint_load_context.py +0 -196
- package/src/scripts/lint_marketplace.py +0 -180
- package/src/scripts/lint_marketplace_install_completeness.py +0 -198
- package/src/scripts/lint_mcp_config_security.py +0 -124
- package/src/scripts/lint_mcp_registry_manifest.py +0 -69
- package/src/scripts/lint_media_policy_linkage.py +0 -140
- package/src/scripts/lint_model_tier_coverage.py +0 -73
- package/src/scripts/lint_namespace.py +0 -135
- package/src/scripts/lint_namespace_collisions.py +0 -103
- package/src/scripts/lint_new_skill_gate.py +0 -144
- package/src/scripts/lint_no_new_atomic_commands.py +0 -180
- package/src/scripts/lint_one_off_age.py +0 -184
- package/src/scripts/lint_orchestration_dsl.py +0 -217
- package/src/scripts/lint_orchestrator_auto_detect.py +0 -111
- package/src/scripts/lint_pack_boundaries.py +0 -147
- package/src/scripts/lint_pack_dependencies.py +0 -137
- package/src/scripts/lint_pack_first_win.py +0 -121
- package/src/scripts/lint_persona_governance.py +0 -164
- package/src/scripts/lint_positioning.py +0 -143
- package/src/scripts/lint_profile_overlay_set_only.py +0 -179
- package/src/scripts/lint_readme_jargon.py +0 -131
- package/src/scripts/lint_readme_size.py +0 -33
- package/src/scripts/lint_regression.py +0 -251
- package/src/scripts/lint_roadmap_ci_steps.py +0 -186
- package/src/scripts/lint_roadmap_complexity.py +0 -220
- package/src/scripts/lint_role_experiences.py +0 -255
- package/src/scripts/lint_rule_interactions.py +0 -170
- package/src/scripts/lint_rule_tiers.py +0 -90
- package/src/scripts/lint_showcase_sessions.py +0 -148
- package/src/scripts/lint_skill_frontmatter_safety.py +0 -144
- package/src/scripts/lint_skill_tools.py +0 -168
- package/src/scripts/lint_topics_yaml.py +0 -89
- package/src/scripts/lint_trust_coherence.py +0 -212
- package/src/scripts/lint_value_dashboard.py +0 -218
- package/src/scripts/lint_workspace_boundary.py +0 -122
- package/src/scripts/mcp_parity_smoke.py +0 -316
- package/src/scripts/mcp_render.py +0 -173
- package/src/scripts/mcp_server/__init__.py +0 -19
- package/src/scripts/mcp_server/__main__.py +0 -12
- package/src/scripts/mcp_server/catalog.py +0 -125
- package/src/scripts/mcp_server/metadata.py +0 -75
- package/src/scripts/mcp_server/prompts.py +0 -442
- package/src/scripts/mcp_server/requirements.txt +0 -4
- package/src/scripts/mcp_server/resources.py +0 -201
- package/src/scripts/mcp_server/server.py +0 -270
- package/src/scripts/mcp_server/telemetry.py +0 -128
- package/src/scripts/mcp_server/tools.py +0 -926
- package/src/scripts/mcp_telemetry_health.py +0 -214
- package/src/scripts/mcp_telemetry_query.py +0 -203
- package/src/scripts/mcp_telemetry_store.py +0 -211
- package/src/scripts/measure_augment_budget.py +0 -214
- package/src/scripts/measure_density.py +0 -232
- package/src/scripts/measure_frugality_savings.py +0 -164
- package/src/scripts/measure_markitdown_lift.py +0 -127
- package/src/scripts/measure_patterns.py +0 -376
- package/src/scripts/measure_projection_bytes.py +0 -159
- package/src/scripts/measure_rule_budget.py +0 -347
- package/src/scripts/measure_skill_reduction.py +0 -102
- package/src/scripts/memory_hash.py +0 -75
- package/src/scripts/memory_lookup.py +0 -436
- package/src/scripts/memory_report.py +0 -314
- package/src/scripts/memory_signal.py +0 -165
- package/src/scripts/memory_status.py +0 -76
- package/src/scripts/migrate_command_suggestions.py +0 -151
- package/src/scripts/migrate_frontmatter_defaults.py +0 -245
- package/src/scripts/mine_session.py +0 -356
- package/src/scripts/minimal_safe_diff_hook.py +0 -245
- package/src/scripts/move_artefact.py +0 -143
- package/src/scripts/new_skill.py +0 -148
- package/src/scripts/onboarding_gate_hook.py +0 -142
- package/src/scripts/pack_mcp_content.py +0 -293
- package/src/scripts/plan_physical_move.py +0 -353
- package/src/scripts/prediction-pool/poisson_sim.py +0 -167
- package/src/scripts/prediction-pool/pool_winsim.py +0 -236
- package/src/scripts/prediction-pool/score_ev.py +0 -188
- package/src/scripts/print_required_checks.py +0 -196
- package/src/scripts/probe_projection_fidelity.py +0 -202
- package/src/scripts/probe_skill_registration.py +0 -413
- package/src/scripts/profile_staleness_hook.py +0 -69
- package/src/scripts/profile_use.py +0 -164
- package/src/scripts/project_thin_rules.py +0 -168
- package/src/scripts/propose_modules_config.py +0 -145
- package/src/scripts/prototype_lint_contradictions.py +0 -150
- package/src/scripts/prove_pack_extractable.py +0 -187
- package/src/scripts/readme_linter.py +0 -589
- package/src/scripts/redact_hook_capture.py +0 -148
- package/src/scripts/refine_ticket_detect.py +0 -646
- package/src/scripts/release.py +0 -1091
- package/src/scripts/render_benchmark_md.py +0 -401
- package/src/scripts/render_value_md.py +0 -347
- package/src/scripts/requirements-evals.txt +0 -8
- package/src/scripts/roadmap_progress_hook.py +0 -274
- package/src/scripts/router_telemetry.py +0 -470
- package/src/scripts/run_skill_evals.py +0 -185
- package/src/scripts/runtime_dispatcher.py +0 -276
- package/src/scripts/runtime_handler.py +0 -148
- package/src/scripts/runtime_registry.py +0 -166
- package/src/scripts/score_skill_selection.py +0 -198
- package/src/scripts/security_audit_config.py +0 -153
- package/src/scripts/setup_eval_venv.sh +0 -58
- package/src/scripts/skill_collision_clusters.py +0 -162
- package/src/scripts/skill_discovery.py +0 -254
- package/src/scripts/skill_linter.py +0 -3694
- package/src/scripts/skill_overlap.py +0 -204
- package/src/scripts/skill_preview.py +0 -179
- package/src/scripts/skill_tools/__init__.py +0 -22
- package/src/scripts/skill_tools/audit_persona_coverage.py +0 -147
- package/src/scripts/skill_tools/audit_user_type_coverage.py +0 -148
- package/src/scripts/skill_tools/run_block_d_eval.py +0 -129
- package/src/scripts/skill_tools/score_skill_relevance.py +0 -169
- package/src/scripts/skill_tools/suggest_skill_for_task.py +0 -113
- package/src/scripts/skill_trigger_eval.py +0 -682
- package/src/scripts/skill_usage_collect.py +0 -191
- package/src/scripts/skill_usage_report.py +0 -162
- package/src/scripts/smoke_path_resolution.py +0 -93
- package/src/scripts/smoke_quickstart.py +0 -144
- package/src/scripts/snapshot_agent_outputs.py +0 -144
- package/src/scripts/spotcheck_thin_root.py +0 -134
- package/src/scripts/sync_agent_settings.py +0 -180
- package/src/scripts/sync_github_metadata.py +0 -147
- package/src/scripts/sync_gitignore.py +0 -291
- package/src/scripts/sync_yaml_rt.py +0 -734
- package/src/scripts/telegraph_stats.py +0 -119
- package/src/scripts/tool_registry.py +0 -146
- package/src/scripts/tools/__init__.py +0 -1
- package/src/scripts/tools/adapter_errors.py +0 -63
- package/src/scripts/tools/base_adapter.py +0 -91
- package/src/scripts/tools/github_adapter.py +0 -128
- package/src/scripts/tools/jira_adapter.py +0 -115
- package/src/scripts/trigger_coverage.py +0 -129
- package/src/scripts/update_counts.py +0 -199
- package/src/scripts/update_prices.py +0 -125
- package/src/scripts/validate_agent_settings.py +0 -124
- package/src/scripts/validate_decision_engine.py +0 -136
- package/src/scripts/validate_discovery_manifest.py +0 -94
- package/src/scripts/validate_frontmatter.py +0 -647
- package/src/scripts/validate_pack_yaml.py +0 -179
- package/src/scripts/validate_safe_paths.py +0 -118
- package/src/scripts/validate_telegraph_carveouts.py +0 -129
- package/src/scripts/verify_before_complete_hook.py +0 -216
- package/src/scripts/verify_physical_move.py +0 -185
- package/src/scripts/wrapper_freshness_hook.py +0 -86
- /package/dist/agent-src/skills/design-intelligence/data/{typography.csv → font-pairings-reference.csv} +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/allin1/analysis.json +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/comfyui/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/fal/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/gemini-veo/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/higgsfield/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/kling/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/musetalk/lipsync-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/openai-images/scene-0001.png +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/replicate/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/sora/scene-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/syncso/lipsync-0001.mp4 +0 -0
- /package/src/scripts/{ai-video → media}/lib/fixtures/whisperx/transcript.json +0 -0
- /package/src/scripts/{ai-video → media}/lib/telemetry.sh +0 -0
|
@@ -0,0 +1,1018 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
/**
|
|
3
|
+
* bench:ab v2 — paired statistics (Phase 3).
|
|
4
|
+
*
|
|
5
|
+
* TypeScript twin of `src/scripts/bench_ab_v2_stats.py` (ADR-200 Python→TS
|
|
6
|
+
* migration). Mirrors the CLI contract EXACTLY: positional `report` arg, the
|
|
7
|
+
* `--json` / `--markdown PATH` flags, exit codes (0 ok / 1 no report found),
|
|
8
|
+
* byte-identical stdout/stderr, byte-identical analysis JSON, and byte-identical
|
|
9
|
+
* rendered markdown. No behaviour changes.
|
|
10
|
+
*
|
|
11
|
+
* Reads a v2 paired report (bench_ab_v2_run.py output) and computes, for each
|
|
12
|
+
* arm comparison, paired significance + effect size on:
|
|
13
|
+
*
|
|
14
|
+
* - capability axis (binary) -> McNemar exact test + Cohen's h
|
|
15
|
+
* - discipline axis ([0,1]) -> Wilcoxon signed-rank + rank-biserial
|
|
16
|
+
* - status buckets -> error/undisciplined-rate per arm
|
|
17
|
+
*
|
|
18
|
+
* Pairing: each (task, seed) is one pair, seen under every arm. Pooled across all
|
|
19
|
+
* task×seed pairs. Dependency-free (stdlib math only) so the benchmark stays
|
|
20
|
+
* portable. Errored runs are EXCLUDED from a pair (per-axis) so a quota trip is
|
|
21
|
+
* never read as a content/discipline fail.
|
|
22
|
+
*
|
|
23
|
+
* Float parity: `math.erf` is ported from CPython's `m_erf` series and `math.comb`
|
|
24
|
+
* from an exact BigInt computation, so every `round(p, 4)` / `round(h, 4)` output
|
|
25
|
+
* is byte-identical to the Python original.
|
|
26
|
+
*/
|
|
27
|
+
import * as fs from 'node:fs';
|
|
28
|
+
import * as path from 'node:path';
|
|
29
|
+
import process from 'node:process';
|
|
30
|
+
import { fileURLToPath, pathToFileURL } from 'node:url';
|
|
31
|
+
|
|
32
|
+
// Absolute filesystem path of this module, converted from its ESM `import.meta.url`.
const _HERE = fileURLToPath(import.meta.url);

// bench_ab_v2_stats.ts → parents[2] is repo root (script lives in src/scripts/).
// Concretely: two directory levels above the directory that contains this file.
const REPO_ROOT = path.resolve(path.dirname(_HERE), '..', '..');
// <REPO_ROOT>/internal/bench/reports/ab-v2
const REPORTS_DIR = path.join(REPO_ROOT, 'internal', 'bench', 'reports', 'ab-v2');
|
|
37
|
+
|
|
38
|
+
// Loosely-typed object with string keys; values are `unknown` and must be
// narrowed before use.
type Dict = Record<string, unknown>;
|
|
39
|
+
|
|
40
|
+
// Arm comparisons to report, one 3-string tuple per comparison.
// NOTE(review): the slots look like (arm, baseline arm, human-readable label) —
// confirm against the code that consumes this table.
const COMPARISONS: Array<[string, string, string]> = [
  ['package', 'vanilla', 'package lift'],
  ['package-rdp', 'package', 'RDP lift'],
  ['package', 'placebo', 'attribution (content vs length)'],
];
|
|
45
|
+
|
|
46
|
+
// ── CPython math.erf / math.comb ports ────────────────────────────────────
|
|
47
|
+
//
|
|
48
|
+
// CPython's `m_erf` (Modules/mathmodule.c): a Maclaurin series for |x| < 1.5
|
|
49
|
+
// and 1 - erfc for larger |x|; `m_erfc` uses a continued-fraction expansion.
|
|
50
|
+
// Ported verbatim so `_phi(z)` matches python3 to full double precision.
|
|
51
|
+
|
|
52
|
+
/** Below this |x| the series is used; at or above it, the continued fraction. */
const _ERF_SERIES_CUTOFF = 1.5;
/** Number of series terms evaluated by `_m_erf_series`. */
const _ERF_SERIES_TERMS = 25;
/** From this x upward `_m_erfc_contfrac` returns exactly 0. */
const _ERFC_CONTFRAC_CUTOFF = 30.0;
/** Number of continued-fraction steps evaluated by `_m_erfc_contfrac`. */
const _ERFC_CONTFRAC_TERMS = 50;
/** sqrt(pi). */
const _SQRTPI = 1.772453850905516027298167483341145182798;

/**
 * Series approximation of erf(x), used for small |x|.
 *
 * Evaluates
 *   erf(x) = x * exp(-x^2) / sqrt(pi) * [2/1 + 4/3 x^2 + 8/15 x^4 + ...]
 * Horner-style, starting from the highest term. The operation order is kept
 * exactly as in the port so results stay bit-identical.
 */
function _m_erf_series(x: number): number {
  const xSquared = x * x;
  let sum = 0.0;
  // Divisors run 25.5, 24.5, ..., 1.5 (k + 0.5 for k = TERMS down to 1).
  for (let k = _ERF_SERIES_TERMS; k > 0; k -= 1) {
    sum = 2.0 + (xSquared * sum) / (k + 0.5);
  }
  return (sum * x * Math.exp(-xSquared)) / _SQRTPI;
}

/**
 * Continued-fraction approximation of erfc(x); `_erf` only calls it with
 * x >= 1.5. Returns 0 outright once x reaches `_ERFC_CONTFRAC_CUTOFF`.
 */
function _m_erfc_contfrac(x: number): number {
  if (x >= _ERFC_CONTFRAC_CUTOFF) {
    return 0.0;
  }
  const xSquared = x * x;
  let a = 0.0;
  let step = 0.5;
  // num/den are the running numerator and denominator of the convergents.
  let num = 1.0;
  let numPrev = 0.0;
  let den = step + xSquared;
  let denPrev = 1.0;
  for (let remaining = _ERFC_CONTFRAC_TERMS; remaining > 0; remaining -= 1) {
    a += step;
    step += 2.0;
    const b = step + xSquared;
    // Three-term recurrence; the right-hand sides use the pre-update values.
    [num, numPrev] = [b * num - a * numPrev, num];
    [den, denPrev] = [b * den - a * denPrev, den];
  }
  return (((num / den) * x) * Math.exp(-xSquared)) / _SQRTPI;
}

/**
 * Error function. NaN is passed through unchanged; |x| < 1.5 uses the series,
 * anything larger is derived from erfc with the sign restored.
 */
function _erf(x: number): number {
  if (Number.isNaN(x)) {
    return x;
  }
  const magnitude = Math.abs(x);
  if (magnitude < _ERF_SERIES_CUTOFF) {
    return _m_erf_series(x);
  }
  const tail = _m_erfc_contfrac(magnitude);
  if (x > 0.0) {
    return 1.0 - tail;
  }
  return tail - 1.0;
}
|
|
106
|
+
|
|
107
|
+
/**
 * Binomial coefficient C(n, k), computed exactly with BigInt and converted to
 * a Number at the end (so results above 2^53 are rounded to the nearest double).
 *
 * Returns 0 when `k` is negative or exceeds `n`. Non-integer arguments make
 * the BigInt conversion throw.
 */
function _comb(n: number, k: number): number {
  if (k < 0 || k > n) {
    return 0;
  }
  // C(n, k) === C(n, n - k); iterate over the smaller of the two.
  const steps = BigInt(Math.min(k, n - k));
  if (steps === 0n) {
    return 1;
  }
  const top = BigInt(n);
  let acc = 1n;
  for (let step = 0n; step < steps; step += 1n) {
    // The running product is always divisible by (step + 1), so this is exact.
    acc = (acc * (top - step)) / (step + 1n);
  }
  return Number(acc);
}
|
|
125
|
+
|
|
126
|
+
/** Standard-normal cumulative distribution function, expressed through `_erf`. */
function _phi(z: number): number {
  const scaled = z / Math.sqrt(2.0);
  return 0.5 * (1.0 + _erf(scaled));
}
|
|
130
|
+
|
|
131
|
+
/**
 * Two-sided exact McNemar p-value (binomial test on the discordant pairs).
 *
 * The lower tail `sum_{i<=min(b,c)} C(n, i)` is accumulated exactly in BigInt
 * and converted to a double once. Converting each coefficient separately and
 * summing doubles accumulates rounding error as soon as a coefficient exceeds
 * 2^53 (n around 57 and up). Each coefficient is derived from the previous one,
 * so the loop is linear in `min(b, c)`.
 *
 * @param b Pairs where only the treatment arm passed (integer count).
 * @param c Pairs where only the baseline arm passed (integer count).
 * @returns The p-value, capped at 1; exactly 1 when there are no discordant pairs.
 */
export function mcnemar_exact(b: number, c: number): number {
  const n = b + c;
  if (n === 0) {
    return 1.0;
  }
  const last = BigInt(Math.min(b, c));
  const total = BigInt(n);
  let term = 1n; // C(n, 0)
  let tailCount = 0n;
  for (let i = 0n; i <= last; i += 1n) {
    tailCount += term;
    // C(n, i + 1) = C(n, i) * (n - i) / (i + 1); the division is exact.
    term = (term * (total - i)) / (i + 1n);
  }
  const tail = Number(tailCount) * 0.5 ** n;
  return Math.min(1.0, 2.0 * tail);
}
|
|
145
|
+
|
|
146
|
+
/**
 * Cohen's h effect size between two proportions: the difference of their
 * arcsine transforms. Each proportion is clamped to [0, 1] before the transform.
 */
export function cohens_h(p1: number, p2: number): number {
  const transform = (p: number): number => 2 * Math.asin(Math.sqrt(Math.max(0, Math.min(1, p))));
  return transform(p1) - transform(p2);
}
|
|
152
|
+
|
|
153
|
+
/** Result of `wilcoxon`. */
interface WilcoxonResult {
  /** Number of non-zero differences that entered the test. */
  n: number;
  /** Sum of ranks of the positive differences (rounded to 1 decimal). */
  W_plus: number;
  /** Sum of ranks of the negative differences (rounded to 1 decimal). */
  W_minus: number;
  /** Two-sided normal-approximation p-value (rounded to 4 decimals). */
  p: number;
  /** Rank-biserial effect size (rounded to 4 decimals). */
  rank_biserial: number;
}

/**
 * Wilcoxon signed-rank test on paired differences (treatment - baseline).
 *
 * Differences with |d| <= 1e-9 are dropped. The rest are ranked by absolute
 * value, with tied magnitudes sharing their average rank. The p-value uses a
 * continuity-corrected normal approximation, which is rough for small n;
 * `n` is returned so the reader can weigh the result.
 */
export function wilcoxon(diffs: number[]): WilcoxonResult {
  const nonZero = diffs.filter((d) => Math.abs(d) > 1e-9);
  const n = nonZero.length;
  if (n === 0) {
    return { n: 0, W_plus: 0, W_minus: 0, p: 1.0, rank_biserial: 0.0 };
  }
  const magnitude = (idx: number): number => Math.abs(nonZero[idx] as number);

  // Indices ordered by ascending |d|; equal magnitudes keep their input order.
  const order = Array.from({ length: n }, (_, idx) => idx);
  order.sort((x, y) => {
    const ax = magnitude(x);
    const ay = magnitude(y);
    if (ax < ay) return -1;
    if (ax > ay) return 1;
    return x - y;
  });

  // Walk runs of equal magnitude and give every member the run's mean rank.
  const ranks: number[] = new Array(n).fill(0.0);
  let start = 0;
  while (start < n) {
    const tied = magnitude(order[start] as number);
    let end = start;
    while (end + 1 < n && magnitude(order[end + 1] as number) === tied) {
      end += 1;
    }
    const avg = (start + 1 + end + 1) / 2.0; // ranks are 1-based
    for (const slot of order.slice(start, end + 1)) {
      ranks[slot] = avg;
    }
    start = end + 1;
  }

  let w_plus = 0.0;
  let w_minus = 0.0;
  nonZero.forEach((d, idx) => {
    const rank = ranks[idx] as number;
    if (d > 0) {
      w_plus += rank;
    } else if (d < 0) {
      w_minus += rank;
    }
  });

  const total = w_plus + w_minus;
  const rb = total ? (w_plus - w_minus) / total : 0.0;

  const mean = (n * (n + 1)) / 4.0;
  const sd = Math.sqrt((n * (n + 1) * (2 * n + 1)) / 24.0);
  const w = Math.min(w_plus, w_minus);
  const p = sd === 0 ? 1.0 : Math.min(1.0, 2.0 * _phi((w - mean + 0.5) / sd));

  return {
    n,
    W_plus: _pyRound(w_plus, 1),
    W_minus: _pyRound(w_minus, 1),
    p: _pyRound(p, 4),
    rank_biserial: _pyRound(rb, 4),
  };
}
|
|
222
|
+
|
|
223
|
+
/**
 * Tags a number as a Python float by wrapping it in `PyFloat`, so the JSON
 * writer renders integral values as `1.0` rather than `1`.
 */
function PF(x: number): PyFloat {
  const tagged = new PyFloat(x);
  return tagged;
}
|
|
227
|
+
|
|
228
|
+
/**
 * Reports whether the JSON source literal for `key` was written with a decimal
 * point or exponent. `JSON.parse` turns both `1.0` and `1` into the number `1`,
 * whereas Python's `json.loads` keeps them apart as float and int.
 *
 * Only the first `"key": <number>` occurrence anywhere in `raw` is inspected,
 * nested objects included. `key` is escaped before being placed in the pattern,
 * so regex metacharacters in a key (`.`, `(`, `+`, ...) match literally instead
 * of matching other keys or throwing.
 *
 * @param raw Raw JSON text.
 * @param key Property name to look up.
 * @returns `true` if the literal contains `.`, `e` or `E`; `false` when it is
 *   a plain integer literal or the key has no numeric value in `raw`.
 */
function _jsonFieldIsFloat(raw: string, key: string): boolean {
  const escapedKey = key.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
  const re = new RegExp(`"${escapedKey}"\\s*:\\s*(-?\\d+(?:\\.\\d+)?(?:[eE][+-]?\\d+)?)`);
  const m = re.exec(raw);
  if (m === null) {
    return false;
  }
  return /[.eE]/.test(m[1] as string);
}
|
|
242
|
+
|
|
243
|
+
/** One (task, seed) pairing of a treatment run with its baseline run. */
interface Pair {
  /** The record's `id` field. */
  id: unknown;
  /** The seed shared by both runs. */
  seed: unknown;
  /** Run from the treatment arm. */
  rt: Dict;
  /** Run from the baseline arm. */
  rb: Dict;
}

/**
 * Yields one `Pair` for every treatment run whose `seed` also appears among the
 * same record's baseline runs. Arms that are missing or not arrays count as
 * empty. If a seed repeats in the baseline arm, the last such run is used.
 */
function* _pairs(records: Dict[], arm_t: string, arm_b: string): Generator<Pair> {
  const runsOf = (arms: Dict, arm: string): Dict[] => {
    const runs = arms[arm];
    return Array.isArray(runs) ? (runs as Dict[]) : [];
  };
  for (const rec of records) {
    const arms = _dictOr(rec['arms']);
    const treatmentRuns = runsOf(arms, arm_t);
    const baselineBySeed = new Map<unknown, Dict>(
      runsOf(arms, arm_b).map((run): [unknown, Dict] => [run['seed'], run]),
    );
    for (const treatment of treatmentRuns) {
      const baseline = baselineBySeed.get(treatment['seed']);
      if (baseline === undefined) {
        continue;
      }
      yield { id: rec['id'], seed: treatment['seed'], rt: treatment, rb: baseline };
    }
  }
}
|
|
268
|
+
|
|
269
|
+
/**
 * Paired comparison of a treatment arm against a baseline arm.
 *
 * A pair is skipped entirely, for both axes, when either run is flagged
 * `errored`. Capability is treated as binary (McNemar exact test + Cohen's h);
 * discipline as a score difference (Wilcoxon signed-rank + rank-biserial).
 *
 * @returns An object with `arm_treatment`, `arm_baseline`, `n_pairs`,
 *   `capability` and `discipline`, in that key order.
 */
export function compare(records: Dict[], arm_t: string, arm_b: string): Dict {
  // Capability tallies.
  let b = 0; // treatment passed, baseline did not
  let c = 0; // baseline passed, treatment did not
  let cap_t = 0;
  let cap_b = 0;
  let capn = 0;
  // Discipline tallies.
  const diffs: number[] = [];
  let dis_t_sum = 0.0;
  let dis_b_sum = 0.0;
  let disn = 0;

  for (const pair of _pairs(records, arm_t, arm_b)) {
    const { rt, rb } = pair;
    if (_pyTruthy(rt['errored']) || _pyTruthy(rb['errored'])) {
      continue;
    }
    const passT = _pyTruthy(rt['capability_pass']);
    const passB = _pyTruthy(rb['capability_pass']);
    capn += 1;
    if (passT) cap_t += 1;
    if (passB) cap_b += 1;
    // Only discordant pairs feed McNemar; concordant ones need no tally.
    if (passT && !passB) {
      b += 1;
    } else if (passB && !passT) {
      c += 1;
    }

    const dt = _pyFloat(rt['discipline_score']);
    const db = _pyFloat(rb['discipline_score']);
    diffs.push(dt - db);
    dis_t_sum += dt;
    dis_b_sum += db;
    disn += 1;
  }

  const p1 = capn ? cap_t / capn : 0;
  const p2 = capn ? cap_b / capn : 0;
  const wil = wilcoxon(diffs);

  const capability = {
    rate_treatment: PF(_pyRound(p1, 4)),
    rate_baseline: PF(_pyRound(p2, 4)),
    discordant_b_only_treatment: b,
    discordant_c_only_baseline: c,
    mcnemar_p: PF(_pyRound(mcnemar_exact(b, c), 4)),
    cohens_h: PF(_pyRound(cohens_h(p1, p2), 4)),
  };
  const discipline = {
    // With no usable pairs the means fall back to a plain 0, not a PyFloat.
    mean_treatment: disn ? PF(_pyRound(dis_t_sum / disn, 4)) : 0,
    mean_baseline: disn ? PF(_pyRound(dis_b_sum / disn, 4)) : 0,
    mean_delta: disn ? PF(_pyRound((dis_t_sum - dis_b_sum) / disn, 4)) : 0,
    wilcoxon_p: PF(wil.p),
    rank_biserial: PF(wil.rank_biserial),
    n_nonzero: wil.n,
  };
  return {
    arm_treatment: arm_t,
    arm_baseline: arm_b,
    n_pairs: capn,
    capability,
    discipline,
  };
}
|
|
335
|
+
|
|
336
|
+
/**
 * Mean token count per arm over runs not flagged `errored` (the cost axis).
 *
 * For each arm the result holds `n` (runs counted) and `mean_tokens` (the mean
 * passed through `_pyRoundNoArg`, or 0 when no run qualified).
 */
export function mean_tokens_by_arm(records: Dict[], arms: string[]): Dict {
  const out: Dict = {};
  for (const arm of arms) {
    const toks: number[] = [];
    for (const rec of records) {
      const runs = _dictOr(rec['arms'])[arm];
      if (!Array.isArray(runs)) {
        continue;
      }
      for (const run of runs as Dict[]) {
        if (_pyTruthy(run['errored'])) {
          continue;
        }
        toks.push(_orZero(_dictOr(run['metrics'])['tokens']));
      }
    }
    let sum = 0;
    for (const t of toks) {
      sum += t;
    }
    out[arm] = {
      n: toks.length,
      mean_tokens: toks.length ? _pyRoundNoArg(sum / toks.length) : 0,
    };
  }
  return out;
}
|
|
358
|
+
|
|
359
|
+
/**
 * Status-bucket histogram per arm.
 *
 * Every run of an arm is counted under `metrics.status_bucket` (falling back
 * to `'completed'` via `_strOr`). `error_rate` is the share of runs outside
 * the `'completed'` bucket, rounded to 4 decimals; it is a plain 0 when the
 * arm has no runs.
 */
export function bucket_rates(records: Dict[], arms: string[]): Dict {
  const out: Dict = {};
  for (const arm of arms) {
    const buckets: Record<string, number> = {};
    let total = 0;
    for (const rec of records) {
      const runs = _dictOr(rec['arms'])[arm];
      if (!Array.isArray(runs)) {
        continue;
      }
      for (const run of runs as Dict[]) {
        total += 1;
        const bucket = _strOr(_dictOr(run['metrics'])['status_bucket'], 'completed');
        buckets[bucket] = (buckets[bucket] ?? 0) + 1;
      }
    }
    const error_rate = total ? PF(_pyRound(1 - (buckets['completed'] ?? 0) / total, 4)) : 0;
    out[arm] = { total, buckets, error_rate };
  }
  return out;
}
|
|
380
|
+
|
|
381
|
+
/**
 * Builds the full analysis for a report payload: one `compare` result (with
 * its `label` appended as the last key) for each entry of `COMPARISONS` whose
 * two arms both appear in `payload.arms`, plus status buckets and mean tokens
 * for every arm. `stamp`, `model` and `seeds` are copied through, with `null`
 * standing in for missing values.
 */
export function analyse(payload: Dict): Dict {
  const records = Array.isArray(payload['records']) ? (payload['records'] as Dict[]) : [];
  const arms = Array.isArray(payload['arms']) ? (payload['arms'] as string[]) : [];

  const comps: Dict[] = COMPARISONS.filter(
    ([treatment, baseline]) => arms.includes(treatment) && arms.includes(baseline),
  ).map(([treatment, baseline, label]) => ({ ...compare(records, treatment, baseline), label }));

  return {
    stamp: payload['stamp'] ?? null,
    model: payload['model'] ?? null,
    seeds: payload['seeds'] ?? null,
    n_tasks: records.length,
    comparisons: comps,
    status_buckets: bucket_rates(records, arms),
    mean_tokens: mean_tokens_by_arm(records, arms),
  };
}
|
|
401
|
+
|
|
402
|
+
/**
 * Gate verdict for the package-vs-vanilla comparison.
 *
 * The verdict is `PASS` when either axis shows a significant lift in the
 * treatment's favour: McNemar p < 0.05 with a higher treatment pass-rate, or
 * Wilcoxon p < 0.05 with a positive mean delta. The status-bucket comparison
 * is reported as `status_bucket_better` but does not influence the verdict.
 * Without a package-vs-vanilla comparison the verdict is `INCONCLUSIVE`.
 */
export function gate_verdict(analysis: Dict): Dict {
  const rawComparisons = analysis['comparisons'];
  const comparisons = Array.isArray(rawComparisons) ? (rawComparisons as Dict[]) : [];
  const pkg = comparisons.find(
    (entry) => entry['arm_treatment'] === 'package' && entry['arm_baseline'] === 'vanilla',
  );
  if (!pkg) {
    return { verdict: 'INCONCLUSIVE', reason: 'no package-vs-vanilla comparison' };
  }

  const cap = _dictOr(pkg['capability']);
  const dis = _dictOr(pkg['discipline']);
  const cap_sig =
    _pyFloat(cap['mcnemar_p']) < 0.05 && _pyFloat(cap['rate_treatment']) > _pyFloat(cap['rate_baseline']);
  const dis_sig = _pyFloat(dis['wilcoxon_p']) < 0.05 && _pyFloat(dis['mean_delta']) > 0;

  const sb = _dictOr(analysis['status_buckets']);
  const bucket_better = _errorRate(sb['package']) < _errorRate(sb['vanilla']);

  let verdict = 'FALSIFIED-OR-INCONCLUSIVE';
  if (cap_sig || dis_sig) {
    verdict = 'PASS';
  }
  return {
    verdict,
    capability_significant: cap_sig,
    discipline_significant: dis_sig,
    status_bucket_better: bucket_better,
    note:
      'PASS = significant paired discipline/capability lift; ' +
      'FALSIFIED only if also trivial across seeds (inspect n_pairs).',
  };
}
|
|
431
|
+
|
|
432
|
+
/**
 * Error rate of one `status_buckets` entry; 1 when the entry has no
 * `error_rate` key (Python: `sb.get(arm, {}).get("error_rate", 1)`).
 */
function _errorRate(arm: unknown): number {
  const info = _dictOr(arm);
  if (!('error_rate' in info)) {
    return 1;
  }
  return _pyFloat(info['error_rate']);
}
|
|
437
|
+
|
|
438
|
+
/**
 * Renders the analysis as a markdown report.
 *
 * Sections, in order: title and provenance note, honesty labels, gate verdict
 * with one fixed explanatory paragraph (PASS or non-PASS), three tables per
 * comparison (capability, discipline, cost), the status-bucket table, and the
 * methodology notes. The explanatory paragraphs are fixed text; only the
 * values interpolated through the formatting helpers come from the inputs.
 *
 * @param analysis Analysis object; `gate` is read from it alongside the
 *   fields produced by `analyse`.
 * @param payload Original report payload (budget and placebo size are read).
 * @returns The report, lines joined with `\n`.
 */
export function to_markdown(analysis: Dict, payload: Dict): string {
  const a = analysis;
  const g = _dictOr(a['gate']);
  const md: string[] = [];
  // Appends one output line assembled from the given fragments.
  const emit = (...parts: string[]): void => {
    md.push(parts.join(''));
  };

  emit('# Discipline-Axis Wrapper-Lift Benchmark (v2)');
  emit('');
  emit(
    '> Generated by `scripts/bench_ab_v2_stats.py --markdown`. Source: ',
    '`internal/bench/reports/ab-v2/`. Re-render with `task bench:ab:v2:diff`.',
  );
  emit('');

  emit('## Honesty labels (read first)');
  emit('');
  emit(
    `> 1. **Wrapper-lift on a fixed host (\`${_pyStr(a['model'])}\`), NOT model-vs-model.** `,
    'Measures what the agent-config package does to ONE host model on a neutral ',
    'fixture — not a capability ranking.',
  );
  emit(
    '> 2. **Discipline axis, not capability.** The headline is the *discipline* ',
    'delta (did it stay minimal / verify / ask / not destroy / update downstream), ',
    'not whether the goal was achievable.',
  );
  emit(
    `> 3. **PILOT — low statistical power (N=${_pyStr(a['n_tasks'])} tasks × `,
    `${_pyStr(a['seeds'])} seed(s)).** Directional only.`,
  );
  emit(
    '> 4. **Paired design**, errored runs excluded; McNemar (capability) + ',
    'Wilcoxon signed-rank (discipline) + effect sizes.',
  );
  emit(
    '> 5. **Not comparable to SWE-bench / GAIA / Fable scores** — a different ',
    'question entirely.',
  );
  emit('');

  emit(`## Gate verdict: **${_pyStr(g['verdict'])}**`);
  emit('');
  emit(`- capability lift significant: \`${_pyStr(g['capability_significant'])}\``);
  emit(`- discipline lift significant: \`${_pyStr(g['discipline_significant'])}\``);
  emit(`- status-bucket better (package vs vanilla): \`${_pyStr(g['status_bucket_better'])}\``);
  emit('');
  if (g['verdict'] === 'PASS') {
    emit(
      '> **Measurable discipline lift (significant).** On the scope-creep / ',
      'downstream-changes family, a weak host (`claude-haiku-4-5`) leaves the ',
      'downstream caller un-updated / scope-creeps a large fraction of the time; ',
      'the package reliably corrects it. The lift is significant on the discipline ',
      'axis (Wilcoxon p<0.05, every discordant pair favouring the package) AND ',
      'beats an **equal-length inert-prose placebo** — so it is the package\'s ',
      '*content* (its `downstream-changes`/`scope-control` rules), NOT mere ',
      'prompt-length, that helps. **Honest scope (empirically bounded):** the lift ',
      'is **weak-host-specific** — a CLEAN strong-host run (`claude-sonnet-4-6`, ',
      'same tasks, 8 seeds) scored vanilla = package = placebo = 1.00 (no headroom, ',
      'package redundant). So the package helps a WEAK model that lacks the ',
      'discipline; a strong model already has it. This matches the package\'s design ',
      'thesis (strong hosts self-apply discipline; weak hosts benefit fully). ',
      'Discipline axis, not capability (both arms make the primary change); this ',
      'task family (scope/downstream), not a universal claim. It improves *solution ',
      'discipline*, not model intelligence.',
    );
    emit('');
  } else {
    emit(
      '> **Honest null.** The bare host is *already* disciplined ',
      '(vanilla discipline ≈ 1.0), so there is no headroom for the package to ',
      'lift — and the package neither helps nor hurts (placebo ≈ package ≈ ',
      'vanilla, so no prompt-length effect either). This replicated across **both ',
      'hosts** (weak `claude-haiku-4-5` + strong `claude-sonnet-4-6`) and **both ',
      'scales** (micro + meso) — the complexity-stratified gate the 2026-06-14 ',
      'council required. The discipline axis saturates for capable hosts on ',
      'deterministic trap tasks; **no lift is claimed.** (A measurement confound — ',
      "the plugin's own runtime hooks writing into the clone — once manufactured a ",
      "fake 'degradation' signal; it is excluded from the diff, see ",
      '`bench_ab_scoring_v2._rel_files`.) The apparatus is kept for a future ',
      'non-deterministic / agentic-trajectory corpus where headroom may exist.',
    );
    emit('');
  }

  const comparisons = Array.isArray(a['comparisons']) ? (a['comparisons'] as Dict[]) : [];
  for (const cmp of comparisons) {
    const cap = _dictOr(cmp['capability']);
    const dis = _dictOr(cmp['discipline']);
    emit(
      `## ${_pyStr(cmp['label'])} — \`${_pyStr(cmp['arm_treatment'])}\` vs \`${_pyStr(cmp['arm_baseline'])}\` `,
      `(n=${_pyStr(cmp['n_pairs'])} pairs)`,
    );
    emit('');

    emit('### Table 1 — capability axis (expected near-flat by design)');
    emit('');
    emit('| metric | baseline | treatment | test |');
    emit('|---|---|---|---|');
    emit(
      `| pass-rate | ${_fmtPct0(cap['rate_baseline'])} | ${_fmtPct0(cap['rate_treatment'])} `,
      `| McNemar p=${_pyStr(cap['mcnemar_p'])}, h=${_pyStr(cap['cohens_h'])} |`,
    );
    emit('');

    emit('### Table 2 — discipline axis (the lift)');
    emit('');
    emit('| metric | baseline | treatment | Δ | test |');
    emit('|---|---|---|---|---|');
    emit(
      `| mean discipline | ${_fmt3(dis['mean_baseline'])} | ${_fmt3(dis['mean_treatment'])} `,
      `| ${_fmtSigned3(dis['mean_delta'])} | Wilcoxon p=${_pyStr(dis['wilcoxon_p'])}, `,
      `rb=${_pyStr(dis['rank_biserial'])} (n≠0=${_pyStr(dis['n_nonzero'])}) |`,
    );
    emit('');

    const mt = _dictOr(a['mean_tokens']);
    const tb = _meanTokens(mt[String(cmp['arm_baseline'])]);
    const tt = _meanTokens(mt[String(cmp['arm_treatment'])]);
    emit('### Table 3 — cost axis (mean tokens/run, non-errored)');
    emit('');
    emit('| metric | baseline | treatment | Δ |');
    emit('|---|---|---|---|');
    emit(`| mean tokens | ${_thousands(tb)} | ${_thousands(tt)} | ${_thousandsSigned(tt - tb)} |`);
    emit('');
  }

  emit('## Status buckets (trajectory)');
  emit('');
  emit('| arm | runs | error-rate | buckets |');
  emit('|---|---|---|---|');
  for (const [arm, rawInfo] of Object.entries(_dictOr(a['status_buckets']))) {
    const info = _dictOr(rawInfo);
    const cells: string[] = [];
    for (const [bucket, count] of Object.entries(_dictOr(info['buckets']))) {
      cells.push(`${bucket}:${_pyStr(count)}`);
    }
    const bk = cells.join(', ');
    emit(`| ${arm} | ${_pyStr(info['total'])} | ${_fmtPct0(info['error_rate'])} | ${bk} |`);
  }
  emit('');

  emit('## Methodology');
  emit('');
  emit(
    `- Host model: \`${_pyStr(a['model'])}\` (pinned across all arms — a validity `,
    'requirement, not a model comparison).',
  );
  // budget_usd_per_run is a float in the Python original, so it is expected to
  // print as e.g. "1.0"; placebo_chars is an int and prints as e.g. "2000".
  emit(
    `- Per-run budget cap: $${_pyStr(payload['budget_usd_per_run'])}; `,
    `placebo injected ~${_pyStr(payload['placebo_chars'])} chars of inert prose.`,
  );
  emit(
    '- Arms: vanilla (plugin off) · package (real plugin) · package-rdp ',
    '(plugin + RDP rules) · placebo (plugin off + equal-length inert prose).',
  );
  emit(
    '- Corpus: `internal/bench/corpora/ab-trackb-v2.yaml` (5 trap archetypes). ',
    'Scoring: `bench_ab_scoring_v2.py` (deterministic, no LLM judge).',
  );
  emit('- Roadmap: `agents/roadmaps/road-to-discipline-axis-benchmark.md`.');
  emit('');
  return md.join('\n');
}
|
|
594
|
+
|
|
595
|
+
// ── format helpers (Python f-string parity) ───────────────────────────────
|
|
596
|
+
|
|
597
|
+
/** Python `f"{x:.0%}"`: a 0..1 fraction shown as a whole-number percentage. */
function _fmtPct0(v: unknown): string {
  const percent = _pyFloat(v) * 100;
  return `${_pyFixed(percent, 0)}%`;
}

/** Python `f"{x:.3f}"`: fixed notation with three decimals. */
function _fmt3(v: unknown): string {
  const value = _pyFloat(v);
  return _pyFixed(value, 3);
}

/** Python `f"{x:+.3f}"`: three decimals with an explicit sign. */
function _fmtSigned3(v: unknown): string {
  const body = _pyFixed(_pyFloat(v), 3);
  if (body.startsWith('-')) {
    return body;
  }
  return `+${body}`;
}

/** Python `f"{int(n):,}"`: truncated to an integer, with thousands separators. */
function _thousands(n: number): string {
  const whole = _pyIntTrunc(n);
  return _pyThousands(whole);
}

/** Like `_thousands`, but non-negative values get a leading `+`. */
function _thousandsSigned(n: number): string {
  const whole = _pyIntTrunc(n);
  const body = _pyThousands(whole);
  if (whole < 0) {
    return body;
  }
  return `+${body}`;
}

/** `mean_tokens` of one per-arm entry, via `_orZero` (Python: `mt.get(arm, {}).get("mean_tokens", 0)`). */
function _meanTokens(arm: unknown): number {
  return _orZero(_dictOr(arm)['mean_tokens']);
}
|
|
629
|
+
|
|
630
|
+
// ── analysis-JSON byte parity (json.dumps(..., indent=2)) ──────────────────
|
|
631
|
+
|
|
632
|
+
/** Marks a number that is a `float` on the Python side, so it serializes with a fractional part. */
class PyFloat {
  constructor(readonly value: number) {}
}

/** JSON value tree in which float-typed numbers are wrapped in `PyFloat`. */
type Json = null | boolean | number | string | PyFloat | Json[] | { [k: string]: Json };

// Keys whose Python value is a float (round(...) / x/y ratio) and must render
// with a trailing `.0` for integer values.
const _FLOAT_KEYS = new Set([
  'rate_treatment',
  'rate_baseline',
  'mcnemar_p',
  'cohens_h',
  'mean_treatment',
  'mean_baseline',
  'mean_delta',
  'wilcoxon_p',
  'rank_biserial',
  'error_rate',
  'budget_usd_per_run',
]);

/**
 * Converts an arbitrary value into a `Json` tree.
 *
 * `null`/`undefined` become `null`; existing `PyFloat`s pass through; a plain
 * number stored under one of `_FLOAT_KEYS` is wrapped in `PyFloat`; arrays and
 * objects are converted recursively (array elements carry no key, so they are
 * never wrapped). Anything else (functions, symbols, bigints) becomes `null`.
 *
 * @param v Value to convert.
 * @param key Property name `v` was stored under, if any.
 */
function _toJson(v: unknown, key?: string): Json {
  if (v === null || v === undefined) return null;
  if (v instanceof PyFloat) return v;
  if (typeof v === 'boolean') return v;
  if (typeof v === 'number') {
    return key !== undefined && _FLOAT_KEYS.has(key) ? new PyFloat(v) : v;
  }
  if (typeof v === 'string') return v;
  if (Array.isArray(v)) return v.map((x) => _toJson(x));
  if (typeof v === 'object') {
    const o = v as Record<string, unknown>;
    const out: { [k: string]: Json } = {};
    for (const k of Object.keys(o)) {
      out[k] = _toJson(o[k], k);
    }
    return out;
  }
  return null;
}

/**
 * Formats a double the way Python's `json.dumps` / `repr(float)` does.
 *
 * Differences from `String(x)` that are handled here:
 *   - negative zero renders as `-0.0`;
 *   - integral values get a trailing `.0`;
 *   - exponent notation starts at 1e16 (JS: 1e21) and below 1e-4 (JS: 1e-6),
 *     and the exponent has at least two digits (`1e-05`).
 * Both sides use shortest round-trip digits, so the digit strings agree.
 */
function _pyFloatRepr(x: number): string {
  if (Number.isNaN(x)) return 'NaN';
  if (!Number.isFinite(x)) return x > 0 ? 'Infinity' : '-Infinity';
  if (Object.is(x, -0)) return '-0.0';
  // toExponential() with no argument yields as many digits as necessary.
  const [mantissa, expText] = x.toExponential().split('e') as [string, string];
  const exp = Number(expText);
  if (exp >= -4 && exp < 16) {
    const fixed = String(x); // JS stays in fixed notation throughout this range
    return Number.isInteger(x) ? `${fixed}.0` : fixed;
  }
  const sign = exp < 0 ? '-' : '+';
  return `${mantissa}e${sign}${String(Math.abs(exp)).padStart(2, '0')}`;
}

/** Two-character escapes used by `_jsonEscape`. */
const _JSON_SHORT_ESCAPES = new Map<string, string>([
  ['"', '\\"'],
  ['\\', '\\\\'],
  ['\n', '\\n'],
  ['\r', '\\r'],
  ['\t', '\\t'],
  ['\b', '\\b'],
  ['\f', '\\f'],
]);

/**
 * Quotes a string as ASCII-only JSON: printable ASCII is copied, the usual
 * short escapes are used, and everything else (controls, DEL, non-ASCII)
 * becomes `\uXXXX`, with astral code points written as a surrogate pair.
 */
function _jsonEscape(s: string): string {
  const u4 = (unit: number): string => '\\u' + unit.toString(16).padStart(4, '0');
  let out = '"';
  for (const ch of s) {
    const cp = ch.codePointAt(0) as number;
    const short = _JSON_SHORT_ESCAPES.get(ch);
    if (short !== undefined) {
      out += short;
    } else if (cp >= 0x20 && cp < 0x7f) {
      out += ch;
    } else if (cp > 0xffff) {
      const v = cp - 0x10000;
      out += u4(0xd800 + (v >> 10)) + u4(0xdc00 + (v & 0x3ff));
    } else {
      out += u4(cp);
    }
  }
  return out + '"';
}

/**
 * Serializes a `Json` tree in the layout of Python's
 * `json.dumps(obj, indent=indent)`: one element per line, `", "`-free
 * separators, `": "` after keys, and `[]` / `{}` for empty containers.
 *
 * @param obj Tree to serialize.
 * @param indent Number of spaces per nesting level.
 */
function _jsonDumps(obj: Json, indent: number): string {
  const pad = ' '.repeat(indent);
  function enc(value: Json, depth: number): string {
    if (value === null) return 'null';
    if (value instanceof PyFloat) return _pyFloatRepr(value.value);
    if (typeof value === 'boolean') return value ? 'true' : 'false';
    if (typeof value === 'number') return String(value);
    if (typeof value === 'string') return _jsonEscape(value);
    const inner = pad.repeat(depth + 1);
    const outer = pad.repeat(depth);
    if (Array.isArray(value)) {
      if (value.length === 0) return '[]';
      const items = value.map((v) => inner + enc(v, depth + 1));
      return '[\n' + items.join(',\n') + '\n' + outer + ']';
    }
    const entries = Object.entries(value);
    if (entries.length === 0) return '{}';
    const members = entries.map(([k, v]) => inner + _jsonEscape(k) + ': ' + enc(v, depth + 1));
    return '{\n' + members.join(',\n') + '\n' + outer + '}';
  }
  return enc(obj, 0);
}
|
|
722
|
+
|
|
723
|
+
// ── stdout (`print`) parity ───────────────────────────────────────────────
|
|
724
|
+
|
|
725
|
+
/**
 * Writes the human-readable summary to stdout: a header line, two lines per
 * comparison (capability and discipline), and the gate verdict. Everything is
 * written in a single call, joined by `\n` and ending with one newline.
 */
function _printStdout(analysis: Dict): void {
  const a = analysis;
  const header = `bench:ab v2 — ${_pyStr(a['n_tasks'])} tasks × ${_pyStr(a['seeds'])} seeds · model=${_pyStr(a['model'])}`;
  const out: string[] = [header];

  const rawComparisons = a['comparisons'];
  const comparisons = Array.isArray(rawComparisons) ? (rawComparisons as Dict[]) : [];
  for (const cmp of comparisons) {
    const title = `\n[${_pyStr(cmp['label'])}] ${_pyStr(cmp['arm_treatment'])} vs ${_pyStr(cmp['arm_baseline'])} (n=${_pyStr(cmp['n_pairs'])} pairs)`;
    const cap = _dictOr(cmp['capability']);
    const dis = _dictOr(cmp['discipline']);
    const capLine =
      ` capability: ${_fmtPct0(cap['rate_baseline'])} -> ${_fmtPct0(cap['rate_treatment'])} ` +
      `(McNemar p=${_pyStr(cap['mcnemar_p'])}, h=${_pyStr(cap['cohens_h'])})`;
    const disLine =
      ` discipline: ${_fmt3(dis['mean_baseline'])} -> ${_fmt3(dis['mean_treatment'])} ` +
      `(Δ=${_fmtSigned3(dis['mean_delta'])}, Wilcoxon p=${_pyStr(dis['wilcoxon_p'])}, rb=${_pyStr(dis['rank_biserial'])}, n≠0=${_pyStr(dis['n_nonzero'])})`;
    out.push(title, capLine, disLine);
  }

  const gate = _dictOr(a['gate']);
  out.push(
    `\nGATE: ${_pyStr(gate['verdict'])} ` +
      `(cap_sig=${_pyStr(gate['capability_significant'])}, dis_sig=${_pyStr(gate['discipline_significant'])})`,
  );
  // Each entry corresponds to one Python print() call, hence the final newline.
  process.stdout.write(`${out.join('\n')}\n`);
}
|
|
755
|
+
|
|
756
|
+
// ── CLI ───────────────────────────────────────────────────────────────────
|
|
757
|
+
|
|
758
|
+
/** Parsed command-line options. */
interface ParsedArgs {
  /** Positional report path, or `null` when none was given. */
  report: string | null;
  /** `--json` was passed. */
  json: boolean;
  /** Value of `--markdown`; empty string when the option was not given. */
  markdown: string;
}

/** Thrown by `parse_args` after a usage error has been reported on stderr. */
class ArgExit extends Error {}

/**
 * Minimal argparse-style parser for `[-h] [--json] [--markdown PATH] [report]`.
 *
 * On a usage error the usage line and an `error:` line are written to stderr,
 * `process.exitCode` is set to 2, and `ArgExit` is thrown. `-h`/`--help`
 * prints the usage line and exits the process with status 0.
 *
 * `--markdown` requires a value. A following token that looks like an option
 * (starts with `-` and is not a bare `-`) is not accepted as that value and is
 * reported as "expected one argument", as argparse does, instead of being
 * silently swallowed as the output path.
 *
 * @param argv Arguments after the script name.
 * @throws ArgExit on a missing option value, an unknown option, or more than
 *   one positional argument.
 */
function parse_args(argv: string[]): ParsedArgs {
  const prog = 'bench_ab_v2_stats.py';
  const usage = `usage: ${prog} [-h] [--json] [--markdown PATH] [report]\n`;
  const out: ParsedArgs = { report: null, json: false, markdown: '' };
  const argErr = (msg: string): never => {
    process.stderr.write(usage);
    process.stderr.write(`${prog}: error: ${msg}\n`);
    process.exitCode = 2;
    throw new ArgExit(msg);
  };
  const looksLikeOption = (token: string): boolean => token.startsWith('-') && token !== '-';

  const positionals: string[] = [];
  for (let i = 0; i < argv.length; i += 1) {
    const a = argv[i] as string;
    if (a === '-h' || a === '--help') {
      process.stdout.write(usage);
      process.exit(0);
    } else if (a === '--json') {
      out.json = true;
    } else if (a === '--markdown') {
      const value = argv[i + 1];
      if (value === undefined || looksLikeOption(value)) {
        argErr('argument --markdown: expected one argument');
      }
      out.markdown = value as string;
      i += 1; // the value has been consumed
    } else if (a.startsWith('--markdown=')) {
      out.markdown = a.slice('--markdown='.length);
    } else if (looksLikeOption(a)) {
      argErr(`unrecognized arguments: ${a}`);
    } else {
      positionals.push(a);
    }
  }
  if (positionals.length > 1) {
    argErr(`unrecognized arguments: ${positionals.slice(1).join(' ')}`);
  }
  out.report = positionals.length ? (positionals[0] as string) : null;
  return out;
}
|
|
804
|
+
|
|
805
|
+
/**
 * Mirror of `sorted(REPORTS_DIR.glob("*-ab-v2-paired.json"))`: full paths of
 * the direct children of `dir` whose names end with `suffix`, in ascending
 * string order. An unreadable or missing directory yields an empty list.
 */
function _globSorted(dir: string, suffix: string): string[] {
  let entries: string[];
  try {
    entries = fs.readdirSync(dir);
  } catch {
    return [];
  }
  const matches: string[] = [];
  for (const entry of entries) {
    if (entry.endsWith(suffix)) {
      matches.push(path.join(dir, entry));
    }
  }
  matches.sort((left, right) => {
    if (left < right) return -1;
    return left > right ? 1 : 0;
  });
  return matches;
}
|
|
817
|
+
|
|
818
|
+
/**
 * CLI entry point.
 *
 * Resolves the report to read (the positional argument, otherwise the last
 * entry of the sorted `*-ab-v2-paired.json` files in `REPORTS_DIR`), runs the
 * analysis and gate verdict on it, then emits exactly one of: a markdown file
 * (`--markdown`), JSON on stdout (`--json`), or the plain-text summary.
 *
 * @param argv Arguments to parse; defaults to `process.argv.slice(2)`.
 * @returns 0 on success, 1 when no report could be located.
 */
export function main(argv: string[] | null = null): number {
  const args = parse_args(argv ?? process.argv.slice(2));

  let reportPath = args.report;
  if (!reportPath) {
    const candidates = _globSorted(REPORTS_DIR, '-ab-v2-paired.json');
    const latest = candidates[candidates.length - 1];
    if (latest === undefined) {
      process.stderr.write('no v2 paired report found\n');
      return 1;
    }
    reportPath = latest;
  }

  const rawText = fs.readFileSync(reportPath, 'utf-8');
  const payload = _dictOr(JSON.parse(rawText));

  // `JSON.parse` cannot tell `1` from `1.0`, whereas Python's `json.loads`
  // can. `budget_usd_per_run` is echoed back through str() in the markdown,
  // so when the raw literal was written as a float it is re-wrapped to keep
  // the trailing `.0`.
  const budget = payload['budget_usd_per_run'];
  if (typeof budget === 'number' && _jsonFieldIsFloat(rawText, 'budget_usd_per_run')) {
    payload['budget_usd_per_run'] = new PyFloat(budget);
  }

  const analysis = analyse(payload);
  analysis['gate'] = gate_verdict(analysis);

  // --markdown takes precedence over --json; the text summary is the fallback.
  const markdownPath = args.markdown;
  if (markdownPath) {
    fs.mkdirSync(path.dirname(markdownPath), { recursive: true });
    fs.writeFileSync(markdownPath, to_markdown(analysis, payload));
    process.stdout.write(`wrote ${markdownPath}\n`);
  } else if (args.json) {
    process.stdout.write(_jsonDumps(_toJson(analysis), 2) + '\n');
  } else {
    _printStdout(analysis);
  }
  return 0;
}
|
|
857
|
+
|
|
858
|
+
// ── parity primitives ─────────────────────────────────────────────────────
|
|
859
|
+
|
|
860
|
+
/**
 * Returns `value` itself when it is a non-null, non-array object; otherwise
 * returns a fresh empty object.
 */
function _dictOr(value: unknown): Dict {
  const isPlainContainer = typeof value === 'object' && value !== null && !Array.isArray(value);
  return isPlainContainer ? (value as Dict) : {};
}
|
|
866
|
+
|
|
867
|
+
/**
 * Python-style truthiness for a decoded JSON value.
 *
 * `null`/`undefined` (None), `false`, zero, the empty string, the empty array
 * and an object with no own enumerable keys are falsy; everything else is
 * truthy.
 */
function _pyTruthy(v: unknown): boolean {
  if (v === null || v === undefined) return false;
  if (typeof v === 'boolean') return v;
  // Python treats only zero (0, 0.0, -0.0) as a falsy number;
  // `bool(float('nan'))` is True, so NaN must stay truthy here.
  if (typeof v === 'number') return v !== 0;
  if (typeof v === 'string') return v.length > 0;
  if (Array.isArray(v)) return v.length > 0;
  if (typeof v === 'object') return Object.keys(v as object).length > 0;
  return Boolean(v);
}
|
|
876
|
+
|
|
877
|
+
/**
 * Lenient numeric coercion: unwraps a `PyFloat`, passes numbers through,
 * maps booleans to 1/0, and converts anything else with `Number()`, falling
 * back to 0 when that conversion yields NaN.
 */
function _pyFloat(v: unknown): number {
  if (v instanceof PyFloat) {
    return v.value;
  }
  switch (typeof v) {
    case 'number':
      return v;
    case 'boolean':
      return v ? 1 : 0;
    default: {
      const parsed = Number(v);
      return Number.isNaN(parsed) ? 0 : parsed;
    }
  }
}
|
|
884
|
+
|
|
885
|
+
/**
 * Numeric value of `v` with 0 as the fallback: numbers are returned untouched,
 * `null`/`undefined` become 0, and any other value goes through `Number()`
 * with a NaN result replaced by 0.
 */
function _orZero(v: unknown): number {
  if (typeof v === 'number') {
    return v;
  }
  if (v == null) {
    return 0;
  }
  const coerced = Number(v);
  return Number.isNaN(coerced) ? 0 : coerced;
}
|
|
891
|
+
|
|
892
|
+
/**
 * String form of `v`: `fallback` for `null`/`undefined`, the value itself when
 * it already is a string, `String(v)` for everything else.
 */
function _strOr(v: unknown, fallback: string): string {
  if (v == null) {
    return fallback;
  }
  return typeof v === 'string' ? v : String(v);
}
|
|
897
|
+
|
|
898
|
+
/**
 * Python `str()` look-alike for the values this module prints: a `PyFloat`
 * holding an integer gets a trailing `.0`, `null`/`undefined` render as
 * `None`, booleans as `True`/`False`, and anything else via `String()`.
 */
function _pyStr(v: unknown): string {
  if (v instanceof PyFloat) {
    const num = v.value;
    return Number.isInteger(num) ? `${num}.0` : String(num);
  }
  switch (v) {
    case null:
    case undefined:
      return 'None';
    case true:
      return 'True';
    case false:
      return 'False';
    default:
      return String(v);
  }
}
|
|
907
|
+
|
|
908
|
+
/**
 * Python `round(x)` without `ndigits`: nearest integer, with exact halves
 * going to the even neighbour. Non-finite inputs are returned unchanged.
 */
function _pyRoundNoArg(x: number): number {
  if (!Number.isFinite(x)) {
    return x;
  }
  const lower = Math.floor(x);
  const upper = lower + 1;
  const remainder = x - lower;
  if (remainder !== 0.5) {
    return remainder < 0.5 ? lower : upper;
  }
  // Exact tie: keep whichever neighbour is even.
  return lower % 2 === 0 ? lower : upper;
}
|
|
917
|
+
|
|
918
|
+
/**
 * Python `round(value, ndigits)`: round-half-to-even applied to the decimal
 * expansion of the double (as produced by `toFixed(40)`), not to its shortest
 * repr.
 *
 * Non-finite values and zero are returned unchanged. Values whose magnitude
 * is at least 2**52 are also returned unchanged, because they are already
 * integers.
 *
 * NOTE(review): only `ndigits >= 0` is handled; negative `ndigits` is not
 * supported by the digit slicing below.
 *
 * @param value Number to round.
 * @param ndigits Number of decimals to keep.
 * @returns The rounded value as a double.
 */
function _pyRound(value: number, ndigits: number): number {
  if (!Number.isFinite(value) || value === 0) {
    return value;
  }
  const abs = Math.abs(value);
  // Doubles at or above 2**52 carry no fractional bits, so rounding to a
  // non-negative number of decimals cannot change them. Returning here also
  // keeps such values away from `toFixed`, which switches to exponent
  // notation from 1e21 upwards and would make the BigInt conversion throw.
  if (abs >= 2 ** 52) {
    return value;
  }
  const neg = value < 0;
  const exact = abs.toFixed(40);
  const dot = exact.indexOf('.');
  const intPart = dot === -1 ? exact : exact.slice(0, dot);
  const fracPart = dot === -1 ? '' : exact.slice(dot + 1);
  const keepFrac = fracPart.slice(0, ndigits).padEnd(ndigits, '0');
  const rest = fracPart.slice(ndigits);
  // Work on the value scaled by 10**ndigits as an exact integer.
  const scaledStr = (intPart + keepFrac).replace(/^0+(?=\d)/, '');
  let scaled = BigInt(scaledStr === '' ? '0' : scaledStr);
  if (rest.length > 0) {
    const firstRest = rest.charCodeAt(0) - 48;
    const hasMore = /[1-9]/.test(rest.slice(1));
    if (firstRest > 5 || (firstRest === 5 && hasMore)) {
      scaled += 1n;
    } else if (firstRest === 5 && !hasMore) {
      // Exact tie: round to the even neighbour.
      if (scaled % 2n === 1n) {
        scaled += 1n;
      }
    }
  }
  const factor = 10 ** ndigits;
  const result = Number(scaled) / factor;
  return neg ? -result : result;
}
|
|
948
|
+
|
|
949
|
+
/**
 * Python `format(x, '.Nf')`: fixed-point text with exactly `ndigits`
 * decimals, rounding half-to-even on the decimal expansion of the double.
 *
 * NaN and the infinities render as Python does (`nan`, `inf`, `-inf`). The
 * sign is kept even when the magnitude rounds to zero.
 *
 * @param x Number to format.
 * @param ndigits Number of decimals to emit (0 omits the decimal point).
 * @returns The formatted string.
 */
function _pyFixed(x: number, ndigits: number): string {
  if (Number.isNaN(x)) return 'nan';
  if (!Number.isFinite(x)) return x < 0 ? '-inf' : 'inf';
  const neg = x < 0 || Object.is(x, -0);
  const abs = Math.abs(x);
  // `toFixed` falls back to exponent notation from 1e21 upwards. Doubles that
  // large are integers, so BigInt yields their exact digits instead.
  const exact = abs >= 1e21 ? `${BigInt(abs).toString()}.` : abs.toFixed(40);
  const dot = exact.indexOf('.');
  const intPart = dot === -1 ? exact : exact.slice(0, dot);
  const fracPart = dot === -1 ? '' : exact.slice(dot + 1);
  const kept = (intPart + fracPart.slice(0, ndigits).padEnd(ndigits, '0')).replace(/^0+(?=\d)/, '');
  const rest = fracPart.slice(ndigits);
  // `value` is |x| scaled by 10**ndigits, held as an exact integer.
  let value = BigInt(kept === '' ? '0' : kept);
  if (rest.length > 0) {
    const firstRest = rest.charCodeAt(0) - 48;
    const hasMore = /[1-9]/.test(rest.slice(1));
    if (firstRest > 5 || (firstRest === 5 && hasMore)) {
      value += 1n;
    } else if (firstRest === 5 && !hasMore) {
      // Exact tie: round to the even neighbour.
      if (value % 2n === 1n) {
        value += 1n;
      }
    }
  }
  let intStr = value.toString();
  let result: string;
  if (ndigits === 0) {
    result = intStr;
  } else {
    // Left-pad so there is at least one digit in front of the decimal point.
    if (intStr.length <= ndigits) {
      intStr = '0'.repeat(ndigits - intStr.length + 1) + intStr;
    }
    const whole = intStr.slice(0, intStr.length - ndigits);
    const dec = intStr.slice(intStr.length - ndigits);
    result = `${whole}.${dec}`;
  }
  // Python preserves the sign even when the magnitude rounds to zero
  // (`format(-0.0001, '.3f')` → '-0.000', `format(-0.5, '.0f')` → '-0').
  return neg ? `-${result}` : result;
}
|
|
988
|
+
|
|
989
|
+
/** Python `int(x)` for floats: drop the fractional part, rounding toward zero. */
function _pyIntTrunc(x: number): number {
  return Math.trunc(x);
}
|
|
993
|
+
|
|
994
|
+
/**
 * Python `f"{n:,}"` for integers: inserts a comma before every group of three
 * digits counted from the right, keeping a leading minus sign.
 */
function _pyThousands(n: number): string {
  const digits = String(Math.abs(n));
  const total = digits.length;
  const grouped = Array.from(digits, (ch, idx) => {
    const needsComma = idx > 0 && (total - idx) % 3 === 0;
    return needsComma ? `,${ch}` : ch;
  }).join('');
  return n < 0 ? `-${grouped}` : grouped;
}
|
|
1007
|
+
|
|
1008
|
+
// Run the CLI only when this module is the script node was started with
// (matched either by file URL or by the `_HERE` path).
if (import.meta.url === pathToFileURL(process.argv[1] ?? '').href || process.argv[1] === _HERE) {
  try {
    process.exitCode = main();
  } catch (err) {
    // Anything other than a usage error is a real failure: let it surface.
    if (!(err instanceof ArgExit)) {
      throw err;
    }
    // The usage error was already reported; keep the status it set, else 2.
    process.exitCode = process.exitCode ?? 2;
  }
}
|