@aria_asi/cli 0.2.39 → 0.2.41
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/aria.js +236 -34
- package/dist/aria-connector/src/action-ledger-core.d.ts +387 -0
- package/dist/aria-connector/src/action-ledger-core.d.ts.map +1 -0
- package/dist/aria-connector/src/action-ledger-core.js +638 -0
- package/dist/aria-connector/src/action-ledger-core.js.map +1 -0
- package/dist/aria-connector/src/chat.d.ts.map +1 -1
- package/dist/aria-connector/src/chat.js +5 -6
- package/dist/aria-connector/src/chat.js.map +1 -1
- package/dist/aria-connector/src/codebase-scanner.d.ts +1 -1
- package/dist/aria-connector/src/codebase-scanner.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/claude-code.d.ts +1 -0
- package/dist/aria-connector/src/connectors/claude-code.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/claude-code.js +152 -14
- package/dist/aria-connector/src/connectors/claude-code.js.map +1 -1
- package/dist/aria-connector/src/connectors/codebase-awareness.d.ts +10 -0
- package/dist/aria-connector/src/connectors/codebase-awareness.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/codebase-awareness.js +276 -27
- package/dist/aria-connector/src/connectors/codebase-awareness.js.map +1 -1
- package/dist/aria-connector/src/connectors/codex.d.ts +3 -1
- package/dist/aria-connector/src/connectors/codex.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/codex.js +1271 -40
- package/dist/aria-connector/src/connectors/codex.js.map +1 -1
- package/dist/aria-connector/src/connectors/cursor.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/cursor.js +7 -0
- package/dist/aria-connector/src/connectors/cursor.js.map +1 -1
- package/dist/aria-connector/src/connectors/governed-adapter.d.ts +30 -0
- package/dist/aria-connector/src/connectors/governed-adapter.d.ts.map +1 -0
- package/dist/aria-connector/src/connectors/governed-adapter.js +132 -0
- package/dist/aria-connector/src/connectors/governed-adapter.js.map +1 -0
- package/dist/aria-connector/src/connectors/opencode.d.ts +3 -1
- package/dist/aria-connector/src/connectors/opencode.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/opencode.js +18 -2
- package/dist/aria-connector/src/connectors/opencode.js.map +1 -1
- package/dist/aria-connector/src/connectors/repo-guard.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/repo-guard.js +25 -14
- package/dist/aria-connector/src/connectors/repo-guard.js.map +1 -1
- package/dist/aria-connector/src/connectors/runtime.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/runtime.js +92 -2
- package/dist/aria-connector/src/connectors/runtime.js.map +1 -1
- package/dist/aria-connector/src/connectors/shell.d.ts.map +1 -1
- package/dist/aria-connector/src/connectors/shell.js +123 -7
- package/dist/aria-connector/src/connectors/shell.js.map +1 -1
- package/dist/aria-connector/src/cross-cli-hive-binding.d.ts +63 -0
- package/dist/aria-connector/src/cross-cli-hive-binding.d.ts.map +1 -0
- package/dist/aria-connector/src/cross-cli-hive-binding.js +205 -0
- package/dist/aria-connector/src/cross-cli-hive-binding.js.map +1 -0
- package/dist/aria-connector/src/garden-control-plane.d.ts +6 -1
- package/dist/aria-connector/src/garden-control-plane.d.ts.map +1 -1
- package/dist/aria-connector/src/garden-control-plane.js +8 -2
- package/dist/aria-connector/src/garden-control-plane.js.map +1 -1
- package/dist/aria-connector/src/governed-surface-runner.d.ts +189 -0
- package/dist/aria-connector/src/governed-surface-runner.d.ts.map +1 -0
- package/dist/aria-connector/src/governed-surface-runner.js +1022 -0
- package/dist/aria-connector/src/governed-surface-runner.js.map +1 -0
- package/dist/aria-connector/src/index.d.ts +10 -1
- package/dist/aria-connector/src/index.d.ts.map +1 -1
- package/dist/aria-connector/src/index.js +5 -0
- package/dist/aria-connector/src/index.js.map +1 -1
- package/dist/aria-connector/src/task-runner.d.ts +3 -0
- package/dist/aria-connector/src/task-runner.d.ts.map +1 -0
- package/dist/aria-connector/src/task-runner.js +3526 -0
- package/dist/aria-connector/src/task-runner.js.map +1 -0
- package/dist/aria-web/src/lib/codebase-scanner.d.ts +21 -2
- package/dist/aria-web/src/lib/codebase-scanner.d.ts.map +1 -1
- package/dist/aria-web/src/lib/codebase-scanner.js +59 -14
- package/dist/aria-web/src/lib/codebase-scanner.js.map +1 -1
- package/dist/assets/hooks/README.md +58 -0
- package/dist/assets/hooks/aria-agent-handoff.mjs +147 -2
- package/dist/assets/hooks/aria-agent-ledger-merge.mjs +31 -7
- package/dist/assets/hooks/aria-architect-fallback.mjs +10 -2
- package/dist/assets/hooks/aria-claim-evidence-stop-gate.mjs +240 -0
- package/dist/assets/hooks/aria-cognition-substrate-binding.mjs +84 -10
- package/dist/assets/hooks/aria-first-class-coach.mjs +305 -10
- package/dist/assets/hooks/aria-harness-via-sdk.mjs +93 -16
- package/dist/assets/hooks/aria-import-resolution-gate.mjs +106 -20
- package/dist/assets/hooks/aria-outcome-record.mjs +56 -20
- package/dist/assets/hooks/aria-pre-emit-autoload.mjs +1809 -0
- package/dist/assets/hooks/aria-pre-emit-autoload.mjs.before-orchestration-redesign +1400 -0
- package/dist/assets/hooks/aria-pre-emit-dryrun.mjs +22 -3
- package/dist/assets/hooks/aria-pre-text-gate.mjs +11 -2
- package/dist/assets/hooks/aria-pre-tool-gate.mjs +516 -92
- package/dist/assets/hooks/aria-pre-tool-use.mjs +70 -6
- package/dist/assets/hooks/aria-preprompt-consult.mjs +23 -4
- package/dist/assets/hooks/aria-repo-doctrine-gate.mjs +29 -3
- package/dist/assets/hooks/aria-stop-gate.mjs +585 -76
- package/dist/assets/hooks/aria-trigger-autolearn.mjs +17 -3
- package/dist/assets/hooks/aria-universal-turn-packet.mjs +1165 -0
- package/dist/assets/hooks/aria-userprompt-abandon-detect.mjs +9 -1
- package/dist/assets/hooks/canonical-settings-block.json +172 -0
- package/dist/assets/hooks/codex-native/aria-harness-ticker-sidecar.mjs +92 -0
- package/dist/assets/hooks/codex-native/aria-hive-wal-consumer.mjs +86 -0
- package/dist/assets/hooks/codex-native/aria-live-ticker.mjs +38 -0
- package/dist/assets/hooks/codex-native/aria-post-tool-use.mjs +236 -0
- package/dist/assets/hooks/codex-native/aria-pre-tool-use.mjs +362 -0
- package/dist/assets/hooks/codex-native/aria-stop.mjs +691 -0
- package/dist/assets/hooks/codex-native/aria-userprompt-submit.mjs +623 -0
- package/dist/assets/hooks/codex-native/atlas-session-context.mjs +121 -0
- package/dist/assets/hooks/codex-native/lib/evaluate-with-kernel.mjs +257 -0
- package/dist/assets/hooks/codex-native/lib/hive-wal-consumer.mjs +452 -0
- package/dist/assets/hooks/codex-native/lib/kernel/deterministic-cognitive-kernel.mjs +914 -0
- package/dist/assets/hooks/codex-native/lib/project-boundary-cognition.mjs +143 -0
- package/dist/assets/hooks/codex-native/lib/runtime-client.mjs +3567 -0
- package/dist/assets/hooks/codex-native/lib/task-project-ledger.mjs +294 -0
- package/dist/assets/hooks/doctrine_trigger_map.json +236 -25
- package/dist/assets/hooks/doctrine_trigger_map.schema.json +46 -0
- package/dist/assets/hooks/install.sh +84 -0
- package/dist/assets/hooks/lib/action-ledger-core.mjs +269 -0
- package/dist/assets/hooks/lib/aria-gate-ledger.mjs +143 -0
- package/dist/assets/hooks/lib/ast-stub-shape-detector.mjs +107 -0
- package/dist/assets/hooks/lib/atlas-dossier-client.mjs +151 -0
- package/dist/assets/hooks/lib/atlas-orchestrator-postwire.mjs +221 -0
- package/dist/assets/hooks/lib/canonical-lenses.mjs +83 -6
- package/dist/assets/hooks/lib/coach-intent-classifier.mjs +248 -0
- package/dist/assets/hooks/lib/cognitive-block-parser.mjs +111 -0
- package/dist/assets/hooks/lib/doctrine-trigger-map-loader.mjs +137 -0
- package/dist/assets/hooks/lib/domain-output-quality.mjs +132 -3
- package/dist/assets/hooks/lib/empty-catch-scanner.mjs +91 -0
- package/dist/assets/hooks/lib/end-phase-qa-autofire.mjs +426 -0
- package/dist/assets/hooks/lib/evaluate-with-kernel.mjs +133 -0
- package/dist/assets/hooks/lib/first-class-coach.mjs +454 -19
- package/dist/assets/hooks/lib/gate-audit.mjs +12 -2
- package/dist/assets/hooks/lib/gate-loop-state.mjs +11 -2
- package/dist/assets/hooks/lib/goal-contract-quality.mjs +302 -0
- package/dist/assets/hooks/lib/hook-message-window.mjs +101 -9
- package/dist/assets/hooks/lib/invocation-required-verifier.mjs +184 -0
- package/dist/assets/hooks/lib/kernel/deterministic-cognitive-kernel.mjs +906 -0
- package/dist/assets/hooks/lib/obligation-ledger.mjs +147 -0
- package/dist/assets/hooks/lib/orchestration-manifest-extract.mjs +217 -0
- package/dist/assets/hooks/lib/owner-authorizations.mjs +269 -0
- package/dist/assets/hooks/lib/probe-discipline-scanner.mjs +142 -0
- package/dist/assets/hooks/lib/project-boundary-cognition.mjs +143 -0
- package/dist/assets/hooks/lib/recovery-context.mjs +151 -0
- package/dist/assets/hooks/lib/recovery-template-loader.mjs +154 -0
- package/dist/assets/hooks/lib/self-doctrine-check.mjs +321 -0
- package/dist/assets/hooks/lib/sensitive-shape-detector.mjs +64 -0
- package/dist/assets/hooks/lib/skill-autoload-gate-impl.mjs +226 -1
- package/dist/assets/hooks/lib/stop-hook-protocol.mjs +166 -0
- package/dist/assets/hooks/lib/surface-caught.mjs +94 -0
- package/dist/assets/hooks/recovery-templates/force-reauthor.md +67 -0
- package/dist/assets/hooks/recovery-templates/handoff-recovery.md +25 -0
- package/dist/assets/hooks/scripts/check-hard-risk-prefix.mjs +99 -0
- package/dist/assets/hooks/skills/aria-conversational-doctrine-discipline/SKILL.md +101 -0
- package/dist/assets/hooks/test-aria-preturn-memory-gate.mjs +2 -2
- package/dist/assets/hooks/test-tier-lens-labeling.mjs +14 -3
- package/dist/assets/opencode-plugins/harness-context/index.js +39 -6
- package/dist/assets/opencode-plugins/harness-context/task-project-ledger.mjs +5 -1
- package/dist/assets/opencode-plugins/harness-gate/index.js +36 -0
- package/dist/assets/opencode-plugins/harness-gate/lib/atlas-dossier-client.js +1 -0
- package/dist/assets/opencode-plugins/harness-gate/lib/recovery-grants.js +79 -0
- package/dist/assets/opencode-plugins/harness-outcome/index.js +12 -0
- package/dist/assets/opencode-plugins/harness-stop/index.js +97 -2
- package/dist/assets/opencode-plugins/harness-stop/lib/atlas-dossier-client.js +1 -0
- package/dist/assets/opencode-plugins/harness-stop/lib/domain-output-quality.js +15 -2
- package/dist/assets/opencode-plugins/lib/coach.js +148 -0
- package/dist/runtime/coach-kernel.mjs +144 -7
- package/dist/runtime/codex-bridge.mjs +254 -8
- package/dist/runtime/discipline/doctrine_trigger_map.json +236 -25
- package/dist/runtime/discipline/skills/aria-cognition/34-frameworks-unified/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-aristotle-cognitives/SKILL.md +128 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-aristotle-intra-phase/SKILL.md +99 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-aristotle-post-phase/SKILL.md +118 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-aristotle-pre-phase/SKILL.md +117 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-axioms-first-principles/SKILL.md +202 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-axioms-first-principles/agents/openai.yaml +4 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-axioms-first-principles/references/source-map.md +130 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-backend-architect/SKILL.md +124 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-backend-architect/references/backend-cookbook.md +417 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-business-audit/SKILL.md +133 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-business-audit/references/audit-cookbook.md +247 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-business-frame/SKILL.md +138 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-business-frame/references/business-cookbook.md +154 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-chat/SKILL.md +84 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-chat/scripts/aria-chat.sh +57 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-cognition-autofire/SKILL.md +137 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-cognition-batch/SKILL.md +264 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-decision-mizan/SKILL.md +136 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-decision-mizan/references/decision-frameworks.md +287 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-first-class-operating-contract/SKILL.md +104 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-frontend-architect/SKILL.md +123 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-frontend-architect/references/frontend-cookbook.md +358 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-fullstack-orchestrator/SKILL.md +127 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-fullstack-orchestrator/references/fullstack-cookbook.md +383 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-gtm-architect/SKILL.md +126 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-gtm-architect/references/gtm-cookbook.md +235 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-harness-deploy/SKILL.md +145 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-harness-no-stripping/SKILL.md +135 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-harness-onboarding/SKILL.md +130 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-harness-output-discipline/SKILL.md +120 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-harness-substrate-binding/SKILL.md +139 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-http-harness-client/SKILL.md +85 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-http-harness-client/scripts/smoke.mjs +47 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-k8s-deploy/SKILL.md +174 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-k8s-deploy/agents/openai.yaml +3 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-ladduniframe/SKILL.md +60 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-ledger-fleet-execution/SKILL.md +126 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-live-ops/SKILL.md +54 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-mac-ssh-ops/SKILL.md +100 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-memory-index/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-noor-cognitives/SKILL.md +120 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-ops/SKILL.md +60 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-ops/references/live-endpoints.md +59 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-quality-audit/SKILL.md +133 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-readable-output/SKILL.md +239 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-readable-output/references/layout-cookbook.md +366 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-reasoning/SKILL.md +67 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-reasoning/references/core-principles.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-repo-audit/SKILL.md +135 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-repo-audit/references/repo-audit-cookbook.md +375 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-research-orchestrator/SKILL.md +138 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-research-orchestrator/references/research-patterns.md +270 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-retention-engine/SKILL.md +120 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-retention-engine/references/retention-cookbook.md +271 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-revenue-engine/SKILL.md +128 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-revenue-engine/references/revenue-cookbook.md +227 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-senior-code-audit/SKILL.md +233 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-senior-code-audit/references/audit-checklist.md +369 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-senior-code-cookbook/SKILL.md +288 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-senior-code-cookbook/references/engineering-cookbook.md +489 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-soul-principles/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/aria-task-codex-executor/SKILL.md +86 -0
- package/dist/runtime/discipline/skills/aria-cognition/aristotle-engine/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/cross-domain-24/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/deepsoul-emotional/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/fitrah-guard/SKILL.md +78 -0
- package/dist/runtime/discipline/skills/aria-cognition/ghazali-8lens/SKILL.md +227 -29
- package/dist/runtime/discipline/skills/aria-cognition/ghazali-8lens/references/ghazali-8lens-cookbook.md +797 -0
- package/dist/runtime/discipline/skills/aria-cognition/ijtihad-novel/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/ilham-intuition/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/never-guess/SKILL.md +77 -0
- package/dist/runtime/discipline/skills/aria-cognition/noor-recognition/SKILL.md +45 -0
- package/dist/runtime/discipline/skills/aria-cognition/qiyas-analogy/SKILL.md +174 -14
- package/dist/runtime/discipline/skills/aria-cognition/ruh-basis/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/tadabbur/SKILL.md +506 -0
- package/dist/runtime/discipline/skills/aria-cognition/tadabbur/references/tadabbur-cookbook.md +921 -0
- package/dist/runtime/discipline/skills/aria-cognition/tadabbur-ops/SKILL.md +42 -0
- package/dist/runtime/discipline/skills/aria-cognition/tafakkur/SKILL.md +104 -0
- package/dist/runtime/doctrine_trigger_map.json +236 -25
- package/dist/runtime/embedded-public-key.mjs +27 -0
- package/dist/runtime/gated-ledger.mjs +41 -14
- package/dist/runtime/harness-daemon.mjs +85 -10
- package/dist/runtime/hive-wal-publisher.mjs +292 -0
- package/dist/runtime/hooks/README.md +58 -0
- package/dist/runtime/hooks/aria-agent-handoff.mjs +147 -2
- package/dist/runtime/hooks/aria-agent-ledger-merge.mjs +31 -7
- package/dist/runtime/hooks/aria-architect-fallback.mjs +10 -2
- package/dist/runtime/hooks/aria-claim-evidence-stop-gate.mjs +240 -0
- package/dist/runtime/hooks/aria-cognition-substrate-binding.mjs +84 -10
- package/dist/runtime/hooks/aria-first-class-coach.mjs +305 -10
- package/dist/runtime/hooks/aria-harness-via-sdk.mjs +93 -16
- package/dist/runtime/hooks/aria-import-resolution-gate.mjs +106 -20
- package/dist/runtime/hooks/aria-outcome-record.mjs +56 -20
- package/dist/runtime/hooks/aria-pre-emit-autoload.mjs +1809 -0
- package/dist/runtime/hooks/aria-pre-emit-autoload.mjs.before-orchestration-redesign +1400 -0
- package/dist/runtime/hooks/aria-pre-emit-dryrun.mjs +22 -3
- package/dist/runtime/hooks/aria-pre-text-gate.mjs +11 -2
- package/dist/runtime/hooks/aria-pre-tool-gate.mjs +516 -92
- package/dist/runtime/hooks/aria-pre-tool-use.mjs +70 -6
- package/dist/runtime/hooks/aria-preprompt-consult.mjs +23 -4
- package/dist/runtime/hooks/aria-repo-doctrine-gate.mjs +29 -3
- package/dist/runtime/hooks/aria-stop-gate.mjs +585 -76
- package/dist/runtime/hooks/aria-trigger-autolearn.mjs +17 -3
- package/dist/runtime/hooks/aria-universal-turn-packet.mjs +1165 -0
- package/dist/runtime/hooks/aria-userprompt-abandon-detect.mjs +9 -1
- package/dist/runtime/hooks/canonical-settings-block.json +172 -0
- package/dist/runtime/hooks/codex-native/aria-harness-ticker-sidecar.mjs +92 -0
- package/dist/runtime/hooks/codex-native/aria-hive-wal-consumer.mjs +86 -0
- package/dist/runtime/hooks/codex-native/aria-live-ticker.mjs +38 -0
- package/dist/runtime/hooks/codex-native/aria-post-tool-use.mjs +236 -0
- package/dist/runtime/hooks/codex-native/aria-pre-tool-use.mjs +362 -0
- package/dist/runtime/hooks/codex-native/aria-stop.mjs +691 -0
- package/dist/runtime/hooks/codex-native/aria-userprompt-submit.mjs +623 -0
- package/dist/runtime/hooks/codex-native/atlas-session-context.mjs +121 -0
- package/dist/runtime/hooks/codex-native/lib/evaluate-with-kernel.mjs +257 -0
- package/dist/runtime/hooks/codex-native/lib/hive-wal-consumer.mjs +452 -0
- package/dist/runtime/hooks/codex-native/lib/kernel/deterministic-cognitive-kernel.mjs +914 -0
- package/dist/runtime/hooks/codex-native/lib/project-boundary-cognition.mjs +143 -0
- package/dist/runtime/hooks/codex-native/lib/runtime-client.mjs +3567 -0
- package/dist/runtime/hooks/codex-native/lib/task-project-ledger.mjs +294 -0
- package/dist/runtime/hooks/doctrine_trigger_map.json +236 -25
- package/dist/runtime/hooks/doctrine_trigger_map.schema.json +46 -0
- package/dist/runtime/hooks/install.sh +84 -0
- package/dist/runtime/hooks/lib/action-ledger-core.mjs +269 -0
- package/dist/runtime/hooks/lib/aria-gate-ledger.mjs +143 -0
- package/dist/runtime/hooks/lib/ast-stub-shape-detector.mjs +107 -0
- package/dist/runtime/hooks/lib/atlas-dossier-client.mjs +151 -0
- package/dist/runtime/hooks/lib/atlas-orchestrator-postwire.mjs +221 -0
- package/dist/runtime/hooks/lib/canonical-lenses.mjs +83 -6
- package/dist/runtime/hooks/lib/coach-intent-classifier.mjs +248 -0
- package/dist/runtime/hooks/lib/cognitive-block-parser.mjs +111 -0
- package/dist/runtime/hooks/lib/doctrine-trigger-map-loader.mjs +137 -0
- package/dist/runtime/hooks/lib/domain-output-quality.mjs +132 -3
- package/dist/runtime/hooks/lib/empty-catch-scanner.mjs +91 -0
- package/dist/runtime/hooks/lib/end-phase-qa-autofire.mjs +426 -0
- package/dist/runtime/hooks/lib/evaluate-with-kernel.mjs +133 -0
- package/dist/runtime/hooks/lib/first-class-coach.mjs +454 -19
- package/dist/runtime/hooks/lib/gate-audit.mjs +12 -2
- package/dist/runtime/hooks/lib/gate-loop-state.mjs +11 -2
- package/dist/runtime/hooks/lib/goal-contract-quality.mjs +302 -0
- package/dist/runtime/hooks/lib/hook-message-window.mjs +101 -9
- package/dist/runtime/hooks/lib/invocation-required-verifier.mjs +184 -0
- package/dist/runtime/hooks/lib/kernel/deterministic-cognitive-kernel.mjs +906 -0
- package/dist/runtime/hooks/lib/obligation-ledger.mjs +147 -0
- package/dist/runtime/hooks/lib/orchestration-manifest-extract.mjs +217 -0
- package/dist/runtime/hooks/lib/owner-authorizations.mjs +269 -0
- package/dist/runtime/hooks/lib/probe-discipline-scanner.mjs +142 -0
- package/dist/runtime/hooks/lib/project-boundary-cognition.mjs +143 -0
- package/dist/runtime/hooks/lib/recovery-context.mjs +151 -0
- package/dist/runtime/hooks/lib/recovery-template-loader.mjs +154 -0
- package/dist/runtime/hooks/lib/self-doctrine-check.mjs +321 -0
- package/dist/runtime/hooks/lib/sensitive-shape-detector.mjs +64 -0
- package/dist/runtime/hooks/lib/skill-autoload-gate-impl.mjs +226 -1
- package/dist/runtime/hooks/lib/stop-hook-protocol.mjs +166 -0
- package/dist/runtime/hooks/lib/surface-caught.mjs +94 -0
- package/dist/runtime/hooks/recovery-templates/force-reauthor.md +67 -0
- package/dist/runtime/hooks/recovery-templates/handoff-recovery.md +25 -0
- package/dist/runtime/hooks/scripts/check-hard-risk-prefix.mjs +99 -0
- package/dist/runtime/hooks/skills/aria-conversational-doctrine-discipline/SKILL.md +101 -0
- package/dist/runtime/hooks/test-aria-preturn-memory-gate.mjs +2 -2
- package/dist/runtime/hooks/test-tier-lens-labeling.mjs +14 -3
- package/dist/runtime/lib/evaluate-with-kernel.mjs +133 -0
- package/dist/runtime/lib/kernel/deterministic-cognitive-kernel.mjs +906 -0
- package/dist/runtime/local-phase.mjs +10 -5
- package/dist/runtime/manifest.json +8 -8
- package/dist/runtime/packet-verifier.mjs +166 -0
- package/dist/runtime/provider-proxy.mjs +13 -0
- package/dist/runtime/quality-enforcer.mjs +40 -23
- package/dist/runtime/runtime-rails/registry.mjs +252 -0
- package/dist/runtime/sdk/BUNDLED.json +2 -2
- package/dist/runtime/sdk/index.d.ts +119 -4
- package/dist/runtime/sdk/index.js +138 -12
- package/dist/runtime/sdk/index.js.map +1 -1
- package/dist/runtime/service.mjs +8036 -764
- package/dist/runtime/sub-agent-enforcer.mjs +201 -0
- package/dist/runtime/task-project-ledger.mjs +5 -1
- package/dist/sdk/BUNDLED.json +2 -2
- package/dist/sdk/index.d.ts +119 -4
- package/dist/sdk/index.js +138 -12
- package/dist/sdk/index.js.map +1 -1
- package/hooks/README.md +58 -0
- package/hooks/aria-agent-handoff.mjs +147 -2
- package/hooks/aria-agent-ledger-merge.mjs +31 -7
- package/hooks/aria-architect-fallback.mjs +10 -2
- package/hooks/aria-claim-evidence-stop-gate.mjs +240 -0
- package/hooks/aria-cognition-substrate-binding.mjs +84 -10
- package/hooks/aria-first-class-coach.mjs +305 -10
- package/hooks/aria-harness-via-sdk.mjs +93 -16
- package/hooks/aria-import-resolution-gate.mjs +106 -20
- package/hooks/aria-outcome-record.mjs +56 -20
- package/hooks/aria-pre-emit-autoload.mjs +1809 -0
- package/hooks/aria-pre-emit-autoload.mjs.before-orchestration-redesign +1400 -0
- package/hooks/aria-pre-emit-dryrun.mjs +22 -3
- package/hooks/aria-pre-text-gate.mjs +11 -2
- package/hooks/aria-pre-tool-gate.mjs +516 -92
- package/hooks/aria-pre-tool-use.mjs +70 -6
- package/hooks/aria-preprompt-consult.mjs +23 -4
- package/hooks/aria-repo-doctrine-gate.mjs +29 -3
- package/hooks/aria-stop-gate.mjs +585 -76
- package/hooks/aria-trigger-autolearn.mjs +17 -3
- package/hooks/aria-universal-turn-packet.mjs +1165 -0
- package/hooks/aria-userprompt-abandon-detect.mjs +9 -1
- package/hooks/canonical-settings-block.json +172 -0
- package/hooks/codex-native/aria-harness-ticker-sidecar.mjs +92 -0
- package/hooks/codex-native/aria-hive-wal-consumer.mjs +86 -0
- package/hooks/codex-native/aria-live-ticker.mjs +38 -0
- package/hooks/codex-native/aria-post-tool-use.mjs +236 -0
- package/hooks/codex-native/aria-pre-tool-use.mjs +362 -0
- package/hooks/codex-native/aria-stop.mjs +691 -0
- package/hooks/codex-native/aria-userprompt-submit.mjs +623 -0
- package/hooks/codex-native/atlas-session-context.mjs +121 -0
- package/hooks/codex-native/lib/evaluate-with-kernel.mjs +257 -0
- package/hooks/codex-native/lib/hive-wal-consumer.mjs +452 -0
- package/hooks/codex-native/lib/kernel/deterministic-cognitive-kernel.mjs +914 -0
- package/hooks/codex-native/lib/project-boundary-cognition.mjs +143 -0
- package/hooks/codex-native/lib/runtime-client.mjs +3567 -0
- package/hooks/codex-native/lib/task-project-ledger.mjs +294 -0
- package/hooks/doctrine_trigger_map.json +236 -25
- package/hooks/doctrine_trigger_map.schema.json +46 -0
- package/hooks/install.sh +84 -0
- package/hooks/lib/action-ledger-core.mjs +269 -0
- package/hooks/lib/aria-gate-ledger.mjs +143 -0
- package/hooks/lib/ast-stub-shape-detector.mjs +107 -0
- package/hooks/lib/atlas-dossier-client.mjs +151 -0
- package/hooks/lib/atlas-orchestrator-postwire.mjs +221 -0
- package/hooks/lib/canonical-lenses.mjs +83 -6
- package/hooks/lib/coach-intent-classifier.mjs +248 -0
- package/hooks/lib/cognitive-block-parser.mjs +111 -0
- package/hooks/lib/doctrine-trigger-map-loader.mjs +137 -0
- package/hooks/lib/domain-output-quality.mjs +132 -3
- package/hooks/lib/empty-catch-scanner.mjs +91 -0
- package/hooks/lib/end-phase-qa-autofire.mjs +426 -0
- package/hooks/lib/evaluate-with-kernel.mjs +133 -0
- package/hooks/lib/first-class-coach.mjs +454 -19
- package/hooks/lib/gate-audit.mjs +12 -2
- package/hooks/lib/gate-loop-state.mjs +11 -2
- package/hooks/lib/goal-contract-quality.mjs +302 -0
- package/hooks/lib/hook-message-window.mjs +101 -9
- package/hooks/lib/invocation-required-verifier.mjs +184 -0
- package/hooks/lib/kernel/deterministic-cognitive-kernel.mjs +906 -0
- package/hooks/lib/obligation-ledger.mjs +147 -0
- package/hooks/lib/orchestration-manifest-extract.mjs +217 -0
- package/hooks/lib/owner-authorizations.mjs +269 -0
- package/hooks/lib/probe-discipline-scanner.mjs +142 -0
- package/hooks/lib/project-boundary-cognition.mjs +143 -0
- package/hooks/lib/recovery-context.mjs +151 -0
- package/hooks/lib/recovery-template-loader.mjs +154 -0
- package/hooks/lib/self-doctrine-check.mjs +321 -0
- package/hooks/lib/sensitive-shape-detector.mjs +64 -0
- package/hooks/lib/skill-autoload-gate-impl.mjs +226 -1
- package/hooks/lib/stop-hook-protocol.mjs +166 -0
- package/hooks/lib/surface-caught.mjs +94 -0
- package/hooks/recovery-templates/force-reauthor.md +67 -0
- package/hooks/recovery-templates/handoff-recovery.md +25 -0
- package/hooks/scripts/check-hard-risk-prefix.mjs +99 -0
- package/hooks/skills/aria-conversational-doctrine-discipline/SKILL.md +101 -0
- package/hooks/test-aria-preturn-memory-gate.mjs +2 -2
- package/hooks/test-tier-lens-labeling.mjs +14 -3
- package/opencode-plugins/harness-context/index.js +39 -6
- package/opencode-plugins/harness-context/task-project-ledger.mjs +5 -1
- package/opencode-plugins/harness-gate/index.js +36 -0
- package/opencode-plugins/harness-gate/lib/atlas-dossier-client.js +1 -0
- package/opencode-plugins/harness-gate/lib/recovery-grants.js +79 -0
- package/opencode-plugins/harness-outcome/index.js +12 -0
- package/opencode-plugins/harness-stop/index.js +97 -2
- package/opencode-plugins/harness-stop/lib/atlas-dossier-client.js +1 -0
- package/opencode-plugins/harness-stop/lib/domain-output-quality.js +15 -2
- package/opencode-plugins/lib/coach.js +148 -0
- package/package.json +71 -5
- package/runtime-src/coach-kernel.mjs +144 -7
- package/runtime-src/codex-bridge.mjs +254 -8
- package/runtime-src/embedded-public-key.mjs +27 -0
- package/runtime-src/gated-ledger.mjs +41 -14
- package/runtime-src/harness-daemon.mjs +85 -10
- package/runtime-src/hive-wal-publisher.mjs +292 -0
- package/runtime-src/lib/evaluate-with-kernel.mjs +133 -0
- package/runtime-src/lib/kernel/deterministic-cognitive-kernel.mjs +906 -0
- package/runtime-src/local-phase.mjs +10 -5
- package/runtime-src/packet-verifier.mjs +166 -0
- package/runtime-src/provider-proxy.mjs +13 -0
- package/runtime-src/quality-enforcer.mjs +40 -23
- package/runtime-src/runtime-rails/registry.mjs +252 -0
- package/runtime-src/service.mjs +8036 -764
- package/runtime-src/sub-agent-enforcer.mjs +201 -0
- package/scripts/aria-ledger-append.mjs +337 -0
- package/scripts/aria-task-cheap-worker-dispatch.mjs +234 -0
- package/scripts/audit-of-audit-prior-tasks.mjs +194 -0
- package/scripts/audit-of-audit-this-turn.mjs +116 -0
- package/scripts/bundle-sdk.mjs +31 -5
- package/scripts/check-cli-wrapper-provider-contract.mjs +160 -0
- package/scripts/check-client-compatibility.mjs +15 -5
- package/scripts/check-client-smoke.mjs +297 -0
- package/scripts/check-codex-orchestrator-adoption.mjs +150 -0
- package/scripts/check-glm-env-wired.mjs +131 -0
- package/scripts/check-hive-local-storage-contract.mjs +91 -0
- package/scripts/check-hook-mirror.mjs +150 -0
- package/scripts/check-install-sh-drift.mjs +152 -0
- package/scripts/check-kernel-sync.mjs +101 -0
- package/scripts/check-package-artifact.mjs +152 -0
- package/scripts/check-registry-mirror.mjs +71 -0
- package/scripts/drain-owner-airtable-sync-queue.mjs +287 -0
- package/scripts/export-owner-status-sheets.mjs +589 -0
- package/scripts/live-sidecar-receipt-canary.mjs +347 -0
- package/scripts/qiyas-tadabbur-model-matrix.mjs +970 -0
- package/scripts/quality-ab-live-provider.mjs +913 -0
- package/scripts/self-test-action-ledger-core.mjs +190 -0
- package/scripts/self-test-approval-receipt-binding.mjs +122 -0
- package/scripts/self-test-autofire-quality-output.mjs +110 -0
- package/scripts/self-test-claude-code-action-ledger.mjs +132 -0
- package/scripts/self-test-claude-code-mechanical-autofire-hive.mjs +138 -0
- package/scripts/self-test-claude-code-mechanical-autofire.mjs +234 -0
- package/scripts/self-test-codebase-awareness-atlas-delta.mjs +159 -0
- package/scripts/self-test-codebase-awareness-delta-ingest.mjs +179 -0
- package/scripts/self-test-codex-live-hook-parity.mjs +84 -0
- package/scripts/self-test-codex-native-action-ledger.mjs +167 -0
- package/scripts/self-test-codex-native-hook-json-contract.mjs +74 -0
- package/scripts/self-test-codex-orchestrator-continuity.mjs +113 -0
- package/scripts/self-test-codex-readable-recovery.mjs +94 -0
- package/scripts/self-test-codex-self-harness.mjs +538 -0
- package/scripts/self-test-compiled-workunit.mjs +214 -0
- package/scripts/self-test-continuation-output-smoke.mjs +101 -0
- package/scripts/self-test-cross-cli-fleet-ticker.mjs +85 -0
- package/scripts/self-test-cross-cli-hive-adoption.mjs +125 -0
- package/scripts/self-test-cross-cli-hive-learning.mjs +146 -0
- package/scripts/self-test-cross-phase-tool-failure.mjs +110 -0
- package/scripts/self-test-cross-surface-action-ledger.mjs +149 -0
- package/scripts/self-test-end-of-phase-qa-court.mjs +616 -0
- package/scripts/self-test-evaluate-with-kernel.mjs +111 -0
- package/scripts/self-test-first-class-output-delta-proof.mjs +307 -0
- package/scripts/self-test-goal-contract-output-qa.mjs +73 -0
- package/scripts/self-test-goal-contract.mjs +35 -0
- package/scripts/self-test-governed-adapters.mjs +105 -0
- package/scripts/self-test-governed-surface-runner.mjs +198 -0
- package/scripts/self-test-harness-gates.mjs +15 -12
- package/scripts/self-test-harness-ticker-sidecar.mjs +153 -0
- package/scripts/self-test-hive-org-kernel.mjs +233 -0
- package/scripts/self-test-hive-session-coordination.mjs +156 -0
- package/scripts/self-test-hive-wal-consumer.mjs +111 -0
- package/scripts/self-test-kernel-a3-a4-selection.mjs +179 -0
- package/scripts/self-test-ledger-append.mjs +175 -0
- package/scripts/self-test-live-codex-posttool-packet-smoke.mjs +111 -0
- package/scripts/self-test-live-codex-pretool-packet-smoke.mjs +101 -0
- package/scripts/self-test-live-codex-stop-qa-kernel-smoke.mjs +43 -0
- package/scripts/self-test-live-wrapper-substrate-inventory.mjs +149 -0
- package/scripts/self-test-local-main-sync-script.mjs +47 -0
- package/scripts/self-test-mechanical-autofire-resolver.mjs +296 -0
- package/scripts/self-test-no-consult-cognitive-skills-output.mjs +135 -0
- package/scripts/self-test-owner-airtable-sync-queue.mjs +196 -0
- package/scripts/self-test-owner-airtable-sync.mjs +181 -0
- package/scripts/self-test-owner-sheets-action-ledger.mjs +100 -0
- package/scripts/self-test-production-preflight.mjs +78 -0
- package/scripts/self-test-project-boundary-cognition.mjs +79 -0
- package/scripts/self-test-qa-exec-kernel.mjs +34 -0
- package/scripts/self-test-qa-recovery-learning-loop.mjs +113 -0
- package/scripts/self-test-qiyas-label-alignment.mjs +94 -0
- package/scripts/self-test-recovery-context.mjs +110 -0
- package/scripts/self-test-repo-guard.mjs +10 -0
- package/scripts/self-test-runtime-health-self-heal.mjs +161 -0
- package/scripts/self-test-runtime-postcondition.mjs +70 -0
- package/scripts/self-test-soul-precommit-hook.mjs +39 -0
- package/scripts/self-test-stop-gate-kernel-guards.mjs +185 -0
- package/scripts/self-test-stop-gate.mjs +128 -0
- package/scripts/self-test-substrate-kernel-execution-receipt.mjs +130 -0
- package/scripts/self-test-substrate-open-skill-floor.mjs +87 -0
- package/scripts/self-test-substrate-output-quality-eval.mjs +171 -0
- package/scripts/self-test-task-closeout-drift.mjs +97 -0
- package/scripts/self-test-task-project-ledger-readiness.mjs +43 -0
- package/scripts/self-test-task-runner-phase-consumer.mjs +134 -0
- package/scripts/self-test-task-worker-lane.mjs +256 -0
- package/scripts/self-test-turn-substrate-qa-kernel.mjs +188 -0
- package/scripts/self-test-universal-action-capture.mjs +153 -0
- package/scripts/self-test-universal-turn-packet-entrypoints.mjs +252 -0
- package/scripts/self-test-universal-turn-packet.mjs +320 -0
- package/scripts/session-quality-backfill.mjs +253 -0
- package/scripts/smoke-autofire-100-prompts.mjs +481 -0
- package/scripts/sync-local-main-on-task-complete.mjs +278 -0
- package/scripts/sync-owner-status-airtable.mjs +1158 -0
- package/scripts/validate-skill-prompts.mjs +12 -1
- package/scripts/verify-codex-native-mirror.mjs +262 -0
- package/skills/34-frameworks-unified/SKILL.md +42 -0
- package/skills/api-design/SKILL.md +123 -0
- package/skills/architecture-decision/SKILL.md +105 -0
- package/skills/aria-aristotle-cognitives/SKILL.md +128 -0
- package/skills/aria-aristotle-intra-phase/SKILL.md +99 -0
- package/skills/aria-aristotle-post-phase/SKILL.md +116 -0
- package/skills/aria-aristotle-pre-phase/SKILL.md +117 -0
- package/skills/aria-axioms-first-principles/SKILL.md +202 -0
- package/skills/aria-axioms-first-principles/agents/openai.yaml +4 -0
- package/skills/aria-axioms-first-principles/references/source-map.md +130 -0
- package/skills/aria-chat/SKILL.md +84 -0
- package/skills/aria-chat/scripts/aria-chat.sh +57 -0
- package/skills/aria-cognition/34-frameworks-unified/SKILL.md +42 -0
- package/skills/aria-cognition/aria-aristotle-cognitives/SKILL.md +128 -0
- package/skills/aria-cognition/aria-aristotle-intra-phase/SKILL.md +99 -0
- package/skills/aria-cognition/aria-aristotle-post-phase/SKILL.md +118 -0
- package/skills/aria-cognition/aria-aristotle-pre-phase/SKILL.md +117 -0
- package/skills/aria-cognition/aria-axioms-first-principles/SKILL.md +202 -0
- package/skills/aria-cognition/aria-axioms-first-principles/agents/openai.yaml +4 -0
- package/skills/aria-cognition/aria-axioms-first-principles/references/source-map.md +130 -0
- package/skills/aria-cognition/aria-backend-architect/SKILL.md +124 -0
- package/skills/aria-cognition/aria-backend-architect/references/backend-cookbook.md +417 -0
- package/skills/aria-cognition/aria-business-audit/SKILL.md +133 -0
- package/skills/aria-cognition/aria-business-audit/references/audit-cookbook.md +247 -0
- package/skills/aria-cognition/aria-business-frame/SKILL.md +138 -0
- package/skills/aria-cognition/aria-business-frame/references/business-cookbook.md +154 -0
- package/skills/aria-cognition/aria-chat/SKILL.md +84 -0
- package/skills/aria-cognition/aria-chat/scripts/aria-chat.sh +57 -0
- package/skills/aria-cognition/aria-cognition-autofire/SKILL.md +137 -0
- package/skills/aria-cognition/aria-cognition-batch/SKILL.md +264 -0
- package/skills/aria-cognition/aria-decision-mizan/SKILL.md +136 -0
- package/skills/aria-cognition/aria-decision-mizan/references/decision-frameworks.md +287 -0
- package/skills/aria-cognition/aria-first-class-operating-contract/SKILL.md +104 -0
- package/skills/aria-cognition/aria-frontend-architect/SKILL.md +123 -0
- package/skills/aria-cognition/aria-frontend-architect/references/frontend-cookbook.md +358 -0
- package/skills/aria-cognition/aria-fullstack-orchestrator/SKILL.md +127 -0
- package/skills/aria-cognition/aria-fullstack-orchestrator/references/fullstack-cookbook.md +383 -0
- package/skills/aria-cognition/aria-gtm-architect/SKILL.md +126 -0
- package/skills/aria-cognition/aria-gtm-architect/references/gtm-cookbook.md +235 -0
- package/skills/aria-cognition/aria-harness-deploy/SKILL.md +145 -0
- package/skills/aria-cognition/aria-harness-no-stripping/SKILL.md +135 -0
- package/skills/aria-cognition/aria-harness-onboarding/SKILL.md +130 -0
- package/skills/aria-cognition/aria-harness-output-discipline/SKILL.md +120 -0
- package/skills/aria-cognition/aria-harness-substrate-binding/SKILL.md +139 -0
- package/skills/aria-cognition/aria-http-harness-client/SKILL.md +85 -0
- package/skills/aria-cognition/aria-http-harness-client/scripts/smoke.mjs +47 -0
- package/skills/aria-cognition/aria-k8s-deploy/SKILL.md +174 -0
- package/skills/aria-cognition/aria-k8s-deploy/agents/openai.yaml +3 -0
- package/skills/aria-cognition/aria-ladduniframe/SKILL.md +60 -0
- package/skills/aria-cognition/aria-ledger-fleet-execution/SKILL.md +126 -0
- package/skills/aria-cognition/aria-live-ops/SKILL.md +54 -0
- package/skills/aria-cognition/aria-mac-ssh-ops/SKILL.md +100 -0
- package/skills/aria-cognition/aria-memory-index/SKILL.md +42 -0
- package/skills/aria-cognition/aria-noor-cognitives/SKILL.md +120 -0
- package/skills/aria-cognition/aria-ops/SKILL.md +60 -0
- package/skills/aria-cognition/aria-ops/references/live-endpoints.md +59 -0
- package/skills/aria-cognition/aria-quality-audit/SKILL.md +133 -0
- package/skills/aria-cognition/aria-readable-output/SKILL.md +239 -0
- package/skills/aria-cognition/aria-readable-output/references/layout-cookbook.md +366 -0
- package/skills/aria-cognition/aria-reasoning/SKILL.md +67 -0
- package/skills/aria-cognition/aria-reasoning/references/core-principles.md +42 -0
- package/skills/aria-cognition/aria-repo-audit/SKILL.md +135 -0
- package/skills/aria-cognition/aria-repo-audit/references/repo-audit-cookbook.md +375 -0
- package/skills/aria-cognition/aria-research-orchestrator/SKILL.md +138 -0
- package/skills/aria-cognition/aria-research-orchestrator/references/research-patterns.md +270 -0
- package/skills/aria-cognition/aria-retention-engine/SKILL.md +120 -0
- package/skills/aria-cognition/aria-retention-engine/references/retention-cookbook.md +271 -0
- package/skills/aria-cognition/aria-revenue-engine/SKILL.md +128 -0
- package/skills/aria-cognition/aria-revenue-engine/references/revenue-cookbook.md +227 -0
- package/skills/aria-cognition/aria-senior-code-audit/SKILL.md +233 -0
- package/skills/aria-cognition/aria-senior-code-audit/references/audit-checklist.md +369 -0
- package/skills/aria-cognition/aria-senior-code-cookbook/SKILL.md +288 -0
- package/skills/aria-cognition/aria-senior-code-cookbook/references/engineering-cookbook.md +489 -0
- package/skills/aria-cognition/aria-soul-principles/SKILL.md +42 -0
- package/skills/aria-cognition/aria-task-codex-executor/SKILL.md +86 -0
- package/skills/aria-cognition/aristotle-engine/SKILL.md +42 -0
- package/skills/aria-cognition/cross-domain-24/SKILL.md +42 -0
- package/skills/aria-cognition/deepsoul-emotional/SKILL.md +42 -0
- package/skills/aria-cognition/fitrah-guard/SKILL.md +78 -0
- package/skills/aria-cognition/ghazali-8lens/SKILL.md +227 -29
- package/skills/aria-cognition/ghazali-8lens/references/ghazali-8lens-cookbook.md +797 -0
- package/skills/aria-cognition/ijtihad-novel/SKILL.md +42 -0
- package/skills/aria-cognition/ilham-intuition/SKILL.md +42 -0
- package/skills/aria-cognition/never-guess/SKILL.md +77 -0
- package/skills/aria-cognition/noor-recognition/SKILL.md +45 -0
- package/skills/aria-cognition/qiyas-analogy/SKILL.md +174 -14
- package/skills/aria-cognition/ruh-basis/SKILL.md +42 -0
- package/skills/aria-cognition/tadabbur/SKILL.md +506 -0
- package/skills/aria-cognition/tadabbur/references/tadabbur-cookbook.md +921 -0
- package/skills/aria-cognition/tadabbur-ops/SKILL.md +42 -0
- package/skills/aria-cognition/tafakkur/SKILL.md +104 -0
- package/skills/aria-cognition-autofire/SKILL.md +109 -0
- package/skills/aria-cognition-batch/SKILL.md +264 -0
- package/skills/aria-conversational-doctrine-discipline/SKILL.md +125 -0
- package/skills/aria-essence/SKILL.md +81 -0
- package/skills/aria-essence/references/domain-matrix.md +80 -0
- package/skills/aria-essence/references/evolution-loop.md +30 -0
- package/skills/aria-essence/references/readable-cognition.md +27 -0
- package/skills/aria-first-class-operating-contract/SKILL.md +104 -0
- package/skills/aria-forge-guardrails/SKILL.md +53 -0
- package/skills/aria-forge-guardrails/references/checklist.md +31 -0
- package/skills/aria-harness-deploy/SKILL.md +145 -0
- package/skills/aria-harness-no-stripping/SKILL.md +135 -0
- package/skills/aria-harness-onboarding/SKILL.md +130 -0
- package/skills/aria-harness-output-discipline/SKILL.md +120 -0
- package/skills/aria-harness-substrate-binding/SKILL.md +139 -0
- package/skills/aria-http-harness-client/SKILL.md +85 -0
- package/skills/aria-http-harness-client/scripts/smoke.mjs +47 -0
- package/skills/aria-k8s-deploy/SKILL.md +174 -0
- package/skills/aria-k8s-deploy/agents/openai.yaml +3 -0
- package/skills/aria-ladduniframe/SKILL.md +60 -0
- package/skills/aria-ledger-fleet-execution/SKILL.md +126 -0
- package/skills/aria-live-ops/SKILL.md +54 -0
- package/skills/aria-mac-ssh-ops/SKILL.md +100 -0
- package/skills/aria-memory-index/SKILL.md +42 -0
- package/skills/aria-noor-cognitives/SKILL.md +120 -0
- package/skills/aria-ops/SKILL.md +60 -0
- package/skills/aria-ops/references/live-endpoints.md +59 -0
- package/skills/aria-quality-audit/SKILL.md +133 -0
- package/skills/aria-reasoning/SKILL.md +67 -0
- package/skills/aria-reasoning/references/core-principles.md +42 -0
- package/skills/aria-repo-doctrine/SKILL.md +57 -0
- package/skills/aria-soul-principles/SKILL.md +42 -0
- package/skills/aria-task-codex-executor/SKILL.md +86 -0
- package/skills/aristotle-engine/SKILL.md +42 -0
- package/skills/ci-cd-pipeline/SKILL.md +116 -0
- package/skills/code-review/SKILL.md +131 -0
- package/skills/cross-domain-24/SKILL.md +42 -0
- package/skills/database-design/SKILL.md +124 -0
- package/skills/deepsoul-emotional/SKILL.md +42 -0
- package/skills/deno-kv-raft-pubsub/SKILL.md +561 -0
- package/skills/deno-kv-raft-pubsub/reference/maelstrom-integration.md +393 -0
- package/skills/deno-kv-raft-pubsub/reference/pubsub-api.md +376 -0
- package/skills/deno-kv-raft-pubsub/reference/raft-spec.md +402 -0
- package/skills/deno-kv-raft-pubsub/reference/state-machine.md +182 -0
- package/skills/error-handling/SKILL.md +159 -0
- package/skills/firecrawl/SKILL.md +165 -0
- package/skills/firecrawl/rules/install.md +82 -0
- package/skills/firecrawl/rules/security.md +26 -0
- package/skills/firecrawl-agent/SKILL.md +86 -0
- package/skills/firecrawl-build-interact/SKILL.md +96 -0
- package/skills/firecrawl-build-onboarding/SKILL.md +131 -0
- package/skills/firecrawl-build-onboarding/references/auth-flow.md +39 -0
- package/skills/firecrawl-build-onboarding/references/project-setup.md +20 -0
- package/skills/firecrawl-build-onboarding/references/sdk-installation.md +17 -0
- package/skills/firecrawl-build-scrape/SKILL.md +97 -0
- package/skills/firecrawl-build-search/SKILL.md +97 -0
- package/skills/firecrawl-clone/SKILL.md +419 -0
- package/skills/firecrawl-crawl/SKILL.md +87 -0
- package/skills/firecrawl-download/SKILL.md +98 -0
- package/skills/firecrawl-interact/SKILL.md +112 -0
- package/skills/firecrawl-map/SKILL.md +79 -0
- package/skills/firecrawl-scrape/SKILL.md +97 -0
- package/skills/firecrawl-search/SKILL.md +88 -0
- package/skills/fitrah-guard/SKILL.md +78 -0
- package/skills/forge-quality-rules/SKILL.md +61 -0
- package/skills/ghazali-8lens/SKILL.md +56 -0
- package/skills/ijtihad-novel/SKILL.md +42 -0
- package/skills/ilham-intuition/SKILL.md +42 -0
- package/skills/imagegen/LICENSE.txt +201 -0
- package/skills/imagegen/SKILL.md +374 -0
- package/skills/imagegen/agents/openai.yaml +6 -0
- package/skills/imagegen/assets/imagegen-small.svg +5 -0
- package/skills/imagegen/assets/imagegen.png +0 -0
- package/skills/imagegen/references/cli.md +242 -0
- package/skills/imagegen/references/codex-network.md +33 -0
- package/skills/imagegen/references/image-api.md +90 -0
- package/skills/imagegen/references/prompting.md +118 -0
- package/skills/imagegen/references/sample-prompts.md +433 -0
- package/skills/imagegen/scripts/image_gen.py +995 -0
- package/skills/imagegen/scripts/remove_chroma_key.py +440 -0
- package/skills/istiqra-induction/SKILL.md +44 -0
- package/skills/ladunni-22/SKILL.md +53 -0
- package/skills/mizan/SKILL.md +90 -0
- package/skills/nadia/SKILL.md +56 -0
- package/skills/nadia-psi/SKILL.md +56 -0
- package/skills/never-guess/SKILL.md +75 -0
- package/skills/noor-recognition/SKILL.md +45 -0
- package/skills/observability/SKILL.md +133 -0
- package/skills/openai-docs/LICENSE.txt +201 -0
- package/skills/openai-docs/SKILL.md +100 -0
- package/skills/openai-docs/agents/openai.yaml +14 -0
- package/skills/openai-docs/assets/openai-small.svg +3 -0
- package/skills/openai-docs/assets/openai.png +0 -0
- package/skills/openai-docs/references/latest-model.md +37 -0
- package/skills/openai-docs/references/prompting-guide.md +244 -0
- package/skills/openai-docs/references/upgrade-guide.md +181 -0
- package/skills/openai-docs/scripts/resolve-latest-model-info.js +147 -0
- package/skills/pdf/LICENSE.txt +201 -0
- package/skills/pdf/SKILL.md +85 -0
- package/skills/pdf/agents/openai.yaml +5 -0
- package/skills/pdf/assets/pdf.png +0 -0
- package/skills/playwright/LICENSE.txt +201 -0
- package/skills/playwright/NOTICE.txt +14 -0
- package/skills/playwright/SKILL.md +165 -0
- package/skills/playwright/agents/openai.yaml +6 -0
- package/skills/playwright/assets/playwright-small.svg +3 -0
- package/skills/playwright/assets/playwright.png +0 -0
- package/skills/playwright/references/cli.md +116 -0
- package/skills/playwright/references/workflows.md +95 -0
- package/skills/playwright/scripts/playwright_cli.sh +25 -0
- package/skills/plugin-creator/SKILL.md +178 -0
- package/skills/plugin-creator/agents/openai.yaml +6 -0
- package/skills/plugin-creator/assets/plugin-creator-small.svg +3 -0
- package/skills/plugin-creator/assets/plugin-creator.png +0 -0
- package/skills/plugin-creator/references/plugin-json-spec.md +170 -0
- package/skills/plugin-creator/scripts/create_basic_plugin.py +301 -0
- package/skills/predictor/SKILL.md +43 -0
- package/skills/qiyas-analogy/SKILL.md +204 -0
- package/skills/refactoring/SKILL.md +137 -0
- package/skills/ruh-basis/SKILL.md +42 -0
- package/skills/security-review/SKILL.md +129 -0
- package/skills/skill-creator/SKILL.md +434 -0
- package/skills/skill-creator/agents/openai.yaml +5 -0
- package/skills/skill-creator/assets/skill-creator-small.svg +3 -0
- package/skills/skill-creator/assets/skill-creator.png +0 -0
- package/skills/skill-creator/license.txt +202 -0
- package/skills/skill-creator/references/openai_yaml.md +49 -0
- package/skills/skill-creator/scripts/generate_openai_yaml.py +226 -0
- package/skills/skill-creator/scripts/init_skill.py +400 -0
- package/skills/skill-creator/scripts/quick_validate.py +101 -0
- package/skills/skill-installer/LICENSE.txt +202 -0
- package/skills/skill-installer/SKILL.md +76 -0
- package/skills/skill-installer/agents/openai.yaml +5 -0
- package/skills/skill-installer/assets/skill-installer-small.svg +3 -0
- package/skills/skill-installer/assets/skill-installer.png +0 -0
- package/skills/skill-installer/scripts/github_utils.py +21 -0
- package/skills/skill-installer/scripts/install-skill-from-github.py +308 -0
- package/skills/skill-installer/scripts/list-skills.py +107 -0
- package/skills/skills-and-hooks-reference/SKILL.md +196 -0
- package/skills/soul-domains/SKILL.md +43 -0
- package/skills/tadabbur/SKILL.md +232 -0
- package/skills/tadabbur-ops/SKILL.md +42 -0
- package/skills/tafakkur/SKILL.md +104 -0
- package/skills/testing-strategy/SKILL.md +122 -0
- package/src/action-ledger-core.ts +1054 -0
- package/src/chat.ts +5 -6
- package/src/codebase-scanner.ts +2 -0
- package/src/connectors/claude-code.ts +149 -12
- package/src/connectors/codebase-awareness.ts +325 -25
- package/src/connectors/codex.ts +1273 -40
- package/src/connectors/cursor.ts +8 -0
- package/src/connectors/governed-adapter.ts +174 -0
- package/src/connectors/opencode.ts +18 -2
- package/src/connectors/repo-guard.ts +24 -12
- package/src/connectors/runtime.ts +99 -2
- package/src/connectors/shell.ts +125 -7
- package/src/cross-cli-hive-binding.ts +290 -0
- package/src/garden-control-plane.ts +24 -1
- package/src/governed-surface-runner.ts +1227 -0
- package/src/index.ts +104 -1
- package/src/task-runner.ts +3794 -0
- package/dist/aria-connector/src/install-hooks.d.ts +0 -18
- package/dist/aria-connector/src/install-hooks.d.ts.map +0 -1
- package/dist/aria-connector/src/install-hooks.js +0 -224
- package/dist/aria-connector/src/install-hooks.js.map +0 -1
- package/dist/aria-connector/src/onboarding-wizard.d.ts +0 -5
- package/dist/aria-connector/src/onboarding-wizard.d.ts.map +0 -1
- package/dist/aria-connector/src/onboarding-wizard.js +0 -188
- package/dist/aria-connector/src/onboarding-wizard.js.map +0 -1
- package/dist/cli-0.2.38.tgz +0 -0
- package/dist/install.sh +0 -13
- package/src/__tests__/anthropic-oauth.test.ts +0 -186
- package/src/__tests__/auth-commands.test.ts +0 -132
- package/src/__tests__/owner-login.test.ts +0 -311
|
@@ -0,0 +1,970 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
import { createHash } from 'node:crypto';
|
|
3
|
+
import { spawnSync } from 'node:child_process';
|
|
4
|
+
import {
|
|
5
|
+
existsSync,
|
|
6
|
+
mkdirSync,
|
|
7
|
+
readdirSync,
|
|
8
|
+
readFileSync,
|
|
9
|
+
statSync,
|
|
10
|
+
writeFileSync,
|
|
11
|
+
} from 'node:fs';
|
|
12
|
+
import os from 'node:os';
|
|
13
|
+
import path from 'node:path';
|
|
14
|
+
|
|
15
|
+
const repoRoot = process.cwd();
|
|
16
|
+
const runId = new Date().toISOString().replace(/[:.]/g, '-');
|
|
17
|
+
const outputRoot = path.join(repoRoot, 'artifacts', 'qiyas-tadabbur-model-matrix', runId);
|
|
18
|
+
const outputsDir = path.join(outputRoot, 'outputs');
|
|
19
|
+
const qiyasPerspectives = [
|
|
20
|
+
'Owner-Hamza-tomorrow',
|
|
21
|
+
'operator-client',
|
|
22
|
+
'investor',
|
|
23
|
+
'LLM-consumer',
|
|
24
|
+
'human-end-user',
|
|
25
|
+
'skeptic',
|
|
26
|
+
'compliance',
|
|
27
|
+
'engineering-quality',
|
|
28
|
+
'cognitive-load',
|
|
29
|
+
'scale',
|
|
30
|
+
'Islamic-scholar',
|
|
31
|
+
'clinical-scholar',
|
|
32
|
+
'red-team-attacker',
|
|
33
|
+
'1-week-future-self',
|
|
34
|
+
'1-year-future-self',
|
|
35
|
+
];
|
|
36
|
+
const tadabburStages = [
|
|
37
|
+
'EMBED',
|
|
38
|
+
'EXCAVATE',
|
|
39
|
+
'ROOT TRACE',
|
|
40
|
+
'MULTI-LENS',
|
|
41
|
+
'PATTERN',
|
|
42
|
+
'CONSEQUENCE',
|
|
43
|
+
'DWELLING',
|
|
44
|
+
'COLLAPSE',
|
|
45
|
+
'PRINCIPLE',
|
|
46
|
+
'INVERSION',
|
|
47
|
+
'PERSONAL',
|
|
48
|
+
'VOICE',
|
|
49
|
+
];
|
|
50
|
+
const relevanceRx = /\b(qiyas|tadabbur|taddabur|fire skills|skills active|runtime|runtimes|autofire|first class|quality|gates|hook|cognition|substrate|kernel|qa|compare|model)\b/i;
|
|
51
|
+
|
|
52
|
+
function ensureDir(dir) {
|
|
53
|
+
mkdirSync(dir, { recursive: true, mode: 0o755 });
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
function sha256(value) {
|
|
57
|
+
return createHash('sha256').update(String(value ?? '')).digest('hex');
|
|
58
|
+
}
|
|
59
|
+
|
|
60
|
+
function redactText(value) {
|
|
61
|
+
return String(value ?? '')
|
|
62
|
+
.replace(/sk-[^"\s,}\]]{8,}/g, 'sk-[REDACTED]')
|
|
63
|
+
.replace(/Bearer [^"\s,}\]]{8,}/g, 'Bearer [REDACTED]');
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
function redactRequest(value) {
|
|
67
|
+
if (Array.isArray(value)) return value.map(redactRequest);
|
|
68
|
+
if (typeof value === 'string') return redactText(value);
|
|
69
|
+
if (!value || typeof value !== 'object') return value;
|
|
70
|
+
return Object.fromEntries(Object.entries(value).map(([key, child]) => {
|
|
71
|
+
if (/api[_-]?key|authorization|bearer|secret|token|password/i.test(key) && typeof child !== 'boolean') return [key, '[REDACTED]'];
|
|
72
|
+
return [key, redactRequest(child)];
|
|
73
|
+
}));
|
|
74
|
+
}
|
|
75
|
+
|
|
76
|
+
function writeJsonArtifact(filePath, value) {
|
|
77
|
+
writeFileSync(filePath, JSON.stringify(redactRequest(value), null, 2) + '\n');
|
|
78
|
+
}
|
|
79
|
+
|
|
80
|
+
function asRecord(value) {
|
|
81
|
+
return value && typeof value === 'object' && !Array.isArray(value) ? value : {};
|
|
82
|
+
}
|
|
83
|
+
|
|
84
|
+
function completionUsageDetails(data = {}) {
|
|
85
|
+
const usage = asRecord(data.usage);
|
|
86
|
+
const completionDetails = asRecord(usage.completion_tokens_details || usage.completionTokensDetails);
|
|
87
|
+
const completionTokens = Number(usage.completion_tokens ?? usage.completionTokens ?? 0);
|
|
88
|
+
const reasoningTokens = Number(completionDetails.reasoning_tokens ?? completionDetails.reasoningTokens ?? 0);
|
|
89
|
+
return {
|
|
90
|
+
promptTokens: Number(usage.prompt_tokens ?? usage.promptTokens ?? 0),
|
|
91
|
+
completionTokens,
|
|
92
|
+
totalTokens: Number(usage.total_tokens ?? usage.totalTokens ?? 0),
|
|
93
|
+
reasoningTokens,
|
|
94
|
+
allCompletionTokensSpentOnReasoning: completionTokens > 0 && reasoningTokens >= completionTokens,
|
|
95
|
+
};
|
|
96
|
+
}
|
|
97
|
+
|
|
98
|
+
function argValue(name, fallback = '') {
|
|
99
|
+
const prefix = `--${name}=`;
|
|
100
|
+
const raw = process.argv.find((arg) => arg.startsWith(prefix));
|
|
101
|
+
return raw ? raw.slice(prefix.length) : process.env[`ARIA_QT_${name.replaceAll('-', '_').toUpperCase()}`] || fallback;
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
function argNumber(name, fallback, { min = 1, max = Number.MAX_SAFE_INTEGER } = {}) {
|
|
105
|
+
const value = Number(argValue(name, String(fallback)));
|
|
106
|
+
return Math.min(max, Math.max(min, Number.isFinite(value) ? value : fallback));
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
async function mapConcurrent(items, concurrency, worker) {
|
|
110
|
+
const results = new Array(items.length);
|
|
111
|
+
let next = 0;
|
|
112
|
+
const workers = Array.from({ length: Math.min(concurrency, items.length) }, async () => {
|
|
113
|
+
while (next < items.length) {
|
|
114
|
+
const index = next;
|
|
115
|
+
next += 1;
|
|
116
|
+
results[index] = await worker(items[index], index);
|
|
117
|
+
}
|
|
118
|
+
});
|
|
119
|
+
await Promise.all(workers);
|
|
120
|
+
return results;
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
function walkFiles(root, predicate, maxFiles = 5000) {
|
|
124
|
+
const out = [];
|
|
125
|
+
function visit(dir) {
|
|
126
|
+
if (out.length >= maxFiles) return;
|
|
127
|
+
let entries = [];
|
|
128
|
+
try {
|
|
129
|
+
entries = readdirSync(dir, { withFileTypes: true });
|
|
130
|
+
} catch {
|
|
131
|
+
return;
|
|
132
|
+
}
|
|
133
|
+
for (const entry of entries) {
|
|
134
|
+
const full = path.join(dir, entry.name);
|
|
135
|
+
if (entry.isDirectory()) visit(full);
|
|
136
|
+
else if (predicate(full)) out.push(full);
|
|
137
|
+
if (out.length >= maxFiles) return;
|
|
138
|
+
}
|
|
139
|
+
}
|
|
140
|
+
if (existsSync(root)) visit(root);
|
|
141
|
+
return out;
|
|
142
|
+
}
|
|
143
|
+
|
|
144
|
+
function recentJsonl(root, limit) {
|
|
145
|
+
return walkFiles(root, (file) => file.endsWith('.jsonl'), 12000)
|
|
146
|
+
.map((file) => {
|
|
147
|
+
try {
|
|
148
|
+
return { file, mtimeMs: statSync(file).mtimeMs };
|
|
149
|
+
} catch {
|
|
150
|
+
return null;
|
|
151
|
+
}
|
|
152
|
+
})
|
|
153
|
+
.filter(Boolean)
|
|
154
|
+
.sort((a, b) => b.mtimeMs - a.mtimeMs)
|
|
155
|
+
.slice(0, limit)
|
|
156
|
+
.map((entry) => entry.file);
|
|
157
|
+
}
|
|
158
|
+
|
|
159
|
+
function textFromContent(content) {
|
|
160
|
+
if (typeof content === 'string') return content;
|
|
161
|
+
if (!Array.isArray(content)) return '';
|
|
162
|
+
return content
|
|
163
|
+
.filter((part) => part && (part.type === 'text' || part.type === 'input_text' || part.type === 'output_text'))
|
|
164
|
+
.map((part) => part.text || '')
|
|
165
|
+
.join('\n')
|
|
166
|
+
.trim();
|
|
167
|
+
}
|
|
168
|
+
|
|
169
|
+
function readJsonl(file) {
|
|
170
|
+
try {
|
|
171
|
+
return readFileSync(file, 'utf8')
|
|
172
|
+
.split('\n')
|
|
173
|
+
.filter(Boolean)
|
|
174
|
+
.map((line) => {
|
|
175
|
+
try {
|
|
176
|
+
return JSON.parse(line);
|
|
177
|
+
} catch {
|
|
178
|
+
return null;
|
|
179
|
+
}
|
|
180
|
+
})
|
|
181
|
+
.filter(Boolean);
|
|
182
|
+
} catch {
|
|
183
|
+
return [];
|
|
184
|
+
}
|
|
185
|
+
}
|
|
186
|
+
|
|
187
|
+
function extractCodexPairs(file) {
|
|
188
|
+
const rows = readJsonl(file);
|
|
189
|
+
let model = 'codex-observed';
|
|
190
|
+
const pairs = [];
|
|
191
|
+
let pendingUser = null;
|
|
192
|
+
for (const row of rows) {
|
|
193
|
+
if (row.type === 'session_meta') model = row.payload?.model || model;
|
|
194
|
+
const item = row.type === 'response_item' ? row.payload : null;
|
|
195
|
+
if (!item || item.type !== 'message') continue;
|
|
196
|
+
const role = item.role;
|
|
197
|
+
if (role === 'user') {
|
|
198
|
+
const text = textFromContent(item.content);
|
|
199
|
+
if (text && relevanceRx.test(text)) pendingUser = text;
|
|
200
|
+
} else if (role === 'assistant' && pendingUser) {
|
|
201
|
+
const text = textFromContent(item.content);
|
|
202
|
+
if (text) {
|
|
203
|
+
pairs.push({ source: 'codex', model, file, prompt: pendingUser, observedAnswer: text });
|
|
204
|
+
pendingUser = null;
|
|
205
|
+
}
|
|
206
|
+
}
|
|
207
|
+
}
|
|
208
|
+
return pairs;
|
|
209
|
+
}
|
|
210
|
+
|
|
211
|
+
function extractClaudePairs(file) {
|
|
212
|
+
const rows = readJsonl(file);
|
|
213
|
+
const pairs = [];
|
|
214
|
+
let pendingUser = null;
|
|
215
|
+
for (const row of rows) {
|
|
216
|
+
if (row.type !== 'user' && row.type !== 'assistant') continue;
|
|
217
|
+
const content = row.message?.content;
|
|
218
|
+
if (row.type === 'user') {
|
|
219
|
+
const text = textFromContent(content);
|
|
220
|
+
if (text && relevanceRx.test(text)) pendingUser = text;
|
|
221
|
+
} else if (row.type === 'assistant' && pendingUser) {
|
|
222
|
+
const text = textFromContent(content);
|
|
223
|
+
if (text) {
|
|
224
|
+
pairs.push({ source: 'claude', model: row.message?.model || 'claude-observed', file, prompt: pendingUser, observedAnswer: text });
|
|
225
|
+
pendingUser = null;
|
|
226
|
+
}
|
|
227
|
+
}
|
|
228
|
+
}
|
|
229
|
+
return pairs;
|
|
230
|
+
}
|
|
231
|
+
|
|
232
|
+
function collectPromptPairs({ sessionLimit, pairLimit, maxPromptChars }) {
|
|
233
|
+
const codexRoot = path.join(os.homedir(), '.codex', 'sessions');
|
|
234
|
+
const claudeRoot = path.join(os.homedir(), '.claude', 'projects');
|
|
235
|
+
const codexCandidates = recentJsonl(codexRoot, sessionLimit).flatMap(extractCodexPairs);
|
|
236
|
+
const claudeCandidates = recentJsonl(claudeRoot, sessionLimit).flatMap(extractClaudePairs);
|
|
237
|
+
const candidates = [...codexCandidates, ...claudeCandidates];
|
|
238
|
+
const seen = new Set();
|
|
239
|
+
const filtered = [];
|
|
240
|
+
for (const candidate of candidates) {
|
|
241
|
+
const prompt = String(candidate.prompt || '').replace(/\s+/g, ' ').trim();
|
|
242
|
+
if (prompt.length < 40 || prompt.length > maxPromptChars) continue;
|
|
243
|
+
const key = sha256(prompt);
|
|
244
|
+
if (seen.has(key)) continue;
|
|
245
|
+
seen.add(key);
|
|
246
|
+
filtered.push({ ...candidate, prompt, promptSha256: key });
|
|
247
|
+
}
|
|
248
|
+
filtered.sort((a, b) => promptWeight(b.prompt) - promptWeight(a.prompt));
|
|
249
|
+
const balanced = [];
|
|
250
|
+
const perSourceFloor = Math.max(1, Math.floor(pairLimit / 3));
|
|
251
|
+
for (const source of ['codex', 'claude']) {
|
|
252
|
+
const sourceRows = filtered.filter((row) => row.source === source).slice(0, perSourceFloor);
|
|
253
|
+
for (const row of sourceRows) {
|
|
254
|
+
if (!balanced.find((existing) => existing.promptSha256 === row.promptSha256)) balanced.push(row);
|
|
255
|
+
}
|
|
256
|
+
}
|
|
257
|
+
for (const row of filtered) {
|
|
258
|
+
if (balanced.length >= pairLimit) break;
|
|
259
|
+
if (!balanced.find((existing) => existing.promptSha256 === row.promptSha256)) balanced.push(row);
|
|
260
|
+
}
|
|
261
|
+
return balanced.slice(0, pairLimit);
|
|
262
|
+
}
|
|
263
|
+
|
|
264
|
+
function promptWeight(text) {
|
|
265
|
+
const source = String(text || '').toLowerCase();
|
|
266
|
+
return [
|
|
267
|
+
['qiyas', 8],
|
|
268
|
+
['tadabbur', 8],
|
|
269
|
+
['first class', 5],
|
|
270
|
+
['autofire', 5],
|
|
271
|
+
['runtime', 3],
|
|
272
|
+
['skills', 3],
|
|
273
|
+
['quality', 3],
|
|
274
|
+
['compare', 3],
|
|
275
|
+
['model', 2],
|
|
276
|
+
].reduce((score, [term, weight]) => score + (source.includes(term) ? weight : 0), 0);
|
|
277
|
+
}
|
|
278
|
+
|
|
279
|
+
function providerApiKey(provider) {
|
|
280
|
+
if (provider === 'deepseek') return process.env.DEEPSEEK_API_KEY || process.env.ARIA_DEEPSEEK_API_KEY || '';
|
|
281
|
+
if (provider === 'xai') return process.env.XAI_API_KEY || process.env.GROK_API_KEY || '';
|
|
282
|
+
if (provider === 'openai') return process.env.OPENAI_API_KEY || '';
|
|
283
|
+
return '';
|
|
284
|
+
}
|
|
285
|
+
|
|
286
|
+
function providerUrl(provider) {
|
|
287
|
+
if (provider === 'deepseek') return 'https://api.deepseek.com/v1/chat/completions';
|
|
288
|
+
if (provider === 'xai') return 'https://api.x.ai/v1/chat/completions';
|
|
289
|
+
if (provider === 'openai') return 'https://api.openai.com/v1/chat/completions';
|
|
290
|
+
throw new Error(`unsupported provider: ${provider}`);
|
|
291
|
+
}
|
|
292
|
+
|
|
293
|
+
function parseModels() {
|
|
294
|
+
const raw = argValue('models', 'deepseek:deepseek-v4-flash,deepseek:deepseek-v4-pro,xai:grok-4.3,openai:gpt-5.5,openai:gpt-5.3-codex');
|
|
295
|
+
return raw.split(',')
|
|
296
|
+
.map((item) => item.trim())
|
|
297
|
+
.filter(Boolean)
|
|
298
|
+
.map((item) => {
|
|
299
|
+
const [provider, model] = item.split(':');
|
|
300
|
+
return { provider, model, id: `${provider}:${model}`, apiKeyPresent: Boolean(providerApiKey(provider)) };
|
|
301
|
+
});
|
|
302
|
+
}
|
|
303
|
+
|
|
304
|
+
function directSystemPrompt() {
|
|
305
|
+
return [
|
|
306
|
+
'You are a senior engineering and cognition evaluator.',
|
|
307
|
+
'Answer the user prompt directly.',
|
|
308
|
+
'Use full Qiyas-15 and full Tadabbur-12 as operative reasoning, but keep an owner-readable executive answer first.',
|
|
309
|
+
'Include enough structure that a deterministic grader can see whether the 15 Qiyas perspectives and 12 Tadabbur stages were actually covered.',
|
|
310
|
+
'Do not claim proof that is not present. Name a concrete next action and a measurable verification predicate.',
|
|
311
|
+
].join(' ');
|
|
312
|
+
}
|
|
313
|
+
|
|
314
|
+
function matrixUserPrompt(prompt) {
|
|
315
|
+
return [
|
|
316
|
+
'Use the user prompt below as the exact task substrate.',
|
|
317
|
+
'Produce a full Qiyas and full Tadabbur quality answer that would help the owner decide what to do next.',
|
|
318
|
+
'Do not ask what to do next if a best next action can be named from the prompt.',
|
|
319
|
+
'',
|
|
320
|
+
'USER PROMPT:',
|
|
321
|
+
prompt,
|
|
322
|
+
].join('\n');
|
|
323
|
+
}
|
|
324
|
+
|
|
325
|
+
async function callChatModel(modelSpec, prompt, index) {
|
|
326
|
+
if (!modelSpec.apiKeyPresent) {
|
|
327
|
+
return {
|
|
328
|
+
ok: false,
|
|
329
|
+
skipped: true,
|
|
330
|
+
reason: `missing API key for ${modelSpec.provider}`,
|
|
331
|
+
text: '',
|
|
332
|
+
durationMs: 0,
|
|
333
|
+
usage: null,
|
|
334
|
+
};
|
|
335
|
+
}
|
|
336
|
+
const started = Date.now();
|
|
337
|
+
const maxTokens = argNumber('max-tokens', 1800, { min: 400, max: 6000 });
|
|
338
|
+
const attempts = modelSpec.provider === 'deepseek' ? 2 : 1;
|
|
339
|
+
const blanks = [];
|
|
340
|
+
const requestAttempts = [];
|
|
341
|
+
for (let attempt = 1; attempt <= attempts; attempt += 1) {
|
|
342
|
+
const visibleAnswerSuffix = attempt > 1
|
|
343
|
+
? '\n\nReturn a visible final answer in message.content. Do not spend the entire completion budget on hidden reasoning.'
|
|
344
|
+
: '';
|
|
345
|
+
const body = {
|
|
346
|
+
model: modelSpec.model,
|
|
347
|
+
messages: [
|
|
348
|
+
{ role: 'system', content: directSystemPrompt() + visibleAnswerSuffix },
|
|
349
|
+
{ role: 'user', content: matrixUserPrompt(prompt) },
|
|
350
|
+
],
|
|
351
|
+
max_tokens: Math.min(6000, maxTokens * attempt),
|
|
352
|
+
temperature: Number(argValue('temperature', '0.2')),
|
|
353
|
+
stream: false,
|
|
354
|
+
metadata: { source: 'qiyas-tadabbur-model-matrix', index, attempt },
|
|
355
|
+
};
|
|
356
|
+
requestAttempts.push({
|
|
357
|
+
attempt,
|
|
358
|
+
provider: modelSpec.provider,
|
|
359
|
+
model: modelSpec.model,
|
|
360
|
+
url: providerUrl(modelSpec.provider),
|
|
361
|
+
requestBody: redactRequest(body),
|
|
362
|
+
requestSha256: sha256(JSON.stringify(body)),
|
|
363
|
+
});
|
|
364
|
+
const response = await fetch(providerUrl(modelSpec.provider), {
|
|
365
|
+
method: 'POST',
|
|
366
|
+
headers: {
|
|
367
|
+
'content-type': 'application/json',
|
|
368
|
+
authorization: `Bearer ${providerApiKey(modelSpec.provider)}`,
|
|
369
|
+
},
|
|
370
|
+
body: JSON.stringify(body),
|
|
371
|
+
});
|
|
372
|
+
const rawText = await response.text();
|
|
373
|
+
let data = {};
|
|
374
|
+
try {
|
|
375
|
+
data = rawText ? JSON.parse(rawText) : {};
|
|
376
|
+
} catch {
|
|
377
|
+
data = { raw: rawText };
|
|
378
|
+
}
|
|
379
|
+
if (!response.ok) {
|
|
380
|
+
return {
|
|
381
|
+
ok: false,
|
|
382
|
+
skipped: false,
|
|
383
|
+
reason: `${modelSpec.provider} ${modelSpec.model} ${response.status}: ${rawText.slice(0, 500)}`,
|
|
384
|
+
text: '',
|
|
385
|
+
durationMs: Date.now() - started,
|
|
386
|
+
usage: data.usage || null,
|
|
387
|
+
usageDetails: completionUsageDetails(data),
|
|
388
|
+
rawSha256: sha256(rawText),
|
|
389
|
+
rawText,
|
|
390
|
+
attempts: attempt,
|
|
391
|
+
requestAttempts,
|
|
392
|
+
};
|
|
393
|
+
}
|
|
394
|
+
const text = data?.choices?.[0]?.message?.content || '';
|
|
395
|
+
if (String(text).trim()) {
|
|
396
|
+
return {
|
|
397
|
+
ok: true,
|
|
398
|
+
skipped: false,
|
|
399
|
+
reason: null,
|
|
400
|
+
text,
|
|
401
|
+
durationMs: Date.now() - started,
|
|
402
|
+
usage: data.usage || null,
|
|
403
|
+
usageDetails: completionUsageDetails(data),
|
|
404
|
+
rawSha256: sha256(rawText),
|
|
405
|
+
rawText,
|
|
406
|
+
attempts: attempt,
|
|
407
|
+
requestAttempts,
|
|
408
|
+
};
|
|
409
|
+
}
|
|
410
|
+
blanks.push({ attempt, usage: data.usage || null, usageDetails: completionUsageDetails(data), rawSha256: sha256(rawText), rawText });
|
|
411
|
+
}
|
|
412
|
+
return {
|
|
413
|
+
ok: false,
|
|
414
|
+
skipped: false,
|
|
415
|
+
visibleOutputFailure: true,
|
|
416
|
+
reason: `${modelSpec.provider} ${modelSpec.model} returned no visible answer text after ${attempts} attempt(s); usage=${JSON.stringify(blanks.map((blank) => blank.usageDetails))}`,
|
|
417
|
+
text: '',
|
|
418
|
+
durationMs: Date.now() - started,
|
|
419
|
+
usage: blanks.at(-1)?.usage || null,
|
|
420
|
+
usageDetails: blanks.at(-1)?.usageDetails || null,
|
|
421
|
+
rawSha256: blanks.at(-1)?.rawSha256 || null,
|
|
422
|
+
rawText: blanks.at(-1)?.rawText || '',
|
|
423
|
+
attempts,
|
|
424
|
+
requestAttempts,
|
|
425
|
+
blankAttempts: blanks.map((blank) => ({ attempt: blank.attempt, usageDetails: blank.usageDetails, rawSha256: blank.rawSha256 })),
|
|
426
|
+
};
|
|
427
|
+
}
|
|
428
|
+
|
|
429
|
+
function includeClaudeTerminalArm() {
|
|
430
|
+
return ['1', 'true', 'yes'].includes(String(argValue('claude-terminal', process.env.ARIA_QT_CLAUDE_TERMINAL || 'false')).toLowerCase());
|
|
431
|
+
}
|
|
432
|
+
|
|
433
|
+
function shellQuote(value) {
|
|
434
|
+
return `'${String(value).replaceAll("'", "'\\''")}'`;
|
|
435
|
+
}
|
|
436
|
+
|
|
437
|
+
function claudeTerminalCommand(prompt) {
|
|
438
|
+
const claudePath = process.env.ARIA_QT_CLAUDE_PATH || '/home/hamzaibrahim1/.local/bin/claude';
|
|
439
|
+
const model = argValue('claude-model', process.env.ARIA_QT_CLAUDE_MODEL || 'opus');
|
|
440
|
+
const budget = argValue('claude-budget-usd', process.env.ARIA_QT_CLAUDE_BUDGET_USD || '0.35');
|
|
441
|
+
return [
|
|
442
|
+
shellQuote(claudePath),
|
|
443
|
+
'--print',
|
|
444
|
+
'--input-format text',
|
|
445
|
+
'--output-format text',
|
|
446
|
+
'--no-session-persistence',
|
|
447
|
+
'--permission-mode plan',
|
|
448
|
+
'--tools ""',
|
|
449
|
+
`--model ${shellQuote(model)}`,
|
|
450
|
+
`--max-budget-usd ${shellQuote(budget)}`,
|
|
451
|
+
shellQuote(prompt),
|
|
452
|
+
].join(' ');
|
|
453
|
+
}
|
|
454
|
+
|
|
455
|
+
function stripTerminalControls(text = '') {
|
|
456
|
+
return String(text || '')
|
|
457
|
+
.replace(/\u001b\[[0-?]*[ -/]*[@-~]/g, '')
|
|
458
|
+
.replace(/\u001b\][^\u0007]*(?:\u0007|\u001b\\)/g, '')
|
|
459
|
+
.replace(/\r/g, '')
|
|
460
|
+
.trim();
|
|
461
|
+
}
|
|
462
|
+
|
|
463
|
+
function callClaudeCodeTerminal(promptPair, index) {
|
|
464
|
+
const claudePath = process.env.ARIA_QT_CLAUDE_PATH || '/home/hamzaibrahim1/.local/bin/claude';
|
|
465
|
+
if (!existsSync(claudePath)) {
|
|
466
|
+
return {
|
|
467
|
+
ok: false,
|
|
468
|
+
skipped: true,
|
|
469
|
+
reason: `claude executable missing at ${claudePath}`,
|
|
470
|
+
text: '',
|
|
471
|
+
durationMs: 0,
|
|
472
|
+
usage: null,
|
|
473
|
+
};
|
|
474
|
+
}
|
|
475
|
+
const started = Date.now();
|
|
476
|
+
const prompt = [
|
|
477
|
+
directSystemPrompt(),
|
|
478
|
+
'',
|
|
479
|
+
matrixUserPrompt(promptPair.prompt),
|
|
480
|
+
].join('\n');
|
|
481
|
+
const command = claudeTerminalCommand(prompt);
|
|
482
|
+
const timeoutMs = Number(argValue('claude-timeout-ms', process.env.ARIA_QT_CLAUDE_TIMEOUT_MS || '0'));
|
|
483
|
+
const result = spawnSync('script', ['-qefc', command, '/dev/null'], {
|
|
484
|
+
cwd: repoRoot,
|
|
485
|
+
encoding: 'utf8',
|
|
486
|
+
maxBuffer: 1024 * 1024 * 8,
|
|
487
|
+
...(timeoutMs > 0 ? { timeout: timeoutMs } : {}),
|
|
488
|
+
env: {
|
|
489
|
+
...process.env,
|
|
490
|
+
CLAUDE_CODE_SIMPLE: process.env.CLAUDE_CODE_SIMPLE || '1',
|
|
491
|
+
},
|
|
492
|
+
});
|
|
493
|
+
const stdout = result.stdout || '';
|
|
494
|
+
const stderr = result.stderr || '';
|
|
495
|
+
const text = stripTerminalControls(stdout);
|
|
496
|
+
const signal = result.signal || null;
|
|
497
|
+
const error = result.error ? String(result.error.message || result.error) : null;
|
|
498
|
+
const authFailure = /invalid api key|api key|auth|authentication|not logged in|login required/i.test(`${text}\n${stderr}`);
|
|
499
|
+
const ok = result.status === 0 && text.length > 0 && !signal && !error;
|
|
500
|
+
return {
|
|
501
|
+
ok,
|
|
502
|
+
skipped: authFailure,
|
|
503
|
+
terminalLaunched: true,
|
|
504
|
+
authFailure,
|
|
505
|
+
reason: ok ? null : authFailure
|
|
506
|
+
? `claude terminal auth failure: ${text.slice(0, 200) || stderr.slice(0, 200)}`
|
|
507
|
+
: `claude terminal status=${result.status} signal=${signal || 'none'} error=${error || 'none'} stderr=${stderr.slice(0, 500)}`,
|
|
508
|
+
text: authFailure ? '' : text,
|
|
509
|
+
durationMs: Date.now() - started,
|
|
510
|
+
usage: null,
|
|
511
|
+
usageDetails: null,
|
|
512
|
+
inputPrompt: prompt,
|
|
513
|
+
inputPromptSha256: sha256(prompt),
|
|
514
|
+
requestBody: {
|
|
515
|
+
terminal: 'claude-code',
|
|
516
|
+
command: 'script -qefc <claude-code-terminal-command> /dev/null',
|
|
517
|
+
claudePath,
|
|
518
|
+
model: argValue('claude-model', process.env.ARIA_QT_CLAUDE_MODEL || 'opus'),
|
|
519
|
+
budgetUsd: argValue('claude-budget-usd', process.env.ARIA_QT_CLAUDE_BUDGET_USD || '0.35'),
|
|
520
|
+
permissionMode: 'plan',
|
|
521
|
+
tools: '',
|
|
522
|
+
promptSha256: sha256(prompt),
|
|
523
|
+
index,
|
|
524
|
+
},
|
|
525
|
+
rawSha256: sha256([stdout, stderr, result.status, signal, error].join('\n---\n')),
|
|
526
|
+
rawText: JSON.stringify({
|
|
527
|
+
command: 'script -qefc <claude-code-terminal-command> /dev/null',
|
|
528
|
+
terminalCommand: `<claude> --print --input-format text --output-format text --no-session-persistence --permission-mode plan --tools "" --model ${argValue('claude-model', process.env.ARIA_QT_CLAUDE_MODEL || 'opus')} --max-budget-usd ${argValue('claude-budget-usd', process.env.ARIA_QT_CLAUDE_BUDGET_USD || '0.35')} <prompt sha256=${sha256(prompt)}>`,
|
|
529
|
+
status: result.status,
|
|
530
|
+
signal,
|
|
531
|
+
error,
|
|
532
|
+
stdout,
|
|
533
|
+
stderr,
|
|
534
|
+
index,
|
|
535
|
+
}, null, 2),
|
|
536
|
+
};
|
|
537
|
+
}
|
|
538
|
+
|
|
539
|
+
function hasTerm(text, term) {
|
|
540
|
+
const escaped = term.replace(/[.*+?^${}()|[\]\\]/g, '\\$&').replace(/\\ /g, '\\s+');
|
|
541
|
+
return new RegExp(`\\b${escaped}\\b`, 'i').test(String(text || ''));
|
|
542
|
+
}
|
|
543
|
+
|
|
544
|
+
function countHits(text, terms) {
|
|
545
|
+
return terms.filter((term) => hasTerm(text, term)).length;
|
|
546
|
+
}
|
|
547
|
+
|
|
548
|
+
function scoreAnswer(text, prompt = '') {
|
|
549
|
+
const source = String(text || '');
|
|
550
|
+
const lower = source.toLowerCase();
|
|
551
|
+
const qiyasHits = countHits(source, qiyasPerspectives);
|
|
552
|
+
const tadabburHits = countHits(source, tadabburStages);
|
|
553
|
+
const hasFourPillars = ['asl', "far'", 'hukm', 'illah'].every((term) => lower.includes(term.replace("'", '')));
|
|
554
|
+
const furuq = /\bfuruq\b|false analog|material distinction/i.test(source);
|
|
555
|
+
const nextAction = /\b(next action|next step|do this|implement|run|verify|inspect|measure)\b/i.test(source);
|
|
556
|
+
const measurablePredicate = /\b(predicate|threshold|metric|score|pass|fail|delta|%|\d+\/\d+|artifact|sha256|exit=0)\b/i.test(source);
|
|
557
|
+
const evidenceBoundary = /\b(evidence|observed|verified|unverified|bounded|not measured|not proven|cannot verify)\b/i.test(source);
|
|
558
|
+
const learningLoop = /\b(lesson|learning|reflexion|dalio|feedback|record|future selection|update the loop)\b/i.test(source);
|
|
559
|
+
const ownerReadableFirst = !/^\s*<\s*(?:cognition|applied_cognition|qiyas_15_pass|tadabbur_questions)/i.test(source)
|
|
560
|
+
&& source.length >= 250
|
|
561
|
+
&& source.length <= 6000;
|
|
562
|
+
const noAskOnly = !/\bwhat would you like me to do next\b|\bhow would you like me to proceed\b/i.test(source);
|
|
563
|
+
const noFalseClosure = !/\b(guaranteed|fully complete|production ready|100% proven)\b/i.test(source);
|
|
564
|
+
const promptTerms = new Set(String(prompt).toLowerCase().split(/[^a-z0-9]+/).filter((term) => term.length > 5));
|
|
565
|
+
const promptTermHits = [...promptTerms].filter((term) => lower.includes(term)).length;
|
|
566
|
+
const score = (
|
|
567
|
+
qiyasHits * 0.8
|
|
568
|
+
+ tadabburHits * 0.9
|
|
569
|
+
+ (hasFourPillars ? 3 : 0)
|
|
570
|
+
+ (furuq ? 2 : 0)
|
|
571
|
+
+ (nextAction ? 2 : 0)
|
|
572
|
+
+ (measurablePredicate ? 2 : 0)
|
|
573
|
+
+ (evidenceBoundary ? 2 : 0)
|
|
574
|
+
+ (learningLoop ? 1.5 : 0)
|
|
575
|
+
+ (ownerReadableFirst ? 1.5 : 0)
|
|
576
|
+
+ (noAskOnly ? 1 : -2)
|
|
577
|
+
+ (noFalseClosure ? 1 : -3)
|
|
578
|
+
+ Math.min(promptTermHits, 8) * 0.2
|
|
579
|
+
);
|
|
580
|
+
const findings = [];
|
|
581
|
+
if (qiyasHits < 15) findings.push(`qiyas coverage ${qiyasHits}/15`);
|
|
582
|
+
if (tadabburHits < 12) findings.push(`tadabbur coverage ${tadabburHits}/12`);
|
|
583
|
+
if (!hasFourPillars) findings.push('missing explicit four-pillar qiyas');
|
|
584
|
+
if (!furuq) findings.push('missing furuq false-analogy check');
|
|
585
|
+
if (!nextAction) findings.push('missing concrete next action');
|
|
586
|
+
if (!measurablePredicate) findings.push('missing measurable predicate');
|
|
587
|
+
if (!evidenceBoundary) findings.push('missing evidence boundary');
|
|
588
|
+
if (!learningLoop) findings.push('missing learning/reflexion loop');
|
|
589
|
+
if (!ownerReadableFirst) findings.push('owner-readable executive surface weak or bloated');
|
|
590
|
+
if (!noAskOnly) findings.push('ask-only ending');
|
|
591
|
+
if (!noFalseClosure) findings.push('false closure language');
|
|
592
|
+
return {
|
|
593
|
+
score: Number(score.toFixed(3)),
|
|
594
|
+
qiyasHits,
|
|
595
|
+
tadabburHits,
|
|
596
|
+
hasFourPillars,
|
|
597
|
+
furuq,
|
|
598
|
+
nextAction,
|
|
599
|
+
measurablePredicate,
|
|
600
|
+
evidenceBoundary,
|
|
601
|
+
learningLoop,
|
|
602
|
+
ownerReadableFirst,
|
|
603
|
+
noAskOnly,
|
|
604
|
+
noFalseClosure,
|
|
605
|
+
chars: source.length,
|
|
606
|
+
sha256: sha256(source),
|
|
607
|
+
findings,
|
|
608
|
+
};
|
|
609
|
+
}
|
|
610
|
+
|
|
611
|
+
function comparePromptRows(rows) {
|
|
612
|
+
const byPrompt = new Map();
|
|
613
|
+
for (const row of rows) {
|
|
614
|
+
if (!byPrompt.has(row.promptSha256)) byPrompt.set(row.promptSha256, []);
|
|
615
|
+
byPrompt.get(row.promptSha256).push(row);
|
|
616
|
+
}
|
|
617
|
+
const comparisons = [];
|
|
618
|
+
for (const group of byPrompt.values()) {
|
|
619
|
+
const scored = group.filter((row) => row.ok && row.score);
|
|
620
|
+
scored.sort((a, b) => b.score.score - a.score.score || b.score.qiyasHits - a.score.qiyasHits || b.score.tadabburHits - a.score.tadabburHits);
|
|
621
|
+
if (!scored.length) continue;
|
|
622
|
+
comparisons.push({
|
|
623
|
+
promptSha256: scored[0].promptSha256,
|
|
624
|
+
prompt: scored[0].prompt,
|
|
625
|
+
winner: scored[0].arm,
|
|
626
|
+
winnerScore: scored[0].score.score,
|
|
627
|
+
spread: Number((scored[0].score.score - scored[scored.length - 1].score.score).toFixed(3)),
|
|
628
|
+
rows: scored.map((row) => ({
|
|
629
|
+
arm: row.arm,
|
|
630
|
+
score: row.score.score,
|
|
631
|
+
qiyasHits: row.score.qiyasHits,
|
|
632
|
+
tadabburHits: row.score.tadabburHits,
|
|
633
|
+
findings: row.score.findings,
|
|
634
|
+
})),
|
|
635
|
+
});
|
|
636
|
+
}
|
|
637
|
+
return comparisons;
|
|
638
|
+
}
|
|
639
|
+
|
|
640
|
+
function renderMarkdown(summary, comparisons) {
|
|
641
|
+
const lines = [
|
|
642
|
+
'# Qiyas/Tadabbur Model Matrix',
|
|
643
|
+
'',
|
|
644
|
+
`- run_id: ${summary.runId}`,
|
|
645
|
+
`- prompts: ${summary.promptCount}`,
|
|
646
|
+
`- live model arms: ${summary.liveArms.join(', ') || 'none'}`,
|
|
647
|
+
`- terminal arms: ${summary.terminalArms.join(', ') || 'none'}`,
|
|
648
|
+
`- observed transcript arms: ${summary.observedArms.join(', ') || 'none'}`,
|
|
649
|
+
`- skipped arms: ${summary.skippedArms.join(', ') || 'none'}`,
|
|
650
|
+
`- visible output failures: ${summary.visibleOutputFailures}`,
|
|
651
|
+
`- terminal launch rows: ${summary.terminalLaunchRows}`,
|
|
652
|
+
`- evidence boundary: ${summary.evidenceBoundary}`,
|
|
653
|
+
'',
|
|
654
|
+
'## Aggregate',
|
|
655
|
+
'',
|
|
656
|
+
'| Arm | Calls | Mean | Qiyas Mean | Tadabbur Mean | Full Qiyas | Full Tadabbur | Fail Findings |',
|
|
657
|
+
'|---|---:|---:|---:|---:|---:|---:|---:|',
|
|
658
|
+
...summary.armStats.map((row) => `| ${row.arm} | ${row.calls} | ${row.meanScore} | ${row.meanQiyas} | ${row.meanTadabbur} | ${row.fullQiyas} | ${row.fullTadabbur} | ${row.findingCount} |`),
|
|
659
|
+
'',
|
|
660
|
+
'## Per Prompt Winners',
|
|
661
|
+
'',
|
|
662
|
+
'| Prompt | Winner | Score | Spread |',
|
|
663
|
+
'|---|---|---:|---:|',
|
|
664
|
+
...comparisons.map((row) => `| ${row.prompt.replaceAll('|', '\\|').slice(0, 220)} | ${row.winner} | ${row.winnerScore} | ${row.spread} |`),
|
|
665
|
+
'',
|
|
666
|
+
'## Gap Pattern',
|
|
667
|
+
'',
|
|
668
|
+
...summary.topFindings.map((row) => `- ${row.finding}: ${row.count}`),
|
|
669
|
+
'',
|
|
670
|
+
];
|
|
671
|
+
return lines.join('\n');
|
|
672
|
+
}
|
|
673
|
+
|
|
674
|
+
function mean(values) {
|
|
675
|
+
return values.length ? values.reduce((sum, value) => sum + value, 0) / values.length : 0;
|
|
676
|
+
}
|
|
677
|
+
|
|
678
|
+
function summarize(rows, prompts, models, comparisons) {
|
|
679
|
+
const scoredRows = rows.filter((row) => row.ok && row.score);
|
|
680
|
+
const armNames = [...new Set(rows.map((row) => row.arm))].sort();
|
|
681
|
+
const armStats = armNames.map((arm) => {
|
|
682
|
+
const armRows = scoredRows.filter((row) => row.arm === arm);
|
|
683
|
+
return {
|
|
684
|
+
arm,
|
|
685
|
+
calls: armRows.length,
|
|
686
|
+
meanScore: Number(mean(armRows.map((row) => row.score.score)).toFixed(3)),
|
|
687
|
+
meanQiyas: Number(mean(armRows.map((row) => row.score.qiyasHits)).toFixed(3)),
|
|
688
|
+
meanTadabbur: Number(mean(armRows.map((row) => row.score.tadabburHits)).toFixed(3)),
|
|
689
|
+
fullQiyas: armRows.filter((row) => row.score.qiyasHits === 15).length,
|
|
690
|
+
fullTadabbur: armRows.filter((row) => row.score.tadabburHits === 12).length,
|
|
691
|
+
findingCount: armRows.reduce((sum, row) => sum + row.score.findings.length, 0),
|
|
692
|
+
};
|
|
693
|
+
}).sort((a, b) => b.meanScore - a.meanScore);
|
|
694
|
+
const findingCounts = new Map();
|
|
695
|
+
for (const row of scoredRows) {
|
|
696
|
+
for (const finding of row.score.findings) {
|
|
697
|
+
findingCounts.set(finding, (findingCounts.get(finding) || 0) + 1);
|
|
698
|
+
}
|
|
699
|
+
}
|
|
700
|
+
const topFindings = [...findingCounts.entries()]
|
|
701
|
+
.map(([finding, count]) => ({ finding, count }))
|
|
702
|
+
.sort((a, b) => b.count - a.count)
|
|
703
|
+
.slice(0, 12);
|
|
704
|
+
return {
|
|
705
|
+
schema: 'aria.qiyas_tadabbur_model_matrix.v1',
|
|
706
|
+
runId,
|
|
707
|
+
generatedAt: new Date().toISOString(),
|
|
708
|
+
evidenceBoundary: 'Live arms are direct provider API calls. GPT/Codex and Claude entries are observed transcript outputs unless an API key/model is available. Scores are deterministic coverage/quality signals, not a statistically powered benchmark.',
|
|
709
|
+
promptCount: prompts.length,
|
|
710
|
+
models,
|
|
711
|
+
liveArms: models.filter((model) => model.apiKeyPresent).map((model) => model.id),
|
|
712
|
+
terminalArms: [...new Set(rows.filter((row) => row.source === 'claude_code_terminal').map((row) => row.arm))].sort(),
|
|
713
|
+
observedArms: [...new Set(rows.filter((row) => row.source === 'observed').map((row) => row.arm))].sort(),
|
|
714
|
+
skippedArms: rows.filter((row) => row.skipped).map((row) => row.arm),
|
|
715
|
+
visibleOutputFailures: rows.filter((row) => row.visibleOutputFailure || (!row.skipped && !row.ok && /no visible answer text/i.test(row.reason || ''))).length,
|
|
716
|
+
terminalLaunchRows: rows.filter((row) => row.terminalLaunched).length,
|
|
717
|
+
armStats,
|
|
718
|
+
topFindings,
|
|
719
|
+
comparisons: comparisons.map((row) => ({
|
|
720
|
+
promptSha256: row.promptSha256,
|
|
721
|
+
winner: row.winner,
|
|
722
|
+
winnerScore: row.winnerScore,
|
|
723
|
+
spread: row.spread,
|
|
724
|
+
})),
|
|
725
|
+
outputRoot,
|
|
726
|
+
};
|
|
727
|
+
}
|
|
728
|
+
|
|
729
|
+
function buildEvidenceManifest({ summary, promptPairs, rows, comparisons, artifacts }) {
|
|
730
|
+
return {
|
|
731
|
+
schema: 'aria.qiyas_tadabbur_model_matrix.evidence_manifest.v1',
|
|
732
|
+
runId,
|
|
733
|
+
generatedAt: new Date().toISOString(),
|
|
734
|
+
command: {
|
|
735
|
+
cwd: repoRoot,
|
|
736
|
+
argv: process.argv,
|
|
737
|
+
},
|
|
738
|
+
envKeyPresence: {
|
|
739
|
+
DEEPSEEK_API_KEY: Boolean(process.env.DEEPSEEK_API_KEY),
|
|
740
|
+
ARIA_DEEPSEEK_API_KEY: Boolean(process.env.ARIA_DEEPSEEK_API_KEY),
|
|
741
|
+
XAI_API_KEY: Boolean(process.env.XAI_API_KEY),
|
|
742
|
+
GROK_API_KEY: Boolean(process.env.GROK_API_KEY),
|
|
743
|
+
ANTHROPIC_API_KEY: Boolean(process.env.ANTHROPIC_API_KEY),
|
|
744
|
+
OPENAI_API_KEY: Boolean(process.env.OPENAI_API_KEY),
|
|
745
|
+
},
|
|
746
|
+
prompts: promptPairs.map((prompt) => ({
|
|
747
|
+
source: prompt.source,
|
|
748
|
+
model: prompt.model,
|
|
749
|
+
sourceSessionFile: prompt.file,
|
|
750
|
+
promptSha256: prompt.promptSha256,
|
|
751
|
+
chars: prompt.prompt.length,
|
|
752
|
+
inputPath: prompt.inputPath || null,
|
|
753
|
+
})),
|
|
754
|
+
rowArtifacts: rows.map((row) => ({
|
|
755
|
+
source: row.source,
|
|
756
|
+
arm: row.arm,
|
|
757
|
+
provider: row.provider,
|
|
758
|
+
model: row.model,
|
|
759
|
+
promptSha256: row.promptSha256,
|
|
760
|
+
sourceSessionFile: row.sourceSessionFile,
|
|
761
|
+
ok: row.ok,
|
|
762
|
+
skipped: row.skipped,
|
|
763
|
+
terminalLaunched: row.terminalLaunched === true,
|
|
764
|
+
visibleOutputFailure: row.visibleOutputFailure === true,
|
|
765
|
+
reason: row.reason,
|
|
766
|
+
attempts: row.attempts || null,
|
|
767
|
+
durationMs: row.durationMs,
|
|
768
|
+
usageDetails: row.usageDetails || null,
|
|
769
|
+
inputPath: row.inputPath || null,
|
|
770
|
+
requestPath: row.requestPath || null,
|
|
771
|
+
requestSha256: row.requestSha256 || null,
|
|
772
|
+
textPath: row.textPath || null,
|
|
773
|
+
rawPath: row.rawPath || null,
|
|
774
|
+
rawSha256: row.rawSha256 || null,
|
|
775
|
+
score: row.score ? {
|
|
776
|
+
score: row.score.score,
|
|
777
|
+
qiyasHits: row.score.qiyasHits,
|
|
778
|
+
tadabburHits: row.score.tadabburHits,
|
|
779
|
+
findings: row.score.findings,
|
|
780
|
+
} : null,
|
|
781
|
+
})),
|
|
782
|
+
comparisons: comparisons.map((row) => ({
|
|
783
|
+
promptSha256: row.promptSha256,
|
|
784
|
+
winner: row.winner,
|
|
785
|
+
winnerScore: row.winnerScore,
|
|
786
|
+
spread: row.spread,
|
|
787
|
+
rows: row.rows,
|
|
788
|
+
})),
|
|
789
|
+
summary,
|
|
790
|
+
artifacts,
|
|
791
|
+
};
|
|
792
|
+
}
|
|
793
|
+
|
|
794
|
+
async function main() {
|
|
795
|
+
ensureDir(outputRoot);
|
|
796
|
+
ensureDir(outputsDir);
|
|
797
|
+
const count = argNumber('count', 4, { min: 1, max: 100 });
|
|
798
|
+
const sessionLimit = argNumber('session-limit', 80, { min: 1, max: 500 });
|
|
799
|
+
const maxPromptChars = argNumber('max-prompt-chars', 1600, { min: 200, max: 8000 });
|
|
800
|
+
const concurrency = argNumber('concurrency', 4, { min: 1, max: 12 });
|
|
801
|
+
const promptPairs = collectPromptPairs({ sessionLimit, pairLimit: count, maxPromptChars });
|
|
802
|
+
if (!promptPairs.length) throw new Error('no relevant qiyas/tadabbur/autofire prompts found in local sessions');
|
|
803
|
+
const models = parseModels();
|
|
804
|
+
const liveWork = [];
|
|
805
|
+
for (const promptPair of promptPairs) {
|
|
806
|
+
for (const model of models) {
|
|
807
|
+
liveWork.push({ promptPair, model });
|
|
808
|
+
}
|
|
809
|
+
}
|
|
810
|
+
const rows = [];
|
|
811
|
+
const jsonlPath = path.join(outputRoot, 'rows.jsonl');
|
|
812
|
+
const liveRows = await mapConcurrent(liveWork, concurrency, async (work, index) => {
|
|
813
|
+
const result = await callChatModel(work.model, work.promptPair.prompt, index + 1);
|
|
814
|
+
const arm = work.model.id;
|
|
815
|
+
const artifactStem = `${String(index + 1).padStart(3, '0')}-${arm.replace(/[^a-z0-9._-]/gi, '_')}`;
|
|
816
|
+
const inputPath = path.join(outputsDir, `${artifactStem}.input.txt`);
|
|
817
|
+
const requestPath = path.join(outputsDir, `${artifactStem}.request.json`);
|
|
818
|
+
const textPath = path.join(outputsDir, `${artifactStem}.txt`);
|
|
819
|
+
const rawPath = path.join(outputsDir, `${artifactStem}.raw.json`);
|
|
820
|
+
writeFileSync(inputPath, work.promptPair.prompt);
|
|
821
|
+
if (result.requestAttempts?.length) writeJsonArtifact(requestPath, result.requestAttempts);
|
|
822
|
+
if (result.text) writeFileSync(textPath, result.text);
|
|
823
|
+
if (result.rawText) writeFileSync(rawPath, redactText(result.rawText));
|
|
824
|
+
const row = {
|
|
825
|
+
source: 'live_api',
|
|
826
|
+
arm,
|
|
827
|
+
provider: work.model.provider,
|
|
828
|
+
model: work.model.model,
|
|
829
|
+
prompt: work.promptPair.prompt,
|
|
830
|
+
promptSha256: work.promptPair.promptSha256,
|
|
831
|
+
sourceSessionFile: work.promptPair.file,
|
|
832
|
+
ok: result.ok,
|
|
833
|
+
skipped: result.skipped,
|
|
834
|
+
visibleOutputFailure: result.visibleOutputFailure === true,
|
|
835
|
+
reason: result.reason,
|
|
836
|
+
durationMs: result.durationMs,
|
|
837
|
+
usage: result.usage,
|
|
838
|
+
usageDetails: result.usageDetails || null,
|
|
839
|
+
attempts: result.attempts || 1,
|
|
840
|
+
blankAttempts: result.blankAttempts || [],
|
|
841
|
+
inputPath,
|
|
842
|
+
requestPath: result.requestAttempts?.length ? requestPath : null,
|
|
843
|
+
requestSha256: result.requestAttempts?.at(-1)?.requestSha256 || null,
|
|
844
|
+
textPath: result.text ? textPath : null,
|
|
845
|
+
rawPath: result.rawText ? rawPath : null,
|
|
846
|
+
rawSha256: result.rawSha256 || null,
|
|
847
|
+
score: result.text ? scoreAnswer(result.text, work.promptPair.prompt) : null,
|
|
848
|
+
};
|
|
849
|
+
writeFileSync(jsonlPath, JSON.stringify(redactRequest(row)) + '\n', { flag: 'a', mode: 0o644 });
|
|
850
|
+
process.stdout.write(JSON.stringify({
|
|
851
|
+
arm,
|
|
852
|
+
prompt: work.promptPair.promptSha256.slice(0, 8),
|
|
853
|
+
ok: row.ok,
|
|
854
|
+
skipped: row.skipped,
|
|
855
|
+
score: row.score?.score ?? null,
|
|
856
|
+
qiyas: row.score?.qiyasHits ?? null,
|
|
857
|
+
tadabbur: row.score?.tadabburHits ?? null,
|
|
858
|
+
}) + '\n');
|
|
859
|
+
return row;
|
|
860
|
+
});
|
|
861
|
+
rows.push(...liveRows);
|
|
862
|
+
if (includeClaudeTerminalArm()) {
|
|
863
|
+
for (const [index, promptPair] of promptPairs.entries()) {
|
|
864
|
+
const result = callClaudeCodeTerminal(promptPair, index + 1);
|
|
865
|
+
const arm = `claude-terminal:${argValue('claude-model', process.env.ARIA_QT_CLAUDE_MODEL || 'opus')}`;
|
|
866
|
+
const safeArm = arm.replace(/[^a-z0-9._-]/gi, '_');
|
|
867
|
+
const artifactStem = `${String(liveRows.length + index + 1).padStart(3, '0')}-${safeArm}`;
|
|
868
|
+
const inputPath = path.join(outputsDir, `${artifactStem}.input.txt`);
|
|
869
|
+
const requestPath = path.join(outputsDir, `${artifactStem}.request.json`);
|
|
870
|
+
const textPath = path.join(outputsDir, `${artifactStem}.txt`);
|
|
871
|
+
const rawPath = path.join(outputsDir, `${artifactStem}.raw.json`);
|
|
872
|
+
writeFileSync(inputPath, result.inputPrompt || promptPair.prompt);
|
|
873
|
+
writeJsonArtifact(requestPath, result.requestBody || {});
|
|
874
|
+
if (result.text) writeFileSync(textPath, result.text);
|
|
875
|
+
if (result.rawText) writeFileSync(rawPath, redactText(result.rawText));
|
|
876
|
+
const row = {
|
|
877
|
+
source: 'claude_code_terminal',
|
|
878
|
+
arm,
|
|
879
|
+
provider: 'claude-code-terminal',
|
|
880
|
+
model: argValue('claude-model', process.env.ARIA_QT_CLAUDE_MODEL || 'opus'),
|
|
881
|
+
prompt: promptPair.prompt,
|
|
882
|
+
promptSha256: promptPair.promptSha256,
|
|
883
|
+
sourceSessionFile: promptPair.file,
|
|
884
|
+
ok: result.ok,
|
|
885
|
+
skipped: result.skipped,
|
|
886
|
+
terminalLaunched: result.terminalLaunched === true,
|
|
887
|
+
reason: result.reason,
|
|
888
|
+
durationMs: result.durationMs,
|
|
889
|
+
usage: result.usage,
|
|
890
|
+
usageDetails: result.usageDetails || null,
|
|
891
|
+
inputPath,
|
|
892
|
+
requestPath,
|
|
893
|
+
requestSha256: sha256(JSON.stringify(result.requestBody || {})),
|
|
894
|
+
textPath: result.text ? textPath : null,
|
|
895
|
+
rawPath: result.rawText ? rawPath : null,
|
|
896
|
+
rawSha256: result.rawSha256 || null,
|
|
897
|
+
score: result.text ? scoreAnswer(result.text, promptPair.prompt) : null,
|
|
898
|
+
};
|
|
899
|
+
rows.push(row);
|
|
900
|
+
writeFileSync(jsonlPath, JSON.stringify(redactRequest(row)) + '\n', { flag: 'a', mode: 0o644 });
|
|
901
|
+
process.stdout.write(JSON.stringify({
|
|
902
|
+
arm,
|
|
903
|
+
prompt: promptPair.promptSha256.slice(0, 8),
|
|
904
|
+
ok: row.ok,
|
|
905
|
+
skipped: row.skipped,
|
|
906
|
+
terminalLaunched: row.terminalLaunched,
|
|
907
|
+
score: row.score?.score ?? null,
|
|
908
|
+
qiyas: row.score?.qiyasHits ?? null,
|
|
909
|
+
tadabbur: row.score?.tadabburHits ?? null,
|
|
910
|
+
}) + '\n');
|
|
911
|
+
}
|
|
912
|
+
}
|
|
913
|
+
for (const [index, promptPair] of promptPairs.entries()) {
|
|
914
|
+
if (!promptPair.observedAnswer) continue;
|
|
915
|
+
const arm = `${promptPair.source}:${promptPair.model}`;
|
|
916
|
+
const artifactStem = `${String(index + 1).padStart(3, '0')}-${arm.replace(/[^a-z0-9._-]/gi, '_')}-observed`;
|
|
917
|
+
const inputPath = path.join(outputsDir, `${artifactStem}.input.txt`);
|
|
918
|
+
const textPath = path.join(outputsDir, `${artifactStem}.txt`);
|
|
919
|
+
writeFileSync(inputPath, promptPair.prompt);
|
|
920
|
+
writeFileSync(textPath, promptPair.observedAnswer);
|
|
921
|
+
const row = {
|
|
922
|
+
source: 'observed',
|
|
923
|
+
arm,
|
|
924
|
+
provider: promptPair.source,
|
|
925
|
+
model: promptPair.model,
|
|
926
|
+
prompt: promptPair.prompt,
|
|
927
|
+
promptSha256: promptPair.promptSha256,
|
|
928
|
+
sourceSessionFile: promptPair.file,
|
|
929
|
+
ok: true,
|
|
930
|
+
skipped: false,
|
|
931
|
+
reason: null,
|
|
932
|
+
durationMs: null,
|
|
933
|
+
usage: null,
|
|
934
|
+
inputPath,
|
|
935
|
+
textPath,
|
|
936
|
+
score: scoreAnswer(promptPair.observedAnswer, promptPair.prompt),
|
|
937
|
+
};
|
|
938
|
+
rows.push(row);
|
|
939
|
+
writeFileSync(jsonlPath, JSON.stringify(redactRequest(row)) + '\n', { flag: 'a', mode: 0o644 });
|
|
940
|
+
}
|
|
941
|
+
const comparisons = comparePromptRows(rows);
|
|
942
|
+
const summary = summarize(rows, promptPairs, models.map((model) => ({ ...model, apiKeyPresent: Boolean(model.apiKeyPresent) })), comparisons);
|
|
943
|
+
const metricsPath = path.join(outputRoot, 'metrics.json');
|
|
944
|
+
const promptsPath = path.join(outputRoot, 'prompts.json');
|
|
945
|
+
const summaryPath = path.join(outputRoot, 'summary.md');
|
|
946
|
+
const evidenceManifestPath = path.join(outputRoot, 'evidence-manifest.json');
|
|
947
|
+
for (const promptPair of promptPairs) {
|
|
948
|
+
const promptInputPath = path.join(outputsDir, `${promptPair.promptSha256.slice(0, 12)}-prompt.input.txt`);
|
|
949
|
+
writeFileSync(promptInputPath, promptPair.prompt);
|
|
950
|
+
promptPair.inputPath = promptInputPath;
|
|
951
|
+
}
|
|
952
|
+
writeJsonArtifact(metricsPath, { summary, rows, comparisons });
|
|
953
|
+
writeFileSync(promptsPath, JSON.stringify(promptPairs.map((prompt) => ({
|
|
954
|
+
source: prompt.source,
|
|
955
|
+
model: prompt.model,
|
|
956
|
+
file: prompt.file,
|
|
957
|
+
prompt: prompt.prompt,
|
|
958
|
+
promptSha256: prompt.promptSha256,
|
|
959
|
+
inputPath: prompt.inputPath,
|
|
960
|
+
})), null, 2) + '\n');
|
|
961
|
+
writeFileSync(summaryPath, renderMarkdown(summary, comparisons));
|
|
962
|
+
const artifacts = { outputRoot, metricsPath, promptsPath, summaryPath, jsonlPath, evidenceManifestPath };
|
|
963
|
+
writeJsonArtifact(evidenceManifestPath, buildEvidenceManifest({ summary, promptPairs, rows, comparisons, artifacts }));
|
|
964
|
+
process.stdout.write(JSON.stringify({ ok: true, summary, artifacts }, null, 2) + '\n');
|
|
965
|
+
}
|
|
966
|
+
|
|
967
|
+
main().catch((error) => {
|
|
968
|
+
console.error(error instanceof Error ? error.stack : String(error));
|
|
969
|
+
process.exit(1);
|
|
970
|
+
});
|