npm - sneakoscope - Versions diffs - 4.1.1 → 4.2.1 - Mend

sneakoscope 4.1.1 → 4.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (84)

package/README.md +13 -10
package/crates/sks-core/Cargo.lock +1 -1
package/crates/sks-core/Cargo.toml +1 -1
package/crates/sks-core/src/main.rs +1 -1
package/dist/bin/sks.js +1 -1
package/dist/cli/command-registry.js +1 -1
package/dist/core/auto-review.js +1 -1
package/dist/core/codex-control/codex-app-server-v2-client.js +86 -2
package/dist/core/codex-control/codex-reliability-shield.js +26 -5
package/dist/core/codex-control/codex-task-runner.js +7 -1
package/dist/core/codex-control/model-call-concurrency.js +1 -1
package/dist/core/commands/mad-db-command.js +146 -51
package/dist/core/commands/mad-sks-command.js +15 -31
package/dist/core/commands/qa-loop-command.js +23 -7
package/dist/core/db-safety.js +35 -37
package/dist/core/doctor/supabase-mcp-repair.js +2 -2
package/dist/core/feature-registry.js +1 -1
package/dist/core/fsx.js +1 -1
package/dist/core/hooks-runtime.js +1 -1
package/dist/core/init.js +5 -4
package/dist/core/mad-db/mad-db-capability.js +203 -74
package/dist/core/mad-db/mad-db-coordinator.js +287 -0
package/dist/core/mad-db/mad-db-executor.js +156 -0
package/dist/core/mad-db/mad-db-ledger.js +1 -1
package/dist/core/mad-db/mad-db-lock.js +40 -0
package/dist/core/mad-db/mad-db-operation-store.js +140 -0
package/dist/core/mad-db/mad-db-policy-resolver.js +42 -22
package/dist/core/mad-db/mad-db-policy.js +195 -0
package/dist/core/mad-db/mad-db-postconditions.js +30 -0
package/dist/core/mad-db/mad-db-recovery.js +27 -0
package/dist/core/mad-db/mad-db-result-lifecycle.js +31 -102
package/dist/core/mad-db/mad-db-runtime-profile.js +121 -0
package/dist/core/mad-db/mad-db-target.js +64 -0
package/dist/core/managed-assets/managed-assets-manifest.js +1 -1
package/dist/core/pipeline-internals/runtime-core.js +40 -0
package/dist/core/providers/glm/bench/glm-benchmark-types.js +1 -1
package/dist/core/qa-loop/qa-app-server-driver.js +134 -0
package/dist/core/qa-loop/qa-contract-v2.js +231 -0
package/dist/core/qa-loop/qa-gate-v2.js +132 -0
package/dist/core/qa-loop/qa-runtime-artifacts.js +53 -0
package/dist/core/qa-loop/qa-surface-router.js +114 -0
package/dist/core/qa-loop/qa-types.js +18 -0
package/dist/core/qa-loop.js +83 -26
package/dist/core/release/gate-manifest.js +1 -0
package/dist/core/release/release-gate-dag.js +6 -5
package/dist/core/release/sla-scheduler.js +1 -1
package/dist/core/routes.js +42 -12
package/dist/core/triwiki/triwiki-affected-graph.js +3 -2
package/dist/core/version.js +1 -1
package/dist/core/zellij/zellij-slot-column-anchor.js +5 -1
package/dist/scripts/check-dist-runtime.js +3 -2
package/dist/scripts/codex-0142-manifest-check.js +2 -1
package/dist/scripts/codex-control-all-pipelines-check.js +1 -0
package/dist/scripts/codex-control-model-capacity-fallback-check.js +53 -0
package/dist/scripts/config-managed-merge-callsite-coverage-check.js +7 -1
package/dist/scripts/loop-directive-check-lib.js +78 -1
package/dist/scripts/mad-db-capability-check.js +13 -2
package/dist/scripts/mad-db-command-check.js +7 -5
package/dist/scripts/mad-db-hook-idempotency-check.js +21 -0
package/dist/scripts/mad-db-ledger-check.js +2 -1
package/dist/scripts/mad-db-lifecycle-hook-decision-check.js +5 -4
package/dist/scripts/mad-db-mad-command-check.js +29 -16
package/dist/scripts/mad-db-mcp-result-lifecycle-check.js +11 -10
package/dist/scripts/mad-db-one-cycle-bounded-check.js +15 -18
package/dist/scripts/mad-db-one-cycle-consumption-check.js +3 -3
package/dist/scripts/mad-db-operation-lifecycle-blackbox.js +9 -9
package/dist/scripts/mad-db-operation-lifecycle-ledger-check.js +6 -6
package/dist/scripts/mad-db-parallel-lifecycle-check.js +24 -0
package/dist/scripts/mad-db-policy-v2-check.js +20 -0
package/dist/scripts/mad-db-priority-resolver-check.js +5 -5
package/dist/scripts/mad-db-real-supabase-e2e.js +166 -0
package/dist/scripts/mad-db-route-identity-check.js +28 -0
package/dist/scripts/mad-db-runtime-profile-lifecycle-check.js +24 -0
package/dist/scripts/mad-db-safety-conflict-matrix-check.js +3 -3
package/dist/scripts/mad-db-skill-policy-snapshot-check.js +15 -0
package/dist/scripts/qa-loop-app-server-driver-check.js +74 -0
package/dist/scripts/qa-loop-surface-router-check.js +49 -0
package/dist/scripts/release-check-dynamic-execute.js +1 -1
package/dist/scripts/release-dag-full-coverage-check.js +6 -0
package/dist/scripts/release-triwiki-first-runner-blackbox.js +5 -1
package/dist/scripts/runtime-ts-rust-boundary-check.js +1 -1
package/dist/scripts/triwiki-affected-graph-check.js +2 -2
package/package.json +18 -5
package/schemas/mad-db/mad-db-capability.schema.json +92 -19

package/dist/core/qa-loop.js CHANGED Viewed

@@ -1,14 +1,18 @@
 import path from 'node:path';
 import { exists, nowIso, readJson, readText, writeJsonAtomic, writeTextAtomic, PACKAGE_VERSION } from './fsx.js';
-import { CODEX_APP_IMAGE_GENERATION_DOC_URL, CODEX_IMAGEGEN_REQUIRED_POLICY, CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE, CODEX_WEB_VERIFICATION_POLICY, evidenceMentionsForbiddenBrowserAutomation, evidenceMentionsForbiddenWebComputerUseEvidence } from './routes.js';
+import { CODEX_APP_IMAGE_GENERATION_DOC_URL, CODEX_CHROME_EXTENSION_EVIDENCE_SOURCE, CODEX_COMPUTER_USE_EVIDENCE_SOURCE, CODEX_IMAGEGEN_REQUIRED_POLICY, CODEX_IN_APP_BROWSER_EVIDENCE_SOURCE, CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE, CODEX_WEB_VERIFICATION_POLICY, evidenceMentionsForbiddenBrowserAutomation, evidenceMentionsForbiddenWebComputerUseEvidence } from './routes.js';
 import { appendAgentLedgerEvent, initializeAgentCentralLedger } from './agents/agent-central-ledger.js';
 import { resolveCodexAppExecutionProfile } from './codex-app/codex-app-execution-profile.js';
 import { resolveCodexNativeInvocationPlan } from './codex-native/codex-native-invocation-router.js';
 import { imageDimensions, sha256File } from './wiki-image/image-hash.js';
+import { initializeQaRuntimeArtifacts } from './qa-loop/qa-runtime-artifacts.js';
+import { evaluateQaGateV2 } from './qa-loop/qa-gate-v2.js';
+import { DEFAULT_QA_MAX_CYCLES, QA_GATE_V2_ARTIFACT, QA_SURFACE_SELECTION_ARTIFACT } from './qa-loop/qa-types.js';
 export const QA_LOOP_ROUTE = 'QALoop';
 export const QA_LOOP_VISUAL_EVIDENCE_ARTIFACT = 'qa-loop/visual-evidence.json';
 const QA_REPORT_SUFFIX = 'qa-report.md';
-const UI_CHROME_EXTENSION_FIRST_ACK = 'use_codex_chrome_extension_first_no_computer_use_for_web_ui_or_mark_unverified';
+const UI_SURFACE_ROUTER_ACK = 'use_codex_surface_router_browser_chrome_computer_no_synthetic_evidence';
+const LEGACY_UI_CHROME_EXTENSION_FIRST_ACK = 'use_codex_chrome_extension_first_no_computer_use_for_web_ui_or_mark_unverified';
 const GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK = 'yes_gpt_image_2_annotated_review';
 const IMAGE_FILE_RE = /\.(png|jpe?g|webp|gif)$/i;
 export const QA_NATIVE_AGENT_PERSONAS = Object.freeze([
@@ -166,7 +170,7 @@ export function inferQaLoopAnswers(prompt = '') {
         '검증하지 못한 UI/API 범위는 통과로 주장하지 않고 QA 리포트에 남긴다.'
     ];
     if (isUiScope(scope))
-        acceptance.push('UI E2E 통과 증거는 실제 Codex Chrome Extension screenshot artifact path와 sha256을 기록해야 한다.');
+        acceptance.push('UI E2E 통과 증거는 surface router가 고른 @Browser/@Chrome/@Computer 실제 action·observation ledger와 필요한 screenshot/hash를 기록해야 한다.');
     if (wantsGptImage2Review)
         acceptance.push('gpt-image-2 annotated review image가 필요한 경우 실제 Codex App $imagegen/gpt-image-2 출력 파일 path, sha256, model, provider를 기록해야 한다.');
     return {
@@ -181,17 +185,17 @@ export function inferQaLoopAnswers(prompt = '') {
         EXTERNAL_SIDE_EFFECT_POLICY: 'block_all_external_side_effects',
         ...login,
         CREDENTIAL_STORAGE_ACK: 'never_store_credentials_in_artifacts_or_wiki',
-        UI_CHROME_EXTENSION_ACK: UI_CHROME_EXTENSION_FIRST_ACK,
+        UI_CHROME_EXTENSION_ACK: UI_SURFACE_ROUTER_ACK,
         QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED: wantsGptImage2Review ? GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK : 'not_required',
         TEAM_MODE_ALLOWED: 'no_parent_only',
-        MAX_QA_CYCLES: '1',
+        MAX_QA_CYCLES: String(DEFAULT_QA_MAX_CYCLES),
         ACCEPTANCE_CRITERIA: acceptance,
         NON_GOALS: [
             '결제, 실제 이메일/SMS 발송, 관리자 권한 변경, 데이터 삭제, 프로덕션 데이터 변경은 테스트하지 않는다.'
         ],
         RISK_BOUNDARY: [
             '실제 사용자 데이터, 인증 권한, 결제, 메시지 발송, 웹훅, 외부 서비스 상태를 생성/수정/삭제하지 않는다.',
-            'Codex Chrome Extension readiness/evidence가 없으면 web/browser UI 검증 완료로 주장하지 않는다.',
+            '선택된 Codex App visual surface의 실제 action·observation evidence가 없으면 UI 검증 완료로 주장하지 않는다.',
             '로그인이 필요하지만 임시 테스트 자격증명이 없으면 인증 구간은 차단/미검증으로 기록한다.'
         ],
         MID_RUN_UNKNOWN_POLICY: ['preserve_existing_behavior', 'defer_optional_scope', 'block_only_if_no_safe_path']
@@ -245,7 +249,7 @@ export function qaLoopQuestionSlots() {
         { id: 'TEMP_TEST_CREDENTIALS_READY', question: 'If login is required, are test-only credentials ready to provide ephemerally during the run?', required: true, type: 'enum', options: ['not_required', 'yes_temp_only', 'no_block_authenticated_tests'] },
         { id: 'TEST_CREDENTIALS_RUNTIME_SOURCE', question: 'If login is required, how will test-only credentials be provided without saving the values?', required: true, type: 'enum', options: ['not_required', 'ephemeral_chat_only', 'environment_variables', 'secret_manager'] },
         { id: 'CREDENTIAL_STORAGE_ACK', question: 'Acknowledge credential handling policy.', required: true, type: 'enum', options: ['never_store_credentials_in_artifacts_or_wiki'] },
-        { id: 'UI_CHROME_EXTENSION_ACK', question: 'Acknowledge UI E2E evidence policy: Codex Chrome Extension first for web/browser/webapp verification; no Computer Use or unofficial browser automation substitute.', required: true, type: 'enum', options: [UI_CHROME_EXTENSION_FIRST_ACK] },
+        { id: 'UI_CHROME_EXTENSION_ACK', question: 'Acknowledge UI E2E evidence policy: QA-LOOP routes local/public web to @Browser, signed-in web to @Chrome, native/cross-app GUI to @Computer, and never treats synthetic artifacts as real proof.', required: true, type: 'enum', options: [UI_SURFACE_ROUTER_ACK, LEGACY_UI_CHROME_EXTENSION_FIRST_ACK] },
         { id: 'TEAM_MODE_ALLOWED', question: 'May QA-LOOP use Team/subagents where useful?', required: true, type: 'enum', options: ['yes_parallel_where_safe', 'no_parent_only'] },
         { id: 'MAX_QA_CYCLES', question: 'How many no-question QA cycles are allowed before pausing?', required: true, type: 'string' },
         { id: 'ACCEPTANCE_CRITERIA', question: 'List the QA completion criteria.', required: true, type: 'array_or_string' },
@@ -269,8 +273,8 @@ export function validateQaLoopAnswers(schema, answers = {}) {
         errors.push({ slot: 'QA_MUTATION_POLICY', error: 'production_deployed_qa_is_read_only_smoke_only' });
     if (answers.DESTRUCTIVE_DEPLOYED_TESTS_ALLOWED !== 'never')
         errors.push({ slot: 'DESTRUCTIVE_DEPLOYED_TESTS_ALLOWED', error: 'destructive_deployed_tests_never_allowed' });
-    if (isUiScope(answers.QA_SCOPE) && answers.UI_CHROME_EXTENSION_ACK !== UI_CHROME_EXTENSION_FIRST_ACK)
-        errors.push({ slot: 'UI_CHROME_EXTENSION_ACK', error: 'ui_e2e_requires_codex_chrome_extension_first_ack' });
+    if (isUiScope(answers.QA_SCOPE) && ![UI_SURFACE_ROUTER_ACK, LEGACY_UI_CHROME_EXTENSION_FIRST_ACK].includes(answers.UI_CHROME_EXTENSION_ACK))
+        errors.push({ slot: 'UI_CHROME_EXTENSION_ACK', error: 'ui_e2e_requires_codex_surface_router_ack' });
     if (answers.LOGIN_REQUIRED === 'yes' && !['yes_temp_only', 'no_block_authenticated_tests'].includes(answers.TEMP_TEST_CREDENTIALS_READY))
         errors.push({ slot: 'TEMP_TEST_CREDENTIALS_READY', error: 'authenticated_tests_require_ephemeral_test_credentials_or_must_be_blocked' });
     if (answers.LOGIN_REQUIRED === 'yes' && answers.TEMP_TEST_CREDENTIALS_READY === 'yes_temp_only' && answers.TEST_CREDENTIALS_RUNTIME_SOURCE === 'not_required')
@@ -322,6 +326,7 @@ export function defaultQaGate(contract = {}, opts = {}) {
     const gptImage2ReviewRequired = qaGptImage2AnnotatedReviewRequired(contract, contract.prompt);
     const reportFile = opts.reportFile || qaReportFilename();
     const corrective = a.QA_CORRECTIVE_POLICY !== 'report_only_no_code_changes';
+    const selectedSurface = opts.qaRuntime?.surface?.selected_surface || null;
     return {
         passed: false,
         clarification_contract_sealed: Boolean(contract.sealed_hash),
@@ -333,6 +338,15 @@ export function defaultQaGate(contract = {}, opts = {}) {
         deployed_destructive_tests_blocked: a.TARGET_ENVIRONMENT === 'local_dev_server' || a.DESTRUCTIVE_DEPLOYED_TESTS_ALLOWED === 'never',
         credentials_not_persisted: false,
         ui_e2e_required: uiRequired,
+        qa_contract_v2_required: opts.qaRuntime ? true : false,
+        qa_surface_selection_artifact: opts.qaRuntime ? QA_SURFACE_SELECTION_ARTIFACT : null,
+        qa_gate_v2_artifact: opts.qaRuntime ? QA_GATE_V2_ARTIFACT : null,
+        qa_surface_selected: selectedSurface,
+        ui_selected_surface: selectedSurface,
+        ui_live_surface_preflight_passed: !uiRequired,
+        ui_real_action_count: 0,
+        ui_observation_count: 0,
+        same_flow_replay_complete: false,
         chrome_extension_preflight_passed: !uiRequired,
         ui_chrome_extension_evidence: !uiRequired,
         ui_computer_use_evidence: false,
@@ -385,6 +399,13 @@ export async function writeQaLoopArtifacts(dir, mission, contract) {
     const root = missionRootFromDir(dir);
     const executionProfile = root ? await resolveCodexAppExecutionProfile({ root }).catch(() => null) : null;
     const codexNativeInvocation = root ? await resolveQaCodexNativeInvocation(root, mission.id).catch(() => null) : null;
+    const qaRuntime = await initializeQaRuntimeArtifacts(dir, {
+        ...contract,
+        prompt: mission.prompt || contract.prompt,
+        mission_id: mission.id || contract.mission_id
+    }, {
+        missionId: mission.id || contract.mission_id || null
+    }).catch(() => null);
     if (executionProfile)
         await writeJsonAtomic(path.join(dir, 'qa-loop', 'execution-profile.json'), executionProfile).catch(() => undefined);
     if (codexNativeInvocation)
@@ -397,11 +418,20 @@ export async function writeQaLoopArtifacts(dir, mission, contract) {
         codex_app_execution_profile: executionProfile ? compactExecutionProfile(executionProfile) : null,
         codex_native_invocation: codexNativeInvocation,
         target: { scope: a.QA_SCOPE, environment: a.TARGET_ENVIRONMENT, base_url: a.TARGET_BASE_URL, api_base_url: a.API_BASE_URL },
-        safety: { mutation_policy: a.QA_MUTATION_POLICY, deployed_destructive_tests_allowed: 'never', credentials: 'temp_only_never_saved', ui_evidence: 'codex_chrome_extension_first_required_for_web_ui_e2e', visual_review: 'gpt_image_2_annotated_review_required_when_contract_requests_it' },
+        qa_runtime_v2: qaRuntime ? {
+            contract_artifact: 'qa-loop/qa-contract-v2.json',
+            surface_selection_artifact: QA_SURFACE_SELECTION_ARTIFACT,
+            selected_surface: qaRuntime.surface.selected_surface,
+            journey_graph_artifact: 'qa-loop/qa-journey-graph.json',
+            gate_artifact: QA_GATE_V2_ARTIFACT
+        } : null,
+        safety: { mutation_policy: a.QA_MUTATION_POLICY, deployed_destructive_tests_allowed: 'never', credentials: 'temp_only_never_saved', ui_evidence: 'codex_surface_router_live_action_required_for_ui_e2e', visual_review: 'gpt_image_2_annotated_review_required_when_contract_requests_it' },
         checklist
     });
     await writeJsonAtomic(path.join(dir, QA_LOOP_VISUAL_EVIDENCE_ARTIFACT), buildQaLoopVisualEvidenceArtifact(mission, contract));
-    await writeJsonAtomic(path.join(dir, 'qa-gate.json'), defaultQaGate(contract, { reportFile, executionProfile, codexNativeInvocation }));
+    await writeJsonAtomic(path.join(dir, 'qa-gate.json'), defaultQaGate(contract, { reportFile, executionProfile, codexNativeInvocation, qaRuntime }));
+    if (qaRuntime)
+        await evaluateQaGateV2(dir).catch(() => undefined);
     await writeTextAtomic(path.join(dir, reportFile), qaReportTemplate(mission, contract, checklist));
     return { checklist_count: checklist.length, report_file: reportFile };
 }
@@ -441,8 +471,18 @@ export async function ensureQaLoopVisualEvidenceContract(dir, mission = {}, cont
 }
 export async function evaluateQaGate(dir) {
     const gate = await readJson(path.join(dir, 'qa-gate.json'), {});
+    const surfaceSelection = await readJson(path.join(dir, QA_SURFACE_SELECTION_ARTIFACT), null);
+    const selectedSurface = gate.ui_selected_surface || gate.qa_surface_selected || surfaceSelection?.selected_surface || null;
+    const expectedEvidenceSource = evidenceSourceForSurface(selectedSurface);
+    const gateV2 = gate.qa_contract_v2_required === true ? await evaluateQaGateV2(dir).catch((err) => ({
+        passed: false,
+        blockers: [`qa_gate_v2_evaluation_failed:${err?.message || String(err)}`],
+        unverified: []
+    })) : null;
     const reportFile = qaReportFileFromGate(gate);
     const reasons = [];
+    if (gateV2 && gateV2.passed !== true)
+        reasons.push(...(gateV2.blockers || []));
     for (const key of ['clarification_contract_sealed', 'qa_report_written', 'qa_ledger_complete', 'checklist_completed', 'safety_reviewed', 'deployed_destructive_tests_blocked', 'credentials_not_persisted', 'honest_mode_complete']) {
         if (gate[key] !== true)
             reasons.push(`${key}_missing`);
@@ -460,17 +500,22 @@ export async function evaluateQaGate(dir) {
     if (gate.unsafe_external_side_effects === true)
         reasons.push('unsafe_external_side_effects');
     if (gate.ui_e2e_required === true) {
-        if (gate.chrome_extension_preflight_passed !== true)
-            reasons.push('chrome_extension_preflight_missing');
-        if (gate.ui_chrome_extension_evidence !== true)
-            reasons.push('ui_chrome_extension_evidence_missing');
-        if (gate.ui_computer_use_evidence === true)
+        if (!selectedSurface || selectedSurface === 'codex_chrome_extension') {
+            if (gate.chrome_extension_preflight_passed !== true)
+                reasons.push('chrome_extension_preflight_missing');
+            if (gate.ui_chrome_extension_evidence !== true)
+                reasons.push('ui_chrome_extension_evidence_missing');
+        }
+        else if (gate.ui_live_surface_preflight_passed !== true) {
+            reasons.push('ui_live_surface_preflight_missing');
+        }
+        if (gate.ui_computer_use_evidence === true && selectedSurface !== 'codex_computer_use')
             reasons.push('ui_computer_use_evidence_forbidden_for_web');
-        if (gate.ui_evidence_source !== CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE)
-            reasons.push('ui_evidence_source_not_codex_chrome_extension');
+        if (expectedEvidenceSource && gate.ui_evidence_source !== expectedEvidenceSource)
+            reasons.push(`ui_evidence_source_not_${expectedEvidenceSource}`);
         if (evidenceMentionsForbiddenBrowserAutomation({ evidence: gate.evidence, notes: gate.notes, ui_evidence_source: gate.ui_evidence_source }))
             reasons.push('forbidden_browser_automation_evidence');
-        if (evidenceMentionsForbiddenWebComputerUseEvidence({ evidence: gate.evidence, ui_evidence_source: gate.ui_evidence_source }))
+        if (selectedSurface !== 'codex_computer_use' && evidenceMentionsForbiddenWebComputerUseEvidence({ evidence: gate.evidence, ui_evidence_source: gate.ui_evidence_source }))
             reasons.push('computer_use_web_evidence_forbidden');
         reasons.push(...await missingQaLoopVisualEvidence(dir, gate));
     }
@@ -502,7 +547,7 @@ export async function evaluateQaGate(dir) {
         reasons.push('qa_ledger_missing');
     const uniqueReasons = [...new Set(reasons)];
     const passed = gate.passed === true && uniqueReasons.length === 0;
-    const result = { checked_at: nowIso(), passed, reasons: uniqueReasons, gate };
+    const result = { checked_at: nowIso(), passed, reasons: uniqueReasons, gate, gate_v2: gateV2 };
     await writeJsonAtomic(path.join(dir, 'qa-gate.evaluated.json'), result);
     return result;
 }
@@ -592,9 +637,9 @@ CONTRACT:
 ${JSON.stringify(contract, null, 2)}
 ${imageContractText}${appHandoffText}${executionProfileText}
 VISUAL EVIDENCE CONTRACT:
-- For web UI QA, do not set chrome_extension_preflight_passed/ui_chrome_extension_evidence to true unless the Codex Chrome Extension path is ready and ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT} records a real saved Chrome Extension screenshot artifact with path, sha256, and dimensions.
-- If decision-contract.json answers set QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED=${GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK}, use Codex App $imagegen/gpt-image-2 (${CODEX_APP_IMAGE_GENERATION_DOC_URL}) to produce a real generated annotated review image from the Chrome Extension screenshot. Record its path, sha256, model=gpt-image-2, provider=Codex App $imagegen, and source_screenshot_artifact in ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT} and qa-gate.json.
-- Do not substitute prose-only critique, Playwright/Selenium/Puppeteer/Browser Use screenshots, Computer Use browser screenshots, placeholder images, fake fixtures, or direct API fallback as full web UI visual evidence.
+- For UI QA, do not mark live UI evidence true unless qa-loop/qa-surface-selection.json selected the correct @Browser/@Chrome/@Computer surface and action/observation ledgers record real user-like actions.
+- If decision-contract.json answers set QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED=${GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK}, use Codex App $imagegen/gpt-image-2 (${CODEX_APP_IMAGE_GENERATION_DOC_URL}) to produce a real generated annotated review image from the selected-surface source screenshot. Record its path, sha256, model=gpt-image-2, provider=Codex App $imagegen, and source_screenshot_artifact in ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT} and qa-gate.json.
+- Do not substitute prose-only critique, Playwright/Selenium/Puppeteer screenshots, static screenshots, plugin cache, placeholder images, fake fixtures, or direct API fallback as full UI visual evidence.
 Previous tail:
 ${String(previous || '').slice(-2500)}
 `;
@@ -623,7 +668,7 @@ function qaChecklist(a) {
         ['preflight.roles', 'Map roles, permissions, protected areas.']
     ];
     if (qaUiRequired(a))
-        cases.push(['ui.chrome_extension_first', CODEX_WEB_VERIFICATION_POLICY], ['ui.navigation', 'Check primary navigation, deep links, back/forward, refresh, and protected routes.'], ['ui.auth', 'Check login, logout, session expiry, unauthorized access, and role-specific visibility.'], ['ui.forms', 'Check required fields, validation, disabled states, success, and failure.'], ['ui.states', 'Check loading, empty, error, retry, offline/timeout, and slow network states.'], ['ui.crud', 'Check allowed create/change flows and block forbidden destructive flows by environment.'], ['ui.responsive', 'Check desktop, tablet, mobile, overflow, long text, and keyboard focus order.'], ['ui.a11y', 'Check labels, focus traps, modals, contrast-sensitive controls, and screen-reader names.'], ['ui.visual', 'Capture evidence for meaningful UI regressions without storing secrets.']);
+        cases.push(['ui.surface_router', CODEX_WEB_VERIFICATION_POLICY], ['ui.navigation', 'Check primary navigation, deep links, back/forward, refresh, and protected routes.'], ['ui.auth', 'Check login, logout, session expiry, unauthorized access, and role-specific visibility.'], ['ui.forms', 'Check required fields, validation, disabled states, success, and failure.'], ['ui.states', 'Check loading, empty, error, retry, offline/timeout, and slow network states.'], ['ui.crud', 'Check allowed create/change flows and block forbidden destructive flows by environment.'], ['ui.responsive', 'Check desktop, tablet, mobile, overflow, long text, and keyboard focus order.'], ['ui.a11y', 'Check labels, focus traps, modals, contrast-sensitive controls, and screen-reader names.'], ['ui.visual', 'Capture evidence for meaningful UI regressions without storing secrets.']);
     if (qaApiRequired(a))
         cases.push(['api.health', 'Check health/version/readiness endpoints when available.'], ['api.auth', 'Check anonymous, authenticated, expired, and wrong-role access.'], ['api.contract', 'Check status codes, response shape, headers, content type, and error format.'], ['api.validation', 'Check missing, malformed, boundary, duplicate, and over-limit payloads.'], ['api.listing', 'Check pagination, sorting, filters, search, and empty results.'], ['api.mutation', 'Check allowed seeded create/change and forbid deployed destructive flows.'], ['api.idempotency', 'Check retry/idempotency behavior for safe operations.'], ['api.concurrency', 'Check stale change, conflict, and double-submit behavior.'], ['api.failure', 'Check timeout, upstream error, rate-limit, and rollback-visible failure paths.'], ['api.security', 'Check CORS, auth headers, PII redaction, and permission boundaries.']);
     cases.push(['report.evidence', 'Record pass/fail/blocked/skipped with evidence.'], ['report.corrective_loop', 'Record fixes, rechecks, unresolved findings, deferred blockers.'], ['report.honest', 'Run Honest Mode.']);
@@ -675,6 +720,8 @@ async function missingQaLoopVisualEvidence(dir, gate = {}) {
     const visual = await readJson(path.join(dir, QA_LOOP_VISUAL_EVIDENCE_ARTIFACT), null);
     const reasons = [];
     const uiRequired = gate.ui_e2e_required === true;
+    const selectedSurface = gate.ui_selected_surface || gate.qa_surface_selected || (gate.ui_chrome_extension_evidence === true ? 'codex_chrome_extension' : null);
+    const expectedSource = evidenceSourceForSurface(selectedSurface) || CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE;
     if (uiRequired) {
         const screenshot = visual?.chrome_extension_screenshot || {};
         if (gate.ui_chrome_extension_screenshot_captured !== true && !positiveVisualStatus(screenshot.status, ['captured', 'attached', 'verified']))
@@ -690,8 +737,8 @@ async function missingQaLoopVisualEvidence(dir, gate = {}) {
         else
             reasons.push(...await imageEvidenceFileReasons(dir, screenshotPath, screenshotSha, 'ui_chrome_extension_screenshot', screenshotDims));
         const screenshotSource = firstNonEmpty(gate.ui_chrome_extension_screenshot_source, screenshot.evidence_source, gate.ui_evidence_source);
-        if (screenshotSource !== CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE)
-            reasons.push('ui_chrome_extension_screenshot_source_not_codex_chrome_extension');
+        if (screenshotSource !== expectedSource)
+            reasons.push(`ui_chrome_extension_screenshot_source_not_${expectedSource}`);
     }
     const review = visual?.gpt_image_2_annotated_review || {};
     const gptImage2ReviewRequired = gate.gpt_image_2_annotated_review_required === true || review.required === true;
@@ -786,4 +833,14 @@ function positiveCount(value) {
     const n = Number(value || 0);
     return Number.isFinite(n) && n > 0;
 }
+function evidenceSourceForSurface(surface) {
+    const value = String(surface || '').trim();
+    if (value === 'codex_in_app_browser')
+        return CODEX_IN_APP_BROWSER_EVIDENCE_SOURCE;
+    if (value === 'codex_chrome_extension')
+        return CODEX_CHROME_EXTENSION_EVIDENCE_SOURCE;
+    if (value === 'codex_computer_use')
+        return CODEX_COMPUTER_USE_EVIDENCE_SOURCE;
+    return null;
+}
 //# sourceMappingURL=qa-loop.js.map

package/dist/core/release/gate-manifest.js CHANGED Viewed

@@ -6,6 +6,7 @@ export const FORBIDDEN_RECURSIVE_GATES = new Set([
     'release:check:dynamic:execute',
     'release:real-check',
     'release:publish',
+    'publish:ignore-scripts',
     'publish:npm',
     'publish:dry',
     'prepublishOnly'

package/dist/core/release/release-gate-dag.js CHANGED Viewed

@@ -28,15 +28,16 @@ export async function runReleaseGateDag(input) {
     const preset = input.preset || 'release';
     const manifest = loadReleaseGateManifest(root);
     const presetGates = selectReleaseGatePreset(manifest, preset);
-    const triwikiGraph = input.triwiki !== false && (preset === 'affected' || preset === 'fast' || preset === 'confidence') && input.full !== true
-        ? computeTriWikiAffectedGraph({ root, tier: preset === 'fast' ? 'affected' : 'confidence', changedSince: input.changedSince || 'auto', ...(input.changedFiles ? { changedFiles: input.changedFiles } : {}) })
-        : null;
     const affected = (preset === 'affected' || preset === 'fast' || preset === 'confidence') && input.full !== true
         ? selectAffectedReleaseGates(root, manifest, presetGates, { changedSince: input.changedSince || 'auto', ...(input.changedFiles ? { changedFiles: input.changedFiles } : {}), preset })
         : selectAffectedReleaseGates(root, manifest, presetGates, { full: true, preset });
+    const rootReleaseSurfaceChanged = affected.selection.changed_files.some((file) => file === 'package.json' || file === 'package-lock.json' || file === 'release-gates.v2.json');
+    const triwikiGraph = input.triwiki !== false && !rootReleaseSurfaceChanged && (preset === 'affected' || preset === 'fast' || preset === 'confidence') && input.full !== true
+        ? computeTriWikiAffectedGraph({ root, tier: preset === 'fast' ? 'affected' : 'confidence', changedSince: input.changedSince || 'auto', ...(input.changedFiles ? { changedFiles: input.changedFiles } : {}) })
+        : null;
     const triwikiSelectionUsed = Boolean(triwikiGraph);
     const triwikiConservative = Boolean(triwikiGraph?.conservative_reason);
-    const triwikiSelectedIds = new Set(triwikiGraph && !triwikiConservative ? triwikiGraph.gates : presetGates.map((gate) => gate.id));
+    const triwikiSelectedIds = new Set(triwikiGraph && !triwikiConservative ? triwikiGraph.gates : affected.gates.map((gate) => gate.id));
     const selected = triwikiGraph
         ? presetGates.filter((gate) => triwikiSelectedIds.has(gate.id))
         : affected.gates;
@@ -45,7 +46,7 @@ export async function runReleaseGateDag(input) {
         affected.selection.mode = 'affected';
         affected.selection.selected_gate_ids = selected.map((gate) => gate.id);
         affected.selection.skipped_gate_ids = triwikiSkippedGates;
-        affected.selection.reasons = Object.fromEntries(selected.map((gate) => [gate.id, triwikiConservative ? `triwiki_conservative:${triwikiGraph.conservative_reason}` : 'triwiki-affected']));
+        affected.selection.reasons = Object.fromEntries(selected.map((gate) => [gate.id, triwikiConservative ? `triwiki_conservative_fallback:${triwikiGraph.conservative_reason}` : 'triwiki-affected']));
     }
     const selectedIds = new Set(selected.map((gate) => gate.id));
     const affectedExternalSatisfiedDeps = affected.selection.mode === 'affected'

package/dist/core/release/sla-scheduler.js CHANGED Viewed

@@ -2,7 +2,7 @@ import { computeTriWikiAffectedGraph } from '../triwiki/triwiki-affected-graph.j
 import { buildTriWikiSlaCertificate } from '../triwiki/triwiki-sla-certificate.js';
 import { planExtremeParallelSchedule } from './extreme-parallel-scheduler.js';
 export const SLA_SCHEDULER_SCHEMA = 'sks.sla-scheduler.v1';
-export function planFiveMinuteSla(root, graph = computeTriWikiAffectedGraph({ root, tier: 'affected' }), slaMs = 300_000) {
+export function planFiveMinuteSla(root, graph = computeTriWikiAffectedGraph({ root, tier: 'affected', includeProofLookup: false }), slaMs = 300_000) {
     const schedule = planExtremeParallelSchedule(root, graph);
     const certificate = buildTriWikiSlaCertificate({
         graph,

package/dist/core/routes.js CHANGED Viewed

@@ -32,15 +32,30 @@ export const FROM_CHAT_IMG_QA_LOOP_ARTIFACT = 'from-chat-img-qa-loop.json';
 export const FROM_CHAT_IMG_TEMP_TRIWIKI_SESSIONS = 5;
 export const USAGE_TOPICS = 'install|setup|bootstrap|root|deps|zellij|tmux|auto-review|team|qa-loop|ppt|image-ux-review|computer-use|goal|fast-mode|research|db|git|codex|codex-app|codex-native|hooks|features|all-features|dfix|commit|commit-and-push|design|imagegen|dollar|context7|xai|pipeline|reasoning|guard|conflicts|versioning|eval|harness|hproof|gx|wiki|wrongness|code-structure|proof-field|skill-dream|rust';
 export const CODEX_COMPUTER_USE_EVIDENCE_SOURCE = 'codex_computer_use';
-export const CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE = 'codex_chrome_extension';
+export const CODEX_IN_APP_BROWSER_EVIDENCE_SOURCE = 'codex_in_app_browser';
+export const CODEX_CHROME_EXTENSION_EVIDENCE_SOURCE = 'codex_chrome_extension';
+export const CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE = CODEX_IN_APP_BROWSER_EVIDENCE_SOURCE;
 export const CODEX_IMAGEGEN_EVIDENCE_SOURCE = 'codex_app_imagegen_gpt_image_2';
+export const CODEX_IN_APP_BROWSER_DOC_URL = 'https://developers.openai.com/codex/app/browser';
 export const CODEX_CHROME_EXTENSION_DOC_URL = 'https://developers.openai.com/codex/app/chrome-extension';
+export const CODEX_COMPUTER_USE_DOC_URL = 'https://developers.openai.com/codex/app/computer-use';
+export const CODEX_RECORD_REPLAY_DOC_URL = 'https://developers.openai.com/codex/record-and-replay';
+export const CODEX_APP_SERVER_DOC_URL = 'https://developers.openai.com/codex/app-server';
 export const CODEX_APP_IMAGE_GENERATION_DOC_URL = 'https://developers.openai.com/codex/app/features#image-generation';
 export const OPENAI_IMAGE_GENERATION_DOC_URL = 'https://developers.openai.com/api/docs/guides/image-generation';
 export const OPENAI_CHATGPT_IMAGES_2_DOC_URL = 'https://openai.com/index/introducing-chatgpt-images-2-0/';
 export const OPENAI_GPT_IMAGE_2_MODEL_DOC_URL = 'https://developers.openai.com/api/docs/models/gpt-image-2';
-export const CODEX_WEB_VERIFICATION_POLICY = `Web, browser, localhost, website, webapp, and web-based app verification must use the official Codex Chrome Extension path first (${CODEX_CHROME_EXTENSION_DOC_URL}). Before web UX review, QA-LOOP, browser smoke, authenticated browser checks, or web visual verification proceeds, SKS must verify that the Chrome Extension path is installed/enabled through Codex App plugin readiness; if it is missing, rapidly halt the pipeline, tell the user to install/setup the extension, and resume only after the user explicitly says installation is complete. Do not use Codex Computer Use as browser/web-app verification evidence. Do not substitute Playwright, Selenium, Puppeteer, Browser Use, Chrome MCP, generic browser automation, screenshots fabricated from code, or prose-only checks for the Chrome Extension gate.`;
-export const CODEX_COMPUTER_USE_ONLY_POLICY = `Codex Computer Use is reserved for native macOS, desktop-app, OS-settings, and non-web visual tasks such as setting up a Mac app or inspecting a non-browser surface. It must not be used for browser, localhost, website, webapp, or web-based app verification; those routes follow the Chrome Extension policy instead. If live native Computer Use tools are unavailable for a non-web target, mark the native visual evidence unverified instead of fabricating screenshots or substituting browser automation. Codex App readiness/config verification is not target evidence: use Codex-provided control surfaces such as \`codex features list\`, \`codex mcp list\`, \`sks codex-app check\`, remote-control status, and plugin/tool exposure. In Codex App prompts, invoke @Computer or @AppName only for live native Mac/non-web target apps or screens.`;
+export const QA_INTERACTION_SURFACES = Object.freeze([
+    'codex_in_app_browser',
+    'codex_chrome_extension',
+    'codex_computer_use',
+    'codex_app_plugin',
+    'structured_mcp',
+    'shell_or_api_diagnostic'
+]);
+export const CODEX_QA_SURFACE_ROUTING_POLICY = `Codex QA surface routing follows the official Codex App split: use @Browser / in-app Browser (${CODEX_IN_APP_BROWSER_DOC_URL}) first for localhost, local development servers, file-backed previews, and public pages that do not require sign-in; use @Chrome / Codex Chrome Extension (${CODEX_CHROME_EXTENSION_DOC_URL}) for signed-in websites, cookies, browser profiles, extensions, existing tabs, or internal tools; use @Computer or @AppName (${CODEX_COMPUTER_USE_DOC_URL}) for native macOS/Windows apps, OS settings, cross-app workflows, and GUI-only bugs. Prefer structured Plugins/MCPs for repeatable data operations, then verify rendered user-visible results with Browser, Chrome, or Computer Use. Playwright, Selenium, Puppeteer, Chrome MCP, static screenshots, plugin cache, and final-agent prose are not Codex App live action proof. App Server evidence (${CODEX_APP_SERVER_DOC_URL}) must correlate thread, turn, item/tool events, approvals, diffs, actions, observations, findings, fixes, and same-flow replay before a real QA pass is claimed.`;
+export const CODEX_WEB_VERIFICATION_POLICY = CODEX_QA_SURFACE_ROUTING_POLICY;
+export const CODEX_COMPUTER_USE_ONLY_POLICY = `Codex Computer Use is a live GUI surface for supported macOS and Windows environments, invoked with @Computer or @AppName for native apps, OS settings, browser contexts that truly require GUI-level operation, and cross-app workflows. Do not replace @Browser localhost/public-page checks or @Chrome signed-in checks with Computer Use unless the surface router records a specific GUI-only/cross-app reason. If live Computer Use tools, permissions, or app access are unavailable, mark the affected native/GUI evidence blocked or unverified instead of fabricating screenshots or actions. Codex App readiness/config checks are capability evidence only, not target interaction proof.`;
 export const IMAGEGEN_SOCIAL_SOURCE_POLICY = 'Use public X/social/community reports only as prompt-quality and workflow-sentiment hints after official OpenAI/Codex docs. Social posts are not capability specs, evidence of tool availability, or proof that a generated asset was created.';
 export const CODEX_IMAGEGEN_REQUIRED_POLICY = 'Pipeline image generation, raster asset creation/editing, and generated image-review evidence must use real Codex App imagegen/$imagegen with gpt-image-2 when that evidence is required for full verification. For newest-model image requests, prompt explicitly for "ChatGPT Images 2.0 / GPT Image 2.0 with gpt-image-2" instead of relying on generic image-generation wording. Do not substitute placeholder SVG/HTML/CSS, prose-only critique, stock-like stand-ins, manually fabricated files, or missing-output ledgers for requested/generated raster assets or required generated review images. If imagegen/gpt-image-2 is unavailable or generated annotated images cannot be created/linked, record the blocker and cap any closeout at verified_partial/reference-only instead of claiming generated-image evidence or full route verification; that partial closeout requires source screenshots plus hashes, docs evidence, source Image Voxel anchors, and Honest Mode evidence. In Codex App prompts, invoke $imagegen when live image generation is needed; SKS hooks and skills can require the policy but cannot attach missing host image-generation tools to an already-started turn. Official OpenAI/Codex docs are authoritative for capabilities, surfaces, limits, and evidence rules; X/social/community reports may inform prompt style only.';
 export const DEFAULT_CODEX_APP_PLUGINS = Object.freeze([
@@ -56,7 +71,7 @@ export const RESERVED_CODEX_PLUGIN_SKILL_NAMES = Object.freeze([
     'browser-use',
     ...DEFAULT_CODEX_APP_PLUGINS.map(([name]) => name)
 ].sort());
-export const FORBIDDEN_BROWSER_AUTOMATION_RE = /\b(playwright|chrome\s+mcp|browser\s+use|selenium|puppeteer)\b/i;
+export const FORBIDDEN_BROWSER_AUTOMATION_RE = /\b(playwright|chrome\s+mcp|selenium|puppeteer)\b/i;
 export function evidenceMentionsForbiddenBrowserAutomation(value, seen = new Set()) {
     if (value == null)
         return false;
@@ -231,7 +246,7 @@ export function stackCurrentDocsPolicy(commandPrefix = 'sks') {
         validate_command: `${prefix} wiki validate .sneakoscope/wiki/context-pack.json`,
         priority: 'must_precede_coding_style_defaults',
         examples: [
-            'Supabase hosted projects should prefer sb_publishable_ and sb_secret_ keys over legacy anon/service_role keys when current docs apply.',
+            'Supabase hosted projects should prefer sb_publishable_ and sb_secret_ keys over legacy anon and service role keys when current docs apply.',
             'Next.js 16 deprecates the middleware file convention in favor of proxy.ts/proxy.js.',
             'Vercel Function duration limits, including the 300s default with Fluid Compute, are deployment constraints that must shape long-running server work.'
         ]
@@ -239,7 +254,7 @@ export function stackCurrentDocsPolicy(commandPrefix = 'sks') {
 }
 export function stackCurrentDocsPolicyText(commandPrefix = 'sks') {
     const policy = stackCurrentDocsPolicy(commandPrefix);
-    return `Stack current-docs policy: whenever project tech stack is added or a framework/package/runtime/platform version changes, fetch current docs with Context7 (resolve-library-id then query-docs) or official vendor web docs before coding, record the syntax/limits/security guidance as high-priority TriWiki claims in ${policy.memory_path}, run "${policy.refresh_command}", then "${policy.validate_command}". Treat these claims as higher priority than model-memory defaults. Examples include Supabase publishable/secret keys replacing legacy anon/service_role guidance for hosted projects, Next.js 16 proxy.ts/proxy.js replacing the deprecated middleware file convention, avoiding stale webpack defaults when newer framework guidance says otherwise, and Vercel Function duration limits such as the 300s default under Fluid Compute.`;
+    return `Stack current-docs policy: whenever project tech stack is added or a framework/package/runtime/platform version changes, fetch current docs with Context7 (resolve-library-id then query-docs) or official vendor web docs before coding, record the syntax/limits/security guidance as high-priority TriWiki claims in ${policy.memory_path}, run "${policy.refresh_command}", then "${policy.validate_command}". Treat these claims as higher priority than model-memory defaults. Examples include Supabase publishable/secret keys replacing legacy anon and service role guidance for hosted projects, Next.js 16 proxy.ts/proxy.js replacing the deprecated middleware file convention, avoiding stale webpack defaults when newer framework guidance says otherwise, and Vercel Function duration limits such as the 300s default under Fluid Compute.`;
 }
 export function triwikiContextTrackingText(commandPrefix = 'sks') {
     const ctx = triwikiContextTracking(commandPrefix);
@@ -549,21 +564,34 @@ export const ROUTES = [
         cliEntrypoint: 'sks db scan',
         examples: ['$DB check this migration safely']
     },
+    {
+        id: 'MadDB',
+        command: '$MAD-DB',
+        mode: 'MADDB',
+        route: 'first-class MadDB SQL-plane execution',
+        description: 'Explicit one-cycle MadDB route. When invoked by $MAD-DB or sks mad-db run|exec|apply-migration, SQL-plane mutations such as CREATE, ALTER, table/schema DROP, column add/drop/rename, INSERT, UPDATE, DELETE including all-row mutations, TRUNCATE, execute_sql, and apply_migration are authorized for the bound Supabase project and must be executed with tool-result plus read-back proof. Supabase project/account/billing/credential control-plane actions remain denied.',
+        requiredSkills: ['mad-db', 'db-safety-guard', 'pipeline-runner', 'context7-docs', REFLECTION_SKILL_NAME, 'honest-mode'],
+        appSkillAliases: ['mad-db'],
+        lifecycle: ['explicit_invocation', 'single_mission_capability_v2', 'ephemeral_write_profile', 'tool_inventory', 'execute_sql_or_apply_migration', 'read_back_verification', 'close_and_read_only_restore', 'post_route_reflection', 'honest_mode'],
+        context7Policy: 'required',
+        reasoningPolicy: 'xhigh',
+        stopGate: 'mad-db-gate.json',
+        cliEntrypoint: 'sks mad-db run|exec|apply-migration|status|close|revoke|doctor',
+        examples: ['$MAD-DB public.users legacy_code 컬럼 삭제', '$MAD-DB truncate public.staging_events']
+    },
     {
         id: 'MadSKS',
         command: '$MAD-SKS',
         mode: 'MADSKS',
         route: 'explicit scoped permission-widening modifier',
-        description: 'Explicit high-risk authorization modifier that can be combined with other $ commands to temporarily open approved target-project scopes such as files, shell, package installs, services, network, Computer Use/browser workflows, generated assets, file permissions, migrations, Supabase MCP DB writes, direct execute SQL, schema cleanup, and normal targeted DB writes for the active invocation, while preserving catastrophic wipe/all-row/project-management, credential-exfiltration, persistent security-weakening, and unrequested fallback safeguards.',
+        description: 'Explicit high-risk authorization modifier that can be combined with other $ commands to temporarily open approved target-project scopes such as files, shell, package installs, services, network, Computer Use/browser workflows, generated assets, file permissions, migrations, Supabase MCP DB writes, direct execute SQL, schema cleanup, and normal targeted DB writes for the active invocation, while preserving catastrophic wipe/all-row/project-management, credential-exfiltration, persistent security-weakening, and unrequested fallback safeguards. It is not the first-class MadDB destructive SQL-plane route.',
         requiredSkills: ['mad-sks', 'db-safety-guard', 'pipeline-runner', 'context7-docs', REFLECTION_SKILL_NAME, 'honest-mode'],
-        dollarAliases: ['$MAD-DB'],
-        appSkillAliases: ['mad-db'],
         lifecycle: ['explicit_invocation', 'auto_sealed_permission_scope', 'scoped_permission_override', 'catastrophic_guard', 'permission_deactivation', 'post_route_reflection', 'honest_mode'],
         context7Policy: 'required',
         reasoningPolicy: 'xhigh',
         stopGate: 'mad-sks-gate.json',
         cliEntrypoint: 'Codex App prompt route only: $MAD-SKS <task>',
-        examples: ['$MAD-SKS $Team target project maintenance with package/service/file and DB scopes', '$DB Supabase 점검 $MAD-SKS', '$MAD-DB enable one-cycle DB break-glass only after explicit ack']
+        examples: ['$MAD-SKS $Team target project maintenance with package/service/file and DB scopes', '$DB Supabase 점검 $MAD-SKS']
     },
     {
         id: 'GX',
@@ -964,6 +992,8 @@ export function routeRequiresSubagents(route, prompt = '') {
         return false;
     if (route.id === 'ImageUXReview')
         return false;
+    if (route.id === 'MadDB')
+        return false;
     if (route.id === 'Research' || route.id === 'AutoResearch')
         return true;
     if (route.id === 'Goal')
@@ -996,7 +1026,7 @@ export function simpleGitOnlyRouteId(prompt = '') {
 }
 export function reflectionRequiredForRoute(route) {
     const id = String(route?.id || route?.mode || route?.route || route || '').replace(/^\$/, '');
-    return /^(team|naruto|shadowclone|shadow-clone|kagebunshin|kage-bunshin|qaloop|qa-loop|ppt|imageuxreview|image-ux-review|research|autoresearch|db|database|madsks|mad-sks|gx)$/i.test(id);
+    return /^(team|naruto|shadowclone|shadow-clone|kagebunshin|kage-bunshin|qaloop|qa-loop|ppt|imageuxreview|image-ux-review|research|autoresearch|db|database|madsks|mad-sks|maddb|mad-db|gx)$/i.test(id);
 }
 export function looksLikeCodeChangingWork(prompt = '') {
     const text = String(prompt || '');
@@ -1038,7 +1068,7 @@ export function routeReasoning(route, prompt = '') {
     const base = ALLOWED_REASONING_EFFORTS.has(route?.reasoningPolicy) ? route.reasoningPolicy : 'medium';
     if (hasFromChatImgSignal(text))
         return reasoning('xhigh', 'from_chat_img_image_work_order_analysis');
-    if (/(?:^|\s)sks\s+--mad\b|(?:^|\s)--mad\b|\$MAD-SKS\b|\bmad-sks\b|\bmadsks\b/i.test(text))
+    if (/(?:^|\s)sks\s+--mad\b|(?:^|\s)--mad\b|\$MAD-SKS\b|\$MAD-DB\b|\bmad-sks\b|\bmadsks\b|\bmad-db\b|\bmaddb\b/i.test(text))
         return reasoning('xhigh', 'mad_sks_or_mad_launch_default');
     if (route?.id === 'Team' || route?.id === 'Naruto')
         return teamRouteReasoning(text);

package/dist/core/triwiki/triwiki-affected-graph.js CHANGED Viewed

@@ -35,7 +35,8 @@ export function computeTriWikiAffectedGraph(input) {
     const gatePacks = new Set();
     for (const impact of selected)
         gatePacks.add(impact.gate_pack);
-    const proofLookup = selected.map((impact) => {
+    const includeProofLookup = input.includeProofLookup !== false;
+    const proofLookup = includeProofLookup ? selected.map((impact) => {
         const cacheKey = computeTriWikiCacheKey({
             root: input.root,
             id: impact.gate_id,
@@ -46,7 +47,7 @@ export function computeTriWikiAffectedGraph(input) {
         });
         const hit = readReusableTriWikiProofCard({ root: input.root, subjectId: impact.gate_id, cacheKey: cacheKey.key });
         return { impact, hit };
-    });
+    }) : [];
     const reusedProofs = proofLookup
         .filter((row) => row.hit.hit && row.hit.card && row.hit.path)
         .map((row) => ({ gate_id: row.impact.gate_id, proof_id: row.hit.card.proof_id, path: row.hit.path }))

package/dist/core/version.js CHANGED Viewed

@@ -1,2 +1,2 @@
-export const PACKAGE_VERSION = '4.1.1';
+export const PACKAGE_VERSION = '4.2.1';
 //# sourceMappingURL=version.js.map

package/dist/core/zellij/zellij-slot-column-anchor.js CHANGED Viewed

@@ -115,7 +115,11 @@ function renderTelemetrySlotRows(snapshot) {
     });
 }
 function isMadDbActive(capability) {
-    if (!capability || capability.enabled !== true || capability.consumed === true)
+    if (!capability)
+        return false;
+    if (capability.schema === 'sks.mad-db-capability.v2' && !['transport_ready', 'active'].includes(String(capability.status || '')))
+        return false;
+    if (capability.schema !== 'sks.mad-db-capability.v2' && (capability.enabled !== true || capability.consumed === true))
         return false;
     const expires = Date.parse(capability.expires_at || '');
     return Number.isFinite(expires) && expires > Date.now();

package/dist/scripts/check-dist-runtime.js CHANGED Viewed

@@ -8,6 +8,7 @@ import { sourceSnapshot } from './lib/ensure-dist-fresh.js';
 const root = path.resolve(path.dirname(fileURLToPath(import.meta.url)), '..', '..');
 const distRoot = path.join(root, 'dist');
 const issues = [];
+const contractOnlyMarker = 'contract' + '_only';
 if (!fs.existsSync(distRoot))
     issues.push('dist_missing');
 requiredFile('dist/bin/sks.js');
@@ -63,8 +64,8 @@ if (fs.existsSync(distRoot)) {
         if (!rel.endsWith('.js'))
             continue;
         const text = fs.readFileSync(file, 'utf8');
-        if (text.includes('contract_only'))
-            issues.push(`contract_only:${rel}`);
+        if (text.includes(contractOnlyMarker))
+            issues.push(`${contractOnlyMarker}:${rel}`);
         if (/from\s+['"][^'"]+\.mjs['"]|import\(\s*['"][^'"]+\.mjs['"]\s*\)/.test(text)) {
             issues.push(`imports_mjs:${rel}`);
         }

package/dist/scripts/codex-0142-manifest-check.js CHANGED Viewed

@@ -8,11 +8,12 @@ const manifest = parity.manifest;
 const dep = pkg.dependencies?.['@openai/codex-sdk'];
 const lockSdk = lock.packages?.['node_modules/@openai/codex-sdk']?.version;
 const lockCli = lock.packages?.['node_modules/@openai/codex']?.version;
+const lockRootVersion = lock.packages?.['']?.version || lock.version;
 assertGate(parity.ok, 'Codex release manifest TS/JSON parity must hold', parity);
 assertGate(dep === manifest.sdkVersion, 'package.json must pin @openai/codex-sdk exactly to manifest sdkVersion', { dep, sdkVersion: manifest.sdkVersion });
 assertGate(lockSdk === manifest.sdkVersion, 'package-lock must resolve @openai/codex-sdk to manifest sdkVersion', { lockSdk, sdkVersion: manifest.sdkVersion });
 assertGate(lockCli === manifest.requiredCliVersion, 'package-lock must resolve @openai/codex to manifest requiredCliVersion', { lockCli, requiredCliVersion: manifest.requiredCliVersion });
-assertGate(pkg.version === '4.1.1', 'package version must be 4.1.1', { version: pkg.version });
+assertGate(pkg.version === lockRootVersion, 'package version must match package-lock root version', { version: pkg.version, lockRootVersion });
 emitGate('codex:0142:manifest', {
     manifest_sha256: parity.manifest_sha256,
     target_tag: manifest.targetTag,

package/dist/scripts/codex-control-all-pipelines-check.js CHANGED Viewed

@@ -10,6 +10,7 @@ const required = [
     'codex-control:thread-registry',
     'codex-control:side-effect-scope',
     'codex-control:empty-result-retry',
+    'codex-control:model-capacity-fallback',
     'codex-control:stream-idle-watchdog',
     'codex-control:tool-call-sequence-repair',
     'codex-control:keepalive-no-cot-leak'

package/dist/scripts/codex-control-model-capacity-fallback-check.js ADDED Viewed

@@ -0,0 +1,53 @@
+#!/usr/bin/env node
+// @ts-nocheck
+import { assertGate, emitGate, importDist, readText } from './sks-1-18-gate-lib.js';
+const mod = await importDist('core/codex-control/codex-reliability-shield.js');
+let attempts = 0;
+const seenAttempts = [];
+const result = await mod.runWithCodexReliabilityShield(baseTask(), async (attempt) => {
+    attempts += 1;
+    seenAttempts.push(attempt);
+    return {
+        ok: false,
+        sdkThreadId: '',
+        sdkRunId: null,
+        events: [{ type: 'turn.failed', message: 'Selected model is at capacity. Please try a different model.' }],
+        finalResponse: '',
+        structuredOutput: null,
+        blockers: ['Selected model is at capacity. Please try a different model.']
+    };
+});
+assertGate(attempts === 1, 'model capacity must not retry with downgraded pressure', { attempts, seenAttempts, result });
+assertGate(result.reliabilityShield.ok === false, 'terminal model capacity must remain visible as a blocker', result.reliabilityShield);
+assertGate(result.reliabilityShield.retry_count === 0, 'capacity retry count must stay zero', result.reliabilityShield);
+assertGate(result.reliabilityShield.model_capacity_retry_count === 0, 'model capacity retry must not be counted', result.reliabilityShield);
+assertGate(result.reliabilityShield.selected_model_capacity_fallback === false, 'capacity fallback flag must not be selected', result.reliabilityShield);
+assertGate(result.reliabilityShield.attempts[0].retryable === false, 'capacity attempt must be terminal', result.reliabilityShield.attempts[0]);
+assertGate(result.reliabilityShield.attempts[0].retry_reason === null, 'capacity retry reason must stay null', result.reliabilityShield.attempts[0]);
+assertGate(result.reliabilityShield.attempts[0].blockers.includes('codex_model_capacity_unavailable'), 'capacity blocker must be explicit', result.reliabilityShield.attempts[0]);
+assertGate(mod.isCodexModelCapacityError({ blockers: ['Selected model is at capacity. Please try a different model.'] }, []) === true, 'capacity classifier must recognize common Codex error text');
+const runnerSource = readText('src/core/codex-control/codex-task-runner.ts');
+assertGate(!runnerSource.includes("capacity_fallback_service_tier: 'standard'"), 'capacity fallback must not force standard service tier');
+assertGate(!runnerSource.includes("capacity_fallback_reasoning_effort: 'low'"), 'capacity fallback must not force low reasoning');
+assertGate(!runnerSource.includes('SKS_CODEX_CAPACITY_FALLBACK_MODEL'), 'capacity fallback model override must be removed');
+emitGate('codex-control:model-capacity-fallback', {
+    attempts,
+    retry_count: result.reliabilityShield.retry_count,
+    model_capacity_retry_count: result.reliabilityShield.model_capacity_retry_count
+});
+function baseTask() {
+    return {
+        route: '$Agent',
+        tier: 'worker',
+        missionId: 'M-model-capacity-fallback',
+        cwd: process.cwd(),
+        prompt: 'model capacity fallback fixture',
+        outputSchemaId: 'sks.agent-worker-result.v1',
+        outputSchema: {},
+        sandboxPolicy: 'read-only',
+        requestedScopeContract: { read_only: true },
+        reliabilityPolicy: { maxEmptyResultRetries: 1, idleTimeoutMs: 5000, timeoutClass: 'short' },
+        mutationLedgerRoot: process.cwd()
+    };
+}
+//# sourceMappingURL=codex-control-model-capacity-fallback-check.js.map

package/dist/scripts/config-managed-merge-callsite-coverage-check.js CHANGED Viewed

@@ -114,11 +114,17 @@ const ALLOWLIST = [
         reason: 'migration journal writes hashes and rollback metadata, not raw secret config values',
         expires: '3.2.0'
     },
+    {
+        file: 'src/core/mad-db/mad-db-runtime-profile.ts',
+        pattern: /codex-mad-db\.config\.toml|writeTextAtomic/,
+        reason: 'MAD-DB runtime profile writes only a mission-local temporary Codex profile and verifies read-only restoration on close',
+        expires: '4.3.0'
+    },
     {
         file: 'src/core/providers/glm/naruto/glm-naruto-trace.ts',
         pattern: /mission-result\.json|sanitizeArtifact/,
         reason: 'GLM Naruto trace writer persists sanitized mission-result proof artifacts, not raw env secret files',
-        expires: '4.2.0'
+        expires: '4.3.0'
     }
 ];
 const sources = listSourceFiles().map((file) => ({