npm - sneakoscope - Versions diffs - 3.1.7 → 3.1.9 - Mend

sneakoscope 3.1.7 → 3.1.9

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (50) hide show

package/README.md +9 -2
package/crates/sks-core/Cargo.lock +1 -1
package/crates/sks-core/Cargo.toml +1 -1
package/crates/sks-core/src/main.rs +1 -1
package/dist/.sks-build-stamp.json +4 -4
package/dist/bin/sks.js +1 -1
package/dist/cli/args.js +17 -0
package/dist/cli/command-registry.js +16 -13
package/dist/cli/router.js +8 -5
package/dist/commands/doctor.js +97 -2
package/dist/core/codex-app/codex-skill-sync.js +80 -154
package/dist/core/codex-native/core-skill-integrity.js +89 -0
package/dist/core/codex-native/core-skill-manifest.js +156 -0
package/dist/core/codex-native/native-capability-postcheck.js +35 -0
package/dist/core/codex-native/native-capability-repair-matrix.js +210 -0
package/dist/core/codex-native/native-capability-repair.js +47 -0
package/dist/core/codex-native/native-media-computer-repair.js +5 -0
package/dist/core/codex-native/project-skill-dedupe.js +109 -0
package/dist/core/codex-native/skill-name-canonicalizer.js +21 -0
package/dist/core/codex-native/skill-registry-ledger.js +85 -0
package/dist/core/commands/basic-cli.js +19 -10
package/dist/core/commands/mad-sks-command.js +36 -13
package/dist/core/commands/naruto-command.js +4 -1
package/dist/core/commands/pipeline-command.js +3 -4
package/dist/core/commands/qa-loop-command.js +36 -1
package/dist/core/commands/research-command.js +61 -1
package/dist/core/commands/team-command.js +63 -3
package/dist/core/config/config-migration-journal.js +27 -0
package/dist/core/config/managed-config-merge.js +105 -0
package/dist/core/config/secret-preservation.js +169 -0
package/dist/core/config/supabase-secret-preservation.js +29 -0
package/dist/core/decision-contract.js +28 -4
package/dist/core/doctor/command-alias-cleanup.js +64 -0
package/dist/core/doctor/doctor-native-capability-repair.js +48 -0
package/dist/core/feature-fixtures.js +2 -0
package/dist/core/feature-registry.js +2 -2
package/dist/core/fsx.js +1 -1
package/dist/core/init.js +5 -1
package/dist/core/naruto/naruto-work-graph.js +4 -1
package/dist/core/pipeline-internals/runtime-core.js +50 -4
package/dist/core/pipeline-internals/runtime-gates.js +10 -1
package/dist/core/proof/route-proof-gate.js +1 -1
package/dist/core/qa-loop.js +227 -11
package/dist/core/questions.js +239 -2
package/dist/core/routes.js +3 -4
package/dist/core/version.js +1 -1
package/dist/scripts/agent-native-release-gate.js +13 -4
package/dist/scripts/sizecheck.js +8 -2
package/dist/scripts/sks-3-1-8-check-lib.js +30 -0
package/package.json +27 -1

package/dist/core/pipeline-internals/runtime-core.js CHANGED Viewed

@@ -3,7 +3,7 @@ import path from 'node:path';
 import { appendJsonl, exists, nowIso, readJson, readText, writeJsonAtomic, writeTextAtomic } from '../fsx.js';
 import { containsUserQuestion, noQuestionContinuationReason } from '../no-question-guard.js';
 import { createMission, missionDir, setCurrent } from '../mission.js';
-import { buildQuestionSchemaForRoute, writeQuestions } from '../questions.js';
+import { buildQuestionSchemaForRoute, buildRequestIntake, REQUEST_INTAKE_ARTIFACT, writeQuestions } from '../questions.js';
 import { sealContract } from '../decision-contract.js';
 import { scanDbSafety } from '../db-safety.js';
 import { GOAL_WORKFLOW_ARTIFACT, writeGoalWorkflow } from '../goal-workflow.js';
@@ -81,6 +81,8 @@ function reflectionInstructionText(commandPrefix = 'sks') {
 export function buildPipelinePlan(input = {}) {
     const route = input.route || routePrompt(input.task || '$SKS');
     const task = String(input.task || '').trim();
+    const requestIntake = input.requestIntake || null;
+    const executionPrompt = String(requestIntake?.transformed_prompt || task || '').trim();
     const ambiguity = normalizeAmbiguity(input.ambiguity, route);
     const proof = normalizeProofField(input.proofField);
     const lane = selectPipelineLane(route, task, proof);
@@ -106,6 +108,18 @@ export function buildPipelinePlan(input = {}) {
             reflection_required: reflectionRequiredForRoute(route)
         },
         task,
+        request_intake: requestIntake ? {
+            artifact: REQUEST_INTAKE_ARTIFACT,
+            prompt_hash: requestIntake.prompt_hash || null,
+            interpreted_goal: requestIntake.interpreted_intent?.goal || null,
+            requirement_count: Array.isArray(requestIntake.requirements) ? requestIntake.requirements.length : 0,
+            transformed_prompt_available: Boolean(requestIntake.transformed_prompt),
+            wiki_context_used: requestIntake.wiki_context_used?.source || null
+        } : {
+            artifact: REQUEST_INTAKE_ARTIFACT,
+            status: 'not_attached'
+        },
+        execution_prompt: executionPrompt,
         ambiguity_gate: ambiguity,
         runtime_lane: lane,
         stages,
@@ -130,10 +144,37 @@ export function buildPipelinePlan(input = {}) {
     };
 }
 export async function writePipelinePlan(dir, input = {}) {
-    const plan = buildPipelinePlan(input);
+    const requestIntake = input.requestIntake || await writeRequestIntakeArtifact(dir, input);
+    const plan = buildPipelinePlan({ ...input, requestIntake });
     await writeJsonAtomic(path.join(dir, PIPELINE_PLAN_ARTIFACT), plan);
     return plan;
 }
+export async function writeRequestIntakeArtifact(dir, input = {}) {
+    const file = path.join(dir, REQUEST_INTAKE_ARTIFACT);
+    if (!input.requestIntake && !input.forceRequestIntakeRewrite) {
+        const existing = await readJson(file, null);
+        if (existing)
+            return existing;
+    }
+    const root = input.root || rootFromMissionDir(dir);
+    const wikiContext = input.wikiContext !== undefined
+        ? input.wikiContext
+        : await readJson(path.join(root, '.sneakoscope', 'wiki', 'context-pack.json'), null);
+    const intake = input.requestIntake || buildRequestIntake(input.task || '', {}, {
+        wikiContext,
+        route: input.route || null
+    });
+    await writeJsonAtomic(file, intake);
+    return intake;
+}
+function rootFromMissionDir(dir) {
+    const resolved = path.resolve(dir);
+    const parts = resolved.split(path.sep);
+    const idx = parts.lastIndexOf('.sneakoscope');
+    if (idx > 0)
+        return parts.slice(0, idx).join(path.sep) || path.sep;
+    return path.resolve(resolved, '..', '..', '..');
+}
 export function validatePipelinePlan(plan = {}) {
     const issues = [];
     if (plan.schema_version !== PIPELINE_PLAN_SCHEMA_VERSION)
@@ -336,12 +377,13 @@ function planVerification(route, proof) {
 function planNextActions(route, task, ambiguity, lane, agentPolicy = normalizeAgentPolicy(route, task, {})) {
     if (ambiguity.required && !ambiguity.passed) {
         return [
+            `read ${REQUEST_INTAKE_ARTIFACT} and preserve its source-order requirements`,
             'auto-seal execution contract from inferred answers',
             ...(looksLikeProblemSolvingRequest(task) ? ['run Solution Scout web search for similar fixes before editing'] : []),
             'continue with decision-contract.json'
         ];
     }
-    const actions = ['read pipeline-plan.json before work', 'execute kept stages only', 'run listed verification'];
+    const actions = [`read ${REQUEST_INTAKE_ARTIFACT} and use its transformed_prompt`, 'read pipeline-plan.json before work', 'execute kept stages only', 'run listed verification'];
     if (agentPolicy.required)
         actions.splice(1, 0, 'run sks agents run latest --json before implementation');
     if (!lane.fast_lane_allowed && routeRequiresSubagents(route, task)) {
@@ -375,6 +417,7 @@ export function promptPipelineContext(prompt, route = null) {
         'Hook visibility limit: hooks can inject context/status or block/continue a turn, but they cannot create arbitrary live chat bubbles; use team events, mission files, or normal assistant updates for live transcript details.',
         'Ambient Goal continuation: even without an explicit $Goal keyword, use Codex native /goal persistence when it helps keep long work resumable and complete; do not let it replace or skip the selected SKS route gates.',
         'Route contract: execution routes infer contract answers from the prompt, TriWiki/current-code defaults, and conservative SKS policy. DFix and Answer bypass stateful execution because they do not start implementation.',
+        `Wiki-informed request intake: when a mission exists, read ${REQUEST_INTAKE_ARTIFACT} before execution; preserve every source-order requirement, apply TriWiki attention/use_first and hydrate_first context, and execute request_intake.transformed_prompt through the selected route instead of relying on the vague original wording alone.`,
         'Plan-first interaction: when ambiguity questions are truly required, show the user only the missing human decision(s), then seal the decision contract internally and execute/verify.',
         'Question-shaped directive policy: before using Answer, decide whether a question is a real information request or an implicit instruction/complaint about broken behavior. Rhetorical bug reports, mandatory-policy statements, and "why is this not happening?" execution complaints must route to Naruto, not Answer.',
         'Best-practice prompt shape: extract Goal, Context, Constraints, and Done-when before implementation; keep questions compact and only ask for answers that can change scope, safety, user-facing behavior, or acceptance criteria.',
@@ -658,7 +701,8 @@ async function activePipelinePlanNote(root, state = {}) {
     const kept = plan.stage_summary?.kept ?? plan.kept_stages?.length ?? 0;
     const skipped = plan.stage_summary?.skipped ?? plan.skipped_stages?.length ?? 0;
     const next = Array.isArray(plan.next_actions) && plan.next_actions.length ? ` Next planned action: ${plan.next_actions[0]}.` : '';
-    return ` Pipeline plan: .sneakoscope/missions/${state.mission_id}/${PIPELINE_PLAN_ARTIFACT} (${lane}; kept=${kept}, skipped=${skipped}).${next}`;
+    const intake = plan.request_intake?.artifact ? ` Request intake: .sneakoscope/missions/${state.mission_id}/${plan.request_intake.artifact}; execution prompt=${plan.request_intake.transformed_prompt_available ? 'available' : 'missing'}.` : '';
+    return ` Pipeline plan: .sneakoscope/missions/${state.mission_id}/${PIPELINE_PLAN_ARTIFACT} (${lane}; kept=${kept}, skipped=${skipped}).${intake}${next}`;
 }
 async function prepareGoal(root, route, task, required) {
     const { id, dir, mission } = await createMission(root, { mode: 'goal', prompt: task });
@@ -1150,6 +1194,8 @@ function routeContext(route, id, task, required, next) {
 ${route.command} route prepared.
 Mission: ${id}
 Task: ${visibleTask}
+Request intake: .sneakoscope/missions/${id}/${REQUEST_INTAKE_ARTIFACT}
+Execution prompt: request-intake.transformed_prompt
 Pipeline plan: .sneakoscope/missions/${id}/${PIPELINE_PLAN_ARTIFACT}
 Required skills: ${route.requiredSkills.join(', ')}
 Stop gate: ${route.stopGate}

package/dist/core/pipeline-internals/runtime-gates.js CHANGED Viewed

@@ -4,6 +4,7 @@ import { appendJsonl, exists, nowIso, readJson, readText, writeJsonAtomic } from
 import { containsUserQuestion, noQuestionContinuationReason } from '../no-question-guard.js';
 import { missionDir } from '../mission.js';
 import { evaluateResearchGate } from '../research.js';
+import { evaluateQaGate } from '../qa-loop.js';
 import { PPT_REQUIRED_GATE_FIELDS } from '../ppt.js';
 import { validateFinalHonestModeReport } from '../artifact-schemas.js';
 import { IMAGE_UX_REVIEW_GATE_ARTIFACT, IMAGE_UX_REVIEW_POLICY_ARTIFACT, IMAGE_UX_REVIEW_SCREEN_INVENTORY_ARTIFACT, IMAGE_UX_REVIEW_GENERATED_REVIEW_LEDGER_ARTIFACT, IMAGE_UX_REVIEW_ISSUE_LEDGER_ARTIFACT, IMAGE_UX_REVIEW_ITERATION_REPORT_ARTIFACT, IMAGE_UX_REVIEW_REQUIRED_GATE_FIELDS, IMAGE_UX_REVIEW_REFERENCE_GATE_FIELDS, IMAGE_UX_REVIEW_HONEST_MODE_ARTIFACT, imageUxReviewGateAllowsReferenceCloseout } from '../image-ux-review.js';
@@ -392,7 +393,9 @@ function missingRequiredGateFields(file, state, gate = {}) {
     if (file === 'qa-gate.json' || mode === 'QALOOP') {
         const required = ['clarification_contract_sealed', 'qa_report_written', 'qa_ledger_complete', 'checklist_completed', 'safety_reviewed', 'deployed_destructive_tests_blocked', 'credentials_not_persisted', 'honest_mode_complete'];
         if (gate.ui_e2e_required === true)
-            required.push('chrome_extension_preflight_passed', 'ui_chrome_extension_evidence');
+            required.push('chrome_extension_preflight_passed', 'ui_chrome_extension_evidence', 'ui_chrome_extension_screenshot_captured');
+        if (gate.gpt_image_2_annotated_review_required === true)
+            required.push('gpt_image_2_annotated_review_generated');
         return required.filter((key) => gate[key] !== true);
     }
     if (file === 'ppt-gate.json' || mode === 'PPT') {
@@ -421,6 +424,12 @@ async function missingRequiredGateArtifacts(root, file, state, gate = {}) {
             return [];
         return (evaluated.reasons || ['research_gate_blocked']).map((reason) => `research-gate:${reason}`);
     }
+    if (file === 'qa-gate.json' || mode === 'QALOOP') {
+        const evaluated = await evaluateQaGate(missionDir(root, state.mission_id));
+        if (evaluated.passed === true)
+            return [];
+        return (evaluated.reasons || ['qa_gate_blocked']).map((reason) => `qa-gate:${reason}`);
+    }
     if (file === IMAGE_UX_REVIEW_GATE_ARTIFACT || mode === 'IMAGE_UX_REVIEW')
         return missingImageUxReviewArtifacts(root, state, gate);
     if (file === 'naruto-gate.json' || mode === 'NARUTO')

package/dist/core/proof/route-proof-gate.js CHANGED Viewed

@@ -41,7 +41,7 @@ export async function validateRouteCompletionProof(root, { missionId = null, rou
             if (agentCount < 5)
                 issues.push('agent_count_below_5');
             if (agentCount > maxAgentCount)
-                issues.push(`agent_count_above_${maxAgentCount}`);
+                issues.push(normalizedRoute === '$Naruto' ? 'agent_count_above_100' : 'agent_count_above_20');
             if (agents.all_sessions_closed !== true)
                 issues.push('agent_sessions_not_closed');
             if (agents.no_overlap_ok !== true)

package/dist/core/qa-loop.js CHANGED Viewed

@@ -1,12 +1,16 @@
 import path from 'node:path';
 import { exists, nowIso, readJson, readText, writeJsonAtomic, writeTextAtomic, PACKAGE_VERSION } from './fsx.js';
-import { CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE, CODEX_WEB_VERIFICATION_POLICY, evidenceMentionsForbiddenBrowserAutomation, evidenceMentionsForbiddenWebComputerUseEvidence } from './routes.js';
+import { CODEX_APP_IMAGE_GENERATION_DOC_URL, CODEX_IMAGEGEN_REQUIRED_POLICY, CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE, CODEX_WEB_VERIFICATION_POLICY, evidenceMentionsForbiddenBrowserAutomation, evidenceMentionsForbiddenWebComputerUseEvidence } from './routes.js';
 import { appendAgentLedgerEvent, initializeAgentCentralLedger } from './agents/agent-central-ledger.js';
 import { resolveCodexAppExecutionProfile } from './codex-app/codex-app-execution-profile.js';
 import { resolveCodexNativeInvocationPlan } from './codex-native/codex-native-invocation-router.js';
+import { imageDimensions, sha256File } from './wiki-image/image-hash.js';
 export const QA_LOOP_ROUTE = 'QALoop';
+export const QA_LOOP_VISUAL_EVIDENCE_ARTIFACT = 'qa-loop/visual-evidence.json';
 const QA_REPORT_SUFFIX = 'qa-report.md';
 const UI_CHROME_EXTENSION_FIRST_ACK = 'use_codex_chrome_extension_first_no_computer_use_for_web_ui_or_mark_unverified';
+const GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK = 'yes_gpt_image_2_annotated_review';
+const IMAGE_FILE_RE = /\.(png|jpe?g|webp|gif)$/i;
 export const QA_NATIVE_AGENT_PERSONAS = Object.freeze([
     {
         id: 'qa_verifier_ui',
@@ -108,6 +112,9 @@ function promptText(prompt = '') {
 function lowerPrompt(prompt = '') {
     return promptText(prompt).toLowerCase();
 }
+function qaPromptWantsGptImage2AnnotatedReview(prompt = '') {
+    return /(gpt-image-2|gpt\s*image\s*2|imagegen|\$imagegen|annotated\s+review|annotated\s+image|callout|generated\s+review\s+image|이미지\s*리뷰|생성\s*이미지|주석\s*이미지|콜아웃)/i.test(promptText(prompt));
+}
 function firstUrl(prompt = '') {
     return promptText(prompt).match(/https?:\/\/[^\s)\]}>,]+/i)?.[0] || '';
 }
@@ -152,6 +159,16 @@ export function inferQaLoopAnswers(prompt = '') {
     const local = environment === 'local_dev_server';
     const login = loginPolicyFromPrompt(text);
     const scope = qaScopeFromPrompt(text);
+    const wantsGptImage2Review = isUiScope(scope) && qaPromptWantsGptImage2AnnotatedReview(text);
+    const acceptance = [
+        '앱 첫 화면 또는 지정된 대상이 정상 로드된다.',
+        '주요 내비게이션과 핵심 화면 진입에서 콘솔/화면상 치명 오류가 없다.',
+        '검증하지 못한 UI/API 범위는 통과로 주장하지 않고 QA 리포트에 남긴다.'
+    ];
+    if (isUiScope(scope))
+        acceptance.push('UI E2E 통과 증거는 실제 Codex Chrome Extension screenshot artifact path와 sha256을 기록해야 한다.');
+    if (wantsGptImage2Review)
+        acceptance.push('gpt-image-2 annotated review image가 필요한 경우 실제 Codex App $imagegen/gpt-image-2 출력 파일 path, sha256, model, provider를 기록해야 한다.');
     return {
         GOAL_PRECISE: text ? `현재 요청 범위에서 QA-LOOP를 안전하게 실행한다: ${text}` : '현재 로컬 개발 환경에서 핵심 사용자 흐름을 안전하게 QA한다.',
         QA_SCOPE: scope,
@@ -165,13 +182,10 @@ export function inferQaLoopAnswers(prompt = '') {
         ...login,
         CREDENTIAL_STORAGE_ACK: 'never_store_credentials_in_artifacts_or_wiki',
         UI_CHROME_EXTENSION_ACK: UI_CHROME_EXTENSION_FIRST_ACK,
+        QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED: wantsGptImage2Review ? GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK : 'not_required',
         TEAM_MODE_ALLOWED: 'no_parent_only',
         MAX_QA_CYCLES: '1',
-        ACCEPTANCE_CRITERIA: [
-            '앱 첫 화면 또는 지정된 대상이 정상 로드된다.',
-            '주요 내비게이션과 핵심 화면 진입에서 콘솔/화면상 치명 오류가 없다.',
-            '검증하지 못한 UI/API 범위는 통과로 주장하지 않고 QA 리포트에 남긴다.'
-        ],
+        ACCEPTANCE_CRITERIA: acceptance,
         NON_GOALS: [
             '결제, 실제 이메일/SMS 발송, 관리자 권한 변경, 데이터 삭제, 프로덕션 데이터 변경은 테스트하지 않는다.'
         ],
@@ -290,10 +304,22 @@ export function qaUiRequired(a = {}) {
 export function qaApiRequired(a = {}) {
     return a.QA_SCOPE === 'all_available' ? hasApiTarget(a) : isApiScope(a.QA_SCOPE);
 }
+export function qaGptImage2AnnotatedReviewRequired(contractOrAnswers = {}, prompt = '') {
+    const answers = contractOrAnswers?.answers || contractOrAnswers || {};
+    if (!qaUiRequired(answers))
+        return false;
+    const explicit = String(answers.QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED || answers.GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED || '').trim();
+    if (/^(yes|true|required|yes_gpt_image_2_annotated_review)$/i.test(explicit))
+        return true;
+    if (/^(no|false|not_required|none)$/i.test(explicit))
+        return false;
+    return qaPromptWantsGptImage2AnnotatedReview(`${prompt || ''}\n${answers.GOAL_PRECISE || ''}\n${JSON.stringify(answers.ACCEPTANCE_CRITERIA || [])}`);
+}
 export function defaultQaGate(contract = {}, opts = {}) {
     const a = contract.answers || {};
     const uiRequired = qaUiRequired(a);
     const apiRequired = qaApiRequired(a);
+    const gptImage2ReviewRequired = qaGptImage2AnnotatedReviewRequired(contract, contract.prompt);
     const reportFile = opts.reportFile || qaReportFilename();
     const corrective = a.QA_CORRECTIVE_POLICY !== 'report_only_no_code_changes';
     return {
@@ -311,6 +337,17 @@ export function defaultQaGate(contract = {}, opts = {}) {
         ui_chrome_extension_evidence: !uiRequired,
         ui_computer_use_evidence: false,
         ui_evidence_source: uiRequired ? null : 'not_required',
+        ui_chrome_extension_screenshot_required: uiRequired,
+        ui_chrome_extension_screenshot_captured: !uiRequired,
+        ui_chrome_extension_screenshot_artifact: null,
+        ui_chrome_extension_screenshot_sha256: null,
+        gpt_image_2_annotated_review_required: gptImage2ReviewRequired,
+        gpt_image_2_annotated_review_generated: !gptImage2ReviewRequired,
+        gpt_image_2_annotated_review_artifact: null,
+        gpt_image_2_annotated_review_sha256: null,
+        gpt_image_2_annotated_review_model: gptImage2ReviewRequired ? null : 'not_required',
+        gpt_image_2_annotated_review_provider: gptImage2ReviewRequired ? null : 'not_required',
+        qa_visual_evidence_artifact: QA_LOOP_VISUAL_EVIDENCE_ARTIFACT,
         desktop_app_handoff_required: false,
         desktop_app_handoff_status: 'not_requested',
         desktop_app_handoff_artifact: null,
@@ -360,13 +397,48 @@ export async function writeQaLoopArtifacts(dir, mission, contract) {
         codex_app_execution_profile: executionProfile ? compactExecutionProfile(executionProfile) : null,
         codex_native_invocation: codexNativeInvocation,
         target: { scope: a.QA_SCOPE, environment: a.TARGET_ENVIRONMENT, base_url: a.TARGET_BASE_URL, api_base_url: a.API_BASE_URL },
-        safety: { mutation_policy: a.QA_MUTATION_POLICY, deployed_destructive_tests_allowed: 'never', credentials: 'temp_only_never_saved', ui_evidence: 'codex_chrome_extension_first_required_for_web_ui_e2e' },
+        safety: { mutation_policy: a.QA_MUTATION_POLICY, deployed_destructive_tests_allowed: 'never', credentials: 'temp_only_never_saved', ui_evidence: 'codex_chrome_extension_first_required_for_web_ui_e2e', visual_review: 'gpt_image_2_annotated_review_required_when_contract_requests_it' },
         checklist
     });
+    await writeJsonAtomic(path.join(dir, QA_LOOP_VISUAL_EVIDENCE_ARTIFACT), buildQaLoopVisualEvidenceArtifact(mission, contract));
     await writeJsonAtomic(path.join(dir, 'qa-gate.json'), defaultQaGate(contract, { reportFile, executionProfile, codexNativeInvocation }));
     await writeTextAtomic(path.join(dir, reportFile), qaReportTemplate(mission, contract, checklist));
     return { checklist_count: checklist.length, report_file: reportFile };
 }
+export async function ensureQaLoopVisualEvidenceContract(dir, mission = {}, contract = {}) {
+    const visualPath = path.join(dir, QA_LOOP_VISUAL_EVIDENCE_ARTIFACT);
+    if (!(await exists(visualPath))) {
+        await writeJsonAtomic(visualPath, buildQaLoopVisualEvidenceArtifact(mission, contract));
+    }
+    const gatePath = path.join(dir, 'qa-gate.json');
+    const gate = await readJson(gatePath, null);
+    if (!gate)
+        return;
+    const defaults = defaultQaGate(contract, { reportFile: qaReportFileFromGate(gate) || qaReportFilename() });
+    const keys = [
+        'ui_chrome_extension_screenshot_required',
+        'ui_chrome_extension_screenshot_captured',
+        'ui_chrome_extension_screenshot_artifact',
+        'ui_chrome_extension_screenshot_sha256',
+        'gpt_image_2_annotated_review_required',
+        'gpt_image_2_annotated_review_generated',
+        'gpt_image_2_annotated_review_artifact',
+        'gpt_image_2_annotated_review_sha256',
+        'gpt_image_2_annotated_review_model',
+        'gpt_image_2_annotated_review_provider',
+        'qa_visual_evidence_artifact'
+    ];
+    const next = { ...gate };
+    let changed = false;
+    for (const key of keys) {
+        if (next[key] === undefined) {
+            next[key] = defaults[key];
+            changed = true;
+        }
+    }
+    if (changed)
+        await writeJsonAtomic(gatePath, next);
+}
 export async function evaluateQaGate(dir) {
     const gate = await readJson(path.join(dir, 'qa-gate.json'), {});
     const reportFile = qaReportFileFromGate(gate);
@@ -400,6 +472,10 @@ export async function evaluateQaGate(dir) {
             reasons.push('forbidden_browser_automation_evidence');
         if (evidenceMentionsForbiddenWebComputerUseEvidence({ evidence: gate.evidence, ui_evidence_source: gate.ui_evidence_source }))
             reasons.push('computer_use_web_evidence_forbidden');
+        reasons.push(...await missingQaLoopVisualEvidence(dir, gate));
+    }
+    else if (gate.gpt_image_2_annotated_review_required === true) {
+        reasons.push(...await missingQaLoopVisualEvidence(dir, gate));
     }
     if (gate.desktop_app_handoff_required === true) {
         if (!['pending', 'launched_pending_confirmation', 'completed'].includes(String(gate.desktop_app_handoff_status || '')))
@@ -424,8 +500,9 @@ export async function evaluateQaGate(dir) {
         reasons.push('qa_report_missing');
     if (!(await exists(path.join(dir, 'qa-ledger.json'))))
         reasons.push('qa_ledger_missing');
-    const passed = gate.passed === true && reasons.length === 0;
-    const result = { checked_at: nowIso(), passed, reasons, gate };
+    const uniqueReasons = [...new Set(reasons)];
+    const passed = gate.passed === true && uniqueReasons.length === 0;
+    const result = { checked_at: nowIso(), passed, reasons: uniqueReasons, gate };
     await writeJsonAtomic(path.join(dir, 'qa-gate.evaluated.json'), result);
     return result;
 }
@@ -514,12 +591,19 @@ ARTIFACTS: update qa-ledger.json, ${report}, qa-gate.json, and qa-loop/cycle-${c
 CONTRACT:
 ${JSON.stringify(contract, null, 2)}
 ${imageContractText}${appHandoffText}${executionProfileText}
+VISUAL EVIDENCE CONTRACT:
+- For web UI QA, do not set chrome_extension_preflight_passed/ui_chrome_extension_evidence to true unless the Codex Chrome Extension path is ready and ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT} records a real saved Chrome Extension screenshot artifact with path, sha256, and dimensions.
+- If decision-contract.json answers set QA_VISUAL_REVIEW_IMAGEGEN_REQUIRED=${GPT_IMAGE_2_ANNOTATED_REVIEW_REQUIRED_ACK}, use Codex App $imagegen/gpt-image-2 (${CODEX_APP_IMAGE_GENERATION_DOC_URL}) to produce a real generated annotated review image from the Chrome Extension screenshot. Record its path, sha256, model=gpt-image-2, provider=Codex App $imagegen, and source_screenshot_artifact in ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT} and qa-gate.json.
+- Do not substitute prose-only critique, Playwright/Selenium/Puppeteer/Browser Use screenshots, Computer Use browser screenshots, placeholder images, fake fixtures, or direct API fallback as full web UI visual evidence.
 Previous tail:
 ${String(previous || '').slice(-2500)}
 `;
 }
 export async function qaStatus(dir) {
-    const gate = await readJson(path.join(dir, 'qa-gate.evaluated.json'), await readJson(path.join(dir, 'qa-gate.json'), null));
+    const mission = await readJson(path.join(dir, 'mission.json'), {});
+    const contract = await readJson(path.join(dir, 'decision-contract.json'), { prompt: mission.prompt, answers: {}, sealed_hash: null });
+    await ensureQaLoopVisualEvidenceContract(dir, mission, contract).catch(() => undefined);
+    const gate = await evaluateQaGate(dir).catch(async () => await readJson(path.join(dir, 'qa-gate.evaluated.json'), await readJson(path.join(dir, 'qa-gate.json'), null)));
     const ledger = await readJson(path.join(dir, 'qa-ledger.json'), null);
     const appHandoff = await readJson(path.join(dir, 'qa-loop', 'app-handoff.json'), null);
     const appConfirmation = await readJson(path.join(dir, 'qa-loop', 'app-handoff-confirmation.json'), null);
@@ -545,6 +629,138 @@ function qaChecklist(a) {
     cases.push(['report.evidence', 'Record pass/fail/blocked/skipped with evidence.'], ['report.corrective_loop', 'Record fixes, rechecks, unresolved findings, deferred blockers.'], ['report.honest', 'Run Honest Mode.']);
     return cases.map(([id, title]) => ({ id, title, status: 'pending', evidence: [] }));
 }
+export function buildQaLoopVisualEvidenceArtifact(mission = {}, contract = {}) {
+    const answers = contract.answers || {};
+    const uiRequired = qaUiRequired(answers);
+    const gptImage2ReviewRequired = qaGptImage2AnnotatedReviewRequired(contract, contract.prompt || mission.prompt);
+    return {
+        schema: 'sks.qa-loop-visual-evidence.v1',
+        generated_at: nowIso(),
+        mission_id: mission.id || contract.mission_id || null,
+        contract_hash: contract.sealed_hash || null,
+        required: uiRequired || gptImage2ReviewRequired,
+        chrome_extension_screenshot: {
+            required: uiRequired,
+            status: uiRequired ? 'pending' : 'not_required',
+            evidence_source: CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE,
+            artifact_path: null,
+            sha256: null,
+            width: null,
+            height: null,
+            privacy: 'local-only'
+        },
+        gpt_image_2_annotated_review: {
+            required: gptImage2ReviewRequired,
+            status: gptImage2ReviewRequired ? 'pending' : 'not_required',
+            model: gptImage2ReviewRequired ? 'gpt-image-2' : 'not_required',
+            provider: gptImage2ReviewRequired ? 'Codex App $imagegen' : 'not_required',
+            source_screenshot_artifact: null,
+            artifact_path: null,
+            sha256: null,
+            width: null,
+            height: null,
+            required_output: gptImage2ReviewRequired ? 'generated_annotated_review_image_with_numbered_callouts_severity_labels_and_visual_marks' : 'not_required',
+            docs_url: CODEX_APP_IMAGE_GENERATION_DOC_URL,
+            privacy: 'local-only'
+        },
+        blockers: uiRequired ? ['chrome_extension_screenshot_missing'] : [],
+        notes: [
+            'QA-LOOP web visual evidence must be backed by real saved local image files.',
+            CODEX_WEB_VERIFICATION_POLICY,
+            CODEX_IMAGEGEN_REQUIRED_POLICY
+        ]
+    };
+}
+async function missingQaLoopVisualEvidence(dir, gate = {}) {
+    const visual = await readJson(path.join(dir, QA_LOOP_VISUAL_EVIDENCE_ARTIFACT), null);
+    const reasons = [];
+    const uiRequired = gate.ui_e2e_required === true;
+    if (uiRequired) {
+        const screenshot = visual?.chrome_extension_screenshot || {};
+        if (gate.ui_chrome_extension_screenshot_captured !== true && !positiveVisualStatus(screenshot.status, ['captured', 'attached', 'verified']))
+            reasons.push('ui_chrome_extension_screenshot_missing');
+        const screenshotPath = firstNonEmpty(gate.ui_chrome_extension_screenshot_artifact, gate.chrome_extension_screenshot_artifact, gate.ui_chrome_extension_screenshot?.path, gate.chrome_extension_screenshot?.path, screenshot.artifact_path, screenshot.path);
+        const screenshotSha = firstNonEmpty(gate.ui_chrome_extension_screenshot_sha256, gate.chrome_extension_screenshot_sha256, gate.ui_chrome_extension_screenshot?.sha256, gate.chrome_extension_screenshot?.sha256, screenshot.sha256);
+        const screenshotDims = {
+            width: firstNonEmpty(gate.ui_chrome_extension_screenshot_width, gate.ui_chrome_extension_screenshot?.width, gate.chrome_extension_screenshot?.width, screenshot.width),
+            height: firstNonEmpty(gate.ui_chrome_extension_screenshot_height, gate.ui_chrome_extension_screenshot?.height, gate.chrome_extension_screenshot?.height, screenshot.height)
+        };
+        if (!screenshotPath)
+            reasons.push('ui_chrome_extension_screenshot_artifact_missing');
+        else
+            reasons.push(...await imageEvidenceFileReasons(dir, screenshotPath, screenshotSha, 'ui_chrome_extension_screenshot', screenshotDims));
+        const screenshotSource = firstNonEmpty(gate.ui_chrome_extension_screenshot_source, screenshot.evidence_source, gate.ui_evidence_source);
+        if (screenshotSource !== CODEX_WEB_VERIFICATION_EVIDENCE_SOURCE)
+            reasons.push('ui_chrome_extension_screenshot_source_not_codex_chrome_extension');
+    }
+    const review = visual?.gpt_image_2_annotated_review || {};
+    const gptImage2ReviewRequired = gate.gpt_image_2_annotated_review_required === true || review.required === true;
+    if (gptImage2ReviewRequired) {
+        if (gate.gpt_image_2_annotated_review_generated !== true && !positiveVisualStatus(review.status, ['generated', 'attached', 'verified']))
+            reasons.push('gpt_image_2_annotated_review_image_missing');
+        const reviewPath = firstNonEmpty(gate.gpt_image_2_annotated_review_artifact, gate.imagegen_annotated_review_artifact, gate.gpt_image_2_annotated_review?.path, gate.gpt_image_2_annotated_review_image?.path, review.artifact_path, review.path);
+        const reviewSha = firstNonEmpty(gate.gpt_image_2_annotated_review_sha256, gate.gpt_image_2_annotated_review?.sha256, gate.gpt_image_2_annotated_review_image?.sha256, review.sha256);
+        const reviewDims = {
+            width: firstNonEmpty(gate.gpt_image_2_annotated_review_width, gate.gpt_image_2_annotated_review?.width, gate.gpt_image_2_annotated_review_image?.width, review.width),
+            height: firstNonEmpty(gate.gpt_image_2_annotated_review_height, gate.gpt_image_2_annotated_review?.height, gate.gpt_image_2_annotated_review_image?.height, review.height)
+        };
+        if (!reviewPath)
+            reasons.push('gpt_image_2_annotated_review_artifact_missing');
+        else
+            reasons.push(...await imageEvidenceFileReasons(dir, reviewPath, reviewSha, 'gpt_image_2_annotated_review', reviewDims));
+        const model = firstNonEmpty(gate.gpt_image_2_annotated_review_model, gate.gpt_image_2_annotated_review?.model, gate.gpt_image_2_annotated_review_image?.model, review.model, review.provider?.model);
+        if (model !== 'gpt-image-2')
+            reasons.push('gpt_image_2_annotated_review_model_missing');
+        const provider = firstNonEmpty(gate.gpt_image_2_annotated_review_provider, gate.gpt_image_2_annotated_review?.provider, gate.gpt_image_2_annotated_review_image?.provider, review.provider, review.provider_surface);
+        if (!provider || !/codex\s+app|\$imagegen|codex_app_imagegen/i.test(String(provider)))
+            reasons.push('gpt_image_2_annotated_review_provider_not_codex_app_imagegen');
+        if (/mock|fake|fixture|placeholder|text[-_ ]?only|direct\s+api|openai_images_api|responses_image_generation/i.test(String(provider)))
+            reasons.push('gpt_image_2_annotated_review_provider_forbidden');
+        const sourceScreenshot = firstNonEmpty(gate.gpt_image_2_source_screenshot_artifact, gate.gpt_image_2_annotated_review?.source_screenshot_artifact, gate.gpt_image_2_annotated_review_image?.source_screenshot_artifact, review.source_screenshot_artifact, gate.ui_chrome_extension_screenshot_artifact);
+        if (!sourceScreenshot)
+            reasons.push('gpt_image_2_source_screenshot_artifact_missing');
+    }
+    return [...new Set(reasons)];
+}
+/**
+ * Tells whether a visual-evidence status is one of the accepted values.
+ *
+ * The status is stringified (falsy values become the empty string), trimmed
+ * and lower-cased before the lookup; entries of `accepted` are compared as given.
+ *
+ * @param {*} status - Raw status value from the gate or visual-evidence record.
+ * @param {string[]} accepted - Status values that count as positive.
+ * @returns {boolean} True when the normalised status appears in `accepted`.
+ */
+function positiveVisualStatus(status, accepted) {
+    const normalized = String(status || '').trim().toLowerCase();
+    return accepted.includes(normalized);
+}
+/**
+ * Picks the first usable value from the argument list.
+ *
+ * Strings qualify only when they contain non-whitespace text and are returned
+ * trimmed; any other value qualifies when it is truthy and is returned as-is.
+ *
+ * @param {...*} values - Candidates, in priority order.
+ * @returns {*} The first qualifying candidate, or null when none qualifies.
+ */
+function firstNonEmpty(...values) {
+    for (const candidate of values) {
+        if (typeof candidate === 'string') {
+            const trimmed = candidate.trim();
+            if (trimmed)
+                return trimmed;
+            continue;
+        }
+        if (candidate)
+            return candidate;
+    }
+    return null;
+}
+/**
+ * Checks one image evidence artifact on disk and collects gate-failure reason codes.
+ *
+ * Every reason is `${prefix}_` followed by one of: artifact_path_invalid,
+ * artifact_not_image_file, artifact_file_missing, sha256_missing,
+ * sha256_unverifiable, sha256_mismatch, dimensions_missing.
+ *
+ * @param {string} dir - Directory that relative artifact paths are resolved against.
+ * @param {*} artifactPath - Declared artifact location, handed to resolveEvidencePath.
+ * @param {*} declaredSha - Declared digest; compared as a string with the computed one.
+ * @param {string} prefix - Prefix prepended to every reason code.
+ * @param {{width?: *, height?: *}} [declaredDims] - Declared dimensions, used only
+ *   when the measured ones are null/undefined.
+ * @returns {Promise<string[]>} Reason codes; empty when every check passes.
+ */
+async function imageEvidenceFileReasons(dir, artifactPath, declaredSha, prefix, declaredDims = {}) {
+    const resolved = resolveEvidencePath(dir, artifactPath);
+    if (!resolved)
+        return [`${prefix}_artifact_path_invalid`];
+    const reasons = [];
+    if (!IMAGE_FILE_RE.test(resolved))
+        reasons.push(`${prefix}_artifact_not_image_file`);
+    // Nothing further can be checked without the file, so stop here.
+    if (!(await exists(resolved)))
+        return [...reasons, `${prefix}_artifact_file_missing`];
+    // Hashing and measuring are independent; each probe degrades to null on failure.
+    const [sha, dims] = await Promise.all([
+        sha256File(resolved).catch(() => null),
+        imageDimensions(resolved).catch(() => null)
+    ]);
+    if (!declaredSha) {
+        reasons.push(`${prefix}_sha256_missing`);
+    }
+    else if (!sha) {
+        // Fail closed: a declared digest that could not be checked against the
+        // file must not be treated as verified.
+        reasons.push(`${prefix}_sha256_unverifiable`);
+    }
+    else if (String(declaredSha) !== sha) {
+        reasons.push(`${prefix}_sha256_mismatch`);
+    }
+    // Measured dimensions win; declared ones are only a fallback.
+    const width = Number(dims?.width ?? declaredDims?.width);
+    const height = Number(dims?.height ?? declaredDims?.height);
+    if (!Number.isFinite(width) || !Number.isFinite(height) || width <= 0 || height <= 0)
+        reasons.push(`${prefix}_dimensions_missing`);
+    return reasons;
+}
+/**
+ * Turns a declared evidence location into an absolute filesystem path.
+ *
+ * Accepts plain paths (absolute, or relative to `dir`) and `file://` URLs.
+ * For `file://` URLs the optional `localhost` authority is dropped and
+ * percent-encoded characters are decoded, so `file:///tmp/my%20shot.png`
+ * resolves to `/tmp/my shot.png`. Empty values and http(s) URLs are rejected.
+ *
+ * @param {string} dir - Base directory for relative paths.
+ * @param {*} artifactPath - Declared location; falsy values are treated as empty.
+ * @returns {string|null} Absolute path, or null when the value is empty or an http(s) URL.
+ */
+function resolveEvidencePath(dir, artifactPath) {
+    const raw = String(artifactPath || '').trim();
+    let value = raw;
+    if (/^file:\/\//i.test(raw)) {
+        // Drop the scheme and, when present, the "localhost" authority.
+        value = raw.replace(/^file:\/\/(?:localhost(?=\/))?/i, '');
+        try {
+            value = decodeURIComponent(value);
+        }
+        catch (err) {
+            // A malformed escape sequence is kept verbatim; anything else is unexpected.
+            if (!(err instanceof URIError))
+                throw err;
+        }
+        // "file:///C:/x" leaves "/C:/x"; on Windows the drive letter must lead.
+        if (path.sep === '\\' && /^\/[A-Za-z]:[\\/]/.test(value))
+            value = value.slice(1);
+    }
+    if (!value || /^https?:\/\//i.test(value))
+        return null;
+    return path.isAbsolute(value) ? value : path.resolve(dir, value);
+}
 function missionRootFromDir(dir) {
     const normalized = path.resolve(String(dir || ''));
     const marker = `${path.sep}.sneakoscope${path.sep}missions${path.sep}`;
@@ -564,7 +780,7 @@ function compactExecutionProfile(profile) {
 }
 /**
  * Builds the initial QA-LOOP report as a markdown string.
  *
  * The report carries the mission id, the target / scope / environment read
  * from `contract.answers` (each shown as 'unset' when falsy), a Safety
  * section, one unchecked checkbox per checklist item, and "TBD" placeholders
  * for Findings, Corrections And Rechecks, and Honest Mode.
  *
  * @param {object} mission - Mission record; only `id` is read.
  * @param {object} contract - Contract record; only `answers` is read.
  * @param {Array<{id: *, title: *}>} checklist - Items rendered as `- [ ] id: title`.
  * @returns {string} Markdown text of the report skeleton.
  */
 function qaReportTemplate(mission, contract, checklist) {
     // Missing answers fall back to an empty object so every field renders as 'unset'.
     const a = contract.answers || {};
-    return `# QA-LOOP Report\n\nMission: ${mission.id}\nTarget: ${a.TARGET_BASE_URL || 'unset'}\nScope: ${a.QA_SCOPE || 'unset'}\nEnvironment: ${a.TARGET_ENVIRONMENT || 'unset'}\n\n## Safety\n\n- Deployed destructive tests: never\n- Credentials: temp-only, never saved\n- UI evidence: ${CODEX_WEB_VERIFICATION_POLICY}\n\n## Checklist\n\n${checklist.map((item) => `- [ ] ${item.id}: ${item.title}`).join('\n')}\n\n## Findings\n\nTBD\n\n## Corrections And Rechecks\n\nTBD\n\n## Honest Mode\n\nTBD\n`;
+    return `# QA-LOOP Report\n\nMission: ${mission.id}\nTarget: ${a.TARGET_BASE_URL || 'unset'}\nScope: ${a.QA_SCOPE || 'unset'}\nEnvironment: ${a.TARGET_ENVIRONMENT || 'unset'}\n\n## Safety\n\n- Deployed destructive tests: never\n- Credentials: temp-only, never saved\n- UI evidence: ${CODEX_WEB_VERIFICATION_POLICY}\n- Visual evidence ledger: ${QA_LOOP_VISUAL_EVIDENCE_ARTIFACT}\n\n## Checklist\n\n${checklist.map((item) => `- [ ] ${item.id}: ${item.title}`).join('\n')}\n\n## Findings\n\nTBD\n\n## Corrections And Rechecks\n\nTBD\n\n## Honest Mode\n\nTBD\n`;
 }
 function positiveCount(value) {
     const n = Number(value || 0);