npm - @veraxhq/verax - Versions diffs - 0.1.0 → 0.2.0 - Mend

@veraxhq/verax 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (126) hide show

package/README.md +123 -88
package/bin/verax.js +11 -452
package/package.json +14 -36
package/src/cli/commands/default.js +523 -0
package/src/cli/commands/doctor.js +165 -0
package/src/cli/commands/inspect.js +109 -0
package/src/cli/commands/run.js +402 -0
package/src/cli/entry.js +196 -0
package/src/cli/util/atomic-write.js +37 -0
package/src/cli/util/detection-engine.js +296 -0
package/src/cli/util/env-url.js +33 -0
package/src/cli/util/errors.js +44 -0
package/src/cli/util/events.js +34 -0
package/src/cli/util/expectation-extractor.js +378 -0
package/src/cli/util/findings-writer.js +31 -0
package/src/cli/util/idgen.js +87 -0
package/src/cli/util/learn-writer.js +39 -0
package/src/cli/util/observation-engine.js +366 -0
package/src/cli/util/observe-writer.js +25 -0
package/src/cli/util/paths.js +29 -0
package/src/cli/util/project-discovery.js +277 -0
package/src/cli/util/project-writer.js +26 -0
package/src/cli/util/redact.js +128 -0
package/src/cli/util/run-id.js +30 -0
package/src/cli/util/summary-writer.js +32 -0
package/src/verax/cli/ci-summary.js +35 -0
package/src/verax/cli/context-explanation.js +89 -0
package/src/verax/cli/doctor.js +277 -0
package/src/verax/cli/error-normalizer.js +154 -0
package/src/verax/cli/explain-output.js +105 -0
package/src/verax/cli/finding-explainer.js +130 -0
package/src/verax/cli/init.js +237 -0
package/src/verax/cli/run-overview.js +163 -0
package/src/verax/cli/url-safety.js +101 -0
package/src/verax/cli/wizard.js +98 -0
package/src/verax/cli/zero-findings-explainer.js +57 -0
package/src/verax/cli/zero-interaction-explainer.js +127 -0
package/src/verax/core/action-classifier.js +86 -0
package/src/verax/core/budget-engine.js +218 -0
package/src/verax/core/canonical-outcomes.js +157 -0
package/src/verax/core/decision-snapshot.js +335 -0
package/src/verax/core/determinism-model.js +403 -0
package/src/verax/core/incremental-store.js +237 -0
package/src/verax/core/invariants.js +356 -0
package/src/verax/core/promise-model.js +230 -0
package/src/verax/core/replay-validator.js +350 -0
package/src/verax/core/replay.js +222 -0
package/src/verax/core/run-id.js +175 -0
package/src/verax/core/run-manifest.js +99 -0
package/src/verax/core/silence-impact.js +369 -0
package/src/verax/core/silence-model.js +521 -0
package/src/verax/detect/comparison.js +2 -34
package/src/verax/detect/confidence-engine.js +764 -329
package/src/verax/detect/detection-engine.js +293 -0
package/src/verax/detect/evidence-index.js +177 -0
package/src/verax/detect/expectation-model.js +194 -172
package/src/verax/detect/explanation-helpers.js +187 -0
package/src/verax/detect/finding-detector.js +450 -0
package/src/verax/detect/findings-writer.js +44 -8
package/src/verax/detect/flow-detector.js +366 -0
package/src/verax/detect/index.js +172 -286
package/src/verax/detect/interactive-findings.js +613 -0
package/src/verax/detect/signal-mapper.js +308 -0
package/src/verax/detect/verdict-engine.js +563 -0
package/src/verax/evidence-index-writer.js +61 -0
package/src/verax/index.js +90 -14
package/src/verax/intel/effect-detector.js +368 -0
package/src/verax/intel/handler-mapper.js +249 -0
package/src/verax/intel/index.js +281 -0
package/src/verax/intel/route-extractor.js +280 -0
package/src/verax/intel/ts-program.js +256 -0
package/src/verax/intel/vue-navigation-extractor.js +579 -0
package/src/verax/intel/vue-router-extractor.js +323 -0
package/src/verax/learn/action-contract-extractor.js +335 -101
package/src/verax/learn/ast-contract-extractor.js +95 -5
package/src/verax/learn/flow-extractor.js +172 -0
package/src/verax/learn/manifest-writer.js +97 -47
package/src/verax/learn/project-detector.js +40 -0
package/src/verax/learn/route-extractor.js +27 -96
package/src/verax/learn/state-extractor.js +212 -0
package/src/verax/learn/static-extractor-navigation.js +114 -0
package/src/verax/learn/static-extractor-validation.js +88 -0
package/src/verax/learn/static-extractor.js +112 -4
package/src/verax/learn/truth-assessor.js +24 -21
package/src/verax/observe/aria-sensor.js +211 -0
package/src/verax/observe/browser.js +10 -5
package/src/verax/observe/console-sensor.js +1 -17
package/src/verax/observe/domain-boundary.js +10 -1
package/src/verax/observe/expectation-executor.js +512 -0
package/src/verax/observe/flow-matcher.js +143 -0
package/src/verax/observe/focus-sensor.js +196 -0
package/src/verax/observe/human-driver.js +643 -275
package/src/verax/observe/index.js +908 -27
package/src/verax/observe/index.js.backup +1 -0
package/src/verax/observe/interaction-discovery.js +365 -14
package/src/verax/observe/interaction-runner.js +563 -198
package/src/verax/observe/loading-sensor.js +139 -0
package/src/verax/observe/navigation-sensor.js +255 -0
package/src/verax/observe/network-sensor.js +55 -7
package/src/verax/observe/observed-expectation-deriver.js +186 -0
package/src/verax/observe/observed-expectation.js +305 -0
package/src/verax/observe/page-frontier.js +234 -0
package/src/verax/observe/settle.js +37 -17
package/src/verax/observe/state-sensor.js +389 -0
package/src/verax/observe/timing-sensor.js +228 -0
package/src/verax/observe/traces-writer.js +61 -20
package/src/verax/observe/ui-signal-sensor.js +136 -17
package/src/verax/scan-summary-writer.js +77 -15
package/src/verax/shared/artifact-manager.js +110 -8
package/src/verax/shared/budget-profiles.js +136 -0
package/src/verax/shared/ci-detection.js +39 -0
package/src/verax/shared/config-loader.js +170 -0
package/src/verax/shared/dynamic-route-utils.js +218 -0
package/src/verax/shared/expectation-coverage.js +44 -0
package/src/verax/shared/expectation-prover.js +81 -0
package/src/verax/shared/expectation-tracker.js +201 -0
package/src/verax/shared/expectations-writer.js +60 -0
package/src/verax/shared/first-run.js +44 -0
package/src/verax/shared/progress-reporter.js +171 -0
package/src/verax/shared/retry-policy.js +14 -1
package/src/verax/shared/root-artifacts.js +49 -0
package/src/verax/shared/scan-budget.js +86 -0
package/src/verax/shared/url-normalizer.js +162 -0
package/src/verax/shared/zip-artifacts.js +65 -0
package/src/verax/validate/context-validator.js +244 -0
package/src/verax/validate/context-validator.js.bak +0 -0

package/src/verax/detect/verdict-engine.js ADDED Viewed

@@ -0,0 +1,563 @@
+/**
+ * OBSERVATION ENGINE
+ *
+ * Produces an observation summary from scan results.
+ *
+ * VERAX is an Outcome Observer - it does NOT judge, validate, or decide.
+ * It observes what code promises, what users do, and what actually happens.
+ * It reports observations, discrepancies, gaps, and unknowns - nothing more.
+ *
+ * NO VERDICT. NO JUDGMENT. NO SAFETY CLAIM. NO GO/NO-GO DECISIONS.
+ *
+ * PHASE 2: All observations include canonical outcome classifications.
+ * PHASE 3: All observations include Promise awareness - what promise was being evaluated.
+ * PHASE 4: All observations include Silence lifecycle - type, trigger, evaluation status, confidence impact.
+ */
+import fs from 'fs';
+import path from 'path';
+import { buildEvidenceIndex, writeEvidenceIndex } from './evidence-index.js';
+import { CANONICAL_OUTCOMES } from '../core/canonical-outcomes.js';
+import { SILENCE_TYPES, EVALUATION_STATUS } from '../core/silence-model.js';
+import { inferPromiseFromInteraction } from '../core/promise-model.js';
+import { createImpactSummary } from '../core/silence-impact.js';
+/**
+ * Compute observation summary from scan findings and analysis.
+ *
+ * SILENCE TRACKING: All gaps, timeouts, skips, sensor failures are explicit.
+ * Nothing unobserved is allowed to disappear.
+ *
+ * @param {Array} findings - Array of finding objects (observed discrepancies)
+ * @param {Object} observeTruth - Coverage data (what was observed); `traces`, `coverage`, `interactionsObserved` and `budgetExceeded` are read from it
+ * @param {Object} learnTruth - Learned route data; `expectationsDiscovered` is read from it
+ * @param {Array} coverageGaps - Expectations/interactions not evaluated
+ * @param {Boolean} budgetExceeded - Whether budget was exceeded during scan; when undefined, observeTruth.budgetExceeded is used instead
+ * @param {Object} [detectTruth=null] - Detection truth (includes silence data)
+ * @param {string|null} [projectDir=null] - Forwarded unchanged to buildEvidenceIndex
+ * @param {Object|null} [silenceTracker=null] - Forwarded unchanged to buildEvidenceIndex
+ * @returns {Object} ObservationSummary with findings, gaps, unknowns, coverage facts, silences
+ */
+export function computeObservationSummary(findings, observeTruth, learnTruth, coverageGaps, budgetExceeded, detectTruth = null, projectDir = null, silenceTracker = null) {
+  const isBudgetExceeded = budgetExceeded !== undefined ? budgetExceeded : (observeTruth?.budgetExceeded === true);
+  const traces = Array.isArray(observeTruth?.traces) ? observeTruth.traces : [];
+  const evidenceBuild = buildEvidenceIndex(traces, projectDir, silenceTracker);
+  // Extract coverage facts
+  const coverage = observeTruth?.coverage || {};
+  const pagesEvaluated = coverage.pagesVisited || 0;
+  const pagesDiscovered = coverage.pagesDiscovered || 0;
+  const interactionsEvaluated = coverage.interactionsExecuted || coverage.candidatesSelected || observeTruth?.interactionsObserved || 0;
+  const interactionsDiscovered = coverage.interactionsDiscovered || coverage.candidatesDiscovered || 0;
+  const expectationTotal = learnTruth?.expectationsDiscovered || 0;
+  const coverageGapsCount = coverageGaps?.length || 0;
+  // Never report a negative evaluated count when more gaps than expectations are supplied
+  const expectationsEvaluated = Math.max(0, expectationTotal - coverageGapsCount);
+  // Count unproven results (interactions without PROVEN expectations)
+  const unprovenTraces = traces.filter(t =>
+    t.unprovenResult === true || t.resultType === 'UNPROVEN_RESULT'
+  );
+  const skippedCount = coverage.skippedInteractions || 0;
+  // Count findings by confidence (for transparency, not judgment)
+  const findingsByConfidence = {
+    HIGH: 0,
+    MEDIUM: 0,
+    LOW: 0,
+    UNKNOWN: 0
+  };
+  const findingsByType = {};
+  const findingsByOutcome = {};  // PHASE 2: Added outcome tracking
+  const findingsByPromise = {};  // PHASE 3: Added promise tracking
+  for (const finding of (findings || [])) {
+    const confidence = finding.confidence?.level || 'UNKNOWN';
+    const type = finding.type || 'unknown';
+    const outcome = finding.outcome || CANONICAL_OUTCOMES.SILENT_FAILURE;  // Default for legacy findings
+    const promiseType = finding.promise?.type || 'UNKNOWN_PROMISE';  // PHASE 3
+    // Confidence levels outside the four known buckets are not counted
+    if (Object.prototype.hasOwnProperty.call(findingsByConfidence, confidence)) {
+      findingsByConfidence[confidence]++;
+    }
+    findingsByType[type] = (findingsByType[type] || 0) + 1;
+    findingsByOutcome[outcome] = (findingsByOutcome[outcome] || 0) + 1;  // PHASE 2
+    findingsByPromise[promiseType] = (findingsByPromise[promiseType] || 0) + 1;  // PHASE 3
+  }
+  // Calculate ratios (factual, not judgmental); null means "nothing discovered, ratio undefined"
+  const pageRatio = pagesDiscovered > 0 ? clampRatio(pagesEvaluated / pagesDiscovered) : (pagesDiscovered === 0 ? null : 0);
+  const interactionRatio = interactionsDiscovered > 0 ? clampRatio(interactionsEvaluated / interactionsDiscovered) : (interactionsDiscovered === 0 ? null : 0);
+  const expectationRatio = expectationTotal > 0 ? clampRatio(expectationsEvaluated / expectationTotal) : (expectationTotal === 0 ? null : 0);
+  // Identify gaps explicitly (each count is floored at zero)
+  const gaps = {
+    pages: pagesDiscovered > pagesEvaluated ? pagesDiscovered - pagesEvaluated : 0,
+    interactions: interactionsDiscovered > interactionsEvaluated ? interactionsDiscovered - interactionsEvaluated : 0,
+    expectations: coverageGapsCount,
+    skippedInteractions: skippedCount,
+    unprovenResults: unprovenTraces.length
+  };
+  // Build gap details
+  const gapDetails = [];
+  if (isBudgetExceeded) {
+    gapDetails.push({
+      outcome: CANONICAL_OUTCOMES.COVERAGE_GAP,  // PHASE 2
+      type: 'budget_exceeded',
+      message: `Budget limit reached: ${pagesEvaluated}/${pagesDiscovered} pages and ${interactionsEvaluated}/${interactionsDiscovered} interactions evaluated - observation incomplete`,
+      // Reuse the floored gap counts so "affected" can never be negative
+      pagesAffected: gaps.pages,
+      interactionsAffected: gaps.interactions
+    });
+  }
+  if (gaps.pages > 0) {
+    gapDetails.push({
+      outcome: CANONICAL_OUTCOMES.COVERAGE_GAP,  // PHASE 2
+      type: 'pages_not_evaluated',
+      message: `${gaps.pages} page(s) discovered but not visited - observations for these pages are unavailable`,
+      count: gaps.pages
+    });
+  }
+  if (gaps.interactions > 0) {
+    gapDetails.push({
+      outcome: CANONICAL_OUTCOMES.COVERAGE_GAP,  // PHASE 2
+      type: 'interactions_not_evaluated',
+      message: `${gaps.interactions} interaction(s) discovered but not executed - behavior of these interactions is unknown`,
+      count: gaps.interactions
+    });
+  }
+  if (gaps.expectations > 0) {
+    gapDetails.push({
+      outcome: CANONICAL_OUTCOMES.COVERAGE_GAP,  // PHASE 2
+      type: 'expectations_not_evaluated',
+      message: `${gaps.expectations} expectation(s) defined but not evaluated - cannot determine if code matches reality for these`,
+      count: gaps.expectations,
+      details: coverageGaps.slice(0, 10) // Limit detail list
+    });
+  }
+  if (gaps.skippedInteractions > 0) {
+    gapDetails.push({
+      outcome: CANONICAL_OUTCOMES.UNPROVEN_INTERACTION,  // PHASE 2: Executed but outcome not asserted
+      type: 'interactions_skipped',
+      message: `${gaps.skippedInteractions} interaction(s) executed but outcomes not evaluated (safety policy, ambiguous state, or technical limitations)`,
+      count: gaps.skippedInteractions
+    });
+  }
+  // Build observation summary
+  const summary = {
+    toolStatus: 'completed',
+    observations: {
+      discrepanciesObserved: findings?.length || 0,
+      discrepanciesByType: findingsByType,
+      discrepanciesByConfidence: findingsByConfidence,
+      discrepanciesByOutcome: findingsByOutcome,  // PHASE 2: Canonical outcomes
+      discrepanciesByPromise: findingsByPromise,  // PHASE 3: Promise types
+      findings: findings || []
+    },
+    coverage: {
+      pagesEvaluated,
+      pagesDiscovered,
+      pageRatio: pageRatio !== null ? pageRatio : undefined,
+      interactionsEvaluated,
+      interactionsDiscovered,
+      interactionRatio: interactionRatio !== null ? interactionRatio : undefined,
+      expectationsEvaluated,
+      expectationsDiscovered: expectationTotal,
+      expectationRatio: expectationRatio !== null ? expectationRatio : undefined
+    },
+    gaps: {
+      // Sum of all five raw gap counters (skipped interactions and unproven results included)
+      total: Object.values(gaps).reduce((a, b) => a + b, 0),
+      pages: gaps.pages,
+      interactions: gaps.interactions + gaps.skippedInteractions,
+      expectations: gaps.expectations,
+      unprovenResults: gaps.unprovenResults,
+      details: gapDetails
+    },
+    // SILENCE TRACKING: Attach all silence data for explicit reporting
+    silences: detectTruth?.silences || null,
+    // PHASE 4: Add silence impact accounting
+    silenceImpactSummary: detectTruth?.silences?.entries ?
+      createImpactSummary(detectTruth.silences.entries) :
+      null,
+    evidenceIndex: evidenceBuild.evidenceIndex,
+    observedAt: new Date().toISOString()
+  };
+  return summary;
+}
+/**
+ * Render a numeric confidence delta as a percentage, prefixing positive values with "+".
+ */
+function formatSignedPercent(value) {
+  return `${value > 0 ? '+' : ''}${value}%`;
+}
+/**
+ * Append one "    - label: count" line for every [key, count] pair whose count is above zero.
+ */
+function pushPositiveCounts(lines, entries, toLabel = (key) => key) {
+  for (const [key, count] of entries) {
+    if (count > 0) {
+      lines.push(`    - ${toLabel(key)}: ${count}`);
+    }
+  }
+}
+/**
+ * Return the five largest positive [key, count] pairs of a counter object, largest first.
+ */
+function topFiveCounts(counter) {
+  return Object.entries(counter)
+    .filter(([, count]) => count > 0)
+    .sort((a, b) => b[1] - a[1])
+    .slice(0, 5);
+}
+/**
+ * Format observation summary for console output.
+ *
+ * PHASE 2: Includes canonical outcome classifications
+ *
+ * SILENCE PHILOSOPHY:
+ * - Gaps/unknowns ALWAYS shown, even if zero (no silent success)
+ * - Timeouts, caps, skips, sensor failures explicitly reported
+ * - Zero counts are explicit: "(No gaps)" not hidden
+ * - Nothing unobserved is allowed to disappear
+ *
+ * Observational, not judgmental. Reports facts: what was observed, gaps, unknowns.
+ *
+ * @param {Object} observationSummary - Observation summary object; its `observations`,
+ *   `coverage`, `gaps`, `silences` and `silenceImpactSummary` properties are read
+ * @returns {string} Formatted observation report (lines joined with "\n")
+ */
+export function formatObservationSummary(observationSummary) {
+  const lines = [];
+  lines.push('\n═══════════════════════════════════════');
+  lines.push('OBSERVATION REPORT');
+  lines.push('═══════════════════════════════════════');
+  // Tool status (factual only)
+  lines.push('');
+  lines.push(`Tool Status: ${observationSummary.toolStatus || 'completed'}`);
+  lines.push(`(Indicates tool execution status, not site quality or safety)`);
+  // What was observed
+  lines.push('');
+  lines.push('DISCREPANCIES OBSERVED:');
+  const obs = observationSummary.observations || {};
+  lines.push(`  Count: ${obs.discrepanciesObserved || 0}`);
+  if (obs.discrepanciesObserved > 0) {
+    lines.push('  Types observed:');
+    // Types are listed unconditionally (no zero filter), unlike the breakdowns below
+    for (const [type, count] of Object.entries(obs.discrepanciesByType || {})) {
+      lines.push(`    - ${type}: ${count}`);
+    }
+    // PHASE 2: Show outcomes
+    if (obs.discrepanciesByOutcome && Object.keys(obs.discrepanciesByOutcome).length > 0) {
+      lines.push('  By outcome classification:');
+      pushPositiveCounts(lines, Object.entries(obs.discrepanciesByOutcome));
+    }
+    // PHASE 3: Show promises
+    if (obs.discrepanciesByPromise && Object.keys(obs.discrepanciesByPromise).length > 0) {
+      lines.push('  By promise type:');
+      pushPositiveCounts(
+        lines,
+        Object.entries(obs.discrepanciesByPromise),
+        (promise) => promise.replace(/_PROMISE$/, '').replace(/_/g, ' ')
+      );
+    }
+    lines.push('  By confidence level:');
+    const conf = obs.discrepanciesByConfidence || {};
+    if (conf.HIGH > 0) lines.push(`    - HIGH: ${conf.HIGH}`);
+    if (conf.MEDIUM > 0) lines.push(`    - MEDIUM: ${conf.MEDIUM}`);
+    if (conf.LOW > 0) lines.push(`    - LOW: ${conf.LOW}`);
+    if (conf.UNKNOWN > 0) lines.push(`    - UNKNOWN: ${conf.UNKNOWN}`);
+  } else {
+    lines.push('  No discrepancies observed between code promises and runtime behavior');
+  }
+  // Coverage facts
+  lines.push('');
+  lines.push('WHAT WAS EVALUATED:');
+  const cov = observationSummary.coverage || {};
+  lines.push(`  Pages: ${cov.pagesEvaluated || 0} of ${cov.pagesDiscovered || 0} discovered${cov.pageRatio !== undefined ? ` (${(cov.pageRatio * 100).toFixed(1)}% evaluated)` : ''}`);
+  lines.push(`  Interactions: ${cov.interactionsEvaluated || 0} of ${cov.interactionsDiscovered || 0} discovered${cov.interactionRatio !== undefined ? ` (${(cov.interactionRatio * 100).toFixed(1)}% evaluated)` : ''}`);
+  lines.push(`  Expectations: ${cov.expectationsEvaluated || 0} of ${cov.expectationsDiscovered || 0} discovered${cov.expectationRatio !== undefined ? ` (${(cov.expectationRatio * 100).toFixed(1)}% evaluated)` : ''}`);
+  // Gaps explicitly reported (always shown, even if zero)
+  const gaps = observationSummary.gaps || {};
+  lines.push('');
+  lines.push('EVALUATION GAPS (NOT evaluated - observations incomplete for these items):');
+  lines.push(`  Pages: ${gaps.pages || 0} not evaluated`);
+  lines.push(`  Interactions: ${gaps.interactions || 0} not evaluated`);
+  lines.push(`  Expectations: ${gaps.expectations || 0} not evaluated`);
+  if (gaps.unprovenResults > 0) {
+    lines.push(`  Interactions without PROVEN expectations: ${gaps.unprovenResults}`);
+  }
+  if (gaps.details && gaps.details.length > 0) {
+    lines.push('  Gap reasons:');
+    for (const gap of gaps.details.slice(0, 5)) {
+      lines.push(`    - ${gap.message}`);
+    }
+  } else if (gaps.total === 0) {
+    lines.push('  (No gaps reported - all discovered items were evaluated)');
+  }
+  // SILENCE TRACKING: Explicitly show all silences (timeouts, skips, sensor failures, caps)
+  // PHASE 4: Include lifecycle information (type, status, promise association, confidence impact)
+  const silences = observationSummary.silences;
+  if (silences && silences.totalSilences > 0) {
+    const silenceSummary = silences.summary;
+    lines.push('');
+    lines.push('UNKNOWNS (Silences - things attempted but outcome unknown):');
+    lines.push(`  Total silence events: ${silences.totalSilences}`);
+    // PHASE 2: Show outcomes in silence
+    if (silenceSummary && silenceSummary.byOutcome && Object.keys(silenceSummary.byOutcome).length > 0) {
+      lines.push('  By outcome classification:');
+      pushPositiveCounts(lines, Object.entries(silenceSummary.byOutcome));
+    }
+    // PHASE 4: Show silence lifecycle metrics (top five types only)
+    if (silenceSummary && silenceSummary.byType && Object.keys(silenceSummary.byType).length > 0) {
+      lines.push('  By silence type:');
+      pushPositiveCounts(
+        lines,
+        topFiveCounts(silenceSummary.byType),
+        (type) => type.replace(/_/g, ' ').toLowerCase()
+      );
+    }
+    // PHASE 4: Show evaluation status distribution
+    if (silenceSummary && silenceSummary.byEvaluationStatus && Object.keys(silenceSummary.byEvaluationStatus).length > 0) {
+      lines.push('  By evaluation status:');
+      pushPositiveCounts(lines, Object.entries(silenceSummary.byEvaluationStatus));
+    }
+    // PHASE 4: Show promise association count
+    if (silenceSummary && silenceSummary.withPromiseAssociation) {
+      lines.push(`  Silences with promise association: ${silenceSummary.withPromiseAssociation}`);
+    }
+    // PHASE 4: Show confidence impact (only the non-zero components)
+    if (silenceSummary && silenceSummary.confidenceImpact) {
+      const impact = silenceSummary.confidenceImpact;
+      if (impact.coverage !== 0 || impact.promise_verification !== 0 || impact.overall !== 0) {
+        lines.push('  Confidence impact:');
+        if (impact.coverage !== 0) lines.push(`    - Coverage confidence: ${formatSignedPercent(impact.coverage)}`);
+        if (impact.promise_verification !== 0) lines.push(`    - Promise verification confidence: ${formatSignedPercent(impact.promise_verification)}`);
+        if (impact.overall !== 0) lines.push(`    - Overall confidence: ${formatSignedPercent(impact.overall)}`);
+      }
+    }
+    if (silences.byCategory) {
+      lines.push('  By category:');
+      pushPositiveCounts(lines, Object.entries(silences.byCategory));
+    }
+    if (silences.byReason) {
+      lines.push('  By reason:');
+      pushPositiveCounts(
+        lines,
+        topFiveCounts(silences.byReason),
+        (reason) => reason.replace(/_/g, ' ')
+      );
+    }
+  } else {
+    lines.push('');
+    lines.push('UNKNOWNS (Silences):');
+    lines.push('  No silence events recorded (all attempted actions completed)');
+  }
+  // PHASE 4: Show silence impact summary
+  const impactSummary = observationSummary.silenceImpactSummary;
+  if (impactSummary && impactSummary.total_silences > 0) {
+    lines.push('');
+    lines.push('SILENCE IMPACT ON CONFIDENCE:');
+    const impact = impactSummary.aggregated_impact;
+    if (impact) {
+      lines.push(`  Aggregated impact: ${impactSummary.confidence_interpretation}`);
+      lines.push(`  Coverage confidence: ${formatSignedPercent(impact.coverage)}`);
+      lines.push(`  Promise verification confidence: ${formatSignedPercent(impact.promise_verification)}`);
+      lines.push(`  Overall observation confidence: ${formatSignedPercent(impact.overall)}`);
+    }
+    if (impactSummary.by_severity && Object.values(impactSummary.by_severity).some(v => v > 0)) {
+      lines.push('  Silences by severity:');
+      const sev = impactSummary.by_severity;
+      if (sev.critical > 0) lines.push(`    - CRITICAL: ${sev.critical} events`);
+      if (sev.high > 0) lines.push(`    - HIGH: ${sev.high} events`);
+      if (sev.medium > 0) lines.push(`    - MEDIUM: ${sev.medium} events`);
+      if (sev.low > 0) lines.push(`    - LOW: ${sev.low} events`);
+    }
+    if (impactSummary.most_impactful_types && impactSummary.most_impactful_types.length > 0) {
+      lines.push('  Most impactful silence types:');
+      for (const impactType of impactSummary.most_impactful_types.slice(0, 3)) {
+        lines.push(`    - ${impactType.type.replace(/_/g, ' ')}: ${impactType.count} events, avg impact ${impactType.average_impact}%`);
+      }
+    }
+  }
+  if (obs.discrepanciesObserved > 0 && obs.findings && obs.findings.length > 0) {
+    lines.push('');
+    lines.push('DISCREPANCIES OBSERVED (sample):');
+    for (const finding of obs.findings.slice(0, 3)) {
+      const outcome = finding.outcome ? ` [${finding.outcome}]` : '';
+      // A promise object may lack a string type; omit the label rather than throw
+      const promiseType = finding.promise?.type;
+      const promiseInfo = typeof promiseType === 'string' ? ` (${promiseType.replace(/_PROMISE$/, '')})` : '';
+      const userStmt = finding.what_happened ? `User: ${finding.what_happened}` : '';
+      lines.push(`  • ${finding.type}${outcome}${promiseInfo}`);
+      if (userStmt) lines.push(`    ${userStmt}`);
+      if (finding.what_was_expected) lines.push(`    Expected: ${finding.what_was_expected}`);
+      if (finding.what_was_observed) lines.push(`    Observed: ${finding.what_was_observed}`);
+      if (finding.promise?.expected_signal) lines.push(`    Promise signal: ${finding.promise.expected_signal}`);
+    }
+  }
+  lines.push('');
+  lines.push('═══════════════════════════════════════');
+  lines.push('');
+  return lines.join('\n');
+}
+// Build evidence index from traces array.
+//
+// PHASE 3: EVIDENCE INTEGRITY
+// - Validates that evidence files actually exist
+// - Missing evidence files are tracked as silence
+// - Only includes verifiable evidence in index
+//
+// Maps expectations and interactions to evidence (screenshots, trace files).
+//
+// buildEvidenceIndex moved to evidence-index.js - imported above
+/**
+ * PHASE 4: Associate silences with promises where applicable
+ *
+ * RULE: A silence can only be associated with a promise if we can infer what promise
+ * the user was attempting to verify when the silence occurred.
+ *
+ * Conservative approach:
+ * - Navigation timeouts → NAVIGATION_PROMISE
+ * - Interaction timeouts → infer from interaction type
+ * - Safety blocks → related promise
+ * - Budget/discovery failures → no promise (unevaluated)
+ *
+ * @param {Object} silence - SilenceEntry; `silence_type`, `reason` and `context` are read
+ * @returns {Object|null} Promise object with type/expected_signal, an object with
+ *   `type: null` and `reason_no_association` when no promise applies, or null if nothing
+ *   can be inferred
+ */
+export function inferPromiseForSilence(silence) {
+  if (!silence) return null;
+  const { silence_type, reason, context } = silence;
+  // Only string reasons are searched, so a non-string reason cannot throw here
+  const mentionsNavigation = typeof reason === 'string' && reason.includes('navigation');
+  // Navigation-related silences
+  if (silence_type === SILENCE_TYPES.NAVIGATION_TIMEOUT ||
+      silence_type === SILENCE_TYPES.PROMISE_VERIFICATION_BLOCKED ||
+      mentionsNavigation) {
+    return {
+      type: 'NAVIGATION_PROMISE',
+      expected_signal: 'URL change or navigation settled',
+      reason_no_association: null
+    };
+  }
+  // Interaction-related silences
+  if (silence_type === SILENCE_TYPES.INTERACTION_TIMEOUT) {
+    // Try to infer from context if available
+    if (context && context.interaction) {
+      return inferPromiseFromInteraction(context.interaction);
+    }
+    return {
+      type: 'FEEDBACK_PROMISE',
+      expected_signal: 'User feedback or interaction acknowledgment',
+      reason_no_association: 'Interaction type unknown in context'
+    };
+  }
+  // Safety blocks - the promise being blocked
+  if (silence_type === SILENCE_TYPES.SAFETY_POLICY_BLOCK) {
+    if (context && context.interaction) {
+      const inferred = inferPromiseFromInteraction(context.interaction);
+      // Copy the inferred promise and flag that a safety policy prevented evaluation
+      return {
+        ...inferred,
+        blocked_by_safety: true
+      };
+    }
+    return null; // Cannot infer without interaction context
+  }
+  // Discovery/sensor failures - no promise can be evaluated
+  if (silence_type === SILENCE_TYPES.DISCOVERY_FAILURE ||
+      silence_type === SILENCE_TYPES.SENSOR_FAILURE) {
+    return {
+      type: null,
+      reason_no_association: 'Observation infrastructure failure - no promise evaluatable'
+    };
+  }
+  // Budget/incremental/ambiguous - no promise
+  if (silence_type === SILENCE_TYPES.BUDGET_LIMIT_EXCEEDED ||
+      silence_type === SILENCE_TYPES.INCREMENTAL_REUSE ||
+      silence_type === SILENCE_TYPES.PROMISE_NOT_EVALUATED) {
+    return {
+      type: null,
+      reason_no_association: 'Promise not yet evaluated'
+    };
+  }
+  // Conservative default: no association
+  return null;
+}
+/**
+ * Validate that a silence event makes forensic sense
+ * RULE: Silence can NEVER appear as success. It is always a gap in observation.
+ *
+ * Checks, in order: the entry exists, its outcome is not success-like, its scope is one
+ * of the known scopes, and its evaluation_status is one of the EVALUATION_STATUS values.
+ *
+ * @param {Object} silence - SilenceEntry
+ * @returns {Object} Validation result: { valid: boolean, reason: string|null }
+ */
+export function validateSilenceIntegrity(silence) {
+  if (!silence) {
+    return { valid: false, reason: 'Silence entry is null/undefined' };
+  }
+  // Silence can NEVER carry a "success" outcome.
+  // NOTE(review): the previous comment also named INFORMATIONAL, but it is not in this
+  // list - confirm whether it should be prohibited as well.
+  const prohibitedOutcomes = ['SUCCESS', 'PASS', 'VERIFIED', 'CONFIRMED'];
+  // Only string outcomes are normalized; a non-string outcome cannot match and must not throw
+  const normalizedOutcome = typeof silence.outcome === 'string' ? silence.outcome.toUpperCase() : undefined;
+  if (prohibitedOutcomes.includes(normalizedOutcome)) {
+    return {
+      valid: false,
+      reason: `Silence cannot have outcome "${silence.outcome}" - silence is always a gap`
+    };
+  }
+  // Silence must have a valid scope
+  const validScopes = ['page', 'interaction', 'expectation', 'sensor', 'navigation', 'settle'];
+  if (!silence.scope || !validScopes.includes(silence.scope)) {
+    return { valid: false, reason: `Invalid scope: "${silence.scope}"` };
+  }
+  // Must have evaluation_status (Phase 4)
+  const validStatuses = Object.values(EVALUATION_STATUS);
+  if (!silence.evaluation_status || !validStatuses.includes(silence.evaluation_status)) {
+    return {
+      valid: false,
+      reason: `Invalid evaluation_status: "${silence.evaluation_status}". Must be one of: ${validStatuses.join(', ')}`
+    };
+  }
+  return { valid: true, reason: null };
+}
+/**
+ * Bound a ratio to the range [0, 1] and round it to four decimal places.
+ */
+function clampRatio(ratio) {
+  const SCALE = 10000; // 4 decimal places
+  const bounded = Math.min(1, Math.max(0, ratio));
+  return Math.round(bounded * SCALE) / SCALE;
+}
+// writeEvidenceIndex moved to evidence-index.js - re-exported below
+export { buildEvidenceIndex, writeEvidenceIndex } from './evidence-index.js';

package/src/verax/evidence-index-writer.js ADDED Viewed

@@ -0,0 +1,61 @@
+import { resolve, dirname } from 'path';
+import { mkdirSync, writeFileSync } from 'fs';
+/**
+ * Resolve an evidence screenshot path against the parent directory of screenshotsDir.
+ * Returns null when either argument is falsy.
+ */
+function resolveScreenshotPath(screenshotsDir, relativePath) {
+  const hasBoth = Boolean(relativePath) && Boolean(screenshotsDir);
+  return hasBoth ? resolve(dirname(screenshotsDir), relativePath) : null;
+}
+/**
+ * Pick the evidence entry for a finding.
+ *
+ * Lookup order: matching expectationId, then matching interaction selector, then the
+ * first entry of the index. Returns null when the index is not an array or is empty.
+ * NOTE(review): the final fallback returns the first entry even when nothing matched.
+ */
+function findEvidenceForFinding(finding, evidenceIndex) {
+  if (!Array.isArray(evidenceIndex)) {
+    return null;
+  }
+  const wantedExpectation = finding.expectationId;
+  const expectationHit = wantedExpectation
+    ? evidenceIndex.find((entry) => entry.expectationId === wantedExpectation)
+    : undefined;
+  if (expectationHit) {
+    return expectationHit;
+  }
+  const wantedSelector = finding.interaction?.selector;
+  const selectorHit = wantedSelector
+    ? evidenceIndex.find((entry) => entry.interaction?.selector === wantedSelector)
+    : undefined;
+  return selectorHit || evidenceIndex[0] || null;
+}
+/**
+ * Build one evidence entry per distinct finding id.
+ *
+ * The id is taken from finding.findingId, then finding.id, then `finding-<index>`.
+ * Findings whose id was already emitted are skipped. Screenshot paths are resolved
+ * through resolveScreenshotPath; traceFile is tracesPath or null.
+ */
+function buildEvidenceEntries(findings, evidenceIndex, tracesPath, screenshotsDir) {
+  const emittedIds = new Set();
+  return (findings || []).reduce((collected, finding, position) => {
+    const matched = findEvidenceForFinding(finding, evidenceIndex);
+    const findingId = finding.findingId || finding.id || `finding-${position}`;
+    if (emittedIds.has(findingId)) {
+      return collected;
+    }
+    emittedIds.add(findingId);
+    const beforeShot = matched?.evidence?.beforeScreenshot || null;
+    const afterShot = matched?.evidence?.afterScreenshot || null;
+    collected.push({
+      findingId,
+      findingType: finding.type || 'finding',
+      expectationId: finding.expectationId || null,
+      interactionSelector: finding.interaction?.selector || null,
+      evidenceId: matched?.id || null,
+      paths: {
+        beforeScreenshot: resolveScreenshotPath(screenshotsDir, beforeShot),
+        afterScreenshot: resolveScreenshotPath(screenshotsDir, afterShot),
+        traceFile: tracesPath || null,
+        networkTrace: null
+      }
+    });
+    return collected;
+  }, []);
+}
+/**
+ * Write `<projectDir>/artifacts/evidence-index.json` for the given findings.
+ *
+ * Creates the artifacts directory if needed, builds the entries from the findings and
+ * verdict.evidenceIndex (or an empty list), and writes them as pretty-printed JSON
+ * followed by a newline.
+ *
+ * @returns {Object} { evidenceIndexPath, items }
+ */
+export function writeEvidenceIndex(projectDir, findings, verdict, tracesPath, screenshotsDir) {
+  const artifactsDir = resolve(projectDir, 'artifacts');
+  mkdirSync(artifactsDir, { recursive: true });
+  const sourceIndex = verdict?.evidenceIndex || [];
+  const items = buildEvidenceEntries(findings, sourceIndex, tracesPath, screenshotsDir);
+  const evidenceIndexPath = resolve(artifactsDir, 'evidence-index.json');
+  const serialized = JSON.stringify({ version: 1, tracesPath, items }, null, 2);
+  writeFileSync(evidenceIndexPath, serialized + '\n');
+  return { evidenceIndexPath, items };
+}