npm - nemoris - Versions diffs - 0.1.0 → 0.1.2 - Mend

nemoris 0.1.0 → 0.1.2

This diff compares the contents of two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (248)

package/.env.example +49 -49
package/LICENSE +21 -21
package/README.md +209 -209
package/SECURITY.md +59 -119
package/bin/nemoris +46 -46
package/config/agents/agent.toml.example +28 -28
package/config/agents/content.toml +23 -0
package/config/agents/default.toml +22 -22
package/config/agents/heartbeat.toml +35 -0
package/config/agents/iris.toml +23 -0
package/config/agents/lab.toml +23 -0
package/config/agents/main.toml +45 -0
package/config/agents/nemo.toml +21 -0
package/config/agents/ops.toml +38 -0
package/config/agents/orchestrator.toml +18 -18
package/config/agents/revenue.toml +23 -0
package/config/agents/testyboo.toml +19 -0
package/config/delivery.toml +73 -73
package/config/embeddings.toml +5 -5
package/config/identity/content-purpose.md +11 -0
package/config/identity/content-soul.md +45 -0
package/config/identity/default-purpose.md +1 -1
package/config/identity/default-soul.md +3 -3
package/config/identity/heartbeat-purpose.md +9 -0
package/config/identity/heartbeat-soul.md +16 -0
package/config/identity/iris-purpose.md +17 -0
package/config/identity/iris-soul.md +68 -0
package/config/identity/lab-purpose.md +10 -0
package/config/identity/lab-soul.md +38 -0
package/config/identity/main-purpose.md +17 -0
package/config/identity/main-soul.md +66 -0
package/config/identity/main-user.md +22 -0
package/config/identity/ops-purpose.md +9 -0
package/config/identity/ops-soul.md +16 -0
package/config/identity/orchestrator-purpose.md +1 -1
package/config/identity/orchestrator-soul.md +1 -1
package/config/identity/revenue-purpose.md +9 -0
package/config/identity/revenue-soul.md +41 -0
package/config/identity/testyboo-purpose.md +13 -0
package/config/identity/testyboo-soul.md +20 -0
package/config/improvement-targets.toml +15 -15
package/config/jobs/heartbeat-check.toml +30 -30
package/config/jobs/memory-rollup.toml +46 -46
package/config/jobs/workspace-health.toml +63 -63
package/config/mcp.toml +16 -16
package/config/output-contracts.toml +17 -17
package/config/peers.toml +32 -32
package/config/peers.toml.example +32 -32
package/config/policies/memory-default.toml +10 -10
package/config/policies/memory-heartbeat.toml +5 -5
package/config/policies/memory-ops.toml +10 -10
package/config/policies/tools-heartbeat-minimal.toml +8 -8
package/config/policies/tools-interactive-safe.toml +8 -8
package/config/policies/tools-ops-bounded.toml +8 -8
package/config/policies/tools-orchestrator.toml +7 -7
package/config/providers/anthropic.toml +15 -15
package/config/providers/ollama.toml +5 -5
package/config/providers/openai-codex.toml +9 -9
package/config/providers/openrouter.toml +5 -5
package/config/router.toml +22 -22
package/config/runtime.toml +114 -114
package/config/skills/self-improvement.toml +15 -15
package/config/skills/telegram-onboarding-spec.md +240 -240
package/config/skills/workspace-monitor.toml +15 -15
package/config/task-router.toml +42 -42
package/install.sh +50 -50
package/package.json +91 -90
package/src/auth/auth-profiles.js +169 -169
package/src/auth/openai-codex-oauth.js +285 -285
package/src/battle.js +449 -449
package/src/cli/help.js +265 -265
package/src/cli/output-filter.js +49 -49
package/src/cli/runtime-control.js +704 -704
package/src/cli-main.js +2763 -2763
package/src/cli.js +78 -78
package/src/config/loader.js +332 -332
package/src/config/schema-validator.js +214 -214
package/src/config/toml-lite.js +8 -8
package/src/daemon/action-handlers.js +71 -71
package/src/daemon/healing-tick.js +87 -87
package/src/daemon/health-probes.js +90 -90
package/src/daemon/notifier.js +57 -57
package/src/daemon/nurse.js +218 -218
package/src/daemon/repair-log.js +106 -106
package/src/daemon/rule-staging.js +90 -90
package/src/daemon/rules.js +29 -29
package/src/daemon/telegram-commands.js +54 -54
package/src/daemon/updater.js +85 -85
package/src/jobs/job-runner.js +78 -78
package/src/mcp/consumer.js +129 -129
package/src/memory/active-recall.js +171 -171
package/src/memory/backend-manager.js +97 -97
package/src/memory/backends/file-backend.js +38 -38
package/src/memory/backends/qmd-backend.js +219 -219
package/src/memory/embedding-guards.js +24 -24
package/src/memory/embedding-index.js +118 -118
package/src/memory/embedding-service.js +179 -179
package/src/memory/file-index.js +177 -177
package/src/memory/memory-signature.js +5 -5
package/src/memory/memory-store.js +648 -648
package/src/memory/retrieval-planner.js +66 -66
package/src/memory/scoring.js +145 -145
package/src/memory/simhash.js +78 -78
package/src/memory/sqlite-active-store.js +824 -824
package/src/memory/write-policy.js +36 -36
package/src/onboarding/aliases.js +33 -33
package/src/onboarding/auth/api-key.js +224 -224
package/src/onboarding/auth/ollama-detect.js +42 -42
package/src/onboarding/clack-prompter.js +77 -77
package/src/onboarding/doctor.js +530 -530
package/src/onboarding/lock.js +42 -42
package/src/onboarding/model-catalog.js +344 -344
package/src/onboarding/phases/auth.js +576 -589
package/src/onboarding/phases/build.js +130 -130
package/src/onboarding/phases/choose.js +82 -82
package/src/onboarding/phases/detect.js +98 -98
package/src/onboarding/phases/hatch.js +216 -216
package/src/onboarding/phases/identity.js +79 -79
package/src/onboarding/phases/ollama.js +345 -345
package/src/onboarding/phases/scaffold.js +99 -99
package/src/onboarding/phases/telegram.js +377 -377
package/src/onboarding/phases/validate.js +204 -204
package/src/onboarding/phases/verify.js +206 -206
package/src/onboarding/platform.js +482 -482
package/src/onboarding/status-bar.js +95 -95
package/src/onboarding/templates.js +794 -794
package/src/onboarding/toml-writer.js +38 -38
package/src/onboarding/tui.js +250 -250
package/src/onboarding/uninstall.js +153 -153
package/src/onboarding/wizard.js +516 -499
package/src/providers/anthropic.js +168 -168
package/src/providers/base.js +247 -247
package/src/providers/circuit-breaker.js +136 -136
package/src/providers/ollama.js +163 -163
package/src/providers/openai-codex.js +149 -149
package/src/providers/openrouter.js +136 -136
package/src/providers/registry.js +36 -36
package/src/providers/router.js +16 -16
package/src/runtime/bootstrap-cache.js +47 -47
package/src/runtime/capabilities-prompt.js +25 -25
package/src/runtime/completion-ping.js +99 -99
package/src/runtime/config-validator.js +121 -121
package/src/runtime/context-ledger.js +360 -360
package/src/runtime/cutover-readiness.js +42 -42
package/src/runtime/daemon.js +729 -729
package/src/runtime/delivery-ack.js +195 -195
package/src/runtime/delivery-adapters/local-file.js +41 -41
package/src/runtime/delivery-adapters/openclaw-cli.js +94 -94
package/src/runtime/delivery-adapters/openclaw-peer.js +98 -98
package/src/runtime/delivery-adapters/shadow.js +13 -13
package/src/runtime/delivery-adapters/standalone-http.js +98 -98
package/src/runtime/delivery-adapters/telegram.js +104 -104
package/src/runtime/delivery-adapters/tui.js +128 -128
package/src/runtime/delivery-manager.js +807 -807
package/src/runtime/delivery-store.js +168 -168
package/src/runtime/dependency-health.js +118 -118
package/src/runtime/envelope.js +114 -114
package/src/runtime/evaluation.js +1089 -1089
package/src/runtime/exec-approvals.js +216 -216
package/src/runtime/executor.js +500 -500
package/src/runtime/failure-ping.js +67 -67
package/src/runtime/flows.js +83 -83
package/src/runtime/guards.js +45 -45
package/src/runtime/handoff.js +51 -51
package/src/runtime/identity-cache.js +28 -28
package/src/runtime/improvement-engine.js +109 -109
package/src/runtime/improvement-harness.js +581 -581
package/src/runtime/input-sanitiser.js +72 -72
package/src/runtime/interaction-contract.js +347 -347
package/src/runtime/lane-readiness.js +226 -226
package/src/runtime/migration.js +323 -323
package/src/runtime/model-resolution.js +78 -78
package/src/runtime/network.js +64 -64
package/src/runtime/notification-store.js +97 -97
package/src/runtime/notifier.js +256 -256
package/src/runtime/orchestrator.js +53 -53
package/src/runtime/orphan-reaper.js +41 -41
package/src/runtime/output-contract-schema.js +139 -139
package/src/runtime/output-contract-validator.js +439 -439
package/src/runtime/peer-readiness.js +69 -69
package/src/runtime/peer-registry.js +133 -133
package/src/runtime/pilot-status.js +108 -108
package/src/runtime/prompt-builder.js +261 -261
package/src/runtime/provider-attempt.js +582 -582
package/src/runtime/report-fallback.js +71 -71
package/src/runtime/result-normalizer.js +183 -183
package/src/runtime/retention.js +74 -74
package/src/runtime/review.js +244 -244
package/src/runtime/route-job.js +15 -15
package/src/runtime/run-store.js +38 -38
package/src/runtime/schedule.js +88 -88
package/src/runtime/scheduler-state.js +434 -434
package/src/runtime/scheduler.js +656 -656
package/src/runtime/session-compactor.js +182 -182
package/src/runtime/session-search.js +155 -155
package/src/runtime/slack-inbound.js +249 -249
package/src/runtime/ssrf.js +102 -102
package/src/runtime/status-aggregator.js +330 -330
package/src/runtime/task-contract.js +140 -140
package/src/runtime/task-packet.js +107 -107
package/src/runtime/task-router.js +140 -140
package/src/runtime/telegram-inbound.js +1565 -1565
package/src/runtime/token-counter.js +134 -134
package/src/runtime/token-estimator.js +59 -59
package/src/runtime/tool-loop.js +200 -200
package/src/runtime/transport-server.js +311 -311
package/src/runtime/tui-server.js +411 -411
package/src/runtime/ulid.js +44 -44
package/src/security/ssrf-check.js +197 -197
package/src/setup.js +369 -369
package/src/shadow/bridge.js +303 -303
package/src/skills/loader.js +84 -84
package/src/tools/catalog.json +49 -49
package/src/tools/cli-delegate.js +44 -44
package/src/tools/mcp-client.js +106 -106
package/src/tools/micro/cancel-task.js +6 -6
package/src/tools/micro/complete-task.js +6 -6
package/src/tools/micro/fail-task.js +6 -6
package/src/tools/micro/http-fetch.js +74 -74
package/src/tools/micro/index.js +36 -36
package/src/tools/micro/lcm-recall.js +60 -60
package/src/tools/micro/list-dir.js +17 -17
package/src/tools/micro/list-skills.js +46 -46
package/src/tools/micro/load-skill.js +38 -38
package/src/tools/micro/memory-search.js +45 -45
package/src/tools/micro/read-file.js +11 -11
package/src/tools/micro/session-search.js +54 -54
package/src/tools/micro/shell-exec.js +43 -43
package/src/tools/micro/trigger-job.js +79 -79
package/src/tools/micro/web-search.js +58 -58
package/src/tools/micro/workspace-paths.js +39 -39
package/src/tools/micro/write-file.js +14 -14
package/src/tools/micro/write-memory.js +41 -41
package/src/tools/registry.js +348 -348
package/src/tools/tool-result-contract.js +36 -36
package/src/tui/chat.js +835 -835
package/src/tui/renderer.js +175 -175
package/src/tui/socket-client.js +217 -217
package/src/utils/canonical-json.js +29 -29
package/src/utils/compaction.js +30 -30
package/src/utils/env-loader.js +5 -5
package/src/utils/errors.js +80 -80
package/src/utils/fs.js +101 -101
package/src/utils/ids.js +5 -5
package/src/utils/model-context-limits.js +30 -30
package/src/utils/token-budget.js +74 -74
package/src/utils/usage-cost.js +25 -25
package/src/utils/usage-metrics.js +14 -14

package/src/runtime/evaluation.js CHANGED

@@ -1,1089 +1,1089 @@
-import path from "node:path";
-import { RunReviewer } from "./review.js";
-import { Scheduler } from "./scheduler.js";
-import { RunStore } from "./run-store.js";
-import { NotificationStore } from "./notification-store.js";
-import { DeliveryStore } from "./delivery-store.js";
-import { validateOutputContract } from "./output-contract-validator.js";
-function groupBy(items, keyFn) {
-  const map = new Map();
-  for (const item of items) {
-    const key = keyFn(item);
-    if (!map.has(key)) map.set(key, []);
-    map.get(key).push(item);
-  }
-  return map;
-}
-function clamp(value, min = 0, max = 1) {
-  return Math.max(min, Math.min(max, value));
-}
-function average(values) {
-  if (values.length === 0) return null;
-  return values.reduce((sum, value) => sum + value, 0) / values.length;
-}
-function choosePrimaryV2Run(runs) {
-  if (!runs.length) return null;
-  return runs.find((run) => run.mode === "provider") || runs[0];
-}
-function pickBestLiveMatch(liveMatches) {
-  return liveMatches.find((match) => match.latestRun) || liveMatches[0] || null;
-}
-function normalizeText(value) {
-  return String(value || "")
-    .replace(/\s+/g, " ")
-    .trim();
-}
-function stripOuterFence(text) {
-  const raw = String(text || "").trim();
-  const fencedMatch = raw.match(/^```(?:json|markdown|md|text)?\s*([\s\S]*?)\s*```$/i);
-  return fencedMatch ? fencedMatch[1].trim() : raw;
-}
-function parseJsonCandidate(text) {
-  const candidate = stripOuterFence(text);
-  if (!(candidate.startsWith("{") && candidate.endsWith("}"))) {
-    return null;
-  }
-  try {
-    return JSON.parse(candidate);
-  } catch {
-    return null;
-  }
-}
-function titleCase(value) {
-  return String(value || "")
-    .replace(/[_-]+/g, " ")
-    .replace(/^#+\s*/, "")
-    .replace(/\b\w/g, (char) => char.toUpperCase())
-    .trim();
-}
-function normalizeInline(value) {
-  return normalizeText(value) || "None";
-}
-function normalizeSectionKey(value) {
-  return String(value || "")
-    .toLowerCase()
-    .replace(/^#+\s*/, "")
-    .replace(/[*:_-]+/g, " ")
-    .replace(/\s+/g, " ")
-    .trim();
-}
-function renderValue(value, { contract = null, summary = null } = {}) {
-  if (value == null) return "";
-  if (typeof value === "string") {
-    const parsed = parseJsonCandidate(value);
-    if (parsed && typeof parsed === "object") {
-      if (parsed.output !== undefined) {
-        return renderValue(parsed.output, {
-          contract,
-          summary: parsed.summary || summary
-        });
-      }
-      return renderValue(parsed, { contract, summary });
-    }
-    return stripOuterFence(value);
-  }
-  if (Array.isArray(value)) {
-    return value
-      .map((item) => renderValue(item, { contract, summary }))
-      .filter(Boolean)
-      .join("\n");
-  }
-  if (typeof value === "object") {
-    const entries = Object.entries(value);
-    const sectionOrder = contract?.requiredSections?.length
-      ? contract.requiredSections
-      : entries.map(([key]) => key);
-    const valueMap = new Map(entries.map(([key, entryValue]) => [normalizeSectionKey(key), entryValue]));
-    const sectionStyle = contract?.profile?.sectionStyle || (contract?.format === "structured_rollup" ? "headings" : "bullets");
-    const requireStatus = contract?.profile?.requireStatus ?? (contract?.format === "bulleted_briefing");
-    if (sectionStyle === "bullets") {
-      const lines = [];
-      if (requireStatus && summary) lines.push(`Status: ${normalizeInline(summary)}`);
-      for (const section of sectionOrder) {
-        lines.push(`- ${titleCase(section)}: ${normalizeInline(valueMap.get(normalizeSectionKey(section)))}`);
-      }
-      return lines.join("\n");
-    }
-    if (sectionStyle === "headings") {
-      const lines = [];
-      for (const section of sectionOrder) {
-        lines.push(`## ${titleCase(section)}`);
-        lines.push(`- ${normalizeInline(valueMap.get(normalizeSectionKey(section)))}`);
-        lines.push("");
-      }
-      return lines.join("\n").trim();
-    }
-    return entries
-      .map(([key, entryValue]) => `${titleCase(key)}: ${normalizeInline(entryValue)}`)
-      .join("\n");
-  }
-  return String(value);
-}
-function extractRunText(run, contract = null) {
-  if (!run) return "";
-  const summary = run?.result?.summary || run?.summary || "";
-  const value = run?.result?.output ?? run?.output ?? summary;
-  return renderValue(value, { contract, summary });
-}
-function extractLiveText(run) {
-  if (!run) return "";
-  return renderValue(run.summary || run.error || "");
-}
-function qualitySignals(text) {
-  const raw = String(text || "");
-  const normalized = normalizeText(text);
-  const lower = normalized.toLowerCase();
-  const findings = [];
-  let score = 1;
-  if (!normalized) {
-    findings.push("Output is empty.");
-    return { score: 0, findings };
-  }
-  if (normalized.length < 40) {
-    findings.push("Output is very short and may not carry enough signal.");
-    score -= 0.18;
-  }
-  if (/\[(title|link|summary|sub)\]/i.test(normalized)) {
-    findings.push("Output still contains placeholder text.");
-    score -= 0.4;
-  }
-  if (/i('| a)?m sorry|does not support|cannot complete|failed to/i.test(lower)) {
-    findings.push("Output contains apology or tool-failure language.");
-    score -= 0.28;
-  }
-  if (/```/.test(raw)) {
-    findings.push("Output is wrapped in a code block instead of a direct report.");
-    score -= 0.12;
-  }
-  if (/timed out|timeout/i.test(lower)) {
-    findings.push("Output references a timeout or stalled execution.");
-    score -= 0.35;
-  }
-  const repeatedLinePenalty = detectRepeatedLinePenalty(normalized);
-  if (repeatedLinePenalty > 0) {
-    findings.push("Output repeats nearly identical numbered lines.");
-    score -= repeatedLinePenalty;
-  }
-  return {
-    score: clamp(Number(score.toFixed(4))),
-    findings
-  };
-}
-function detectRepeatedLinePenalty(text) {
-  const lines = text
-    .split("\n")
-    .map((line) => line.trim())
-    .filter(Boolean)
-    .filter((line) => /^\d+\./.test(line));
-  if (lines.length < 3) return 0;
-  const normalized = lines.map((line) => line.replace(/^\d+\.\s*/, "").toLowerCase());
-  const unique = new Set(normalized);
-  const duplicateRatio = 1 - unique.size / normalized.length;
-  if (duplicateRatio < 0.5) return 0;
-  return Number((duplicateRatio * 0.25).toFixed(4));
-}
-function expandRelatedNotificationFiles(baseFiles, notifications) {
-  const related = new Set(baseFiles);
-  let changed = true;
-  while (changed) {
-    changed = false;
-    for (const item of notifications) {
-      if (!related.has(item.filePath)) continue;
-      for (const generated of item.generatedNotificationFiles || []) {
-        if (related.has(generated)) continue;
-        related.add(generated);
-        changed = true;
-      }
-    }
-  }
-  return related;
-}
-function evaluateLiveHistory(liveRuns) {
-  if (liveRuns.length === 0) {
-    return {
-      runCount: 0,
-      okCount: 0,
-      errorCount: 0,
-      skippedCount: 0,
-      failureRate: null,
-      avgDurationMs: null,
-      avgTotalTokens: null,
-      avgQualityScore: null,
-      findings: ["No recent live history available."]
-    };
-  }
-  const okCount = liveRuns.filter((run) => run.status === "ok").length;
-  const errorCount = liveRuns.filter((run) => run.status === "error").length;
-  const skippedCount = liveRuns.filter((run) => run.status === "skipped").length;
-  const failureRate = errorCount / liveRuns.length;
-  const durations = liveRuns.map((run) => run.durationMs).filter((value) => Number.isFinite(value));
-  const tokens = liveRuns.map((run) => run.usage?.total_tokens).filter((value) => Number.isFinite(value));
-  const qualityScores = liveRuns
-    .map((run) => qualitySignals(run.summary || run.error || "").score)
-    .filter((value) => Number.isFinite(value));
-  const findings = [];
-  if (failureRate >= 0.34) findings.push("Live cron lane is failing often.");
-  if (skippedCount > 0) findings.push("Live cron history includes intentional skips.");
-  if (tokens.some((value) => value > 12000)) findings.push("Live cron lane shows high token usage spikes.");
-  return {
-    runCount: liveRuns.length,
-    okCount,
-    errorCount,
-    skippedCount,
-    failureRate: Number(failureRate.toFixed(4)),
-    avgDurationMs: durations.length ? Math.round(average(durations)) : null,
-    avgTotalTokens: tokens.length ? Math.round(average(tokens)) : null,
-    avgQualityScore: qualityScores.length ? Number(average(qualityScores).toFixed(4)) : null,
-    findings
-  };
-}
-function scoreStatus(status) {
-  if (status === "ok") return 1;
-  if (status === "skipped") return 0.6;
-  if (status === "error") return 0;
-  return 0.5;
-}
-function buildRubric({ v2Run, liveHistory, matchedLiveJob, outputContract = null, contractCheck = null }) {
-  const findings = [];
-  const v2Text = extractRunText(v2Run, outputContract);
-  const v2Quality = qualitySignals(v2Text);
-  const latestLive = liveHistory[0] || null;
-  const latestLiveQuality = qualitySignals(extractLiveText(latestLive));
-  const history = evaluateLiveHistory(liveHistory);
-  const isDryRun = v2Run != null && v2Run.mode !== "provider";
-  const comparisonReadiness = v2Run
-    ? v2Run.mode === "provider"
-      ? 1
-      : 0.45
-    : 0;
-  const comparisonCoverage = matchedLiveJob ? 1 : 0.2;
-  const contractAdherence = contractCheck ? contractCheck.satisfiedRatio : null;
-  if (!v2Run) findings.push("No V2 run exists for this lane yet.");
-  else if (isDryRun) findings.push("Only a dry-run V2 artifact exists; output quality and contract adherence are excluded from the rubric score.");
-  if (!matchedLiveJob) findings.push("Comparison coverage is low because no live cron analogue is mapped.");
-  if (!isDryRun && v2Quality.findings.length) findings.push(...v2Quality.findings.map((item) => `V2: ${item}`));
-  if (latestLiveQuality.findings.length) findings.push(...latestLiveQuality.findings.map((item) => `Live: ${item}`));
-  if (history.findings.length) findings.push(...history.findings);
-  const fieldScores = contractCheck?.fieldScores || null;
-  if (!isDryRun && fieldScores) {
-    if (fieldScores.weakFields.length) {
-      findings.push(`Field-level quality is low for: ${fieldScores.weakFields.join(", ")}`);
-    }
-    if (fieldScores.placeholderFields.length) {
-      findings.push(`Placeholder text detected in: ${fieldScores.placeholderFields.join(", ")}`);
-    }
-  }
-  if (!matchedLiveJob) {
-    findings.push("No live cron analogue matched for this V2 job.");
-  }
-  const statusAlignment =
-    latestLive && v2Run
-      ? Number((scoreStatus(v2Run.result ? "ok" : v2Run.status) * scoreStatus(latestLive.status)).toFixed(4))
-      : null;
-  const liveReliability = history.failureRate == null ? null : Number((1 - history.failureRate).toFixed(4));
-  const fieldLevelQuality = !isDryRun && fieldScores ? fieldScores.averageScore : null;
-  const components = [
-    isDryRun ? null : v2Quality.score,
-    comparisonReadiness,
-    comparisonCoverage,
-    isDryRun ? null : contractAdherence,
-    fieldLevelQuality,
-    liveReliability,
-    statusAlignment
-  ].filter((value) => value != null);
-  const overallScore = components.length ? Number(average(components).toFixed(4)) : 0;
-  return {
-    overallScore,
-    dryRunExcluded: isDryRun,
-    components: {
-      v2OutputQuality: isDryRun ? null : v2Quality.score,
-      comparisonReadiness,
-      comparisonCoverage,
-      contractAdherence: isDryRun ? null : contractAdherence,
-      fieldLevelQuality,
-      liveReliability,
-      statusAlignment
-    },
-    findings: uniqueStrings(findings),
-    metrics: {
-      liveRunCount: history.runCount,
-      liveOkCount: history.okCount,
-      liveErrorCount: history.errorCount,
-      liveSkippedCount: history.skippedCount,
-      liveFailureRate: history.failureRate,
-      liveAvgDurationMs: history.avgDurationMs,
-      liveAvgTotalTokens: history.avgTotalTokens,
-      liveAvgQualityScore: history.avgQualityScore,
-      latestLiveQualityScore: latestLive ? latestLiveQuality.score : null
-    }
-  };
-}
-function uniqueStrings(items) {
-  return [...new Set(items.filter(Boolean))];
-}
-function summarizeV2Run(run) {
-  if (!run) return null;
-  return {
-    timestamp: run.timestamp,
-    mode: run.mode || null,
-    providerId: run.providerId || null,
-    modelId: run.modelId || null,
-    summary: run.result?.summary || run.summary || null,
-    output: run.result?.output || run.output || null,
-    retrievalMeta: run.retrievalMeta || null,
-    retrievedMemoryCount: run.retrievedMemory?.length || 0,
-    interaction: summarizeInteraction(run),
-    fallback: run.fallback || null
-  };
-}
-function summarizeInteraction(run) {
-  const interaction = run?.interaction || null;
-  if (!interaction) return null;
-  return {
-    ackRequired: interaction.ack?.required ?? false,
-    completionRequired: interaction.completion?.required ?? false,
-    handoffRequired: interaction.handoff?.required ?? false,
-    yielded: run?.yielded || false,
-    yieldSignal: run?.yieldSignal || null,
-    followUpState: run?.followUpState || null,
-    followUpQueued: run?.followUpQueued || false,
-    followUpConsumed: run?.followUpConsumed || false,
-    followUpTarget: run?.followUpTarget || null,
-    followUpCompleted: run?.followUpCompleted || false,
-    followUpExpired: run?.followUpExpired || false,
-    followUpEscalated: run?.followUpEscalated || false,
-    followUpEscalationFilePath: run?.followUpEscalationFilePath || null,
-    handoffTarget: interaction.handoff?.target || null,
-    suggestedPeerCount: interaction.handoff?.suggestions?.length || 0,
-    handoffChosenPeerId: run?.handoffChosenPeerId || null,
-    handoffChosenBy: run?.handoffChosenBy || null,
-    handoffDelivered: run?.handoffDelivered || false,
-    handoffDeliveryState: run?.handoffDeliveryState || null,
-    deliveryDeduped: run?.deliveryDeduped || false,
-    deliveryRetried: run?.deliveryRetried || false,
-    deliveryUncertain: run?.deliveryUncertain || false
-  };
-}
-function analyzeRetrieval(run) {
-  const retrievalMeta = run?.retrievalMeta || run?.plan?.packet?.layers?.retrievalMeta || null;
-  if (!run?.retrievedMemory?.length) {
-    return {
-      memoryCount: 0,
-      lexicalCount: 0,
-      semanticCount: 0,
-      qmdCount: 0,
-      freshEmbeddingCount: 0,
-      staleEmbeddingCount: 0,
-      missingEmbeddingCount: 0,
-      failedEmbeddingCount: retrievalMeta?.embeddingHealth?.failedCount || 0,
-      embeddingQueryMode: retrievalMeta?.embeddingQueryMode || "lexical_only",
-      embeddingError: retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError || null,
-      findings: ["No retrieved memory was captured for this run."],
-      items: []
-    };
-  }
-  const items = run.retrievedMemory.map((item) => ({
-    entryId: item.entryId || null,
-    title: item.title || null,
-    sourceBackend: item.sourceBackend || "file",
-    candidateSource: item.candidateSource || "indexed",
-    lexicalScore: item.lexicalScore ?? 0,
-    embeddingSimilarity: item.embeddingSimilarity ?? 0,
-    embeddingFreshness: item.embeddingFreshness || "missing",
-    retrievalSources: item.retrievalSources || []
-  }));
-  const lexicalCount = items.filter((item) => item.retrievalSources.includes("lexical")).length;
-  const semanticCount = items.filter((item) => item.retrievalSources.includes("semantic")).length;
-  const qmdCount = items.filter((item) => item.retrievalSources.includes("qmd") || item.sourceBackend === "qmd").length;
-  const freshEmbeddingCount = items.filter((item) => item.embeddingFreshness === "fresh").length;
-  const staleEmbeddingCount = items.filter((item) => item.embeddingFreshness === "stale").length;
-  const missingEmbeddingCount = items.filter((item) => item.embeddingFreshness === "missing").length;
-  const failedEmbeddingCount = items.filter((item) => item.embeddingFreshness === "failed").length;
-  const findings = [];
-  if (semanticCount === 0) findings.push("No semantic retrieval candidates reached the final packet.");
-  if (staleEmbeddingCount > 0) findings.push("Some retrieved items have stale embeddings.");
-  if (freshEmbeddingCount === 0 && missingEmbeddingCount > 0) findings.push("Retrieved file memory is falling back to non-embedded retrieval.");
-  if ((retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError) && !findings.includes("Embedding query failed and retrieval fell back to lexical mode.")) {
-    findings.push("Embedding query failed and retrieval fell back to lexical mode.");
-  }
-  return {
-    memoryCount: items.length,
-    lexicalCount,
-    semanticCount,
-    qmdCount,
-    freshEmbeddingCount,
-    staleEmbeddingCount,
-    missingEmbeddingCount,
-    failedEmbeddingCount,
-    embeddingQueryMode: retrievalMeta?.embeddingQueryMode || "lexical_only",
-    embeddingError: retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError || null,
-    embeddingHealth: retrievalMeta?.embeddingHealth || null,
-    findings,
-    items
-  };
-}
-function summarizeInteractionDiagnosis({
-  ackRequired,
-  ackQueued,
-  completionRequired,
-  completionQueued,
-  handoffRequired,
-  handoffQueued,
-  yielded,
-  followUpQueued,
-  followUpConsumed,
-  handoffDelivered,
-  deliveryEvidenceRequired,
-  deliveryEvidenceHealthy,
-  deliveryUncertain,
-  findings
-}) {
-  const missingStages = [];
-  if (ackRequired && !ackQueued) missingStages.push("ack");
-  if (completionRequired && !completionQueued && !yielded) missingStages.push("completion");
-  if (handoffRequired && !handoffQueued && !yielded) missingStages.push("handoff");
-  if (!findings?.length) {
-    return {
-      status: "healthy",
-      code: null,
-      summary: "Interaction lifecycle evidence is complete.",
-      missingStages,
-      findings: []
-    };
-  }
-  if (missingStages.length) {
-    return {
-      status: "action_required",
-      code: "missing_required_notifications",
-      summary: `Required interaction notifications are missing: ${missingStages.join(", ")}.`,
-      missingStages,
-      findings
-    };
-  }
-  if (yielded && followUpQueued && !followUpConsumed) {
-    return {
-      status: "action_required",
-      code: "follow_up_incomplete",
-      summary: "Yielded follow-up is still pending or incomplete.",
-      missingStages,
-      findings
-    };
-  }
-  if (deliveryEvidenceRequired && !deliveryEvidenceHealthy) {
-    return {
-      status: "action_required",
-      code: "missing_delivery_evidence",
-      summary: "Required pingback notifications do not have delivery receipts yet.",
-      missingStages,
-      findings
-    };
-  }
-  if (handoffRequired && handoffQueued && !handoffDelivered) {
-    return {
-      status: "action_required",
-      code: "handoff_incomplete",
-      summary: "Handoff was queued but not fully delivered.",
-      missingStages,
-      findings
-    };
-  }
-  if (deliveryUncertain) {
-    return {
-      status: "warning",
-      code: "delivery_uncertain",
-      summary: "Interaction lifecycle completed with uncertain delivery evidence.",
-      missingStages,
-      findings
-    };
-  }
-  return {
-    status: "warning",
-    code: "interaction_findings_present",
-    summary: findings[0] || "Interaction lifecycle has unresolved findings.",
-    missingStages,
-    findings
-  };
-}
/**
 * Reconstructs the interaction lifecycle of a run from its queued
 * notifications and the delivery receipts recorded for them.
 *
 * @param {object|null} run - Run artifact; only `run.interaction` is read.
 * @param {object[]} [notifications] - Notifications related to the run.
 * @param {object[]} [deliveries] - Delivery receipts for those notifications.
 * @returns {object} Stage flags, follow-up / handoff / delivery state, the
 *   ordered findings list, and the diagnosis returned by
 *   `summarizeInteractionDiagnosis`.
 */
function analyzeInteraction(run, notifications = [], deliveries = []) {
  const interaction = run?.interaction || null;
  const firstAtStage = (stage) => notifications.find((item) => item.stage === stage) || null;

  // What the run asked for.
  const ackRequired = interaction?.ack?.required ?? false;
  const completionRequired = interaction?.completion?.required ?? false;
  const handoffRequired = interaction?.handoff?.required ?? false;
  const yielded = interaction?.yield?.required ?? false;
  const yieldSignal = interaction?.yield?.signal || null;

  // What was actually queued.
  const followUpNotification = firstAtStage("follow_up");
  const handoffNotification = firstAtStage("handoff");
  const ackQueued = firstAtStage("ack") !== null;
  const completionQueued = firstAtStage("completion") !== null;
  const followUpQueued = followUpNotification !== null;
  const handoffQueued = handoffNotification !== null;

  // Handoff progress.
  const handoffPendingChoice = handoffNotification?.status === "awaiting_choice";
  const handoffState = handoffNotification?.handoffState || (handoffPendingChoice ? "pending" : null);
  const handoffChosenPeerId = handoffNotification?.chosenPeer?.peerId || null;
  const handoffChosen = Boolean(handoffChosenPeerId);
  const handoffChosenBy = handoffNotification?.chosenBy || null;
  let handoffDelivery = null;
  if (handoffNotification) {
    handoffDelivery =
      deliveries.find((item) => item.notificationFilePath === handoffNotification.filePath) || null;
  }
  const handoffDelivered = Boolean(handoffDelivery);
  const handoffDeliveryState = handoffDelivery?.delivery?.status || null;

  // Follow-up progress.
  const followUpState = followUpNotification?.followUpState || followUpNotification?.yieldState || null;
  const followUpConsumed = [
    followUpNotification?.status,
    followUpNotification?.yieldState,
    followUpNotification?.followUpState
  ].includes("consumed");
  const followUpTarget = followUpNotification?.targetSurface || interaction?.yield?.targetSurface || null;
  const generatedFiles = new Set(followUpNotification?.generatedNotificationFiles || []);
  const followUpCompleted = deliveries.some((item) => generatedFiles.has(item.notificationFilePath));
  const followUpExpired = followUpState === "expired";
  const followUpEscalated = followUpState === "escalated";

  // Delivery evidence.
  const deliveryStates = deliveries.map((item) => item.delivery?.status || item.stage || "unknown");
  const deliveryDeduped = deliveryStates.includes("duplicate_prevented");
  const deliveryRetried = deliveries.some((item) => Number(item.attempt) > 1);
  const deliveryUncertain = ["delivery_uncertain", "uncertain"].some((state) => deliveryStates.includes(state));
  const yieldedCompletionHandled = yielded && followUpQueued && Boolean(followUpNotification?.payload?.completion);
  const yieldedHandoffHandled = yielded && followUpQueued && Boolean(followUpNotification?.payload?.handoff);
  // For yielded runs, receipts for notifications generated by the follow-up are not counted.
  const visibleDeliveryCount = yielded
    ? deliveries.filter((item) => !generatedFiles.has(item.notificationFilePath)).length
    : deliveries.length;
  const deliveryEvidenceRequired = !yielded && Boolean(ackQueued || completionQueued || handoffQueued);
  const deliveryEvidenceHealthy = !deliveryEvidenceRequired || visibleDeliveryCount > 0;

  // Ordered [condition, message] table; the order fixes the order of the findings.
  const checks = [
    [ackRequired && !ackQueued, "Required ack notification was not queued."],
    [
      completionRequired && !completionQueued && !yieldedCompletionHandled,
      "Required completion notification was not queued."
    ],
    [handoffRequired && !handoffQueued && !yieldedHandoffHandled, "Configured handoff was not queued."],
    [yielded && !followUpQueued, "Run yielded but no follow-up payload was persisted."],
    [followUpQueued && !followUpConsumed, "Follow-up payload was persisted but never consumed."],
    [followUpExpired, "Follow-up expired before it was consumed."],
    [followUpEscalated, "Follow-up expired and was escalated to the operator."],
    [handoffPendingChoice, "Handoff is awaiting an explicit peer choice."],
    [handoffState === "expired", "Handoff expired without an operator choice."],
    [handoffState === "escalated", "Handoff expired and was escalated to the operator."],
    [
      handoffState === "blocked",
      `Handoff is blocked${handoffNotification?.blockedReason ? `: ${handoffNotification.blockedReason}` : "."}`
    ],
    [
      handoffQueued && !handoffPendingChoice && !handoffChosen,
      "Handoff was queued but no peer choice was recorded."
    ],
    [handoffChosen && !handoffDelivered, "Handoff was promoted to a peer but not delivered yet."],
    [
      handoffDeliveryState && /error|blocked/i.test(handoffDeliveryState),
      `Handoff delivery did not complete cleanly: ${handoffDeliveryState}.`
    ],
    [!deliveryEvidenceHealthy, "No delivery receipts exist yet for queued interaction notifications."],
    [deliveryDeduped, "A duplicate delivery attempt was prevented by dedupe policy."],
    [deliveryUncertain, "A delivery attempt was marked uncertain and will not be blindly retried."]
  ];
  const findings = checks.filter(([triggered]) => triggered).map(([, message]) => message);

  const diagnosis = summarizeInteractionDiagnosis({
    ackRequired,
    ackQueued,
    completionRequired,
    completionQueued,
    handoffRequired,
    handoffQueued,
    yielded,
    followUpQueued,
    followUpConsumed,
    handoffDelivered,
    deliveryEvidenceRequired,
    deliveryEvidenceHealthy,
    deliveryUncertain,
    findings
  });

  return {
    ackRequired,
    ackQueued,
    completionRequired,
    completionQueued,
    handoffRequired,
    handoffQueued,
    yielded,
    yieldSignal,
    followUpState,
    followUpQueued,
    followUpConsumed,
    followUpTarget,
    followUpCompleted,
    followUpExpired,
    followUpEscalated,
    followUpEscalationFilePath: followUpNotification?.escalationNotificationFilePath || null,
    handoffPendingChoice,
    handoffState,
    handoffExpired: handoffState === "expired",
    handoffEscalated: handoffState === "escalated",
    handoffBlocked: handoffState === "blocked",
    handoffChosen,
    handoffChosenPeerId,
    handoffChosenBy,
    handoffDelivered,
    handoffDeliveryState,
    handoffBlockedReason: handoffNotification?.blockedReason || null,
    deliveryEvidenceRequired,
    deliveryEvidenceHealthy,
    deliveryReceiptCount: visibleDeliveryCount,
    deliveryStates,
    deliveryDeduped,
    deliveryRetried,
    deliveryUncertain,
    diagnosis,
    findings
  };
}
/**
 * Projects a live cron run onto the fixed set of fields used in reports.
 *
 * @param {object|null} run - Live run record.
 * @returns {object|null} `null` when no run is given; otherwise the selected
 *   fields, with absent values replaced by `null`.
 */
function summarizeLiveRun(run) {
  if (!run) return null;
  const { ts, status, summary, error, durationMs, provider, model, usage } = run;
  return {
    ts: ts || null,
    status: status || null,
    summary: summary || null,
    error: error || null,
    // `??` keeps a legitimate duration of 0.
    durationMs: durationMs ?? null,
    provider: provider || null,
    model: model || null,
    usage: usage || null
  };
}
/** Keywords looked for in lower-cased output text when deriving section hints. */
const SECTION_HINTS = [
  "calendar", "weather", "projects", "project",
  "inbox", "issues", "backlog", "update",
  "summary", "next actions", "alerts", "status"
];

/** Singular section names mapped to the canonical plural key. */
const SECTION_ALIASES = new Map(
  Object.entries({
    project: "projects",
    "next action": "next actions"
  })
);
/**
 * Normalizes a section label and folds known aliases into their canonical key.
 *
 * @param {*} value - Raw section label.
 * @returns {string} The alias target when one is registered, else the normalized key.
 */
function canonicalSectionKey(value) {
  const key = normalizeSectionKey(value);
  const alias = SECTION_ALIASES.get(key);
  if (alias) return alias;
  return key;
}
/**
 * Collects the distinct section keys announced by heading-like lines, in
 * first-seen order.
 *
 * A line counts as heading-like when it is a markdown heading, a bold-only
 * line, a "- Label: text" bullet, or a short "Label: text" line.
 *
 * @param {string[]} nonEmptyLines - Trimmed, non-empty lines of an output.
 * @returns {string[]} Canonical section keys without duplicates.
 */
function extractSectionKeys(nonEmptyLines) {
  const headingShapes = [
    /^#{1,6}\s+(.+)$/,
    /^\*\*([^*]+)\*\*$/,
    /^[-*]\s+\**([^:*]+?)\**:\s+.+$/,
    /^([^:]{2,40}):\s+.+$/
  ];

  // First pattern (in priority order) that matches AND yields a key of 2+ characters.
  const firstUsableKey = (line) => {
    for (const shape of headingShapes) {
      const captured = line.match(shape);
      if (!captured) continue;
      const candidate = canonicalSectionKey(captured[1]);
      if (candidate && candidate.length >= 2) return candidate;
    }
    return null;
  };

  const ordered = [];
  const alreadyListed = new Set();
  nonEmptyLines.forEach((line) => {
    const key = firstUsableKey(line);
    if (key === null || alreadyListed.has(key)) return;
    alreadyListed.add(key);
    ordered.push(key);
  });
  return ordered;
}
/**
 * Chooses which section list of an analyzed output to compare on.
 *
 * @param {{sectionKeys: string[], sectionHints: string[]}} structure
 * @returns {string[]} The explicit section keys when any exist, else the keyword hints.
 */
function comparableSections(structure) {
  const { sectionKeys, sectionHints } = structure;
  if (sectionKeys.length) return sectionKeys;
  return sectionHints;
}
/**
 * Measures the structural shape of a text output: size, headings, lists, code
 * fences, section keys and keyword hints.
 *
 * @param {*} text - Output text; falsy values are treated as an empty string.
 * @returns {object} Counts and flags describing the text. `codeFenceCount` is
 *   the number of complete fence pairs, so a dangling, unclosed fence does not
 *   produce a fractional count.
 */
function analyzeOutputStructure(text) {
  const raw = String(text || "");
  const trimmed = raw.trim();
  const nonEmptyLines = raw
    .split("\n")
    .map((line) => line.trim())
    .filter(Boolean);
  const lower = trimmed.toLowerCase();
  const fenceMarkers = (raw.match(/```/g) || []).length;
  const countLines = (pattern) => nonEmptyLines.filter((line) => pattern.test(line)).length;
  return {
    charCount: trimmed.length,
    lineCount: nonEmptyLines.length,
    headingCount: nonEmptyLines.filter((line) => /^#{1,6}\s/.test(line) || /^\*\*[^*]+\*\*/.test(line)).length,
    bulletCount: countLines(/^[-*]\s/),
    numberedCount: countLines(/^\d+\.\s/),
    // Two markers make one fence; an odd trailing marker is an unclosed fence and is not counted.
    codeFenceCount: Math.floor(fenceMarkers / 2),
    sectionKeys: extractSectionKeys(nonEmptyLines),
    sectionHints: SECTION_HINTS.filter((hint) => lower.includes(hint)),
    hasMarkdownTable: /\|.+\|/.test(raw),
    hasEmoji: /\p{Extended_Pictographic}/u.test(raw)
  };
}
/**
 * Compares the structure of a V2 run's output with the latest live output.
 *
 * @param {object|null} v2Run - V2 run artifact.
 * @param {object|null} liveRun - Latest live run, if any.
 * @param {object|null} [contract] - Output contract forwarded to `extractRunText`.
 * @returns {{v2: object, live: object, alignment: object, findings: string[]}}
 *   Both structure analyses, their section/list/size deltas, and the findings.
 */
function buildOutputDiff(v2Run, liveRun, contract = null) {
  const liveText = extractLiveText(liveRun);
  const v2 = analyzeOutputStructure(extractRunText(v2Run, contract));
  const live = analyzeOutputStructure(liveText);

  const v2Sections = comparableSections(v2);
  const liveSections = comparableSections(live);
  const inV2 = new Set(v2Sections);
  const inLive = new Set(liveSections);
  const sharedSections = v2Sections.filter((section) => inLive.has(section));
  const missingFromV2 = liveSections.filter((section) => !inV2.has(section));
  const extraInV2 = v2Sections.filter((section) => !inLive.has(section));

  const v2ListItems = v2.bulletCount + v2.numberedCount;
  const liveListItems = live.bulletCount + live.numberedCount;

  const findings = [];
  if (liveText) {
    if (missingFromV2.length) {
      findings.push(`V2 is missing live sections: ${missingFromV2.join(", ")}.`);
    }
    if (v2ListItems < liveListItems) {
      findings.push("V2 output is less structured than the live report.");
    }
    // Length comparison only makes sense when both sides produced text.
    if (v2.charCount > 0 && live.charCount > 0) {
      const verbosityRatio = Number((v2.charCount / live.charCount).toFixed(4));
      if (verbosityRatio < 0.55) findings.push("V2 output is much shorter than the live report.");
      if (verbosityRatio > 1.8) findings.push("V2 output is much longer than the live report.");
    }
  } else {
    findings.push("No live output is available for structural comparison.");
  }

  const alignment = {
    sharedSections,
    missingFromV2,
    extraInV2,
    bulletDelta: v2ListItems - liveListItems,
    headingDelta: v2.headingCount - live.headingCount,
    charDelta: v2.charCount - live.charCount
  };
  return { v2, live, alignment, findings };
}
/**
 * Validates the V2 output and the live output against an output contract.
 *
 * @param {object|null} contract - Normalized output contract.
 * @param {object|null} v2Run - V2 run; its `result.output` (or `output`) is validated.
 * @param {object|null} liveRun - Live run; its `summary` (or `error`) is validated.
 * @returns {object|null} `null` when there is no contract; otherwise the
 *   contract fields plus missing/empty sections, parsed values, field scores
 *   and prefixed findings for both sides.
 */
function assessOutputContract(contract, v2Run, liveRun) {
  if (!contract) return null;
  const v2Validation = validateOutputContract(contract, v2Run?.result?.output ?? v2Run?.output ?? "");
  const liveValidation = validateOutputContract(contract, liveRun?.summary || liveRun?.error || "");
  // A validation result may come back without a `findings` list; treat that as "no findings"
  // instead of throwing on `.map`.
  const prefixed = (validation, label) => (validation?.findings ?? []).map((item) => `${label}: ${item}`);
  return {
    format: contract.format || null,
    requiredSections: contract.requiredSections || [],
    styleHints: contract.styleHints || [],
    satisfiedRatio: v2Validation?.satisfiedRatio ?? 0,
    missingFromV2: v2Validation?.missingSections || [],
    missingFromLive: liveValidation?.missingSections || [],
    emptyInV2: v2Validation?.emptySections || [],
    emptyInLive: liveValidation?.emptySections || [],
    parsedV2: v2Validation?.parsed || null,
    parsedLive: liveValidation?.parsed || null,
    fieldScores: v2Validation?.fieldScores || null,
    findings: [...prefixed(v2Validation, "V2"), ...prefixed(liveValidation, "Live")]
  };
}
-export { buildRubric };
/**
 * Builds evaluation reports that compare V2 job runs with their closest live
 * cron analogues, using reviews, scheduler comparisons, notifications and
 * delivery receipts stored under the state root.
 */
export class Evaluator {
  /**
   * @param {object} options
   * @param {string} options.projectRoot - Forwarded to the scheduler.
   * @param {string} options.liveRoot - Forwarded to the scheduler.
   * @param {string} options.stateRoot - Root of the `evaluations`,
   *   `notifications` and `deliveries` stores.
   */
  constructor({ projectRoot, liveRoot, stateRoot }) {
    this.liveRoot = liveRoot;
    this.stateRoot = stateRoot;
    this.reviewer = new RunReviewer({ stateRoot });
    this.scheduler = new Scheduler({ projectRoot, liveRoot, stateRoot });
    this.evalStore = new RunStore({ rootDir: path.join(stateRoot, "evaluations") });
    this.notificationStore = new NotificationStore({ rootDir: path.join(stateRoot, "notifications") });
    this.deliveryStore = new DeliveryStore({ rootDir: path.join(stateRoot, "deliveries") });
  }

  /**
   * Gathers every notification and delivery receipt that belongs to a run,
   * following notifications generated by other notifications.
   *
   * @param {object|null} run - Run whose `notificationFiles` seed the search.
   * @param {object|null} [review] - Review whose `recentNotifications` are reused before hitting the store.
   * @returns {Promise<{notificationFiles: Set<string>, notifications: object[], deliveries: object[]}>}
   */
  async resolveInteractionArtifacts(run, review = null) {
    const reviewNotifications = review?.recentNotifications || [];
    const baseFiles = run?.notificationFiles || [];
    const relatedNotificationFiles = expandRelatedNotificationFiles(baseFiles, reviewNotifications);
    const knownNotifications = reviewNotifications.filter((item) => relatedNotificationFiles.has(item.filePath));
    // Only load from the store what the review did not already provide.
    const knownFilePaths = new Set(knownNotifications.map((item) => item.filePath));
    const missingNotificationFiles = [...relatedNotificationFiles].filter(
      (filePath) => !knownFilePaths.has(filePath)
    );
    const loadedNotifications = await this.notificationStore.getNotifications(missingNotificationFiles);
    const notifications = [...knownNotifications, ...loadedNotifications].sort((a, b) =>
      String(a.timestamp || "").localeCompare(String(b.timestamp || ""))
    );
    // Expand again: freshly loaded notifications may reference further generated files.
    const expandedNotificationFiles = expandRelatedNotificationFiles(baseFiles, notifications);
    // Load all delivery receipts once for deterministic interaction evidence.
    const allDeliveries = await this.deliveryStore.listAll();
    const deliveries = allDeliveries.filter((item) => expandedNotificationFiles.has(item.notificationFilePath));
    return {
      notificationFiles: expandedNotificationFiles,
      notifications,
      deliveries
    };
  }

  /**
   * Evaluates every job that appears in the recent runs.
   *
   * @param {number} [limit=20] - Review window passed to the reviewer.
   * @returns {Promise<{jobs: object[], recentRuns: object[], scheduler: object[]}>}
   *   Job reports sorted by ascending overall rubric score.
   */
  async evaluate(limit = 20) {
    const [review, comparisons] = await Promise.all([
      this.reviewer.review(limit),
      this.scheduler.compareJobs()
    ]);
    const recentRuns = review.recentRuns.filter((run) => !run.jobId.endsWith("-comparison"));
    const grouped = groupBy(recentRuns, (run) => run.jobId);
    const jobs = await Promise.all(
      Array.from(grouped.entries()).map(async ([jobId, runs]) => this.evaluateJob(jobId, {
        runs,
        review,
        comparisons
      }))
    );
    return {
      jobs: [...jobs].sort((a, b) => a.rubric.overallScore - b.rubric.overallScore),
      recentRuns,
      scheduler: review.scheduler
    };
  }

  /**
   * Builds the full evaluation report for one job.
   *
   * @param {string} jobId - Job to evaluate.
   * @param {object} [options] - Optional pre-computed `runs`, `review`,
   *   `comparisons`, and a `limit` used when the review must be loaded.
   * @returns {Promise<object>} The job report (rubric, output diff, contract
   *   check, retrieval and interaction analysis, comparison notes).
   */
  async evaluateJob(jobId, options = {}) {
    const runtime = await this.scheduler.loadRuntime();
    const jobConfig = runtime.jobs[jobId] || null;
    const review = options.review || (await this.reviewer.review(options.limit ?? 20));
    const comparisons = options.comparisons || (await this.scheduler.compareJobs());
    const runs = options.runs || review.recentRuns.filter((run) => run.jobId === jobId && !run.jobId.endsWith("-comparison"));
    const schedulerState = review.scheduler.find((item) => item.jobId === jobId) || null;
    const comparison = comparisons.find((item) => item.v2JobId === jobId) || null;
    const liveMatches = await Promise.all(
      (comparison?.closestLiveJobs || []).map(async (match) => {
        // The two history reads are independent, so issue them together.
        const [recentRuns, latestRuns] = await Promise.all([
          this.scheduler.bridge.loadCronRunHistory(match.id, 5),
          this.scheduler.bridge.loadCronRunHistory(match.id, 1)
        ]);
        return {
          ...match,
          recentRuns,
          latestRun: latestRuns[0] || null
        };
      })
    );
    const selectedRun = choosePrimaryV2Run(runs);
    // Interaction evidence is taken from the first listed run, which may differ from the primary run.
    const interactionRun = runs[0] || selectedRun;
    const selectedLiveMatch = pickBestLiveMatch(liveMatches);
    const liveHistory = selectedLiveMatch?.recentRuns || [];
    const outputContract = normalizeOutputContract(jobConfig?.outputContract || null);
    const outputDiff = buildOutputDiff(selectedRun, selectedLiveMatch?.latestRun || null, outputContract);
    const contractCheck = assessOutputContract(outputContract, selectedRun, selectedLiveMatch?.latestRun || null);
    const retrieval = analyzeRetrieval(selectedRun);
    const interactionArtifacts = await this.resolveInteractionArtifacts(interactionRun, review);
    const interaction = analyzeInteraction(interactionRun, interactionArtifacts.notifications, interactionArtifacts.deliveries);
    const rubric = buildRubric({
      v2Run: selectedRun,
      liveHistory,
      matchedLiveJob: selectedLiveMatch,
      outputContract,
      contractCheck
    });
    return {
      jobId,
      schedulerState,
      maintenance: review?.maintenance || null,
      latestRun: runs[0] || null,
      primaryRun: summarizeV2Run(selectedRun),
      interactionRunTimestamp: interactionRun?.timestamp || null,
      runCount: runs.length,
      modeCounts: countModes(runs),
      liveMatches: liveMatches.map((match) => ({
        id: match.id,
        name: match.name,
        description: match.description || null,
        enabled: match.enabled,
        schedule: match.schedule,
        kind: match.kind || null,
        lastStatus: match.lastStatus || null,
        latestRun: summarizeLiveRun(match.latestRun)
      })),
      selectedLiveMatch: selectedLiveMatch
        ? {
            id: selectedLiveMatch.id,
            name: selectedLiveMatch.name,
            latestRun: summarizeLiveRun(selectedLiveMatch.latestRun)
          }
        : null,
      retrieval,
      interaction,
      outputContract,
      contractCheck,
      outputDiff,
      rubric,
      comparisonNotes: buildComparisonNotes({
        jobId,
        selectedRun,
        selectedLiveMatch,
        schedulerState,
        maintenance: review?.maintenance || null,
        rubric,
        outputDiff,
        contractCheck,
        retrieval,
        interaction
      }),
      interactionArtifacts: {
        notificationCount: interactionArtifacts.notifications.length,
        deliveryCount: interactionArtifacts.deliveries.length,
        notificationFileCount: interactionArtifacts.notificationFiles.size
      }
    };
  }

  /**
   * Evaluates a job and saves the report through the evaluation store.
   *
   * @param {string} jobId - Job to evaluate.
   * @param {object} [options] - Forwarded to `evaluateJob`.
   * @returns {Promise<object>} The persisted artifact plus its `filePath`.
   */
  async evaluateAndPersistJob(jobId, options = {}) {
    const report = await this.evaluateJob(jobId, options);
    const artifact = {
      timestamp: new Date().toISOString(),
      kind: "job-evaluation",
      ...report
    };
    const filePath = await this.evalStore.saveRun(jobId, artifact);
    return {
      filePath,
      ...artifact
    };
  }
}
/**
 * Tallies runs by their `mode`.
 *
 * @param {object[]} runs - Run artifacts.
 * @returns {Object<string, number>} Count per mode; runs without a mode are
 *   counted under "unknown".
 */
function countModes(runs) {
  const tally = {};
  runs.forEach((run) => {
    const mode = run.mode || "unknown";
    tally[mode] = (tally[mode] || 0) + 1;
  });
  return tally;
}
/**
 * Assembles the de-duplicated, human-readable notes for a job report.
 *
 * Notes describe scheduler health, report fallback, daemon maintenance and
 * the closest live cron match, followed by the findings of the rubric, output
 * diff, contract check, retrieval and interaction analyses. The same findings
 * are appended whether or not a live match exists, so retrieval findings are
 * no longer lost when no live analogue is mapped.
 *
 * @param {object} input
 * @param {string} input.jobId
 * @param {object|null} input.selectedRun
 * @param {object|null} input.selectedLiveMatch
 * @param {object|null} input.schedulerState
 * @param {object|null} input.maintenance
 * @param {object} input.rubric
 * @param {object} input.outputDiff
 * @param {object|null} input.contractCheck
 * @param {object|null} [input.retrieval]
 * @param {object|null} [input.interaction]
 * @returns {string[]} Unique notes in insertion order.
 */
function buildComparisonNotes({
  jobId,
  selectedRun,
  selectedLiveMatch,
  schedulerState,
  maintenance,
  rubric,
  outputDiff,
  contractCheck,
  retrieval = null,
  interaction = null
}) {
  const notes = [];
  if (!selectedRun) notes.push("No V2 runs recorded.");
  if (schedulerState?.lastStatus === "ok") notes.push("Latest V2 scheduler state is healthy.");
  if (selectedRun?.fallback?.attempted && selectedRun?.fallback?.success) {
    notes.push(
      `Run used report fallback from ${selectedRun.fallback.sourceLane || "local"} to ${selectedRun.fallback.finalSourceLane || "remote"} after ${selectedRun.fallback.trigger || "failure"}.`
    );
  } else if (selectedRun?.fallback?.attempted && !selectedRun?.fallback?.success) {
    notes.push(`Report fallback was attempted but did not succeed${selectedRun.fallback?.fallbackError ? `: ${selectedRun.fallback.fallbackError}` : "."}`);
  } else if (selectedRun?.fallback?.allowed === false && selectedRun?.fallback?.trigger) {
    notes.push(`Report fallback was blocked after ${selectedRun.fallback.trigger}${selectedRun.fallback?.blockedReason ? `: ${selectedRun.fallback.blockedReason}` : "."}`);
  }
  if (maintenance?.wal?.some((item) => item.action && item.action !== "none" && item.action !== "error")) {
    notes.push("Daemon maintenance recently performed WAL checkpoint work.");
  }
  if (maintenance?.handoffs?.expiredCount > 0) {
    notes.push(`Daemon maintenance expired or escalated ${maintenance.handoffs.expiredCount} pending handoff(s).`);
  }

  // For memory-rollup jobs that fully satisfy their contract, brevity/structure
  // differences against the live report are not reported.
  const allOutputDiffFindings = outputDiff?.findings || [];
  const outputDiffFindings =
    jobId === "memory-rollup" && Number(contractCheck?.satisfiedRatio || 0) >= 0.99
      ? allOutputDiffFindings.filter((item) => !/less structured|much shorter/i.test(item))
      : allOutputDiffFindings;
  const analysisFindings = [
    ...(rubric?.findings || []),
    ...outputDiffFindings,
    ...(contractCheck?.findings || []),
    ...(retrieval?.findings || []),
    ...(interaction?.findings || [])
  ];

  if (!selectedLiveMatch) {
    notes.push("No live cron analogue matched.");
    return uniqueStrings([...notes, ...analysisFindings]);
  }

  const latestLive = selectedLiveMatch.latestRun;
  notes.push(`Closest live cron match: ${selectedLiveMatch.name || selectedLiveMatch.id}.`);
  if (latestLive?.status) notes.push(`Latest live status: ${latestLive.status}.`);
  if (latestLive?.provider) notes.push(`Latest live provider: ${latestLive.provider}.`);
  if (latestLive?.durationMs != null) notes.push(`Latest live duration: ${latestLive.durationMs}ms.`);
  return uniqueStrings([...notes, ...analysisFindings]);
}
/**
 * Reduces a job's output contract to the fields the evaluator reads.
 *
 * @param {object|null} contract - Raw contract from the job configuration.
 * @returns {object|null} `null` when there is no contract; otherwise
 *   `format`, `requiredSections`, `styleHints` and `profile` with defaults.
 */
function normalizeOutputContract(contract) {
  if (!contract) return null;
  const { format, requiredSections, styleHints, profile } = contract;
  return {
    format: format || null,
    requiredSections: requiredSections || [],
    styleHints: styleHints || [],
    profile: profile || null
  };
}
+import path from "node:path";
+import { RunReviewer } from "./review.js";
+import { Scheduler } from "./scheduler.js";
+import { RunStore } from "./run-store.js";
+import { NotificationStore } from "./notification-store.js";
+import { DeliveryStore } from "./delivery-store.js";
+import { validateOutputContract } from "./output-contract-validator.js";
/**
 * Buckets items by a computed key, keeping first-seen key order.
 *
 * @param {Iterable<*>} items - Items to group.
 * @param {function(*): *} keyFn - Returns the bucket key for an item.
 * @returns {Map<*, Array>} Map from key to the items sharing that key.
 */
function groupBy(items, keyFn) {
  const buckets = new Map();
  for (const entry of items) {
    const bucketKey = keyFn(entry);
    const bucket = buckets.get(bucketKey);
    if (bucket) {
      bucket.push(entry);
    } else {
      buckets.set(bucketKey, [entry]);
    }
  }
  return buckets;
}
/**
 * Restricts a number to the closed range [min, max].
 *
 * @param {number} value - Number to restrict.
 * @param {number} [min=0] - Lower bound.
 * @param {number} [max=1] - Upper bound.
 * @returns {number} The bounded value.
 */
function clamp(value, min = 0, max = 1) {
  const cappedAbove = Math.min(max, value);
  return Math.max(min, cappedAbove);
}
/**
 * Arithmetic mean of a list of numbers.
 *
 * @param {number[]} values - Numbers to average.
 * @returns {number|null} The mean, or `null` for an empty list.
 */
function average(values) {
  const count = values.length;
  if (count === 0) return null;
  let total = 0;
  values.forEach((value) => {
    total += value;
  });
  return total / count;
}
/**
 * Picks the run to evaluate: the first provider-mode run if there is one,
 * otherwise the first run listed.
 *
 * @param {object[]} runs - Runs for one job.
 * @returns {object|null} The chosen run, or `null` when there are no runs.
 */
function choosePrimaryV2Run(runs) {
  if (runs.length === 0) return null;
  const providerRun = runs.find((run) => run.mode === "provider");
  return providerRun || runs[0];
}
/**
 * Picks the live job to compare against: the first match that has a latest
 * run, otherwise the first match.
 *
 * @param {object[]} liveMatches - Candidate live jobs.
 * @returns {object|null} The chosen match, or `null` when there are none.
 */
function pickBestLiveMatch(liveMatches) {
  const withLatestRun = liveMatches.find((match) => match.latestRun);
  if (withLatestRun) return withLatestRun;
  return liveMatches[0] || null;
}
/**
 * Collapses every whitespace run to a single space and trims the ends.
 *
 * @param {*} value - Text to normalize; falsy values become "".
 * @returns {string} Single-line text.
 */
function normalizeText(value) {
  const text = String(value || "");
  const singleSpaced = text.replace(/\s+/g, " ");
  return singleSpaced.trim();
}
/**
 * Removes a single code fence that wraps the whole text.
 *
 * @param {*} text - Text that may be wrapped in ``` ... ```, optionally
 *   tagged json, markdown, md or text.
 * @returns {string} The trimmed fence content, or the trimmed input when it
 *   is not wrapped.
 */
function stripOuterFence(text) {
  const trimmed = String(text || "").trim();
  const wrapped = /^```(?:json|markdown|md|text)?\s*([\s\S]*?)\s*```$/i.exec(trimmed);
  if (!wrapped) return trimmed;
  return wrapped[1].trim();
}
/**
 * Parses text as JSON when, after removing an outer fence, it is delimited
 * by braces.
 *
 * @param {*} text - Candidate text.
 * @returns {*} The parsed value, or `null` when the text is not
 *   brace-delimited or is not valid JSON.
 */
function parseJsonCandidate(text) {
  const candidate = stripOuterFence(text);
  const looksLikeObject = candidate.startsWith("{") && candidate.endsWith("}");
  if (!looksLikeObject) return null;
  let parsed = null;
  try {
    parsed = JSON.parse(candidate);
  } catch {
    // Brace-delimited but not valid JSON: treated as plain text by callers.
    parsed = null;
  }
  return parsed;
}
/**
 * Turns a section key into a display label: underscores and hyphens become
 * spaces, leading `#` markers are dropped, and the first letter of each word
 * is upper-cased.
 *
 * A letter that directly follows an in-word apostrophe is left alone, so
 * "what's next" becomes "What's Next" rather than "What'S Next".
 *
 * @param {*} value - Raw key or heading; falsy values become "".
 * @returns {string} The display label.
 */
function titleCase(value) {
  return String(value || "")
    .replace(/[_-]+/g, " ")
    .replace(/^#+\s*/, "")
    // Word start, unless the previous two characters are "<word char><apostrophe>".
    .replace(/\b(?<!\w['’])\w/g, (char) => char.toUpperCase())
    .trim();
}
/**
 * Renders a section value as a single line of text, using "None" when there
 * is nothing to show.
 *
 * Arrays are joined with ", ", plain objects are serialized as JSON instead of
 * "[object Object]", and `0` / `false` are kept as text instead of collapsing
 * to "None".
 *
 * @param {*} value - Section value (string, number, boolean, array, object, nullish).
 * @returns {string} Whitespace-normalized single-line text, or "None".
 */
function normalizeInline(value) {
  const toText = (item) => {
    if (item == null) return "";
    if (Array.isArray(item)) return item.map(toText).filter(Boolean).join(", ");
    if (typeof item === "object") {
      try {
        return JSON.stringify(item) ?? "";
      } catch {
        // Cyclic or otherwise unserializable value: fall back to the default string form.
        return String(item);
      }
    }
    return String(item);
  };
  return normalizeText(toText(value)) || "None";
}
/**
 * Produces the comparison key for a section label: lower-cased, without
 * leading `#` markers, with `*`, `:`, `_` and `-` runs treated as spaces, and
 * with whitespace collapsed.
 *
 * @param {*} value - Raw section label; falsy values become "".
 * @returns {string} The normalized key.
 */
function normalizeSectionKey(value) {
  const lowered = String(value || "").toLowerCase();
  const withoutHashes = lowered.replace(/^#+\s*/, "");
  const punctuationAsSpace = withoutHashes.replace(/[*:_-]+/g, " ");
  return punctuationAsSpace.replace(/\s+/g, " ").trim();
}
/**
 * Renders a run output value (string, array, object or primitive) as report text.
 *
 * Strings holding a JSON object are parsed and rendered recursively; when the
 * object has an `output` field, that field is rendered and its `summary` is
 * carried along. Objects are rendered section by section, as bullets,
 * headings or plain "Key: value" lines depending on the contract.
 *
 * @param {*} value - Value to render.
 * @param {object} [options]
 * @param {object|null} [options.contract] - Output contract (section order and style).
 * @param {string|null} [options.summary] - Summary used for the "Status:" line.
 * @returns {string} The rendered text; "" for nullish values.
 */
function renderValue(value, { contract = null, summary = null } = {}) {
  if (value == null) return "";

  if (typeof value === "string") {
    const decoded = parseJsonCandidate(value);
    if (!decoded || typeof decoded !== "object") return stripOuterFence(value);
    if (decoded.output === undefined) return renderValue(decoded, { contract, summary });
    return renderValue(decoded.output, { contract, summary: decoded.summary || summary });
  }

  if (Array.isArray(value)) {
    const parts = [];
    for (const item of value) {
      const text = renderValue(item, { contract, summary });
      if (text) parts.push(text);
    }
    return parts.join("\n");
  }

  if (typeof value !== "object") return String(value);

  const entries = Object.entries(value);
  const hasRequiredSections = Boolean(contract?.requiredSections?.length);
  const sectionOrder = hasRequiredSections ? contract.requiredSections : entries.map(([key]) => key);
  // Values are looked up by normalized key so "Next Actions" and "next_actions" agree.
  const valueMap = new Map(entries.map(([key, entryValue]) => [normalizeSectionKey(key), entryValue]));
  const sectionStyle =
    contract?.profile?.sectionStyle || (contract?.format === "structured_rollup" ? "headings" : "bullets");
  const requireStatus = contract?.profile?.requireStatus ?? (contract?.format === "bulleted_briefing");
  const textFor = (section) => normalizeInline(valueMap.get(normalizeSectionKey(section)));

  switch (sectionStyle) {
    case "bullets": {
      const statusLine = requireStatus && summary ? [`Status: ${normalizeInline(summary)}`] : [];
      const bullets = sectionOrder.map((section) => `- ${titleCase(section)}: ${textFor(section)}`);
      return [...statusLine, ...bullets].join("\n");
    }
    case "headings":
      return sectionOrder
        .map((section) => `## ${titleCase(section)}\n- ${textFor(section)}\n`)
        .join("\n")
        .trim();
    default:
      return entries
        .map(([key, entryValue]) => `${titleCase(key)}: ${normalizeInline(entryValue)}`)
        .join("\n");
  }
}
/**
 * Produces the report text of a V2 run.
 *
 * @param {object|null} run - V2 run artifact.
 * @param {object|null} [contract] - Output contract forwarded to `renderValue`.
 * @returns {string} Rendered `result.output` (or `output`, or the summary); "" without a run.
 */
function extractRunText(run, contract = null) {
  if (!run) return "";
  const summary = run.result?.summary || run.summary || "";
  // `??` so an explicitly empty output is kept rather than replaced by the summary.
  const output = run.result?.output ?? run.output ?? summary;
  return renderValue(output, { contract, summary });
}
/**
 * Produces the report text of a live run from its summary, or from its error
 * when there is no summary.
 *
 * @param {object|null} run - Live run record.
 * @returns {string} Rendered text; "" without a run.
 */
function extractLiveText(run) {
  if (!run) return "";
  const source = run.summary || run.error || "";
  return renderValue(source);
}
/**
 * Scores an output between 0 and 1 using surface heuristics and lists the
 * reasons for every deduction.
 *
 * Deductions: very short text, placeholder tokens, apology / tool-failure
 * language, code fences, timeout language and repeated numbered lines.
 *
 * @param {*} text - Output text.
 * @returns {{score: number, findings: string[]}} Score (0 for empty output)
 *   and the findings that explain it.
 */
function qualitySignals(text) {
  const raw = String(text || "");
  const normalized = normalizeText(text);
  const lower = normalized.toLowerCase();
  const findings = [];
  let score = 1;
  if (!normalized) {
    findings.push("Output is empty.");
    return { score: 0, findings };
  }
  if (normalized.length < 40) {
    findings.push("Output is very short and may not carry enough signal.");
    score -= 0.18;
  }
  if (/\[(title|link|summary|sub)\]/i.test(normalized)) {
    findings.push("Output still contains placeholder text.");
    score -= 0.4;
  }
  // Accept both the ASCII and the typographic apostrophe in "I'm sorry".
  if (/i(?:['’]| a)?m sorry|does not support|cannot complete|failed to/i.test(lower)) {
    findings.push("Output contains apology or tool-failure language.");
    score -= 0.28;
  }
  if (/```/.test(raw)) {
    findings.push("Output is wrapped in a code block instead of a direct report.");
    score -= 0.12;
  }
  if (/timed out|timeout/i.test(lower)) {
    findings.push("Output references a timeout or stalled execution.");
    score -= 0.35;
  }
  // The line-based check needs the raw text: `normalized` has every newline
  // collapsed to a space, so it always looks like a single line.
  const repeatedLinePenalty = detectRepeatedLinePenalty(raw);
  if (repeatedLinePenalty > 0) {
    findings.push("Output repeats nearly identical numbered lines.");
    score -= repeatedLinePenalty;
  }
  return {
    score: clamp(Number(score.toFixed(4))),
    findings
  };
}

/**
 * Computes the score deduction for numbered lists that repeat the same item.
 *
 * @param {string} text - Multi-line text (newlines must be intact).
 * @returns {number} 0 when fewer than three numbered lines exist or fewer
 *   than half of them are duplicates; otherwise 0.25 times the duplicate ratio.
 */
function detectRepeatedLinePenalty(text) {
  const lines = text
    .split("\n")
    .map((line) => line.trim())
    .filter(Boolean)
    .filter((line) => /^\d+\./.test(line));
  if (lines.length < 3) return 0;
  // Compare items without their numbering and case.
  const normalized = lines.map((line) => line.replace(/^\d+\.\s*/, "").toLowerCase());
  const unique = new Set(normalized);
  const duplicateRatio = 1 - unique.size / normalized.length;
  if (duplicateRatio < 0.5) return 0;
  return Number((duplicateRatio * 0.25).toFixed(4));
}
/**
 * Computes the closure of notification files reachable from a starting set by
 * following each known notification's `generatedNotificationFiles`.
 *
 * @param {Iterable<string>} baseFiles - Starting notification file paths.
 * @param {object[]} notifications - Known notifications (`filePath`, optional `generatedNotificationFiles`).
 * @returns {Set<string>} The starting files plus every transitively generated file.
 */
function expandRelatedNotificationFiles(baseFiles, notifications) {
  const reachable = new Set(baseFiles);
  let addedThisPass;
  // Re-scan until a full pass adds nothing: a generated file may itself generate more.
  do {
    addedThisPass = false;
    for (const notification of notifications) {
      if (!reachable.has(notification.filePath)) continue;
      const children = notification.generatedNotificationFiles || [];
      for (const child of children) {
        if (!reachable.has(child)) {
          reachable.add(child);
          addedThisPass = true;
        }
      }
    }
  } while (addedThisPass);
  return reachable;
}
/**
 * Summarizes recent live cron runs: status counts, failure rate, average
 * duration / token usage / quality score, and findings.
 *
 * @param {object[]} liveRuns - Recent live runs.
 * @returns {object} Aggregate metrics; rates and averages are `null` when
 *   there is nothing to aggregate.
 */
function evaluateLiveHistory(liveRuns) {
  const runCount = liveRuns.length;
  if (runCount === 0) {
    return {
      runCount: 0,
      okCount: 0,
      errorCount: 0,
      skippedCount: 0,
      failureRate: null,
      avgDurationMs: null,
      avgTotalTokens: null,
      avgQualityScore: null,
      findings: ["No recent live history available."]
    };
  }

  const countWithStatus = (status) => liveRuns.filter((run) => run.status === status).length;
  const finiteValues = (values) => values.filter((value) => Number.isFinite(value));

  const okCount = countWithStatus("ok");
  const errorCount = countWithStatus("error");
  const skippedCount = countWithStatus("skipped");
  const failureRate = errorCount / runCount;
  const durations = finiteValues(liveRuns.map((run) => run.durationMs));
  const tokens = finiteValues(liveRuns.map((run) => run.usage?.total_tokens));
  const qualityScores = finiteValues(
    liveRuns.map((run) => qualitySignals(run.summary || run.error || "").score)
  );

  const findings = [];
  if (failureRate >= 0.34) findings.push("Live cron lane is failing often.");
  if (skippedCount > 0) findings.push("Live cron history includes intentional skips.");
  if (tokens.some((value) => value > 12000)) findings.push("Live cron lane shows high token usage spikes.");

  let avgDurationMs = null;
  if (durations.length) avgDurationMs = Math.round(average(durations));
  let avgTotalTokens = null;
  if (tokens.length) avgTotalTokens = Math.round(average(tokens));
  let avgQualityScore = null;
  if (qualityScores.length) avgQualityScore = Number(average(qualityScores).toFixed(4));

  return {
    runCount,
    okCount,
    errorCount,
    skippedCount,
    failureRate: Number(failureRate.toFixed(4)),
    avgDurationMs,
    avgTotalTokens,
    avgQualityScore,
    findings
  };
}
/**
 * Maps a run status to a numeric score.
 *
 * @param {*} status - Run status.
 * @returns {number} 1 for "ok", 0.6 for "skipped", 0 for "error", 0.5 for anything else.
 */
function scoreStatus(status) {
  switch (status) {
    case "ok":
      return 1;
    case "skipped":
      return 0.6;
    case "error":
      return 0;
    default:
      return 0.5;
  }
}
/**
 * Scores a V2 run against its live cron analogue.
 *
 * The overall score is the mean of the components that apply: V2 output
 * quality, comparison readiness, comparison coverage, contract adherence,
 * field-level quality, live reliability and status alignment. For a run that
 * is not in provider mode (a dry run), output quality, contract adherence and
 * field-level quality are excluded.
 *
 * @param {object} input
 * @param {object|null} input.v2Run - V2 run being scored.
 * @param {object[]} [input.liveHistory] - Recent live runs; index 0 is treated
 *   as the latest. A missing list is treated as empty.
 * @param {object|null} input.matchedLiveJob - Matched live job, if any.
 * @param {object|null} [input.outputContract] - Contract used to render the V2 text.
 * @param {object|null} [input.contractCheck] - Result of the contract assessment.
 * @returns {{overallScore: number, dryRunExcluded: boolean, components: object,
 *   findings: string[], metrics: object}}
 */
function buildRubric({ v2Run, liveHistory, matchedLiveJob, outputContract = null, contractCheck = null }) {
  const liveRuns = liveHistory ?? [];
  const findings = [];
  const v2Text = extractRunText(v2Run, outputContract);
  const v2Quality = qualitySignals(v2Text);
  const latestLive = liveRuns[0] || null;
  const latestLiveQuality = qualitySignals(extractLiveText(latestLive));
  const history = evaluateLiveHistory(liveRuns);
  const isDryRun = v2Run != null && v2Run.mode !== "provider";
  const comparisonReadiness = v2Run
    ? v2Run.mode === "provider"
      ? 1
      : 0.45
    : 0;
  const comparisonCoverage = matchedLiveJob ? 1 : 0.2;
  const contractAdherence = contractCheck ? contractCheck.satisfiedRatio : null;
  if (!v2Run) findings.push("No V2 run exists for this lane yet.");
  else if (isDryRun) findings.push("Only a dry-run V2 artifact exists; output quality and contract adherence are excluded from the rubric score.");
  if (!matchedLiveJob) findings.push("Comparison coverage is low because no live cron analogue is mapped.");
  if (!isDryRun && v2Quality.findings.length) findings.push(...v2Quality.findings.map((item) => `V2: ${item}`));
  // Without a live run there is no live output to criticize; the history
  // findings already report the missing history.
  if (latestLive && latestLiveQuality.findings.length) {
    findings.push(...latestLiveQuality.findings.map((item) => `Live: ${item}`));
  }
  if (history.findings.length) findings.push(...history.findings);
  const fieldScores = contractCheck?.fieldScores || null;
  if (!isDryRun && fieldScores) {
    if (fieldScores.weakFields.length) {
      findings.push(`Field-level quality is low for: ${fieldScores.weakFields.join(", ")}`);
    }
    if (fieldScores.placeholderFields.length) {
      findings.push(`Placeholder text detected in: ${fieldScores.placeholderFields.join(", ")}`);
    }
  }
  if (!matchedLiveJob) {
    findings.push("No live cron analogue matched for this V2 job.");
  }
  // A V2 run that carries a result is scored as "ok" regardless of its status field.
  const statusAlignment =
    latestLive && v2Run
      ? Number((scoreStatus(v2Run.result ? "ok" : v2Run.status) * scoreStatus(latestLive.status)).toFixed(4))
      : null;
  const liveReliability = history.failureRate == null ? null : Number((1 - history.failureRate).toFixed(4));
  const fieldLevelQuality = !isDryRun && fieldScores ? fieldScores.averageScore : null;
  // Components that do not apply are null and are left out of the mean.
  const components = [
    isDryRun ? null : v2Quality.score,
    comparisonReadiness,
    comparisonCoverage,
    isDryRun ? null : contractAdherence,
    fieldLevelQuality,
    liveReliability,
    statusAlignment
  ].filter((value) => value != null);
  const overallScore = components.length ? Number(average(components).toFixed(4)) : 0;
  return {
    overallScore,
    dryRunExcluded: isDryRun,
    components: {
      v2OutputQuality: isDryRun ? null : v2Quality.score,
      comparisonReadiness,
      comparisonCoverage,
      contractAdherence: isDryRun ? null : contractAdherence,
      fieldLevelQuality,
      liveReliability,
      statusAlignment
    },
    findings: uniqueStrings(findings),
    metrics: {
      liveRunCount: history.runCount,
      liveOkCount: history.okCount,
      liveErrorCount: history.errorCount,
      liveSkippedCount: history.skippedCount,
      liveFailureRate: history.failureRate,
      liveAvgDurationMs: history.avgDurationMs,
      liveAvgTotalTokens: history.avgTotalTokens,
      liveAvgQualityScore: history.avgQualityScore,
      latestLiveQualityScore: latestLive ? latestLiveQuality.score : null
    }
  };
}
+function uniqueStrings(items) {
+  return [...new Set(items.filter(Boolean))];
+}
+function summarizeV2Run(run) {
+  if (!run) return null;
+  return {
+    timestamp: run.timestamp,
+    mode: run.mode || null,
+    providerId: run.providerId || null,
+    modelId: run.modelId || null,
+    summary: run.result?.summary || run.summary || null,
+    output: run.result?.output || run.output || null,
+    retrievalMeta: run.retrievalMeta || null,
+    retrievedMemoryCount: run.retrievedMemory?.length || 0,
+    interaction: summarizeInteraction(run),
+    fallback: run.fallback || null
+  };
+}
+function summarizeInteraction(run) {
+  const interaction = run?.interaction || null;
+  if (!interaction) return null;
+  return {
+    ackRequired: interaction.ack?.required ?? false,
+    completionRequired: interaction.completion?.required ?? false,
+    handoffRequired: interaction.handoff?.required ?? false,
+    yielded: run?.yielded || false,
+    yieldSignal: run?.yieldSignal || null,
+    followUpState: run?.followUpState || null,
+    followUpQueued: run?.followUpQueued || false,
+    followUpConsumed: run?.followUpConsumed || false,
+    followUpTarget: run?.followUpTarget || null,
+    followUpCompleted: run?.followUpCompleted || false,
+    followUpExpired: run?.followUpExpired || false,
+    followUpEscalated: run?.followUpEscalated || false,
+    followUpEscalationFilePath: run?.followUpEscalationFilePath || null,
+    handoffTarget: interaction.handoff?.target || null,
+    suggestedPeerCount: interaction.handoff?.suggestions?.length || 0,
+    handoffChosenPeerId: run?.handoffChosenPeerId || null,
+    handoffChosenBy: run?.handoffChosenBy || null,
+    handoffDelivered: run?.handoffDelivered || false,
+    handoffDeliveryState: run?.handoffDeliveryState || null,
+    deliveryDeduped: run?.deliveryDeduped || false,
+    deliveryRetried: run?.deliveryRetried || false,
+    deliveryUncertain: run?.deliveryUncertain || false
+  };
+}
+function analyzeRetrieval(run) {
+  const retrievalMeta = run?.retrievalMeta || run?.plan?.packet?.layers?.retrievalMeta || null;
+  if (!run?.retrievedMemory?.length) {
+    return {
+      memoryCount: 0,
+      lexicalCount: 0,
+      semanticCount: 0,
+      qmdCount: 0,
+      freshEmbeddingCount: 0,
+      staleEmbeddingCount: 0,
+      missingEmbeddingCount: 0,
+      failedEmbeddingCount: retrievalMeta?.embeddingHealth?.failedCount || 0,
+      embeddingQueryMode: retrievalMeta?.embeddingQueryMode || "lexical_only",
+      embeddingError: retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError || null,
+      findings: ["No retrieved memory was captured for this run."],
+      items: []
+    };
+  }
+  const items = run.retrievedMemory.map((item) => ({
+    entryId: item.entryId || null,
+    title: item.title || null,
+    sourceBackend: item.sourceBackend || "file",
+    candidateSource: item.candidateSource || "indexed",
+    lexicalScore: item.lexicalScore ?? 0,
+    embeddingSimilarity: item.embeddingSimilarity ?? 0,
+    embeddingFreshness: item.embeddingFreshness || "missing",
+    retrievalSources: item.retrievalSources || []
+  }));
+  const lexicalCount = items.filter((item) => item.retrievalSources.includes("lexical")).length;
+  const semanticCount = items.filter((item) => item.retrievalSources.includes("semantic")).length;
+  const qmdCount = items.filter((item) => item.retrievalSources.includes("qmd") || item.sourceBackend === "qmd").length;
+  const freshEmbeddingCount = items.filter((item) => item.embeddingFreshness === "fresh").length;
+  const staleEmbeddingCount = items.filter((item) => item.embeddingFreshness === "stale").length;
+  const missingEmbeddingCount = items.filter((item) => item.embeddingFreshness === "missing").length;
+  const failedEmbeddingCount = items.filter((item) => item.embeddingFreshness === "failed").length;
+  const findings = [];
+  if (semanticCount === 0) findings.push("No semantic retrieval candidates reached the final packet.");
+  if (staleEmbeddingCount > 0) findings.push("Some retrieved items have stale embeddings.");
+  if (freshEmbeddingCount === 0 && missingEmbeddingCount > 0) findings.push("Retrieved file memory is falling back to non-embedded retrieval.");
+  if ((retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError) && !findings.includes("Embedding query failed and retrieval fell back to lexical mode.")) {
+    findings.push("Embedding query failed and retrieval fell back to lexical mode.");
+  }
+  return {
+    memoryCount: items.length,
+    lexicalCount,
+    semanticCount,
+    qmdCount,
+    freshEmbeddingCount,
+    staleEmbeddingCount,
+    missingEmbeddingCount,
+    failedEmbeddingCount,
+    embeddingQueryMode: retrievalMeta?.embeddingQueryMode || "lexical_only",
+    embeddingError: retrievalMeta?.embeddingError || retrievalMeta?.embeddingHealth?.lastError || null,
+    embeddingHealth: retrievalMeta?.embeddingHealth || null,
+    findings,
+    items
+  };
+}
+function summarizeInteractionDiagnosis({
+  ackRequired,
+  ackQueued,
+  completionRequired,
+  completionQueued,
+  handoffRequired,
+  handoffQueued,
+  yielded,
+  followUpQueued,
+  followUpConsumed,
+  handoffDelivered,
+  deliveryEvidenceRequired,
+  deliveryEvidenceHealthy,
+  deliveryUncertain,
+  findings
+}) {
+  const missingStages = [];
+  if (ackRequired && !ackQueued) missingStages.push("ack");
+  if (completionRequired && !completionQueued && !yielded) missingStages.push("completion");
+  if (handoffRequired && !handoffQueued && !yielded) missingStages.push("handoff");
+  if (!findings?.length) {
+    return {
+      status: "healthy",
+      code: null,
+      summary: "Interaction lifecycle evidence is complete.",
+      missingStages,
+      findings: []
+    };
+  }
+  if (missingStages.length) {
+    return {
+      status: "action_required",
+      code: "missing_required_notifications",
+      summary: `Required interaction notifications are missing: ${missingStages.join(", ")}.`,
+      missingStages,
+      findings
+    };
+  }
+  if (yielded && followUpQueued && !followUpConsumed) {
+    return {
+      status: "action_required",
+      code: "follow_up_incomplete",
+      summary: "Yielded follow-up is still pending or incomplete.",
+      missingStages,
+      findings
+    };
+  }
+  if (deliveryEvidenceRequired && !deliveryEvidenceHealthy) {
+    return {
+      status: "action_required",
+      code: "missing_delivery_evidence",
+      summary: "Required pingback notifications do not have delivery receipts yet.",
+      missingStages,
+      findings
+    };
+  }
+  if (handoffRequired && handoffQueued && !handoffDelivered) {
+    return {
+      status: "action_required",
+      code: "handoff_incomplete",
+      summary: "Handoff was queued but not fully delivered.",
+      missingStages,
+      findings
+    };
+  }
+  if (deliveryUncertain) {
+    return {
+      status: "warning",
+      code: "delivery_uncertain",
+      summary: "Interaction lifecycle completed with uncertain delivery evidence.",
+      missingStages,
+      findings
+    };
+  }
+  return {
+    status: "warning",
+    code: "interaction_findings_present",
+    summary: findings[0] || "Interaction lifecycle has unresolved findings.",
+    missingStages,
+    findings
+  };
+}
+/**
+ * Derive interaction lifecycle evidence for a run from its queued
+ * notifications and delivery receipts, and attach a diagnosis.
+ *
+ * @param {object|null|undefined} run - Run artifact; only `run.interaction` is read.
+ * @param {Array<object>} [notifications=[]] - Notifications related to the run,
+ *   identified by `stage` ("ack", "completion", "handoff", "follow_up").
+ * @param {Array<object>} [deliveries=[]] - Delivery receipts, linked to
+ *   notifications through `notificationFilePath`.
+ * @returns {object} Lifecycle flags, delivery state, `diagnosis` (from
+ *   summarizeInteractionDiagnosis) and the ordered `findings` list.
+ */
+function analyzeInteraction(run, notifications = [], deliveries = []) {
+  const interaction = run?.interaction || null;
+  const findings = [];
+  // What the interaction config requires.
+  const ackRequired = interaction?.ack?.required ?? false;
+  const completionRequired = interaction?.completion?.required ?? false;
+  const handoffRequired = interaction?.handoff?.required ?? false;
+  // What was actually queued, by notification stage.
+  const ackQueued = notifications.some((item) => item.stage === "ack");
+  const completionQueued = notifications.some((item) => item.stage === "completion");
+  const handoffQueued = notifications.some((item) => item.stage === "handoff");
+  const followUpQueued = notifications.some((item) => item.stage === "follow_up");
+  // Only the first follow-up / handoff notification is inspected in detail.
+  const followUpNotification = notifications.find((item) => item.stage === "follow_up") || null;
+  const handoffNotification = notifications.find((item) => item.stage === "handoff") || null;
+  const handoffPendingChoice = handoffNotification?.status === "awaiting_choice";
+  const handoffState = handoffNotification?.handoffState || (handoffPendingChoice ? "pending" : null);
+  const handoffChosen = Boolean(handoffNotification?.chosenPeer?.peerId);
+  const handoffChosenPeerId = handoffNotification?.chosenPeer?.peerId || null;
+  const handoffChosenBy = handoffNotification?.chosenBy || null;
+  // A handoff counts as delivered when any receipt points at its notification file.
+  const handoffDelivery = handoffNotification
+    ? deliveries.find((item) => item.notificationFilePath === handoffNotification.filePath) || null
+    : null;
+  const handoffDelivered = Boolean(handoffDelivery);
+  const handoffDeliveryState = handoffDelivery?.delivery?.status || null;
+  const deliveryStates = deliveries.map((item) => item.delivery?.status || item.stage || "unknown");
+  // "yielded" is taken from the interaction's yield requirement, not from run-level state.
+  const yielded = interaction?.yield?.required ?? false;
+  const yieldSignal = interaction?.yield?.signal || null;
+  const followUpState = followUpNotification?.followUpState || followUpNotification?.yieldState || null;
+  const followUpConsumed = followUpNotification?.status === "consumed" || followUpNotification?.yieldState === "consumed" || followUpNotification?.followUpState === "consumed";
+  const followUpTarget = followUpNotification?.targetSurface || interaction?.yield?.targetSurface || null;
+  // Notification files generated by the follow-up; a receipt for any of them marks the follow-up completed.
+  const generatedFiles = new Set(followUpNotification?.generatedNotificationFiles || []);
+  const followUpCompleted = deliveries.some((item) => generatedFiles.has(item.notificationFilePath));
+  const followUpExpired = followUpState === "expired";
+  const followUpEscalated = followUpState === "escalated";
+  const deliveryDeduped = deliveryStates.includes("duplicate_prevented");
+  const deliveryRetried = deliveries.some((item) => Number(item.attempt) > 1);
+  const deliveryUncertain = deliveryStates.includes("delivery_uncertain") || deliveryStates.includes("uncertain");
+  // When the run yielded, a follow-up payload carrying completion/handoff stands in for the queued notification.
+  const yieldedCompletionHandled = yielded && followUpQueued && Boolean(followUpNotification?.payload?.completion);
+  const yieldedHandoffHandled = yielded && followUpQueued && Boolean(followUpNotification?.payload?.handoff);
+  // For yielded runs, receipts for follow-up-generated notifications are excluded from the visible count.
+  const visibleDeliveryCount = yielded ? deliveries.filter((item) => !generatedFiles.has(item.notificationFilePath)).length : deliveries.length;
+  // Delivery receipts are only required for non-yielded runs that queued at least one notification.
+  const deliveryEvidenceRequired = !yielded && Boolean(ackQueued || completionQueued || handoffQueued);
+  const deliveryEvidenceHealthy = !deliveryEvidenceRequired || visibleDeliveryCount > 0;
+  // Findings are pushed in a fixed order; summarizeInteractionDiagnosis uses findings[0] as its fallback summary.
+  if (ackRequired && !ackQueued) findings.push("Required ack notification was not queued.");
+  if (completionRequired && !completionQueued && !yieldedCompletionHandled) {
+    findings.push("Required completion notification was not queued.");
+  }
+  if (handoffRequired && !handoffQueued && !yieldedHandoffHandled) {
+    findings.push("Configured handoff was not queued.");
+  }
+  if (yielded && !followUpQueued) findings.push("Run yielded but no follow-up payload was persisted.");
+  if (followUpQueued && !followUpConsumed) findings.push("Follow-up payload was persisted but never consumed.");
+  if (followUpExpired) findings.push("Follow-up expired before it was consumed.");
+  if (followUpEscalated) findings.push("Follow-up expired and was escalated to the operator.");
+  if (handoffPendingChoice) findings.push("Handoff is awaiting an explicit peer choice.");
+  if (handoffState === "expired") findings.push("Handoff expired without an operator choice.");
+  if (handoffState === "escalated") findings.push("Handoff expired and was escalated to the operator.");
+  if (handoffState === "blocked") findings.push(`Handoff is blocked${handoffNotification?.blockedReason ? `: ${handoffNotification.blockedReason}` : "."}`);
+  if (handoffQueued && !handoffPendingChoice && !handoffChosen) findings.push("Handoff was queued but no peer choice was recorded.");
+  if (handoffChosen && !handoffDelivered) findings.push("Handoff was promoted to a peer but not delivered yet.");
+  if (handoffDeliveryState && /error|blocked/i.test(handoffDeliveryState)) findings.push(`Handoff delivery did not complete cleanly: ${handoffDeliveryState}.`);
+  if (!deliveryEvidenceHealthy) {
+    findings.push("No delivery receipts exist yet for queued interaction notifications.");
+  }
+  if (deliveryDeduped) findings.push("A duplicate delivery attempt was prevented by dedupe policy.");
+  if (deliveryUncertain) findings.push("A delivery attempt was marked uncertain and will not be blindly retried.");
+  const diagnosis = summarizeInteractionDiagnosis({
+    ackRequired,
+    ackQueued,
+    completionRequired,
+    completionQueued,
+    handoffRequired,
+    handoffQueued,
+    yielded,
+    followUpQueued,
+    followUpConsumed,
+    handoffDelivered,
+    deliveryEvidenceRequired,
+    deliveryEvidenceHealthy,
+    deliveryUncertain,
+    findings
+  });
+  return {
+    ackRequired,
+    ackQueued,
+    completionRequired,
+    completionQueued,
+    handoffRequired,
+    handoffQueued,
+    yielded,
+    yieldSignal,
+    followUpState,
+    followUpQueued,
+    followUpConsumed,
+    followUpTarget,
+    followUpCompleted,
+    followUpExpired,
+    followUpEscalated,
+    followUpEscalationFilePath: followUpNotification?.escalationNotificationFilePath || null,
+    handoffPendingChoice,
+    handoffState,
+    handoffExpired: handoffState === "expired",
+    handoffEscalated: handoffState === "escalated",
+    handoffBlocked: handoffState === "blocked",
+    handoffChosen,
+    handoffChosenPeerId,
+    handoffChosenBy,
+    handoffDelivered,
+    handoffDeliveryState,
+    handoffBlockedReason: handoffNotification?.blockedReason || null,
+    deliveryEvidenceRequired,
+    deliveryEvidenceHealthy,
+    // Reported count excludes follow-up-generated receipts when the run yielded.
+    deliveryReceiptCount: visibleDeliveryCount,
+    deliveryStates,
+    deliveryDeduped,
+    deliveryRetried,
+    deliveryUncertain,
+    diagnosis,
+    findings
+  };
+}
+function summarizeLiveRun(run) {
+  if (!run) return null;
+  return {
+    ts: run.ts || null,
+    status: run.status || null,
+    summary: run.summary || null,
+    error: run.error || null,
+    durationMs: run.durationMs ?? null,
+    provider: run.provider || null,
+    model: run.model || null,
+    usage: run.usage || null
+  };
+}
+// Keywords looked up as plain substrings of the lowercased output text by
+// analyzeOutputStructure. Because matching is by substring, text containing
+// "projects" matches both the "projects" and the "project" hint.
+const SECTION_HINTS = [
+  "calendar",
+  "weather",
+  "projects",
+  "project",
+  "inbox",
+  "issues",
+  "backlog",
+  "update",
+  "summary",
+  "next actions",
+  "alerts",
+  "status"
+];
+// Maps a normalized section key to its canonical form (singular -> plural);
+// consulted by canonicalSectionKey after normalizeSectionKey has run.
+const SECTION_ALIASES = new Map([
+  ["project", "projects"],
+  ["next action", "next actions"]
+]);
+function canonicalSectionKey(value) {
+  const normalized = normalizeSectionKey(value);
+  return SECTION_ALIASES.get(normalized) || normalized;
+}
+function extractSectionKeys(nonEmptyLines) {
+  const sectionKeys = [];
+  const seen = new Set();
+  const patterns = [
+    /^#{1,6}\s+(.+)$/,
+    /^\*\*([^*]+)\*\*$/,
+    /^[-*]\s+\**([^:*]+?)\**:\s+.+$/,
+    /^([^:]{2,40}):\s+.+$/
+  ];
+  for (const line of nonEmptyLines) {
+    for (const pattern of patterns) {
+      const match = line.match(pattern);
+      if (!match) continue;
+      const key = canonicalSectionKey(match[1]);
+      if (!key || key.length < 2) continue;
+      if (seen.has(key)) break;
+      seen.add(key);
+      sectionKeys.push(key);
+      break;
+    }
+  }
+  return sectionKeys;
+}
+function comparableSections(structure) {
+  return structure.sectionKeys.length ? structure.sectionKeys : structure.sectionHints;
+}
+function analyzeOutputStructure(text) {
+  const raw = String(text || "");
+  const trimmed = raw.trim();
+  const lines = raw.split("\n").map((line) => line.trim());
+  const nonEmptyLines = lines.filter(Boolean);
+  const lower = trimmed.toLowerCase();
+  const sectionKeys = extractSectionKeys(nonEmptyLines);
+  return {
+    charCount: trimmed.length,
+    lineCount: nonEmptyLines.length,
+    headingCount: nonEmptyLines.filter((line) => /^#{1,6}\s/.test(line) || /^\*\*[^*]+\*\*/.test(line)).length,
+    bulletCount: nonEmptyLines.filter((line) => /^[-*]\s/.test(line)).length,
+    numberedCount: nonEmptyLines.filter((line) => /^\d+\.\s/.test(line)).length,
+    codeFenceCount: (raw.match(/```/g) || []).length / 2,
+    sectionKeys,
+    sectionHints: SECTION_HINTS.filter((hint) => lower.includes(hint)),
+    hasMarkdownTable: /\|.+\|/.test(raw),
+    hasEmoji: /\p{Extended_Pictographic}/u.test(raw)
+  };
+}
+function buildOutputDiff(v2Run, liveRun, contract = null) {
+  const v2Text = extractRunText(v2Run, contract);
+  const liveText = extractLiveText(liveRun);
+  const v2 = analyzeOutputStructure(v2Text);
+  const live = analyzeOutputStructure(liveText);
+  const v2Sections = comparableSections(v2);
+  const liveSections = comparableSections(live);
+  const sharedSections = v2Sections.filter((hint) => liveSections.includes(hint));
+  const missingFromV2 = liveSections.filter((hint) => !v2Sections.includes(hint));
+  const extraInV2 = v2Sections.filter((hint) => !liveSections.includes(hint));
+  const findings = [];
+  if (!liveText) {
+    findings.push("No live output is available for structural comparison.");
+  } else {
+    if (missingFromV2.length) findings.push(`V2 is missing live sections: ${missingFromV2.join(", ")}.`);
+    if (v2.bulletCount + v2.numberedCount < live.bulletCount + live.numberedCount) {
+      findings.push("V2 output is less structured than the live report.");
+    }
+    if (v2.charCount > 0 && live.charCount > 0) {
+      const verbosityRatio = Number((v2.charCount / live.charCount).toFixed(4));
+      if (verbosityRatio < 0.55) findings.push("V2 output is much shorter than the live report.");
+      if (verbosityRatio > 1.8) findings.push("V2 output is much longer than the live report.");
+    }
+  }
+  return {
+    v2,
+    live,
+    alignment: {
+      sharedSections,
+      missingFromV2,
+      extraInV2,
+      bulletDelta: (v2.bulletCount + v2.numberedCount) - (live.bulletCount + live.numberedCount),
+      headingDelta: v2.headingCount - live.headingCount,
+      charDelta: v2.charCount - live.charCount
+    },
+    findings
+  };
+}
+function assessOutputContract(contract, v2Run, liveRun) {
+  if (!contract) return null;
+  const v2Validation = validateOutputContract(contract, v2Run?.result?.output ?? v2Run?.output ?? "");
+  const liveValidation = validateOutputContract(contract, liveRun?.summary || liveRun?.error || "");
+  const missingFromV2 = v2Validation?.missingSections || [];
+  const missingFromLive = liveValidation?.missingSections || [];
+  const findings = [
+    ...(v2Validation?.findings.map((item) => `V2: ${item}`) || []),
+    ...(liveValidation?.findings.map((item) => `Live: ${item}`) || [])
+  ];
+  return {
+    format: contract.format || null,
+    requiredSections: contract.requiredSections || [],
+    styleHints: contract.styleHints || [],
+    satisfiedRatio: v2Validation?.satisfiedRatio ?? 0,
+    missingFromV2,
+    missingFromLive,
+    emptyInV2: v2Validation?.emptySections || [],
+    emptyInLive: liveValidation?.emptySections || [],
+    parsedV2: v2Validation?.parsed || null,
+    parsedLive: liveValidation?.parsed || null,
+    fieldScores: v2Validation?.fieldScores || null,
+    findings
+  };
+}
+export { buildRubric };
+export class Evaluator {
+  constructor({ projectRoot, liveRoot, stateRoot }) {
+    this.liveRoot = liveRoot;
+    this.stateRoot = stateRoot;
+    this.reviewer = new RunReviewer({ stateRoot });
+    this.scheduler = new Scheduler({ projectRoot, liveRoot, stateRoot });
+    this.evalStore = new RunStore({ rootDir: path.join(stateRoot, "evaluations") });
+    this.notificationStore = new NotificationStore({ rootDir: path.join(stateRoot, "notifications") });
+    this.deliveryStore = new DeliveryStore({ rootDir: path.join(stateRoot, "deliveries") });
+  }
+  async resolveInteractionArtifacts(run, review = null) {
+    const reviewNotifications = review?.recentNotifications || [];
+    const _reviewDeliveries = review?.recentDeliveries || [];
+    const baseFiles = run?.notificationFiles || [];
+    const relatedNotificationFiles = expandRelatedNotificationFiles(
+      baseFiles,
+      reviewNotifications
+    );
+    const knownNotifications = reviewNotifications.filter((item) => relatedNotificationFiles.has(item.filePath));
+    const missingNotificationFiles = [...relatedNotificationFiles].filter(
+      (filePath) => !knownNotifications.some((item) => item.filePath === filePath)
+    );
+    const loadedNotifications = await this.notificationStore.getNotifications(missingNotificationFiles);
+    const notifications = [...knownNotifications, ...loadedNotifications].sort((a, b) =>
+      String(a.timestamp || "").localeCompare(String(b.timestamp || ""))
+    );
+    const expandedNotificationFiles = expandRelatedNotificationFiles(baseFiles, notifications);
+    // Load all delivery receipts once for deterministic interaction evidence.
+    const allDeliveries = await this.deliveryStore.listAll();
+    const deliveries = allDeliveries.filter((item) => expandedNotificationFiles.has(item.notificationFilePath));
+    return {
+      notificationFiles: expandedNotificationFiles,
+      notifications,
+      deliveries
+    };
+  }
+  async evaluate(limit = 20) {
+    const [review, comparisons] = await Promise.all([
+      this.reviewer.review(limit),
+      this.scheduler.compareJobs()
+    ]);
+    const recentRuns = review.recentRuns.filter((run) => !run.jobId.endsWith("-comparison"));
+    const grouped = groupBy(recentRuns, (run) => run.jobId);
+    const jobs = await Promise.all(
+      Array.from(grouped.entries()).map(async ([jobId, runs]) => this.evaluateJob(jobId, {
+        runs,
+        review,
+        comparisons
+      }))
+    );
+    return {
+      jobs: [...jobs].sort((a, b) => a.rubric.overallScore - b.rubric.overallScore),
+      recentRuns,
+      scheduler: review.scheduler
+    };
+  }
+  async evaluateJob(jobId, options = {}) {
+    const runtime = await this.scheduler.loadRuntime();
+    const jobConfig = runtime.jobs[jobId] || null;
+    const review = options.review || (await this.reviewer.review(options.limit ?? 20));
+    const comparisons = options.comparisons || (await this.scheduler.compareJobs());
+    const runs = options.runs || review.recentRuns.filter((run) => run.jobId === jobId && !run.jobId.endsWith("-comparison"));
+    const schedulerState = review.scheduler.find((item) => item.jobId === jobId) || null;
+    const comparison = comparisons.find((item) => item.v2JobId === jobId) || null;
+    const liveMatches = await Promise.all(
+      (comparison?.closestLiveJobs || []).map(async (match) => ({
+        ...match,
+        recentRuns: await this.scheduler.bridge.loadCronRunHistory(match.id, 5),
+        latestRun: (await this.scheduler.bridge.loadCronRunHistory(match.id, 1))[0] || null
+      }))
+    );
+    const selectedRun = choosePrimaryV2Run(runs);
+    const interactionRun = runs[0] || selectedRun;
+    const selectedLiveMatch = pickBestLiveMatch(liveMatches);
+    const liveHistory = selectedLiveMatch?.recentRuns || [];
+    const outputContract = normalizeOutputContract(jobConfig?.outputContract || null);
+    const outputDiff = buildOutputDiff(selectedRun, selectedLiveMatch?.latestRun || null, outputContract);
+    const contractCheck = assessOutputContract(outputContract, selectedRun, selectedLiveMatch?.latestRun || null);
+    const retrieval = analyzeRetrieval(selectedRun);
+    const interactionArtifacts = await this.resolveInteractionArtifacts(interactionRun, review);
+    const interaction = analyzeInteraction(interactionRun, interactionArtifacts.notifications, interactionArtifacts.deliveries);
+    const rubric = buildRubric({
+      v2Run: selectedRun,
+      liveHistory,
+      matchedLiveJob: selectedLiveMatch,
+      outputContract,
+      contractCheck
+    });
+    return {
+      jobId,
+      schedulerState,
+      maintenance: review?.maintenance || null,
+      latestRun: runs[0] || null,
+      primaryRun: summarizeV2Run(selectedRun),
+      interactionRunTimestamp: interactionRun?.timestamp || null,
+      runCount: runs.length,
+      modeCounts: countModes(runs),
+      liveMatches: liveMatches.map((match) => ({
+        id: match.id,
+        name: match.name,
+        description: match.description || null,
+        enabled: match.enabled,
+        schedule: match.schedule,
+        kind: match.kind || null,
+        lastStatus: match.lastStatus || null,
+        latestRun: summarizeLiveRun(match.latestRun)
+      })),
+      selectedLiveMatch: selectedLiveMatch
+        ? {
+            id: selectedLiveMatch.id,
+            name: selectedLiveMatch.name,
+            latestRun: summarizeLiveRun(selectedLiveMatch.latestRun)
+          }
+        : null,
+      retrieval,
+      interaction,
+      outputContract,
+      contractCheck,
+      outputDiff,
+      rubric,
+      comparisonNotes: buildComparisonNotes({
+        jobId,
+        selectedRun,
+        selectedLiveMatch,
+        schedulerState,
+        maintenance: review?.maintenance || null,
+        rubric,
+        outputDiff,
+        contractCheck,
+        retrieval,
+        interaction
+      }),
+      interactionArtifacts: {
+        notificationCount: interactionArtifacts.notifications.length,
+        deliveryCount: interactionArtifacts.deliveries.length,
+        notificationFileCount: interactionArtifacts.notificationFiles.size
+      }
+    };
+  }
+  async evaluateAndPersistJob(jobId, options = {}) {
+    const report = await this.evaluateJob(jobId, options);
+    const artifact = {
+      timestamp: new Date().toISOString(),
+      kind: "job-evaluation",
+      ...report
+    };
+    const filePath = await this.evalStore.saveRun(jobId, artifact);
+    return {
+      filePath,
+      ...artifact
+    };
+  }
+}
+function countModes(runs) {
+  return runs.reduce((acc, run) => {
+    const mode = run.mode || "unknown";
+    acc[mode] = (acc[mode] || 0) + 1;
+    return acc;
+  }, {});
+}
+function buildComparisonNotes({
+  jobId,
+  selectedRun,
+  selectedLiveMatch,
+  schedulerState,
+  maintenance,
+  rubric,
+  outputDiff,
+  contractCheck,
+  retrieval = null,
+  interaction = null
+}) {
+  const notes = [];
+  if (!selectedRun) notes.push("No V2 runs recorded.");
+  if (schedulerState?.lastStatus === "ok") notes.push("Latest V2 scheduler state is healthy.");
+  if (selectedRun?.fallback?.attempted && selectedRun?.fallback?.success) {
+    notes.push(
+      `Run used report fallback from ${selectedRun.fallback.sourceLane || "local"} to ${selectedRun.fallback.finalSourceLane || "remote"} after ${selectedRun.fallback.trigger || "failure"}.`
+    );
+  } else if (selectedRun?.fallback?.attempted && !selectedRun?.fallback?.success) {
+    notes.push(`Report fallback was attempted but did not succeed${selectedRun.fallback?.fallbackError ? `: ${selectedRun.fallback.fallbackError}` : "."}`);
+  } else if (selectedRun?.fallback?.allowed === false && selectedRun?.fallback?.trigger) {
+    notes.push(`Report fallback was blocked after ${selectedRun.fallback.trigger}${selectedRun.fallback?.blockedReason ? `: ${selectedRun.fallback.blockedReason}` : "."}`);
+  }
+  if (maintenance?.wal?.some((item) => item.action && item.action !== "none" && item.action !== "error")) {
+    notes.push("Daemon maintenance recently performed WAL checkpoint work.");
+  }
+  if (maintenance?.handoffs?.expiredCount > 0) {
+    notes.push(`Daemon maintenance expired or escalated ${maintenance.handoffs.expiredCount} pending handoff(s).`);
+  }
+  if (!selectedLiveMatch) {
+    notes.push("No live cron analogue matched.");
+    return uniqueStrings([...notes, ...rubric.findings, ...outputDiff.findings, ...(contractCheck?.findings || []), ...(interaction?.findings || [])]);
+  }
+  const latestLive = selectedLiveMatch.latestRun;
+  notes.push(`Closest live cron match: ${selectedLiveMatch.name || selectedLiveMatch.id}.`);
+  if (latestLive?.status) notes.push(`Latest live status: ${latestLive.status}.`);
+  if (latestLive?.provider) notes.push(`Latest live provider: ${latestLive.provider}.`);
+  if (latestLive?.durationMs != null) notes.push(`Latest live duration: ${latestLive.durationMs}ms.`);
+  const retrievalFindings = retrieval?.findings || [];
+  const interactionFindings = interaction?.findings || [];
+  const outputDiffFindings =
+    jobId === "memory-rollup" && Number(contractCheck?.satisfiedRatio || 0) >= 0.99
+      ? (outputDiff.findings || []).filter((item) => !/less structured|much shorter/i.test(item))
+      : outputDiff.findings || [];
+  return uniqueStrings([...notes, ...rubric.findings, ...outputDiffFindings, ...(contractCheck?.findings || []), ...retrievalFindings, ...interactionFindings]);
+}
+function normalizeOutputContract(contract) {
+  if (!contract) return null;
+  return {
+    format: contract.format || null,
+    requiredSections: contract.requiredSections || [],
+    styleHints: contract.styleHints || [],
+    profile: contract.profile || null
+  };
+}