npm - role-os - Versions diffs - 2.3.1 → 2.6.0 - Mend

role-os 2.3.1 → 2.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

package/CHANGELOG.md +484 -437
package/README.es.md +319 -319
package/README.fr.md +319 -319
package/README.hi.md +319 -319
package/README.it.md +319 -319
package/README.ja.md +319 -319
package/README.md +387 -387
package/README.pt-BR.md +319 -319
package/README.zh.md +322 -322
package/bin/roleos.mjs +230 -225
package/package.json +51 -51
package/src/artifacts.mjs +693 -647
package/src/brainstorm-render.mjs +462 -462
package/src/brainstorm-roles.mjs +817 -817
package/src/brainstorm.mjs +778 -778
package/src/citation-panel.mjs +251 -0
package/src/dispatch.mjs +265 -265
package/src/mission.mjs +655 -655
package/src/packs.mjs +467 -467
package/src/route.mjs +766 -766
package/src/run-cmd.mjs +408 -408
package/src/run.mjs +1000 -1000
package/src/swarm/persist-bridge.mjs +4 -4
package/src/verify-citations-cmd.mjs +138 -0
package/src/verify-citations.mjs +523 -0
package/starter-pack/agents/engineering/caption-auditor.md +61 -0
package/starter-pack/agents/engineering/monster-taxonomy-verifier.md +62 -0
package/starter-pack/agents/engineering/red-teamer.md +75 -0
package/starter-pack/policy/tool-permissions.md +19 -0

package/src/swarm/persist-bridge.mjs CHANGED Viewed

@@ -1,12 +1,12 @@
 /**
- * Evidence Persistence Bridge — Optional connection to dogfood-labs.
+ * Evidence Persistence Bridge — Optional connection to dogfood-lab/testing-os.
  *
  * Converts swarm wave results into dogfood submission format and audit DB
  * payloads. The core swarm mission works without this — it's activated by
  * the --persist-evidence flag on `roleos swarm`.
  *
- * This mirrors the logic from dogfood-labs/tools/swarm/persist-results.js
- * but produces the payloads without requiring dogfood-labs to be present.
+ * This mirrors the logic from dogfood-lab/testing-os/packages/dogfood-swarm/persist-results.js
+ * but produces the payloads without requiring testing-os to be present.
  */
 // ── Surface mapping ─────────────────────────────────────────────────────────
@@ -104,7 +104,7 @@ export function computeOverallVerdict(scenarioResults) {
 // ── Dogfood submission payload ──────────────────────────────────────────────
 /**
- * Build a dogfood-labs-compatible submission payload.
+ * Build a testing-os-compatible submission payload.
  * @param {object} manifest - Swarm manifest
  * @param {object[]} waveReports - All wave reports from the run
  * @param {object} meta - { commitSha, branch, startedAt, completedAt }

package/src/verify-citations-cmd.mjs ADDED Viewed

@@ -0,0 +1,138 @@
+/**
+ * `roleos verify-citations <dispatch.md|.json>` — run the citation gate and report.
+ *
+ * Exit codes: 0 accept · 20 blocking (a cited paper did not resolve — likely fabricated) · 30
+ * escalate (verifier unreachable / low-confidence — a closed gate; NEVER accept) · 10 revise ·
+ * 2 no resolvable citations found. Non-zero = needs attention, so a mission step, CI job, or
+ * operator can branch on it.
+ */
+import { writeFileSync } from "node:fs";
+import { resolve, dirname, basename } from "node:path";
+import { runCitationGate } from "./verify-citations.mjs";
+/**
+ * CLI entry point for `roleos verify-citations`.
+ *
+ * Runs the citation gate on the dispatch named by the first positional argument, optionally
+ * persists the receipt, prints the result (raw JSON with `--json`, otherwise the human report)
+ * and ends the process with the code computed by `exitCodeFor`.
+ *
+ * @param {string[]} args  CLI arguments, parsed here by `parseArgs`
+ * @throws {Error} carrying `exitCode = 1` and a `hint` when no dispatch argument is given
+ */
+export async function verifyCitationsCommand(args) {
+  const { flags, positional } = parseArgs(args);
+  const dispatch = positional[0];
+  if (!dispatch) {
+    const err = new Error(
+      "Usage: roleos verify-citations <dispatch.md|.json> [--provider ollama] [--intent <text>] [--local-panel] [--json] [--receipt <path>]",
+    );
+    err.exitCode = 1;
+    err.hint =
+      "Provide a research dispatch — markdown with a Research-grounding section, or a citations JSON array.";
+    throw err;
+  }
+  // Optional settings are spread in only when the flag carried a string value, so the gate's own
+  // defaults apply otherwise.
+  const result = runCitationGate(dispatch, {
+    provider: flags.provider || "ollama",
+    ...(typeof flags.intent === "string" ? { intent: flags.intent } : {}),
+    // --local-panel: add the family-different offload entailment panel as a second seat (local,
+    // zero-cost). Re-checks prism's `supported` citations; monotone-tightening (escalates on
+    // disagreement, never loosens). Needs llama-swap up + offload.py on the rig.
+    localPanel: flags["local-panel"] === true,
+    ...(typeof flags["offload-script"] === "string" ? { offloadScript: flags["offload-script"] } : {}),
+    ...(typeof flags["llamaswap-base"] === "string" ? { llamaswapBase: flags["llamaswap-base"] } : {}),
+  });
+  // Persist the chained receipt (audit trail) unless --no-receipt.
+  if (result.receipt && flags["no-receipt"] !== true) {
+    // Default location: next to the dispatch, named <dispatch basename without extension>.citation-receipt.json.
+    const out =
+      typeof flags.receipt === "string"
+        ? resolve(flags.receipt)
+        : resolve(dirname(dispatch), `${basename(dispatch).replace(/\.[^.]+$/, "")}.citation-receipt.json`);
+    try {
+      writeFileSync(out, JSON.stringify(result.receipt, null, 2));
+      // Recorded on the result before printing so both the JSON and the report show the path.
+      result.receipt_path = out;
+    } catch (err) {
+      // Best-effort: a failed receipt write only warns; the verdict and exit code are unaffected.
+      console.error(`warning: could not write the citation receipt to ${out}: ${err.message}`);
+    }
+  }
+  if (flags.json === true) {
+    console.log(JSON.stringify(result, null, 2));
+  } else {
+    printReport(dispatch, result);
+  }
+  // NOTE(review): process.exit() does not wait for pending asynchronous stdout writes — confirm
+  // that large --json output is not truncated when stdout is a pipe.
+  process.exit(exitCodeFor(result));
+}
+/**
+ * Translate a gate result into the process exit code that scripts and CI branch on.
+ *
+ * Precedence (first match wins):
+ *   20  blocking — checked before `pass`, so a contradictory accept cannot hide the hard halt
+ *    0  accept
+ *    2  no resolvable citations were found
+ *   30  escalate (verifier unreachable / low-confidence — a closed gate)
+ *   10  anything else (revise)
+ *
+ * @param {{ blocking?: boolean, pass?: boolean, reason?: string, verdict?: string }} result
+ * @returns {number}
+ */
+export function exitCodeFor(result) {
+  const { blocking, pass, reason, verdict } = result;
+  if (blocking) {
+    return 20;
+  }
+  if (pass) {
+    return 0;
+  }
+  if (reason === "no_citations") {
+    return 2;
+  }
+  return verdict === "escalate" ? 30 : 10;
+}
+/**
+ * Split raw CLI arguments into `--flag` options and positional arguments.
+ *
+ * Accepted forms: `--name value`, `--name=value`, and bare `--name` (stored as `true`).
+ * The switch-only flags (`--json`, `--local-panel`, `--no-receipt`) never consume the following
+ * token, so `--json dispatch.md` keeps `dispatch.md` as the positional dispatch path instead of
+ * swallowing it as the flag's value (which left the switch off and the dispatch missing).
+ *
+ * @param {string[]} args
+ * @returns {{ flags: Record<string, string|true>, positional: string[] }}
+ */
+function parseArgs(args) {
+  // Flags the command only ever tests with `=== true`; they take no value.
+  const switches = new Set(["json", "local-panel", "no-receipt"]);
+  const flags = {};
+  const positional = [];
+  for (let i = 0; i < args.length; i++) {
+    const a = args[i];
+    if (!a.startsWith("--")) {
+      positional.push(a);
+      continue;
+    }
+    const name = a.slice(2);
+    const eq = name.indexOf("=");
+    if (eq > 0) {
+      // `--name=value`: the value is everything after the first `=`.
+      flags[name.slice(0, eq)] = name.slice(eq + 1);
+      continue;
+    }
+    const next = args[i + 1];
+    if (!switches.has(name) && next !== undefined && !next.startsWith("--")) {
+      flags[name] = next;
+      i += 1;
+    } else {
+      flags[name] = true;
+    }
+  }
+  return { flags, positional };
+}
+/**
+ * Print the human-readable gate report to stdout.
+ *
+ * Sections, in order: headline tag, dispatch + verdict summary, optional reason, every citation
+ * whose verdict is not `accept`, up to ten unparsed items, the local-panel summary (only when
+ * `r.local_panel` is present), the receipt path, and a closing BLOCKING / ADVISORY line.
+ *
+ * @param {string} dispatch  the dispatch argument, echoed as-is
+ * @param {object} r         gate result; reads `citations`, `duration`, `verdict`, `pass`,
+ *                           `blocking`, `advisory` and the optional fields named above
+ */
+function printReport(dispatch, r) {
+  const tag = r.pass ? "ACCEPT" : r.blocking ? "REFUSE (blocking)" : "NEEDS REVIEW";
+  console.log(`\nroleos verify-citations — ${tag}\n`);
+  console.log(`Dispatch: ${dispatch}`);
+  console.log(`Verdict:  ${r.verdict}  (${r.citations.length} citation(s) checked, ${r.duration}ms)`);
+  if (r.reason) console.log(`Reason:   ${r.reason} — ${r.detail || ""}`);
+  for (const c of r.citations) {
+    // Accepted citations are not listed; only items needing attention are shown.
+    if (c.verdict === "accept") continue;
+    const mark = c.existence === "fabricated" ? "DROP" : (c.action || c.verdict);
+    console.log(`  - [${mark}] ${c.identifier || c.id} — ${c.detail || c.finding_match || c.existence}`);
+    if (c.span) console.log(`      source span: ${c.span}`);
+  }
+  if (r.unparsed && r.unparsed.length) {
+    console.log(
+      `\n  ${r.unparsed.length} item(s) looked like citations but had no resolvable arXiv/DOI id (verify manually):`,
+    );
+    // The count above is the full total; the listing is capped at 10 items of 120 characters.
+    for (const u of r.unparsed.slice(0, 10)) console.log(`    ? ${u.slice(0, 120)}`);
+  }
+  if (r.local_panel) {
+    const p = r.local_panel;
+    const seats = p.seats && p.seats.length ? p.seats.join(", ") : "(none reached)";
+    console.log(`\nLocal panel: ${p.checked} citation(s) re-checked by [${seats}]${p.reachable ? "" : " — UNREACHABLE"}`);
+    for (const d of p.disagreements || []) {
+      console.log(`  - [DISAGREE] ${d.identifier || d.id} — prism: ${d.prism}, panel: ${d.panel}`);
+    }
+  }
+  if (r.receipt_path) console.log(`\nReceipt: ${r.receipt_path}`);
+  if (r.blocking) {
+    console.log(
+      `\nBLOCKING: a cited paper did not resolve in arXiv/Crossref (likely fabricated). Reject the dispatch.`,
+    );
+  } else if (r.advisory) {
+    console.log(
+      `\nADVISORY: citations resolved but need revision / human review — accept-with-notes or escalate per the items above.`,
+    );
+  }
+}

package/src/verify-citations.mjs ADDED Viewed

@@ -0,0 +1,523 @@
+/**
+ * Citation-Verification Gate — verifies a research dispatch's citations via the external
+ * `prism verify` CLI (a family-different, reasoning-stripped verifier) and gates the dispatch
+ * on the verdict. role-os is the GENERATOR; prism is the sound external CRITIC (LLM-Modulo,
+ * Kambhampati 2024 arXiv:2402.01817) — role-os never grades its own homework.
+ *
+ * Three tiers keyed to the FAILURE SOURCE (study-swarm wf_20651368-297):
+ *   - existence `fabricated` (deterministic arXiv/Crossref miss) -> BLOCKING hard halt
+ *   - metadata / numeric / groundedness `contradicted`           -> advisory: revise
+ *   - `unresolvable` / `not_addressed` / verifier-low-confidence  -> advisory: escalate (human)
+ *   - all `accept`                                                -> pass
+ * An unreachable verifier ESCALATES, never default-accepts ("an unreachable gate is a closed
+ * gate"). See design/citation-verification-runner.md. Peer to src/swarm/build-gate.mjs.
+ */
+import { execFileSync } from "node:child_process";
+import { mkdtempSync, writeFileSync, rmSync, readFileSync, existsSync } from "node:fs";
+import { join, extname } from "node:path";
+import { tmpdir } from "node:os";
+import { createHash } from "node:crypto";
+import { runOffloadPanel, applyLocalPanel, buildEvidence } from "./citation-panel.mjs";
+// ── Identifier patterns (copy-only — the extractor never invents an identifier) ──────────────
+// Matches `arXiv:2402.01817`, `arXiv 2402.01817`, AND URL forms `arxiv.org/abs/2402.01817`,
+// `.../pdf/...`, versioned, and old-style `hep-th/9901001` (the most common real citation format).
+// Case-insensitive; capture group 1 is the bare id without the `arXiv` prefix.
+const ARXIV =
+  /arxiv(?:\.org)?[:\s/]+(?:(?:abs|pdf)\/)?(\d{4}\.\d{4,5}(?:v\d+)?|[a-z-]+(?:\.[A-Z]{2})?\/\d{7}(?:v\d+)?)/i;
+// Matches `10.<4–9 digits>/<suffix>`; the suffix runs until whitespace or a closing bracket,
+// quote or angle bracket. Capture group 1 is the whole DOI; matchIdentifier trims any trailing
+// `.`, `,` or `;` afterwards.
+const DOI = /\b(10\.\d{4,9}\/[^\s)\]}"'<>]+)/;
+/**
+ * @typedef {{ id: string|null, identifier: string, claim: string, authors: string, year: string }} Citation
+ */
+// ── Extraction ───────────────────────────────────────────────────────────────────────────────
+/**
+ * Pull citation records out of a research dispatch written as markdown prose.
+ *
+ * Extraction is deterministic and COPY-ONLY: identifier, claim, authors and year are lifted
+ * verbatim from each item and a missing field is never filled in from memory. Only items that
+ * carry an arXiv or DOI identifier become citations (numbered `c1`, `c2`, … in document order).
+ * Items that merely look like a citation, and items that cite more than one source (only the
+ * first identifier is verified), are reported in `unparsed` so that no miss is silent.
+ *
+ * @param {string} markdown
+ * @returns {{ citations: Citation[], unparsed: string[] }}
+ */
+export function extractCitations(markdown) {
+  const found = [];
+  const missed = [];
+  for (const item of splitItems(String(markdown))) {
+    const identifier = matchIdentifier(item);
+    if (identifier) {
+      found.push({
+        id: `c${found.length + 1}`,
+        identifier,
+        claim: extractClaim(item),
+        authors: extractAuthors(item),
+        year: extractYear(item),
+      });
+      // Extra identifiers in the same item are not verified — make that visible.
+      if (countIdentifiers(item) > 1) {
+        missed.push(`(item cites multiple sources — only the first was verified) ${oneLine(item).slice(0, 120)}`);
+      }
+    } else if (looksLikeCitation(item)) {
+      missed.push(oneLine(item));
+    }
+  }
+  return { citations: found, unparsed: missed };
+}
+/**
+ * Count the DISTINCT arXiv/DOI identifiers mentioned in an item, to flag multi-cite items whose
+ * extra sources are not verified.
+ *
+ * Mentions of the same work are collapsed: `arXiv:2402.01817`, its `arxiv.org/abs/…` URL, a
+ * versioned form (`…v2`) and the arXiv-issued DOI (`10.48550/arXiv.…`) count once, and DOIs are
+ * compared case-insensitively with trailing sentence punctuation removed. Counting raw matches
+ * instead would report a single paper cited by id and URL as "multiple sources".
+ *
+ * @param {string} text
+ * @returns {number}
+ */
+function countIdentifiers(text) {
+  const seen = new Set();
+  for (const m of text.matchAll(new RegExp(ARXIV.source, "ig"))) {
+    seen.add(`arxiv:${m[1].toLowerCase().replace(/v\d+$/, "")}`);
+  }
+  for (const m of text.matchAll(new RegExp(DOI.source, "ig"))) {
+    const doi = m[1].toLowerCase().replace(/[.,;]+$/, "");
+    // arXiv mints DOIs of the form 10.48550/arXiv.<id>; fold them onto the arXiv id.
+    const arxivDoi = doi.match(/^10\.48550\/arxiv\.(.+)$/);
+    seen.add(arxivDoi ? `arxiv:${arxivDoi[1].replace(/v\d+$/, "")}` : `doi:${doi}`);
+  }
+  return seen.size;
+}
+/**
+ * Return the identifier to verify for a piece of text: an arXiv id wins (rendered as
+ * `arXiv:<id>`), otherwise the first DOI with trailing `.`, `,` or `;` removed, otherwise null.
+ */
+function matchIdentifier(text) {
+  const [, arxivId] = text.match(ARXIV) ?? [];
+  if (arxivId !== undefined) {
+    return `arXiv:${arxivId}`;
+  }
+  const [, doi] = text.match(DOI) ?? [];
+  return doi === undefined ? null : doi.replace(/[.,;]+$/, "");
+}
+/**
+ * Partition markdown into logical items. A blank line closes the current item and a list
+ * marker (`1.`, `1)`, `-`, `*`, `+`) opens a new one; the lines of an item are joined with a
+ * single space and trimmed.
+ */
+function splitItems(markdown) {
+  const markerRe = /^\s*(?:\d+[.)]|[-*+])\s+/;
+  const groups = [];
+  let open = null; // lines of the item being accumulated, or null between items
+  for (const line of markdown.split(/\r?\n/)) {
+    if (line.trim() === "") {
+      open = null;
+      continue;
+    }
+    if (open === null || markerRe.test(line)) {
+      open = [];
+      groups.push(open);
+    }
+    open.push(line);
+  }
+  return groups.map((group) => group.join(" ").trim()).filter(Boolean);
+}
+/** Remove a leading list marker and every `*`, backtick and `_` character, then trim. */
+function stripMarkers(raw) {
+  const withoutBullet = raw.replace(/^\s*(?:\d+[.)]|[-*+])\s+/, "");
+  const withoutEmphasis = withoutBullet.replace(/[*`_]/g, "");
+  return withoutEmphasis.trim();
+}
+/** Render an item on one display line: drop the leading list marker and squeeze whitespace runs. */
+function oneLine(raw) {
+  const body = raw.replace(/^\s*(?:\d+[.)]|[-*+])\s+/, "");
+  return body.split(/\s+/).join(" ").trim();
+}
+/**
+ * Pick the claim text of an item: the first non-blank `**bold**` span if there is one, otherwise
+ * the first sentence of the marker-stripped text, otherwise that text itself. The result is
+ * capped at 500 characters and is never empty (falls back to "(no claim text)").
+ */
+function extractClaim(raw) {
+  const boldText = raw.match(/\*\*(.+?)\*\*/)?.[1].trim();
+  if (boldText) {
+    return boldText.slice(0, 500);
+  }
+  const plain = stripMarkers(raw);
+  const firstSentence = plain.match(/^(.{8,260}?[.!?])(?:\s|$)/);
+  const candidate = (firstSentence === null ? plain : firstSentence[1]).slice(0, 500).trim();
+  return candidate || plain.slice(0, 120).trim() || "(no claim text)";
+}
+/**
+ * Return the first four-digit year (1900–2099) written in the item's prose, or "" if none.
+ *
+ * Identifiers are blanked out before searching: the YYMM prefix of an arXiv id (`2005.14165`,
+ * `1907.11692`) and digit runs inside a DOI (`…cell.2020.05.031`) look like years but are not,
+ * and copying one into the `year` field would break the extractor's copy-only rule.
+ *
+ * @param {string} raw
+ * @returns {string}
+ */
+function extractYear(raw) {
+  const prose = raw
+    .replace(new RegExp(ARXIV.source, "ig"), " ")
+    .replace(new RegExp(DOI.source, "ig"), " ");
+  const m = prose.match(/\b(?:19|20)\d{2}\b/);
+  return m ? m[0] : "";
+}
+/**
+ * Best-effort authors (metadata only — prism resolves by identifier, not by this).
+ *
+ * Takes the run of capitalised names (optionally joined by `,`, `&`, `and`, `et al.`) that sits
+ * immediately before the first year-like token. Bold spans are removed BEFORE the emphasis
+ * characters are stripped: `stripMarkers` deletes every `*`, so removing `**…**` afterwards can
+ * never match and capitalised words of a bold claim would leak into the author string.
+ *
+ * @param {string} raw
+ * @returns {string} at most 120 characters; "" when no author-like text is found
+ */
+function extractAuthors(raw) {
+  const withoutBold = raw.replace(/\*\*(.+?)\*\*/g, " ");
+  const beforeYear = stripMarkers(withoutBold).split(/\b(?:19|20)\d{2}\b/)[0] || "";
+  const m = beforeYear.match(/([A-Z][\w.'-]+(?:[\s,]+(?:et al\.?|&|and|[A-Z][\w.'-]+)){0,6})\s*$/);
+  return (m ? m[1] : "").replace(/[,\s]+$/, "").trim().slice(0, 120);
+}
+/**
+ * Heuristic: an item looks like a citation when it contains a year (1900–2099) AND at least one
+ * citation cue — `et al`, `doi`, `rfc`, `arxiv`, a URL, or a capitalised name followed by
+ * `&` / `and` / `et al`.
+ */
+function looksLikeCitation(raw) {
+  const hasYear = /\b(?:19|20)\d{2}\b/.test(raw);
+  if (!hasYear) {
+    return false;
+  }
+  return /(et al\.?|\bdoi\b|\brfc\b|arxiv|https?:\/\/|[A-Z][a-z]+\s+(?:&|and|et al))/i.test(raw);
+}
+// ── Gate (maps prism's verdict to the three tiers) ─────────────────────────────────────────────
+/**
+ * @typedef {object} GateResult
+ * @property {string} verdict           accept | revise | refuse | escalate
+ * @property {boolean} pass             true iff verdict === "accept"
+ * @property {boolean} blocking         true iff any citation failed the deterministic existence floor
+ * @property {boolean} advisory         needs attention but not a fabrication (revise/escalate)
+ * @property {object[]} citations       per-citation result
+ * @property {string} [reason]
+ * @property {string} [detail]
+ */
+/**
+ * Map a parsed `prism verify` response to the three-tier gate. role-os enforces the existence
+ * floor itself: blocking dominates accept, and an accept with no adjudicated results is not trusted.
+ *
+ * prism's stdout is untrusted input, so its shape is validated instead of assumed: a
+ * `citation_results` that is not an array, or that contains non-object entries, ESCALATES with
+ * `malformed_verifier_output` rather than throwing, and a missing / non-string `verdict` is read
+ * as "escalate". A fabricated citation among the well-formed entries still blocks first.
+ *
+ * @param {object} prismResponse  parsed VerifyResponse JSON, or `{ error: {...} }`
+ * @returns {GateResult}
+ */
+export function gateCitations(prismResponse) {
+  if (!prismResponse || typeof prismResponse !== "object") {
+    return blockedResult("escalate", "malformed_verifier_output", "verifier returned no object");
+  }
+  if (prismResponse.error) {
+    // prism refused to verify at all (e.g. INVALID_ARTIFACT, VERIFIER_UNAVAILABLE) -> escalate.
+    return {
+      verdict: "escalate",
+      pass: false,
+      blocking: false,
+      advisory: true,
+      reason: prismResponse.error.reason || "verifier_error",
+      detail: prismResponse.error.detail || "",
+      citations: [],
+    };
+  }
+  const rawVerdict =
+    typeof prismResponse.verdict === "string" && prismResponse.verdict !== ""
+      ? prismResponse.verdict
+      : "escalate";
+  // Keep only well-formed entries and remember whether anything had to be discarded.
+  const rawResults = prismResponse.citation_results ?? [];
+  const entries = Array.isArray(rawResults) ? rawResults : [];
+  const wellFormed = entries.filter((cr) => cr !== null && typeof cr === "object");
+  const malformed = !Array.isArray(rawResults) || wellFormed.length !== entries.length;
+  const citations = wellFormed.map((cr) => ({
+    id: cr.citation_id ?? null,
+    identifier: cr.identifier ?? null,
+    existence: cr.existence,
+    finding_match: cr.finding_match,
+    verdict: cr.verdict,
+    action: cr.action,
+    detail: cr.detail,
+    span: cr.supporting_span ?? null,
+    source_title: cr.source_title ?? null,
+    source_abstract: cr.source_abstract ?? null,
+  }));
+  // role-os enforces the deterministic floor ITSELF (it does not delegate it to prism's top-level
+  // aggregation): any fabricated-existence citation BLOCKS and dominates a top-level "accept", so a
+  // contradictory or drifted prism response can never shadow the hard halt.
+  const blocking = citations.some((c) => c.existence === "fabricated");
+  if (blocking) {
+    return { verdict: "refuse", pass: false, blocking: true, advisory: false, citations };
+  }
+  // A response whose results could not all be read is never accepted on its top-level verdict.
+  if (malformed) {
+    return {
+      verdict: "escalate",
+      pass: false,
+      blocking: false,
+      advisory: true,
+      reason: "malformed_verifier_output",
+      detail: "prism citation_results was not an array of result objects",
+      citations,
+    };
+  }
+  // A clean accept must actually adjudicate citations — an "accept" carrying ZERO results is not
+  // trusted (prism stdout is an untrusted boundary input). (Exact submitted-vs-adjudicated count
+  // cross-check is a v2 hardening.)
+  if (rawVerdict === "accept" && citations.length === 0) {
+    return {
+      verdict: "escalate",
+      pass: false,
+      blocking: false,
+      advisory: true,
+      reason: "incomplete_adjudication",
+      detail: "prism returned no adjudicated citations for an accept verdict",
+      citations,
+    };
+  }
+  const pass = rawVerdict === "accept";
+  return { verdict: rawVerdict, pass, blocking: false, advisory: !pass, citations };
+}
+/** Build a non-passing, non-blocking, advisory gate result that carries no citations. */
+function blockedResult(verdict, reason, detail) {
+  const closedGate = { pass: false, blocking: false, advisory: true };
+  return { verdict, ...closedGate, reason, detail, citations: [] };
+}
+// ── Runner (orchestrates extract -> shell prism -> gate -> receipt) ────────────────────────────
+/**
+ * Run the citation gate over a dispatch (file path .md/.json, or a markdown string).
+ *
+ * Steps: load/extract citations -> write them to a temporary artifact file -> run prism on it ->
+ * map the response to a gate result -> tighten on unparsed items and (optionally) the local
+ * panel -> build the receipt. The two early returns (no citations, verifier unreachable) carry
+ * no receipt.
+ *
+ * @param {string} input
+ * @param {object} [options]
+ * @param {string} [options.prismCmd]        default: env PRISM_CMD || "prism"
+ * @param {string} [options.provider]        default: "ollama" (local, zero-cost)
+ * @param {string} [options.callerFamily]    default: "anthropic" (excluded from the verifier)
+ * @param {string} [options.intent]
+ * @param {number} [options.timeout]         per-call ms (default 120000)
+ * @param {number} [options.retries]         transient retries (default 1)
+ * @param {Function} [options.exec]          injectable (cmd, args, {timeout, cwd}) -> {status, stdout, stderr}
+ * @param {string} [options.cwd]
+ * @param {boolean} [options.localPanel]     run the local-panel seat on a passing gate (default false)
+ * @param {Function} [options.offloadExec]   forwarded to runOffloadPanel as `exec` when set
+ * @param {string} [options.offloadPython]   forwarded to runOffloadPanel as `python` when set
+ * @param {string} [options.offloadScript]   forwarded to runOffloadPanel as `script` when set
+ * @param {string} [options.llamaswapBase]   forwarded to runOffloadPanel as `base` when set
+ * @returns {GateResult & { unparsed: string[], receipt?: object, duration: number }}
+ */
+export function runCitationGate(input, options = {}) {
+  const {
+    prismCmd = process.env.PRISM_CMD || "prism",
+    provider = "ollama",
+    callerFamily = "anthropic",
+    intent = "verify each citation exists and the finding matches the source",
+    timeout = 120_000,
+    retries = 1,
+    exec = defaultExec,
+    cwd = process.cwd(),
+    // Local-panel seat (opt-in): a family-different entailment panel (offload, on local models)
+    // re-checks prism's `supported` citations. Monotone-tightening; off by default.
+    localPanel = false,
+    offloadExec,
+    offloadPython,
+    offloadScript,
+    llamaswapBase,
+  } = options;
+  const start = Date.now();
+  const { citations, unparsed } = loadCitations(input);
+  // Nothing to verify: report it as a closed gate without invoking prism.
+  if (citations.length === 0) {
+    return {
+      ...blockedResult("escalate", "no_citations", "no resolvable arXiv/DOI citations were extracted"),
+      unparsed,
+      duration: Date.now() - start,
+    };
+  }
+  // The artifact is exactly what prism receives and what the receipt hashes.
+  const artifact = citations.map((c) => ({
+    id: c.id,
+    identifier: c.identifier,
+    claim: c.claim,
+    authors: c.authors || "",
+    year: c.year || "",
+  }));
+  // prism reads the artifact from a file (`-a @<file>`), so it is staged in a fresh temp
+  // directory that is removed whether or not the run succeeds.
+  const dir = mkdtempSync(join(tmpdir(), "roleos-cite-"));
+  const file = join(dir, "citations.json");
+  let result;
+  try {
+    writeFileSync(file, JSON.stringify(artifact));
+    result = shellPrism({ prismCmd, file, intent, callerFamily, provider, timeout, retries, exec, cwd });
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+  if (!result.ok) {
+    // An unreachable gate is a closed gate -> escalate, NEVER default-accept.
+    return {
+      ...blockedResult("escalate", "verifier_unreachable", result.detail),
+      unparsed,
+      duration: Date.now() - start,
+    };
+  }
+  let gate = gateCitations(result.response);
+  // A clean accept also requires that extraction left NO citation-like item unverified — a non-empty
+  // `unparsed` (e.g. a citation format the extractor missed) must not pass as fully verified.
+  if (gate.pass && unparsed.length > 0) {
+    gate = {
+      ...gate,
+      verdict: "escalate",
+      pass: false,
+      advisory: true,
+      reason: "unparsed_citations",
+      detail: `${unparsed.length} citation-like item(s) could not be parsed/resolved`,
+    };
+  }
+  // Local-panel seat: re-check prism's `supported` citations with a family-different entailment
+  // panel on local models. Runs only when requested AND the gate is still passing — it can only
+  // tighten, so there is nothing to challenge on an already-blocking/advisory gate.
+  let panel = null;
+  if (localPanel && gate.pass) {
+    const supported = buildPanelInput(citations, gate.citations);
+    if (supported.length > 0) {
+      panel = runOffloadPanel(supported, {
+        ...(offloadExec ? { exec: offloadExec } : {}),
+        ...(offloadPython ? { python: offloadPython } : {}),
+        ...(offloadScript ? { script: offloadScript } : {}),
+        ...(llamaswapBase ? { base: llamaswapBase } : {}),
+        cwd,
+      });
+      gate = applyLocalPanel(gate, panel);
+    }
+  }
+  // The receipt records the final gate (after any tightening) plus the panel outcome, if any.
+  const receipt = buildReceipt({ input, artifact, response: result.response, gate, panel });
+  return { ...gate, unparsed, receipt, duration: Date.now() - start };
+}
+/**
+ * Assemble what the local panel re-checks: only the citations prism marked `supported`, each
+ * paired with its claim (looked up by citation id, then by identifier) and the evidence derived
+ * from prism's result. Citations with no claim text are left out.
+ */
+function buildPanelInput(artifactCitations, gateCitations) {
+  const claimById = new Map(
+    artifactCitations.filter((c) => c.id).map((c) => [c.id, c.claim]),
+  );
+  const claimByIdent = new Map(
+    artifactCitations.filter((c) => c.identifier).map((c) => [c.identifier, c.claim]),
+  );
+  return gateCitations
+    .filter((gc) => gc.finding_match === "supported")
+    .map((gc) => ({ gc, claim: claimById.get(gc.id) ?? claimByIdent.get(gc.identifier) ?? "" }))
+    .filter(({ claim }) => claim)
+    .map(({ gc, claim }) => ({
+      id: gc.id,
+      identifier: gc.identifier,
+      claim,
+      evidence: buildEvidence(gc),
+    }));
+}
+/**
+ * Resolve the gate input to citations.
+ *
+ * - An existing `.json` file: a JSON array of citation objects, normalized one by one; objects
+ *   that carry a claim but no resolvable identifier are reported in `unparsed`.
+ * - An existing `.md` file: its content goes through `extractCitations`.
+ * - Anything else: treated as inline markdown.
+ *
+ * Inputs that cannot yield citations explain themselves through `unparsed` instead of looking
+ * like an empty dispatch: invalid JSON, a JSON document that is not an array, and a single-line
+ * input ending in `.md` / `.json` that names no existing file (a mistyped path).
+ *
+ * @param {string} input
+ * @returns {{ citations: object[], unparsed: string[] }}
+ */
+function loadCitations(input) {
+  const looksLikePath =
+    typeof input === "string" && (input.endsWith(".md") || input.endsWith(".json"));
+  if (looksLikePath && existsSync(input)) {
+    const content = readFileSync(input, "utf8");
+    if (extname(input) !== ".json") return extractCitations(content);
+    let arr;
+    try {
+      arr = JSON.parse(content);
+    } catch {
+      return { citations: [], unparsed: ["(.json file was not valid JSON)"] };
+    }
+    if (!Array.isArray(arr)) {
+      return { citations: [], unparsed: ["(.json file was not a JSON array of citations)"] };
+    }
+    const citations = [];
+    const unparsed = [];
+    for (const item of arr) {
+      const norm = normalizeJsonCitation(item);
+      if (norm) citations.push(norm);
+      else if (item && typeof item === "object" && (item.claim || item.finding)) {
+        unparsed.push(oneLine(JSON.stringify(item)).slice(0, 160)); // a claim with no resolvable id
+      }
+    }
+    return { citations, unparsed };
+  }
+  const extracted = extractCitations(String(input));
+  // A one-line string with a dispatch extension and no citations in it is a path that does not
+  // exist, not an empty dispatch — say so.
+  if (looksLikePath && !/[\r\n]/.test(input) && extracted.citations.length === 0) {
+    return {
+      citations: [],
+      unparsed: [...extracted.unparsed, `(dispatch file not found: ${input})`],
+    };
+  }
+  return extracted;
+}
+/**
+ * Normalize one entry of a citations JSON array. Returns null unless the entry is an object
+ * with a non-blank `claim` (or `finding`) and a resolvable arXiv/DOI identifier, looked for in
+ * `identifier`, `url`, `doi`, `arxiv` and finally in the claim text itself.
+ */
+function normalizeJsonCitation(c) {
+  if (c === null || typeof c !== "object") {
+    return null;
+  }
+  const claim = (c.claim || c.finding || "").toString().trim();
+  if (!claim) {
+    return null;
+  }
+  const idSources = [c.identifier, c.url, c.doi, c.arxiv].filter(Boolean);
+  const identifier = matchIdentifier(idSources.join(" ")) || matchIdentifier(claim);
+  if (!identifier) {
+    return null;
+  }
+  const { id, authors, year } = c;
+  return {
+    id: id || null,
+    identifier,
+    claim: claim.slice(0, 500),
+    authors: (authors || "").toString(),
+    year: (year || "").toString(),
+  };
+}
+/**
+ * Invoke `prism verify` on the artifact file and return its parsed JSON.
+ *
+ * Makes up to `retries + 1` attempts. An attempt fails when `exec` throws or when stdout holds no
+ * parseable JSON; a missing binary (ENOENT) stops retrying at once. Any parseable JSON counts as
+ * success regardless of the exit status, which is reported as `exitCode`.
+ *
+ * @returns {{ ok: true, response: any, exitCode: number } | { ok: false, detail: string }}
+ */
+function shellPrism({ prismCmd, file, intent, callerFamily, provider, timeout, retries, exec, cwd }) {
+  const argv = [
+    "verify", "-a", `@${file}`, "--type", "citations",
+    "-i", intent, "--caller-family", callerFamily, "--provider", provider,
+  ];
+  let lastFailure = "";
+  let attempt = 0;
+  while (attempt <= retries) {
+    attempt += 1;
+    let outcome;
+    try {
+      outcome = exec(prismCmd, argv, { timeout, cwd });
+    } catch (err) {
+      lastFailure = `failed to run ${prismCmd}: ${err.code || err.message}`;
+      if (err.code === "ENOENT") {
+        break; // the binary is missing — retrying cannot help
+      }
+      continue;
+    }
+    const response = tryParseJson((outcome.stdout || "").toString());
+    if (response) {
+      return { ok: true, response, exitCode: outcome.status ?? 0 };
+    }
+    lastFailure = `prism produced no parseable JSON (exit ${outcome.status}): ${(outcome.stderr || outcome.stdout || "").toString().slice(0, 300)}`;
+  }
+  return { ok: false, detail: lastFailure };
+}
+/**
+ * Default `exec` implementation: runs the command with execFileSync and reports
+ * `{ status, stdout, stderr }`. A non-zero exit is NOT an error here — prism's stdout is still
+ * captured so a refuse/error response can be parsed. Only a missing binary (ENOENT) is rethrown.
+ */
+function defaultExec(cmd, args, { timeout, cwd }) {
+  // No shell is involved: arguments reach the program verbatim (the intent string has spaces).
+  // `cmd` must be a real executable, not a shell builtin — on Windows point PRISM_CMD at the
+  // full path of prism.exe (a real PE shim, not a .cmd), or use a POSIX bare name on PATH.
+  const spawnOptions = {
+    cwd,
+    timeout,
+    encoding: "utf8",
+    stdio: ["ignore", "pipe", "pipe"],
+    maxBuffer: 16 * 1024 * 1024,
+  };
+  try {
+    return { status: 0, stdout: execFileSync(cmd, args, spawnOptions), stderr: "" };
+  } catch (err) {
+    if (err.code === "ENOENT") {
+      throw err; // missing binary -> the caller escalates
+    }
+    const { status, stdout, stderr } = err;
+    return {
+      status: status ?? 1,
+      stdout: (stdout || "").toString(),
+      stderr: (stderr || "").toString(),
+    };
+  }
+}
+/**
+ * Parse JSON leniently: first the whole trimmed text, then — if that fails — the span from the
+ * first `{` to the last `}` (tolerates log lines around the payload). Returns null when the text
+ * is empty or neither attempt parses.
+ */
+function tryParseJson(text) {
+  const trimmed = (text || "").trim();
+  if (trimmed === "") {
+    return null;
+  }
+  const attempt = (candidate) => {
+    try {
+      return { ok: true, value: JSON.parse(candidate) };
+    } catch {
+      return { ok: false };
+    }
+  };
+  const whole = attempt(trimmed);
+  if (whole.ok) {
+    return whole.value;
+  }
+  const open = trimmed.indexOf("{");
+  const close = trimmed.lastIndexOf("}");
+  if (open === -1 || close <= open) {
+    return null;
+  }
+  const inner = attempt(trimmed.slice(open, close + 1));
+  return inner.ok ? inner.value : null;
+}
+/**
+ * Build the chained audit receipt for one gate run.
+ *
+ * `chain_sha256` hashes the artifact digest, prism's receipt signature, the final gate verdict
+ * and (when the local panel ran) a digest of the panel's seats and per-citation results, joined
+ * with `|`. prism's receipt is untrusted input: `retrieval_pins` entries that are not objects
+ * are skipped instead of crashing receipt construction after the verdict is already decided.
+ *
+ * @param {object} p
+ * @param {string} p.input        recorded verbatim when shorter than 256 chars, else "(inline)"
+ * @param {object[]} p.artifact   the citations submitted to prism
+ * @param {object} p.response     prism's parsed response
+ * @param {object} p.gate         final gate result (reads verdict, blocking, advisory)
+ * @param {object|null} [p.panel] local-panel outcome, or null when it did not run
+ * @returns {object} receipt with schema "roleos-citation-receipt/v1"
+ */
+function buildReceipt({ input, artifact, response, gate, panel = null }) {
+  const citationsHash = sha256(JSON.stringify(artifact));
+  const prismReceipt = response.receipt || {};
+  const pins = Array.isArray(prismReceipt.retrieval_pins)
+    ? prismReceipt.retrieval_pins.filter((p) => p !== null && typeof p === "object")
+    : [];
+  // The local-panel seat folds into the chain via gate.verdict (a disagreement downgrades it to
+  // escalate) AND via its own digest, so neither prism's verdict nor the panel's can be altered
+  // without breaking the chain.
+  const panelDigest = panel
+    ? sha256(JSON.stringify({ seats: panel.seats, perCitation: panel.perCitation }))
+    : "";
+  const chain = sha256([citationsHash, prismReceipt.signature || "", gate.verdict, panelDigest].join("|"));
+  return {
+    schema: "roleos-citation-receipt/v1",
+    kind: "citation-verification",
+    tool: "roleos verify-citations",
+    input: typeof input === "string" && input.length < 256 ? input : "(inline)",
+    verdict: gate.verdict,
+    blocking: gate.blocking,
+    advisory: gate.advisory,
+    citations_sha256: citationsHash,
+    // Chain to prism's inner HMAC receipt: verifying prism's signature is what lets role-os
+    // trust a verdict it did not itself compute (separate keys; Haber-Stornetta 1991).
+    prism_receipt: {
+      id: prismReceipt.id || null,
+      signature: prismReceipt.signature || null,
+      verdict: response.verdict || null,
+    },
+    // Per-citation retrieval pins enable drift detection on re-run (compare source_sha256).
+    retrieval_pins: pins.map((p) => ({
+      id: p.id,
+      identifier: p.identifier,
+      query: p.query,
+      source_sha256: p.source_sha256,
+      existence: p.existence,
+    })),
+    // Local-panel seat (when run): the actual seat models (PIN_PER_STEP), what each citation got,
+    // and any disagreement with prism that downgraded the gate.
+    local_panel: panel
+      ? {
+          seats: panel.seats,
+          reachable: panel.reachable,
+          checked: panel.checked,
+          per_citation: panel.perCitation,
+          disagreements: panel.disagreements,
+        }
+      : null,
+    chain_sha256: chain,
+  };
+}
+/** Hex-encoded SHA-256 digest of `s`. */
+function sha256(s) {
+  const hasher = createHash("sha256");
+  hasher.update(s);
+  return hasher.digest("hex");
+}