npm - rewritable - Versions diffs - 0.1.0 → 0.3.0 - Mend

rewritable 0.1.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/README.md +2 -0
package/bin/rwa.mjs +40 -4
package/package.json +6 -3
package/seeds/rewritable.html +3115 -140
package/src/commands.mjs +121 -5
package/src/import-claude.mjs +336 -0
package/src/import-vision.mjs +156 -0
package/src/import.mjs +289 -6
package/src/seed.mjs +15 -4

package/src/commands.mjs CHANGED Viewed

@@ -1,10 +1,13 @@
 import fs from 'node:fs/promises';
 import path from 'node:path';
-import { fileURLToPath } from 'node:url';
+import { fileURLToPath, pathToFileURL } from 'node:url';
+import { spawn } from 'node:child_process';
 import crypto from 'node:crypto';
 import { loadSeed, applySeedSubs, replaceInlineDoc } from './seed.mjs';
 import { convert } from './import.mjs';
+import { convertPdfViaVision } from './import-vision.mjs';
+import { convertViaClaudeCli } from './import-claude.mjs';
 const here = path.dirname(fileURLToPath(import.meta.url));
 const packageRoot = path.dirname(here);
@@ -53,7 +56,81 @@ function rel(p) {
   return r || p;
 }
-export async function newCmd({ outPath, force }) {
+// Parse a single var out of a .env-style file. Minimal — handles KEY=value,
+// surrounding whitespace, optional matched single/double quotes, leading `export`.
+// Skips blank/comment lines. No interpolation, no multiline values.
+async function readEnvKey(name) {
+  if (process.env[name]) return process.env[name];
+  let text;
+  try {
+    text = await fs.readFile(path.join(process.cwd(), '.env'), 'utf8');
+  } catch (_) { return null; }
+  for (const line of text.split('\n')) {
+    const m = line.match(/^\s*(?:export\s+)?([A-Za-z_][A-Za-z0-9_]*)\s*=\s*(.*?)\s*$/);
+    if (!m || m[1] !== name) continue;
+    let v = m[2];
+    if ((v.startsWith('"') && v.endsWith('"')) || (v.startsWith("'") && v.endsWith("'"))) {
+      v = v.slice(1, -1);
+    }
+    return v || null;
+  }
+  return null;
+}
+// Validate-and-return a backend name. Returns null for invalid input rather
+// than throwing — pre-fill is best-effort; an unknown value just means the
+// user sees the default backend (openrouter) on first paint.
+function validBackend(v) {
+  return ['openrouter', 'ollama', 'lmstudio', 'bridge'].includes(v) ? v : null;
+}
+// Collect URL-param pre-fills from env / ./.env. Returns an object whose keys
+// match the URL params the bootstrap lifts (key, backend, model). Missing or
+// invalid values are omitted; the bootstrap falls back to its defaults.
+async function collectPrefill() {
+  const out = {};
+  const key     = await readEnvKey('OPENROUTER_API_KEY');
+  const backend = validBackend(await readEnvKey('RWA_BACKEND'));
+  const model   = await readEnvKey('RWA_MODEL');
+  if (key)     out.key = key;
+  if (backend) out.backend = backend;
+  if (model)   out.model = model;
+  return out;
+}
+function openFile(target, prefill) {
+  // When any prefill is present we open via a file:// URL with the params so
+  // the bootstrap can lift them into sessionStorage on first paint and scrub
+  // the URL bar via history.replaceState. Without any prefill we use the bare
+  // path so the open command is byte-identical to before.
+  let arg;
+  const params = prefill || {};
+  const hasAny = params.key || params.backend || params.model;
+  if (hasAny) {
+    const u = pathToFileURL(target);
+    if (params.key) u.searchParams.set('key', params.key);
+    if (params.backend) u.searchParams.set('backend', params.backend);
+    if (params.model) u.searchParams.set('model', params.model);
+    arg = u.toString();
+  } else {
+    arg = target;
+  }
+  let cmd, args;
+  if (process.platform === 'darwin') {
+    cmd = 'open'; args = [arg];
+  } else if (process.platform === 'win32') {
+    cmd = 'cmd'; args = ['/c', 'start', '""', arg];
+  } else {
+    cmd = 'xdg-open'; args = [arg];
+  }
+  const child = spawn(cmd, args, { detached: true, stdio: 'ignore' });
+  child.on('error', err => {
+    console.error(`note: could not open file (${err.code || err.message})`);
+  });
+  child.unref();
+}
+export async function newCmd({ outPath, force, open }) {
   const out = path.resolve(outPath || './rewritable.html');
   await ensureWritable(out, force);
   const seed = await loadSeed(SEED_CANDIDATES);
@@ -66,9 +143,21 @@ export async function newCmd({ outPath, force }) {
   });
   await fs.writeFile(out, result, 'utf8');
   console.log(`wrote ${rel(out)}`);
+  if (open) {
+    const prefill = await collectPrefill();
+    if (prefill.key) console.error('note: passing OPENROUTER_API_KEY via ?key= URL parameter');
+    if (prefill.backend) console.error(`note: passing RWA_BACKEND=${prefill.backend} via ?backend= URL parameter`);
+    if (prefill.model) console.error(`note: passing RWA_MODEL=${prefill.model} via ?model= URL parameter`);
+    openFile(out, prefill);
+  }
 }
-export async function importCmd({ inputPath, outPath, force }) {
+export async function importCmd({ inputPath, outPath, force, open, vision, claude, model, timeoutSec }) {
+  if (vision && claude) {
+    const e = new Error('--vision and --claude are mutually exclusive');
+    e.exitCode = 2;
+    throw e;
+  }
   const input = path.resolve(inputPath);
   const inputDir = path.dirname(input);
   const inputBasename = path.basename(input, path.extname(input));
@@ -76,8 +165,28 @@ export async function importCmd({ inputPath, outPath, force }) {
   await ensureWritable(out, force);
   const ext = path.extname(input).toLowerCase().replace(/^\./, '');
-  const contents = await fs.readFile(input, 'utf8');
-  const { html, warnings } = await convert(ext, contents);
+  let html, warnings;
+  if (vision) {
+    if (ext !== 'pdf') {
+      const e = new Error(`--vision is currently only supported for .pdf (got .${ext})`);
+      e.exitCode = 2;
+      throw e;
+    }
+    console.error('note: vision: posting to openrouter…');
+    // Buffer for HTTP base64 encoding.
+    const contents = await fs.readFile(input);
+    ({ html, warnings } = await convertPdfViaVision(contents, { model }));
+  } else if (claude) {
+    console.error(`note: claude: spawning \`claude -p\`…`);
+    // Pass the path; the skill reads the file itself via its own tools.
+    const claudeOpts = timeoutSec ? { timeoutMs: timeoutSec * 1000 } : {};
+    ({ html, warnings } = await convertViaClaudeCli(input, ext, claudeOpts));
+  } else {
+    // Buffer (not utf8 string) — docx and pdf are binary, and text formats
+    // decode internally inside convert().
+    const contents = await fs.readFile(input);
+    ({ html, warnings } = await convert(ext, contents));
+  }
   for (const w of warnings) console.error(`note: ${w}`);
   const seed = await loadSeed(SEED_CANDIDATES);
@@ -97,4 +206,11 @@ export async function importCmd({ inputPath, outPath, force }) {
   const result = replaceInlineDoc(subbed, html);
   await fs.writeFile(out, result, 'utf8');
   console.log(`wrote ${rel(out)}`);
+  if (open) {
+    const prefill = await collectPrefill();
+    if (prefill.key) console.error('note: passing OPENROUTER_API_KEY via ?key= URL parameter');
+    if (prefill.backend) console.error(`note: passing RWA_BACKEND=${prefill.backend} via ?backend= URL parameter`);
+    if (prefill.model) console.error(`note: passing RWA_MODEL=${prefill.model} via ?model= URL parameter`);
+    openFile(out, prefill);
+  }
 }

package/src/import-claude.mjs ADDED Viewed

@@ -0,0 +1,336 @@
+import { spawn } from 'node:child_process';
+import { readFile } from 'node:fs/promises';
+import path from 'node:path';
+import * as pdfjs from 'pdfjs-dist/legacy/build/pdf.mjs';
+// PDF / docx → HTML by spawning the `claude` CLI in print mode.
+//
+// PDFs are processed in PARALLEL: split into page ranges, each chunk
+// handed to its own `claude -p` subprocess concurrently, then merged.
+// Long papers go from sequential N×t to roughly t×ceil(chunks/concurrency).
+//
+// Why: the user's machine has Anthropic's official `pdf` and `docx` skills
+// installed under ~/.claude/skills/. Those skills have rich Python tooling
+// (pypdf, pdfplumber, pandoc, mammoth, LibreOffice) that the rwa CLI itself
+// can't reasonably bundle. Calling `claude -p` lets the agent invoke its
+// skill, run the local Python sandbox, and hand back clean semantic HTML —
+// strictly better fidelity than either the local pdfjs heuristic or the
+// raw-vision OpenRouter path, on documents where the skills apply.
+//
+// Trust model: this spawns a Claude Code subprocess with
+// `--permission-mode bypassPermissions`, which lets the agent run shell
+// commands and write files without prompting. The user already trusts
+// their input file (they're importing it). Document this in HELP.
+const SKILL_FOR_EXT = { pdf: 'pdf', docx: 'docx' };
+const DEFAULT_CHUNK_SIZE = 5;       // pages per chunk
+const DEFAULT_CONCURRENCY = 4;      // simultaneous claude -p subprocesses
+const DEFAULT_TIMEOUT_MS = 1_200_000; // 20 minutes per chunk
+const PROMPT_TEMPLATE = (skill, filePath, pageRange) => {
+  const rangeNote = pageRange
+    ? `\n\nIMPORTANT: Process ONLY pages ${pageRange.start} to ${pageRange.end} (inclusive) of the document. Use the pdf skill's page-range support (pypdf/pdfplumber accept page indices) to extract just that slice. Do not output content from any other pages. The full document is ${pageRange.totalPages} pages; this chunk is pages ${pageRange.start}-${pageRange.end}.`
+    : '';
+  const styleNote = pageRange && pageRange.start > 1
+    ? `\n\nIMPORTANT (chunk ${pageRange.start}-${pageRange.end}): omit the leading <style> and @page rules. Output ONLY the inner content of the .doc wrapper for these pages — start your output with the actual content elements (e.g., <h2>, <p>, <table>...) and end with the last content element. Do NOT include <article>, <style>, <div class="doc">, or </article>, </div>. Just the content of pages ${pageRange.start}-${pageRange.end}, ready to splice into a larger document. The first chunk handled the styling; later chunks contribute content only.`
+    : '';
+  return `Use the ${skill} skill to extract the content of ${filePath} and convert it to a single <article>...</article> element that VISUALLY MATCHES the original document as closely as possible when rendered in a browser.${rangeNote}${styleNote}
+The output will be embedded inside a re-writeable document container that has its own dark-theme CSS. Your <article> must include a leading scoped <style> block that defines its own visual appearance, so the container's theme does not bleed in.
+Required structure (full-document or first-chunk only — see chunk note above):
+<article style="all: revert;">
+  <style>
+    /* Scope every rule to .doc to avoid leaking into the container.
+       Use 'all: revert' or explicit resets to neutralize the container's theme. */
+    .doc { background: ...; color: ...; font-family: ...; padding: ...; max-width: ...; margin: 0 auto; }
+    .doc h1, .doc h2, .doc p, .doc table, .doc th, .doc td { ... }
+    /* etc. */
+  </style>
+  <div class="doc">
+    ... actual content ...
+  </div>
+</article>
+Style requirements (match the source PDF):
+- Background color (usually white #ffffff for printed documents).
+- Text color (usually black #000000 or near-black).
+- Font family — pick a generic match: invoices and letters use sans-serif (Helvetica, Arial, system-ui); academic/literary uses serif (Georgia, Times New Roman); monospaced text uses monospace.
+- Font sizes — match the visual hierarchy (titles bigger, body smaller, footnotes smallest).
+- Text alignment — left, right, center, or justify, matching each block in the source.
+- Right-aligned blocks (sender addresses, dates) MUST remain right-aligned via CSS.
+- Padding/margins around sections that mirror the PDF's vertical density. Crucially, do NOT inflate vertical spacing — if the source fits on N pages, your output should fit on N pages when printed at the source paper size. Prefer tight margins (~0.5em-1em between blocks) over generous ones; a single-page invoice should remain a single-page invoice.
+- Tables — borders, cell padding, header weight, alternating rows or shading where the PDF has them.
+- Bold and italic where used, via <strong>/<em> (preferred) or font-weight/font-style in the scoped CSS.
+Print-fit requirements (REQUIRED for documents that match a paper size):
+- Include an @media print rule inside the scoped <style> block that:
+  * Removes any max-width constraint (so the doc fills the page width).
+  * Sets margin:0 / padding:0 on .doc so the printer's @page margin (default 0.5in) is the only outer margin.
+  * Optionally tightens block spacing further if the source page density is dense.
+  * Uses page-break-inside:avoid on tables, headers, and footer blocks so they don't split awkwardly across pages.
+- Add an @page rule with size matching the source (default A4 if uncertain): @page { size: A4; margin: 0.5in; }
+Content requirements:
+- Use semantic tags: <h1>-<h6>, <p>, <ul>/<ol>/<li>, <table>/<thead>/<tbody>/<tr>/<td>/<th>, <strong>/<em>, <a href="...">.
+- Preserve text exactly. Do not summarize, paraphrase, or reword.
+- Reconstruct multi-column layouts as the source has them: side-by-side blocks via CSS flex/grid in your scoped styles, or as table cells if that fits better.
+- No <img> tags. No <script>. No external resources (no @import, no <link>, no Google Fonts URLs — only system or generic font families).
+- No id attributes. Class names should be scoped under .doc to avoid collisions with the container.
+- Do not include <html>, <head>, <body>, or <!doctype>.
+Print ONLY the final HTML as your last response. No preamble, no markdown fences, no commentary.`;
+};
+/**
+ * @param {string} filePath  Absolute path to the file to import
+ * @param {string} ext       Extension without dot ("pdf" or "docx")
+ * @param {object} [opts]
+ * @param {AbortSignal} [opts.signal]
+ * @param {number} [opts.timeoutMs]    Wall-clock cap PER CHUNK (default 20min)
+ * @param {number} [opts.chunkSize]    Pages per chunk for PDFs (default 5)
+ * @param {number} [opts.concurrency]  Max simultaneous subprocesses (default 4)
+ * @returns {Promise<{ html: string, warnings: string[] }>}
+ */
+export async function convertViaClaudeCli(filePath, ext, opts = {}) {
+  const skill = SKILL_FOR_EXT[ext];
+  if (!skill) {
+    const e = new Error(`--claude only supports .pdf and .docx (got .${ext})`);
+    e.exitCode = 2;
+    throw e;
+  }
+  // docx isn't naturally page-chunkable (no fixed page boundaries inside the
+  // XML). Single call.
+  if (ext !== 'pdf') {
+    const stdout = await runClaude(filePath, PROMPT_TEMPLATE(skill, filePath, null), opts);
+    const html = extractArticle(stdout);
+    if (!html) {
+      const preview = stdout.trim().slice(0, 400);
+      const e = new Error(
+        `claude: output did not contain an <article> element. Output preview:\n${preview}`
+      );
+      e.exitCode = 2;
+      throw e;
+    }
+    return {
+      html,
+      warnings: [`claude: imported via \`claude -p\` (${skill} skill)`],
+    };
+  }
+  const totalPages = await getPdfPageCount(filePath);
+  const chunkSize = opts.chunkSize || DEFAULT_CHUNK_SIZE;
+  const concurrency = opts.concurrency || DEFAULT_CONCURRENCY;
+  const ranges = [];
+  for (let start = 1; start <= totalPages; start += chunkSize) {
+    const end = Math.min(start + chunkSize - 1, totalPages);
+    ranges.push({ start, end, totalPages });
+  }
+  console.error(
+    `note: claude: ${totalPages}-page PDF → ${ranges.length} chunk${ranges.length === 1 ? '' : 's'} of ≤${chunkSize} pages, ${Math.min(concurrency, ranges.length)} parallel`
+  );
+  const htmlChunks = await runWithConcurrency(ranges, concurrency, async (range, idx) => {
+    console.error(`note: claude: chunk ${idx + 1}/${ranges.length} (pages ${range.start}-${range.end}) starting…`);
+    const prompt = PROMPT_TEMPLATE(skill, filePath, range);
+    const html = await runClaude(filePath, prompt, opts);
+    console.error(`note: claude: chunk ${idx + 1}/${ranges.length} done`);
+    return html;
+  });
+  const merged = mergeChunks(htmlChunks);
+  return {
+    html: merged,
+    warnings: [
+      `claude: imported ${ranges.length} chunk${ranges.length === 1 ? '' : 's'} via parallel \`claude -p\` (${skill} skill)`,
+    ],
+  };
+}
+// Run a single `claude -p` invocation. Returns the extracted HTML for the
+// chunk (either a full <article> or content-only fragment depending on the
+// prompt's chunk hint).
+function runClaude(filePath, prompt, { signal, timeoutMs = DEFAULT_TIMEOUT_MS } = {}) {
+  const args = [
+    '-p',
+    '--output-format', 'text',
+    '--add-dir', path.dirname(filePath),
+    '--permission-mode', 'bypassPermissions',
+    prompt,
+  ];
+  return new Promise((resolve, reject) => {
+    let proc;
+    try {
+      proc = spawn('claude', args, { stdio: ['ignore', 'pipe', 'pipe'], signal });
+    } catch (err) {
+      const e = new Error(`claude: failed to spawn (${err && err.message ? err.message : String(err)}). Is the claude CLI installed?`);
+      e.exitCode = 2;
+      return reject(e);
+    }
+    let stdout = '';
+    let stderr = '';
+    proc.stdout.on('data', d => { stdout += d.toString('utf8'); });
+    proc.stderr.on('data', d => { stderr += d.toString('utf8'); });
+    const timer = setTimeout(() => {
+      proc.kill('SIGKILL');
+      const e = new Error(`claude: timed out after ${Math.round(timeoutMs / 1000)}s`);
+      e.exitCode = 2;
+      reject(e);
+    }, timeoutMs);
+    proc.on('error', err => {
+      clearTimeout(timer);
+      const e = new Error(`claude: spawn error (${err.code || err.message})`);
+      e.exitCode = 2;
+      reject(e);
+    });
+    proc.on('close', code => {
+      clearTimeout(timer);
+      if (code !== 0) {
+        const tail = stderr.trim().split('\n').slice(-5).join('\n').slice(0, 800);
+        const e = new Error(`claude -p exited ${code}${tail ? '\n' + tail : ''}`);
+        e.exitCode = 2;
+        return reject(e);
+      }
+      // Output may be a full <article>...</article> (first chunk / single call)
+      // or just inner content (later chunks). Hand the full stdout to the
+      // merger; it knows how to extract either shape.
+      resolve(stdout);
+    });
+  });
+}
+// Bounded-concurrency parallel runner. Items are processed in input order
+// up to `concurrency` at a time. Order of `results[]` matches input order,
+// regardless of completion order.
+async function runWithConcurrency(items, concurrency, fn) {
+  const results = new Array(items.length);
+  let nextIdx = 0;
+  const worker = async () => {
+    while (true) {
+      const myIdx = nextIdx++;
+      if (myIdx >= items.length) break;
+      results[myIdx] = await fn(items[myIdx], myIdx);
+    }
+  };
+  const workers = Array.from({ length: Math.min(concurrency, items.length) }, worker);
+  await Promise.all(workers);
+  return results;
+}
+async function getPdfPageCount(filePath) {
+  const buf = await readFile(filePath);
+  const data = new Uint8Array(buf.buffer, buf.byteOffset, buf.byteLength);
+  let doc;
+  try {
+    doc = await pdfjs.getDocument({ data, isEvalSupported: false }).promise;
+  } catch (err) {
+    const e = new Error(`claude: failed to read PDF page count (${err && err.message ? err.message : String(err)})`);
+    e.exitCode = 2;
+    throw e;
+  }
+  const count = doc.numPages;
+  await doc.destroy().catch(() => {});
+  return count;
+}
+// Merge per-chunk HTML output into a single <article>. The first chunk's
+// output is treated as a full <article> with leading <style>/@page; later
+// chunks are content-only fragments (per their prompt). We:
+// 1. Extract the first chunk's full <article ...>...<style>...</style>...<div class="doc"> shell
+// 2. Append each later chunk's content fragments inside that .doc
+// 3. Close with </div></article>
+//
+// If a later chunk DID emit a full <article>+<style> (the model ignored the
+// chunk hint), strip its <article>/<style>/<div class="doc"> wrappers and
+// keep only its inner content.
+function mergeChunks(stdouts) {
+  if (stdouts.length === 1) {
+    const html = extractArticle(stdouts[0]);
+    if (!html) {
+      const preview = stdouts[0].trim().slice(0, 400);
+      const e = new Error(
+        `claude: output did not contain an <article> element. Output preview:\n${preview}`
+      );
+      e.exitCode = 2;
+      throw e;
+    }
+    return html;
+  }
+  const first = extractArticle(stdouts[0]);
+  if (!first) {
+    const preview = stdouts[0].trim().slice(0, 400);
+    const e = new Error(
+      `claude: first chunk output did not contain an <article> element. Output preview:\n${preview}`
+    );
+    e.exitCode = 2;
+    throw e;
+  }
+  // Find the .doc wrapper closing in the first chunk, so we can splice
+  // additional content before it. Prefer </div></article>; fall back to just
+  // </article> if no .doc wrapper exists.
+  const closingDocArticle = /<\/div>\s*<\/article>\s*$/i;
+  const closingArticleOnly = /<\/article>\s*$/i;
+  let prefix, suffix;
+  if (closingDocArticle.test(first)) {
+    prefix = first.replace(closingDocArticle, '');
+    suffix = '</div></article>';
+  } else if (closingArticleOnly.test(first)) {
+    prefix = first.replace(closingArticleOnly, '');
+    suffix = '</article>';
+  } else {
+    // Shouldn't happen — extractArticle guarantees </article>. Defensive.
+    prefix = first;
+    suffix = '';
+  }
+  const additional = stdouts.slice(1).map(stripChunkWrappers).filter(Boolean);
+  return [prefix, ...additional.map(c => '\n' + c), suffix].join('');
+}
+// Pull content out of a chunk's stdout. If the chunk emitted a full
+// <article>+<style>+<div class="doc">...</div></article> (because the model
+// ignored the "content-only" hint), strip those wrappers and the <style>.
+// Otherwise return the cleaned stdout (already content-only).
+function stripChunkWrappers(stdout) {
+  let body = stdout.trim();
+  // If wrapped in <article>...</article>, take only the inside.
+  const articleMatch = body.match(/<article(?:\s[^>]*)?>([\s\S]*)<\/article>/i);
+  if (articleMatch) body = articleMatch[1];
+  // Strip any <style>...</style> (we keep only the first chunk's styles).
+  body = body.replace(/<style(?:\s[^>]*)?>[\s\S]*?<\/style>/gi, '');
+  // Strip <div class="doc">...</div> wrapper if present.
+  const docMatch = body.match(/<div[^>]*class\s*=\s*["']doc["'][^>]*>([\s\S]*)<\/div>/i);
+  if (docMatch) body = docMatch[1];
+  // Strip stray markdown fences (some models add them despite the prompt).
+  body = body.replace(/^```(?:html)?\s*/i, '').replace(/\s*```\s*$/i, '');
+  return body.trim();
+}
+// Extract the outermost <article>...</article>. The agent's stdout might
+// include thinking commentary, tool-use traces, or markdown fences in
+// addition to the HTML; pull out only the article element.
+function extractArticle(text) {
+  const start = text.search(/<article(?:\s[^>]*)?>/i);
+  if (start < 0) return null;
+  const end = text.lastIndexOf('</article>');
+  if (end < 0 || end < start) return null;
+  return text.slice(start, end + '</article>'.length).trim();
+}

package/src/import-vision.mjs ADDED Viewed

@@ -0,0 +1,156 @@
+import fs from 'node:fs/promises';
+import path from 'node:path';
+// PDF → HTML via OpenRouter chat completions.
+//
+// Why this exists: pdfjs's text extraction produces flat-paragraph output
+// that loses tables, multi-column layouts, and any text whose font has a
+// broken toUnicode CMap (e.g. "Ü" decoded as "UY"). Sending the raw PDF to
+// a vision-capable model bypasses both — the model reads the rendered
+// content and reconstructs semantic HTML.
+//
+// Trade-off: ~$0.01-$0.05 per page in API costs, network round-trip
+// latency. Opt-in via `rwa import file.pdf --vision`.
+//
+// Wire format: OpenRouter's PDF input docs say content type is "file" with
+// `file_data: "data:application/pdf;base64,..."`. For Anthropic models OR
+// passes this through as a native PDF document block; for others (Gemini,
+// GPT-4o), it's routed through OR's file-parser plugin (engine "native"
+// uses the model's own multimodal capability).
+const OPENROUTER_URL = 'https://openrouter.ai/api/v1/chat/completions';
+const SYSTEM_PROMPT = `You are converting a PDF document into clean, semantic HTML for embedding in a single-file rewritable document container.
+Output requirements:
+- A single <article> element containing all document content.
+- Use semantic HTML: <h1>-<h6> for headings, <p> for paragraphs, <ul>/<ol>/<li> for lists, <table><thead><tbody><tr><td>/<th> for tables, <strong>/<em> for emphasis, <a href="..."> for links.
+- Do NOT output <html>, <head>, <body>, <!doctype>, any preamble, or any explanation before or after the HTML.
+- Do NOT wrap output in markdown code fences (no \`\`\`html).
+- Preserve text content exactly — do not summarize, paraphrase, translate, or reword.
+- Reconstruct multi-column layouts and tables faithfully. Table headers go in <thead>, body rows in <tbody>.
+- Omit <img> entirely; this container is text-focused. If an image carries information, describe it briefly in a <p>.
+- No <script>, <style>, class, or id attributes. Plain semantic HTML only.
+Output ONLY the <article>...</article> element.`;
+const USER_PROMPT = 'Convert this PDF document to a single <article> element of clean semantic HTML, following the rules in the system prompt.';
+/**
+ * @param {Buffer|Uint8Array} bytes  PDF content
+ * @param {object} [opts]
+ * @param {string} [opts.apiKey]     OpenRouter API key. If omitted, read from
+ *                                   process.env.OPENROUTER_API_KEY, then ./.env
+ * @param {string} [opts.model]      OpenRouter model id; default reuses
+ *                                   the rwa container's default
+ * @param {AbortSignal} [opts.signal]
+ * @returns {Promise<{ html: string, warnings: string[] }>}
+ */
+export async function convertPdfViaVision(bytes, { apiKey, model, signal } = {}) {
+  apiKey = apiKey || process.env.OPENROUTER_API_KEY || await readDotEnvKey('OPENROUTER_API_KEY');
+  if (!apiKey) {
+    const e = new Error('vision: OPENROUTER_API_KEY is required (set in env or ./.env)');
+    e.exitCode = 2;
+    throw e;
+  }
+  const buf = Buffer.isBuffer(bytes) ? bytes : Buffer.from(bytes);
+  const dataUri = `data:application/pdf;base64,${buf.toString('base64')}`;
+  const body = {
+    model: model || 'google/gemini-3-flash-preview',
+    messages: [
+      { role: 'system', content: SYSTEM_PROMPT },
+      {
+        role: 'user',
+        content: [
+          { type: 'text', text: USER_PROMPT },
+          { type: 'file', file: { filename: 'document.pdf', file_data: dataUri } },
+        ],
+      },
+    ],
+    // Generous output budget — long PDFs can produce a lot of HTML.
+    // OpenRouter will clamp to model's actual max if smaller.
+    max_tokens: 16384,
+    // Deterministic output — we want the same HTML for the same input.
+    temperature: 0,
+  };
+  const res = await fetch(OPENROUTER_URL, {
+    method: 'POST',
+    headers: {
+      'Authorization': `Bearer ${apiKey}`,
+      'Content-Type': 'application/json',
+      // Recommended by OpenRouter for tracking, helps with rate-limit accounting.
+      'HTTP-Referer': 'https://github.com/martintreiber/rewritable',
+      'X-Title': 'rwa CLI',
+    },
+    body: JSON.stringify(body),
+    signal,
+  });
+  if (!res.ok) {
+    const text = await res.text().catch(() => '');
+    const e = new Error(`vision: openrouter ${res.status}${text ? ': ' + text.slice(0, 500) : ''}`);
+    e.exitCode = 2;
+    throw e;
+  }
+  const json = await res.json();
+  const content = json?.choices?.[0]?.message?.content;
+  if (typeof content !== 'string' || !content.trim()) {
+    const e = new Error('vision: openrouter returned empty content');
+    e.exitCode = 2;
+    throw e;
+  }
+  const html = extractArticle(content);
+  if (!html) {
+    const e = new Error(
+      `vision: model output did not contain an <article> element. Output preview:\n${content.slice(0, 300)}`
+    );
+    e.exitCode = 2;
+    throw e;
+  }
+  const warnings = [];
+  // Surface usage so the user sees what each import cost.
+  const usage = json?.usage;
+  if (usage) {
+    const tokens = `${usage.prompt_tokens || 0} in / ${usage.completion_tokens || 0} out`;
+    warnings.push(`vision: ${body.model} (${tokens} tokens)`);
+  }
+  return { html, warnings };
+}
+// Minimal .env reader for the OPENROUTER_API_KEY fallback path. Handles
+// KEY=value with optional surrounding whitespace, optional matched quotes,
+// optional `export` prefix. No interpolation, no multi-line values. Returns
+// null if the file or key is missing.
+async function readDotEnvKey(name) {
+  let text;
+  try {
+    text = await fs.readFile(path.join(process.cwd(), '.env'), 'utf8');
+  } catch (_) { return null; }
+  for (const line of text.split('\n')) {
+    const m = line.match(/^\s*(?:export\s+)?([A-Za-z_][A-Za-z0-9_]*)\s*=\s*(.*?)\s*$/);
+    if (!m || m[1] !== name) continue;
+    let v = m[2];
+    if ((v.startsWith('"') && v.endsWith('"')) || (v.startsWith("'") && v.endsWith("'"))) {
+      v = v.slice(1, -1);
+    }
+    return v || null;
+  }
+  return null;
+}
+// Extract the outermost <article>...</article>. Models often wrap output in
+// ```html fences or add a "Here is the HTML:" preamble despite the system
+// prompt; pull out only the article element to be robust to that.
+function extractArticle(text) {
+  // Find the first <article (allow attributes) and the LAST </article>.
+  const start = text.search(/<article(?:\s[^>]*)?>/i);
+  if (start < 0) return null;
+  const end = text.lastIndexOf('</article>');
+  if (end < 0 || end < start) return null;
+  return text.slice(start, end + '</article>'.length).trim();
+}