npm - @robzilla1738/agentswarm - Versions diffs - 0.5.0 → 0.6.0 - Mend

@robzilla1738/agentswarm 0.5.0 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (35) hide show

package/README.md +29 -12
package/dist/agent.js +2 -1
package/dist/cli.js +21 -4
package/dist/config.js +27 -1
package/dist/executor.js +243 -43
package/dist/hub.js +69 -3
package/dist/memory.js +5 -4
package/dist/pdftext.js +211 -0
package/dist/prompts.js +23 -15
package/dist/report.js +37 -0
package/dist/run.js +8 -0
package/dist/sandbox.js +11 -0
package/dist/searchcore.js +55 -2
package/dist/state.js +34 -6
package/dist/tools.js +196 -19
package/dist/util.js +85 -0
package/dist/webtools.js +145 -15
package/package.json +1 -1
package/ui/out/404/index.html +1 -1
package/ui/out/404.html +1 -1
package/ui/out/_next/static/chunks/677-721ce1c8b7a6a317.js +1 -0
package/ui/out/_next/static/chunks/app/run/page-3674e103981703a2.js +1 -0
package/ui/out/_next/static/chunks/app/settings/page-41a5d8ba43ecfd4a.js +1 -0
package/ui/out/_next/static/css/{9f7bd82b8e4c762c.css → d95c2ba395730031.css} +1 -1
package/ui/out/index.html +1 -1
package/ui/out/index.txt +3 -3
package/ui/out/run/index.html +1 -1
package/ui/out/run/index.txt +3 -3
package/ui/out/settings/index.html +1 -1
package/ui/out/settings/index.txt +3 -3
package/ui/out/_next/static/chunks/677-859e8d42add1806b.js +0 -1
package/ui/out/_next/static/chunks/app/run/page-2420c9e4c963d9b3.js +0 -1
package/ui/out/_next/static/chunks/app/settings/page-092a6bf42dfde57d.js +0 -1
/package/ui/out/_next/static/{errjtBR_bKoee8ogLp8xk → 7_pihFubDGD40BCy2ynlr}/_buildManifest.js +0 -0
/package/ui/out/_next/static/{errjtBR_bKoee8ogLp8xk → 7_pihFubDGD40BCy2ynlr}/_ssgManifest.js +0 -0

package/dist/pdftext.js ADDED Viewed

@@ -0,0 +1,211 @@
+"use strict";
+// Module-interop helper (appears to be compiler-emitted boilerplate; keep as-is).
+// Reuses `this.__createBinding` when one already exists. Otherwise exposes
+// `m[k]` on `o` under the name `k2` (which defaults to `k`).
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    // Replace the descriptor with an enumerable getter when it is missing, is an
+    // accessor on a module without `__esModule`, or is a writable/configurable
+    // data property — so reads of `o[k2]` always go through to `m[k]`.
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    // Fallback when `Object.create` is unavailable: plain value copy.
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+// Module-interop helper: installs `v` as the `default` member of `o`.
+// Reuses `this.__setModuleDefault` when present; uses an enumerable
+// defineProperty when `Object.create` exists, plain assignment otherwise.
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+// Module-interop helper: turns a required module into a namespace-style object.
+// Modules already flagged `__esModule` are returned untouched; anything else is
+// wrapped in a fresh object that re-exports every own property except
+// "default", with `default` set to the module itself.
+var __importStar = (this && this.__importStar) || (function () {
+    // Self-replacing function: the first call picks `Object.getOwnPropertyNames`
+    // (or the hasOwnProperty loop fallback) and rebinds `ownKeys` to it.
+    var ownKeys = function(o) {
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod;
+        var result = {};
+        // `mod != null` also covers undefined; a nullish module yields `{ default: mod }`.
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
+        __setModuleDefault(result, mod);
+        return result;
+    };
+})();
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.extractPdfText = extractPdfText;
+const zlib = __importStar(require("zlib"));
+/**
+ * Minimal zero-dependency PDF text extraction: inflate FlateDecode content
+ * streams (Node's built-in zlib) and interpret the text-showing operators
+ * (Tj / TJ / ' / "). Good enough for most digitally-produced text PDFs;
+ * returns null for scanned, encrypted, or exotic-encoding documents so the
+ * caller can tell the agent to find an HTML source instead.
+ *
+ * @param buf Bytes of the candidate file; must support `subarray` and
+ *   `toString("latin1")` (presumably a Node Buffer — confirm against callers).
+ * @returns `{ text, pages }`, or null when the `%PDF-` header is missing or
+ *   fewer than 40 non-whitespace characters survive the final filter.
+ */
+function extractPdfText(buf) {
+    if (buf.subarray(0, 5).toString("latin1") !== "%PDF-")
+        return null;
+    // latin1 preserves bytes 1:1, so stream offsets in the string match the buffer.
+    const raw = buf.toString("latin1");
+    // Count `/Type /Page` markers; the filter drops the `/Pages` tree nodes the
+    // regex also matches. A count of zero falls back to 1.
+    const pages = (raw.match(/\/Type\s*\/Pages?\b/g) || []).filter((m) => !/Pages/.test(m)).length || 1;
+    let text = "";
+    // A stream dictionary (at most 2000 chars, lazily matched) followed by the
+    // `stream` keyword and its line ending.
+    const streamRe = /<<([\s\S]{0,2000}?)>>\s*stream\r?\n/g;
+    let m;
+    while ((m = streamRe.exec(raw))) {
+        const dict = m[1];
+        const start = m.index + m[0].length;
+        const end = raw.indexOf("endstream", start);
+        if (end < 0)
+            continue;
+        // Resume the dictionary scan after this stream's payload, not inside it.
+        streamRe.lastIndex = end;
+        // Only plain or Flate-compressed streams are supported.
+        // NOTE(review): a filter chain that merely contains FlateDecode also passes
+        // this test; the inflate failure is then caught below and the stream skipped.
+        if (/\/Filter/.test(dict) && !/FlateDecode/.test(dict))
+            continue;
+        // Trim the CR/LF bytes that sit between the payload and `endstream`.
+        let len = end;
+        while (len > start && (raw[len - 1] === "\n" || raw[len - 1] === "\r"))
+            len--;
+        let data = buf.subarray(start, len);
+        if (/FlateDecode/.test(dict)) {
+            try {
+                data = zlib.inflateSync(data);
+            }
+            catch {
+                // Undecodable stream: skip it and keep scanning the rest of the file.
+                continue;
+            }
+        }
+        const content = data.toString("latin1");
+        if (!/\bBT\b/.test(content))
+            continue; // not a text content stream
+        const extracted = extractFromContent(content);
+        if (extracted.trim())
+            text += extracted + "\n";
+    }
+    // Collapse runs of non-newline whitespace, strip spaces around newlines, and
+    // cap consecutive newlines at two.
+    const cleaned = text
+        .replace(/[^\S\n]+/g, " ")
+        .replace(/ ?\n ?/g, "\n")
+        .replace(/\n{3,}/g, "\n\n")
+        .trim();
+    // CID/Type0 fonts yield glyph-index garbage; require a body of real characters.
+    // NOTE(review): as rendered here the class ends in " -", which is redundant with
+    // \x20-\x7E — possibly a non-ASCII range lost in rendering; confirm against the package.
+    const printable = cleaned.replace(/[^\x20-\x7E\n -]/g, "");
+    if (printable.replace(/\s/g, "").length < 40)
+        return null;
+    return { text: printable, pages };
+}
+/**
+ * Walk a content stream, collecting strings shown by Tj/TJ/'/" with newline heuristics.
+ *
+ * String operands — literal `( … )` and hex `< … >` — are buffered in `pending`
+ * until an operator is reached: Tj/TJ append them, ' and " append them after a
+ * newline, the positioning operators Td/TD/T*&#8203;/Tm and ET flush them and end the
+ * line, and every other operator discards them.
+ *
+ * `<<` is a dictionary opener (e.g. the property list before BDC), not a hex
+ * string. It is stepped over as a unit so its second `<` is no longer decoded
+ * as hex text.
+ *
+ * @param src Decoded content stream, one character per byte.
+ * @returns The shown text, with "\n" at the heuristic line breaks.
+ */
+function extractFromContent(src) {
+    let out = "";
+    let pending = [];
+    const n = src.length;
+    let i = 0;
+    while (i < n) {
+        const ch = src[i];
+        if (ch === "(") {
+            const [s, next] = parseLiteralString(src, i);
+            pending.push(s);
+            i = next;
+        }
+        else if (ch === "<" && src[i + 1] === "<") {
+            // Dictionary opener: skip both brackets so the dictionary body is
+            // scanned as ordinary tokens instead of being decoded as a hex string.
+            i += 2;
+        }
+        else if (ch === "<") {
+            const close = src.indexOf(">", i + 1);
+            if (close < 0)
+                break;
+            pending.push(decodeHexString(src.slice(i + 1, close)));
+            i = close + 1;
+        }
+        else if (ch === "%") {
+            // comment to end of line
+            while (i < n && src[i] !== "\n" && src[i] !== "\r")
+                i++;
+        }
+        else if (/[A-Za-z'"*]/.test(ch)) {
+            let j = i;
+            while (j < n && /[A-Za-z'"*]/.test(src[j]))
+                j++;
+            const op = src.slice(i, j);
+            if (op === "Tj" || op === "TJ") {
+                out += pending.join("");
+            }
+            else if (op === "'" || op === '"') {
+                out += "\n" + pending.join("");
+            }
+            else if (op === "Td" || op === "TD" || op === "T*" || op === "Tm" || op === "ET") {
+                if (pending.length)
+                    out += pending.join("");
+                if (!out.endsWith("\n"))
+                    out += "\n";
+            }
+            // Operands belong to exactly one operator: drop them once it has run.
+            pending = [];
+            i = j;
+        }
+        else if (ch === "-" || (ch >= "0" && ch <= "9") || ch === ".") {
+            let j = i + 1;
+            while (j < n && /[0-9.]/.test(src[j]))
+                j++;
+            // Large negative kerning inside a TJ array is a word gap.
+            const num = parseFloat(src.slice(i, j));
+            if (num <= -180 && pending.length && !pending[pending.length - 1].endsWith(" "))
+                pending.push(" ");
+            i = j;
+        }
+        else {
+            i++;
+        }
+    }
+    return out;
+}
+/**
+ * PDF literal string: balanced parens, backslash escapes, octal codes.
+ *
+ * Escape handling follows the PDF literal-string rules:
+ *  - `\n \r \t \b \f \( \) \\` map to their characters;
+ *  - `\ddd` (1-3 octal digits) yields one byte, high-order overflow ignored;
+ *  - a backslash directly before an end-of-line (LF, CR or CRLF) is a line
+ *    continuation: neither the backslash nor the EOL is part of the string;
+ *  - a backslash before any other character is dropped and the character kept.
+ *
+ * @param src   Content-stream text.
+ * @param start Index of the opening "(".
+ * @returns `[decoded, next]` — the string body and the index just past the
+ *   closing ")" (or `src.length` if the string is unterminated).
+ */
+function parseLiteralString(src, start) {
+    const escapes = { n: "\n", r: "\r", t: "\t", b: "\b", f: "\f", "(": "(", ")": ")", "\\": "\\" };
+    let out = "";
+    let depth = 0;
+    let i = start;
+    for (; i < src.length; i++) {
+        const ch = src[i];
+        if (ch === "\\") {
+            const next = src[i + 1];
+            if (next >= "0" && next <= "7") {
+                let oct = "";
+                for (let k = 1; k <= 3 && src[i + k] >= "0" && src[i + k] <= "7"; k++)
+                    oct += src[i + k];
+                // \400-\777 overflow a byte; keep only the low eight bits.
+                out += String.fromCharCode(parseInt(oct, 8) & 0xff);
+                i += oct.length;
+            }
+            else if (next === "\n" || next === "\r") {
+                // Line continuation: swallow the EOL (treating CRLF as one) and emit nothing.
+                i++;
+                if (next === "\r" && src[i + 1] === "\n")
+                    i++;
+            }
+            else {
+                out += escapes[next] ?? next ?? "";
+                i++;
+            }
+        }
+        else if (ch === "(") {
+            depth++;
+            // The outermost "(" is the delimiter; nested ones are content.
+            if (depth > 1)
+                out += ch;
+        }
+        else if (ch === ")") {
+            depth--;
+            if (depth === 0) {
+                i++;
+                break;
+            }
+            out += ch;
+        }
+        else {
+            out += ch;
+        }
+    }
+    return [out, i];
+}
+/**
+ * PDF hex string: byte pairs; a UTF-16BE BOM switches to two-byte chars.
+ *
+ * Anything that is not a hex digit is ignored. An odd trailing digit is read
+ * as if it were followed by "0". With a leading FE FF the remaining bytes are
+ * combined pairwise into UTF-16 code units (a dangling final byte is dropped);
+ * otherwise each byte becomes one character.
+ */
+function decodeHexString(hex) {
+    const digits = hex.replace(/[^0-9a-fA-F]/g, "");
+    const padded = digits.length % 2 ? digits + "0" : digits;
+    const bytes = [];
+    for (let pos = 0; pos < padded.length; pos += 2)
+        bytes.push(parseInt(padded.slice(pos, pos + 2), 16));
+    const hasBom = bytes.length >= 2 && bytes[0] === 0xfe && bytes[1] === 0xff;
+    let decoded = "";
+    if (hasBom) {
+        for (let pos = 2; pos + 1 < bytes.length; pos += 2)
+            decoded += String.fromCharCode((bytes[pos] << 8) | bytes[pos + 1]);
+    }
+    else {
+        for (const byte of bytes)
+            decoded += String.fromCharCode(byte);
+    }
+    return decoded;
+}

package/dist/prompts.js CHANGED Viewed

@@ -122,7 +122,7 @@ function taskTable(tasks) {
         return "(no tasks yet)";
     const line = (t) => {
         const deps = t.deps.length ? ` deps:[${t.deps.join(",")}]` : "";
-        const extra = t.status === "failed" && t.error ? ` — ${(0, util_1.clip)(t.error, 80)}` : "";
+        const extra = (t.status === "failed" || t.status === "blocked") && t.error ? ` — ${(0, util_1.clip)(t.error, 120)}` : "";
         return `${t.id} [${t.status}${t.attempt > 1 ? ` a${t.attempt}` : ""}] (${t.role})${deps} ${(0, util_1.clip)(t.title, 70)}${extra}`;
     };
     const settled = tasks.filter((t) => ["done", "failed", "blocked"].includes(t.status));
@@ -146,6 +146,13 @@ function taskTable(tasks) {
     }
     return out.join("\n");
 }
+/**
+ * One-line list of a task's source URLs for the report blocks: at most `max`
+ * URLs joined by " · ", plus a "(+N more)" tail when the task has more.
+ * Returns "" when the task has no sources.
+ */
+function sourcesLine(t, max = 6) {
+    const total = t.sources?.length;
+    if (!total)
+        return "";
+    const urls = [];
+    for (const entry of t.sources.slice(0, max))
+        urls.push(entry.url);
+    const overflow = total > max ? ` (+${total - max} more)` : "";
+    return "\nsources: " + urls.join(" · ") + overflow;
+}
 function reportBlock(t) {
     const head = `── ${t.id} (${t.role}) "${(0, util_1.clip)(t.title, 60)}" → ${t.status.toUpperCase()}${t.attempt > 1 ? ` (attempt ${t.attempt})` : ""}`;
     const body = t.report ? (0, util_1.clip)(t.report, 1600) : t.error ? `error: ${(0, util_1.clip)(t.error, 400)}` : "(no report)";
@@ -154,7 +161,7 @@ function reportBlock(t) {
     const files = t.filesTouched?.length ? `\nfiles touched: ${t.filesTouched.join(", ")}` : "";
     const arts = t.artifacts.length ? `\nartifacts: ${t.artifacts.join(", ")}` : "";
     const fb = t.feedback ? `\nverifier: ${(0, util_1.clip)(t.feedback, 300)}` : "";
-    return `${head}\n${body}${facts}${open}${files}${arts}${fb}`;
+    return `${head}\n${body}${facts}${open}${files}${arts}${sourcesLine(t)}${fb}`;
 }
 /**
  * Compact dependency context for a downstream worker: structured handoff
@@ -168,11 +175,12 @@ function depReportBlock(t) {
     const arts = t.artifacts.length ? `\nartifacts: ${t.artifacts.join(", ")}` : "";
     const full = (t.report ?? "").length > 1200 ? `\n(excerpt — full text: read_report("${t.id}"))` : "";
     const body = t.report ? (0, util_1.clip)(t.report, 1200) : t.error ? `error: ${(0, util_1.clip)(t.error, 400)}` : "(no report)";
-    return `${head}\n${body}${facts}${files}${arts}${full}`;
+    return `${head}\n${body}${facts}${files}${arts}${sourcesLine(t)}${full}`;
 }
 // ============================================================ workers
 const ROLE_HINTS = {
-    researcher: "Research craft: be exhaustive. Run deep web_search (deep=true, high count) across several distinct phrasings — pull DOZENS of sources for your sub-question, not three. Triangulate across independent sources; prefer primary docs and official sources over blog spam; capture exact figures, dates, and URLs, and keep the quotable passages the search returns. Record key findings as blackboard notes (with the source URL) and save a structured markdown file of your sources+findings as an artifact so the synthesizer can build on it. " +
+    researcher: "Research craft: be exhaustive. Run deep web_search (deep=true, high count) across several distinct phrasings — pull DOZENS of sources for your sub-question, not three. Triangulate across independent sources; prefer primary docs and official sources over blog spam; capture exact figures, dates, and URLs, and keep the quotable passages the search returns. Record key findings as blackboard notes (with url=<source>) and save a structured markdown file of your sources+findings as an artifact so the synthesizer can build on it. " +
+        "A finding without a source is an opinion: list EVERY source your findings rest on in report(...)'s `sources` field (url + what it supports) — only sources reported there can be cited in the final deliverable. When independent sources disagree on a material fact, post note(kind:'conflict') naming both sources and the discrepancy — never silently pick one. For scientific or technical questions, also run academic_search (arXiv + Crossref) — peer-reviewed beats blog posts. " +
         "If a crawl_site tool is available, use it to ingest whole documentation sites or multi-page sources into local markdown files, then read the saved files — far cheaper and broader than fetching pages one by one.",
     coder: "Engineering craft: read existing code before changing it; match its conventions; build/run/test after every meaningful change and include the command + result in your report. Leave the tree compiling.",
     analyst: "Analysis craft: quantify wherever possible; state assumptions explicitly; separate observation from interpretation; sanity-check numbers twice.",
@@ -209,7 +217,7 @@ OPERATING PROTOCOL
 - You are fully autonomous. Never ask questions; decide and act.
 - Plan briefly, then act in small verified steps: after changing anything, prove it worked (run it, read it back, test it).
 - Evidence over assumption: read before you edit; check outputs; cite concrete paths, commands and numbers.
-- Be token-lean: targeted reads (line ranges, grep via shell) over wholesale dumps; don't re-read unchanged files.
+- Be token-lean: targeted reads (line ranges, grep_files) over wholesale dumps; don't re-read unchanged files. Several edits to one file → one replace_in_file call with edits[].
 - Post durable discoveries other agents will need to the blackboard with note(...) — facts only, used sparingly.
 - Editing files other tasks might also touch? First search_notes for claims, then post note(kind:"claim", key:"<path>") before editing. Claims are advisory — coordinate, don't fight.
 - Save deliverable files with save_artifact so the operator sees them. Pick the format that genuinely fits the deliverable — structured data as .csv/.json, polished documents as self-contained .html, code as runnable files — not everything is a markdown report.
@@ -217,7 +225,7 @@ OPERATING PROTOCOL
 - Genuinely impossible / missing prerequisite → report(status:"blocked", …) early instead of thrashing.
 - You have at most ${opts.maxSteps} tool steps. Budget them.
 - Dependency reports above are excerpts; use read_report(task_id) for full text, and search_notes(query) to find facts posted earlier in the run.
-- ALWAYS end by calling report(...). The conductor sees ONLY that report — it is the entire value of your work. Specific beats vague: what you did, what you verified, key findings, exact paths. Fill key_facts (standalone facts downstream tasks need), open_questions, and files_touched — they are handed verbatim to dependent tasks.
+- ALWAYS end by calling report(...). The conductor sees ONLY that report — it is the entire value of your work. Specific beats vague: what you did, what you verified, key findings, exact paths. Fill key_facts (standalone facts downstream tasks need), open_questions, and files_touched — they are handed verbatim to dependent tasks. If your work drew on the web, fill sources (url + what it supports): only sources reported there can be cited in the final deliverable.
 ${roleHint ? "\n" + roleHint : ""}`;
 }
 exports.WORKER_KICKOFF = "Begin now. Work the task to completion, then call report(...).";
@@ -227,7 +235,7 @@ function forcedFinal(reason) {
     return `${reason} Stop working and call your terminal tool RIGHT NOW with your best honest account: what you completed, what you verified, what remains.`;
 }
 // ============================================================ verifier
-function verifierSystem(meta, task) {
+function verifierSystem(meta, task, depReports = "") {
     return `You are an adversarial verification agent. A worker claims it completed this task — your job is to try to falsify that claim with evidence.
 MISSION (for context): ${(0, util_1.clip)(meta.mission, 400)}
@@ -238,18 +246,18 @@ ${task.context ? `Context: ${(0, util_1.clip)(task.context, 600)}` : ""}
 Worker's report:
 ${(0, util_1.clip)(task.report ?? "", 2400)}
 ${task.artifacts.length ? `Claimed artifacts: ${task.artifacts.join(", ")}` : ""}
+${depReports ? `\nUPSTREAM INPUTS (settled dependency reports — what this task had to build on; judge completeness against them):\n${depReports}\n` : ""}
 Working directory: ${meta.cwd}
 PROTOCOL
 - Do NOT trust the report. Verify concretely with tools: read the files it claims to have written, run the build/tests/commands, fetch the URLs, check the numbers. You see only the worker's CLAIMS — gather your own evidence; do not assume shared context.
 - RUBRIC — fail unless all hold:
-  1. Completeness: every part of the objective and its "Done when" criteria is addressed.
+  1. Completeness: every part of the objective and its "Done when" criteria is addressed${depReports ? " (including everything the upstream inputs handed over)" : ""}.
   2. Evidence: each substantive claim in the report is backed by something you verified yourself.
   3. Deliverables: claimed files/artifacts exist, are non-trivial (not stubs/placeholders), and match what the report says about them.
   4. Correctness: commands/builds/tests the task implies actually succeed when you run them.
 - Spot-check depth over exhaustive breadth; ~5-12 tool steps.
-- Then call verdict(pass, feedback). On fail, feedback must be actionable: exactly what is wrong and where. On pass, one line citing the evidence you checked.`;
+- Then call verdict(pass, feedback, issues). On fail, ALSO fill issues — one entry per concrete problem with the evidence you gathered and the exact change needed; the worker's retry sees them verbatim. On pass, feedback is one line citing the evidence you checked.`;
 }
 exports.VERIFIER_KICKOFF = "Verify now, then call verdict(...).";
 // ============================================================ synthesizer
@@ -265,13 +273,13 @@ Conductor's closing notes: ${opts.finishNotes || "(none)"}
 ALL TASK REPORTS
 ${opts.reports}
-${opts.blackboard ? `BLACKBOARD\n${opts.blackboard}\n` : ""}${opts.artifactList ? `ARTIFACTS ON DISK\n${opts.artifactList}\n` : ""}
+${opts.sources ? `SOURCES (numbered, deduplicated from the task reports — the only sources that exist)\n${opts.sources}\n\n` : ""}${opts.blackboard ? `BLACKBOARD\n${opts.blackboard}\n` : ""}${opts.artifactList ? `ARTIFACTS ON DISK\n${opts.artifactList}\n` : ""}
 Working directory: ${opts.meta.cwd}
 PROTOCOL
 - You may read files (read_file / list_dir) to confirm specifics before writing — verify key claims you repeat.
 - The mission's PRIMARY deliverable should exist in the format that serves it best, not only as prose. If the task reports produced data, comparisons, or rankings that the artifacts don't already capture in a structured form, save them now with save_artifact (e.g. data/results.csv, data/findings.json) before submitting. Don't duplicate artifacts that already exist — point to them.
-- Then call submit_final with:
+${opts.sources ? `- CITE YOUR SOURCES: where a claim rests on a numbered source, cite it inline as [n]. End report_markdown with a \`## Sources\` section listing each number you actually cited as a markdown link ([n] [title](url)). Never invent a source or cite a number not in the list. Where sources conflict, present both positions with their citations — do not silently pick one.\n` : ""}- Then call submit_final with:
   • report_markdown — the deliverable document. Structure: # title; **Outcome** first (did the mission succeed, headline results); then What was built/found with evidence and exact paths; How to use/run it (if applicable); Open issues & recommended next steps. Write for the operator: complete, concrete, zero filler. Use real markdown tables for tabular findings. (A styled HTML rendering is generated automatically — do not hand-write one.)
   • summary — ≤8 sentences for the console.
 - The report stands alone: a reader who saw nothing else must understand what happened and where everything is.`;
@@ -292,7 +300,7 @@ ${reports}
 Reply with EXACTLY "COMPLETE" if the mission's requirements are genuinely covered. Otherwise reply with a short numbered list of concrete gaps (max 5), each one actionable enough to become a task. Do not invent nice-to-haves — only true gaps against the stated mission.`;
 }
-function synthCheckPrompt(mission, reports, finalReport) {
+function synthCheckPrompt(mission, reports, finalReport, sources) {
     return `You are checking a final mission report for faithfulness before delivery. Compare it against the underlying task reports.
 MISSION
@@ -301,10 +309,10 @@ ${mission}
 TASK REPORTS (ground truth)
 ${reports}
-FINAL REPORT (to check)
+${sources ? `SOURCE LIST (the only citable sources)\n${sources}\n\n` : ""}FINAL REPORT (to check)
 ${finalReport}
-Reply with EXACTLY "OK" if the final report's claims are supported by the task reports and nothing material is misrepresented or fabricated. Otherwise list the specific discrepancies (max 5), each citing what the final report says vs what the task reports support.`;
+Reply with EXACTLY "OK" if the final report's claims are supported by the task reports and nothing material is misrepresented or fabricated${sources ? ", its inline [n] citations all reference numbers that exist in the source list, and no key web-derived factual claim is left uncited" : ""}. Otherwise list the specific discrepancies (max 5), each citing what the final report says vs what the task reports support.`;
 }
 // ============================================================ compaction
 function compactorPrompt(serialized) {

package/dist/report.js CHANGED Viewed

@@ -11,8 +11,45 @@
  * broken markup.
  */
 Object.defineProperty(exports, "__esModule", { value: true });
+exports.aggregateSources = aggregateSources;
+exports.sourcesBlock = sourcesBlock;
 exports.mdToHtml = mdToHtml;
 exports.renderFinalHtml = renderFinalHtml;
+const searchcore_1 = require("./searchcore");
+/**
+ * Merge the sources reported by every task into a single numbered list for
+ * the synthesizer. Entries are keyed by canonical URL: the first task to
+ * report a URL fixes its number and fields, and later reports of the same URL
+ * only add their task id and fill in a title, date or note that is still empty.
+ */
+function aggregateSources(tasks) {
+    const merged = new Map();
+    for (const task of tasks) {
+        for (const src of task.sources ?? []) {
+            const canonical = (0, searchcore_1.canonicalizeUrl)(src.url);
+            const existing = merged.get(canonical);
+            if (!existing) {
+                merged.set(canonical, { ...src, n: merged.size + 1, taskIds: [task.id] });
+                continue;
+            }
+            if (!existing.taskIds.includes(task.id))
+                existing.taskIds.push(task.id);
+            for (const field of ["title", "date", "note"]) {
+                if (!existing[field] && src[field])
+                    existing[field] = src[field];
+            }
+        }
+    }
+    return Array.from(merged.values());
+}
+/**
+ * Format the numbered source list for prompts, one source per line:
+ * `[n] title — url (date) — note [cited by ids]`, where the title, date and
+ * note segments are left out when empty.
+ */
+function sourcesBlock(sources) {
+    const lines = [];
+    for (const src of sources) {
+        const title = src.title ? `${src.title} — ` : "";
+        const date = src.date ? ` (${src.date})` : "";
+        const note = src.note ? ` — ${src.note}` : "";
+        lines.push(`[${src.n}] ${title}${src.url}${date}${note} [cited by ${src.taskIds.join(",")}]`);
+    }
+    return lines.join("\n");
+}
 function esc(s) {
     return s
         .replace(/&/g, "&amp;")

package/dist/run.js CHANGED Viewed

@@ -198,6 +198,14 @@ function listRuns(pricing) {
         s.pid = readPid(id);
         out.push(applyLiveness(s));
     }
+    // Deleted runs must not pin their reduced state in a long-lived hub forever.
+    const live = new Set(ids);
+    for (const key of summaryCache.keys())
+        if (!live.has(key))
+            summaryCache.delete(key);
+    for (const key of liveCache.keys())
+        if (!live.has(key))
+            liveCache.delete(key);
     out.sort((a, b) => b.createdAt - a.createdAt);
     return out;
 }

package/dist/sandbox.js CHANGED Viewed

@@ -302,7 +302,17 @@ class RemoteRuntime {
             throw new Error(`${what} failed (exit ${r.code}): ${r.out.slice(0, 300)}`);
         return r.out;
     }
+    /**
+     * Guard for the base64-over-shell transfers, which buffer the whole file:
+     * asks the remote side for the byte count (`wc -c`) and throws when it
+     * exceeds `capBytes`. A count that does not parse as a finite number is
+     * let through unchanged.
+     */
+    async checkSize(abs, capBytes, what) {
+        const raw = await this.execOk(`wc -c < ${shq(abs)}`, `stat ${abs}`);
+        const bytes = Number(raw.trim());
+        if (!Number.isFinite(bytes) || !(bytes > capBytes))
+            return;
+        const toMb = (value) => Math.round(value / 1e6);
+        throw new Error(`${what}: file is ${toMb(bytes)}MB (cap ${toMb(capBytes)}MB) — ` +
+            `compress it or extract the relevant part in the sandbox first`);
+    }
     async readFile(abs) {
+        await this.checkSize(abs, 4_000_000, `read ${abs}`);
         const out = await this.execOk(`base64 < ${shq(abs)}`, `read ${abs}`);
         return Buffer.from(out.replace(/\s+/g, ""), "base64").toString("utf8");
     }
@@ -319,6 +329,7 @@ class RemoteRuntime {
         }
     }
     async pull(remoteAbs, localAbs) {
+        await this.checkSize(remoteAbs, 32_000_000, `pull ${remoteAbs}`);
         const out = await this.execOk(`base64 < ${shq(remoteAbs)}`, `pull ${remoteAbs}`);
         (0, util_1.ensureDir)(path.dirname(localAbs));
         fs.writeFileSync(localAbs, Buffer.from(out.replace(/\s+/g, ""), "base64"));

package/dist/searchcore.js CHANGED Viewed

@@ -9,8 +9,11 @@
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.queryTerms = queryTerms;
 exports.expandQueries = expandQueries;
+exports.reformulate = reformulate;
+exports.looksAcademic = looksAcademic;
 exports.canonicalizeUrl = canonicalizeUrl;
 exports.classifySource = classifySource;
+exports.freshnessBoost = freshnessBoost;
 exports.detectDate = detectDate;
 exports.selectPassages = selectPassages;
 exports.scorePage = scorePage;
@@ -42,6 +45,22 @@ function expandQueries(query, max = 3) {
     const seen = new Set();
     return out.map((q) => q.trim()).filter((q) => q && !seen.has(q.toLowerCase()) && seen.add(q.toLowerCase())).slice(0, max);
 }
+/**
+ * Simplified retry phrasing for a query that returned nothing: quote
+ * characters and `site:` / `intitle:` / `inurl:` / `filetype:` operators are
+ * blanked out, then at most six keyword terms are kept. Yields "" when that
+ * leaves nothing, or leaves the lower-cased, trimmed query unchanged.
+ */
+function reformulate(query) {
+    const withoutQuotes = query.replace(/["'""'']/g, " ");
+    const withoutOperators = withoutQuotes.replace(/\b(site|intitle|inurl|filetype):\S+/gi, " ");
+    const simplified = queryTerms(withoutOperators).slice(0, 6).join(" ");
+    if (!simplified || simplified === query.toLowerCase().trim())
+        return "";
+    return simplified;
+}
+/**
+ * True when the query contains a scholarly cue word (paper, study, arxiv,
+ * doi, journal, peer-review, preprint, …) as a whole word, case-insensitively.
+ * Used to switch on the scholarly engines in deep mode.
+ */
+function looksAcademic(query) {
+    const scholarlyCue = /\b(paper|papers|study|studies|research|arxiv|doi|journal|peer.?review(ed)?|preprint|dataset|benchmark|survey|meta.?analysis|citations?|et al)\b/i;
+    return scholarlyCue.test(query);
+}
 const TRACKING_KEYS = new Set(["fbclid", "gclid", "mc_cid", "mc_eid"]);
 /** Stable canonical form for dedup: strip tracking params, www, trailing slash; sort the query. */
 function canonicalizeUrl(url) {
@@ -61,18 +80,50 @@ function canonicalizeUrl(url) {
         path = path.replace(/\/+$/, "");
     return `${u.protocol.toLowerCase()}//${host}${path}${query}`;
 }
+// Hosts that classifySource treats as "academic". The lookup there matches the
+// host itself or any subdomain (`d === h || d.endsWith("." + h)`), so the
+// "link.springer.com" entry is already covered by "springer.com".
+const ACADEMIC_HOSTS = [
+    "arxiv.org",
+    "doi.org",
+    "semanticscholar.org",
+    "ncbi.nlm.nih.gov",
+    "nature.com",
+    "sciencedirect.com",
+    "springer.com",
+    "link.springer.com",
+    "scholar.google.com",
+    "acm.org",
+    "ieee.org",
+];
 function classifySource(domain) {
     const d = domain.toLowerCase();
     if (d.endsWith(".gov") || d.endsWith(".mil"))
         return "government";
     if (d.endsWith(".edu"))
         return "academic";
+    if (ACADEMIC_HOSTS.some((h) => d === h || d.endsWith("." + h)))
+        return "academic";
     if (["twitter.com", "x.com", "reddit.com", "facebook.com"].some((s) => d.includes(s)))
         return "social";
     if (d.includes("news") || d.includes("reuters.com") || d.includes("apnews.com") || d.includes("bbc."))
         return "news";
     return "secondary";
 }
+/**
+ * Recency boost from an ISO date or bare year: +3 <1y, +2 <2y, +1 <5y, 0 older/undated.
+ *
+ * Only the leading `YYYY[-M[-D]]` part of `date` is read. A missing month is
+ * taken as July and a missing day as the 15th, so a bare year lands mid-year.
+ * Age is measured against `now` (epoch ms) in 365.25-day years.
+ */
+function freshnessBoost(date, now = Date.now()) {
+    const parts = date ? /^(\d{4})(?:-(\d{1,2})(?:-(\d{1,2}))?)?/.exec(date.trim()) : null;
+    if (!parts)
+        return 0;
+    const [, year, month, day] = parts;
+    const stamp = Date.UTC(Number(year), month ? Number(month) - 1 : 6, day ? Number(day) : 15);
+    const ageYears = (now - stamp) / 31_557_600_000;
+    // [upper age bound in years, boost], youngest tier first.
+    const tiers = [[1, 3], [2, 2], [5, 1]];
+    for (const [limit, boost] of tiers) {
+        if (ageYears < limit)
+            return boost;
+    }
+    return 0;
+}
 /** ISO date if present, else a bare year. */
 function detectDate(text) {
     const iso = /\b(20\d{2}-\d{2}-\d{2})\b/.exec(text);
@@ -136,8 +187,7 @@ function scorePage(page, terms) {
         score += 4;
     if (["pypi.org", "npmjs.com", "rubygems.org"].includes(domain))
         score -= 2;
-    if (page.date)
-        score += 1;
+    score += freshnessBoost(page.date);
     const lowered = page.text.toLowerCase();
     for (const t of terms)
         if (lowered.includes(t))
@@ -158,6 +208,9 @@ function resultQualityScore(c) {
         score += 4;
     if (url.includes("github.com") || url.includes("gitlab.com"))
         score += 3;
+    if (c.engine === "arxiv" || c.engine === "crossref")
+        score += 3;
+    score += Math.min(2, freshnessBoost(c.date));
     if (LOW_VALUE_SNIPPET.some((t) => snippet.includes(t)))
         score -= 10;
     return score;

package/dist/state.js CHANGED Viewed

@@ -21,6 +21,8 @@ class RunState {
     usageByModel = new Map();
     totalUsage = { ...types_1.ZERO_USAGE };
     cost = 0;
+    /** Sampled cumulative token spend over time (budget sparkline). */
+    budgetSeries = [];
     finalSummary;
     finalReportPath;
     lastSeq = 0;
@@ -55,6 +57,7 @@ class RunState {
                 this.usageByModel.set(model, (0, types_1.addUsage)(this.usageByModel.get(model) ?? { ...types_1.ZERO_USAGE }, u));
                 this.totalUsage = (0, types_1.addUsage)(this.totalUsage, u);
                 this.cost += (0, types_1.usageCost)(u, this.pricing[model]);
+                this.pushBudgetPoint(ev.t);
             }
             return;
         }
@@ -127,6 +130,8 @@ class RunState {
                         t.openQuestions = ev.openQuestions;
                     if (Array.isArray(ev.filesTouched))
                         t.filesTouched = ev.filesTouched;
+                    if (Array.isArray(ev.sources))
+                        t.sources = ev.sources;
                 }
                 break;
             }
@@ -202,15 +207,17 @@ class RunState {
                     key: ev.key,
                     kind: ev.kind,
                     text: ev.text,
+                    url: typeof ev.url === "string" ? ev.url : undefined,
                 });
                 // Reduced state is held live by the hub and the resume seed — keep
-                // only the tail that digests/views actually use. Decisions are never
-                // dropped: they anchor the conductor's long-horizon coherence.
+                // only the tail that digests/views actually use. Decisions and
+                // conflicts are never dropped: they anchor long-horizon coherence.
                 if (this.notes.length > 1000) {
-                    const decisions = this.notes.filter((n) => n.kind === "decision");
-                    const rest = this.notes.filter((n) => n.kind !== "decision");
-                    rest.splice(0, rest.length - Math.max(0, 1000 - decisions.length));
-                    this.notes = [...decisions, ...rest].sort((a, b) => a.t - b.t);
+                    const keep = (n) => n.kind === "decision" || n.kind === "conflict";
+                    const pinned = this.notes.filter(keep);
+                    const rest = this.notes.filter((n) => !keep(n));
+                    rest.splice(0, rest.length - Math.max(0, 1000 - pinned.length));
+                    this.notes = [...pinned, ...rest].sort((a, b) => a.t - b.t);
                 }
                 break;
             case "conductor.say":
@@ -233,6 +240,7 @@ class RunState {
                 this.usageByModel.set(model, (0, types_1.addUsage)(this.usageByModel.get(model) ?? { ...types_1.ZERO_USAGE }, u));
                 this.totalUsage = (0, types_1.addUsage)(this.totalUsage, u);
                 this.cost += (0, types_1.usageCost)(u, this.pricing[model]);
+                this.pushBudgetPoint(ev.t);
                 break;
             }
             case "run.final":
@@ -241,6 +249,26 @@ class RunState {
                 break;
         }
     }
+    /**
+     * Sample the cumulative spend: a point per meaningful jump (≥0.5% of the
+     * budget cap, or 2k tokens unbounded), halving resolution past 600 points.
+     *
+     * The last point of the series is a live tail that always carries the
+     * current totals. The jump is measured from the point before it (the last
+     * committed sample), not from the tail itself: measuring from the tail,
+     * which is overwritten on every call, would mean a run of individually
+     * small usage events never accumulates into a new sample.
+     *
+     * @param t Timestamp of the usage event that triggered the sample.
+     */
+    pushBudgetPoint(t) {
+        const tokens = this.totalUsage.promptTokens + this.totalUsage.completionTokens;
+        const cap = this.meta?.options?.maxTokens ?? 0;
+        const minStep = cap > 0 ? Math.max(2000, cap * 0.005) : 2000;
+        const series = this.budgetSeries;
+        const tail = series[series.length - 1];
+        const anchor = series[series.length - 2];
+        if (tail && anchor && tokens - anchor.tokens < minStep) {
+            // Still within one step of the last committed sample: refresh the tail in place.
+            tail.t = t;
+            tail.tokens = tokens;
+            tail.cost = this.cost;
+            return;
+        }
+        series.push({ t, tokens, cost: this.cost });
+        if (series.length > 600) {
+            // Keep every other point, and always the newest one.
+            const newest = series.length - 1;
+            this.budgetSeries = series.filter((_, i) => i % 2 === 0 || i === newest);
+        }
+    }
     taskList() {
         return this.taskOrder.map((id) => this.tasks.get(id)).filter(Boolean);
     }