npm - @empir3/empir3-bridge - Versions diffs - 0.3.21 - Mend

@empir3/empir3-bridge 0.3.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

package/CHANGELOG.md +1531 -0
package/CODE_OF_CONDUCT.md +9 -0
package/CONTRIBUTING.md +75 -0
package/LICENSE +21 -0
package/README.md +464 -0
package/SECURITY.md +130 -0
package/assets/accuracy-lab.html +2639 -0
package/assets/api-clis-real.jpg +0 -0
package/assets/bridge-console-hero.jpg +0 -0
package/assets/browser-privacy.svg +151 -0
package/assets/demo-orchestration.svg +74 -0
package/assets/desktop-select-region.jpg +0 -0
package/assets/in-page-chat.gif +0 -0
package/assets/orchestration-hero.svg +126 -0
package/assets/social-preview.png +0 -0
package/assets/zara-accent.png +0 -0
package/build/bootstrap.js +548 -0
package/build/build.js +680 -0
package/build/payload-entry.js +649 -0
package/build/payload-signing-pub.json +7 -0
package/docs/AGENT_GUIDE.md +259 -0
package/docs/RELEASE.md +106 -0
package/docs/SAFETY.md +112 -0
package/docs/TESTING.md +181 -0
package/installer/server.js +231 -0
package/installer/ui/app.js +278 -0
package/installer/ui/index.html +24 -0
package/installer/ui/styles.css +146 -0
package/package.json +95 -0
package/scripts/bootstrap-e2e.mjs +650 -0
package/scripts/certify-bridge.mjs +636 -0
package/scripts/check-companion-surface.mjs +118 -0
package/scripts/extract-welcome.mjs +64 -0
package/scripts/gh-route-handler-check.mjs +57 -0
package/scripts/gh-wire-test.mjs +107 -0
package/scripts/publish-downloads.mjs +180 -0
package/scripts/smoke-all-tools.mjs +509 -0
package/scripts/smoke-live-bridge.mjs +696 -0
package/scripts/splice-welcome.mjs +63 -0
package/scripts/welcome-body.txt +2733 -0
package/src/anthropic-client.ts +192 -0
package/src/bootstrap-exe.ts +69 -0
package/src/bridge.ts +2444 -0
package/src/chat.ts +345 -0
package/src/cli-runner.ts +239 -0
package/src/cli.ts +649 -0
package/src/config.ts +199 -0
package/src/desktop-overlay.ps1 +121 -0
package/src/executable-resolver.ts +330 -0
package/src/handlers/agy-imagegen.ts +179 -0
package/src/handlers/github-cli.ts +399 -0
package/src/handlers/higgsfield-cli.ts +783 -0
package/src/launch.js +337 -0
package/src/mcp-server.ts +1265 -0
package/src/pair-claim.ts +218 -0
package/src/payload-daemon.ts +168 -0
package/src/server.ts +21036 -0
package/src/tool-defaults.ts +230 -0
package/src/update-check.js +136 -0
package/tray/build.py +76 -0
package/tray/requirements.txt +2 -0
package/tray/tray.py +1843 -0

package/src/chat.ts ADDED Viewed

@@ -0,0 +1,345 @@
+/**
+ * Chat orchestration — picks a runner (api | cli), runs the tool-use
+ * loop, persists every turn, yields a unified event stream the HTTP/SSE
+ * layer can serialize to the overlay.
+ *
+ * Responsibilities split:
+ *   - anthropic-client.ts streams raw model events
+ *   - cli-runner.ts streams the same shape from a `claude` subprocess
+ *   - this file picks one, drives the tool-use loop in API mode, and
+ *     dispatches tool calls back through the bridge's HTTP API
+ *
+ * Tool-use loop (API mode only):
+ *   1. Send messages + tools to the API, stream events
+ *   2. On tool_use_start → dispatch via /api/command, capture result
+ *   3. After message_end, if stop_reason === 'tool_use':
+ *      append assistant turn + tool_result turn to messages, restart
+ *   4. Loop caps at config.maxLoopIterations
+ *
+ * CLI mode currently runs without tool-use (see cli-runner.ts header).
+ */
+import { existsSync, mkdirSync, appendFileSync, readFileSync, readdirSync, statSync } from 'fs';
+import { join } from 'path';
+import { homedir } from 'os';
+import { randomUUID } from 'crypto';
+import { streamMessages, type AnthropicMessage, type AnthropicTool, type StreamEvent } from './anthropic-client.js';
+import { streamCli } from './cli-runner.js';
+import { loadConfig, type BridgeConfig, configReady } from './config.js';
+import { TOOL_META } from './tool-defaults.js';
+// Directory under the user's home that holds one `<conversationId>.jsonl` log per conversation.
+const CONV_DIR = join(homedir(), '.empir3-bridge', 'conversations');
+// ── Public chat-event shape (what the server SSE relays) ─────────
+/**
+ * Events yielded by `streamChat`.
+ *   - message_start: yielded once the config has been validated; carries the conversation id in use.
+ *   - text_delta:    a chunk of assistant text.
+ *   - tool_use:      the model requested a tool (API mode only).
+ *   - tool_result:   outcome of dispatching that tool; `id` is the id of the matching `tool_use`.
+ *   - usage:         token counts relayed from the active runner.
+ *   - message_end:   end of the reply; `iterations` is the number of model passes (always 1 in CLI mode).
+ *   - error:         a failure from config validation, a runner, or the tool-use loop cap.
+ */
+export type ChatEvent =
+  | { type: 'message_start'; conversationId: string; role: 'assistant' }
+  | { type: 'text_delta'; text: string }
+  | { type: 'tool_use'; id: string; name: string; input: unknown }
+  | { type: 'tool_result'; id: string; name: string; ok: boolean; output: string }
+  | { type: 'usage'; inputTokens: number; outputTokens: number }
+  | { type: 'message_end'; stopReason: string | null; iterations: number }
+  | { type: 'error'; message: string };
+/** Input accepted by `streamChat`. */
+export interface StreamChatRequest {
+  // Conversation so far. In CLI mode only the most recent `user` message is forwarded.
+  messages: AnthropicMessage[];
+  // Conversation log to append to; a random UUID is generated when omitted.
+  conversationId?: string;
+  // Forces a runner for this request; the configured `mode` is used when omitted.
+  modeOverride?: 'api' | 'cli';
+  // Abort signal handed to whichever runner is selected.
+  signal?: AbortSignal;
+  bridgeBaseUrl?: string; // base URL for tool dispatch; streamChat falls back to http://localhost:3006 when omitted (expected to be injected by server.ts)
+}
+// Fallback system prompt, used by streamChat when the loaded config has no `systemPrompt`.
+const DEFAULT_SYSTEM_PROMPT =
+  'You are Claude, running inside a local browser-bridge daemon. The user is viewing a web page in a Chrome window controlled by this bridge. ' +
+  'When you need to see or interact with the page, call the appropriate browser_* tool. Prefer browser_snapshot over browser_screenshot — it returns the accessibility tree with element refs (e0, e1, etc) which are cheaper and more reliable than coordinates. ' +
+  'Be concise. Only act when the user actually needs an action.';
+// ── Tool input schemas mirror src/mcp-server.ts so what the model
+//    sees in API mode is identical to what Claude Code sees through MCP.
+//    Keyed by tool name. buildToolDefs skips any tool that has no entry
+//    here, and dispatchTool reports names without a matching `case` as
+//    "Unknown tool", so a new tool needs an entry in both places.
+const TOOL_SCHEMAS: Record<string, AnthropicTool['input_schema']> = {
+  bridge_overlay_reinject: { type: 'object', properties: {} },
+  browser_status:       { type: 'object', properties: {} },
+  browser_text:         { type: 'object', properties: {} },
+  browser_screenshot:   { type: 'object', properties: {} },
+  desktop_monitors:     { type: 'object', properties: {} },
+  desktop_screenshot:   { type: 'object', properties: { monitor: { type: 'string', description: 'all, primary, DISPLAY1, DISPLAY2, or full device name. Default: all' } } },
+  browser_snapshot:     { type: 'object', properties: { filter: { type: 'string', enum: ['interactive', 'all'], description: 'Default: interactive' } } },
+  browser_navigate:     { type: 'object', properties: { url: { type: 'string' } }, required: ['url'] },
+  browser_scroll:       { type: 'object', properties: { y: { type: 'number', description: 'Vertical pixels (positive=down, negative=up)' }, x: { type: 'number' } }, required: ['y'] },
+  browser_refresh:      { type: 'object', properties: {} },
+  browser_click:        { type: 'object', properties: { selector: { type: 'string' } }, required: ['selector'] },
+  browser_click_ref:    { type: 'object', properties: { ref: { type: 'string', description: 'Element ref from snapshot (e.g. "e5")' } }, required: ['ref'] },
+  browser_click_xy:     { type: 'object', properties: { x: { type: 'number' }, y: { type: 'number' } }, required: ['x', 'y'] },
+  desktop_click:        { type: 'object', properties: { x: { type: 'number' }, y: { type: 'number' }, monitor: { type: 'string', description: 'Optional monitor id. When supplied, x/y are monitor-relative.' }, double: { type: 'boolean' }, button: { type: 'string', enum: ['left', 'right', 'middle'] } }, required: ['x', 'y'] },
+  desktop_hover:        { type: 'object', properties: { x: { type: 'number' }, y: { type: 'number' }, monitor: { type: 'string', description: 'Optional monitor id. When supplied, x/y are monitor-relative.' } }, required: ['x', 'y'] },
+  desktop_drag:         { type: 'object', properties: { x: { type: 'number' }, y: { type: 'number' }, toX: { type: 'number' }, toY: { type: 'number' }, monitor: { type: 'string', description: 'Optional monitor id. When supplied, both endpoints are monitor-relative.' }, durationMs: { type: 'number' }, steps: { type: 'number' }, button: { type: 'string', enum: ['left', 'right', 'middle'] } }, required: ['x', 'y', 'toX', 'toY'] },
+  browser_type:         { type: 'object', properties: { selector: { type: 'string' }, text: { type: 'string' } }, required: ['selector', 'text'] },
+  browser_type_ref:     { type: 'object', properties: { ref: { type: 'string' }, text: { type: 'string' } }, required: ['ref', 'text'] },
+  browser_press:        { type: 'object', properties: { key: { type: 'string', description: 'e.g. "Enter", "Tab", "Control+a"' } }, required: ['key'] },
+  browser_highlight:    { type: 'object', properties: { selector: { type: 'string' } }, required: ['selector'] },
+  browser_evaluate:     { type: 'object', properties: { script: { type: 'string', description: 'JS expression to evaluate on the page' } }, required: ['script'] },
+  browser_chat:         { type: 'object', properties: { message: { type: 'string' } }, required: ['message'] },
+  browser_read_chat:    { type: 'object', properties: { limit: { type: 'number' } } },
+  browser_record_start: { type: 'object', properties: {} },
+  browser_record_stop:  { type: 'object', properties: { name: { type: 'string' } } },
+  browser_play:         { type: 'object', properties: { recording: { type: 'string' }, speed: { type: 'number' }, variables: { type: 'object' } }, required: ['recording'] },
+  browser_recordings:   { type: 'object', properties: {} },
+};
+/**
+ * Builds the tool definitions sent to the model in API mode.
+ * A tool is included only when it is enabled in `cfg.enabledTools` and has an
+ * input schema in TOOL_SCHEMAS; output follows the order of TOOL_META.
+ */
+function buildToolDefs(cfg: BridgeConfig): AnthropicTool[] {
+  const defs: AnthropicTool[] = [];
+  for (const { name, blurb } of TOOL_META) {
+    // Disabled tools never reach the schema lookup.
+    const input_schema = cfg.enabledTools[name] ? TOOL_SCHEMAS[name] : undefined;
+    if (input_schema) defs.push({ name, description: blurb, input_schema });
+  }
+  return defs;
+}
+// ── Bridge-side dispatch ────────────────────────────────────────
+/**
+ * Executes one model-requested tool against the bridge's HTTP API.
+ *
+ * Never throws: HTTP failures, `{ ok: false }` envelopes, missing input fields
+ * and unknown tool names are all returned as `{ ok: false, output }` so the
+ * caller can hand the message back to the model as a tool error.
+ *
+ * @param name          Tool name (one of the keys of TOOL_SCHEMAS).
+ * @param input         Tool arguments produced by the model; not validated here.
+ * @param bridgeBaseUrl Base URL of the bridge HTTP server; paths are appended directly.
+ * @returns `ok` plus a text `output` suitable for a tool_result block.
+ */
+async function dispatchTool(name: string, input: any, bridgeBaseUrl: string): Promise<{ ok: boolean; output: string }> {
+  // /api/command wraps responses as { ok, result } | { ok:false, error }.
+  // Unwrap to result so dispatch sites can read fields directly.
+  const post = async (cmd: any) => {
+    const r = await fetch(`${bridgeBaseUrl}/api/command`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify(cmd),
+    });
+    if (!r.ok) throw new Error(`HTTP ${r.status}: ${await r.text().catch(() => '')}`);
+    const env = await r.json();
+    if (env && typeof env === 'object' && 'ok' in env) {
+      if (!env.ok) throw new Error(env.error || 'command failed');
+      return env.result ?? {};
+    }
+    // Responses without an `ok` field are passed through unchanged.
+    return env;
+  };
+  // Plain GET helper for the read-only endpoints.
+  const get = async (path: string) => {
+    const r = await fetch(`${bridgeBaseUrl}${path}`);
+    if (!r.ok) throw new Error(`HTTP ${r.status}`);
+    return r.json();
+  };
+  try {
+    switch (name) {
+      case 'browser_status':       return ok(JSON.stringify(await get('/api/status'), null, 2));
+      case 'bridge_overlay_reinject': return ok(JSON.stringify(await post({ type: 'overlay_reinject', reason: 'chat' }), null, 2));
+      case 'browser_text':         return ok((await post({ type: 'text' })).text || '(no text)');
+      case 'browser_snapshot': {
+        const r = await post({ type: 'snapshot', filter: input?.filter || 'interactive', format: 'compact' });
+        return ok(typeof r.snapshot === 'string' ? r.snapshot : JSON.stringify(r.snapshot, null, 2));
+      }
+      case 'browser_screenshot': {
+        // The image bytes are not returned to the model; only the size is reported.
+        const r = await fetch(`${bridgeBaseUrl}/api/screenshot?quality=50`);
+        if (!r.ok) return fail(`screenshot HTTP ${r.status}`);
+        const buf = Buffer.from(await r.arrayBuffer());
+        return ok(`[screenshot captured: ${buf.byteLength} bytes JPEG]`);
+      }
+      case 'desktop_monitors':     return ok(JSON.stringify(await post({ type: 'desktop_monitors' }), null, 2));
+      case 'desktop_screenshot':   return ok(JSON.stringify(await post({ type: 'desktop_screenshot', monitor: input?.monitor || 'all' }), null, 2));
+      case 'browser_navigate':     return ok(`Navigated to: ${(await post({ type: 'navigate', url: input.url })).url}`);
+      case 'browser_scroll': {
+        const r = await post({ type: 'scroll', x: input.x || 0, y: input.y });
+        return ok(JSON.stringify({ requested: r.scrolled, moved: r.moved, position: r.position, scroll: r.scroll }, null, 2));
+      }
+      case 'browser_refresh':      { await post({ type: 'refresh' }); return ok('Page refreshed'); }
+      case 'browser_click':        { await post({ type: 'click', selector: input.selector }); return ok(`Clicked: ${input.selector}`); }
+      case 'browser_click_ref':    { await post({ type: 'click_ref', ref: input.ref }); return ok(`Clicked ref: ${input.ref}`); }
+      case 'browser_click_xy':     { await post({ type: 'click_xy', x: input.x, y: input.y }); return ok(`Clicked coordinates: ${input.x},${input.y}`); }
+      case 'desktop_click':        {
+        // Coordinates are monitor-relative only when a monitor id is supplied.
+        const r = await post({ type: 'desktop_click', x: input.x, y: input.y, monitor: input.monitor, space: input.monitor ? 'monitor' : 'desktop', double: !!input.double, button: input.button || 'left' });
+        return ok(JSON.stringify(r, null, 2));
+      }
+      case 'desktop_hover':        {
+        const r = await post({ type: 'desktop_hover', x: input.x, y: input.y, monitor: input.monitor, space: input.monitor ? 'monitor' : 'desktop' });
+        return ok(JSON.stringify(r, null, 2));
+      }
+      case 'desktop_drag':         {
+        const r = await post({ type: 'desktop_drag', x: input.x, y: input.y, toX: input.toX, toY: input.toY, monitor: input.monitor, space: input.monitor ? 'monitor' : 'desktop', durationMs: input.durationMs, steps: input.steps, button: input.button || 'left' });
+        return ok(JSON.stringify(r, null, 2));
+      }
+      case 'browser_type':         { await post({ type: 'type', selector: input.selector, text: input.text }); return ok(`Typed into ${input.selector}`); }
+      case 'browser_type_ref':     { await post({ type: 'type_ref', ref: input.ref, text: input.text }); return ok(`Typed into ref:${input.ref}`); }
+      case 'browser_press':        { await post({ type: 'press', text: input.key }); return ok(`Pressed: ${input.key}`); }
+      case 'browser_highlight':    { await post({ type: 'highlight', selector: input.selector }); return ok(`Highlighted: ${input.selector}`); }
+      case 'browser_evaluate':     return ok(JSON.stringify(await post({ type: 'evaluate', script: input.script }), null, 2));
+      case 'browser_chat':         { await post({ type: 'chat', message: input.message }); return ok(`Sent to overlay: ${input.message}`); }
+      case 'browser_read_chat': {
+        const messages = await get('/api/chat');
+        // Only a finite limit >= 1 is honoured. `slice(-0)` would return the whole
+        // history and a negative limit would slice from the front, so anything
+        // else falls back to the default of 20.
+        const requested = input?.limit;
+        const limit = typeof requested === 'number' && Number.isFinite(requested) && requested >= 1 ? Math.floor(requested) : 20;
+        // A non-array payload is treated as an empty history instead of throwing.
+        const recent: any[] = Array.isArray(messages) ? messages.slice(-limit) : [];
+        if (recent.length === 0) return ok('(no messages)');
+        return ok(recent.map(m => `[${m.from}] ${m.text}`).join('\n'));
+      }
+      case 'browser_record_start': return ok(`Recording started at ${(await post({ type: 'record_start' })).startUrl}`);
+      case 'browser_record_stop':  {
+        // The optional recording name travels in the command's `text` field.
+        const r = await post({ type: 'record_stop', text: input?.name });
+        return ok(`Saved ${r.saved} (${r.actionCount} actions, ${(r.duration / 1000).toFixed(1)}s)`);
+      }
+      case 'browser_play': {
+        const r = await post({ type: 'play', recording: input.recording, speed: input.speed || 1, variables: input.variables || {} });
+        return ok(`Playback: ${r.passed}/${r.total} passed, ${r.failed} failed`);
+      }
+      case 'browser_recordings':   {
+        const list = await get('/api/recordings') as any[];
+        return ok(list.length === 0 ? '(no recordings)' : list.map(r => `${r.name} (${r.actionCount} actions, ${(r.duration / 1000).toFixed(1)}s)`).join('\n'));
+      }
+      default:                     return fail(`Unknown tool: ${name}`);
+    }
+  } catch (e: any) {
+    return fail(e?.message || String(e));
+  }
+}
+/** Wraps `output` as a successful tool result. */
+function ok(output: string) {
+  return { ok: true, output };
+}
+/** Wraps `output` as a failed tool result. */
+function fail(output: string) {
+  return { ok: false, output };
+}
+// ── Persistence ────────────────────────────────────────────────
+/** Creates the conversations directory (and any missing parents) if it does not exist. */
+function ensureConvDir() {
+  if (!existsSync(CONV_DIR)) mkdirSync(CONV_DIR, { recursive: true });
+}
+/**
+ * Maps a conversation id to its log file inside CONV_DIR.
+ * Returns null for ids that are empty or contain a path separator or NUL byte,
+ * so a caller-supplied id such as `../../x` can never address a file outside
+ * the conversations directory.
+ */
+function conversationFile(id: string): string | null {
+  if (typeof id !== 'string' || id.length === 0 || /[\\\/\0]/.test(id)) return null;
+  return join(CONV_DIR, `${id}.jsonl`);
+}
+/**
+ * Appends one entry (plus an ISO `ts` timestamp) to the conversation's JSONL log.
+ * Best-effort: unsafe ids and filesystem errors are ignored, never thrown.
+ */
+function persistTurn(conversationId: string, entry: any) {
+  const file = conversationFile(conversationId);
+  if (!file) return; // unsafe id — skip rather than write outside CONV_DIR
+  try {
+    ensureConvDir();
+    appendFileSync(file, JSON.stringify({ ...entry, ts: new Date().toISOString() }) + '\n');
+  } catch { /* swallow — persistence is best-effort */ }
+}
+/**
+ * Lists stored conversations, most recently modified first.
+ * @returns One record per `.jsonl` file; an empty array if the directory cannot be read.
+ */
+export function listConversations(): Array<{ id: string; size: number; mtime: string }> {
+  try {
+    ensureConvDir();
+    return readdirSync(CONV_DIR)
+      .filter(f => f.endsWith('.jsonl'))
+      .flatMap(f => {
+        // A file that vanishes between readdir and stat is skipped instead of
+        // emptying the whole listing.
+        try {
+          const stat = statSync(join(CONV_DIR, f));
+          return [{ id: f.replace(/\.jsonl$/, ''), size: stat.size, mtime: stat.mtime.toISOString() }];
+        } catch { return []; }
+      })
+      .sort((a, b) => b.mtime.localeCompare(a.mtime));
+  } catch { return []; }
+}
+/**
+ * Reads every parseable entry of one conversation log.
+ * @param id Conversation id (file name without `.jsonl`).
+ * @returns Parsed entries in file order; an empty array for unknown or unsafe ids and on read errors.
+ */
+export function readConversation(id: string): any[] {
+  try {
+    const path = conversationFile(id);
+    if (!path || !existsSync(path)) return [];
+    return readFileSync(path, 'utf-8')
+      .split('\n')
+      .filter(l => l.trim())
+      // Lines that are not valid JSON are dropped.
+      .map(l => { try { return JSON.parse(l); } catch { return null; } })
+      .filter(Boolean);
+  } catch { return []; }
+}
+// ── Main entry ─────────────────────────────────────────────────
+/**
+ * Runs one chat request and yields the unified event stream for the SSE layer.
+ *
+ * Flow:
+ *   - Loads the config; yields a single `error` and stops if it is not ready.
+ *   - Yields `message_start`, then persists the latest user message.
+ *   - CLI mode: forwards only the latest user message to the `claude`
+ *     subprocess (no tool use, no history replay) and relays its events.
+ *   - API mode: streams a model turn, dispatches any requested tools through
+ *     the bridge, appends the results and repeats, for at most
+ *     `cfg.maxLoopIterations` passes.
+ *
+ * Assistant turns, tool results and errors are appended to the conversation
+ * log on a best-effort basis.
+ *
+ * @param req Messages plus optional conversation id, mode override, abort signal and bridge URL.
+ * @yields ChatEvent values; a stream normally finishes with `message_end` or `error`.
+ */
+export async function* streamChat(req: StreamChatRequest): AsyncGenerator<ChatEvent> {
+  const cfg = loadConfig();
+  const ready = configReady(cfg);
+  if (!ready.ready) { yield { type: 'error', message: ready.reason || 'Config not ready' }; return; }
+  const mode = req.modeOverride || cfg.mode;
+  const conversationId = req.conversationId || randomUUID();
+  const bridgeBaseUrl = req.bridgeBaseUrl || `http://localhost:3006`;
+  const system = cfg.systemPrompt || DEFAULT_SYSTEM_PROMPT;
+  const tools = buildToolDefs(cfg);
+  yield { type: 'message_start', conversationId, role: 'assistant' };
+  // Persist the user's most recent turn (if any) so the conversation
+  // log lines up with the prompt that produced this stream.
+  const lastUser = [...req.messages].reverse().find(m => m.role === 'user');
+  if (lastUser) persistTurn(conversationId, { role: 'user', content: lastUser.content });
+  // CLI mode: no tool-use loop in v0.1.0. Also no multi-turn history —
+  // the `claude` CLI treats each input line as its own turn and responds
+  // separately, which produces N replies instead of one when we replay
+  // a conversation. Until v0.1.1 wires up --resume <session-id>, we send
+  // only the latest user message and rely on the CLI for that single turn.
+  if (mode === 'cli') {
+    const cliMessages = lastUser ? [lastUser] : req.messages;
+    let assistantText = '';
+    for await (const ev of streamCli({
+      cliPath: cfg.claudeCliPath,
+      model: cfg.model,
+      system,
+      messages: cliMessages,
+      signal: req.signal,
+    })) {
+      if (ev.type === 'text_delta') { assistantText += ev.text; yield ev; }
+      else if (ev.type === 'usage') yield ev;
+      else if (ev.type === 'message_end') yield { type: 'message_end', stopReason: ev.stopReason, iterations: 1 };
+      else if (ev.type === 'error') {
+        // Logged before yielding, matching API mode, so the record survives a
+        // consumer that stops reading at the error.
+        persistTurn(conversationId, { role: 'error', message: ev.message, mode: 'cli' });
+        yield ev;
+      }
+    }
+    if (assistantText) persistTurn(conversationId, { role: 'assistant', content: assistantText, mode: 'cli' });
+    return;
+  }
+  // API mode with tool-use loop.
+  const messages: AnthropicMessage[] = [...req.messages];
+  let iter = 0;
+  while (iter < cfg.maxLoopIterations) {
+    iter++;
+    let assistantText = '';
+    const toolUses: Array<{ id: string; name: string; input: any }> = [];
+    let lastStopReason: string | null = null;
+    let inputTokens = 0;
+    let outputTokens = 0;
+    for await (const ev of streamMessages({
+      apiKey: cfg.anthropicApiKey,
+      model: cfg.model,
+      maxTokens: cfg.maxTokens,
+      system,
+      messages,
+      tools,
+      signal: req.signal,
+    })) {
+      if (ev.type === 'text_delta') { assistantText += ev.text; yield ev; }
+      else if (ev.type === 'tool_use_start') {
+        toolUses.push({ id: ev.id, name: ev.name, input: ev.input });
+        yield { type: 'tool_use', id: ev.id, name: ev.name, input: ev.input };
+      }
+      else if (ev.type === 'usage') { inputTokens = ev.inputTokens; outputTokens = ev.outputTokens; yield ev; }
+      else if (ev.type === 'message_end') { lastStopReason = ev.stopReason; }
+      else if (ev.type === 'error') { persistTurn(conversationId, { role: 'error', message: ev.message }); yield ev; return; }
+    }
+    // Append assistant's turn to history. Preserve tool_use blocks so the
+    // next call has a complete record.
+    const assistantContent: any[] = [];
+    if (assistantText) assistantContent.push({ type: 'text', text: assistantText });
+    for (const tu of toolUses) assistantContent.push({ type: 'tool_use', id: tu.id, name: tu.name, input: tu.input });
+    if (assistantContent.length > 0) {
+      messages.push({ role: 'assistant', content: assistantContent });
+      persistTurn(conversationId, { role: 'assistant', content: assistantContent, mode: 'api', stopReason: lastStopReason, inputTokens, outputTokens, iter });
+    }
+    // No tool request: the reply is complete.
+    if (lastStopReason !== 'tool_use' || toolUses.length === 0) {
+      yield { type: 'message_end', stopReason: lastStopReason, iterations: iter };
+      return;
+    }
+    // Defense-in-depth: refuse any tool name that's not in the enabled list.
+    // (anthropic-client should never emit one because we filter the tools
+    // array, but trust nothing.)
+    const toolResults: any[] = [];
+    for (const tu of toolUses) {
+      let result: { ok: boolean; output: string };
+      if (!cfg.enabledTools[tu.name]) {
+        // Point at the bridge actually in use rather than a fixed port.
+        result = { ok: false, output: `Tool ${tu.name} is disabled in bridge settings (${bridgeBaseUrl}/settings).` };
+      } else {
+        result = await dispatchTool(tu.name, tu.input, bridgeBaseUrl);
+      }
+      yield { type: 'tool_result', id: tu.id, name: tu.name, ok: result.ok, output: result.output };
+      toolResults.push({ type: 'tool_result', tool_use_id: tu.id, content: result.output, ...(result.ok ? {} : { is_error: true }) });
+      persistTurn(conversationId, { role: 'tool_result', toolUseId: tu.id, name: tu.name, ok: result.ok, output: result.output });
+    }
+    messages.push({ role: 'user', content: toolResults });
+    // Loop continues with the tool results in context.
+  }
+  const capMessage = `Tool-use loop exceeded ${cfg.maxLoopIterations} iterations`;
+  persistTurn(conversationId, { role: 'error', message: capMessage });
+  yield { type: 'error', message: capMessage };
+}

package/src/cli-runner.ts ADDED Viewed

@@ -0,0 +1,239 @@
+/**
+ * Claude CLI runner — spawns the user's `claude` binary in stream-json
+ * mode and translates its stdout into the same StreamEvent shape that
+ * anthropic-client emits. So chat.ts can call either runner without
+ * branching on mode beyond the entry point.
+ *
+ * Why subprocess instead of API: a user with Claude Max already pays
+ * Anthropic for inference. Routing through their CLI means they don't
+ * pay twice.
+ *
+ * Tool integration: NOT wired here. v0.1.0 CLI mode = plain chat. To
+ * add browser tools to the CLI session, pass `--mcp-config <path>`
+ * pointing at this bridge's MCP server (deferred to v0.1.1 — the MCP
+ * shim already exists at dist/mcp-server.cjs, we just need a temp
+ * config file generator that filters by enabledTools). API mode in
+ * chat.ts runs the full tool-use loop today.
+ *
+ * Wave 2 reuse: this same module is the pattern Wave 2 M2.2 uses to
+ * route Empir3-server-driven turns through the user's local CLI.
+ */
+import { spawn, ChildProcessWithoutNullStreams } from 'child_process';
+import type { AnthropicMessage, StreamEvent } from './anthropic-client.js';
+/** Input accepted by `streamCli`. */
+export interface CliStreamRequest {
+  // Path to the `claude` executable. On Windows an extension-less path is
+  // swapped for its `.cmd` companion when that file exists.
+  cliPath: string;
+  // Passed to the CLI as `--model <model>` when set.
+  model?: string;
+  // NOTE(review): not read by streamCli or buildStreamJsonInput in this file,
+  // so the system prompt currently never reaches the CLI — confirm intent.
+  system?: string;
+  // Written to the CLI's stdin, one JSON line per message.
+  messages: AnthropicMessage[];
+  // Aborting sends SIGTERM, then SIGKILL after SIGTERM_GRACE_MS.
+  signal?: AbortSignal;
+  // Working directory for the subprocess.
+  cwd?: string;
+  // Appended verbatim after the built-in arguments.
+  extraArgs?: string[];
+}
+// Milliseconds to wait after SIGTERM before the subprocess is sent SIGKILL.
+const SIGTERM_GRACE_MS = 5000;
+/**
+ * Spawns the `claude` CLI in stream-json mode and yields its output as StreamEvents.
+ *
+ * Lifecycle:
+ *   1. Build argv and the JSONL stdin payload, then spawn the process
+ *      (through cmd.exe for Windows `.cmd`/`.bat` shims).
+ *   2. Parse stdout line by line; parsed events are queued and drained by
+ *      the generator as they arrive.
+ *   3. Once the process has closed, yield `error` (process error or non-zero
+ *      exit), or `usage` (when token counts were reported) then `message_end`.
+ *
+ * Aborting `req.signal`, or abandoning the generator before the process has
+ * exited, sends SIGTERM followed by SIGKILL after SIGTERM_GRACE_MS.
+ *
+ * @param req CLI path, optional model / extra args / cwd, messages and abort signal.
+ * @yields `text_delta`, `tool_use_start`, `error`, `usage` and `message_end` events.
+ */
+export async function* streamCli(req: CliStreamRequest): AsyncGenerator<StreamEvent> {
+  const args = ['--print', '--output-format', 'stream-json', '--input-format', 'stream-json', '--verbose'];
+  if (req.model) args.push('--model', req.model);
+  if (req.extraArgs && req.extraArgs.length) args.push(...req.extraArgs);
+  // Build the stdin payload: one JSON line per message in req.messages.
+  // NOTE(review): req.system is not forwarded to the CLI anywhere in this
+  // function — confirm whether that is intended.
+  const stdinPayload = buildStreamJsonInput(req);
+  // On Windows, the npm-installed `claude` ships as both a bare unix shim
+  // and a `.cmd` batch shim; the bare shim cannot be executed there. If the
+  // saved config still points at a path without an extension, transparently
+  // rewrite to the `.cmd` companion when it exists.
+  let cliPath = req.cliPath;
+  if (process.platform === 'win32' && !/\.(cmd|exe|bat|ps1)$/i.test(cliPath)) {
+    const fs = require('fs') as typeof import('fs');
+    if (fs.existsSync(cliPath + '.cmd')) cliPath = cliPath + '.cmd';
+  }
+  let child: ChildProcessWithoutNullStreams;
+  try {
+    // Node 18.20+/20.12+ refuse to spawn `.cmd`/`.bat` directly on Windows
+    // for security (CVE-2024-27980). The fix: spawn cmd.exe directly (an
+    // .exe, so no CVE applies) and pass the .cmd path as an argument.
+    // `shell: true` + quoted command is NOT used here because cmd.exe
+    // misinterprets the double-quote + backslash combo in Windows paths,
+    // silently dropping the `\` in `C:\` and failing with "not recognized".
+    const isWinShim = process.platform === 'win32' && /\.(cmd|bat)$/i.test(cliPath);
+    if (isWinShim) {
+      child = spawn('cmd.exe', ['/d', '/s', '/c', cliPath, ...args], {
+        stdio: ['pipe', 'pipe', 'pipe'],
+        cwd: req.cwd,
+        windowsHide: true,
+      });
+    } else {
+      child = spawn(cliPath, args, {
+        stdio: ['pipe', 'pipe', 'pipe'],
+        cwd: req.cwd,
+        windowsHide: true,
+      });
+    }
+  } catch (e: any) {
+    yield { type: 'error', message: `Failed to spawn claude CLI at ${cliPath}: ${e?.message || String(e)}` };
+    return;
+  }
+  // Shared state between the process callbacks and the drain loop below.
+  const queue: StreamEvent[] = [];
+  let waiter: ((v: void) => void) | null = null;
+  const wake = () => { if (waiter) { const w = waiter; waiter = null; w(); } };
+  let exited = false;
+  let exitCode = 0;
+  let processError = ''; // message of a child 'error' event, '' when none occurred
+  let stderrBuffer = '';
+  let stopReason: string | null = null;
+  let inputTokens = 0;
+  let outputTokens = 0;
+  let lineBuffer = '';
+  let streamedText = false; // true once a text delta arrived since the last `assistant` event
+  let killTimer: ReturnType<typeof setTimeout> | null = null;
+  const pendingTools = new Map<number, { id: string; name: string; jsonBuffer: string }>();
+  // Hook abort signal — SIGTERM, then SIGKILL after grace period.
+  const abortHandler = () => {
+    try { child.kill('SIGTERM'); } catch { /* ignore */ }
+    if (!killTimer) {
+      killTimer = setTimeout(() => { try { child.kill('SIGKILL'); } catch { /* ignore */ } }, SIGTERM_GRACE_MS);
+    }
+  };
+  if (req.signal) {
+    if (req.signal.aborted) abortHandler();
+    else req.signal.addEventListener('abort', abortHandler, { once: true });
+  }
+  // A child that failed to start or exited early makes the write fail with
+  // EPIPE; without a listener that would surface as an unhandled 'error'
+  // event. The failure itself is reported via the child's 'error'/'close'.
+  child.stdin.on('error', () => { /* reported through child events */ });
+  child.stdin.write(stdinPayload);
+  child.stdin.end();
+  // Decode at the stream level so a multi-byte character split across two
+  // chunks is reassembled instead of being corrupted.
+  child.stdout.setEncoding('utf8');
+  child.stderr.setEncoding('utf8');
+  // Parses one stdout line; blank lines, invalid JSON and non-object values are ignored.
+  const consumeLine = (raw: string) => {
+    const line = raw.trim();
+    if (!line) return;
+    let ev: any;
+    try { ev = JSON.parse(line); } catch { return; }
+    if (!ev || typeof ev !== 'object') return;
+    handleCliEvent(ev);
+  };
+  // Pump stdout chunks into a buffered queue the generator drains.
+  child.stdout.on('data', (chunk: string) => {
+    lineBuffer += chunk;
+    const lines = lineBuffer.split('\n');
+    lineBuffer = lines.pop() || '';
+    for (const raw of lines) consumeLine(raw);
+    wake();
+  });
+  child.stderr.on('data', (chunk: string) => { stderrBuffer += chunk; });
+  child.on('close', code => {
+    // Flush a final line that was not newline-terminated.
+    if (lineBuffer) { const rest = lineBuffer; lineBuffer = ''; consumeLine(rest); }
+    if (killTimer) { clearTimeout(killTimer); killTimer = null; }
+    exitCode = code ?? -1;
+    exited = true;
+    wake();
+  });
+  child.on('error', err => {
+    // Recorded separately: this can fire while exitCode is still 0, which
+    // would otherwise end the stream as if the CLI had succeeded.
+    processError = err.message || 'unknown process error';
+    stderrBuffer += `\n[spawn error] ${err.message}`;
+    exited = true;
+    wake();
+  });
+  function handleCliEvent(ev: any) {
+    // Token-level streaming deltas — preferred shape, matches API client.
+    if (ev.type === 'stream_event' && ev.event?.type === 'content_block_delta') {
+      const d = ev.event.delta;
+      if (d?.type === 'text_delta' && typeof d.text === 'string') {
+        streamedText = true;
+        queue.push({ type: 'text_delta', text: d.text });
+      } else if (d?.type === 'input_json_delta' && typeof d.partial_json === 'string') {
+        // Tool input arrives as JSON fragments keyed by content-block index.
+        const idx = ev.event.index;
+        const pending = pendingTools.get(idx);
+        if (pending) pending.jsonBuffer += d.partial_json;
+      }
+      return;
+    }
+    if (ev.type === 'stream_event' && ev.event?.type === 'content_block_start') {
+      const block = ev.event.content_block;
+      if (block?.type === 'tool_use') {
+        pendingTools.set(ev.event.index, { id: block.id, name: block.name, jsonBuffer: '' });
+      }
+      return;
+    }
+    if (ev.type === 'stream_event' && ev.event?.type === 'content_block_stop') {
+      const idx = ev.event.index;
+      const pending = pendingTools.get(idx);
+      if (pending) {
+        // Unparseable or empty tool input degrades to `{}`.
+        let parsed: unknown = {};
+        if (pending.jsonBuffer) { try { parsed = JSON.parse(pending.jsonBuffer); } catch { parsed = {}; } }
+        queue.push({ type: 'tool_use_start', id: pending.id, name: pending.name, input: parsed });
+        pendingTools.delete(idx);
+      }
+      return;
+    }
+    // Per-turn assistant fallback — when token-level streaming isn't
+    // available, the CLI still emits a complete `assistant` event. Its text
+    // is emitted only if no deltas were streamed since the previous
+    // `assistant` event, so streamed replies are not duplicated.
+    if (ev.type === 'assistant' && ev.message?.content) {
+      const alreadyStreamed = streamedText;
+      streamedText = false;
+      const content = ev.message.content;
+      if (Array.isArray(content) && !alreadyStreamed) {
+        const blocks = content as Array<{ type?: string; text?: string }>;
+        const text = blocks.filter(b => b?.type === 'text').map(b => b.text || '').join('');
+        if (text) queue.push({ type: 'text_delta', text });
+      }
+      return;
+    }
+    if (ev.type === 'result') {
+      if (ev.usage?.input_tokens) inputTokens = ev.usage.input_tokens;
+      if (ev.usage?.output_tokens) outputTokens = ev.usage.output_tokens;
+      if (ev.is_error || ev.subtype === 'error_during_execution' || ev.subtype === 'error_max_turns') {
+        const detail = typeof ev.result === 'string' && ev.result.trim()
+          ? ev.result.trim()
+          : `${ev.subtype || 'error'} (status ${ev.api_error_status ?? 'unknown'})`;
+        queue.push({ type: 'error', message: `[CLI ${ev.subtype || 'error'}] ${detail}` });
+        stopReason = 'error';
+      } else if (ev.subtype === 'success' || ev.stop_reason === 'end_turn') {
+        stopReason = 'end_turn';
+      } else if (ev.stop_reason === 'max_turns') {
+        stopReason = 'max_turns';
+      }
+    }
+  }
+  try {
+    // Drain loop: yield queued events as the subprocess produces them.
+    while (true) {
+      while (queue.length > 0) {
+        yield queue.shift()!;
+      }
+      if (exited) break;
+      await new Promise<void>(r => { waiter = r; });
+    }
+    // Skipped when the CLI already reported an error through a `result` event.
+    if (processError && stopReason !== 'error') {
+      yield { type: 'error', message: `claude CLI process error at ${cliPath}: ${processError}` };
+      return;
+    }
+    if (exitCode !== 0 && stopReason !== 'error') {
+      const msg = stderrBuffer.trim() || `claude CLI exited with code ${exitCode}`;
+      yield { type: 'error', message: msg };
+      return;
+    }
+    if (inputTokens > 0 || outputTokens > 0) {
+      yield { type: 'usage', inputTokens, outputTokens };
+    }
+    yield { type: 'message_end', stopReason };
+  } finally {
+    if (req.signal) req.signal.removeEventListener('abort', abortHandler);
+    // The consumer stopped reading before the process finished: do not leave
+    // the subprocess running in the background.
+    if (!exited) abortHandler();
+  }
+}
+/**
+ * Serializes `req.messages` into the newline-delimited JSON written to the
+ * CLI's stdin. Each message becomes one line whose `type` and `message.role`
+ * are the message role and whose content is a single text block; structured
+ * content is flattened to text first. The payload always ends with a newline.
+ */
+function buildStreamJsonInput(req: CliStreamRequest): string {
+  const jsonl = req.messages.map(({ role, content }) => {
+    const text = typeof content === 'string' ? content : flattenContent(content);
+    return JSON.stringify({
+      type: role,
+      message: { role, content: [{ type: 'text', text }] },
+    });
+  });
+  return jsonl.join('\n') + '\n';
+}
+/**
+ * Collapses structured content blocks into newline-joined plain text.
+ * Text blocks contribute their text; tool_result and tool_use blocks become
+ * bracketed placeholders; any other block type contributes an empty line.
+ */
+function flattenContent(blocks: Exclude<AnthropicMessage['content'], string>): string {
+  const rendered = blocks.map(block => {
+    switch (block.type) {
+      case 'text':
+        return block.text;
+      case 'tool_result':
+        return `[tool_result for ${block.tool_use_id}]\n${block.content}`;
+      case 'tool_use':
+        return `[tool_use: ${block.name}]`;
+      default:
+        return '';
+    }
+  });
+  return rendered.join('\n');
+}