npm - agent-sh - Versions diffs - 0.4.0 → 0.6.0 - Mend

agent-sh 0.4.0 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

package/README.md +37 -115
package/dist/agent/agent-loop.d.ts +86 -0
package/dist/agent/agent-loop.js +704 -0
package/dist/agent/conversation-state.d.ts +27 -0
package/dist/agent/conversation-state.js +59 -0
package/dist/agent/index.d.ts +11 -0
package/dist/agent/index.js +9 -0
package/dist/agent/skills.d.ts +25 -0
package/dist/agent/skills.js +186 -0
package/dist/agent/subagent.d.ts +37 -0
package/dist/agent/subagent.js +119 -0
package/dist/agent/system-prompt.d.ts +14 -0
package/dist/agent/system-prompt.js +103 -0
package/dist/agent/tool-registry.d.ts +15 -0
package/dist/agent/tool-registry.js +30 -0
package/dist/agent/tools/bash.d.ts +7 -0
package/dist/agent/tools/bash.js +71 -0
package/dist/agent/tools/display.d.ts +13 -0
package/dist/agent/tools/display.js +70 -0
package/dist/agent/tools/edit-file.d.ts +2 -0
package/dist/agent/tools/edit-file.js +148 -0
package/dist/agent/tools/glob.d.ts +2 -0
package/dist/agent/tools/glob.js +87 -0
package/dist/agent/tools/grep.d.ts +2 -0
package/dist/agent/tools/grep.js +168 -0
package/dist/agent/tools/list-skills.d.ts +2 -0
package/dist/agent/tools/list-skills.js +28 -0
package/dist/agent/tools/ls.d.ts +2 -0
package/dist/agent/tools/ls.js +72 -0
package/dist/agent/tools/read-file.d.ts +10 -0
package/dist/agent/tools/read-file.js +101 -0
package/dist/agent/tools/user-shell.d.ts +13 -0
package/dist/agent/tools/user-shell.js +84 -0
package/dist/agent/tools/write-file.d.ts +2 -0
package/dist/agent/tools/write-file.js +82 -0
package/dist/agent/types.d.ts +78 -0
package/dist/agent/types.js +1 -0
package/dist/core.d.ts +22 -14
package/dist/core.js +256 -36
package/dist/event-bus.d.ts +98 -17
package/dist/event-bus.js +10 -1
package/dist/extension-loader.d.ts +1 -1
package/dist/extension-loader.js +10 -1
package/dist/extensions/command-suggest.d.ts +10 -0
package/dist/extensions/command-suggest.js +41 -0
package/dist/extensions/slash-commands.d.ts +1 -1
package/dist/extensions/slash-commands.js +161 -64
package/dist/extensions/tui-renderer.js +426 -126
package/dist/index.js +110 -129
package/dist/input-handler.js +78 -9
package/dist/output-parser.d.ts +7 -0
package/dist/output-parser.js +27 -0
package/dist/settings.d.ts +53 -2
package/dist/settings.js +46 -3
package/dist/shell.js +35 -28
package/dist/types.d.ts +33 -6
package/dist/utils/box-frame.d.ts +3 -1
package/dist/utils/box-frame.js +12 -5
package/dist/utils/diff.js +10 -0
package/dist/utils/llm-client.d.ts +45 -0
package/dist/utils/llm-client.js +60 -0
package/dist/utils/markdown.d.ts +1 -0
package/dist/utils/markdown.js +25 -3
package/dist/utils/stream-transform.js +20 -47
package/dist/utils/tool-display.d.ts +4 -0
package/dist/utils/tool-display.js +35 -8
package/examples/extensions/claude-code-bridge/README.md +35 -0
package/examples/extensions/claude-code-bridge/index.ts +194 -0
package/examples/extensions/claude-code-bridge/package.json +11 -0
package/examples/extensions/openrouter.ts +87 -0
package/examples/extensions/pi-bridge/README.md +35 -0
package/examples/extensions/pi-bridge/index.ts +263 -0
package/examples/extensions/pi-bridge/package.json +13 -0
package/examples/extensions/secret-guard.ts +100 -0
package/examples/extensions/subagents.ts +87 -0
package/package.json +3 -5
package/dist/acp-client.d.ts +0 -105
package/dist/acp-client.js +0 -684
package/dist/extensions/shell-exec.d.ts +0 -24
package/dist/extensions/shell-exec.js +0 -188
package/dist/mcp-server.d.ts +0 -13
package/dist/mcp-server.js +0 -234
package/examples/pi-agent-sh.ts +0 -166

package/dist/agent/agent-loop.js ADDED Viewed

@@ -0,0 +1,704 @@
+import { setMaxListeners } from "node:events";
+import * as fs from "node:fs/promises";
+import * as path from "node:path";
+import { computeDiff } from "../utils/diff.js";
+import { ToolRegistry } from "./tool-registry.js";
+import { ConversationState } from "./conversation-state.js";
+import { STATIC_SYSTEM_PROMPT, buildDynamicContext } from "./system-prompt.js";
+// Core tool factories
+import { createBashTool } from "./tools/bash.js";
+import { createReadFileTool } from "./tools/read-file.js";
+import { createWriteFileTool } from "./tools/write-file.js";
+import { createEditFileTool } from "./tools/edit-file.js";
+import { createGrepTool } from "./tools/grep.js";
+import { createGlobTool } from "./tools/glob.js";
+import { createLsTool } from "./tools/ls.js";
+import { createUserShellTool } from "./tools/user-shell.js";
+import { createDisplayTool } from "./tools/display.js";
+import { createListSkillsTool } from "./tools/list-skills.js";
+import { discoverProjectSkills } from "./skills.js";
+export class AgentLoop {
+    /** Event bus used for every subscription and emitted event. */
+    bus;
+    /** Supplies the working directory (getCwd) and is handed to buildDynamicContext. */
+    contextManager;
+    /** LLM client; its `model` is read/assigned and `reconfigure()` is called on mode changes. */
+    llmClient;
+    /** Named-handler registry; `define()` and `call()` are used on it. */
+    handlers;
+    /** AbortController of the in-flight query; null while no query is running. */
+    abortController = null;
+    /** Registry holding the core tools plus any registered through registerTool(). */
+    toolRegistry = new ToolRegistry();
+    /** Message history of the current session; replaced on "agent:reset-session". */
+    conversation = new ConversationState();
+    /** Map passed to the read-file tool factory; an entry is deleted after a successful file-modifying tool call. */
+    fileReadCache = new Map();
+    /** Selectable modes; each entry has `model` and may carry provider, providerConfig, contextWindow, reasoning, supportsReasoningEffort. */
+    modes;
+    /** Index into `modes` of the active mode. */
+    currentModeIndex = 0;
+    /** `{ event, fn }` pairs registered by wire(), kept so unwire() can detach them. */
+    boundListeners = [];
+    /** Names of the project skills seen at the last "shell:cwd-change". */
+    lastProjectSkillNames = new Set();
+    /** Values accepted by "config:set-thinking". */
+    static THINKING_LEVELS = ["off", "low", "medium", "high"];
+    /** Currently selected thinking level; one of THINKING_LEVELS. */
+    thinkingLevel = "off";
+    constructor(bus, contextManager, llmClient, handlers, modeConfig, initialModeIndex) {
+        this.bus = bus;
+        this.contextManager = contextManager;
+        this.llmClient = llmClient;
+        this.handlers = handlers;
+        // Default modes: just the configured model
+        this.modes = modeConfig ?? [
+            { model: llmClient.model },
+        ];
+        this.currentModeIndex = initialModeIndex ?? 0;
+        // Register core tools
+        this.registerCoreTools();
+        // Register handlers — extensions can advise these
+        this.registerHandlers();
+    }
+    /** Subscribe to bus events — activates this backend. */
+    wire() {
+        const on = (event, fn) => {
+            this.bus.on(event, fn);
+            this.boundListeners.push({ event, fn });
+        };
+        on("agent:submit", ({ query }) => {
+            this.handleQuery(query).catch(() => { });
+        });
+        on("agent:cancel-request", (e) => {
+            this.abortController?.abort(e.silent ? "silent" : undefined);
+        });
+        on("config:cycle", () => this.cycleMode());
+        on("config:switch-model", ({ model: target }) => {
+            const idx = this.modes.findIndex((m) => m.model === target);
+            if (idx === -1) {
+                this.bus.emit("ui:error", { message: `Unknown model: ${target}` });
+                return;
+            }
+            this.currentModeIndex = idx;
+            const m = this.modes[idx];
+            if (m.providerConfig) {
+                this.llmClient.reconfigure({ ...m.providerConfig, model: m.model });
+            }
+            else {
+                this.llmClient.model = m.model;
+            }
+            const label = m.provider ? `${m.provider}: ${m.model}` : m.model;
+            this.bus.emit("agent:info", { name: "agent-sh", version: "0.4", model: m.model, provider: m.provider, contextWindow: m.contextWindow });
+            this.bus.emit("ui:info", { message: `Model: ${label}` });
+            this.bus.emit("config:changed", {});
+        });
+        this.bus.onPipe("config:get-models", (payload) => {
+            const models = this.modes.map((m) => ({ model: m.model, provider: m.provider ?? "" }));
+            const active = this.modes[this.currentModeIndex]?.model ?? null;
+            return { models, active };
+        });
+        on("config:set-thinking", ({ level }) => {
+            if (!AgentLoop.THINKING_LEVELS.includes(level)) {
+                this.bus.emit("ui:error", { message: `Unknown thinking level: ${level}. Use: ${AgentLoop.THINKING_LEVELS.join(", ")}` });
+                return;
+            }
+            const mode = this.currentMode;
+            if (level !== "off" && mode.reasoning === false) {
+                this.bus.emit("ui:error", { message: `Model ${mode.model} does not support thinking.` });
+                return;
+            }
+            if (level !== "off" && mode.supportsReasoningEffort === false) {
+                this.bus.emit("ui:error", { message: `Provider ${mode.provider ?? "unknown"} does not support reasoning_effort.` });
+                return;
+            }
+            this.thinkingLevel = level;
+            this.bus.emit("ui:info", { message: `Thinking: ${level}` });
+            this.bus.emit("config:changed", {});
+        });
+        this.bus.onPipe("config:get-thinking", () => {
+            const mode = this.currentMode;
+            const supported = mode.reasoning !== false && mode.supportsReasoningEffort !== false;
+            return { level: this.thinkingLevel, levels: AgentLoop.THINKING_LEVELS, supported };
+        });
+        on("config:set-modes", ({ modes: newModes }) => {
+            this.modes = newModes;
+            this.currentModeIndex = 0;
+            const m = this.modes[0];
+            if (m.providerConfig) {
+                this.llmClient.reconfigure({ ...m.providerConfig, model: m.model });
+            }
+            else {
+                this.llmClient.model = m.model;
+            }
+            this.bus.emit("config:changed", {});
+        });
+        on("agent:reset-session", () => {
+            this.cancel();
+            this.conversation = new ConversationState();
+            this.lastProjectSkillNames.clear();
+        });
+        on("shell:cwd-change", ({ cwd }) => {
+            const projectSkills = discoverProjectSkills(cwd);
+            const newNames = new Set(projectSkills.map(s => s.name));
+            // Check if the set of project skills changed
+            if (newNames.size === this.lastProjectSkillNames.size &&
+                [...newNames].every(n => this.lastProjectSkillNames.has(n))) {
+                return; // no change
+            }
+            this.lastProjectSkillNames = newNames;
+            if (projectSkills.length > 0) {
+                const names = projectSkills.map(s => s.name).join(", ");
+                this.conversation.addSystemNote(`[Project skills available: ${names}. Use list_skills for details, read_file to load.]`);
+            }
+        });
+    }
+    /** Unsubscribe from bus events — deactivates this backend. */
+    unwire() {
+        for (const { event, fn } of this.boundListeners) {
+            this.bus.off(event, fn);
+        }
+        this.boundListeners = [];
+    }
+    /** Register a tool (used by extensions via ctx.registerTool). */
+    registerTool(tool) {
+        this.toolRegistry.register(tool);
+    }
+    /** Get all registered tools. */
+    getTools() {
+        return this.toolRegistry.all();
+    }
+    /** Stop the backend; currently just delegates to cancel(). */
+    kill() {
+        this.cancel();
+    }
+    cancel() {
+        this.abortController?.abort();
+    }
+    /** Check if reasoning_effort should be sent for the current model/provider. */
+    shouldSendReasoningEffort() {
+        if (this.thinkingLevel === "off")
+            return false;
+        const mode = this.currentMode;
+        if (mode.reasoning === false)
+            return false;
+        if (mode.supportsReasoningEffort === false)
+            return false;
+        return true;
+    }
+    cycleMode() {
+        const prevMode = this.modes[this.currentModeIndex];
+        this.currentModeIndex =
+            (this.currentModeIndex + 1) % this.modes.length;
+        const newMode = this.modes[this.currentModeIndex];
+        // Reconfigure LlmClient if provider changed
+        if (newMode.provider !== prevMode.provider && newMode.providerConfig) {
+            this.llmClient.reconfigure({
+                apiKey: newMode.providerConfig.apiKey,
+                baseURL: newMode.providerConfig.baseURL,
+                model: newMode.model,
+            });
+        }
+        else {
+            this.llmClient.model = newMode.model;
+        }
+        const label = newMode.provider
+            ? `${newMode.provider}: ${newMode.model}`
+            : newMode.model;
+        this.bus.emit("agent:info", { name: "agent-sh", version: "0.4", model: newMode.model, provider: newMode.provider, contextWindow: newMode.contextWindow });
+        this.bus.emit("ui:info", { message: `Model: ${label}` });
+        this.bus.emit("config:changed", {});
+    }
+    get currentMode() {
+        return this.modes[this.currentModeIndex];
+    }
+    get currentModel() {
+        return this.modes[this.currentModeIndex].model;
+    }
+    isContextOverflow(e) {
+        if (!(e instanceof Error))
+            return false;
+        const msg = e.message.toLowerCase();
+        return msg.includes("context") || msg.includes("token") || msg.includes("too long");
+    }
+    /** Check if an error is retryable (transient). */
+    isRetryable(e) {
+        if (!(e instanceof Error))
+            return false;
+        const msg = e.message.toLowerCase();
+        // Network errors
+        if (msg.includes("econnreset") || msg.includes("econnrefused") ||
+            msg.includes("etimedout") || msg.includes("fetch failed") ||
+            msg.includes("network") || msg.includes("socket hang up")) {
+            return true;
+        }
+        // HTTP status-based (OpenAI SDK includes status in error)
+        const status = e.status;
+        if (status === 429 || status === 500 || status === 502 || status === 503 || status === 529) {
+            return true;
+        }
+        return false;
+    }
+    /** Extract retry delay from error headers or use exponential backoff. */
+    getRetryDelay(e, attempt) {
+        // Check for Retry-After header (OpenAI SDK exposes headers)
+        const headers = e.headers;
+        if (headers) {
+            const retryAfter = headers["retry-after"] ?? headers.get?.("retry-after");
+            if (retryAfter) {
+                const seconds = parseInt(retryAfter, 10);
+                if (!isNaN(seconds))
+                    return seconds * 1000;
+            }
+        }
+        // Exponential backoff: 1s, 2s, 4s, 8s, capped at 30s
+        return Math.min(1000 * Math.pow(2, attempt), 30_000);
+    }
+    /** Format an error with provider context for user-facing display. */
+    formatError(e) {
+        const raw = e instanceof Error ? e.message : String(e);
+        const status = e.status;
+        const model = this.currentModel;
+        const baseURL = this.llmClient.config?.baseURL;
+        const provider = this.currentMode.provider;
+        // Connection errors — most likely misconfigured provider
+        if (raw.includes("ECONNREFUSED") || raw.includes("ECONNRESET") ||
+            raw.includes("ETIMEDOUT") || raw.includes("fetch failed") ||
+            raw.includes("socket hang up")) {
+            const target = baseURL ?? provider ?? "provider";
+            return `Could not connect to ${target} (${raw}). Check that the API endpoint is reachable.`;
+        }
+        // Auth errors
+        if (status === 401 || raw.toLowerCase().includes("auth")) {
+            return `Authentication failed for ${provider ?? "provider"} (model: ${model}). Check your API key.`;
+        }
+        // Model not found
+        if (status === 404) {
+            return `Model "${model}" not found at ${provider ?? baseURL ?? "provider"}. Check the model name.`;
+        }
+        // Rate limit (after retries exhausted)
+        if (status === 429) {
+            return `Rate limited by ${provider ?? "provider"} (model: ${model}). Try again in a moment.`;
+        }
+        // Generic with context
+        const context = provider ? ` (${provider}, model: ${model})` : ` (model: ${model})`;
+        return `${raw}${context}`;
+    }
+    registerCoreTools() {
+        const getCwd = () => this.contextManager.getCwd();
+        const getEnv = () => {
+            const env = {};
+            for (const [k, v] of Object.entries(process.env)) {
+                if (v !== undefined)
+                    env[k] = v;
+            }
+            return env;
+        };
+        this.toolRegistry.register(createBashTool({ getCwd, getEnv, bus: this.bus }));
+        this.toolRegistry.register(createReadFileTool(getCwd, this.fileReadCache));
+        this.toolRegistry.register(createWriteFileTool(getCwd));
+        this.toolRegistry.register(createEditFileTool(getCwd));
+        this.toolRegistry.register(createGrepTool(getCwd));
+        this.toolRegistry.register(createGlobTool(getCwd));
+        this.toolRegistry.register(createLsTool(getCwd));
+        this.toolRegistry.register(createUserShellTool({ getCwd, bus: this.bus }));
+        this.toolRegistry.register(createDisplayTool({ getCwd, bus: this.bus }));
+        this.toolRegistry.register(createListSkillsTool(getCwd));
+    }
+    /**
+     * Register named handlers that extensions can advise.
+     * Only high-power use cases where multiple extensions compose.
+     */
+    registerHandlers() {
+        const h = this.handlers;
+        // Extensions compose additional context (git info, project rules, etc.)
+        h.define("dynamic-context:build", () => buildDynamicContext(this.toolRegistry.all(), this.contextManager));
+        // Full control over what the LLM sees: takes messages[], returns messages[].
+        // Default: pass through. Extensions can advise to compact, summarize,
+        // filter, reorder, inject — whatever strategy fits.
+        h.define("conversation:prepare", (messages) => messages);
+        // Wraps each tool call: permission → execute → emit events.
+        // Extensions advise to add safe-mode, logging, metrics, custom policies.
+        // The ctx.onChunk callback is exposed so advisors can wrap it to
+        // intercept/transform streamed tool output (e.g. secret redaction).
+        h.define("tool:execute", async (ctx) => {
+            const { name, id, args, tool } = ctx;
+            const display = tool.getDisplayInfo?.(args) ?? { kind: "execute" };
+            let diffShown = false;
+            // Permission gating
+            if (tool.requiresPermission) {
+                let permKind = "tool-call";
+                let permTitle = typeof args.description === "string"
+                    ? `${name}: ${args.description}`
+                    : name;
+                let metadata = { args };
+                // For file-modifying tools, pre-compute diff for display
+                if (tool.modifiesFiles && typeof args.path === "string") {
+                    try {
+                        const absPath = path.resolve(process.cwd(), args.path);
+                        let oldContent = null;
+                        try {
+                            oldContent = await fs.readFile(absPath, "utf-8");
+                        }
+                        catch { /* new file */ }
+                        let newContent;
+                        if (typeof args.content === "string") {
+                            // write_file
+                            newContent = args.content;
+                        }
+                        else if (typeof args.old_text === "string" && typeof args.new_text === "string" && oldContent) {
+                            // edit_file
+                            newContent = oldContent.replace(args.old_text.replace(/\r\n/g, "\n"), args.new_text.replace(/\r\n/g, "\n"));
+                        }
+                        if (newContent !== undefined) {
+                            const diff = computeDiff(oldContent, newContent);
+                            if (!diff.isIdentical) {
+                                permKind = "file-write";
+                                // Shorten path for display
+                                const cwd = process.cwd();
+                                const home = process.env.HOME;
+                                let displayPath = absPath;
+                                if (absPath.startsWith(cwd + "/"))
+                                    displayPath = absPath.slice(cwd.length + 1);
+                                else if (home && absPath.startsWith(home + "/"))
+                                    displayPath = "~/" + absPath.slice(home.length + 1);
+                                permTitle = displayPath;
+                                metadata = { args, diff };
+                                diffShown = true;
+                            }
+                        }
+                    }
+                    catch { /* fall back to generic permission */ }
+                }
+                const perm = await this.bus.emitPipeAsync("permission:request", {
+                    kind: permKind,
+                    title: permTitle,
+                    metadata,
+                    decision: { outcome: "approved" },
+                });
+                if (perm.decision.outcome !== "approved") {
+                    return { content: "Permission denied by user.", exitCode: 1, isError: true };
+                }
+            }
+            // Emit tool-started for TUI
+            const label = tool.displayName ?? name;
+            this.bus.emit("agent:tool-started", {
+                title: typeof args.description === "string" ? `${label}: ${args.description}` : label,
+                toolCallId: id,
+                kind: display.kind, icon: display.icon, locations: display.locations, rawInput: args,
+                displayDetail: tool.formatCall?.(args),
+                batchIndex: ctx.batchIndex, batchTotal: ctx.batchTotal,
+            });
+            this.bus.emit("agent:tool-call", { tool: name, args });
+            // Execute — use ctx.onChunk so advisors can wrap the streaming callback.
+            // Suppress streaming output if diff was already shown.
+            const onChunk = (tool.showOutput !== false && !diffShown)
+                ? ctx.onChunk
+                : undefined;
+            const result = await tool.execute(args, onChunk);
+            // Invalidate read cache when a file is modified
+            if (tool.modifiesFiles && typeof args.path === "string" && !result.isError) {
+                const absPath = path.resolve(process.cwd(), args.path);
+                this.fileReadCache.delete(absPath);
+            }
+            // Compute result display: tool-provided → default (none)
+            const resultDisplay = tool.formatResult?.(args, result);
+            // Emit completion events (via transform pipe so extensions can override)
+            this.bus.emitTransform("agent:tool-completed", {
+                toolCallId: id, exitCode: result.exitCode,
+                rawOutput: result.content, kind: display.kind,
+                resultDisplay,
+            });
+            this.bus.emit("agent:tool-output", {
+                tool: name, output: result.content, exitCode: result.exitCode,
+            });
+            return result;
+        });
+    }
+    async handleQuery(query) {
+        // Cancel any in-flight loop (concurrent prompt handling)
+        if (this.abortController) {
+            this.abortController.abort();
+        }
+        this.abortController = new AbortController();
+        const signal = this.abortController.signal;
+        // Each loop iteration adds an abort listener (via OpenAI SDK stream);
+        // raise the limit to avoid spurious warnings on multi-tool queries.
+        setMaxListeners(50, signal);
+        this.bus.emit("agent:query", { query });
+        this.bus.emit("agent:processing-start", {});
+        let responseText = "";
+        try {
+            this.conversation.addUserMessage(query);
+            responseText = await this.executeLoop(signal);
+        }
+        catch (e) {
+            if (signal.aborted && signal.reason !== "silent") {
+                this.bus.emit("agent:cancelled", {});
+            }
+            else if (!signal.aborted) {
+                const msg = this.formatError(e);
+                this.bus.emit("agent:error", { message: msg });
+            }
+        }
+        finally {
+            // Ensure any buffered text in the stream transform pipeline gets
+            // flushed as a complete line before response-done closes the box.
+            if (responseText && !responseText.endsWith("\n")) {
+                this.bus.emitTransform("agent:response-chunk", {
+                    blocks: [{ type: "text", text: "\n" }],
+                });
+            }
+            this.bus.emitTransform("agent:response-done", {
+                response: responseText,
+            });
+            this.bus.emit("agent:processing-done", {});
+            this.abortController = null;
+        }
+    }
+    /** Max tokens before auto-compaction (conservative default). */
+    maxContextTokens = 60_000;
+    /**
+     * Core agent loop: stream LLM response → execute tools → repeat.
+     * Returns the final accumulated response text.
+     */
+    async executeLoop(signal) {
+        let fullResponseText = "";
+        while (!signal.aborted) {
+            // Auto-compact if conversation is getting large
+            const estimatedTokens = Math.ceil(JSON.stringify(this.conversation.getMessages()).length / 4);
+            if (estimatedTokens > this.maxContextTokens) {
+                this.conversation.compact(10);
+                this.bus.emit("ui:info", { message: "(conversation compacted)" });
+            }
+            // System prompt is static (cacheable); dynamic context uses handler
+            // so extensions can compose additional context via advise()
+            const systemPrompt = STATIC_SYSTEM_PROMPT;
+            const dynamicContext = this.handlers.call("dynamic-context:build");
+            // Stream LLM response with retry
+            const result = await this.streamWithRetry(systemPrompt, dynamicContext, signal);
+            const { text, toolCalls, assistantContent, assistantToolCalls } = result;
+            fullResponseText += text;
+            // Record the assistant message in conversation
+            this.conversation.addAssistantMessage(assistantContent, assistantToolCalls);
+            // No tool calls → agent is done
+            if (toolCalls.length === 0)
+                break;
+            // Emit batch info so the TUI can render group headers upfront
+            {
+                const groupMap = new Map();
+                for (const tc of toolCalls) {
+                    const tool = this.toolRegistry.get(tc.name);
+                    const kind = tool?.getDisplayInfo?.((() => { try {
+                        return JSON.parse(tc.argumentsJson);
+                    }
+                    catch {
+                        return {};
+                    } })())?.kind ?? "execute";
+                    let args = {};
+                    try {
+                        args = JSON.parse(tc.argumentsJson);
+                    }
+                    catch { }
+                    const detail = tool?.formatCall?.(args);
+                    if (!groupMap.has(kind))
+                        groupMap.set(kind, []);
+                    groupMap.get(kind).push({ name: tc.name, displayDetail: detail });
+                }
+                const groups = Array.from(groupMap.entries()).map(([kind, tools]) => ({ kind, tools }));
+                this.bus.emit("agent:tool-batch", { groups });
+            }
+            // Execute tool calls — run read-only tools in parallel, permission-
+            // requiring tools sequentially (to avoid overlapping permission prompts).
+            const batchTotal = toolCalls.length;
+            const executeSingle = async (tc, batchIndex) => {
+                const tool = this.toolRegistry.get(tc.name);
+                if (!tool) {
+                    this.conversation.addToolResult(tc.id, `Error: Unknown tool "${tc.name}"`);
+                    return;
+                }
+                let args;
+                try {
+                    args = JSON.parse(tc.argumentsJson);
+                }
+                catch {
+                    this.conversation.addToolResult(tc.id, `Error: Invalid JSON arguments for ${tc.name}`);
+                    return;
+                }
+                // Execute via handler — extensions can advise to add safe-mode,
+                // logging, metrics, custom permission policies, etc.
+                const defaultOnChunk = (chunk) => {
+                    this.bus.emit("agent:tool-output-chunk", { chunk });
+                };
+                const result = await this.handlers.call("tool:execute", { name: tc.name, id: tc.id, args, tool, onChunk: defaultOnChunk,
+                    batchIndex, batchTotal: batchTotal > 1 ? batchTotal : undefined });
+                // Add tool result to conversation (truncate large outputs to avoid
+                // blowing through the context window on a single tool call)
+                let content = result.isError
+                    ? `Error: ${result.content}`
+                    : result.content;
+                const maxBytes = 16_384; // ~4k tokens
+                if (content.length > maxBytes) {
+                    const headBytes = Math.floor(maxBytes * 0.6);
+                    const tailBytes = maxBytes - headBytes;
+                    const lines = content.split("\n");
+                    let headEnd = 0, headLen = 0;
+                    for (let i = 0; i < lines.length && headLen + lines[i].length + 1 <= headBytes; i++) {
+                        headLen += lines[i].length + 1;
+                        headEnd = i + 1;
+                    }
+                    let tailStart = lines.length, tailLen = 0;
+                    for (let i = lines.length - 1; i >= headEnd && tailLen + lines[i].length + 1 <= tailBytes; i--) {
+                        tailLen += lines[i].length + 1;
+                        tailStart = i;
+                    }
+                    const omitted = tailStart - headEnd;
+                    content = [
+                        ...lines.slice(0, headEnd),
+                        `\n[… ${omitted} lines omitted (output truncated to ${Math.round(maxBytes / 1024)}KB) …]\n`,
+                        ...lines.slice(tailStart),
+                    ].join("\n");
+                }
+                this.conversation.addToolResult(tc.id, content);
+            };
+            // Partition into parallel-safe (read-only) and sequential (needs permission)
+            const parallel = [];
+            const sequential = [];
+            for (const tc of toolCalls) {
+                const tool = this.toolRegistry.get(tc.name);
+                if (tool && !tool.requiresPermission && !tool.modifiesFiles) {
+                    parallel.push(tc);
+                }
+                else {
+                    sequential.push(tc);
+                }
+            }
+            // Run read-only tools in parallel
+            let batchIdx = 0;
+            if (parallel.length > 0 && !signal.aborted) {
+                await Promise.all(parallel.map(tc => {
+                    const idx = ++batchIdx;
+                    return signal.aborted ? Promise.resolve() : executeSingle(tc, idx);
+                }));
+            }
+            // Run permission-requiring tools sequentially
+            for (const tc of sequential) {
+                if (signal.aborted)
+                    break;
+                await executeSingle(tc, ++batchIdx);
+            }
+            // Loop back — LLM sees tool results
+        }
+        return fullResponseText;
+    }
+    maxRetries = 3;
+    /**
+     * Stream with retry logic. Handles:
+     *   - Context overflow → compact and retry
+     *   - Rate limits (429) → backoff with Retry-After
+     *   - Transient errors (500/502/503, network) → exponential backoff
+     */
+    async streamWithRetry(systemPrompt, dynamicContext, signal) {
+        for (let attempt = 0; attempt <= this.maxRetries; attempt++) {
+            try {
+                return await this.streamResponse(systemPrompt, dynamicContext, signal);
+            }
+            catch (e) {
+                if (signal.aborted)
+                    throw e;
+                // Context overflow — compact and retry (no backoff needed)
+                if (this.isContextOverflow(e)) {
+                    this.conversation.compact(6);
+                    this.bus.emit("ui:info", { message: "(context overflow — compacted, retrying)" });
+                    continue;
+                }
+                // Retryable transient error — backoff
+                if (this.isRetryable(e) && attempt < this.maxRetries) {
+                    const delay = this.getRetryDelay(e, attempt);
+                    const status = e.status;
+                    const reason = status === 429 ? "rate limited" : `error ${status ?? "network"}`;
+                    this.bus.emit("ui:info", {
+                        message: `(${reason}, retrying in ${Math.ceil(delay / 1000)}s — attempt ${attempt + 2}/${this.maxRetries + 1})`,
+                    });
+                    await new Promise((resolve, reject) => {
+                        const timer = setTimeout(resolve, delay);
+                        signal.addEventListener("abort", () => { clearTimeout(timer); reject(new Error("aborted")); }, { once: true });
+                    });
+                    continue;
+                }
+                // Non-retryable or exhausted retries
+                throw e;
+            }
+        }
+        // Should not reach here, but TypeScript needs it
+        throw new Error("Retry loop exhausted");
+    }
+    /**
+     * Stream a single LLM response. Returns accumulated text, parsed tool calls,
+     * and the raw assistant message data for conversation recording.
+     */
+    async streamResponse(systemPrompt, dynamicContext, signal) {
+        let text = "";
+        const pendingToolCalls = [];
+        const rawMessages = [
+            { role: "system", content: systemPrompt },
+            { role: "user", content: `<context>\n${dynamicContext}\n</context>` },
+            { role: "assistant", content: "Understood." },
+            ...this.conversation.getMessages(),
+        ];
+        // Let extensions transform the message array (compact, summarize, filter, etc.)
+        const messages = this.handlers.call("conversation:prepare", rawMessages);
+        const stream = await this.llmClient.stream({
+            messages,
+            tools: this.toolRegistry.toAPITools(),
+            model: this.currentModel,
+            reasoning_effort: this.shouldSendReasoningEffort() ? this.thinkingLevel : undefined,
+            signal,
+        });
+        for await (const chunk of stream) {
+            if (signal.aborted)
+                break;
+            const choice = chunk.choices[0];
+            if (!choice)
+                continue;
+            const delta = choice.delta;
+            // Text content
+            if (delta?.content) {
+                text += delta.content;
+                this.bus.emitTransform("agent:response-chunk", {
+                    blocks: [{ type: "text", text: delta.content }],
+                });
+            }
+            // Reasoning/thinking tokens (non-standard, e.g. DeepSeek)
+            if (delta?.reasoning_content) {
+                this.bus.emit("agent:thinking-chunk", {
+                    text: delta.reasoning_content,
+                });
+            }
+            // Tool calls (streamed incrementally)
+            if (delta?.tool_calls) {
+                for (const tc of delta.tool_calls) {
+                    const idx = tc.index;
+                    if (!pendingToolCalls[idx]) {
+                        pendingToolCalls[idx] = {
+                            id: tc.id,
+                            name: tc.function.name,
+                            argumentsJson: "",
+                        };
+                    }
+                    if (tc.function?.arguments) {
+                        pendingToolCalls[idx].argumentsJson +=
+                            tc.function.arguments;
+                    }
+                }
+            }
+            // Token usage (final chunk from providers that support it)
+            if (chunk.usage) {
+                const u = chunk.usage;
+                this.bus.emit("agent:usage", {
+                    prompt_tokens: u.prompt_tokens ?? 0,
+                    completion_tokens: u.completion_tokens ?? 0,
+                    total_tokens: u.total_tokens ?? 0,
+                });
+            }
+        }
+        // Build assistant tool calls for conversation recording
+        const assistantToolCalls = pendingToolCalls.length
+            ? pendingToolCalls.map((tc) => ({
+                id: tc.id,
+                function: { name: tc.name, arguments: tc.argumentsJson },
+            }))
+            : undefined;
+        return {
+            text,
+            toolCalls: pendingToolCalls,
+            assistantContent: text || null,
+            assistantToolCalls,
+        };
+    }
+}