@zds-ai/cli 0.1.5 → 0.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (75)
  1. package/dist/agent/grok-agent.d.ts +5 -1
  2. package/dist/agent/grok-agent.js +243 -30
  3. package/dist/agent/grok-agent.js.map +1 -1
  4. package/dist/agent/llm-agent.d.ts +276 -0
  5. package/dist/agent/llm-agent.js +2839 -0
  6. package/dist/agent/llm-agent.js.map +1 -0
  7. package/dist/agent/prompt-variables.d.ts +33 -5
  8. package/dist/agent/prompt-variables.js +162 -28
  9. package/dist/agent/prompt-variables.js.map +1 -1
  10. package/dist/bin/fastcaption.sh +3 -2
  11. package/dist/bin/generate_image_sd.sh +1 -1
  12. package/dist/grok/client.d.ts +9 -9
  13. package/dist/grok/client.js +3 -4
  14. package/dist/grok/client.js.map +1 -1
  15. package/dist/grok/tools.d.ts +5 -5
  16. package/dist/grok/tools.js +12 -12
  17. package/dist/grok/tools.js.map +1 -1
  18. package/dist/hooks/use-input-handler.d.ts +3 -3
  19. package/dist/hooks/use-input-handler.js +19 -12
  20. package/dist/hooks/use-input-handler.js.map +1 -1
  21. package/dist/index.js +17 -10
  22. package/dist/index.js.map +1 -1
  23. package/dist/mcp/client.js +10 -2
  24. package/dist/mcp/client.js.map +1 -1
  25. package/dist/tools/character-tool.js +1 -1
  26. package/dist/tools/character-tool.js.map +1 -1
  27. package/dist/tools/clear-cache-tool.js +1 -1
  28. package/dist/tools/clear-cache-tool.js.map +1 -1
  29. package/dist/tools/file-conversion-tool.js +1 -1
  30. package/dist/tools/file-conversion-tool.js.map +1 -1
  31. package/dist/tools/image-tool.d.ts +2 -2
  32. package/dist/tools/image-tool.js +5 -3
  33. package/dist/tools/image-tool.js.map +1 -1
  34. package/dist/tools/internet-tool.js +1 -1
  35. package/dist/tools/internet-tool.js.map +1 -1
  36. package/dist/tools/introspect-tool.js +7 -12
  37. package/dist/tools/introspect-tool.js.map +1 -1
  38. package/dist/tools/task-tool.js +1 -1
  39. package/dist/tools/task-tool.js.map +1 -1
  40. package/dist/tools/text-editor.js +1 -1
  41. package/dist/tools/text-editor.js.map +1 -1
  42. package/dist/tools/zsh.js +1 -1
  43. package/dist/tools/zsh.js.map +1 -1
  44. package/dist/ui/components/active-task-status.d.ts +2 -2
  45. package/dist/ui/components/api-key-input.d.ts +2 -2
  46. package/dist/ui/components/api-key-input.js +2 -2
  47. package/dist/ui/components/api-key-input.js.map +1 -1
  48. package/dist/ui/components/backend-status.d.ts +2 -2
  49. package/dist/ui/components/chat-history.d.ts +1 -1
  50. package/dist/ui/components/chat-history.js +1 -1
  51. package/dist/ui/components/chat-history.js.map +1 -1
  52. package/dist/ui/components/chat-interface.d.ts +2 -2
  53. package/dist/ui/components/chat-interface.js +4 -0
  54. package/dist/ui/components/chat-interface.js.map +1 -1
  55. package/dist/ui/components/context-status.d.ts +2 -2
  56. package/dist/ui/components/model-selection.js +1 -1
  57. package/dist/ui/components/model-selection.js.map +1 -1
  58. package/dist/ui/components/mood-status.d.ts +2 -2
  59. package/dist/ui/components/persona-status.d.ts +2 -2
  60. package/dist/utils/chat-history-manager.d.ts +1 -1
  61. package/dist/utils/hook-executor.d.ts +8 -2
  62. package/dist/utils/hook-executor.js +138 -13
  63. package/dist/utils/hook-executor.js.map +1 -1
  64. package/dist/utils/rephrase-handler.d.ts +2 -2
  65. package/dist/utils/rephrase-handler.js.map +1 -1
  66. package/dist/utils/settings-manager.d.ts +5 -0
  67. package/dist/utils/settings-manager.js +6 -0
  68. package/dist/utils/settings-manager.js.map +1 -1
  69. package/dist/utils/slash-commands.d.ts +7 -3
  70. package/dist/utils/slash-commands.js +17 -17
  71. package/dist/utils/slash-commands.js.map +1 -1
  72. package/dist/utils/startup-hook.d.ts +3 -3
  73. package/dist/utils/startup-hook.js +9 -4
  74. package/dist/utils/startup-hook.js.map +1 -1
  75. package/package.json +1 -1
@@ -0,0 +1,2839 @@
1
+ import { LLMClient } from "../grok/client.js";
2
+ import { getAllLLMTools, getMCPManager, initializeMCPServers, } from "../grok/tools.js";
3
+ import { loadMCPConfig } from "../mcp/config.js";
4
+ import { ChatHistoryManager } from "../utils/chat-history-manager.js";
5
+ import { logApiError } from "../utils/error-logger.js";
6
+ import { parseImagesFromMessage, hasImageReferences } from "../utils/image-encoder.js";
7
+ import { getTextContent } from "../utils/content-utils.js";
8
+ import { Variable } from "./prompt-variables.js";
9
+ import fs from "fs";
10
+ import { TextEditorTool, MorphEditorTool, ZshTool, ConfirmationTool, SearchTool, EnvTool, IntrospectTool, ClearCacheTool, CharacterTool, TaskTool, InternetTool, ImageTool, FileConversionTool, RestartTool } from "../tools/index.js";
11
+ import { EventEmitter } from "events";
12
+ import { createTokenCounter } from "../utils/token-counter.js";
13
+ import { getSettingsManager } from "../utils/settings-manager.js";
14
+ import { executeOperationHook, executeToolApprovalHook, applyHookCommands } from "../utils/hook-executor.js";
15
// Streaming token-count refresh cadence, in milliseconds.
const TOKEN_UPDATE_INTERVAL_MS = 250;
// Floor on the delay applied when a task is stopped, so the UI/UX winds down smoothly (ms).
const MINIMUM_STOP_TASK_DELAY_MS = 3000;
// Upper bound on attempts to unwrap nested/stringified JSON inside executeTool.
const MAX_JSON_PARSE_ATTEMPTS = 5;
/**
 * Character-count threshold above which an AI response is considered "substantial".
 */
const SUBSTANTIAL_RESPONSE_THRESHOLD = 50;
25
+ /**
26
+ * Extracts the first complete JSON object from a string.
27
+ * Handles duplicate/concatenated JSON objects (LLM bug) like: {"key":"val"}{"key":"val"}
28
+ * @param jsonString The string potentially containing concatenated JSON objects
29
+ * @returns The first complete JSON object, or the original string if no duplicates found
30
+ */
31
/**
 * Extracts the first complete JSON object from a string.
 * Handles duplicate/concatenated JSON objects (LLM bug) like: {"key":"val"}{"key":"val"}
 * Brace depth is tracked only OUTSIDE string literals, so braces embedded in
 * string values (e.g. {"a":"}{"}) no longer derail the scan — the previous
 * implementation counted every brace and fell back to returning the whole
 * concatenated string whenever a value contained "}" or "{".
 * @param jsonString The string potentially containing concatenated JSON objects
 * @returns The first complete JSON object, or the original string if no duplicates found
 */
function extractFirstJsonObject(jsonString) {
    // Fast path: no back-to-back objects anywhere, nothing to extract.
    if (!jsonString.includes('}{'))
        return jsonString;
    try {
        // Scan for the end of the first complete JSON object, skipping
        // braces that occur inside string literals (with \" escape handling).
        let depth = 0;
        let inString = false;
        let escaped = false;
        let firstObjEnd = -1;
        for (let i = 0; i < jsonString.length; i++) {
            const ch = jsonString[i];
            if (escaped) {
                // Previous char was a backslash inside a string: this char is literal.
                escaped = false;
                continue;
            }
            if (inString) {
                if (ch === "\\") {
                    escaped = true;
                }
                else if (ch === '"') {
                    inString = false;
                }
                continue;
            }
            if (ch === '"') {
                inString = true;
                continue;
            }
            if (ch === "{")
                depth++;
            if (ch === "}") {
                depth--;
                if (depth === 0) {
                    firstObjEnd = i + 1;
                    break;
                }
            }
        }
        if (firstObjEnd > 0 && firstObjEnd < jsonString.length) {
            // Extract and validate first object
            const firstObj = jsonString.substring(0, firstObjEnd);
            JSON.parse(firstObj); // Validate it's valid JSON
            return firstObj;
        }
    }
    catch {
        // If extraction fails, return the original string
    }
    return jsonString;
}
61
+ /**
62
+ * Cleans up LLM-generated JSON argument strings for tool calls.
63
+ * Removes duplicate/concatenated JSON objects and trims.
64
+ * @param args The raw arguments string from the tool call
65
+ * @returns Cleaned and sanitized argument string
66
+ */
67
/**
 * Cleans up LLM-generated JSON argument strings for tool calls.
 * Removes duplicate/concatenated JSON objects and trims.
 * @param args The raw arguments string from the tool call
 * @returns Cleaned and sanitized argument string
 */
function sanitizeToolArguments(args) {
    // Empty/whitespace-only/missing arguments default to an empty object.
    const trimmed = args?.trim() || "{}";
    // Drop duplicate/concatenated JSON objects (known LLM bug); when no
    // duplicate is present, extractFirstJsonObject returns the input unchanged.
    return extractFirstJsonObject(trimmed);
}
76
+ export class LLMAgent extends EventEmitter {
77
+ llmClient;
78
+ textEditor;
79
+ morphEditor;
80
+ zsh;
81
+ confirmationTool;
82
+ search;
83
+ env;
84
+ introspect;
85
+ clearCacheTool;
86
+ characterTool;
87
+ taskTool;
88
+ internetTool;
89
+ imageTool;
90
+ fileConversionTool;
91
+ restartTool;
92
+ chatHistory = [];
93
+ messages = [];
94
+ tokenCounter;
95
+ abortController = null;
96
+ mcpInitialized = false;
97
+ maxToolRounds;
98
+ temperature;
99
+ maxTokens;
100
+ firstMessageProcessed = false;
101
+ contextWarningAt80 = false;
102
+ contextWarningAt90 = false;
103
+ persona = "";
104
+ personaColor = "white";
105
+ mood = "";
106
+ moodColor = "white";
107
+ activeTask = "";
108
+ activeTaskAction = "";
109
+ activeTaskColor = "white";
110
+ apiKeyEnvVar = "GROK_API_KEY";
111
+ pendingContextEditSession = null;
112
+ rephraseState = null;
113
+ hookPrefillText = null;
114
+ constructor(apiKey, baseURL, model, maxToolRounds, debugLogFile, startupHookOutput, temperature, maxTokens) {
115
+ super();
116
+ const manager = getSettingsManager();
117
+ const savedModel = manager.getCurrentModel();
118
+ const modelToUse = model || savedModel || "grok-code-fast-1";
119
+ this.maxToolRounds = maxToolRounds || 400;
120
+ this.temperature = temperature ?? manager.getTemperature();
121
+ this.maxTokens = maxTokens ?? manager.getMaxTokens();
122
+ // Get display name from environment (set by zai/helpers)
123
+ const displayName = process.env.GROK_BACKEND_DISPLAY_NAME;
124
+ this.llmClient = new LLMClient(apiKey, modelToUse, baseURL, displayName);
125
+ // Set apiKeyEnvVar based on backend name
126
+ const backendName = this.llmClient.getBackendName().toUpperCase();
127
+ this.apiKeyEnvVar = `${backendName}_API_KEY`;
128
+ this.textEditor = new TextEditorTool();
129
+ this.morphEditor = process.env.MORPH_API_KEY ? new MorphEditorTool() : null;
130
+ this.zsh = new ZshTool();
131
+ this.confirmationTool = new ConfirmationTool();
132
+ this.search = new SearchTool();
133
+ this.env = new EnvTool();
134
+ this.introspect = new IntrospectTool();
135
+ this.clearCacheTool = new ClearCacheTool();
136
+ this.restartTool = new RestartTool();
137
+ this.characterTool = new CharacterTool();
138
+ this.taskTool = new TaskTool();
139
+ this.internetTool = new InternetTool();
140
+ this.imageTool = new ImageTool();
141
+ this.fileConversionTool = new FileConversionTool();
142
+ this.textEditor.setAgent(this); // Give text editor access to agent for context awareness
143
+ this.introspect.setAgent(this); // Give introspect access to agent for tool class info
144
+ this.clearCacheTool.setAgent(this); // Give clearCache access to agent
145
+ this.characterTool.setAgent(this); // Give character tool access to agent
146
+ this.taskTool.setAgent(this); // Give task tool access to agent
147
+ this.internetTool.setAgent(this); // Give internet tool access to agent
148
+ this.imageTool.setAgent(this); // Give image tool access to agent
149
+ this.zsh.setAgent(this); // Give zsh tool access to agent for CWD tracking
150
+ this.tokenCounter = createTokenCounter(modelToUse);
151
+ // Initialize MCP servers if configured
152
+ this.initializeMCP(debugLogFile);
153
+ // System message will be set after async initialization
154
+ this.messages.push({
155
+ role: "system",
156
+ content: "Initializing...", // Temporary, will be replaced in initialize()
157
+ });
158
+ // Note: THE system prompt is NOT added to chatHistory
159
+ // Only conversational system messages go in chatHistory
160
+ // Store startup hook output for later use
161
+ this.startupHookOutput = startupHookOutput;
162
+ }
163
+ startupHookOutput;
164
+ systemPrompt = "Initializing..."; // THE system prompt (always at messages[0])
165
+ hasRunInstanceHook = false;
166
+ /**
167
+ * Initialize the agent with dynamic system prompt
168
+ * Must be called after construction
169
+ */
170
+ async initialize() {
171
+ // Build system message
172
+ await this.buildSystemMessage();
173
+ }
174
+ /**
175
+ * Build/rebuild the system message with current tool availability
176
+ * Updates this.systemPrompt which is always used for messages[0]
177
+ */
178
+ async buildSystemMessage() {
179
+ // Generate dynamic tool list using introspect tool
180
+ const toolsResult = await this.introspect.introspect("tools");
181
+ const toolsSection = toolsResult.success ? toolsResult.output : "Tools: Unknown";
182
+ // Set APP:TOOLS variable
183
+ Variable.set("APP:TOOLS", toolsSection);
184
+ // Build THE system prompt
185
+ this.systemPrompt = Variable.renderFull('SYSTEM');
186
+ // Update messages[0] with the system prompt
187
+ this.messages[0] = {
188
+ role: "system",
189
+ content: this.systemPrompt,
190
+ };
191
+ // Note: chatHistory no longer contains THE system prompt
192
+ // Only conversational system messages (persona, mood, etc.) go in chatHistory
193
+ }
194
+ async loadInitialHistory(history, systemPrompt) {
195
+ // Load chatHistory (no system messages in new architecture)
196
+ this.chatHistory = history;
197
+ // Set system prompt if provided, otherwise generate one
198
+ if (systemPrompt) {
199
+ this.setSystemPrompt(systemPrompt);
200
+ }
201
+ else {
202
+ await this.buildSystemMessage();
203
+ }
204
+ // Instance hook now runs in initialize() for both fresh and existing sessions
205
+ // Convert history to messages format for API calls
206
+ const historyMessages = [];
207
+ // Track which tool_call_ids we've seen in assistant messages
208
+ const seenToolCallIds = new Set();
209
+ // First pass: collect all tool_call_ids from assistant messages
210
+ for (const entry of history) {
211
+ if (entry.type === "assistant" && entry.tool_calls) {
212
+ entry.tool_calls.forEach(tc => seenToolCallIds.add(tc.id));
213
+ }
214
+ }
215
+ // Second pass: build history messages, only including tool_results that have matching tool_calls
216
+ const toolResultMessages = [];
217
+ const toolCallIdToMessage = new Map();
218
+ for (const entry of history) {
219
+ switch (entry.type) {
220
+ case "system":
221
+ // All system messages from chatHistory go into conversation (persona, mood, etc.)
222
+ // System messages must always be strings
223
+ historyMessages.push({
224
+ role: "system",
225
+ content: getTextContent(entry.content),
226
+ });
227
+ break;
228
+ case "user":
229
+ // User messages can have images (content arrays)
230
+ historyMessages.push({
231
+ role: "user",
232
+ content: entry.content || "",
233
+ });
234
+ break;
235
+ case "assistant":
236
+ // Assistant messages are always text (no images in responses)
237
+ const assistantMessage = {
238
+ role: "assistant",
239
+ content: getTextContent(entry.content) || "", // Ensure content is never null/undefined
240
+ };
241
+ if (entry.tool_calls && entry.tool_calls.length > 0) {
242
+ // For assistant messages with tool calls, collect the tool results that correspond to them
243
+ const correspondingToolResults = [];
244
+ const toolCallsWithResults = [];
245
+ entry.tool_calls.forEach(tc => {
246
+ // Find the tool_result entry for this tool_call
247
+ const toolResultEntry = history.find(h => h.type === "tool_result" && h.toolCall?.id === tc.id);
248
+ if (toolResultEntry) {
249
+ // Only include this tool_call if we have its result
250
+ toolCallsWithResults.push(tc);
251
+ correspondingToolResults.push({
252
+ role: "tool",
253
+ content: toolResultEntry.toolResult?.output || toolResultEntry.toolResult?.error || "",
254
+ tool_call_id: tc.id,
255
+ });
256
+ }
257
+ });
258
+ // Only add tool_calls if we have at least one with a result
259
+ if (toolCallsWithResults.length > 0) {
260
+ assistantMessage.tool_calls = toolCallsWithResults;
261
+ // Add assistant message
262
+ historyMessages.push(assistantMessage);
263
+ // Add corresponding tool results immediately after
264
+ historyMessages.push(...correspondingToolResults);
265
+ }
266
+ else {
267
+ // No tool results found, just add the assistant message without tool_calls
268
+ historyMessages.push(assistantMessage);
269
+ }
270
+ }
271
+ else {
272
+ historyMessages.push(assistantMessage);
273
+ }
274
+ break;
275
+ case "tool_result":
276
+ // Skip tool_result entries here - they're handled when processing assistant messages with tool_calls
277
+ break;
278
+ // Skip tool_call entries as they are included with assistant
279
+ }
280
+ }
281
+ // Insert history messages after the system message
282
+ this.messages.splice(1, 0, ...historyMessages);
283
+ // Update token count in system message
284
+ const currentTokens = this.tokenCounter.countTokens(this.messages.map(m => typeof m.content === 'string' ? m.content : '').join(''));
285
+ if (this.messages.length > 0 && this.messages[0].role === 'system' && typeof this.messages[0].content === 'string') {
286
+ this.messages[0].content = this.messages[0].content.replace(/Current conversation token usage: .*/, `Current conversation token usage: ${currentTokens}`);
287
+ }
288
+ }
289
+ async initializeMCP(debugLogFile) {
290
+ // Initialize MCP in the background without blocking
291
+ Promise.resolve().then(async () => {
292
+ try {
293
+ const config = loadMCPConfig();
294
+ if (config.servers.length > 0) {
295
+ await initializeMCPServers(debugLogFile);
296
+ }
297
+ }
298
+ catch (error) {
299
+ console.warn("MCP initialization failed:", error);
300
+ }
301
+ finally {
302
+ this.mcpInitialized = true;
303
+ }
304
+ });
305
+ }
306
+ isGrokModel() {
307
+ const currentModel = this.llmClient.getCurrentModel();
308
+ return currentModel.toLowerCase().includes("grok");
309
+ }
310
+ // Heuristic: enable web search only when likely needed
311
+ shouldUseSearchFor(message) {
312
+ const q = message.toLowerCase();
313
+ const keywords = [
314
+ "today",
315
+ "latest",
316
+ "news",
317
+ "trending",
318
+ "breaking",
319
+ "current",
320
+ "now",
321
+ "recent",
322
+ "x.com",
323
+ "twitter",
324
+ "tweet",
325
+ "what happened",
326
+ "as of",
327
+ "update on",
328
+ "release notes",
329
+ "changelog",
330
+ "price",
331
+ ];
332
+ if (keywords.some((k) => q.includes(k)))
333
+ return true;
334
+ // crude date pattern (e.g., 2024/2025) may imply recency
335
+ if (/(20\d{2})/.test(q))
336
+ return true;
337
+ return false;
338
+ }
339
+ async processUserMessage(message) {
340
+ // Detect rephrase commands
341
+ let isRephraseCommand = false;
342
+ let isSystemRephrase = false;
343
+ let messageToSend = message;
344
+ let messageType = "user";
345
+ let prefillText;
346
+ if (message.startsWith("/system rephrase")) {
347
+ isRephraseCommand = true;
348
+ isSystemRephrase = true;
349
+ messageToSend = message.substring(8).trim(); // Strip "/system " (8 chars including space)
350
+ messageType = "system";
351
+ // Extract prefill text after "/system rephrase "
352
+ const prefillMatch = message.match(/^\/system rephrase\s+(.+)$/);
353
+ if (prefillMatch) {
354
+ prefillText = prefillMatch[1];
355
+ }
356
+ }
357
+ else if (message.startsWith("/rephrase")) {
358
+ isRephraseCommand = true;
359
+ messageToSend = message; // Keep full text including "/rephrase"
360
+ messageType = "user";
361
+ // Extract prefill text after "/rephrase "
362
+ const prefillMatch = message.match(/^\/rephrase\s+(.+)$/);
363
+ if (prefillMatch) {
364
+ prefillText = prefillMatch[1];
365
+ }
366
+ }
367
+ // If this is a rephrase command, find the last assistant message
368
+ if (isRephraseCommand) {
369
+ // Find index of last assistant message in chatHistory
370
+ let lastAssistantIndex = -1;
371
+ for (let i = this.chatHistory.length - 1; i >= 0; i--) {
372
+ if (this.chatHistory[i].type === "assistant") {
373
+ lastAssistantIndex = i;
374
+ break;
375
+ }
376
+ }
377
+ if (lastAssistantIndex === -1) {
378
+ throw new Error("No previous assistant message to rephrase");
379
+ }
380
+ // Store rephrase state (will be updated with newResponseIndex after response)
381
+ // For now, just mark that we're in rephrase mode
382
+ this.setRephraseState(lastAssistantIndex, this.chatHistory.length, -1, messageType, prefillText);
383
+ }
384
+ // Before adding the new user message, check if there are incomplete tool calls
385
+ // from a previous interrupted turn. This prevents malformed message sequences
386
+ // that cause Ollama 500 errors.
387
+ const lastMessage = this.messages[this.messages.length - 1];
388
+ if (lastMessage?.role === "assistant" && lastMessage.tool_calls) {
389
+ // Find tool_call_ids that don't have corresponding tool result messages
390
+ const toolCallIds = new Set(lastMessage.tool_calls.map((tc) => tc.id));
391
+ const completedToolCallIds = new Set();
392
+ // Check which tool calls have results
393
+ for (let i = this.messages.length - 1; i >= 0; i--) {
394
+ const msg = this.messages[i];
395
+ if (msg.role === "tool" && msg.tool_call_id) {
396
+ completedToolCallIds.add(msg.tool_call_id);
397
+ }
398
+ // Stop when we hit the assistant message with tool_calls
399
+ if (this.messages[i] === lastMessage)
400
+ break;
401
+ }
402
+ // Add cancelled results for any incomplete tool calls
403
+ for (const toolCallId of toolCallIds) {
404
+ if (!completedToolCallIds.has(toolCallId)) {
405
+ console.error(`Adding cancelled result for incomplete tool call: ${toolCallId}`);
406
+ this.messages.push({
407
+ role: "tool",
408
+ content: "[Cancelled by user]",
409
+ tool_call_id: toolCallId,
410
+ });
411
+ }
412
+ }
413
+ }
414
+ // Clear one-shot variables
415
+ Variable.clearOneShot();
416
+ // Execute instance hook once per session (after first clearOneShot)
417
+ if (!this.hasRunInstanceHook) {
418
+ this.hasRunInstanceHook = true;
419
+ const settings = getSettingsManager();
420
+ const instanceHookPath = settings.getInstanceHook();
421
+ if (instanceHookPath) {
422
+ const hookResult = await executeOperationHook(instanceHookPath, "instance", {}, 30000, false, // Instance hook is not mandatory
423
+ this.getCurrentTokenCount(), this.getMaxContextSize());
424
+ if (hookResult.approved && hookResult.commands && hookResult.commands.length > 0) {
425
+ // Apply hook commands (ENV, TOOL_RESULT, MODEL, SYSTEM, SET*)
426
+ const results = applyHookCommands(hookResult.commands);
427
+ // Apply prompt variables from SET* commands
428
+ for (const [varName, value] of results.promptVars.entries()) {
429
+ Variable.set(varName, value);
430
+ }
431
+ // Process other hook commands (MODEL, BACKEND, ENV)
432
+ await this.processHookCommands(results);
433
+ // Add SYSTEM message to messages array if present
434
+ if (results.system) {
435
+ this.messages.push({
436
+ role: 'system',
437
+ content: results.system
438
+ });
439
+ }
440
+ // Store prefill text from hook if present
441
+ if (results.prefill) {
442
+ this.hookPrefillText = results.prefill;
443
+ }
444
+ }
445
+ }
446
+ }
447
+ // Parse images once if present (for both text extraction and later assembly)
448
+ const parsed = hasImageReferences(messageToSend)
449
+ ? parseImagesFromMessage(messageToSend)
450
+ : { text: messageToSend, images: [] };
451
+ // Set USER:PROMPT variable (text only, images stripped)
452
+ Variable.set("USER:PROMPT", parsed.text);
453
+ // Execute prePrompt hook if configured
454
+ const hookPath = getSettingsManager().getPrePromptHook();
455
+ if (hookPath) {
456
+ const hookResult = await executeOperationHook(hookPath, "prePrompt", { USER_MESSAGE: parsed.text }, 30000, false, // prePrompt hook is never mandatory
457
+ this.getCurrentTokenCount(), this.getMaxContextSize());
458
+ if (hookResult.approved && hookResult.commands) {
459
+ const results = applyHookCommands(hookResult.commands);
460
+ // Set prompt variables from hook output (SET, SET_FILE, SET_TEMP_FILE)
461
+ for (const [varName, value] of results.promptVars.entries()) {
462
+ Variable.set(varName, value);
463
+ }
464
+ // Process other hook commands (MODEL, BACKEND, SYSTEM, etc.)
465
+ await this.processHookCommands(results);
466
+ // Store prefill text from hook if present
467
+ if (results.prefill) {
468
+ this.hookPrefillText = results.prefill;
469
+ }
470
+ }
471
+ }
472
+ // Assemble final message from variables
473
+ const assembledMessage = Variable.renderFull("USER");
474
+ // Add user/system message to conversation
475
+ // Note: System messages can only have string content, so images are only supported for user messages
476
+ const supportsVision = this.llmClient.getSupportsVision();
477
+ let messageContent = assembledMessage;
478
+ if (messageType === "user" && parsed.images.length > 0 && supportsVision) {
479
+ // Construct content array with assembled text and images
480
+ messageContent = [
481
+ { type: "text", text: assembledMessage },
482
+ ...parsed.images
483
+ ];
484
+ }
485
+ const userEntry = {
486
+ type: messageType,
487
+ content: messageContent,
488
+ originalContent: messageType === "user" ? (parsed.images.length > 0 && supportsVision
489
+ ? [{ type: "text", text: parsed.text }, ...parsed.images]
490
+ : parsed.text) : undefined,
491
+ timestamp: new Date(),
492
+ };
493
+ this.chatHistory.push(userEntry);
494
+ // Push to messages array with proper typing based on role
495
+ if (messageType === "user") {
496
+ this.messages.push({ role: "user", content: messageContent });
497
+ }
498
+ else {
499
+ // System messages must have string content only
500
+ this.messages.push({ role: "system", content: typeof messageContent === "string" ? messageContent : messageToSend });
501
+ }
502
+ await this.emitContextChange();
503
+ const newEntries = [userEntry];
504
+ const maxToolRounds = this.maxToolRounds; // Prevent infinite loops
505
+ let toolRounds = 0;
506
+ let consecutiveNonToolResponses = 0;
507
+ try {
508
+ // If this is a rephrase with prefill text, add the assistant message now
509
+ if (this.rephraseState?.prefillText) {
510
+ this.messages.push({
511
+ role: "assistant",
512
+ content: this.rephraseState.prefillText
513
+ });
514
+ }
515
+ // If a hook returned prefill text, add the assistant message now
516
+ if (this.hookPrefillText) {
517
+ this.messages.push({
518
+ role: "assistant",
519
+ content: this.hookPrefillText
520
+ });
521
+ }
522
+ // Always fetch tools fresh - getAllLLMTools() handles lazy refresh internally
523
+ const supportsTools = this.llmClient.getSupportsTools();
524
+ let currentResponse = await this.llmClient.chat(this.messages, supportsTools ? await getAllLLMTools() : [], undefined, this.isGrokModel() && this.shouldUseSearchFor(message)
525
+ ? { search_parameters: { mode: "auto" } }
526
+ : { search_parameters: { mode: "off" } }, this.temperature, this.abortController?.signal, this.maxTokens);
527
+ // Parse XML tool calls from response if present
528
+ if (currentResponse.choices?.[0]?.message) {
529
+ currentResponse.choices[0].message = this.parseXMLToolCalls(currentResponse.choices[0].message);
530
+ }
531
+ // Agent loop - continue until no more tool calls or max rounds reached
532
+ while (toolRounds < maxToolRounds) {
533
+ const assistantMessage = currentResponse.choices?.[0]?.message;
534
+ if (!assistantMessage) {
535
+ throw new Error("No response from LLM");
536
+ }
537
+ // Handle tool calls
538
+ if (assistantMessage.tool_calls &&
539
+ assistantMessage.tool_calls.length > 0) {
540
+ toolRounds++;
541
+ consecutiveNonToolResponses = 0; // Reset counter when AI makes tool calls
542
+ // Clean up tool call arguments before adding to conversation history
543
+ // This prevents Ollama from rejecting malformed tool calls on subsequent API calls
544
+ const cleanedToolCalls = assistantMessage.tool_calls.map(toolCall => {
545
+ let argsString = sanitizeToolArguments(toolCall.function.arguments);
546
+ return {
547
+ ...toolCall,
548
+ function: {
549
+ ...toolCall.function,
550
+ arguments: argsString
551
+ }
552
+ };
553
+ });
554
+ // Add assistant message to conversation
555
+ this.messages.push({
556
+ role: "assistant",
557
+ content: assistantMessage.content || "(Calling tools to perform this request)",
558
+ tool_calls: cleanedToolCalls,
559
+ });
560
+ // Add assistant message to chat history
561
+ const assistantToolCallEntry = {
562
+ type: "assistant",
563
+ content: assistantMessage.content || "(Calling tools to perform this request)",
564
+ timestamp: new Date(),
565
+ tool_calls: assistantMessage.tool_calls,
566
+ };
567
+ this.chatHistory.push(assistantToolCallEntry);
568
+ newEntries.push(assistantToolCallEntry);
569
+ await this.emitContextChange();
570
+ // Create initial tool call entries to show tools are being executed
571
+ // Use cleanedToolCalls to preserve arguments in chatHistory
572
+ cleanedToolCalls.forEach((toolCall) => {
573
+ const toolCallEntry = {
574
+ type: "tool_call",
575
+ content: "Executing...",
576
+ timestamp: new Date(),
577
+ toolCall: toolCall,
578
+ };
579
+ this.chatHistory.push(toolCallEntry);
580
+ newEntries.push(toolCallEntry);
581
+ });
582
+ // Execute tool calls and update the entries
583
+ let toolIndex = 0;
584
+ const completedToolCallIds = new Set();
585
+ try {
586
+ for (const toolCall of cleanedToolCalls) {
587
+ // Check for cancellation before executing each tool
588
+ if (this.abortController?.signal.aborted) {
589
+ console.error(`Tool execution cancelled after ${toolIndex}/${cleanedToolCalls.length} tools`);
590
+ // Add cancelled responses for remaining uncompleted tools
591
+ for (let i = toolIndex; i < cleanedToolCalls.length; i++) {
592
+ const remainingToolCall = cleanedToolCalls[i];
593
+ this.messages.push({
594
+ role: "tool",
595
+ content: "[Cancelled by user]",
596
+ tool_call_id: remainingToolCall.id,
597
+ });
598
+ completedToolCallIds.add(remainingToolCall.id);
599
+ }
600
+ throw new Error("Operation cancelled by user");
601
+ }
602
+ const result = await this.executeTool(toolCall);
603
+ // Update the existing tool_call entry with the result
604
+ const entryIndex = this.chatHistory.findIndex((entry) => entry.type === "tool_call" && entry.toolCall?.id === toolCall.id);
605
+ if (entryIndex !== -1) {
606
+ const updatedEntry = {
607
+ ...this.chatHistory[entryIndex],
608
+ type: "tool_result",
609
+ content: result.success
610
+ ? result.output || "Success"
611
+ : result.error || "Error occurred",
612
+ toolResult: result,
613
+ };
614
+ this.chatHistory[entryIndex] = updatedEntry;
615
+ // Also update in newEntries for return value
616
+ const newEntryIndex = newEntries.findIndex((entry) => entry.type === "tool_call" &&
617
+ entry.toolCall?.id === toolCall.id);
618
+ if (newEntryIndex !== -1) {
619
+ newEntries[newEntryIndex] = updatedEntry;
620
+ }
621
+ }
622
+ // Add tool result to messages with proper format (needed for AI context)
623
+ this.messages.push({
624
+ role: "tool",
625
+ content: result.success
626
+ ? result.output || "Success"
627
+ : result.error || "Error",
628
+ tool_call_id: toolCall.id,
629
+ });
630
+ completedToolCallIds.add(toolCall.id);
631
+ await this.emitContextChange();
632
+ toolIndex++;
633
+ }
634
+ }
635
+ finally {
636
+ // Ensure ALL tool calls in this.messages have results, even if we crashed/errored
637
+ for (const toolCall of cleanedToolCalls) {
638
+ if (!completedToolCallIds.has(toolCall.id)) {
639
+ this.messages.push({
640
+ role: "tool",
641
+ content: "[Error: Tool execution interrupted]",
642
+ tool_call_id: toolCall.id,
643
+ });
644
+ }
645
+ }
646
+ }
647
+ // After all tool results are added, add any system messages from this tool round
648
+ // System messages are added to chatHistory during tool execution (for display)
649
+ // Now we add them to this.messages in the same order (after all tool results)
650
+ // Find the most recent assistant message with tool_calls in chatHistory (search backwards)
651
+ let assistantIndex = -1;
652
+ for (let i = this.chatHistory.length - 1; i >= 0; i--) {
653
+ const entry = this.chatHistory[i];
654
+ if (entry.type === "assistant" && entry.tool_calls && entry.tool_calls.length > 0) {
655
+ assistantIndex = i;
656
+ break;
657
+ }
658
+ }
659
+ if (assistantIndex !== -1) {
660
+ // Collect system messages that appeared after this assistant message
661
+ for (let i = assistantIndex + 1; i < this.chatHistory.length; i++) {
662
+ const entry = this.chatHistory[i];
663
+ const content = getTextContent(entry.content);
664
+ if (entry.type === 'system' && content && content.trim()) {
665
+ this.messages.push({
666
+ role: 'system',
667
+ content: content
668
+ });
669
+ }
670
+ // Stop if we hit another assistant or user message (next turn)
671
+ if (entry.type === 'assistant' || entry.type === 'user') {
672
+ break;
673
+ }
674
+ }
675
+ }
676
+ // Get next response - this might contain more tool calls
677
+ // Debug logging to diagnose tool_call/tool_result mismatch
678
+ const debugLogPath = ChatHistoryManager.getDebugLogPath();
679
+ const timestamp = new Date().toISOString();
680
+ fs.appendFileSync(debugLogPath, `\n${timestamp} - [DEBUG] Messages before API call (${this.messages.length} messages):\n`);
681
+ this.messages.forEach((msg, idx) => {
682
+ const msgSummary = { idx, role: msg.role };
683
+ if (msg.tool_calls)
684
+ msgSummary.tool_calls = msg.tool_calls.map((tc) => tc.id);
685
+ if (msg.tool_call_id)
686
+ msgSummary.tool_call_id = msg.tool_call_id;
687
+ fs.appendFileSync(debugLogPath, ` ${JSON.stringify(msgSummary)}\n`);
688
+ });
689
+ currentResponse = await this.llmClient.chat(this.messages, supportsTools ? await getAllLLMTools() : [], undefined, this.isGrokModel() && this.shouldUseSearchFor(message)
690
+ ? { search_parameters: { mode: "auto" } }
691
+ : { search_parameters: { mode: "off" } }, this.temperature, this.abortController?.signal, this.maxTokens);
692
+ }
693
+ else {
694
+ // No tool calls in this response - only add it if there's actual content
695
+ let trimmedContent = assistantMessage.content?.trim();
696
+ // If this was a rephrase with prefill, prepend the prefill text to the response
697
+ if (trimmedContent && this.rephraseState?.prefillText) {
698
+ trimmedContent = this.rephraseState.prefillText + trimmedContent;
699
+ }
700
+ // If a hook provided prefill, prepend it to the response
701
+ if (trimmedContent && this.hookPrefillText) {
702
+ trimmedContent = this.hookPrefillText + trimmedContent;
703
+ this.hookPrefillText = null; // Clear after use
704
+ }
705
+ if (trimmedContent) {
706
+ const responseEntry = {
707
+ type: "assistant",
708
+ content: trimmedContent,
709
+ timestamp: new Date(),
710
+ };
711
+ this.chatHistory.push(responseEntry);
712
+ this.messages.push({
713
+ role: "assistant",
714
+ content: trimmedContent,
715
+ });
716
+ newEntries.push(responseEntry);
717
+ // Update rephrase state with the new response index
718
+ if (this.rephraseState && this.rephraseState.newResponseIndex === -1) {
719
+ const newResponseIndex = this.chatHistory.length - 1;
720
+ this.setRephraseState(this.rephraseState.originalAssistantMessageIndex, this.rephraseState.rephraseRequestIndex, newResponseIndex, this.rephraseState.messageType, this.rephraseState.prefillText);
721
+ }
722
+ }
723
+ // TODO: HACK - This is a temporary fix to prevent duplicate responses.
724
+ // We need a proper way for the bot to signal task completion, such as:
725
+ // - A special tool call like "taskComplete()"
726
+ // - A finish_reason indicator in the API response
727
+ // - A structured response format that explicitly marks completion
728
+ // For now, we break immediately after a substantial response to avoid
729
+ // the cascade of duplicate responses caused by "give it one more chance" logic.
730
+ // If the AI provided a substantial response (>SUBSTANTIAL_RESPONSE_THRESHOLD chars), task is complete
731
+ if (assistantMessage.content && assistantMessage.content.trim().length > SUBSTANTIAL_RESPONSE_THRESHOLD) {
732
+ break; // Task complete - bot gave a full response
733
+ }
734
+ // Short/empty response, give AI another chance
735
+ currentResponse = await this.llmClient.chat(this.messages, supportsTools ? await getAllLLMTools() : [], undefined, this.isGrokModel() && this.shouldUseSearchFor(message)
736
+ ? { search_parameters: { mode: "auto" } }
737
+ : { search_parameters: { mode: "off" } }, this.temperature, this.abortController?.signal, this.maxTokens);
738
+ // Parse XML tool calls from followup response if present
739
+ if (currentResponse.choices?.[0]?.message) {
740
+ currentResponse.choices[0].message = this.parseXMLToolCalls(currentResponse.choices[0].message);
741
+ }
742
+ const followupMessage = currentResponse.choices?.[0]?.message;
743
+ if (!followupMessage?.tool_calls || followupMessage.tool_calls.length === 0) {
744
+ break; // AI doesn't want to continue
745
+ }
746
+ }
747
+ }
748
+ if (toolRounds >= maxToolRounds) {
749
+ const warningEntry = {
750
+ type: "assistant",
751
+ content: "Maximum tool execution rounds reached. Stopping to prevent infinite loops.",
752
+ timestamp: new Date(),
753
+ };
754
+ this.chatHistory.push(warningEntry);
755
+ newEntries.push(warningEntry);
756
+ }
757
+ // Mark first message as processed so subsequent messages use cached tools
758
+ this.firstMessageProcessed = true;
759
+ // Check if tool support changed during first message processing
760
+ // If model doesn't support tools, regenerate system message without tool list
761
+ const supportsToolsAfter = this.llmClient.getSupportsTools();
762
+ if (!supportsToolsAfter && supportsTools) {
763
+ // Tool support was disabled during first message - regenerate system message
764
+ await this.buildSystemMessage();
765
+ }
766
+ return newEntries;
767
+ }
768
+ catch (error) {
769
+ // Check if context is too large (413 error when vision already disabled)
770
+ if (error.message && error.message.startsWith('CONTEXT_TOO_LARGE:')) {
771
+ const beforeCount = this.chatHistory.length;
772
+ this.compactContext(20);
773
+ const afterCount = this.chatHistory.length;
774
+ const removedCount = beforeCount - afterCount;
775
+ const compactEntry = {
776
+ type: "system",
777
+ content: `Context was too large for backend. Automatically compacted: removed ${removedCount} older messages, keeping last 20 messages. Please retry your request.`,
778
+ timestamp: new Date(),
779
+ };
780
+ this.chatHistory.push(compactEntry);
781
+ // Mark first message as processed
782
+ this.firstMessageProcessed = true;
783
+ return [userEntry, compactEntry];
784
+ }
785
+ const errorEntry = {
786
+ type: "assistant",
787
+ content: `Sorry, I encountered an error: ${error.message}`,
788
+ timestamp: new Date(),
789
+ };
790
+ this.chatHistory.push(errorEntry);
791
+ // Mark first message as processed even on error
792
+ this.firstMessageProcessed = true;
793
+ return [userEntry, errorEntry];
794
+ }
795
+ }
796
+ /**
797
+ * Parse XML-formatted tool calls from message content (x.ai format)
798
+ * Converts <xai:function_call> elements to standard LLMToolCall format
799
+ */
800
+ parseXMLToolCalls(message) {
801
+ if (!message.content || typeof message.content !== 'string') {
802
+ return message;
803
+ }
804
+ const content = message.content;
805
+ const xmlToolCallRegex = /<xai:function_call\s+name="([^"]+)">([\s\S]*?)<\/xai:function_call>/g;
806
+ const matches = Array.from(content.matchAll(xmlToolCallRegex));
807
+ if (matches.length === 0) {
808
+ return message;
809
+ }
810
+ // Parse each XML tool call
811
+ const toolCalls = [];
812
+ let cleanedContent = content;
813
+ for (const match of matches) {
814
+ const functionName = match[1];
815
+ const paramsXML = match[2];
816
+ // Parse parameters
817
+ const paramRegex = /<parameter\s+name="([^"]+)">([^<]*)<\/parameter>/g;
818
+ const paramMatches = Array.from(paramsXML.matchAll(paramRegex));
819
+ const args = {};
820
+ for (const paramMatch of paramMatches) {
821
+ args[paramMatch[1]] = paramMatch[2];
822
+ }
823
+ // Generate a unique ID for this tool call
824
+ const toolCallId = `call_xml_${Date.now()}_${Math.random().toString(36).substring(7)}`;
825
+ toolCalls.push({
826
+ id: toolCallId,
827
+ type: "function",
828
+ function: {
829
+ name: functionName,
830
+ arguments: JSON.stringify(args)
831
+ }
832
+ });
833
+ // Remove this XML block from content
834
+ cleanedContent = cleanedContent.replace(match[0], '');
835
+ }
836
+ // Trim any extra whitespace
837
+ cleanedContent = cleanedContent.trim();
838
+ // Return modified message with tool_calls and cleaned content
839
+ return {
840
+ ...message,
841
+ content: cleanedContent || null,
842
+ tool_calls: [...(message.tool_calls || []), ...toolCalls]
843
+ };
844
+ }
845
+ messageReducer(previous, item) {
846
+ const reduce = (acc, delta) => {
847
+ // Ensure acc is always an object before spreading (handles null/undefined)
848
+ acc = { ...(acc || {}) };
849
+ for (const [key, value] of Object.entries(delta)) {
850
+ // Skip null values in delta (Venice sends tool_calls: null which breaks Object.entries)
851
+ if (value === null)
852
+ continue;
853
+ if (acc[key] === undefined || acc[key] === null) {
854
+ acc[key] = value;
855
+ // Clean up index properties from tool calls
856
+ if (Array.isArray(acc[key])) {
857
+ for (const arr of acc[key]) {
858
+ delete arr.index;
859
+ }
860
+ }
861
+ }
862
+ else if (typeof acc[key] === "string" && typeof value === "string") {
863
+ // Don't concatenate certain properties that should remain separate
864
+ const nonConcatenableProps = ['id', 'type', 'name'];
865
+ if (nonConcatenableProps.includes(key)) {
866
+ // For non-concatenable properties, keep the new value
867
+ acc[key] = value;
868
+ }
869
+ else {
870
+ // For content, arguments, and other text properties, concatenate
871
+ acc[key] += value;
872
+ }
873
+ }
874
+ else if (Array.isArray(acc[key]) && Array.isArray(value)) {
875
+ const accArray = acc[key];
876
+ for (let i = 0; i < value.length; i++) {
877
+ if (!accArray[i])
878
+ accArray[i] = {};
879
+ accArray[i] = reduce(accArray[i], value[i]);
880
+ }
881
+ }
882
+ else if (typeof acc[key] === "object" && typeof value === "object") {
883
+ acc[key] = reduce(acc[key], value);
884
+ }
885
+ }
886
+ return acc;
887
+ };
888
+ return reduce(previous, item.choices?.[0]?.delta || {});
889
+ }
890
/**
 * Streaming variant of the agent loop. Processes one user message as an async
 * generator, yielding events the UI renders incrementally:
 *   - "user_message": the recorded user/system chat entry
 *   - "content": a chunk of assistant text (also used for cancel/error notices)
 *   - "tool_calls" / "tool_result": tool execution progress
 *   - "token_count": running token-usage updates
 *   - "done": terminal event (emitted on success, cancellation, and error paths)
 *
 * Also handles: "/rephrase" and "/system rephrase" commands (with optional
 * prefill text), prefill supplied by hooks, image attachments when the model
 * supports vision, repair of incomplete tool calls left by an interrupted
 * previous turn, <think>…</think> tag filtering across chunk boundaries,
 * cancellation via this.abortController, and CONTEXT_TOO_LARGE recovery.
 *
 * @param {string} message - Raw user input (may begin with a rephrase command).
 * @yields {Object} Stream event objects as described above.
 * @throws {Error} "No previous assistant message to rephrase" when a rephrase
 *   command is issued with no assistant message in history.
 */
async *processUserMessageStream(message) {
    // Create new abort controller for this request
    this.abortController = new AbortController();
    // Detect rephrase commands
    let isRephraseCommand = false;
    let isSystemRephrase = false;
    let messageToSend = message;
    let messageType = "user";
    let prefillText;
    if (message.startsWith("/system rephrase")) {
        isRephraseCommand = true;
        // NOTE(review): isSystemRephrase is set here but never read later in this
        // method — kept for parity with the non-streaming path; confirm intent.
        isSystemRephrase = true;
        messageToSend = message.substring(8).trim(); // Strip "/system " (8 chars including space)
        messageType = "system";
        // Extract prefill text after "/system rephrase "
        const prefillMatch = message.match(/^\/system rephrase\s+(.+)$/);
        if (prefillMatch) {
            prefillText = prefillMatch[1];
        }
    }
    else if (message.startsWith("/rephrase")) {
        isRephraseCommand = true;
        messageToSend = message; // Keep full text including "/rephrase"
        messageType = "user";
        // Extract prefill text after "/rephrase "
        const prefillMatch = message.match(/^\/rephrase\s+(.+)$/);
        if (prefillMatch) {
            prefillText = prefillMatch[1];
        }
    }
    // If this is a rephrase command, find the last assistant message
    if (isRephraseCommand) {
        // Find index of last assistant message in chatHistory
        let lastAssistantIndex = -1;
        for (let i = this.chatHistory.length - 1; i >= 0; i--) {
            if (this.chatHistory[i].type === "assistant") {
                lastAssistantIndex = i;
                break;
            }
        }
        if (lastAssistantIndex === -1) {
            throw new Error("No previous assistant message to rephrase");
        }
        // Store rephrase state (will be updated with newResponseIndex after response)
        // For now, just mark that we're in rephrase mode (newResponseIndex = -1)
        this.setRephraseState(lastAssistantIndex, this.chatHistory.length, -1, messageType, prefillText);
    }
    // Before adding the new user message, check if there are incomplete tool calls
    // from a previous interrupted turn. This prevents malformed message sequences
    // that cause Ollama 500 errors.
    const lastMessage = this.messages[this.messages.length - 1];
    if (lastMessage?.role === "assistant" && lastMessage.tool_calls) {
        // Find tool_call_ids that don't have corresponding tool result messages
        const toolCallIds = new Set(lastMessage.tool_calls.map((tc) => tc.id));
        const completedToolCallIds = new Set();
        // Check which tool calls have results (scan backwards to the assistant msg)
        for (let i = this.messages.length - 1; i >= 0; i--) {
            const msg = this.messages[i];
            if (msg.role === "tool" && msg.tool_call_id) {
                completedToolCallIds.add(msg.tool_call_id);
            }
            // Stop when we hit the assistant message with tool_calls
            if (this.messages[i] === lastMessage)
                break;
        }
        // Add cancelled results for any incomplete tool calls
        for (const toolCallId of toolCallIds) {
            if (!completedToolCallIds.has(toolCallId)) {
                console.error(`Adding cancelled result for incomplete tool call: ${toolCallId}`);
                this.messages.push({
                    role: "tool",
                    content: "[Cancelled by user]",
                    tool_call_id: toolCallId,
                });
            }
        }
    }
    // Clear one-shot variables
    Variable.clearOneShot();
    // Execute instance hook once per session (after first clearOneShot)
    if (!this.hasRunInstanceHook) {
        this.hasRunInstanceHook = true;
        const settings = getSettingsManager();
        const instanceHookPath = settings.getInstanceHook();
        if (instanceHookPath) {
            const hookResult = await executeOperationHook(instanceHookPath, "instance", {}, 30000, false, // Instance hook is not mandatory
            this.getCurrentTokenCount(), this.getMaxContextSize());
            if (hookResult.approved && hookResult.commands && hookResult.commands.length > 0) {
                // Apply hook commands (ENV, TOOL_RESULT, MODEL, SYSTEM, SET*)
                const results = applyHookCommands(hookResult.commands);
                // Apply prompt variables from SET* commands
                for (const [varName, value] of results.promptVars.entries()) {
                    Variable.set(varName, value);
                }
                // Process other hook commands (MODEL, BACKEND, ENV)
                await this.processHookCommands(results);
                // Add SYSTEM message to messages array if present
                if (results.system) {
                    this.messages.push({
                        role: 'system',
                        content: results.system
                    });
                }
                // Store prefill text from hook if present
                if (results.prefill) {
                    this.hookPrefillText = results.prefill;
                }
            }
        }
    }
    // Parse images once if present (for both text extraction and later assembly)
    const parsed = hasImageReferences(messageToSend)
        ? parseImagesFromMessage(messageToSend)
        : { text: messageToSend, images: [] };
    // Set USER:PROMPT variable (text only, images stripped)
    Variable.set("USER:PROMPT", parsed.text);
    // Execute prePrompt hook if configured
    const hookPath = getSettingsManager().getPrePromptHook();
    if (hookPath) {
        const hookResult = await executeOperationHook(hookPath, "prePrompt", { USER_MESSAGE: parsed.text }, 30000, false, // prePrompt hook is never mandatory
        this.getCurrentTokenCount(), this.getMaxContextSize());
        if (hookResult.approved && hookResult.commands) {
            const results = applyHookCommands(hookResult.commands);
            // Set prompt variables from hook output (SET, SET_FILE, SET_TEMP_FILE)
            for (const [varName, value] of results.promptVars.entries()) {
                Variable.set(varName, value);
            }
            // Process other hook commands (MODEL, BACKEND, SYSTEM, etc.)
            await this.processHookCommands(results);
            // Store prefill text from hook if present
            if (results.prefill) {
                this.hookPrefillText = results.prefill;
            }
        }
    }
    // Assemble final message from variables
    const assembledMessage = Variable.renderFull("USER");
    // Add user/system message to both API conversation and chat history
    // Note: System messages can only have string content, so images are only supported for user messages
    const supportsVision = this.llmClient.getSupportsVision();
    let messageContent = assembledMessage;
    if (messageType === "user" && parsed.images.length > 0 && supportsVision) {
        // Construct content array with assembled text and images
        messageContent = [
            { type: "text", text: assembledMessage },
            ...parsed.images
        ];
    }
    const userEntry = {
        type: messageType,
        // originalContent preserves the pre-assembly text (without variable
        // expansion) for user messages only.
        content: messageContent,
        originalContent: messageType === "user" ? (parsed.images.length > 0 && supportsVision
            ? [{ type: "text", text: parsed.text }, ...parsed.images]
            : parsed.text) : undefined,
        timestamp: new Date(),
    };
    this.chatHistory.push(userEntry);
    // Push to messages array with proper typing based on role
    if (messageType === "user") {
        this.messages.push({ role: "user", content: messageContent });
    }
    else {
        // System messages must have string content only
        this.messages.push({ role: "system", content: typeof messageContent === "string" ? messageContent : assembledMessage });
    }
    await this.emitContextChange();
    // Yield user message so UI can display it immediately
    yield {
        type: "user_message",
        userEntry: userEntry,
    };
    // If this is a rephrase with prefill text, add the assistant message now
    if (this.rephraseState?.prefillText) {
        this.messages.push({
            role: "assistant",
            content: this.rephraseState.prefillText
        });
    }
    // If a hook returned prefill text, add the assistant message now
    if (this.hookPrefillText) {
        this.messages.push({
            role: "assistant",
            content: this.hookPrefillText
        });
    }
    // Calculate input tokens
    let inputTokens = this.tokenCounter.countMessageTokens(this.messages);
    yield {
        type: "token_count",
        tokenCount: inputTokens,
    };
    const maxToolRounds = this.maxToolRounds; // Prevent infinite loops
    let toolRounds = 0;
    let totalOutputTokens = 0;
    let lastTokenUpdate = 0;
    // NOTE(review): declared but never read in this method — likely leftover
    // from the non-streaming loop's duplicate-response heuristic.
    let consecutiveNonToolResponses = 0;
    try {
        // Always fetch tools fresh - getAllLLMTools() handles lazy refresh internally
        const supportsTools = this.llmClient.getSupportsTools();
        // Agent loop - continue until no more tool calls or max rounds reached
        while (toolRounds < maxToolRounds) {
            // Check if operation was cancelled
            if (this.abortController?.signal.aborted) {
                yield {
                    type: "content",
                    content: "\n\n[Operation cancelled by user]",
                };
                yield { type: "done" };
                return;
            }
            // Update system message with current token count
            if (this.messages.length > 0 && this.messages[0].role === 'system' && typeof this.messages[0].content === 'string') {
                this.messages[0].content = this.messages[0].content.replace(/Current conversation token usage: .*/, `Current conversation token usage: ${inputTokens}`);
            }
            // Stream response and accumulate
            const stream = this.llmClient.chatStream(this.messages, supportsTools ? await getAllLLMTools() : [], undefined, this.isGrokModel() && this.shouldUseSearchFor(message)
                ? { search_parameters: { mode: "auto" } }
                : { search_parameters: { mode: "off" } }, this.temperature, this.abortController?.signal, this.maxTokens);
            let accumulatedMessage = {};
            let accumulatedContent = "";
            let tool_calls_yielded = false;
            let streamFinished = false;
            let insideThinkTag = false;
            // If this is a rephrase with prefill, yield the prefill text first and add to accumulated content
            if (this.rephraseState?.prefillText) {
                yield {
                    type: "content",
                    content: this.rephraseState.prefillText,
                };
                accumulatedContent = this.rephraseState.prefillText;
            }
            // If a hook provided prefill, yield it first and add to accumulated content
            if (this.hookPrefillText) {
                yield {
                    type: "content",
                    content: this.hookPrefillText,
                };
                accumulatedContent = this.hookPrefillText;
                this.hookPrefillText = null; // Clear after use
            }
            try {
                for await (const chunk of stream) {
                    // Check for cancellation in the streaming loop
                    if (this.abortController?.signal.aborted) {
                        yield {
                            type: "content",
                            content: "\n\n[Operation cancelled by user]",
                        };
                        yield { type: "done" };
                        return;
                    }
                    if (!chunk.choices?.[0])
                        continue;
                    // Check if stream is finished (Venice sends garbage after this)
                    if (chunk.choices?.[0]?.finish_reason === "stop" || chunk.choices?.[0]?.finish_reason === "tool_calls") {
                        streamFinished = true;
                    }
                    // Accumulate the message using reducer
                    accumulatedMessage = this.messageReducer(accumulatedMessage, chunk);
                    // Check for tool calls - yield when we have complete tool calls with function names
                    if (!tool_calls_yielded && accumulatedMessage.tool_calls?.length > 0) {
                        // Check if we have at least one complete tool call with a function name
                        const hasCompleteTool = accumulatedMessage.tool_calls.some((tc) => tc.function?.name);
                        if (hasCompleteTool) {
                            yield {
                                type: "tool_calls",
                                tool_calls: accumulatedMessage.tool_calls,
                            };
                            tool_calls_yielded = true;
                        }
                    }
                    // Stream content as it comes (but ignore content after stream is finished to avoid Venice garbage)
                    if (chunk.choices[0].delta?.content && !streamFinished) {
                        let deltaContent = chunk.choices[0].delta.content;
                        // Handle thinking tags that may span multiple chunks
                        // First, remove complete <think>...</think> blocks within this chunk
                        deltaContent = deltaContent.replace(/<think>[\s\S]*?<\/think>/g, '');
                        // Check for opening <think> tag
                        if (deltaContent.includes('<think>')) {
                            insideThinkTag = true;
                            // Remove everything from <think> onwards in this chunk
                            deltaContent = deltaContent.substring(0, deltaContent.indexOf('<think>'));
                        }
                        // If we're inside a think tag, remove everything up to and including </think>
                        if (insideThinkTag) {
                            if (deltaContent.includes('</think>')) {
                                // Found closing tag - remove everything up to and including it
                                const closeIndex = deltaContent.indexOf('</think>');
                                deltaContent = deltaContent.substring(closeIndex + 8); // 8 = length of '</think>'
                                insideThinkTag = false;
                            }
                            else {
                                // Still inside think block - remove entire chunk
                                deltaContent = '';
                            }
                        }
                        // Skip completely empty chunks after filtering (but keep spaces!)
                        if (deltaContent === '')
                            continue;
                        accumulatedContent += deltaContent;
                        // Update token count in real-time including accumulated content and any tool calls
                        const currentOutputTokens = this.tokenCounter.estimateStreamingTokens(accumulatedContent) +
                            (accumulatedMessage.tool_calls
                                ? this.tokenCounter.countTokens(JSON.stringify(accumulatedMessage.tool_calls))
                                : 0);
                        totalOutputTokens = currentOutputTokens;
                        yield {
                            type: "content",
                            content: deltaContent,
                        };
                        // Emit token count update (throttled to TOKEN_UPDATE_INTERVAL_MS)
                        const now = Date.now();
                        if (now - lastTokenUpdate > TOKEN_UPDATE_INTERVAL_MS) {
                            lastTokenUpdate = now;
                            yield {
                                type: "token_count",
                                tokenCount: inputTokens + totalOutputTokens,
                            };
                        }
                    }
                }
            }
            catch (streamError) {
                // Check if stream was aborted
                if (this.abortController?.signal.aborted || streamError.name === 'AbortError' || streamError.code === 'ABORT_ERR') {
                    yield {
                        type: "content",
                        content: "\n\n[Operation cancelled by user]",
                    };
                    yield { type: "done" };
                    return;
                }
                // Re-throw other errors to be caught by outer catch
                throw streamError;
            }
            // Parse XML tool calls from accumulated message if present
            accumulatedMessage = this.parseXMLToolCalls(accumulatedMessage);
            // Clean up tool call arguments before adding to conversation history
            // This prevents Ollama from rejecting malformed tool calls on subsequent API calls
            const cleanedToolCalls = accumulatedMessage.tool_calls?.map(toolCall => {
                let argsString = sanitizeToolArguments(toolCall.function.arguments);
                return {
                    ...toolCall,
                    function: {
                        ...toolCall.function,
                        arguments: argsString
                    }
                };
            });
            // Add accumulated message to conversation for API context
            this.messages.push({
                role: "assistant",
                content: accumulatedMessage.content || "(Calling tools to perform this request)",
                tool_calls: cleanedToolCalls,
            });
            // Add assistant message to chat history
            const assistantEntry = {
                type: "assistant",
                content: accumulatedMessage.content || "(Calling tools to perform this request)",
                timestamp: new Date(),
                tool_calls: accumulatedMessage.tool_calls,
            };
            this.chatHistory.push(assistantEntry);
            await this.emitContextChange();
            // Update rephrase state if this is a final response (no tool calls)
            if (this.rephraseState && this.rephraseState.newResponseIndex === -1 && (!accumulatedMessage.tool_calls || accumulatedMessage.tool_calls.length === 0)) {
                const newResponseIndex = this.chatHistory.length - 1;
                this.setRephraseState(this.rephraseState.originalAssistantMessageIndex, this.rephraseState.rephraseRequestIndex, newResponseIndex, this.rephraseState.messageType);
            }
            // Handle tool calls if present
            if (accumulatedMessage.tool_calls?.length > 0) {
                toolRounds++;
                // Only yield tool_calls if we haven't already yielded them during streaming
                if (!tool_calls_yielded) {
                    yield {
                        type: "tool_calls",
                        tool_calls: accumulatedMessage.tool_calls,
                    };
                }
                // Add tool_call entries to chatHistory so they persist through UI sync
                // Use cleanedToolCalls to preserve arguments in chatHistory
                cleanedToolCalls.forEach((toolCall) => {
                    const toolCallEntry = {
                        type: "tool_call",
                        content: "Executing...",
                        timestamp: new Date(),
                        toolCall: toolCall,
                    };
                    this.chatHistory.push(toolCallEntry);
                });
                // Execute tools sequentially, tracking completion so the finally
                // block can backfill results for any interrupted calls.
                let toolIndex = 0;
                const completedToolCallIds = new Set();
                try {
                    for (const toolCall of cleanedToolCalls) {
                        // Check for cancellation before executing each tool
                        if (this.abortController?.signal.aborted) {
                            console.error(`Tool execution cancelled after ${toolIndex}/${cleanedToolCalls.length} tools`);
                            // Add cancelled responses for remaining uncompleted tools
                            for (let i = toolIndex; i < cleanedToolCalls.length; i++) {
                                const remainingToolCall = cleanedToolCalls[i];
                                this.messages.push({
                                    role: "tool",
                                    content: "[Cancelled by user]",
                                    tool_call_id: remainingToolCall.id,
                                });
                                completedToolCallIds.add(remainingToolCall.id);
                            }
                            yield {
                                type: "content",
                                content: "\n\n[Operation cancelled by user]",
                            };
                            yield { type: "done" };
                            return;
                        }
                        // Capture chatHistory length before tool execution to detect new system messages
                        const chatHistoryLengthBefore = this.chatHistory.length;
                        const result = await this.executeTool(toolCall);
                        // Collect any new system messages added during tool execution (from hooks)
                        const newSystemMessages = [];
                        for (let i = chatHistoryLengthBefore; i < this.chatHistory.length; i++) {
                            if (this.chatHistory[i].type === "system") {
                                newSystemMessages.push(this.chatHistory[i]);
                            }
                        }
                        yield {
                            type: "tool_result",
                            toolCall,
                            toolResult: result,
                            systemMessages: newSystemMessages.length > 0 ? newSystemMessages : undefined,
                        };
                        // Update the tool_call entry in chatHistory to tool_result
                        const entryIndex = this.chatHistory.findIndex((entry) => entry.type === "tool_call" && entry.toolCall?.id === toolCall.id);
                        if (entryIndex !== -1) {
                            this.chatHistory[entryIndex] = {
                                ...this.chatHistory[entryIndex],
                                type: "tool_result",
                                content: result.success
                                    ? (result.output?.trim() || "Success")
                                    : (result.error?.trim() || "Error occurred"),
                                toolResult: result,
                            };
                        }
                        // Add tool result with proper format (needed for AI context)
                        this.messages.push({
                            role: "tool",
                            content: result.success
                                ? result.output || "Success"
                                : result.error || "Error",
                            tool_call_id: toolCall.id,
                        });
                        completedToolCallIds.add(toolCall.id);
                        toolIndex++;
                    }
                }
                finally {
                    // Ensure ALL tool calls in this.messages have results, even if we crashed/errored
                    for (const toolCall of cleanedToolCalls) {
                        if (!completedToolCallIds.has(toolCall.id)) {
                            this.messages.push({
                                role: "tool",
                                content: "[Error: Tool execution interrupted]",
                                tool_call_id: toolCall.id,
                            });
                        }
                    }
                }
                // After all tool results are added, add any system messages from this tool round
                // System messages are added to chatHistory during tool execution (for display)
                // Now we add them to this.messages in the same order (after all tool results)
                // Find the most recent assistant message with tool_calls in chatHistory (search backwards)
                let assistantIndex = -1;
                for (let i = this.chatHistory.length - 1; i >= 0; i--) {
                    const entry = this.chatHistory[i];
                    if (entry.type === "assistant" && entry.tool_calls && entry.tool_calls.length > 0) {
                        assistantIndex = i;
                        break;
                    }
                }
                if (assistantIndex !== -1) {
                    // Collect system messages that appeared after this assistant message
                    for (let i = assistantIndex + 1; i < this.chatHistory.length; i++) {
                        const entry = this.chatHistory[i];
                        const content = getTextContent(entry.content);
                        if (entry.type === 'system' && content && content.trim()) {
                            this.messages.push({
                                role: 'system',
                                content: content
                            });
                        }
                        // Stop if we hit another assistant or user message (next turn)
                        if (entry.type === 'assistant' || entry.type === 'user') {
                            break;
                        }
                    }
                }
                // Update token count after processing all tool calls to include tool results
                inputTokens = this.tokenCounter.countMessageTokens(this.messages);
                // Final token update after tools processed
                yield {
                    type: "token_count",
                    tokenCount: inputTokens + totalOutputTokens,
                };
                // Continue the loop to get the next response (which might have more tool calls)
            }
            else {
                // No tool calls, we're done
                break;
            }
        }
        if (toolRounds >= maxToolRounds) {
            yield {
                type: "content",
                content: "\n\nMaximum tool execution rounds reached. Stopping to prevent infinite loops.",
            };
        }
        // Mark first message as processed so subsequent messages use cached tools
        this.firstMessageProcessed = true;
        // Check if tool support changed during first message processing
        // If model doesn't support tools, regenerate system message without tool list
        const supportsToolsAfter = this.llmClient.getSupportsTools();
        if (!supportsToolsAfter && supportsTools) {
            // Tool support was disabled during first message - regenerate system message
            await this.buildSystemMessage();
        }
        yield { type: "done" };
    }
    catch (error) {
        // Check if this was a cancellation (check both abort signal and error name)
        if (this.abortController?.signal.aborted || error.name === 'AbortError' || error.code === 'ABORT_ERR') {
            yield {
                type: "content",
                content: "\n\n[Operation cancelled by user]",
            };
            yield { type: "done" };
            return;
        }
        // Check if context is too large (413 error when vision already disabled)
        if (error.message && error.message.startsWith('CONTEXT_TOO_LARGE:')) {
            const beforeCount = this.chatHistory.length;
            this.compactContext(20);
            const afterCount = this.chatHistory.length;
            const removedCount = beforeCount - afterCount;
            const compactEntry = {
                type: "system",
                content: `Context was too large for backend. Automatically compacted: removed ${removedCount} older messages, keeping last 20 messages. Please retry your request.`,
                timestamp: new Date(),
            };
            this.chatHistory.push(compactEntry);
            yield {
                type: "content",
                content: getTextContent(compactEntry.content),
            };
            yield { type: "done" };
            return;
        }
        const errorEntry = {
            type: "assistant",
            content: `Sorry, I encountered an error: ${error.message}`,
            timestamp: new Date(),
        };
        this.chatHistory.push(errorEntry);
        yield {
            type: "content",
            content: getTextContent(errorEntry.content),
        };
        // Mark first message as processed even on error
        this.firstMessageProcessed = true;
        yield { type: "done" };
    }
    finally {
        // Clean up abort controller
        this.abortController = null;
    }
}
1465
+ /**
1466
+ * Apply default parameter values for tools
1467
+ * This ensures the approval hook sees the same parameters that will be used during execution
1468
+ */
1469
+ applyToolParameterDefaults(toolName, params) {
1470
+ // Handle null/undefined params (can happen if API sends "null" as arguments string)
1471
+ const result = { ...(params || {}) };
1472
+ switch (toolName) {
1473
+ case "listFiles":
1474
+ // dirname defaults to current directory
1475
+ if (!result.dirname) {
1476
+ result.dirname = ".";
1477
+ }
1478
+ break;
1479
+ // Add other tools with defaults here as needed
1480
+ }
1481
+ return result;
1482
+ }
1483
+ /**
1484
+ * Validate tool arguments against the tool's schema
1485
+ * Returns null if valid, or an error message if invalid
1486
+ */
1487
+ async validateToolArguments(toolName, args) {
1488
+ try {
1489
+ // Get all tools (including MCP tools)
1490
+ const supportsTools = this.llmClient.getSupportsTools();
1491
+ const allTools = supportsTools ? await getAllLLMTools() : [];
1492
+ // Find the tool schema
1493
+ const toolSchema = allTools.find(t => t.function.name === toolName);
1494
+ if (!toolSchema) {
1495
+ return `Unknown tool: ${toolName}`;
1496
+ }
1497
+ const schema = toolSchema.function.parameters;
1498
+ const properties = schema.properties || {};
1499
+ const required = schema.required || [];
1500
+ // Check if tool accepts no parameters
1501
+ const acceptsNoParams = Object.keys(properties).length === 0;
1502
+ const hasArgs = args && typeof args === 'object' && Object.keys(args).length > 0;
1503
+ if (acceptsNoParams && hasArgs) {
1504
+ return `Tool ${toolName} accepts no parameters, but received: ${JSON.stringify(args)}`;
1505
+ }
1506
+ // Check for unknown parameters
1507
+ for (const argKey of Object.keys(args || {})) {
1508
+ if (!properties[argKey]) {
1509
+ return `Tool ${toolName} does not accept parameter '${argKey}'. Valid parameters: ${Object.keys(properties).join(', ') || 'none'}`;
1510
+ }
1511
+ }
1512
+ // Check for missing required parameters
1513
+ for (const requiredParam of required) {
1514
+ if (!(requiredParam in (args || {}))) {
1515
+ return `Tool ${toolName} missing required parameter '${requiredParam}'`;
1516
+ }
1517
+ }
1518
+ return null; // Valid
1519
+ }
1520
+ catch (error) {
1521
+ console.error(`Error validating tool arguments for ${toolName}:`, error);
1522
+ return null; // Allow execution if validation itself fails
1523
+ }
1524
+ }
1525
/**
 * Parse, sanitize, validate, approve, and dispatch a single tool call.
 *
 * Pipeline (order matters):
 *   1. repair malformed argument JSON (concatenated objects, double-encoding),
 *   2. coerce non-object arguments to {},
 *   3. apply per-tool parameter defaults,
 *   4. validate against the tool schema,
 *   5. run the configured approval hook (skipped for task tools, which have
 *      their own dedicated hook),
 *   6. dispatch to the matching tool implementation.
 *
 * @param {object} toolCall - OpenAI-style tool call ({ function: { name, arguments } })
 * @returns {Promise<object>} tool result ({ success, output?/error? }); never throws -
 *   any exception is converted into a { success: false } result
 */
async executeTool(toolCall) {
    try {
        // Parse arguments - handle empty string as empty object for parameter-less tools
        let argsString = toolCall.function.arguments?.trim() || "{}";
        // Handle duplicate/concatenated JSON objects (LLM bug)
        // Pattern: {"key":"val"}{"key":"val"}
        let hadDuplicateJson = false;
        const extractedArgsString = extractFirstJsonObject(argsString);
        if (extractedArgsString !== argsString) {
            hadDuplicateJson = true;
            argsString = extractedArgsString;
        }
        let args = JSON.parse(argsString);
        // Handle multiple layers of JSON encoding (API bug)
        // Keep parsing until we get an object, not a string
        let parseCount = 0;
        while (typeof args === 'string' && parseCount < MAX_JSON_PARSE_ATTEMPTS) {
            parseCount++;
            try {
                args = JSON.parse(args);
            }
            catch (e) {
                // If parse fails, the string isn't valid JSON - stop trying
                break;
            }
        }
        // Log if we had to fix encoding (both to the console and, so the model
        // can see it, as a system message in the conversation)
        if (parseCount > 0) {
            const bugMsg = `[BUG] Tool ${toolCall.function.name} had ${parseCount} extra layer(s) of JSON encoding`;
            console.warn(bugMsg);
            const systemMsg = `Warning: Tool arguments for ${toolCall.function.name} had ${parseCount} extra encoding layer(s) - this is an API bug`;
            this.messages.push({
                role: 'system',
                content: systemMsg
            });
            this.chatHistory.push({
                type: 'system',
                content: systemMsg,
                timestamp: new Date()
            });
        }
        // Log if we had to fix duplicate JSON
        if (hadDuplicateJson) {
            const bugMsg = `[BUG] Tool ${toolCall.function.name} had duplicate/concatenated JSON objects`;
            console.warn(bugMsg);
            const systemMsg = `Warning: Tool arguments for ${toolCall.function.name} had duplicate JSON objects (used first object only) - this is an LLM bug`;
            this.messages.push({
                role: 'system',
                content: systemMsg
            });
            this.chatHistory.push({
                type: 'system',
                content: systemMsg,
                timestamp: new Date()
            });
        }
        // Ensure args is always an object (API might send null)
        if (!args || typeof args !== 'object' || Array.isArray(args)) {
            args = {};
        }
        // Apply parameter defaults before validation and execution
        args = this.applyToolParameterDefaults(toolCall.function.name, args);
        // Validate tool arguments against schema
        const validationError = await this.validateToolArguments(toolCall.function.name, args);
        if (validationError) {
            // Validation failed - return error
            const errorMsg = `Tool call validation failed: ${validationError}. Please try again with correct parameters.`;
            console.warn(`[VALIDATION ERROR] ${errorMsg}`);
            return {
                success: false,
                error: validationError
            };
        }
        // Task tools (startActiveTask, transitionActiveTaskStatus, stopActiveTask) have their own
        // dedicated task approval hook, so skip the general tool approval hook for them
        const isTaskTool = ['startActiveTask', 'transitionActiveTaskStatus', 'stopActiveTask'].includes(toolCall.function.name);
        // Check tool approval hook if configured (skip for task tools)
        const settings = getSettingsManager();
        const toolApprovalHook = settings.getToolApprovalHook();
        if (toolApprovalHook && !isTaskTool) {
            const approvalResult = await executeToolApprovalHook(toolApprovalHook, toolCall.function.name, args, 30000, // 30 second timeout
            this.getCurrentTokenCount(), this.getMaxContextSize());
            if (!approvalResult.approved) {
                const reason = approvalResult.reason || "Tool execution denied by approval hook";
                // Process rejection commands (MODEL, SYSTEM, BACKEND, etc.)
                await this.processHookResult(approvalResult);
                return {
                    success: false,
                    error: `Tool execution blocked: ${reason}`,
                };
            }
            if (approvalResult.timedOut) {
                // Log timeout for debugging (don't block)
                console.warn(`Tool approval hook timed out for ${toolCall.function.name} (auto-approved)`);
            }
            // Process hook commands (ENV, TOOL_RESULT, MODEL, SYSTEM, BACKEND, etc.)
            // TOOL_RESULT is for tool return values, not used by approval hook
            // ENV variables can affect tool behavior if tools read from process.env
            await this.processHookResult(approvalResult);
        }
        // Dispatch to the matching built-in tool implementation.
        switch (toolCall.function.name) {
            case "viewFile":
                {
                    let range;
                    // Only pass a range when both bounds are provided.
                    range = args.start_line && args.end_line
                        ? [args.start_line, args.end_line]
                        : undefined;
                    return await this.textEditor.viewFile(args.filename, range);
                }
            case "createNewFile":
                return await this.textEditor.createNewFile(args.filename, args.content);
            case "strReplace":
                return await this.textEditor.strReplace(args.filename, args.old_str, args.new_str, args.replace_all);
            case "editFile":
                // editFile requires the optional Morph Fast Apply backend.
                if (!this.morphEditor) {
                    return {
                        success: false,
                        error: "Morph Fast Apply not available. Please set MORPH_API_KEY environment variable to use this feature.",
                    };
                }
                return await this.morphEditor.editFile(args.filename, args.instructions, args.code_edit);
            case "execute":
                return await this.zsh.execute(args.command);
            case "listFiles":
                return await this.zsh.listFiles(args.dirname);
            case "universalSearch":
                return await this.search.universalSearch(args.query, {
                    searchType: args.search_type,
                    includePattern: args.include_pattern,
                    excludePattern: args.exclude_pattern,
                    caseSensitive: args.case_sensitive,
                    wholeWord: args.whole_word,
                    regex: args.regex,
                    maxResults: args.max_results,
                    fileTypes: args.file_types,
                    includeHidden: args.include_hidden,
                });
            case "getEnv":
                return await this.env.getEnv(args.variable);
            case "getAllEnv":
                return await this.env.getAllEnv();
            case "searchEnv":
                return await this.env.searchEnv(args.pattern);
            case "introspect":
                return await this.introspect.introspect(args.target);
            case "clearCache":
                return await this.clearCacheTool.clearCache(args.confirmationCode);
            case "restart":
                return await this.restartTool.restart();
            case "setPersona":
                return await this.characterTool.setPersona(args.persona, args.color);
            case "setMood":
                return await this.characterTool.setMood(args.mood, args.color);
            case "getPersona":
                return await this.characterTool.getPersona();
            case "getMood":
                return await this.characterTool.getMood();
            case "getAvailablePersonas":
                return await this.characterTool.getAvailablePersonas();
            case "startActiveTask":
                return await this.taskTool.startActiveTask(args.activeTask, args.action, args.color);
            case "transitionActiveTaskStatus":
                return await this.taskTool.transitionActiveTaskStatus(args.action, args.color);
            case "stopActiveTask":
                return await this.taskTool.stopActiveTask(args.reason, args.documentationFile, args.color);
            case "insertLines":
                return await this.textEditor.insertLines(args.filename, args.insert_line, args.new_str);
            case "replaceLines":
                return await this.textEditor.replaceLines(args.filename, args.start_line, args.end_line, args.new_str);
            case "undoEdit":
                return await this.textEditor.undoEdit();
            case "chdir":
                return this.zsh.chdir(args.dirname);
            case "pwdir":
                return this.zsh.pwdir();
            case "downloadFile":
                return await this.internetTool.downloadFile(args.url);
            case "generateImage":
                return await this.imageTool.generateImage(args.prompt, args.negativePrompt, args.width, args.height, args.model, args.sampler, args.configScale, args.numSteps, args.nsfw, args.name, args.move, args.seed);
            case "captionImage":
                return await this.imageTool.captionImage(args.filename, args.backend);
            case "pngInfo":
                return await this.imageTool.pngInfo(args.filename);
            case "listImageModels":
                return await this.imageTool.listImageModels();
            case "readXlsx":
                return await this.fileConversionTool.readXlsx(args.filename, args.sheetName, args.outputFormat, args.output);
            case "listXlsxSheets":
                return await this.fileConversionTool.listXlsxSheets(args.filename);
            default:
                // Check if this is an MCP tool (names are prefixed mcp__<server>__<tool>)
                if (toolCall.function.name.startsWith("mcp__")) {
                    return await this.executeMCPTool(toolCall.function.name, args);
                }
                return {
                    success: false,
                    error: `Unknown tool: ${toolCall.function.name}`,
                };
        }
    }
    catch (error) {
        // Convert any exception (including JSON.parse failures) to a tool error result.
        return {
            success: false,
            error: `Tool execution error: ${error.message}`,
        };
    }
}
1732
+ async executeMCPTool(toolName, args) {
1733
+ try {
1734
+ const mcpManager = getMCPManager();
1735
+ const result = await mcpManager.callTool(toolName, args);
1736
+ if (result.isError) {
1737
+ return {
1738
+ success: false,
1739
+ error: result.content[0]?.text || "MCP tool error",
1740
+ };
1741
+ }
1742
+ // Extract content from result
1743
+ const output = result.content
1744
+ .map((item) => {
1745
+ if (item.type === "text") {
1746
+ return item.text;
1747
+ }
1748
+ else if (item.type === "resource") {
1749
+ return `Resource: ${item.resource?.uri || "Unknown"}`;
1750
+ }
1751
+ return String(item);
1752
+ })
1753
+ .join("\n");
1754
+ // After successful MCP tool execution, invalidate cache for that server
1755
+ // Next call to getAllLLMTools() will lazy-refresh this server
1756
+ const serverNameMatch = toolName.match(/^mcp__(.+?)__/);
1757
+ if (serverNameMatch) {
1758
+ const serverName = serverNameMatch[1];
1759
+ mcpManager.invalidateCache(serverName);
1760
+ }
1761
+ return {
1762
+ success: true,
1763
+ output: output || "Success",
1764
+ };
1765
+ }
1766
+ catch (error) {
1767
+ return {
1768
+ success: false,
1769
+ error: `MCP tool execution error: ${error.message}`,
1770
+ };
1771
+ }
1772
+ }
1773
+ getChatHistory() {
1774
+ return [...this.chatHistory];
1775
+ }
1776
+ setChatHistory(history) {
1777
+ this.chatHistory = [...history];
1778
+ }
1779
/** Return the current system prompt string. */
getSystemPrompt() {
    return this.systemPrompt;
}
1782
+ setSystemPrompt(prompt) {
1783
+ this.systemPrompt = prompt;
1784
+ this.messages[0] = {
1785
+ role: "system",
1786
+ content: prompt,
1787
+ };
1788
+ }
1789
+ getMessages() {
1790
+ return [...this.messages];
1791
+ }
1792
/**
 * Count tokens across the current message array.
 * NOTE: walks every message on each call - not free; avoid calling in tight loops.
 */
getCurrentTokenCount() {
    return this.tokenCounter.countMessageTokens(this.messages);
}
1795
/**
 * Maximum context window size in tokens.
 * @returns {number} currently a fixed 128000-token window
 */
getMaxContextSize() {
    // TODO: Make this model-specific when different models have different context windows
    // For now, return the standard Grok context window size
    return 128000;
}
1800
+ getContextUsagePercent() {
1801
+ const current = this.getCurrentTokenCount();
1802
+ const max = this.getMaxContextSize();
1803
+ return (current / max) * 100;
1804
+ }
1805
+ /**
1806
+ * Convert context messages to markdown format for viewing
1807
+ * Format: (N) Name (role) - timestamp
1808
+ */
1809
+ async convertContextToMarkdown() {
1810
+ const lines = [];
1811
+ // Header
1812
+ const { ChatHistoryManager } = await import("../utils/chat-history-manager.js");
1813
+ const historyManager = ChatHistoryManager.getInstance();
1814
+ const contextFilePath = historyManager.getContextFilePath();
1815
+ lines.push("# Conversation Context");
1816
+ lines.push(`Context File: ${contextFilePath}`);
1817
+ lines.push(`Session: ${process.env.ZDS_AI_AGENT_SESSION || "N/A"}`);
1818
+ lines.push(`Tokens: ${this.getCurrentTokenCount()} / ${this.getMaxContextSize()} (${this.getContextUsagePercent().toFixed(1)}%)`);
1819
+ lines.push("");
1820
+ lines.push("---");
1821
+ lines.push("");
1822
+ // Get agent name from environment or default
1823
+ const agentName = process.env.ZDS_AI_AGENT_BOT_NAME || "Assistant";
1824
+ const userName = process.env.ZDS_AI_AGENT_MESSAGE_AUTHOR || "User";
1825
+ // Process messages
1826
+ this.chatHistory.forEach((entry, index) => {
1827
+ const msgNum = index + 1;
1828
+ const timestamp = entry.timestamp.toLocaleTimeString();
1829
+ if (entry.type === 'user') {
1830
+ lines.push(`(${msgNum}) ${userName} (user) - ${timestamp}`);
1831
+ lines.push(getTextContent(entry.content) || "");
1832
+ lines.push("");
1833
+ }
1834
+ else if (entry.type === 'assistant') {
1835
+ lines.push(`(${msgNum}) ${agentName} (assistant) - ${timestamp}`);
1836
+ lines.push(getTextContent(entry.content) || "");
1837
+ lines.push("");
1838
+ }
1839
+ else if (entry.type === 'system') {
1840
+ lines.push(`(${msgNum}) System (system) - ${timestamp}`);
1841
+ lines.push(getTextContent(entry.content) || "");
1842
+ lines.push("");
1843
+ }
1844
+ else if (entry.type === 'tool_call') {
1845
+ const toolCall = entry.toolCall;
1846
+ const toolName = toolCall?.function?.name || "unknown";
1847
+ const params = toolCall?.function?.arguments ? JSON.parse(toolCall.function.arguments) : {};
1848
+ lines.push(`(${msgNum}) ${agentName} (tool_call: ${toolName}) - ${timestamp}`);
1849
+ lines.push(`Parameters: ${JSON.stringify(params, null, 2)}`);
1850
+ lines.push("");
1851
+ }
1852
+ else if (entry.type === 'tool_result') {
1853
+ const toolCall = entry.toolCall;
1854
+ const toolName = toolCall?.function?.name || "unknown";
1855
+ lines.push(`(${msgNum}) System (tool_result: ${toolName}) - ${timestamp}`);
1856
+ lines.push(getTextContent(entry.content) || "");
1857
+ lines.push("");
1858
+ }
1859
+ });
1860
+ return lines.join("\n");
1861
+ }
1862
/** Current persona name (value set by setPersona). */
getPersona() {
    return this.persona;
}
1865
/** Display color associated with the current persona (defaults to "white" in setPersona). */
getPersonaColor() {
    return this.personaColor;
}
1868
/** Current mood string (value set by setMood). */
getMood() {
    return this.mood;
}
1871
/** Display color associated with the current mood (defaults to "white" in setMood). */
getMoodColor() {
    return this.moodColor;
}
1874
/** Name of the active task, or "" when no task is running (see stopActiveTask). */
getActiveTask() {
    return this.activeTask;
}
1877
/** Current status/action of the active task, "" when no task is running. */
getActiveTaskAction() {
    return this.activeTaskAction;
}
1880
/** Display color of the active task widget ("white" when no task is running). */
getActiveTaskColor() {
    return this.activeTaskColor;
}
1883
/**
 * Record an in-flight context-edit session (temp JSON plus target context file)
 * so it can be resumed or cleared later.
 */
setPendingContextEditSession(tmpJsonPath, contextFilePath) {
    this.pendingContextEditSession = { tmpJsonPath, contextFilePath };
}
1886
/** Pending context-edit session ({ tmpJsonPath, contextFilePath }) or null. */
getPendingContextEditSession() {
    return this.pendingContextEditSession;
}
1889
/** Discard any pending context-edit session. */
clearPendingContextEditSession() {
    this.pendingContextEditSession = null;
}
1892
/**
 * Record the indices and parameters of an in-progress rephrase operation
 * so the original and rewritten assistant messages can be reconciled later.
 */
setRephraseState(originalAssistantMessageIndex, rephraseRequestIndex, newResponseIndex, messageType, prefillText) {
    this.rephraseState = { originalAssistantMessageIndex, rephraseRequestIndex, newResponseIndex, messageType, prefillText };
}
1895
/** Current rephrase state object or null when no rephrase is in progress. */
getRephraseState() {
    return this.rephraseState;
}
1898
/** Discard any in-progress rephrase state. */
clearRephraseState() {
    this.rephraseState = null;
}
1901
+ async setPersona(persona, color) {
1902
+ // Execute hook if configured
1903
+ const settings = getSettingsManager();
1904
+ const hookPath = settings.getPersonaHook();
1905
+ const hookMandatory = settings.isPersonaHookMandatory();
1906
+ if (!hookPath && hookMandatory) {
1907
+ const reason = "Persona hook is mandatory but not configured";
1908
+ return {
1909
+ success: false,
1910
+ error: reason
1911
+ };
1912
+ }
1913
+ if (hookPath) {
1914
+ const hookResult = await executeOperationHook(hookPath, "setPersona", {
1915
+ persona_old: this.persona || "",
1916
+ persona_new: persona,
1917
+ persona_color: color || "white"
1918
+ }, 30000, hookMandatory, this.getCurrentTokenCount(), this.getMaxContextSize());
1919
+ if (!hookResult.approved) {
1920
+ const reason = hookResult.reason || "Hook rejected persona change";
1921
+ // Process rejection commands (MODEL, SYSTEM)
1922
+ // Even in rejection, we process commands (might have MODEL change)
1923
+ await this.processHookResult(hookResult);
1924
+ // Note: We ignore the return value here since we're already rejecting the persona
1925
+ return {
1926
+ success: false,
1927
+ error: reason
1928
+ };
1929
+ }
1930
+ if (hookResult.timedOut) {
1931
+ // Hook timed out but was auto-approved
1932
+ }
1933
+ // Process hook commands (ENV, MODEL, SYSTEM)
1934
+ const result = await this.processHookResult(hookResult, 'ZDS_AI_AGENT_PERSONA');
1935
+ if (!result.success) {
1936
+ // Model/backend test failed - don't apply persona change
1937
+ return {
1938
+ success: false,
1939
+ error: "Persona change rejected due to failed model/backend test"
1940
+ };
1941
+ }
1942
+ // Apply persona transformation if present
1943
+ if (result.transformedValue) {
1944
+ persona = result.transformedValue;
1945
+ }
1946
+ }
1947
+ const oldPersona = this.persona;
1948
+ const oldColor = this.personaColor;
1949
+ this.persona = persona;
1950
+ this.personaColor = color || "white";
1951
+ process.env.ZDS_AI_AGENT_PERSONA = persona;
1952
+ // Persona hook generates success message - no need for redundant CLI message
1953
+ this.emit('personaChange', {
1954
+ persona: this.persona,
1955
+ color: this.personaColor
1956
+ });
1957
+ return { success: true };
1958
+ }
1959
/**
 * Change the assistant mood, consulting the configured mood hook first.
 *
 * Flow mirrors setPersona: the hook may reject the change, transform the
 * mood value, or carry side commands applied via processHookResult. On
 * success the mood is stored, exported via ZDS_AI_AGENT_MOOD, recorded as a
 * system entry in chatHistory, and a 'moodChange' event is emitted.
 *
 * @param {string} mood - new mood (may be transformed by the hook)
 * @param {string} [color] - display color, defaults to "white"
 * @returns {Promise<{success: boolean, error?: string}>}
 */
async setMood(mood, color) {
    // Execute hook if configured
    const settings = getSettingsManager();
    const hookPath = settings.getMoodHook();
    const hookMandatory = settings.isMoodHookMandatory();
    if (!hookPath && hookMandatory) {
        const reason = "Mood hook is mandatory but not configured";
        return {
            success: false,
            error: reason
        };
    }
    if (hookPath) {
        const hookResult = await executeOperationHook(hookPath, "setMood", {
            mood_old: this.mood || "",
            mood_new: mood,
            mood_color: color || "white"
        }, 30000, hookMandatory, this.getCurrentTokenCount(), this.getMaxContextSize());
        if (!hookResult.approved) {
            const reason = hookResult.reason || "Hook rejected mood change";
            // Process rejection commands (MODEL, SYSTEM)
            await this.processHookResult(hookResult);
            return {
                success: false,
                error: reason
            };
        }
        if (hookResult.timedOut) {
            // Hook timed out but was auto-approved
        }
        // Process hook commands (ENV, MODEL, SYSTEM)
        const result = await this.processHookResult(hookResult, 'ZDS_AI_AGENT_MOOD');
        if (!result.success) {
            // Model/backend test failed - don't apply mood change
            return {
                success: false,
                error: "Mood change rejected due to failed model/backend test"
            };
        }
        // Apply mood transformation if present
        if (result.transformedValue) {
            mood = result.transformedValue;
        }
    }
    // Capture previous values for the human-readable record below.
    const oldMood = this.mood;
    const oldColor = this.moodColor;
    this.mood = mood;
    this.moodColor = color || "white";
    process.env.ZDS_AI_AGENT_MOOD = mood;
    // Add system message for recordkeeping; non-"white" colors are shown in parentheses.
    let systemContent;
    if (oldMood) {
        const oldColorStr = oldColor && oldColor !== "white" ? ` (${oldColor})` : "";
        const newColorStr = this.moodColor && this.moodColor !== "white" ? ` (${this.moodColor})` : "";
        systemContent = `Assistant changed the mood from "${oldMood}"${oldColorStr} to "${this.mood}"${newColorStr}`;
    }
    else {
        const colorStr = this.moodColor && this.moodColor !== "white" ? ` (${this.moodColor})` : "";
        systemContent = `Assistant set the mood to "${this.mood}"${colorStr}`;
    }
    // Note: Don't add to this.messages during tool execution - only chatHistory
    // System messages added during tool execution create invalid message sequences
    // because they get inserted between tool_calls and tool_results
    this.chatHistory.push({
        type: 'system',
        content: systemContent,
        timestamp: new Date()
    });
    this.emit('moodChange', {
        mood: this.mood,
        color: this.moodColor
    });
    return { success: true };
}
2033
/**
 * Start a new active task; only one task may run at a time.
 *
 * The (non-mandatory) task approval hook may reject the start; its side
 * commands are applied via processHookResult for both approval and rejection.
 * On success the task fields are set, a system message is pushed onto
 * this.messages, and an 'activeTaskChange' event is emitted.
 *
 * @param {string} activeTask - task name
 * @param {string} action - initial task status/action
 * @param {string} [color] - widget color, defaults to "white"
 * @returns {Promise<{success: boolean, error?: string}>}
 */
async startActiveTask(activeTask, action, color) {
    // Cannot start new task if one already exists
    if (this.activeTask) {
        return {
            success: false,
            error: `Cannot start new task "${activeTask}". Active task "${this.activeTask}" must be stopped first.`
        };
    }
    // Execute hook if configured
    const settings = getSettingsManager();
    const hookPath = settings.getTaskApprovalHook();
    if (hookPath) {
        const hookResult = await executeOperationHook(hookPath, "startActiveTask", {
            activetask: activeTask,
            action: action,
            color: color || "white"
        }, 30000, false, // Task hook is not mandatory
        this.getCurrentTokenCount(), this.getMaxContextSize());
        // Process hook commands (MODEL, SYSTEM, ENV, BACKEND, etc.) for both approval and rejection
        await this.processHookResult(hookResult);
        if (!hookResult.approved) {
            const reason = hookResult.reason || "Hook rejected task start";
            return {
                success: false,
                error: reason
            };
        }
        if (hookResult.timedOut) {
            // Hook timed out but was auto-approved
        }
    }
    // Set the task
    this.activeTask = activeTask;
    this.activeTaskAction = action;
    this.activeTaskColor = color || "white";
    // Add system message (non-"white" colors are shown in parentheses)
    const colorStr = this.activeTaskColor && this.activeTaskColor !== "white" ? ` (${this.activeTaskColor})` : "";
    this.messages.push({
        role: 'system',
        content: `Assistant changed task status for "${this.activeTask}" to ${this.activeTaskAction}${colorStr}`
    });
    // Emit event
    this.emit('activeTaskChange', {
        activeTask: this.activeTask,
        action: this.activeTaskAction,
        color: this.activeTaskColor
    });
    return { success: true };
}
2082
/**
 * Change the status/action of the currently running task.
 *
 * Requires an active task. The (non-mandatory) task approval hook may reject
 * the transition; its side commands are applied via processHookResult for
 * both approval and rejection. On success a system message is pushed onto
 * this.messages and an 'activeTaskChange' event is emitted.
 *
 * @param {string} action - new task status/action
 * @param {string} [color] - widget color; falls back to the current task color
 * @returns {Promise<{success: boolean, error?: string}>}
 */
async transitionActiveTaskStatus(action, color) {
    // Cannot transition if no active task
    if (!this.activeTask) {
        return {
            success: false,
            error: "Cannot transition task status. No active task is currently running."
        };
    }
    // Execute hook if configured
    const settings = getSettingsManager();
    const hookPath = settings.getTaskApprovalHook();
    if (hookPath) {
        const hookResult = await executeOperationHook(hookPath, "transitionActiveTaskStatus", {
            action: action,
            color: color || "white"
        }, 30000, false, // Task hook is not mandatory
        this.getCurrentTokenCount(), this.getMaxContextSize());
        // Process hook commands (MODEL, SYSTEM, ENV, BACKEND, etc.) for both approval and rejection
        await this.processHookResult(hookResult);
        if (!hookResult.approved) {
            const reason = hookResult.reason || "Hook rejected task status transition";
            return {
                success: false,
                error: reason
            };
        }
        if (hookResult.timedOut) {
            // Hook timed out but was auto-approved
        }
    }
    // Store old action for system message
    const oldAction = this.activeTaskAction;
    // Update the action and color (color is only replaced when provided)
    this.activeTaskAction = action;
    this.activeTaskColor = color || this.activeTaskColor;
    // Add system message (non-"white" colors are shown in parentheses)
    const colorStr = this.activeTaskColor && this.activeTaskColor !== "white" ? ` (${this.activeTaskColor})` : "";
    this.messages.push({
        role: 'system',
        content: `Assistant changed task status for "${this.activeTask}" from ${oldAction} to ${this.activeTaskAction}${colorStr}`
    });
    // Emit event
    this.emit('activeTaskChange', {
        activeTask: this.activeTask,
        action: this.activeTaskAction,
        color: this.activeTaskColor
    });
    return { success: true };
}
2131
/**
 * Stop the currently running task.
 *
 * Requires an active task. The (non-mandatory) task approval hook may reject
 * the stop; its side commands are applied via processHookResult for both
 * approval and rejection. The method enforces a minimum wall-clock duration
 * (MINIMUM_STOP_TASK_DELAY_MS, measured from hook start) before completing.
 * On success the task fields are cleared, a system message is pushed onto
 * this.messages, and an 'activeTaskChange' event with empty values is emitted
 * so the UI widget clears.
 *
 * @param {string} reason - why the task is being stopped
 * @param {string} documentationFile - file path passed through to the hook
 * @param {string} [color] - color used only for the system message suffix
 * @returns {Promise<{success: boolean, error?: string}>}
 */
async stopActiveTask(reason, documentationFile, color) {
    // Cannot stop if no active task
    if (!this.activeTask) {
        return {
            success: false,
            error: "Cannot stop task. No active task is currently running."
        };
    }
    // Record the start time for 3-second minimum
    const startTime = Date.now();
    // Execute hook if configured
    const settings = getSettingsManager();
    const hookPath = settings.getTaskApprovalHook();
    if (hookPath) {
        const hookResult = await executeOperationHook(hookPath, "stopActiveTask", {
            reason: reason,
            documentation_file: documentationFile,
            color: color || "white"
        }, 30000, false, // Task hook is not mandatory
        this.getCurrentTokenCount(), this.getMaxContextSize());
        // Process hook commands (MODEL, SYSTEM, ENV, BACKEND, etc.) for both approval and rejection
        await this.processHookResult(hookResult);
        if (!hookResult.approved) {
            const hookReason = hookResult.reason || "Hook rejected task stop";
            return {
                success: false,
                error: hookReason
            };
        }
        if (hookResult.timedOut) {
            // Hook timed out but was auto-approved
        }
    }
    // Calculate remaining time to meet 3-second minimum
    const elapsed = Date.now() - startTime;
    const minimumDelay = MINIMUM_STOP_TASK_DELAY_MS;
    const remainingDelay = Math.max(0, minimumDelay - elapsed);
    // Wait for remaining time if needed
    if (remainingDelay > 0) {
        await new Promise(resolve => setTimeout(resolve, remainingDelay));
    }
    // Store task info for system message before clearing
    const stoppedTask = this.activeTask;
    const stoppedAction = this.activeTaskAction;
    // Clear the task
    this.activeTask = "";
    this.activeTaskAction = "";
    this.activeTaskColor = "white";
    // Add system message (non-"white" colors are shown in parentheses)
    const colorStr = color && color !== "white" ? ` (${color})` : "";
    this.messages.push({
        role: 'system',
        content: `Assistant stopped task "${stoppedTask}" (was ${stoppedAction}) with reason: ${reason}${colorStr}`
    });
    // Emit event to clear widget
    this.emit('activeTaskChange', {
        activeTask: "",
        action: "",
        color: "white"
    });
    return { success: true };
}
2193
+ async emitContextChange() {
2194
+ const percent = this.getContextUsagePercent();
2195
+ this.emit('contextChange', {
2196
+ current: this.getCurrentTokenCount(),
2197
+ max: this.getMaxContextSize(),
2198
+ percent
2199
+ });
2200
+ // Add system warnings based on context usage (may auto-clear at 100%)
2201
+ await this.addContextWarningIfNeeded(percent);
2202
+ }
2203
/**
 * Push escalating system-message warnings as context usage grows.
 *
 * Thresholds: >=80% one-time notice, >=90% one-time urgent warning (both
 * gated by the contextWarningAt80/contextWarningAt90 flags), >=95% critical
 * warning on EVERY call, >=100% automatic clearCache() to prevent overflow.
 *
 * @param {number} percent - current context usage percentage (0-100+)
 */
async addContextWarningIfNeeded(percent) {
    let warning = null;
    const roundedPercent = Math.round(percent);
    if (percent >= 100) {
        // Auto-clear at 100%+ to prevent exceeding context limits
        warning = `CONTEXT LIMIT REACHED: You are at ${roundedPercent}% context capacity! Automatically clearing cache to prevent context overflow...`;
        this.messages.push({
            role: 'system',
            content: warning
        });
        // Perform automatic cache clear
        await this.clearCache();
        return;
    }
    if (percent >= 95) {
        // Very stern warning at 95%+ (every time)
        warning = `CRITICAL CONTEXT WARNING: You are at ${roundedPercent}% context capacity! You MUST immediately save any notes and lessons learned, then run the 'clearCache' tool to reset the conversation context. The conversation will fail if you do not take action now.`;
    }
    else if (percent >= 90 && !this.contextWarningAt90) {
        // Dire warning at 90% (one time only)
        this.contextWarningAt90 = true;
        warning = `URGENT CONTEXT WARNING: You are at ${roundedPercent}% context capacity! Perform your final tasks or responses and prepare to be reset.`;
    }
    else if (percent >= 80 && !this.contextWarningAt80) {
        // Initial warning at 80% (one time only)
        this.contextWarningAt80 = true;
        warning = `Context Warning: You are at ${roundedPercent}% context capacity! You are approaching the limit. Be concise and avoid lengthy outputs.`;
    }
    if (warning) {
        // Add as a system message
        this.messages.push({
            role: 'system',
            content: warning
        });
    }
}
2239
+ async executeCommand(command, skipConfirmation = false) {
2240
+ return await this.zsh.execute(command, 30000, skipConfirmation);
2241
+ }
2242
/** Return the model identifier currently configured on the LLM client. */
getCurrentModel() {
    return this.llmClient.getCurrentModel();
}
2245
+ setModel(model) {
2246
+ this.llmClient.setModel(model);
2247
+ // Reset supportsVision flag for new model
2248
+ this.llmClient.setSupportsVision(true);
2249
+ // Update token counter for new model
2250
+ this.tokenCounter.dispose();
2251
+ this.tokenCounter = createTokenCounter(model);
2252
+ }
2253
+ /**
2254
+ * Strip in-progress tool calls from messages for backend/model testing
2255
+ * Removes tool_calls from the last assistant message and any corresponding tool results
2256
+ * @returns Cleaned copy of messages array, or original if no stripping needed
2257
+ */
2258
+ static stripInProgressToolCalls(messages) {
2259
+ // Find the last assistant message
2260
+ let lastAssistantIndex = -1;
2261
+ for (let i = messages.length - 1; i >= 0; i--) {
2262
+ if (messages[i].role === 'assistant') {
2263
+ lastAssistantIndex = i;
2264
+ break;
2265
+ }
2266
+ }
2267
+ // If no assistant message or it has no tool_calls, return original
2268
+ if (lastAssistantIndex === -1 || !messages[lastAssistantIndex].tool_calls) {
2269
+ return messages;
2270
+ }
2271
+ // Create deep copy to avoid modifying original
2272
+ const cleanedMessages = JSON.parse(JSON.stringify(messages));
2273
+ // Collect tool_call_ids from the last assistant message
2274
+ const toolCallIds = new Set((cleanedMessages[lastAssistantIndex].tool_calls || []).map((tc) => tc.id));
2275
+ // Remove tool_calls from the last assistant message
2276
+ delete cleanedMessages[lastAssistantIndex].tool_calls;
2277
+ // Remove any tool result messages that correspond to those tool_call_ids
2278
+ // (in case some finished but not all)
2279
+ return cleanedMessages.filter((msg, idx) => {
2280
+ if (idx <= lastAssistantIndex) {
2281
+ return true; // Keep all messages before and including the assistant message
2282
+ }
2283
+ if (msg.role === 'tool' && toolCallIds.has(msg.tool_call_id)) {
2284
+ return false; // Remove tool results for the in-progress tool calls
2285
+ }
2286
+ return true;
2287
+ });
2288
+ }
2289
+ /**
2290
+ * Test a model change by making a test API call with current conversation context
2291
+ * Rolls back to previous model if test fails
2292
+ * @param newModel Model to test
2293
+ * @returns Promise with success status and optional error message
2294
+ */
2295
+ async testModel(newModel) {
2296
+ const previousModel = this.getCurrentModel();
2297
+ const previousTokenCounter = this.tokenCounter;
2298
+ // Strip in-progress tool calls to avoid sending incomplete assistant messages
2299
+ const testMessages = LLMAgent.stripInProgressToolCalls(this.messages);
2300
+ // Build request payload for logging
2301
+ const supportsTools = this.llmClient.getSupportsTools();
2302
+ const tools = supportsTools ? await getAllLLMTools() : [];
2303
+ const requestPayload = {
2304
+ model: newModel,
2305
+ messages: testMessages,
2306
+ tools: supportsTools && tools.length > 0 ? tools : undefined,
2307
+ temperature: this.temperature,
2308
+ max_tokens: 10
2309
+ };
2310
+ try {
2311
+ // Temporarily set the new model
2312
+ this.llmClient.setModel(newModel);
2313
+ this.tokenCounter = createTokenCounter(newModel);
2314
+ // Test with actual conversation context to verify the model can handle it
2315
+ // This catches issues like ollama models that fail to parse tool calls
2316
+ const response = await this.llmClient.chat(testMessages, tools, newModel, undefined, this.temperature, undefined, 10);
2317
+ // Check if response is valid
2318
+ if (!response || !response.choices || response.choices.length === 0) {
2319
+ throw new Error("Invalid response from API");
2320
+ }
2321
+ // Test succeeded - keep the new model
2322
+ previousTokenCounter.dispose();
2323
+ return { success: true };
2324
+ }
2325
+ catch (error) {
2326
+ // Test failed - roll back to previous model
2327
+ this.llmClient.setModel(previousModel);
2328
+ this.tokenCounter.dispose();
2329
+ this.tokenCounter = previousTokenCounter;
2330
+ // Log test failure with full request/response for debugging
2331
+ const { message: logPaths } = await logApiError(requestPayload, error, { errorType: 'model-switch-test-failure', previousModel, newModel }, 'test-fail');
2332
+ const errorMessage = error.message || "Unknown error during model test";
2333
+ return {
2334
+ success: false,
2335
+ error: `Model test failed: ${errorMessage}\n${logPaths}`
2336
+ };
2337
+ }
2338
+ }
2339
/**
 * Test backend/baseUrl/model changes by making a test API call with the
 * current conversation context. Rolls back the client and apiKeyEnvVar if
 * the test fails.
 * NOTE(review): unlike testModel(), this method does not replace
 * this.tokenCounter for the new model — confirm whether that is intentional
 * (restoreSessionState() does swap the counter when it restores a backend).
 * @param backend Backend display name
 * @param baseUrl Base URL for API calls
 * @param apiKeyEnvVar Name of environment variable containing API key
 * @param model Model to use (optional, uses current model if not specified)
 * @returns Promise with success status and optional error message
 */
async testBackendModelChange(backend, baseUrl, apiKeyEnvVar, model) {
    // Snapshot everything we may need to roll back.
    const previousClient = this.llmClient;
    const previousApiKeyEnvVar = this.apiKeyEnvVar;
    const previousBackend = this.llmClient.getBackendName();
    const previousModel = this.getCurrentModel();
    // Declared outside try so the catch block can log the payload if it was built.
    let requestPayload;
    let newModel;
    try {
        // Get API key from environment
        const apiKey = process.env[apiKeyEnvVar];
        if (!apiKey) {
            throw new Error(`API key not found in environment variable: ${apiKeyEnvVar}`);
        }
        // Use current model if not specified
        newModel = model || this.getCurrentModel();
        // Create new client with new configuration
        this.llmClient = new LLMClient(apiKey, newModel, baseUrl, backend);
        // Store the API key env var name for session persistence
        this.apiKeyEnvVar = apiKeyEnvVar;
        // Reinitialize MCP servers since we're switching to a new backend/model.
        // MCP failure is non-fatal: log and continue with the backend test.
        try {
            const config = loadMCPConfig();
            if (config.servers.length > 0) {
                await initializeMCPServers();
            }
        }
        catch (mcpError) {
            console.warn("MCP reinitialization failed:", mcpError);
        }
        // Strip in-progress tool calls to avoid sending incomplete assistant messages
        const testMessages = LLMAgent.stripInProgressToolCalls(this.messages);
        // Build request payload for logging
        const supportsTools = this.llmClient.getSupportsTools();
        const tools = supportsTools ? await getAllLLMTools() : [];
        requestPayload = {
            backend,
            baseUrl,
            model: newModel,
            messages: testMessages,
            tools: supportsTools && tools.length > 0 ? tools : undefined,
            temperature: this.temperature,
            max_tokens: 10
        };
        // Test with actual conversation context to verify the backend/model can handle it
        // This catches issues like ollama models that fail to parse tool calls
        const response = await this.llmClient.chat(testMessages, tools, newModel, undefined, this.temperature, undefined, 10);
        // Check if response is valid
        if (!response || !response.choices || response.choices.length === 0) {
            throw new Error("Invalid response from API");
        }
        // Test succeeded - new client is now active
        return { success: true };
    }
    catch (error) {
        // Test failed - restore previous client and API key env var
        this.llmClient = previousClient;
        this.apiKeyEnvVar = previousApiKeyEnvVar;
        // Log test failure with full request/response for debugging (if we got far enough to build the payload)
        let logPaths = '';
        if (requestPayload) {
            const result = await logApiError(requestPayload, error, {
                errorType: 'backend-switch-test-failure',
                previousBackend,
                previousModel,
                newBackend: backend,
                newModel,
                baseUrl,
                apiKeyEnvVar
            }, 'test-fail');
            logPaths = result.message;
        }
        const errorMessage = error.message || "Unknown error during backend/model test";
        return {
            success: false,
            error: logPaths ? `${errorMessage}\n${logPaths}` : errorMessage
        };
    }
}
2426
+ /**
2427
+ * Process hook result including commands and transformations
2428
+ * Handles ENV transformations, model/backend testing, and error messaging
2429
+ * @param hookResult Hook execution result
2430
+ * @param envKey Optional ENV key to check for transformation (e.g., ZDS_AI_AGENT_PERSONA)
2431
+ * @returns Object with success status and transformed value (if any)
2432
+ */
2433
+ async processHookResult(hookResult, envKey) {
2434
+ if (!hookResult.commands) {
2435
+ return { success: true };
2436
+ }
2437
+ const results = applyHookCommands(hookResult.commands);
2438
+ // Check for transformation via ENV if key provided
2439
+ let transformedValue;
2440
+ if (envKey && results.env[envKey]) {
2441
+ transformedValue = results.env[envKey];
2442
+ }
2443
+ // Process commands (test model/backend, apply ENV vars, add SYSTEM messages)
2444
+ const success = await this.processHookCommands(results);
2445
+ return { success, transformedValue };
2446
+ }
2447
/**
 * Process hook commands (MODEL, BACKEND, BASE_URL, SYSTEM, ENV).
 * Order matters: backend/model changes are TESTED first; only on a
 * successful test are ENV variables applied and UI events emitted.
 * On failure nothing is applied and false is returned so the caller can
 * skip its own follow-up changes.
 * @param commands Hook commands from applyHookCommands()
 * @returns true when all changes applied, false when a model/backend test failed
 */
async processHookCommands(commands) {
    // Import the helper function (lazy import; applied only after tests pass)
    const { applyEnvVariables } = await import('../utils/hook-executor.js');
    // A backend change requires backend, baseUrl AND apiKeyEnvVar together
    const hasBackendChange = commands.backend && commands.baseUrl && commands.apiKeyEnvVar;
    const hasModelChange = commands.model;
    // Test backend/model changes FIRST before applying anything
    if (hasBackendChange) {
        // Backend change - test backend/baseUrl/model together
        const testResult = await this.testBackendModelChange(commands.backend, commands.baseUrl, commands.apiKeyEnvVar, commands.model);
        if (!testResult.success) {
            // Test failed - don't apply ANYTHING
            const parts = [];
            if (commands.backend)
                parts.push(`backend to "${commands.backend}"`);
            if (commands.model)
                parts.push(`model to "${commands.model}"`);
            const errorMsg = `Failed to change ${parts.join(' and ')}: ${testResult.error}`;
            // Note: Don't add to this.messages during tool execution - only chatHistory
            this.chatHistory.push({
                type: "system",
                content: errorMsg,
                timestamp: new Date(),
            });
            return false; // Signal failure - caller should not apply other changes
        }
        // Test succeeded - apply ENV variables and add success message
        applyEnvVariables(commands.env);
        const parts = [];
        if (commands.backend)
            parts.push(`backend to "${commands.backend}"`);
        if (commands.model)
            parts.push(`model to "${commands.model}"`);
        const successMsg = `Changed ${parts.join(' and ')}`;
        // Note: Don't add to this.messages during tool execution - only chatHistory
        this.chatHistory.push({
            type: "system",
            content: successMsg,
            timestamp: new Date(),
        });
        // Emit events so the UI reflects the new backend/model
        if (commands.backend) {
            this.emit('backendChange', {
                backend: commands.backend
            });
        }
        if (commands.model) {
            this.emit('modelChange', {
                model: commands.model
            });
        }
    }
    else if (hasModelChange) {
        // Model-only change
        const testResult = await this.testModel(commands.model);
        if (!testResult.success) {
            // Test failed - don't apply ANYTHING
            const errorMsg = `Failed to change model to "${commands.model}": ${testResult.error}`;
            // Note: Don't add to this.messages during tool execution - only chatHistory
            this.chatHistory.push({
                type: "system",
                content: errorMsg,
                timestamp: new Date(),
            });
            return false; // Signal failure - caller should not apply other changes
        }
        // Test succeeded - apply ENV variables and add success message
        applyEnvVariables(commands.env);
        const successMsg = `Model changed to "${commands.model}"`;
        // Note: Don't add to this.messages during tool execution - only chatHistory
        this.chatHistory.push({
            type: "system",
            content: successMsg,
            timestamp: new Date(),
        });
        // Emit modelChange event for UI updates
        this.emit('modelChange', {
            model: commands.model
        });
    }
    else {
        // No model or backend change - just apply ENV variables
        applyEnvVariables(commands.env);
    }
    // Add SYSTEM message if present (chatHistory only, same rationale as above)
    if (commands.system) {
        this.chatHistory.push({
            type: "system",
            content: commands.system,
            timestamp: new Date(),
        });
    }
    return true; // Signal success - caller can apply other changes
}
2547
/** Return the backend display name stored on the client (no detection). */
getBackend() {
    // Just return the backend name from the client (no detection)
    return this.llmClient.getBackendName();
}
2551
+ abortCurrentOperation() {
2552
+ if (this.abortController) {
2553
+ this.abortController.abort();
2554
+ }
2555
+ }
2556
+ async clearCache() {
2557
+ const { ChatHistoryManager } = await import("../utils/chat-history-manager.js");
2558
+ const { executeStartupHook } = await import("../utils/startup-hook.js");
2559
+ const { executeOperationHook, applyHookCommands } = await import("../utils/hook-executor.js");
2560
+ const historyManager = ChatHistoryManager.getInstance();
2561
+ // Backup current context to timestamped files
2562
+ historyManager.backupHistory();
2563
+ // Clear the context
2564
+ this.chatHistory = [];
2565
+ this.messages = [];
2566
+ this.contextWarningAt80 = false;
2567
+ this.contextWarningAt90 = false;
2568
+ this.firstMessageProcessed = false;
2569
+ // Add temporary system message (will be replaced by initialize())
2570
+ this.messages.push({
2571
+ role: "system",
2572
+ content: "Initializing...",
2573
+ });
2574
+ this.chatHistory.push({
2575
+ type: "system",
2576
+ content: "Initializing...",
2577
+ timestamp: new Date(),
2578
+ });
2579
+ try {
2580
+ // Re-execute startup hook to get fresh output
2581
+ this.startupHookOutput = await executeStartupHook();
2582
+ // Reinitialize with system message and startup hook
2583
+ // Instance hook runs automatically at end of initialize()
2584
+ await this.initialize();
2585
+ }
2586
+ catch (error) {
2587
+ console.error("Error during initialize() in clearCache():", error);
2588
+ // Continue anyway - we still want to save the cleared state
2589
+ }
2590
+ // Save the cleared state FIRST before emitting (in case emit causes exit)
2591
+ const sessionState = this.getSessionState();
2592
+ historyManager.saveContext(this.systemPrompt, this.chatHistory, sessionState);
2593
+ historyManager.saveMessages(this.messages);
2594
+ // Emit context change WITHOUT calling addContextWarningIfNeeded (to avoid recursive clearCache)
2595
+ const percent = this.getContextUsagePercent();
2596
+ this.emit('contextChange', {
2597
+ current: this.getCurrentTokenCount(),
2598
+ max: this.getMaxContextSize(),
2599
+ percent
2600
+ });
2601
+ // Note: Intentionally NOT calling addContextWarningIfNeeded here to prevent recursion
2602
+ }
2603
/**
 * Get current session state for persistence.
 * Snapshots identity (session id, persona, mood, active task), the working
 * directory, context token usage, and the backend/model configuration so a
 * later restoreSessionState() can rebuild the agent.
 * @returns Plain object suitable for JSON serialization.
 */
getSessionState() {
    return {
        session: process.env.ZDS_AI_AGENT_SESSION || "",
        persona: this.persona,
        personaColor: this.personaColor,
        mood: this.mood,
        moodColor: this.moodColor,
        activeTask: this.activeTask,
        activeTaskAction: this.activeTaskAction,
        activeTaskColor: this.activeTaskColor,
        cwd: process.cwd(),
        contextCurrent: this.getCurrentTokenCount(),
        contextMax: this.getMaxContextSize(),
        backend: this.llmClient.getBackendName(),
        baseUrl: this.llmClient.getBaseURL(),
        apiKeyEnvVar: this.apiKeyEnvVar,
        model: this.getCurrentModel(),
        supportsVision: this.llmClient.getSupportsVision(),
    };
}
2626
/**
 * Restore session state from persistence.
 * Restoration order matters: session id, then cwd (hooks may depend on it),
 * then the backend/model client, then persona/mood/active task (whose hooks
 * may themselves change backend/model). Each persona/mood/task step falls
 * back to setting the raw values when its hook fails or throws, so transient
 * hook errors never lose state.
 * @param state Object previously produced by getSessionState().
 */
async restoreSessionState(state) {
    // Restore session ID
    if (state.session) {
        process.env.ZDS_AI_AGENT_SESSION = state.session;
    }
    // Restore cwd early (hooks may need correct working directory)
    if (state.cwd) {
        try {
            const fs = await import('fs');
            // Only attempt to change directory if it exists
            if (fs.existsSync(state.cwd)) {
                process.chdir(state.cwd);
            }
            // Silently skip if directory doesn't exist (common in containerized environments)
        }
        catch (error) {
            // Silently skip on any error - working directory restoration is non-critical
        }
    }
    // Restore backend/baseUrl/apiKeyEnvVar/model if present (creates initial client)
    if (state.backend && state.baseUrl && state.apiKeyEnvVar) {
        try {
            // Get API key from environment
            const apiKey = process.env[state.apiKeyEnvVar];
            if (apiKey) {
                // Create new client with restored configuration
                const model = state.model || this.getCurrentModel();
                this.llmClient = new LLMClient(apiKey, model, state.baseUrl, state.backend);
                this.apiKeyEnvVar = state.apiKeyEnvVar;
                // Restore supportsVision flag if present
                if (state.supportsVision !== undefined) {
                    this.llmClient.setSupportsVision(state.supportsVision);
                }
                // Reinitialize MCP servers when restoring session (non-fatal on failure)
                try {
                    const config = loadMCPConfig();
                    if (config.servers.length > 0) {
                        await initializeMCPServers();
                    }
                }
                catch (mcpError) {
                    console.warn("MCP reinitialization failed:", mcpError);
                }
                // Dispose old token counter and create new one for the restored model
                this.tokenCounter.dispose();
                this.tokenCounter = createTokenCounter(model);
                // Emit events for UI updates
                this.emit('backendChange', { backend: state.backend });
                this.emit('modelChange', { model });
            }
            else {
                console.warn("Failed to restore backend: API key not found in environment.");
            }
        }
        catch (error) {
            console.warn(`Failed to restore backend configuration:`, error);
        }
    }
    // Restore persona (hook may change backend/model and sets env vars)
    if (state.persona) {
        try {
            const result = await this.setPersona(state.persona, state.personaColor);
            if (!result.success) {
                // If persona hook failed (e.g., backend test failed), still set the persona values
                // but don't change backend/model. This prevents losing persona state on transitory errors.
                console.warn(`Persona hook failed, setting persona without backend change: ${result.error}`);
                this.persona = state.persona;
                this.personaColor = state.personaColor;
                process.env.ZDS_AI_AGENT_PERSONA = state.persona;
            }
        }
        catch (error) {
            console.warn(`Failed to restore persona "${state.persona}":`, error);
            // Still set persona values even if hook crashed
            this.persona = state.persona;
            this.personaColor = state.personaColor;
            process.env.ZDS_AI_AGENT_PERSONA = state.persona;
        }
    }
    // Restore mood (hook sets env vars)
    if (state.mood) {
        try {
            const result = await this.setMood(state.mood, state.moodColor);
            if (!result.success) {
                // If mood hook failed (e.g., backend test failed), still set the mood values
                // but don't change backend/model. This prevents losing mood state on transitory errors.
                console.warn(`Mood hook failed, setting mood without backend change: ${result.error}`);
                this.mood = state.mood;
                this.moodColor = state.moodColor;
                process.env.ZDS_AI_AGENT_MOOD = state.mood;
            }
        }
        catch (error) {
            console.warn(`Failed to restore mood "${state.mood}":`, error);
            // Still set mood values even if hook crashed
            this.mood = state.mood;
            this.moodColor = state.moodColor;
            process.env.ZDS_AI_AGENT_MOOD = state.mood;
        }
    }
    // Restore active task (hook sets env vars)
    if (state.activeTask) {
        try {
            const result = await this.startActiveTask(state.activeTask, state.activeTaskAction, state.activeTaskColor);
            if (!result.success) {
                // If task hook failed (e.g., backend test failed), still set the task values
                // but don't change backend/model. This prevents losing task state on transitory errors.
                console.warn(`Task hook failed, setting active task without backend change: ${result.error}`);
                this.activeTask = state.activeTask;
                this.activeTaskAction = state.activeTaskAction;
                this.activeTaskColor = state.activeTaskColor;
                process.env.ZDS_AI_AGENT_ACTIVE_TASK = state.activeTask;
                process.env.ZDS_AI_AGENT_ACTIVE_TASK_ACTION = state.activeTaskAction;
            }
        }
        catch (error) {
            console.warn(`Failed to restore active task "${state.activeTask}":`, error);
            // Still set task values even if hook crashed
            this.activeTask = state.activeTask;
            this.activeTaskAction = state.activeTaskAction;
            this.activeTaskColor = state.activeTaskColor;
            process.env.ZDS_AI_AGENT_ACTIVE_TASK = state.activeTask;
            process.env.ZDS_AI_AGENT_ACTIVE_TASK_ACTION = state.activeTaskAction;
        }
    }
}
2755
/**
 * Compact conversation context by keeping only the last N chatHistory
 * entries, then rebuilding this.messages from what remains.
 * NOTE(review): despite the original description, the system prompt is not
 * explicitly preserved — it survives only if it falls within the last N
 * entries. TODO confirm intended behavior.
 * @param keepLastMessages Number of trailing chatHistory entries to keep.
 * @returns Number of messages removed.
 */
compactContext(keepLastMessages = 20) {
    if (this.chatHistory.length <= keepLastMessages) {
        // Nothing to compact
        return 0;
    }
    const removedCount = this.chatHistory.length - keepLastMessages;
    const keptMessages = this.chatHistory.slice(-keepLastMessages);
    // Replace history with the kept tail; messages will be rebuilt below
    this.chatHistory = keptMessages;
    this.messages = [];
    // Add system message noting the compaction
    const compactionNote = {
        type: 'system',
        content: `Context compacted: removed ${removedCount} older messages, keeping last ${keepLastMessages} messages.`,
        timestamp: new Date()
    };
    this.chatHistory.push(compactionNote);
    // Rebuild this.messages from compacted chatHistory
    for (const entry of this.chatHistory) {
        if (entry.type === 'system') {
            this.messages.push({
                role: 'system',
                content: entry.content
            });
        }
        else if (entry.type === 'user') {
            this.messages.push({
                role: 'user',
                content: entry.content
            });
        }
        else if (entry.type === 'assistant') {
            this.messages.push({
                role: 'assistant',
                content: entry.content
            });
        }
        else if (entry.type === 'tool_result') {
            this.messages.push({
                role: 'tool',
                // NOTE(review): tool_call_id is filled from toolResult.output,
                // which looks like tool output rather than the originating call
                // id — confirm the intended field. Also these rebuilt 'tool'
                // messages have no preceding assistant message with matching
                // tool_calls, which some chat backends reject. TODO confirm.
                tool_call_id: entry.toolResult.output || '',
                content: JSON.stringify(entry.toolResult)
            });
        }
    }
    return removedCount;
}
2807
+ /**
2808
+ * Get all tool instances and their class names for display purposes
2809
+ */
2810
+ getToolClassInfo() {
2811
+ const toolInstances = this.getToolInstances();
2812
+ return toolInstances.map(({ instance, className }) => ({
2813
+ className,
2814
+ methods: instance.getHandledToolNames ? instance.getHandledToolNames() : []
2815
+ }));
2816
+ }
2817
+ /**
2818
+ * Get all tool instances via reflection
2819
+ */
2820
+ getToolInstances() {
2821
+ const instances = [];
2822
+ // Use reflection to find all tool instance properties
2823
+ const propertyNames = Object.getOwnPropertyNames(this);
2824
+ for (const propName of propertyNames) {
2825
+ const propValue = this[propName];
2826
+ // Check if this property is a tool instance (has getHandledToolNames method)
2827
+ if (propValue &&
2828
+ typeof propValue === 'object' &&
2829
+ typeof propValue.getHandledToolNames === 'function') {
2830
+ instances.push({
2831
+ instance: propValue,
2832
+ className: propValue.constructor.name
2833
+ });
2834
+ }
2835
+ }
2836
+ return instances;
2837
+ }
2838
+ }
2839
+ //# sourceMappingURL=llm-agent.js.map