npm - @defai.digital/ax-cli - Versions diffs - 3.7.2 → 3.8.2 - Mend

@defai.digital/ax-cli 3.7.2 → 3.8.2

This diff shows the differences between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (213)

package/README.md +148 -53
package/dist/agent/context-manager.d.ts +15 -1
package/dist/agent/context-manager.js +50 -19
package/dist/agent/context-manager.js.map +1 -1
package/dist/agent/dependency-resolver.js +13 -7
package/dist/agent/dependency-resolver.js.map +1 -1
package/dist/agent/llm-agent.d.ts +37 -0
package/dist/agent/llm-agent.js +318 -98
package/dist/agent/llm-agent.js.map +1 -1
package/dist/agent/status-reporter.d.ts +114 -0
package/dist/agent/status-reporter.js +335 -0
package/dist/agent/status-reporter.js.map +1 -0
package/dist/analyzers/best-practices/rules/typescript/no-magic-numbers.js +8 -2
package/dist/analyzers/best-practices/rules/typescript/no-magic-numbers.js.map +1 -1
package/dist/analyzers/best-practices/rules/typescript/no-unused-vars.js +3 -1
package/dist/analyzers/best-practices/rules/typescript/no-unused-vars.js.map +1 -1
package/dist/analyzers/best-practices/rules/typescript/prefer-const.js +3 -1
package/dist/analyzers/best-practices/rules/typescript/prefer-const.js.map +1 -1
package/dist/analyzers/best-practices/rules/typescript/prefer-readonly.js +3 -1
package/dist/analyzers/best-practices/rules/typescript/prefer-readonly.js.map +1 -1
package/dist/analyzers/code-smells/detectors/duplicate-code-detector.js +9 -3
package/dist/analyzers/code-smells/detectors/duplicate-code-detector.js.map +1 -1
package/dist/analyzers/git/churn-calculator.d.ts +2 -0
package/dist/analyzers/git/churn-calculator.js +42 -8
package/dist/analyzers/git/churn-calculator.js.map +1 -1
package/dist/analyzers/git/hotspot-detector.js +2 -2
package/dist/analyzers/git/hotspot-detector.js.map +1 -1
package/dist/analyzers/metrics/metrics-analyzer.js +1 -1
package/dist/analyzers/metrics/metrics-analyzer.js.map +1 -1
package/dist/analyzers/security/security-analyzer.js +1 -1
package/dist/analyzers/security/security-analyzer.js.map +1 -1
package/dist/checkpoint/manager.d.ts +1 -0
package/dist/checkpoint/manager.js +49 -9
package/dist/checkpoint/manager.js.map +1 -1
package/dist/checkpoint/storage.js +2 -2
package/dist/checkpoint/storage.js.map +1 -1
package/dist/commands/mcp-migrate.d.ts +9 -0
package/dist/commands/mcp-migrate.js +172 -0
package/dist/commands/mcp-migrate.js.map +1 -0
package/dist/commands/status.d.ts +7 -0
package/dist/commands/status.js +211 -0
package/dist/commands/status.js.map +1 -0
package/dist/commands/vscode.d.ts +7 -0
package/dist/commands/vscode.js +363 -0
package/dist/commands/vscode.js.map +1 -0
package/dist/index.js +79 -30
package/dist/index.js.map +1 -1
package/dist/llm/client.js +33 -4
package/dist/llm/client.js.map +1 -1
package/dist/mcp/automatosx-loader.d.ts +84 -0
package/dist/mcp/automatosx-loader.js +238 -0
package/dist/mcp/automatosx-loader.js.map +1 -0
package/dist/mcp/client-mutex-patch.d.ts +36 -0
package/dist/mcp/client-mutex-patch.js +75 -0
package/dist/mcp/client-mutex-patch.js.map +1 -0
package/dist/mcp/client-v2.d.ts +229 -0
package/dist/mcp/client-v2.js +740 -0
package/dist/mcp/client-v2.js.map +1 -0
package/dist/mcp/client.d.ts +111 -13
package/dist/mcp/client.js +168 -253
package/dist/mcp/client.js.map +1 -1
package/dist/mcp/config-detector-v2.d.ts +83 -0
package/dist/mcp/config-detector-v2.js +328 -0
package/dist/mcp/config-detector-v2.js.map +1 -0
package/dist/mcp/config-detector.d.ts +90 -0
package/dist/mcp/config-detector.js +242 -0
package/dist/mcp/config-detector.js.map +1 -0
package/dist/mcp/config-migrator-v2.d.ts +89 -0
package/dist/mcp/config-migrator-v2.js +288 -0
package/dist/mcp/config-migrator-v2.js.map +1 -0
package/dist/mcp/config-migrator.d.ts +63 -0
package/dist/mcp/config-migrator.js +269 -0
package/dist/mcp/config-migrator.js.map +1 -0
package/dist/mcp/config-v2.d.ts +106 -0
package/dist/mcp/config-v2.js +417 -0
package/dist/mcp/config-v2.js.map +1 -0
package/dist/mcp/config.d.ts +12 -1
package/dist/mcp/config.js +95 -10
package/dist/mcp/config.js.map +1 -1
package/dist/mcp/error-formatter.d.ts +46 -0
package/dist/mcp/error-formatter.js +244 -0
package/dist/mcp/error-formatter.js.map +1 -0
package/dist/mcp/health.d.ts +5 -0
package/dist/mcp/health.js +22 -2
package/dist/mcp/health.js.map +1 -1
package/dist/mcp/invariants.d.ts +141 -0
package/dist/mcp/invariants.js +243 -0
package/dist/mcp/invariants.js.map +1 -0
package/dist/mcp/mutex-safe.d.ts +153 -0
package/dist/mcp/mutex-safe.js +260 -0
package/dist/mcp/mutex-safe.js.map +1 -0
package/dist/mcp/mutex.d.ts +73 -0
package/dist/mcp/mutex.js +137 -0
package/dist/mcp/mutex.js.map +1 -0
package/dist/mcp/reconnection.d.ts +4 -0
package/dist/mcp/reconnection.js +25 -1
package/dist/mcp/reconnection.js.map +1 -1
package/dist/mcp/transports-v2.d.ts +152 -0
package/dist/mcp/transports-v2.js +481 -0
package/dist/mcp/transports-v2.js.map +1 -0
package/dist/mcp/type-safety.d.ts +231 -0
package/dist/mcp/type-safety.js +273 -0
package/dist/mcp/type-safety.js.map +1 -0
package/dist/planner/task-planner.js +13 -0
package/dist/planner/task-planner.js.map +1 -1
package/dist/planner/types.d.ts +6 -6
package/dist/schemas/confirmation-schemas.d.ts +2 -2
package/dist/schemas/settings-schemas.d.ts +196 -0
package/dist/schemas/settings-schemas.js +146 -5
package/dist/schemas/settings-schemas.js.map +1 -1
package/dist/sdk/index.d.ts +118 -2
package/dist/sdk/index.js +146 -4
package/dist/sdk/index.js.map +1 -1
package/dist/sdk/testing.d.ts +182 -0
package/dist/sdk/testing.js +231 -0
package/dist/sdk/testing.js.map +1 -1
package/dist/sdk/version.d.ts +114 -15
package/dist/sdk/version.js +137 -15
package/dist/sdk/version.js.map +1 -1
package/dist/tools/bash.js +54 -9
package/dist/tools/bash.js.map +1 -1
package/dist/tools/registry.d.ts +146 -0
package/dist/tools/registry.js +170 -0
package/dist/tools/registry.js.map +1 -0
package/dist/tools/search.js +12 -2
package/dist/tools/search.js.map +1 -1
package/dist/tools/text-editor.js +84 -26
package/dist/tools/text-editor.js.map +1 -1
package/dist/ui/components/chat-history.js +6 -1
package/dist/ui/components/chat-history.js.map +1 -1
package/dist/ui/components/chat-input.d.ts +2 -1
package/dist/ui/components/chat-input.js +5 -2
package/dist/ui/components/chat-input.js.map +1 -1
package/dist/ui/components/chat-interface.js +187 -5
package/dist/ui/components/chat-interface.js.map +1 -1
package/dist/ui/components/context-breakdown.d.ts +23 -0
package/dist/ui/components/context-breakdown.js +124 -0
package/dist/ui/components/context-breakdown.js.map +1 -0
package/dist/ui/components/keyboard-help.d.ts +17 -0
package/dist/ui/components/keyboard-help.js +116 -0
package/dist/ui/components/keyboard-help.js.map +1 -0
package/dist/ui/components/keyboard-hints.js +2 -2
package/dist/ui/components/keyboard-hints.js.map +1 -1
package/dist/ui/components/quick-actions.js +43 -7
package/dist/ui/components/quick-actions.js.map +1 -1
package/dist/ui/components/status-bar.d.ts +3 -0
package/dist/ui/components/status-bar.js +25 -16
package/dist/ui/components/status-bar.js.map +1 -1
package/dist/ui/components/toast-notification.d.ts +42 -0
package/dist/ui/components/toast-notification.js +30 -2
package/dist/ui/components/toast-notification.js.map +1 -1
package/dist/ui/components/tool-group-display.js +34 -4
package/dist/ui/components/tool-group-display.js.map +1 -1
package/dist/ui/components/welcome-panel.js +2 -2
package/dist/ui/components/welcome-panel.js.map +1 -1
package/dist/ui/hooks/use-enhanced-input.d.ts +9 -1
package/dist/ui/hooks/use-enhanced-input.js +901 -90
package/dist/ui/hooks/use-enhanced-input.js.map +1 -1
package/dist/ui/hooks/use-input-handler.d.ts +11 -1
package/dist/ui/hooks/use-input-handler.js +67 -3
package/dist/ui/hooks/use-input-handler.js.map +1 -1
package/dist/ui/hooks/use-input-history.d.ts +1 -1
package/dist/ui/hooks/use-input-history.js +50 -14
package/dist/ui/hooks/use-input-history.js.map +1 -1
package/dist/ui/utils/bracketed-paste-handler.d.ts +97 -0
package/dist/ui/utils/bracketed-paste-handler.js +322 -0
package/dist/ui/utils/bracketed-paste-handler.js.map +1 -0
package/dist/ui/utils/change-summarizer.js +16 -6
package/dist/ui/utils/change-summarizer.js.map +1 -1
package/dist/ui/utils/tool-grouper.d.ts +10 -1
package/dist/ui/utils/tool-grouper.js +143 -30
package/dist/ui/utils/tool-grouper.js.map +1 -1
package/dist/utils/auto-accept-logger.d.ts +173 -0
package/dist/utils/auto-accept-logger.js +420 -0
package/dist/utils/auto-accept-logger.js.map +1 -0
package/dist/utils/background-task-manager.d.ts +11 -0
package/dist/utils/background-task-manager.js +124 -38
package/dist/utils/background-task-manager.js.map +1 -1
package/dist/utils/confirmation-service.d.ts +1 -0
package/dist/utils/confirmation-service.js +6 -1
package/dist/utils/confirmation-service.js.map +1 -1
package/dist/utils/encryption.d.ts +8 -0
package/dist/utils/encryption.js +44 -27
package/dist/utils/encryption.js.map +1 -1
package/dist/utils/enhanced-error-messages.d.ts +33 -0
package/dist/utils/enhanced-error-messages.js +420 -0
package/dist/utils/enhanced-error-messages.js.map +1 -0
package/dist/utils/error-handler.d.ts +13 -3
package/dist/utils/error-handler.js +16 -4
package/dist/utils/error-handler.js.map +1 -1
package/dist/utils/external-editor.d.ts +47 -0
package/dist/utils/external-editor.js +179 -0
package/dist/utils/external-editor.js.map +1 -0
package/dist/utils/history-migration.d.ts +9 -0
package/dist/utils/history-migration.js +36 -0
package/dist/utils/history-migration.js.map +1 -0
package/dist/utils/paste-utils.js +12 -11
package/dist/utils/paste-utils.js.map +1 -1
package/dist/utils/rate-limiter.js +20 -1
package/dist/utils/rate-limiter.js.map +1 -1
package/dist/utils/safety-rules.d.ts +64 -0
package/dist/utils/safety-rules.js +225 -0
package/dist/utils/safety-rules.js.map +1 -0
package/dist/utils/settings-manager.d.ts +89 -1
package/dist/utils/settings-manager.js +359 -3
package/dist/utils/settings-manager.js.map +1 -1
package/dist/utils/token-counter.d.ts +2 -0
package/dist/utils/token-counter.js +32 -9
package/dist/utils/token-counter.js.map +1 -1
package/dist/utils/version.d.ts +11 -2
package/dist/utils/version.js +54 -21
package/dist/utils/version.js.map +1 -1
package/package.json +2 -1

package/dist/agent/llm-agent.js (changed)

@@ -20,6 +20,8 @@ import { SubagentOrchestrator } from "./subagent-orchestrator.js";
 import { getTaskPlanner, isComplexRequest, } from "../planner/index.js";
 import { PLANNER_CONFIG } from "../constants.js";
 import { resolveMCPReferences, extractMCPReferences } from "../mcp/resources.js";
+import { SDKError, SDKErrorCode } from "../sdk/errors.js";
+import { getStatusReporter } from "./status-reporter.js";
 export class LLMAgent extends EventEmitter {
     llmClient;
     textEditor;
@@ -51,6 +53,11 @@ export class LLMAgent extends EventEmitter {
     thinkingConfig;
     /** Track if agent has been disposed */
     disposed = false;
+    /** Tool approval system for VSCode integration */
+    requireToolApproval = false;
+    toolApprovalCallbacks = new Map();
+    /** BUG FIX: Track approval timeouts for cleanup to prevent memory leaks */
+    toolApprovalTimeouts = new Map();
     constructor(apiKey, baseURL, model, maxToolRounds) {
         super();
         const manager = getSettingsManager();
@@ -76,10 +83,15 @@ export class LLMAgent extends EventEmitter {
         // Load sampling configuration from settings (supports env vars, project, and user settings)
         this.samplingConfig = manager.getSamplingSettings();
         // Wire up checkpoint callback for automatic checkpoint creation
+        // CRITICAL FIX: Deep clone chatHistory to prevent race conditions
+        // The checkpoint creation is async and chatHistory can be modified during the operation
         this.textEditor.setCheckpointCallback(async (files, description) => {
+            // Create immutable snapshot of chat history at callback time
+            // This prevents inconsistencies if messages are added during checkpoint creation
+            const chatHistorySnapshot = JSON.parse(JSON.stringify(this.chatHistory));
             await this.checkpointManager.createCheckpoint({
                 files,
-                conversationState: this.chatHistory,
+                conversationState: chatHistorySnapshot,
                 description,
                 metadata: {
                     model: this.llmClient.getCurrentModel(),
@@ -110,6 +122,17 @@ export class LLMAgent extends EventEmitter {
             role: "system",
             content: `Current working directory: ${process.cwd()}\nTimestamp: ${new Date().toISOString().split('T')[0]}`,
         });
+        // NEW: Listen for context pruning to generate summaries
+        // CRITICAL FIX: Wrap async callback to prevent uncaught promise rejections
+        // Event listeners don't handle async errors automatically, so we must catch them
+        this.contextManager.on('before_prune', (data) => {
+            this.handleContextOverflow(data).catch((error) => {
+                const errorMsg = extractErrorMessage(error);
+                console.error('Error handling context overflow:', errorMsg);
+                // Emit error event for monitoring
+                this.emit('error', error);
+            });
+        });
     }
     initializeCheckpointManager() {
         // Initialize checkpoint manager in the background
@@ -130,7 +153,6 @@ export class LLMAgent extends EventEmitter {
     }
     async initializeMCP() {
         // Initialize MCP in the background without blocking
-        // Single error handler - no redundant catch needed since inner try-catch handles all errors
         Promise.resolve().then(async () => {
             try {
                 const config = loadMCPConfig();
@@ -144,6 +166,9 @@ export class LLMAgent extends EventEmitter {
                 console.warn("MCP initialization failed:", errorMsg);
                 this.emit('system', `MCP initialization failed: ${errorMsg}`);
             }
+        }).catch((error) => {
+            // Catch any errors from emit() or other unexpected failures
+            console.error("Unexpected MCP initialization error:", error);
         });
     }
     /**
@@ -188,32 +213,134 @@ export class LLMAgent extends EventEmitter {
     getSamplingConfig() {
         return this.samplingConfig;
     }
+    /**
+     * Enable or disable tool approval requirement
+     * When enabled, text_editor operations will emit 'tool:approval_required' events
+     * and wait for approval before executing
+     *
+     * This is used by VSCode extension to show diff previews
+     *
+     * @param enabled - Whether to require approval for text_editor operations
+     */
+    setRequireToolApproval(enabled) {
+        this.requireToolApproval = enabled;
+    }
+    /**
+     * Approve or reject a pending tool call
+     * Called by external integrations (e.g., VSCode extension) in response to
+     * 'tool:approval_required' events
+     *
+     * @param toolCallId - The ID of the tool call to approve/reject
+     * @param approved - true to execute the tool, false to reject it
+     */
+    approveToolCall(toolCallId, approved) {
+        const callback = this.toolApprovalCallbacks.get(toolCallId);
+        if (callback) {
+            // BUG FIX: Clear the timeout when approval is received (prevents memory leak)
+            const timeout = this.toolApprovalTimeouts.get(toolCallId);
+            if (timeout) {
+                clearTimeout(timeout);
+                this.toolApprovalTimeouts.delete(toolCallId);
+            }
+            callback(approved);
+            this.toolApprovalCallbacks.delete(toolCallId);
+        }
+    }
+    /**
+     * Wait for external approval of a tool call
+     * Emits 'tool:approval_required' event and waits for approveToolCall() to be called
+     *
+     * @param toolCall - The tool call awaiting approval
+     * @returns Promise<boolean> - true if approved, false if rejected or timeout
+     */
+    waitForToolApproval(toolCall) {
+        return new Promise((resolve) => {
+            // Emit event so external integrations can show diff preview
+            this.emit('tool:approval_required', toolCall);
+            // Store callback
+            this.toolApprovalCallbacks.set(toolCall.id, resolve);
+            // BUG FIX: Track the timeout so it can be cleared on approval/disposal
+            // This prevents memory leaks from dangling timers
+            const timeoutId = setTimeout(() => {
+                // Clean up both the callback and timeout tracking
+                this.toolApprovalTimeouts.delete(toolCall.id);
+                if (this.toolApprovalCallbacks.has(toolCall.id)) {
+                    this.toolApprovalCallbacks.delete(toolCall.id);
+                    resolve(false); // Auto-reject on timeout
+                }
+            }, 5 * 60 * 1000);
+            // Track the timeout for cleanup
+            this.toolApprovalTimeouts.set(toolCall.id, timeoutId);
+        });
+    }
+    /**
+     * Handle context overflow by generating a summary
+     * Called when context manager is about to prune messages
+     */
+    async handleContextOverflow(data) {
+        try {
+            const reporter = getStatusReporter();
+            const summary = await reporter.generateContextSummary(data.messages, this.chatHistory, 'context_overflow', data.tokenCount);
+            // Log for debugging
+            if (process.env.DEBUG) {
+                console.log(`[Context Overflow] Summary generated: ${summary.path}`);
+            }
+            // Add a chat entry to inform user (non-blocking)
+            const summaryEntry = {
+                type: 'assistant',
+                content: `⚠️ Context window approaching limit (${data.tokenCount.toLocaleString()} tokens). Summary saved to:\n\`${summary.path}\``,
+                timestamp: new Date(),
+            };
+            this.chatHistory.push(summaryEntry);
+            // Emit event for UI/logging
+            this.emit('context:summary', summary);
+        }
+        catch (error) {
+            // Summary generation failure should not block execution
+            const errorMsg = extractErrorMessage(error);
+            console.warn('Failed to generate context summary:', errorMsg);
+        }
+    }
     /**
      * Apply context pruning to both messages and chatHistory
      * BUGFIX: Prevents chatHistory from growing unbounded
      */
     applyContextPruning() {
+        // Prune LLM messages if needed
         if (this.contextManager.shouldPrune(this.messages, this.tokenCounter)) {
-            // Prune LLM messages
             this.messages = this.contextManager.pruneMessages(this.messages, this.tokenCounter);
-            // Also prune chatHistory to prevent unlimited growth
-            // Keep last 200 entries which is more than enough for UI display
-            const MAX_CHAT_HISTORY_ENTRIES = 200;
-            if (this.chatHistory.length > MAX_CHAT_HISTORY_ENTRIES) {
-                const entriesToRemove = this.chatHistory.length - MAX_CHAT_HISTORY_ENTRIES;
-                this.chatHistory = this.chatHistory.slice(entriesToRemove);
-                // Update tool call index map after pruning
-                // Clear and rebuild only for remaining entries
-                this.toolCallIndexMap.clear();
-                this.chatHistory.forEach((entry, index) => {
-                    if (entry.type === "tool_call" && entry.toolCall?.id) {
-                        this.toolCallIndexMap.set(entry.toolCall.id, index);
-                    }
-                    else if (entry.type === "tool_result" && entry.toolCall?.id) {
-                        this.toolCallIndexMap.set(entry.toolCall.id, index);
-                    }
-                });
-            }
+        }
+        // CRITICAL FIX: Always check and prune chatHistory to prevent unbounded growth
+        // This must happen UNCONDITIONALLY, even if context pruning is disabled
+        // Keep last 200 entries which is more than enough for UI display
+        const MAX_CHAT_HISTORY_ENTRIES = 200;
+        if (this.chatHistory.length > MAX_CHAT_HISTORY_ENTRIES) {
+            const entriesToRemove = this.chatHistory.length - MAX_CHAT_HISTORY_ENTRIES;
+            this.chatHistory = this.chatHistory.slice(entriesToRemove);
+            // Update tool call index map after pruning
+            // Clear and rebuild only for remaining entries
+            this.toolCallIndexMap.clear();
+            this.chatHistory.forEach((entry, index) => {
+                if (entry.type === "tool_call" && entry.toolCall?.id) {
+                    this.toolCallIndexMap.set(entry.toolCall.id, index);
+                }
+                else if (entry.type === "tool_result" && entry.toolCall?.id) {
+                    this.toolCallIndexMap.set(entry.toolCall.id, index);
+                }
+            });
+        }
+        // CRITICAL FIX: Add hard limit for messages array as safety backstop
+        // In case contextManager.shouldPrune() always returns false
+        const MAX_MESSAGES = 500;
+        if (this.messages.length > MAX_MESSAGES) {
+            // Keep system message (if exists) + last N messages
+            const systemMessages = this.messages.filter(m => m.role === 'system');
+            const nonSystemMessages = this.messages.filter(m => m.role !== 'system');
+            const keepMessages = Math.min(nonSystemMessages.length, MAX_MESSAGES - systemMessages.length);
+            this.messages = [
+                ...systemMessages,
+                ...nonSystemMessages.slice(-keepMessages)
+            ];
         }
     }
     /**
@@ -235,13 +362,16 @@ export class LLMAgent extends EventEmitter {
         try {
             const args = JSON.parse(toolCall.function.arguments || '{}');
             this.toolCallArgsCache.set(toolCall.id, args);
-            // Prevent unbounded memory growth - limit cache size
+            // CRITICAL FIX: Prevent unbounded memory growth with proper cache eviction
+            // When cache exceeds limit, reduce to 80% capacity (not just remove 100 entries)
             if (this.toolCallArgsCache.size > 500) {
+                const targetSize = 400; // 80% of max capacity
+                const toRemove = this.toolCallArgsCache.size - targetSize;
                 let deleted = 0;
                 for (const key of this.toolCallArgsCache.keys()) {
                     this.toolCallArgsCache.delete(key);
                     deleted++;
-                    if (deleted >= 100)
+                    if (deleted >= toRemove)
                         break;
                 }
             }
@@ -727,6 +857,29 @@ export class LLMAgent extends EventEmitter {
             }
             // Emit plan completed event
             this.emit("plan:completed", { plan, result: planResult });
+            // Generate status report on plan completion
+            try {
+                const reporter = getStatusReporter();
+                const tokenCount = this.tokenCounter.countMessageTokens(this.messages);
+                const statusReport = await reporter.generateStatusReport({
+                    messages: this.messages,
+                    chatHistory: this.chatHistory,
+                    tokenCount,
+                    plan,
+                });
+                // Notify user of status report
+                yield {
+                    type: "content",
+                    content: `\n📊 Status report saved to: \`${statusReport.path}\`\n`,
+                };
+                // Emit event for UI/logging
+                this.emit("plan:report", statusReport);
+            }
+            catch (error) {
+                // Status report generation failure should not block execution
+                const errorMsg = extractErrorMessage(error);
+                console.warn("Failed to generate status report:", errorMsg);
+            }
             this.currentPlan = null;
         }
         catch (error) {
@@ -1167,85 +1320,102 @@ export class LLMAgent extends EventEmitter {
         let accumulatedContent = "";
         let toolCallsYielded = false;
         let usageData = null;
-        for await (const chunk of stream) {
-            // Check for cancellation in the streaming loop
-            if (this.isCancelled()) {
-                yield* this.yieldCancellation();
-                // Return empty state after cancellation to avoid processing partial results
-                return { accumulated: {}, content: "", yielded: false };
-            }
-            if (!chunk.choices?.[0])
-                continue;
-            // Capture usage data from chunks (usually in the final chunk)
-            if (chunk.usage) {
-                usageData = chunk.usage;
-            }
-            // Accumulate the message using reducer
-            accumulatedMessage = this.messageReducer(accumulatedMessage, chunk);
-            // Check for tool calls - yield when we have complete tool calls with function names
-            const toolCalls = accumulatedMessage.tool_calls;
-            if (!toolCallsYielded && toolCalls && Array.isArray(toolCalls) && toolCalls.length > 0) {
-                const hasCompleteTool = toolCalls.some((tc) => tc.function?.name);
-                if (hasCompleteTool) {
+        // CRITICAL FIX: Ensure stream is properly closed on cancellation or error
+        // Without this, HTTP connections and buffers remain in memory
+        try {
+            for await (const chunk of stream) {
+                // Check for cancellation in the streaming loop
+                if (this.isCancelled()) {
+                    yield* this.yieldCancellation();
+                    // Return empty state after cancellation to avoid processing partial results
+                    return { accumulated: {}, content: "", yielded: false };
+                }
+                if (!chunk.choices?.[0])
+                    continue;
+                // Capture usage data from chunks (usually in the final chunk)
+                if (chunk.usage) {
+                    usageData = chunk.usage;
+                }
+                // Accumulate the message using reducer
+                accumulatedMessage = this.messageReducer(accumulatedMessage, chunk);
+                // Check for tool calls - yield when we have complete tool calls with function names
+                const toolCalls = accumulatedMessage.tool_calls;
+                if (!toolCallsYielded && toolCalls && Array.isArray(toolCalls) && toolCalls.length > 0) {
+                    const hasCompleteTool = toolCalls.some((tc) => tc.function?.name);
+                    if (hasCompleteTool) {
+                        yield {
+                            type: "tool_calls",
+                            toolCalls: toolCalls,
+                        };
+                        toolCallsYielded = true;
+                    }
+                }
+                // Stream reasoning content (GLM-4.6 thinking mode)
+                // Safety check: ensure choices[0] exists before accessing
+                if (chunk.choices[0]?.delta?.reasoning_content) {
                     yield {
-                        type: "tool_calls",
-                        toolCalls: toolCalls,
+                        type: "reasoning",
+                        reasoningContent: chunk.choices[0].delta.reasoning_content,
                     };
-                    toolCallsYielded = true;
+                }
+                // Stream content as it comes
+                if (chunk.choices[0]?.delta?.content) {
+                    accumulatedContent += chunk.choices[0].delta.content;
+                    yield {
+                        type: "content",
+                        content: chunk.choices[0].delta.content,
+                    };
+                    // Emit token count update (throttled and optimized)
+                    const now = Date.now();
+                    if (now - lastTokenUpdate.value > 1000) { // Increased throttle to 1s for better performance
+                        lastTokenUpdate.value = now;
+                        // Use fast estimation during streaming (4 chars ≈ 1 token)
+                        // This is ~70% faster than tiktoken encoding
+                        const estimatedOutputTokens = Math.floor(accumulatedContent.length / 4) +
+                            (accumulatedMessage.tool_calls
+                                ? Math.floor(JSON.stringify(accumulatedMessage.tool_calls).length / 4)
+                                : 0);
+                        totalOutputTokens.value = estimatedOutputTokens;
+                        yield {
+                            type: "token_count",
+                            tokenCount: inputTokens + estimatedOutputTokens,
+                        };
+                    }
                 }
             }
-            // Stream reasoning content (GLM-4.6 thinking mode)
-            // Safety check: ensure choices[0] exists before accessing
-            if (chunk.choices[0]?.delta?.reasoning_content) {
-                yield {
-                    type: "reasoning",
-                    reasoningContent: chunk.choices[0].delta.reasoning_content,
-                };
-            }
-            // Stream content as it comes
-            if (chunk.choices[0]?.delta?.content) {
-                accumulatedContent += chunk.choices[0].delta.content;
-                yield {
-                    type: "content",
-                    content: chunk.choices[0].delta.content,
-                };
-                // Emit token count update (throttled and optimized)
-                const now = Date.now();
-                if (now - lastTokenUpdate.value > 1000) { // Increased throttle to 1s for better performance
-                    lastTokenUpdate.value = now;
-                    // Use fast estimation during streaming (4 chars ≈ 1 token)
-                    // This is ~70% faster than tiktoken encoding
-                    const estimatedOutputTokens = Math.floor(accumulatedContent.length / 4) +
-                        (accumulatedMessage.tool_calls
-                            ? Math.floor(JSON.stringify(accumulatedMessage.tool_calls).length / 4)
-                            : 0);
-                    totalOutputTokens.value = estimatedOutputTokens;
+            // Track usage if available and emit accurate final token count
+            if (usageData) {
+                const tracker = getUsageTracker();
+                tracker.trackUsage(this.llmClient.getCurrentModel(), usageData);
+                // Emit accurate token count from API usage data (replaces estimation)
+                const totalTokens = usageData.total_tokens;
+                const completionTokens = usageData.completion_tokens;
+                if (totalTokens) {
+                    totalOutputTokens.value = completionTokens || 0;
                     yield {
                         type: "token_count",
-                        tokenCount: inputTokens + estimatedOutputTokens,
+                        tokenCount: totalTokens,
                     };
                 }
             }
+            // CRITICAL: Yield the accumulated result so the main loop can access it!
+            const result = { accumulated: accumulatedMessage, content: accumulatedContent, yielded: toolCallsYielded };
+            yield result;
+            return result;
         }
-        // Track usage if available and emit accurate final token count
-        if (usageData) {
-            const tracker = getUsageTracker();
-            tracker.trackUsage(this.llmClient.getCurrentModel(), usageData);
-            // Emit accurate token count from API usage data (replaces estimation)
-            const totalTokens = usageData.total_tokens;
-            const completionTokens = usageData.completion_tokens;
-            if (totalTokens) {
-                totalOutputTokens.value = completionTokens || 0;
-                yield {
-                    type: "token_count",
-                    tokenCount: totalTokens,
-                };
+        finally {
+            // CRITICAL FIX: Properly close the async iterator to release HTTP connections and buffers
+            // This prevents socket leaks when streams are cancelled or errors occur
+            if (typeof stream.return === 'function') {
+                try {
+                    await stream.return();
+                }
+                catch (cleanupError) {
+                    // Log but don't throw - cleanup errors shouldn't break the flow
+                    console.warn('Stream cleanup warning:', cleanupError);
+                }
             }
         }
-        // CRITICAL: Yield the accumulated result so the main loop can access it!
-        const result = { accumulated: accumulatedMessage, content: accumulatedContent, yielded: toolCallsYielded };
-        yield result;
-        return result;
     }
     /**
      * Add assistant message to history and conversation
@@ -1485,6 +1655,27 @@ export class LLMAgent extends EventEmitter {
                 return { success: false, error: parseResult.error };
             }
             const args = parseResult.args;
+            // Check if tool approval is required (for VSCode integration)
+            if (this.requireToolApproval) {
+                // Only require approval for file modification operations
+                const needsApproval = toolCall.function.name === "create_file" ||
+                    toolCall.function.name === "str_replace_editor" ||
+                    toolCall.function.name === "insert_text";
+                if (needsApproval) {
+                    // Emit event and wait for approval
+                    const approved = await this.waitForToolApproval(toolCall);
+                    if (!approved) {
+                        // User rejected the change
+                        this.emit('tool:rejected', toolCall);
+                        return {
+                            success: false,
+                            error: 'Change rejected by user'
+                        };
+                    }
+                    // User approved
+                    this.emit('tool:approved', toolCall);
+                }
+            }
             // Helper to safely get string argument with validation
             const getString = (key, required = true) => {
                 const value = args[key];
@@ -1724,6 +1915,9 @@ export class LLMAgent extends EventEmitter {
             // Safely preserve system message if it exists
             const systemMessage = this.messages.length > 0 ? this.messages[0] : null;
             this.messages = systemMessage ? [systemMessage] : [];
+            // CRITICAL FIX: Track tool calls to validate tool results
+            // Prevents API errors from orphaned tool results without corresponding tool calls
+            const toolCallIds = new Set();
             for (const entry of conversationState) {
                 if (entry.type === 'user') {
                     this.messages.push({
@@ -1732,6 +1926,14 @@ export class LLMAgent extends EventEmitter {
                     });
                 }
                 else if (entry.type === 'assistant') {
+                    // Track tool call IDs from assistant messages
+                    if (entry.toolCalls && Array.isArray(entry.toolCalls)) {
+                        for (const toolCall of entry.toolCalls) {
+                            if (toolCall?.id) {
+                                toolCallIds.add(toolCall.id);
+                            }
+                        }
+                    }
                     this.messages.push({
                         role: 'assistant',
                         content: entry.content,
@@ -1739,11 +1941,18 @@ export class LLMAgent extends EventEmitter {
                     });
                 }
                 else if (entry.type === 'tool_result' && entry.toolCall) {
-                    this.messages.push({
-                        role: 'tool',
-                        content: entry.content,
-                        tool_call_id: entry.toolCall.id,
-                    });
+                    // CRITICAL FIX: Only add tool result if corresponding tool call exists
+                    // This prevents "tool message without corresponding tool call" API errors
+                    if (toolCallIds.has(entry.toolCall.id)) {
+                        this.messages.push({
+                            role: 'tool',
+                            content: entry.content,
+                            tool_call_id: entry.toolCall.id,
+                        });
+                    }
+                    else {
+                        console.warn(`Skipping orphaned tool result for tool_call_id: ${entry.toolCall.id}`);
+                    }
                 }
             }
             this.emit('system', `Conversation rewound to checkpoint ${checkpointId}`);
@@ -1890,7 +2099,6 @@ export class LLMAgent extends EventEmitter {
      */
     checkDisposed() {
         if (this.disposed) {
-            const { SDKError, SDKErrorCode } = require('../sdk/errors.js');
             throw new SDKError(SDKErrorCode.AGENT_DISPOSED, 'Agent has been disposed and cannot be used. Create a new agent instance.');
         }
     }
@@ -1927,17 +2135,29 @@ export class LLMAgent extends EventEmitter {
         this.disposed = true;
         // Remove all event listeners to prevent memory leaks
         this.removeAllListeners();
+        // CRITICAL FIX: Remove event listeners from contextManager to prevent memory leak
+        // The 'before_prune' listener was registered in constructor (line 188) but never removed
+        this.contextManager.removeAllListeners('before_prune');
         // Dispose tools that have cleanup methods
         this.bash.dispose();
         // Clear in-memory caches
         this.recentToolCalls.clear();
         this.toolCallIndexMap.clear();
         this.toolCallArgsCache.clear();
+        // BUG FIX: Clear all pending tool approval timeouts to prevent memory leaks
+        // These timers would otherwise keep running for up to 5 minutes after dispose
+        for (const timeout of this.toolApprovalTimeouts.values()) {
+            clearTimeout(timeout);
+        }
+        this.toolApprovalTimeouts.clear();
+        this.toolApprovalCallbacks.clear();
         // Clear conversation history to free memory
         this.chatHistory = [];
         this.messages = [];
-        // Dispose token counter and context manager
-        this.tokenCounter.dispose();
+        // Dispose context manager (tokenCounter is a singleton, don't dispose)
+        // CRITICAL FIX: tokenCounter is obtained via getTokenCounter() which returns
+        // a shared singleton instance. Disposing it would break other agent instances
+        // using the same model. The singleton manages its own lifecycle.
         this.contextManager.dispose();
         // Abort any in-flight requests
         if (this.abortController) {