npm - mstro-app - Versions diffs - 0.1.58 → 0.2.0 - Mend

mstro-app 0.1.58 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (100) hide show

package/bin/commands/login.js +27 -14
package/bin/commands/logout.js +35 -1
package/bin/commands/status.js +1 -1
package/bin/mstro.js +5 -108
package/dist/server/cli/headless/claude-invoker.d.ts.map +1 -1
package/dist/server/cli/headless/claude-invoker.js +432 -103
package/dist/server/cli/headless/claude-invoker.js.map +1 -1
package/dist/server/cli/headless/index.d.ts +2 -1
package/dist/server/cli/headless/index.d.ts.map +1 -1
package/dist/server/cli/headless/index.js +2 -0
package/dist/server/cli/headless/index.js.map +1 -1
package/dist/server/cli/headless/prompt-utils.d.ts +5 -8
package/dist/server/cli/headless/prompt-utils.d.ts.map +1 -1
package/dist/server/cli/headless/prompt-utils.js +40 -5
package/dist/server/cli/headless/prompt-utils.js.map +1 -1
package/dist/server/cli/headless/runner.d.ts +1 -1
package/dist/server/cli/headless/runner.d.ts.map +1 -1
package/dist/server/cli/headless/runner.js +29 -7
package/dist/server/cli/headless/runner.js.map +1 -1
package/dist/server/cli/headless/stall-assessor.d.ts +77 -1
package/dist/server/cli/headless/stall-assessor.d.ts.map +1 -1
package/dist/server/cli/headless/stall-assessor.js +336 -20
package/dist/server/cli/headless/stall-assessor.js.map +1 -1
package/dist/server/cli/headless/tool-watchdog.d.ts +67 -0
package/dist/server/cli/headless/tool-watchdog.d.ts.map +1 -0
package/dist/server/cli/headless/tool-watchdog.js +296 -0
package/dist/server/cli/headless/tool-watchdog.js.map +1 -0
package/dist/server/cli/headless/types.d.ts +80 -1
package/dist/server/cli/headless/types.d.ts.map +1 -1
package/dist/server/cli/improvisation-session-manager.d.ts +109 -2
package/dist/server/cli/improvisation-session-manager.d.ts.map +1 -1
package/dist/server/cli/improvisation-session-manager.js +737 -132
package/dist/server/cli/improvisation-session-manager.js.map +1 -1
package/dist/server/index.js +5 -10
package/dist/server/index.js.map +1 -1
package/dist/server/mcp/bouncer-integration.d.ts.map +1 -1
package/dist/server/mcp/bouncer-integration.js +18 -0
package/dist/server/mcp/bouncer-integration.js.map +1 -1
package/dist/server/mcp/security-audit.d.ts +2 -2
package/dist/server/mcp/security-audit.d.ts.map +1 -1
package/dist/server/mcp/security-audit.js +12 -8
package/dist/server/mcp/security-audit.js.map +1 -1
package/dist/server/mcp/security-patterns.d.ts.map +1 -1
package/dist/server/mcp/security-patterns.js +9 -4
package/dist/server/mcp/security-patterns.js.map +1 -1
package/dist/server/routes/improvise.js +6 -6
package/dist/server/routes/improvise.js.map +1 -1
package/dist/server/services/analytics.d.ts +2 -0
package/dist/server/services/analytics.d.ts.map +1 -1
package/dist/server/services/analytics.js +13 -3
package/dist/server/services/analytics.js.map +1 -1
package/dist/server/services/platform.d.ts.map +1 -1
package/dist/server/services/platform.js +4 -9
package/dist/server/services/platform.js.map +1 -1
package/dist/server/services/sandbox-utils.d.ts +6 -0
package/dist/server/services/sandbox-utils.d.ts.map +1 -0
package/dist/server/services/sandbox-utils.js +72 -0
package/dist/server/services/sandbox-utils.js.map +1 -0
package/dist/server/services/settings.d.ts +6 -0
package/dist/server/services/settings.d.ts.map +1 -1
package/dist/server/services/settings.js +21 -0
package/dist/server/services/settings.js.map +1 -1
package/dist/server/services/terminal/pty-manager.d.ts +3 -51
package/dist/server/services/terminal/pty-manager.d.ts.map +1 -1
package/dist/server/services/terminal/pty-manager.js +14 -100
package/dist/server/services/terminal/pty-manager.js.map +1 -1
package/dist/server/services/websocket/handler.d.ts +36 -15
package/dist/server/services/websocket/handler.d.ts.map +1 -1
package/dist/server/services/websocket/handler.js +452 -223
package/dist/server/services/websocket/handler.js.map +1 -1
package/dist/server/services/websocket/types.d.ts +6 -2
package/dist/server/services/websocket/types.d.ts.map +1 -1
package/hooks/bouncer.sh +11 -4
package/package.json +4 -1
package/server/cli/headless/claude-invoker.ts +602 -119
package/server/cli/headless/index.ts +7 -1
package/server/cli/headless/prompt-utils.ts +37 -5
package/server/cli/headless/runner.ts +30 -8
package/server/cli/headless/stall-assessor.ts +453 -22
package/server/cli/headless/tool-watchdog.ts +390 -0
package/server/cli/headless/types.ts +84 -1
package/server/cli/improvisation-session-manager.ts +884 -143
package/server/index.ts +5 -10
package/server/mcp/bouncer-integration.ts +28 -0
package/server/mcp/security-audit.ts +12 -8
package/server/mcp/security-patterns.ts +8 -2
package/server/routes/improvise.ts +6 -6
package/server/services/analytics.ts +13 -3
package/server/services/platform.test.ts +0 -10
package/server/services/platform.ts +4 -10
package/server/services/sandbox-utils.ts +78 -0
package/server/services/settings.ts +25 -0
package/server/services/terminal/pty-manager.ts +16 -127
package/server/services/websocket/handler.ts +515 -251
package/server/services/websocket/types.ts +10 -4
package/dist/server/services/terminal/tmux-manager.d.ts +0 -82
package/dist/server/services/terminal/tmux-manager.d.ts.map +0 -1
package/dist/server/services/terminal/tmux-manager.js +0 -352
package/dist/server/services/terminal/tmux-manager.js.map +0 -1
package/server/services/terminal/tmux-manager.ts +0 -426

package/server/cli/headless/tool-watchdog.ts ADDED Viewed

@@ -0,0 +1,390 @@
+// Copyright (c) 2025-present Mstro, Inc. All rights reserved.
+// Licensed under the MIT License. See LICENSE file for details.
+/**
+ * Tool Watchdog
+ *
+ * Per-tool adaptive timeout system using TCP RTO-style EMA tracking (RFC 6298).
+ * Monitors individual tool call durations and kills tools that exceed their
+ * adaptive timeout, preserving work via checkpoint-and-retry.
+ *
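+ * Three-tier timeout strategy:
+ * 1. EMA tracking: timeout = estimatedDuration + 4 * deviation (adaptive profiles with at least one sample)
+ * 2. Floor/ceiling bounds: the adaptive timeout is clamped to [floorMs, ceilingMs]; cold starts and non-adaptive profiles use coldStartMs as-is
+ * 3. Haiku tiebreaker: optional one-time AI assessment before killing; an "extend" verdict postpones the kill by the granted extension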
+ */
+import type {
+  ExecutionCheckpoint,
+  ToolDurationTracker,
+  ToolTimeoutProfile,
+  ToolUseAccumulator,
+} from './types.js';
+// RFC 6298 smoothing constants (consumed by ToolWatchdog.recordCompletion / getTimeout)
+const ALPHA = 0.125;  // weight of the newest sample in the duration EMA (1/8)
+const BETA = 0.25;    // weight of the newest |sample - estimate| in the deviation EMA (1/4)
+const DEVIATION_MULTIPLIER = 4;  // timeout = est + 4*dev (same as TCP)
+/**
+ * Default timeout profiles per tool type.
+ *
+ * Keys are tool names as passed to ToolWatchdog.getProfile(); names without an
+ * entry fall back to DEFAULT_TOOL_TIMEOUT_PROFILE. For profiles with
+ * `useAdaptive: false`, ToolWatchdog.getTimeout() returns `coldStartMs`
+ * directly and does not consult `floorMs` / `ceilingMs`.
+ */
+export const DEFAULT_TOOL_TIMEOUT_PROFILES: Record<string, ToolTimeoutProfile> = {
+  WebFetch: {
+    coldStartMs: 180_000,      // 3 min — accounts for slow sites + Haiku inference
+    floorMs: 120_000,          // 2 min absolute minimum
+    ceilingMs: 300_000,        // 5 min hard cap
+    useAdaptive: true,
+    useHaikuTiebreaker: true,
+  },
+  WebSearch: {
+    coldStartMs: 90_000,       // 1.5 min
+    floorMs: 60_000,           // 1 min minimum
+    ceilingMs: 180_000,        // 3 min hard cap
+    useAdaptive: true,
+    useHaikuTiebreaker: false,
+  },
+  Task: {
+    coldStartMs: 900_000,      // 15 min — subagents are inherently long-running
+    floorMs: 600_000,          // 10 min minimum (research agents routinely take 7-10 min)
+    ceilingMs: 2_700_000,      // 45 min hard cap
+    useAdaptive: true,         // learn from past Task durations via EMA
+    useHaikuTiebreaker: true,
+  },
+  Bash: {
+    coldStartMs: 300_000,      // 5 min — the effective timeout, since useAdaptive is false
+    floorMs: 120_000,          // 2 min minimum
+    ceilingMs: 600_000,        // 10 min hard cap
+    useAdaptive: false,
+    useHaikuTiebreaker: true,
+  },
+  // Local filesystem tools — adaptive EMA learns actual durations, short cold starts
+  Read: {
+    coldStartMs: 60_000,       // 1 min — local reads should be fast
+    floorMs: 15_000,           // 15s minimum
+    ceilingMs: 300_000,        // 5 min ceiling (large files, slow mounts)
+    useAdaptive: true,
+    useHaikuTiebreaker: false, // local ops don't need AI assessment
+  },
+  Grep: {
+    coldStartMs: 60_000,
+    floorMs: 15_000,
+    ceilingMs: 300_000,
+    useAdaptive: true,
+    useHaikuTiebreaker: false,
+  },
+  Glob: {
+    coldStartMs: 30_000,       // 30s — pattern matching is fast
+    floorMs: 10_000,
+    ceilingMs: 120_000,
+    useAdaptive: true,
+    useHaikuTiebreaker: false,
+  },
+  Edit: {
+    coldStartMs: 30_000,
+    floorMs: 10_000,
+    ceilingMs: 120_000,
+    useAdaptive: true,
+    useHaikuTiebreaker: false,
+  },
+  Write: {
+    coldStartMs: 30_000,
+    floorMs: 10_000,
+    ceilingMs: 120_000,
+    useAdaptive: true,
+    useHaikuTiebreaker: false,
+  },
+};
+/**
+ * Fallback profile for tool names that have no entry in the profile table.
+ * Also used as the merge base when a caller supplies a partial profile for a
+ * tool that has no default. Non-adaptive, so the effective timeout is coldStartMs.
+ */
+const DEFAULT_TOOL_TIMEOUT_PROFILE: ToolTimeoutProfile = {
+  coldStartMs: 300_000,
+  floorMs: 120_000,
+  ceilingMs: 600_000,
+  useAdaptive: false,
+  useHaikuTiebreaker: true,
+};
+/** Construction options for ToolWatchdog; every field is optional. */
+export interface ToolWatchdogOptions {
+  /** Per-tool overrides, shallow-merged over the default profile for that tool name */
+  profiles?: Record<string, Partial<ToolTimeoutProfile>>;
+  /** When true, the watchdog logs its decisions via console.log (defaults to false) */
+  verbose?: boolean;
+  /**
+   * Called before killing — if returns 'extend', reschedule with extensionMs.
+   * Only consulted for profiles with useHaikuTiebreaker set, and at most once per watch.
+   * A rejected promise is treated as a 'kill' verdict.
+   */
+  onTiebreaker?: (toolName: string, toolInput: Record<string, unknown>, elapsedMs: number) => Promise<{ action: 'extend' | 'kill'; extensionMs: number; reason: string }>;
+}
+/** Bookkeeping for one in-flight tool call being watched */
+interface ActiveWatch {
+  /** Tool type name, used to look up the timeout profile */
+  toolName: string;
+  /** Input the tool was invoked with (forwarded to the tiebreaker and the checkpoint) */
+  toolInput: Record<string, unknown>;
+  /** Date.now() at the moment the watch was started */
+  startTime: number;
+  /** Pending kill timer; replaced when a tiebreaker extension is scheduled */
+  timer: ReturnType<typeof setTimeout>;
+  /** Timeout in ms; after an extension this becomes elapsed-at-tiebreaker + extensionMs */
+  timeoutMs: number;
+  /** Set once the tiebreaker has run so it is never consulted twice for the same watch */
+  tiebreakerAttempted: boolean;
+}
+/**
+ * Watches in-flight tool calls and invokes a caller-supplied callback when a
+ * call outlives its timeout.
+ *
+ * Timeouts come from per-tool profiles. Adaptive profiles learn from completed
+ * calls (RFC 6298-style EMA of duration and deviation) and are clamped to
+ * [floorMs, ceilingMs]; everything else uses the profile's coldStartMs.
+ * Before killing, an optional tiebreaker may grant a single extension.
+ *
+ * The watchdog never kills anything itself: it only calls `onTimeout`. The
+ * timed-out watch is intentionally left registered so buildCheckpoint() can
+ * still read it; the caller is expected to call clearAll() afterwards.
+ */
+export class ToolWatchdog {
+  private trackers: Map<string, ToolDurationTracker> = new Map();
+  private profiles: Record<string, ToolTimeoutProfile>;
+  private activeWatches: Map<string, ActiveWatch> = new Map();
+  private verbose: boolean;
+  private onTiebreaker?: ToolWatchdogOptions['onTiebreaker'];
+  /**
+   * @param options Optional profile overrides, verbosity flag and tiebreaker callback.
+   */
+  constructor(options: ToolWatchdogOptions = {}) {
+    this.verbose = options.verbose ?? false;
+    this.onTiebreaker = options.onTiebreaker;
+    // Null-prototype table: tool names are external strings, and on a plain
+    // object a name such as "constructor" or "toString" would resolve to an
+    // Object.prototype member instead of falling back to the default profile.
+    const table: Record<string, ToolTimeoutProfile> = Object.create(null);
+    Object.assign(table, DEFAULT_TOOL_TIMEOUT_PROFILES);
+    this.profiles = table;
+    // Merge user profiles with defaults
+    if (options.profiles) {
+      for (const [name, partial] of Object.entries(options.profiles)) {
+        const base = this.profiles[name] ?? DEFAULT_TOOL_TIMEOUT_PROFILE;
+        this.profiles[name] = { ...base, ...partial };
+      }
+    }
+  }
+  /**
+   * Record a tool completion — updates the EMA tracker for its type.
+   *
+   * No-op for non-adaptive profiles. Non-finite or negative durations are
+   * ignored: a single NaN sample would otherwise make every later estimate
+   * (and therefore every later timeout) NaN.
+   *
+   * @param toolName Tool type the sample belongs to.
+   * @param durationMs Observed duration of the completed call, in ms.
+   */
+  recordCompletion(toolName: string, durationMs: number): void {
+    const profile = this.getProfile(toolName);
+    if (!profile.useAdaptive) return;
+    if (!Number.isFinite(durationMs) || durationMs < 0) {
+      if (this.verbose) {
+        console.log(`[WATCHDOG] ${toolName}: ignoring invalid duration sample ${durationMs}`);
+      }
+      return;
+    }
+    const tracker = this.trackers.get(toolName);
+    if (!tracker) {
+      // First sample (RFC 6298 §2.2): estimate = R, deviation = R/2
+      this.trackers.set(toolName, {
+        estimatedDuration: durationMs,
+        deviation: durationMs / 2,
+        sampleCount: 1,
+      });
+      if (this.verbose) {
+        console.log(`[WATCHDOG] ${toolName}: first sample ${durationMs}ms, initial timeout ${this.getTimeout(toolName)}ms`);
+      }
+      return;
+    }
+    // RFC 6298 update — deviation first, because it uses the previous estimate
+    tracker.deviation = (1 - BETA) * tracker.deviation + BETA * Math.abs(durationMs - tracker.estimatedDuration);
+    tracker.estimatedDuration = (1 - ALPHA) * tracker.estimatedDuration + ALPHA * durationMs;
+    tracker.sampleCount++;
+    if (this.verbose) {
+      console.log(`[WATCHDOG] ${toolName}: sample #${tracker.sampleCount} ${durationMs}ms, est=${Math.round(tracker.estimatedDuration)}ms, dev=${Math.round(tracker.deviation)}ms, timeout=${this.getTimeout(toolName)}ms`);
+    }
+  }
+  /**
+   * Compute the current timeout for a tool type.
+   *
+   * @returns coldStartMs for non-adaptive profiles or when no sample has been
+   *   recorded yet; otherwise est + 4*dev clamped to [floorMs, ceilingMs].
+   */
+  getTimeout(toolName: string): number {
+    const profile = this.getProfile(toolName);
+    if (!profile.useAdaptive) return profile.coldStartMs;
+    const tracker = this.trackers.get(toolName);
+    if (!tracker || tracker.sampleCount < 1) return profile.coldStartMs;
+    const adaptive = tracker.estimatedDuration + DEVIATION_MULTIPLIER * tracker.deviation;
+    return Math.max(profile.floorMs, Math.min(profile.ceilingMs, adaptive));
+  }
+  /** Get the profile for a tool (with fallback to default) */
+  getProfile(toolName: string): ToolTimeoutProfile {
+    return this.profiles[toolName] ?? DEFAULT_TOOL_TIMEOUT_PROFILE;
+  }
+  /**
+   * Start watching a tool call. Any existing watch with the same ID is replaced.
+   *
+   * @param toolId Unique ID of this tool call.
+   * @param toolName Tool type, used to pick the timeout profile.
+   * @param toolInput Input of the call (forwarded to the tiebreaker / checkpoint).
+   * @param onTimeout Invoked when the call is judged hung.
+   */
+  startWatch(toolId: string, toolName: string, toolInput: Record<string, unknown>, onTimeout: () => void): void {
+    // Clear any existing watch for this ID
+    this.clearWatch(toolId);
+    const timeoutMs = this.getTimeout(toolName);
+    const profile = this.getProfile(toolName);
+    if (this.verbose) {
+      console.log(`[WATCHDOG] Starting watch: ${toolName} (${toolId}), timeout=${Math.round(timeoutMs / 1000)}s`);
+    }
+    const timer = setTimeout(async () => {
+      const extended = await this.handleTimeoutWithTiebreaker(toolId, toolName, toolInput, profile, onTimeout);
+      if (!extended) {
+        // Don't delete the watch here — buildCheckpoint() needs it.
+        // handleToolTimeout() calls clearAll() after building the checkpoint.
+        onTimeout();
+      }
+    }, timeoutMs);
+    this.activeWatches.set(toolId, {
+      toolName,
+      toolInput,
+      startTime: Date.now(),
+      timer,
+      timeoutMs,
+      tiebreakerAttempted: false,
+    });
+  }
+  /**
+   * Handle timeout expiry: attempt tiebreaker if configured.
+   *
+   * @returns true when the caller must NOT fire onTimeout (the watch is gone
+   *   or an extension was scheduled); false when the tool should be killed now.
+   */
+  private async handleTimeoutWithTiebreaker(
+    toolId: string,
+    toolName: string,
+    toolInput: Record<string, unknown>,
+    profile: ToolTimeoutProfile,
+    onTimeout: () => void,
+  ): Promise<boolean> {
+    const watch = this.activeWatches.get(toolId);
+    if (!watch) return true;
+    const elapsedMs = Date.now() - watch.startTime;
+    if (!profile.useHaikuTiebreaker || !this.onTiebreaker || watch.tiebreakerAttempted) {
+      if (this.verbose) {
+        console.log(`[WATCHDOG] ${toolName} (${toolId}) timed out after ${Math.round(elapsedMs / 1000)}s, killing`);
+      }
+      return false;
+    }
+    return this.runTiebreaker(watch, toolId, toolName, toolInput, elapsedMs, onTimeout);
+  }
+  /**
+   * Execute the Haiku tiebreaker and reschedule if extended.
+   *
+   * The tiebreaker is asynchronous, so the tool may finish (clearWatch /
+   * clearAll) or be re-registered under the same ID while it is pending. In
+   * that case the verdict is stale and must not trigger a kill.
+   *
+   * @returns true when no kill should happen now (extended, or the watch is no
+   *   longer current); false when the tool should be killed.
+   */
+  private async runTiebreaker(
+    watch: ActiveWatch,
+    toolId: string,
+    toolName: string,
+    toolInput: Record<string, unknown>,
+    elapsedMs: number,
+    onTimeout: () => void,
+  ): Promise<boolean> {
+    const tiebreaker = this.onTiebreaker;
+    if (!tiebreaker) return false;
+    watch.tiebreakerAttempted = true;
+    if (this.verbose) {
+      console.log(`[WATCHDOG] ${toolName} (${toolId}) hit timeout after ${Math.round(elapsedMs / 1000)}s, running tiebreaker...`);
+    }
+    let verdict: { action: 'extend' | 'kill'; extensionMs: number; reason: string } | undefined;
+    let failure: unknown;
+    try {
+      verdict = await tiebreaker(toolName, toolInput, elapsedMs);
+    } catch (err) {
+      failure = err;
+    }
+    // Stale-verdict guard: only act if this exact watch is still registered.
+    if (this.activeWatches.get(toolId) !== watch) {
+      if (this.verbose) {
+        console.log(`[WATCHDOG] ${toolName} (${toolId}) finished while tiebreaker was running, ignoring verdict`);
+      }
+      return true;
+    }
+    if (!verdict) {
+      if (this.verbose) {
+        console.log(`[WATCHDOG] Tiebreaker failed: ${failure}, proceeding with kill`);
+      }
+      return false;
+    }
+    if (verdict.action === 'extend') {
+      // A non-finite or non-positive extension would make setTimeout fire
+      // immediately; treat it as a kill rather than scheduling a useless timer.
+      if (Number.isFinite(verdict.extensionMs) && verdict.extensionMs > 0) {
+        if (this.verbose) {
+          console.log(`[WATCHDOG] Tiebreaker: extend ${toolName} by ${Math.round(verdict.extensionMs / 1000)}s — ${verdict.reason}`);
+        }
+        this.scheduleExtensionTimeout(watch, toolId, toolName, verdict.extensionMs, onTimeout);
+        watch.timeoutMs = elapsedMs + verdict.extensionMs;
+        return true;
+      }
+      if (this.verbose) {
+        console.log(`[WATCHDOG] Tiebreaker: invalid extension ${verdict.extensionMs}ms for ${toolName}, proceeding with kill`);
+      }
+      return false;
+    }
+    if (this.verbose) {
+      console.log(`[WATCHDOG] Tiebreaker: kill ${toolName} — ${verdict.reason}`);
+    }
+    return false;
+  }
+  /** Schedule a post-extension timeout that kills without another tiebreaker */
+  private scheduleExtensionTimeout(
+    watch: ActiveWatch,
+    toolId: string,
+    toolName: string,
+    extensionMs: number,
+    onTimeout: () => void,
+  ): void {
+    watch.timer = setTimeout(() => {
+      // Only fire for the watch this extension was granted to; a different
+      // watch registered later under the same ID has its own timer.
+      if (this.activeWatches.get(toolId) !== watch) return;
+      if (this.verbose) {
+        console.log(`[WATCHDOG] ${toolName} (${toolId}) still running after extension, killing`);
+      }
+      // Don't delete the watch — buildCheckpoint() needs it.
+      // handleToolTimeout() calls clearAll() after building the checkpoint.
+      onTimeout();
+    }, extensionMs);
+  }
+  /** Stop watching a tool (it completed normally) */
+  clearWatch(toolId: string): void {
+    const watch = this.activeWatches.get(toolId);
+    if (watch) {
+      clearTimeout(watch.timer);
+      this.activeWatches.delete(toolId);
+    }
+  }
+  /** Clear all active watches (process ending) */
+  clearAll(): void {
+    for (const watch of this.activeWatches.values()) {
+      clearTimeout(watch.timer);
+    }
+    this.activeWatches.clear();
+  }
+  /** Get the active watch for a tool ID (for checkpoint building) */
+  getActiveWatch(toolId: string): ActiveWatch | undefined {
+    return this.activeWatches.get(toolId);
+  }
+  /** Get all active watches (the live internal map, not a copy) */
+  getActiveWatches(): Map<string, ActiveWatch> {
+    return this.activeWatches;
+  }
+  /**
+   * Build an ExecutionCheckpoint from the current state.
+   *
+   * @param originalPrompt Prompt the execution was started with.
+   * @param assistantText Assistant output accumulated so far.
+   * @param thinkingText Thinking output accumulated so far.
+   * @param accumulatedToolUse All tool calls seen so far, with results where available.
+   * @param hungToolId ID of the tool call that timed out.
+   * @param claudeSessionId Session ID, if known.
+   * @param processStartTime Date.now()-style timestamp of process start; used for elapsedMs.
+   * @returns The checkpoint, or null when `hungToolId` has no active watch
+   *   (e.g. it was already cleared).
+   */
+  buildCheckpoint(
+    originalPrompt: string,
+    assistantText: string,
+    thinkingText: string,
+    accumulatedToolUse: ToolUseAccumulator[],
+    hungToolId: string,
+    claudeSessionId: string | undefined,
+    processStartTime: number,
+  ): ExecutionCheckpoint | null {
+    const hungWatch = this.activeWatches.get(hungToolId);
+    if (!hungWatch) return null;
+    // Find the matching tool entry
+    const hungToolEntry = accumulatedToolUse.find(t => t.toolId === hungToolId);
+    // Build completed tools list (exclude the hung one)
+    const completedTools = accumulatedToolUse
+      .filter(t => t.toolId !== hungToolId && t.result !== undefined)
+      .map(t => ({
+        toolName: t.toolName,
+        toolId: t.toolId,
+        input: t.toolInput,
+        result: t.result || '',
+        isError: t.isError || false,
+        durationMs: t.duration || 0,
+      }));
+    // Build in-progress tools list (started but no result, excluding the hung one)
+    const inProgressTools = accumulatedToolUse
+      .filter(t => t.toolId !== hungToolId && t.result === undefined)
+      .map(t => ({
+        toolName: t.toolName,
+        toolId: t.toolId,
+        input: t.toolInput,
+      }));
+    // Extract URL from tool input if WebFetch/WebSearch.
+    // Prefer the accumulated entry's input; fall back to what the watch captured.
+    let url: string | undefined;
+    const toolInput = hungToolEntry?.toolInput || hungWatch.toolInput;
+    if (toolInput.url) {
+      url = String(toolInput.url);
+    } else if (toolInput.query) {
+      // Search-style tools carry a query instead of a URL; it is stored in the same field
+      url = String(toolInput.query);
+    }
+    return {
+      originalPrompt,
+      assistantText,
+      thinkingText,
+      completedTools,
+      inProgressTools,
+      hungTool: {
+        toolName: hungWatch.toolName,
+        toolId: hungToolId,
+        input: toolInput,
+        timeoutMs: hungWatch.timeoutMs,
+        url,
+      },
+      claudeSessionId,
+      elapsedMs: Date.now() - processStartTime,
+    };
+  }
+}

package/server/cli/headless/types.ts CHANGED Viewed

@@ -33,6 +33,57 @@ export interface ImageAttachment {
   mimeType?: string;      // MIME type (e.g., "image/png")
 }
+/** Per-tool-type timeout configuration with adaptive tracking */
+export interface ToolTimeoutProfile {
+  /** Timeout used when no prior samples exist, and always when useAdaptive is false (ms) */
+  coldStartMs: number;
+  /** Lower clamp applied to the adaptive timeout (ms); not applied to coldStartMs */
+  floorMs: number;
+  /** Upper clamp applied to the adaptive timeout (ms); a tiebreaker extension is added on top of the computed timeout */
+  ceilingMs: number;
+  /** Track EMA of past durations and adapt timeout dynamically */
+  useAdaptive: boolean;
+  /** Consult the tiebreaker callback (a Haiku assessment) once before killing */
+  useHaikuTiebreaker: boolean;
+}
+/** Snapshot of execution state at the moment a tool times out */
+export interface ExecutionCheckpoint {
+  /** Prompt the execution was started with */
+  originalPrompt: string;
+  /** Assistant text produced before the timeout */
+  assistantText: string;
+  /** Thinking text produced before the timeout */
+  thinkingText: string;
+  /** Tools that had already returned a result (the hung tool is never included) */
+  completedTools: Array<{
+    toolName: string;
+    toolId: string;
+    input: Record<string, unknown>;
+    /** Tool result; empty string when the recorded result was empty */
+    result: string;
+    isError: boolean;
+    /** Recorded duration in ms; 0 when none was recorded */
+    durationMs: number;
+  }>;
+  /** Tools that were still running (not the hung tool) when the process was killed */
+  inProgressTools: Array<{
+    toolName: string;
+    toolId: string;
+    input: Record<string, unknown>;
+  }>;
+  /** The tool call whose watch expired */
+  hungTool: {
+    toolName: string;
+    toolId: string;
+    input: Record<string, unknown>;
+    /** Timeout that applied to this call, including any tiebreaker extension (ms) */
+    timeoutMs: number;
+    /** input.url if present, otherwise input.query, stringified; undefined when neither is set */
+    url?: string;
+  };
+  claudeSessionId?: string;
+  /** Wall-clock time since process start when the checkpoint was built (ms) */
+  elapsedMs: number;
+}
+/** EMA tracker for a single tool type's completion times */
+export interface ToolDurationTracker {
+  /** Smoothed estimate of the tool's duration (ms) */
+  estimatedDuration: number;
+  /** Smoothed absolute deviation of samples from the estimate (ms) */
+  deviation: number;
+  /** Number of completion samples folded into the estimate so far */
+  sampleCount: number;
+}
 export interface HeadlessConfig {
   workingDir: string;
   tokenBudgetThreshold: number;
@@ -58,6 +109,16 @@ export interface HeadlessConfig {
   stallHardCapMs?: number;     // Absolute wall-clock kill cap (default: 3600000 = 60 min)
   /** Claude model for main execution (e.g., 'opus', 'sonnet'). 'default' = no --model flag. */
   model?: string;
+  /** Per-tool timeout profiles (merge with defaults) */
+  toolTimeoutProfiles?: Record<string, Partial<ToolTimeoutProfile>>;
+  /** Enable per-tool adaptive timeout watchdog (default: true) */
+  enableToolWatchdog?: boolean;
+  /** Max auto-retries on tool timeout (default: 2) */
+  maxAutoRetries?: number;
+  /** Called when a tool times out with checkpoint data */
+  onToolTimeout?: (checkpoint: ExecutionCheckpoint) => void;
+  /** When true, spawn Claude with sanitized env (strips secrets, HOME=workingDir) */
+  sandboxed?: boolean;
 }
 export interface SessionState {
@@ -92,6 +153,14 @@ export interface SessionResult {
     duration?: number;
   }>;
   claudeSessionId?: string;
+  /** Number of Claude Code native tool timeouts detected during this execution */
+  nativeTimeoutCount?: number;
+  /** Assistant text buffered after native timeouts — not yet shown to user.
+   *  Flush to output if context is OK, discard if context was lost and recovery starts. */
+  postTimeoutOutput?: string;
+  /** Assistant text buffered during resume assessment — held back until thinking/tool activity
+   *  confirms Claude has context. Undefined when not in resume mode or buffer was flushed. */
+  resumeBufferedOutput?: string;
 }
 export interface ToolUseAccumulator {
@@ -104,6 +173,9 @@ export interface ToolUseAccumulator {
   duration?: number;
 }
+/** Currently pending tools (started but not yet returned), keyed by toolId with the toolName as value */
+export type PendingToolMap = Map<string, string>;
 export interface ExecutionResult {
   output: string;
   error?: string;
@@ -112,10 +184,18 @@ export interface ExecutionResult {
   thinkingOutput?: string;
   toolUseHistory?: ToolUseAccumulator[];
   claudeSessionId?: string;
+  /** Number of Claude Code native tool timeouts detected during this execution */
+  nativeTimeoutCount?: number;
+  /** Assistant text buffered after native timeouts — not yet sent to outputCallback.
+   *  The session manager should flush this to the client if context is OK, or discard if recovering. */
+  postTimeoutOutput?: string;
+  /** Assistant text buffered during resume assessment — held back until thinking/tool activity
+   *  confirms Claude has context. Undefined when not in resume mode or buffer was flushed. */
+  resumeBufferedOutput?: string;
 }
 /** Resolved config with all defaults applied */
-export type ResolvedHeadlessConfig = Omit<Required<HeadlessConfig>, 'outputCallback' | 'thinkingCallback' | 'toolUseCallback' | 'continueSession' | 'claudeSessionId' | 'imageAttachments' | 'model'> & {
+export type ResolvedHeadlessConfig = Omit<Required<HeadlessConfig>, 'outputCallback' | 'thinkingCallback' | 'toolUseCallback' | 'continueSession' | 'claudeSessionId' | 'imageAttachments' | 'model' | 'toolTimeoutProfiles' | 'onToolTimeout' | 'sandboxed'> & {
   outputCallback?: (text: string) => void;
   thinkingCallback?: (text: string) => void;
   toolUseCallback?: (event: ToolUseEvent) => void;
@@ -123,4 +203,7 @@ export type ResolvedHeadlessConfig = Omit<Required<HeadlessConfig>, 'outputCallb
   claudeSessionId?: string;
   imageAttachments?: ImageAttachment[];
   model?: string;
+  toolTimeoutProfiles?: Record<string, Partial<ToolTimeoutProfile>>;
+  onToolTimeout?: (checkpoint: ExecutionCheckpoint) => void;
+  sandboxed?: boolean;
 };