npm - @runtypelabs/cli - Versions diffs - 2.0.2 → 2.2.0 - Mend

@runtypelabs/cli 2.0.2 → 2.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4)

package/dist/index.js (CHANGED)

@@ -8469,8 +8469,12 @@ function setStoredToolPayloadField(payloads, toolId, field, value) {
   const next = { ...payloads.get(toolId) ?? {} };
   if (value === void 0) {
     delete next[field];
+  } else if (field === "parameters") {
+    next.parameters = value;
+  } else if (field === "result") {
+    next.result = value;
   } else {
-    next[field] = value;
+    next.streamedInput = value;
   }
   if (next.parameters === void 0 && next.result === void 0 && next.streamedInput === void 0) {
     payloads.delete(toolId);
@@ -12272,7 +12276,7 @@ import { theme as theme24 } from "@runtypelabs/ink-components";
 import { jsx as jsx25, jsxs as jsxs21 } from "react/jsx-runtime";
 var MENU_ITEMS = [
   { key: "c", label: "Copy session JSON" },
-  { key: "o", label: "Open session JSON in editor" },
+  { key: "e", label: "Open session JSON in editor" },
   { key: "f", label: "Open marathon folder in file manager" },
   { key: "d", label: "Open agent in Runtype dashboard" }
 ];
@@ -12294,7 +12298,7 @@ function SessionActionMenu({
       onCopySession();
       return;
     }
-    if (input === "o" && hasStateFile) {
+    if (input === "e" && hasStateFile) {
       onOpenStateFile();
       return;
     }
@@ -12320,7 +12324,7 @@ function SessionActionMenu({
       children: [
         /* @__PURE__ */ jsx25(Text24, { bold: true, color: theme24.accent, children: "Session" }),
         /* @__PURE__ */ jsx25(Box22, { flexDirection: "column", marginTop: 1, children: MENU_ITEMS.map((item) => {
-          const dimmed = item.key === "o" && !hasStateFile || item.key === "f" && !hasStateFile || item.key === "d" && !hasDashboard;
+          const dimmed = item.key === "e" && !hasStateFile || item.key === "f" && !hasStateFile || item.key === "d" && !hasDashboard;
           return /* @__PURE__ */ jsxs21(Text24, { children: [
             /* @__PURE__ */ jsx25(Text24, { color: dimmed ? theme24.textSubtle : theme24.accentActive, children: `  ${item.key}  ` }),
             /* @__PURE__ */ jsx25(Text24, { color: dimmed ? theme24.textSubtle : theme24.textMuted, children: item.label })
@@ -14797,6 +14801,8 @@ var NETWORK_ERROR_PATTERNS = [
   "econnrefused",
   "econnaborted",
   "etimedout",
+  "timeout",
+  "request timeout",
   "enetunreach",
   "enetdown",
   "ehostunreach",
@@ -14816,12 +14822,78 @@ var NETWORK_ERROR_PATTERNS = [
   "unable to connect",
   "err_network"
 ];
+var LOCAL_NETWORK_PATTERNS = [
+  "enetunreach",
+  "enetdown",
+  "enotfound",
+  "network error",
+  "network request failed",
+  "networkerror",
+  "err_network"
+];
+var SERVER_UNREACHABLE_PATTERNS = [
+  "econnrefused",
+  "econnreset",
+  "connection refused",
+  "connection reset",
+  "ehostunreach"
+];
+function collectErrorSignals(error, seen = /* @__PURE__ */ new Set()) {
+  if (error == null || seen.has(error)) return [];
+  if (typeof error === "string") return [error];
+  if (typeof error !== "object") return [String(error)];
+  seen.add(error);
+  const parts = [];
+  if ("message" in error && typeof error.message === "string") {
+    parts.push(error.message);
+  }
+  if ("code" in error && typeof error.code === "string") {
+    parts.push(error.code);
+  }
+  if ("cause" in error) {
+    parts.push(...collectErrorSignals(error.cause, seen));
+  }
+  return parts;
+}
+function getNetworkErrorContext(error) {
+  const signals = collectErrorSignals(error);
+  const fallbackMessage = error instanceof Error ? error.message : String(error);
+  const uniqueSignals = [...new Set(signals.map((signal) => signal.trim()).filter(Boolean))];
+  const searchText = uniqueSignals.join(" ").toLowerCase();
+  const detailMessage = uniqueSignals.find((signal) => signal.toLowerCase() !== "fetch failed") ?? fallbackMessage;
+  return {
+    searchText,
+    detailMessage
+  };
+}
+function describeNetworkError(error) {
+  const { searchText, detailMessage } = getNetworkErrorContext(error);
+  const isLocalNetwork = LOCAL_NETWORK_PATTERNS.some((p) => searchText.includes(p));
+  const isServerUnreachable = SERVER_UNREACHABLE_PATTERNS.some((p) => searchText.includes(p));
+  const isTimeout = searchText.includes("etimedout") || searchText.includes("timeout");
+  const lines = [];
+  if (isLocalNetwork) {
+    lines.push("Could not reach the Runtype API \u2014 your network appears to be offline.");
+    lines.push("Check your internet connection and try again.");
+  } else if (isServerUnreachable) {
+    lines.push("Could not reach the Runtype API \u2014 the server is not responding.");
+    lines.push("The service may be temporarily unavailable. Try again in a few minutes.");
+  } else if (isTimeout) {
+    lines.push("Could not reach the Runtype API \u2014 the request timed out.");
+    lines.push("This could be a network issue or the server may be under heavy load.");
+  } else {
+    lines.push("Could not reach the Runtype API \u2014 a network error occurred.");
+    lines.push("Check your internet connection or try again in a few minutes.");
+  }
+  lines.push(`Details: ${detailMessage}`);
+  return lines;
+}
 function isTransientNetworkError(error) {
   if (error instanceof RuntypeApiError) return false;
-  const message = error instanceof Error ? error.message.toLowerCase() : String(error).toLowerCase();
-  if (error instanceof TypeError && message.includes("fetch")) return true;
+  const { searchText } = getNetworkErrorContext(error);
+  if (error instanceof TypeError && searchText.includes("fetch")) return true;
   if (error instanceof DOMException && error.name === "AbortError") return true;
-  return NETWORK_ERROR_PATTERNS.some((pattern) => message.includes(pattern));
+  return NETWORK_ERROR_PATTERNS.some((pattern) => searchText.includes(pattern));
 }
 async function retryOnNetworkError(fn, opts = {}) {
   const maxRetries = opts.maxRetries ?? 3;
@@ -14898,9 +14970,8 @@ function describeMarathonApiError(error) {
   if (!(error instanceof Error)) {
     return ["Task failed: Unknown error"];
   }
-  if (!(error instanceof RuntypeApiError) || error.statusCode !== 429) {
-    const message = error instanceof Error ? error.message : "Unknown error";
-    return [`Task failed: ${message}`];
+  if (isTransientNetworkError(error)) {
+    return describeNetworkError(error);
   }
   return [`Task failed: ${error.message}`];
 }
@@ -15311,7 +15382,9 @@ function extractRunTaskResumeState(state) {
     ...sanitized.bestCandidateNeedsVerification ? { bestCandidateNeedsVerification: sanitized.bestCandidateNeedsVerification } : {},
     ...sanitized.bestCandidateVerified ? { bestCandidateVerified: sanitized.bestCandidateVerified } : {},
     ...sanitized.verificationRequired !== void 0 ? { verificationRequired: sanitized.verificationRequired } : {},
-    ...sanitized.lastVerificationPassed ? { lastVerificationPassed: sanitized.lastVerificationPassed } : {}
+    ...sanitized.lastVerificationPassed ? { lastVerificationPassed: sanitized.lastVerificationPassed } : {},
+    ...sanitized.isCreationTask !== void 0 ? { isCreationTask: sanitized.isCreationTask } : {},
+    ...sanitized.outputRoot ? { outputRoot: sanitized.outputRoot } : {}
   };
 }
 function findStateFile(name, stateDir) {
@@ -15476,6 +15549,29 @@ var IGNORED_REPO_DIRS = /* @__PURE__ */ new Set([
   "dist",
   "node_modules"
 ]);
+var SENSITIVE_PATH_PATTERNS = [
+  { name: ".env", test: (n) => n === ".env" || n.endsWith("/.env") },
+  { name: ".env.*", test: (n) => /\.env\.?[^/]*$/.test(n) || /\/\.env\.?[^/]*$/.test(n) },
+  { name: "private keys", test: (n) => /(^|\/)(id_rsa|id_ed25519|id_ecdsa)(\.pub)?$/.test(n) },
+  { name: "known_hosts", test: (n) => n.endsWith("known_hosts") || n.endsWith("/known_hosts") },
+  { name: "authorized_keys", test: (n) => n.endsWith("authorized_keys") || n.endsWith("/authorized_keys") },
+  { name: "cert/key extensions", test: (n) => /\.(pem|key|p12|pfx)$/i.test(n) },
+  { name: "npm/pypi config", test: (n) => /(^|\/)(\.npmrc|\.pypirc|\.netrc)$/.test(n) },
+  { name: "docker config", test: (n) => /\.docker\/config\.json$/i.test(n) },
+  { name: "credentials", test: (n) => /(^|\/)(credentials\.json|secrets\.json)$/i.test(n) },
+  { name: "service account", test: (n) => /service-account.*\.json$/i.test(n) || /firebase-admin.*\.json$/i.test(n) },
+  { name: ".ssh", test: (n) => n === ".ssh" || n.startsWith(".ssh/") || n.includes("/.ssh/") },
+  { name: ".aws", test: (n) => n === ".aws" || n.startsWith(".aws/") || n.includes("/.aws/") },
+  { name: ".gnupg", test: (n) => n === ".gnupg" || n.startsWith(".gnupg/") || n.includes("/.gnupg/") },
+  { name: ".terraform", test: (n) => n === ".terraform" || n.startsWith(".terraform/") || n.includes("/.terraform/") },
+  { name: ".git", test: (n) => n === ".git" || n.startsWith(".git/") || n.includes("/.git/") },
+  { name: ".runtype", test: (n) => n === ".runtype" || n.startsWith(".runtype/") || n.includes("/.runtype/") }
+];
+function isSensitivePath(normalizedPath) {
+  const n = normalizedPath.replace(/\\/g, "/").trim();
+  if (!n) return false;
+  return SENSITIVE_PATH_PATTERNS.some(({ test }) => test(n));
+}
 var DEFAULT_DISCOVERY_MAX_RESULTS = 50;
 var MAX_FILE_BYTES_TO_SCAN = 1024 * 1024;
 var LOW_SIGNAL_FILE_NAMES = /* @__PURE__ */ new Set([
@@ -15564,12 +15660,15 @@ function scoreSearchPath(relativePath) {
   return score;
 }
 function shouldIgnoreRepoEntry(entryPath) {
-  const normalized = normalizeToolPath(entryPath);
+  const normalized = normalizeToolPath(entryPath).replace(/\\/g, "/");
   if (normalized === ".") return false;
+  if (isSensitivePath(normalized)) return true;
   return normalized.split(path8.sep).some((segment) => IGNORED_REPO_DIRS.has(segment));
 }
 function safeReadTextFile(filePath) {
   try {
+    const normalized = normalizeToolPath(filePath).replace(/\\/g, "/");
+    if (isSensitivePath(normalized)) return null;
     const stat = fs8.statSync(filePath);
     if (!stat.isFile() || stat.size > MAX_FILE_BYTES_TO_SCAN) return null;
     const buffer = fs8.readFileSync(filePath);
@@ -15700,9 +15799,10 @@ function resolveToolPath(toolPath, options = {}) {
     return { ok: false, error: `Path does not exist: ${requestedPath}` };
   }
   const workspaceRoot = fs9.realpathSync.native(process.cwd());
+  const extraRoots = (options.allowedRoots || []).map((rootPath) => canonicalizeAllowedRoot(rootPath));
   const allowedRoots = [
-    workspaceRoot,
-    ...(options.allowedRoots || []).map((rootPath) => canonicalizeAllowedRoot(rootPath))
+    ...extraRoots,
+    workspaceRoot
   ];
   const matchedRoot = allowedRoots.find(
     (rootPath) => isPathWithinRoot(resolved.canonicalPath, rootPath)
@@ -15721,6 +15821,13 @@ function resolveToolPath(toolPath, options = {}) {
         error: `Access denied: ${requestedPath} is inside restricted workspace state (${blockedSegment})`
       };
     }
+    const relativeFromWorkspace = path9.relative(workspaceRoot, resolved.canonicalPath).replace(/\\/g, "/");
+    if (isSensitivePath(relativeFromWorkspace)) {
+      return {
+        ok: false,
+        error: `Access denied: ${requestedPath} is a sensitive path and cannot be read or written`
+      };
+    }
   }
   if (resolved.exists) {
     const stat = fs9.statSync(resolved.canonicalPath);
@@ -15741,8 +15848,17 @@ function resolveToolPath(toolPath, options = {}) {
   }
   return { ok: true, resolvedPath: resolved.canonicalPath };
 }
+function getTaskStateRoot(taskName, stateDir) {
+  return path9.join(stateDir || getMarathonStateDir(), stateSafeName3(taskName));
+}
 function createDefaultLocalTools(context) {
-  const allowedReadRoots = context?.taskName ? [getOffloadedOutputDir(context.taskName, context.stateDir)] : [];
+  const taskStateRoot = context?.taskName ? getTaskStateRoot(context.taskName, context.stateDir) : void 0;
+  const planDir = context?.taskName ? path9.resolve(`.runtype/marathons/${stateSafeName3(context.taskName)}`) : void 0;
+  const allowedReadRoots = context?.taskName ? [
+    getOffloadedOutputDir(context.taskName, context.stateDir),
+    ...taskStateRoot ? [taskStateRoot] : [],
+    ...planDir ? [planDir] : []
+  ] : [];
   return {
     read_file: {
       description: "Read the contents of a file at the given path",
@@ -15944,6 +16060,8 @@ function createDefaultLocalTools(context) {
   };
 }
 function createCheckpointedWriteFileTool(taskName, stateDir) {
+  const taskStateRoot = getTaskStateRoot(taskName, stateDir);
+  const planDir = path9.resolve(`.runtype/marathons/${stateSafeName3(taskName)}`);
   return {
     description: "Write content to a file, creating directories as needed and checkpointing original repo files",
     parametersSchema: {
@@ -15956,7 +16074,8 @@ function createCheckpointedWriteFileTool(taskName, stateDir) {
     },
     execute: async (args) => {
       const resolvedPath = resolveToolPath(String(args.path || ""), {
-        allowMissing: true
+        allowMissing: true,
+        allowedRoots: [taskStateRoot, planDir]
       });
       if (!resolvedPath.ok) return `Error: ${resolvedPath.error}`;
       const content = String(args.content || "");
@@ -16047,6 +16166,7 @@ function createRunCheckTool() {
       if (!isSafeVerificationCommand(command)) {
         return JSON.stringify({
           success: false,
+          blocked: true,
           command,
           error: "Blocked unsafe verification command. Use a single non-destructive lint/test/typecheck/build command."
         });
@@ -16085,6 +16205,57 @@ function createRunCheckTool() {
     }
   };
 }
+function createSearchSessionHistoryTool(client, taskName) {
+  return {
+    description: "Search across all prior marathon sessions for specific information, decisions, findings, or tool outputs. Use this when you need to recall something from earlier sessions that may have been compacted away. Returns ranked results with content snippets from matching sessions.",
+    parametersSchema: {
+      type: "object",
+      properties: {
+        query: {
+          type: "string",
+          description: 'What to search for (e.g. "authentication flow decisions", "test failures in auth module")'
+        },
+        limit: {
+          type: "number",
+          description: "Maximum number of results to return (default 5, max 20)"
+        },
+        types: {
+          type: "array",
+          items: { type: "string", enum: ["response", "reasoning", "tool_output"] },
+          description: "Filter by content type (default: all types)"
+        }
+      },
+      required: ["query"]
+    },
+    execute: async (args) => {
+      const query = String(args.query || "").trim();
+      if (!query) return "Error: query is required";
+      const limit = Math.max(1, Math.min(20, Number(args.limit) || 5));
+      const types = Array.isArray(args.types) ? args.types : void 0;
+      try {
+        const response = await client.post("/session-context/search", {
+          query,
+          taskName,
+          limit,
+          ...types ? { types } : {}
+        });
+        if (!response.success || !response.results || response.results.length === 0) {
+          return "No matching session context found for your query.";
+        }
+        const formatted = response.results.map((r, i) => {
+          const header = `[Result ${i + 1}] Session ${r.sessionIndex} | ${r.type}${r.toolName ? ` (${r.toolName})` : ""} | Score: ${r.score.toFixed(3)}`;
+          return `${header}
+${r.content}`;
+        });
+        return `Found ${response.count} matching results:
+${formatted.join("\n\n---\n\n")}`;
+      } catch (error) {
+        return `Session search unavailable: ${error instanceof Error ? error.message : String(error)}`;
+      }
+    }
+  };
+}
 function buildLocalTools(client, sandboxProvider, options, context) {
   const enabledTools = {};
   if (!options.noLocalTools) {
@@ -16100,6 +16271,9 @@ function buildLocalTools(client, sandboxProvider, options, context) {
         context.stateDir
       );
       enabledTools.run_check = createRunCheckTool();
+      if (options.sessionSearch === true) {
+        enabledTools.search_session_history = createSearchSessionHistoryTool(client, context.taskName);
+      }
     }
   }
   if (sandboxProvider) {
@@ -16111,6 +16285,62 @@ function buildLocalTools(client, sandboxProvider, options, context) {
   return Object.keys(enabledTools).length > 0 ? enabledTools : void 0;
 }
+// src/marathon/session-chunker.ts
+var DEFAULT_MAX_CHUNK_CHARS = 2e3;
+var MIN_CONTENT_LENGTH = 50;
+function extractSessionChunks(snapshot, maxChunkChars = DEFAULT_MAX_CHUNK_CHARS) {
+  const chunks = [];
+  if (snapshot.content && snapshot.content.length >= MIN_CONTENT_LENGTH) {
+    chunks.push(...chunkText(snapshot.content, "response", maxChunkChars));
+  }
+  if (snapshot.reasoning && snapshot.reasoning.length >= MIN_CONTENT_LENGTH) {
+    chunks.push(...chunkText(snapshot.reasoning, "reasoning", maxChunkChars));
+  }
+  for (const tool of snapshot.tools) {
+    const result = typeof tool.result === "string" ? tool.result : JSON.stringify(tool.result ?? "");
+    if (result.length >= MIN_CONTENT_LENGTH) {
+      chunks.push(
+        ...chunkText(result, "tool_output", maxChunkChars, tool.name)
+      );
+    }
+  }
+  return chunks;
+}
+function chunkText(text, type, maxChars, toolName) {
+  if (text.length <= maxChars) {
+    return [{ content: text, type, ...toolName ? { toolName } : {} }];
+  }
+  const chunks = [];
+  const paragraphs = text.split(/\n\n+/);
+  let current = "";
+  for (const paragraph of paragraphs) {
+    if (paragraph.length > maxChars) {
+      if (current.length >= MIN_CONTENT_LENGTH) {
+        chunks.push({ content: current.trim(), type, ...toolName ? { toolName } : {} });
+        current = "";
+      }
+      const sentences = paragraph.match(/[^.!?]+[.!?]+\s*|[^.!?]+$/g) || [paragraph];
+      for (const sentence of sentences) {
+        if (current.length + sentence.length > maxChars && current.length > 0) {
+          chunks.push({ content: current.trim(), type, ...toolName ? { toolName } : {} });
+          current = "";
+        }
+        current += sentence;
+      }
+      continue;
+    }
+    if (current.length + paragraph.length + 2 > maxChars && current.length >= MIN_CONTENT_LENGTH) {
+      chunks.push({ content: current.trim(), type, ...toolName ? { toolName } : {} });
+      current = "";
+    }
+    current += (current ? "\n\n" : "") + paragraph;
+  }
+  if (current.length >= MIN_CONTENT_LENGTH) {
+    chunks.push({ content: current.trim(), type, ...toolName ? { toolName } : {} });
+  }
+  return chunks;
+}
 // src/marathon/loop-detector.ts
 var DEFAULT_MAX_HISTORY = 30;
 var DEFAULT_MIN_PATTERN_LENGTH = 2;
@@ -16462,12 +16692,46 @@ function resolveModelForPhase(phase, cliOverrides, milestoneModels) {
   }
   return cliOverrides.defaultModel;
 }
+function resolveErrorHandlingForPhase(phase, cliFallbackModel, milestoneFallbackModels) {
+  const phaseFallbacks = phase ? milestoneFallbackModels?.[phase] : void 0;
+  if (phaseFallbacks?.length) {
+    return {
+      onError: "fallback",
+      fallbacks: [
+        { type: "retry", delay: 5e3 },
+        ...phaseFallbacks.map((fb) => ({
+          type: "model",
+          model: fb.model,
+          ...fb.temperature !== void 0 ? { temperature: fb.temperature } : {},
+          ...fb.maxTokens !== void 0 ? { maxTokens: fb.maxTokens } : {}
+        }))
+      ]
+    };
+  }
+  if (cliFallbackModel) {
+    return {
+      onError: "fallback",
+      fallbacks: [
+        { type: "retry", delay: 5e3 },
+        { type: "model", model: cliFallbackModel }
+      ]
+    };
+  }
+  return void 0;
+}
 // src/marathon/playbook-loader.ts
 import * as fs12 from "fs";
 import * as path12 from "path";
 import * as os4 from "os";
+import micromatch from "micromatch";
 import { parse as parseYaml } from "yaml";
+var DISCOVERY_TOOLS = /* @__PURE__ */ new Set([
+  "search_repo",
+  "glob_files",
+  "tree_directory",
+  "list_directory"
+]);
 var PLAYBOOKS_DIR = ".runtype/marathons/playbooks";
 function getCandidatePaths(nameOrPath, cwd) {
   const home = os4.homedir();
@@ -16542,7 +16806,54 @@ function buildIsComplete(criteria) {
       return () => false;
   }
 }
+function buildPolicyIntercept(policy) {
+  if (!policy.blockedTools?.length && !policy.blockDiscoveryTools && !policy.allowedReadGlobs?.length && !policy.allowedWriteGlobs?.length && !policy.requirePlanBeforeWrite) {
+    return void 0;
+  }
+  const blockedSet = new Set(
+    (policy.blockedTools ?? []).map((t) => t.trim()).filter(Boolean)
+  );
+  const readGlobs = policy.allowedReadGlobs ?? [];
+  const writeGlobs = policy.allowedWriteGlobs ?? [];
+  return (toolName, args, ctx) => {
+    if (blockedSet.has(toolName)) {
+      return `Blocked by playbook policy: ${toolName} is not allowed for this task.`;
+    }
+    if (policy.blockDiscoveryTools && DISCOVERY_TOOLS.has(toolName)) {
+      return `Blocked by playbook policy: discovery tools are disabled for this task.`;
+    }
+    const pathArg = typeof args.path === "string" && args.path.trim() ? ctx.normalizePath(String(args.path)) : void 0;
+    if (pathArg) {
+      const isWrite = toolName === "write_file" || toolName === "restore_file_checkpoint";
+      const isRead = toolName === "read_file";
+      if (isRead && readGlobs.length > 0) {
+        const allowed = micromatch.some(pathArg, readGlobs, { dot: true });
+        if (!allowed) {
+          return `Blocked by playbook policy: ${toolName} path "${pathArg}" is outside allowed read globs: ${readGlobs.join(", ")}`;
+        }
+      }
+      if (isWrite && writeGlobs.length > 0) {
+        const planPath = ctx.state.planPath ? ctx.normalizePath(ctx.state.planPath) : void 0;
+        if (planPath && pathArg === planPath) {
+        } else {
+          const allowed = micromatch.some(pathArg, writeGlobs, { dot: true });
+          if (!allowed) {
+            return `Blocked by playbook policy: ${toolName} path "${pathArg}" is outside allowed write globs: ${writeGlobs.join(", ")}`;
+          }
+        }
+      }
+      if (isWrite && policy.requirePlanBeforeWrite && !ctx.state.planWritten && !ctx.trace.planWritten) {
+        const planPath = ctx.state.planPath ? ctx.normalizePath(ctx.state.planPath) : void 0;
+        if (!planPath || pathArg !== planPath) {
+          return `Blocked by playbook policy: write the plan before creating other files.`;
+        }
+      }
+    }
+    return void 0;
+  };
+}
 function convertToWorkflow(config2) {
+  const policyIntercept = config2.policy ? buildPolicyIntercept(config2.policy) : void 0;
   const phases = config2.milestones.map((milestone) => ({
     name: milestone.name,
     description: milestone.description,
@@ -16558,6 +16869,7 @@ ${instructions}`;
       return milestone.toolGuidance ?? [];
     },
     isComplete: buildIsComplete(milestone.completionCriteria),
+    interceptToolCall: policyIntercept,
     // Default to rejecting TASK_COMPLETE unless the playbook explicitly allows it.
     // The SDK accepts completion by default when canAcceptCompletion is undefined,
     // which would let the model end the marathon prematurely in early phases.
@@ -16568,23 +16880,37 @@ ${instructions}`;
     phases
   };
 }
+function normalizeFallbackModel(input) {
+  if (typeof input === "string") return { model: input };
+  return {
+    model: input.model,
+    ...input.temperature !== void 0 ? { temperature: input.temperature } : {},
+    ...input.maxTokens !== void 0 ? { maxTokens: input.maxTokens } : {}
+  };
+}
 function loadPlaybook(nameOrPath, cwd) {
   const baseCwd = cwd || process.cwd();
   const candidates = getCandidatePaths(nameOrPath, baseCwd);
   for (const candidate of candidates) {
-    if (!fs12.existsSync(candidate)) continue;
+    if (!fs12.existsSync(candidate) || fs12.statSync(candidate).isDirectory()) continue;
     const config2 = parsePlaybookFile(candidate);
     validatePlaybook(config2, candidate);
     const milestoneModels = {};
+    const milestoneFallbackModels = {};
     for (const m of config2.milestones) {
       if (m.model) milestoneModels[m.name] = m.model;
+      if (m.fallbackModels?.length) {
+        milestoneFallbackModels[m.name] = m.fallbackModels.map(normalizeFallbackModel);
+      }
     }
     return {
       workflow: convertToWorkflow(config2),
       milestones: config2.milestones.map((m) => m.name),
       milestoneModels: Object.keys(milestoneModels).length > 0 ? milestoneModels : void 0,
+      milestoneFallbackModels: Object.keys(milestoneFallbackModels).length > 0 ? milestoneFallbackModels : void 0,
       verification: config2.verification,
-      rules: config2.rules
+      rules: config2.rules,
+      policy: config2.policy
     };
   }
   throw new Error(
@@ -16749,13 +17075,22 @@ function normalizeMarathonAgentArgument(agent) {
 function buildMarathonAutoCreatedAgentBootstrap(agentName, options = {}) {
   const normalizedModel = options.model?.trim();
   const normalizedToolIds = [...new Set((options.toolIds || []).map((toolId) => toolId.trim()).filter(Boolean))];
-  const config2 = normalizedModel || normalizedToolIds.length > 0 ? {
+  const normalizedFallbackModel = options.fallbackModel?.trim();
+  const errorHandling = normalizedFallbackModel ? {
+    onError: "fallback",
+    fallbacks: [
+      { type: "retry", delay: 5e3 },
+      { type: "model", model: normalizedFallbackModel }
+    ]
+  } : void 0;
+  const config2 = normalizedModel || normalizedToolIds.length > 0 || errorHandling ? {
     ...normalizedModel ? { model: normalizedModel } : {},
     ...normalizedToolIds.length > 0 ? {
       tools: {
         toolIds: normalizedToolIds
       }
-    } : {}
+    } : {},
+    ...errorHandling ? { errorHandling } : {}
   } : void 0;
   return {
     description: `Powering a marathon for ${agentName}`,
@@ -16936,6 +17271,9 @@ async function taskAction(agent, options) {
             console.log(chalk16.green(`Created agent: ${agentId}`));
           }
         } catch (createErr) {
+          if (isTransientNetworkError(createErr)) {
+            await failBeforeMain(formatMarathonApiError(createErr));
+          }
           const errMsg = createErr instanceof Error ? createErr.message : String(createErr);
           await failBeforeMain([
             chalk16.red(`Failed to create agent "${normalizedAgent}"`),
@@ -16944,6 +17282,9 @@ async function taskAction(agent, options) {
         }
       }
     } catch (error) {
+      if (isTransientNetworkError(error)) {
+        await failBeforeMain(formatMarathonApiError(error));
+      }
       const errMsg = error instanceof Error ? error.message : String(error);
       await failBeforeMain([
         chalk16.red("Failed to list agents"),
@@ -17109,11 +17450,17 @@ async function taskAction(agent, options) {
   let playbookWorkflow;
   let playbookMilestones;
   let playbookMilestoneModels;
+  let playbookMilestoneFallbackModels;
+  let playbookPolicy;
   if (options.playbook) {
     const result = loadPlaybook(options.playbook);
     playbookWorkflow = result.workflow;
     playbookMilestones = result.milestones;
     playbookMilestoneModels = result.milestoneModels;
+    playbookMilestoneFallbackModels = result.milestoneFallbackModels;
+    playbookPolicy = result.policy;
+  } else {
+    playbookPolicy = void 0;
   }
   if (useStartupShell && !options.model?.trim()) {
     if (playbookMilestoneModels && Object.keys(playbookMilestoneModels).length > 0 && startupShellRef.current) {
@@ -17214,7 +17561,8 @@ ${rulesContext}`;
   if (autoCreatedAgent) {
     const bootstrapPayload = buildMarathonAutoCreatedAgentBootstrap(normalizedAgent, {
       model: options.model || agentConfigModel || defaultConfiguredModel,
-      toolIds: resolvedToolIds
+      toolIds: resolvedToolIds,
+      fallbackModel: options.fallbackModel
     });
     try {
       await client.agents.update(agentId, bootstrapPayload);
@@ -17230,6 +17578,16 @@ ${rulesContext}`;
         );
       }
     }
+  } else if (options.fallbackModel || playbookMilestoneFallbackModels) {
+    const initialErrorHandling = resolveErrorHandlingForPhase(
+      currentPhase,
+      options.fallbackModel,
+      playbookMilestoneFallbackModels
+    );
+    if (initialErrorHandling) {
+      await client.agents.update(agentId, { config: { errorHandling: initialErrorHandling } }).catch(() => {
+      });
+    }
   }
   let localTools = buildLocalTools(client, parsedSandbox, options, {
     taskName,
@@ -17532,7 +17890,13 @@ Saving state... done. Session saved to ${filePath}`);
             model: event.model || effectiveModelForContext
           });
         },
-        ...resumeState ? { resumeState } : {},
+        ...resumeState || playbookPolicy ? {
+          resumeState: {
+            ...resumeState ?? {},
+            ...playbookPolicy?.outputRoot ? { outputRoot: playbookPolicy.outputRoot } : {},
+            ...playbookPolicy?.requireVerification !== void 0 ? { verificationRequired: playbookPolicy.requireVerification } : {}
+          }
+        } : {},
         toolContextMode: options.toolContext || "hot-tail",
         toolWindow: options.toolWindow === "session" || !options.toolWindow ? "session" : parseInt(options.toolWindow, 10) || 10,
         onSession: async (state) => {
@@ -17575,6 +17939,21 @@ Saving state... done. Session saved to ${filePath}`);
           resumeState = extractRunTaskResumeState(adjustedState);
           lastSessionMessages = state.messages ?? [];
           saveState(filePath, adjustedState, { stripSnapshotEvents: !!eventLogWriter });
+          if (options.sessionSearch === true) {
+            const latestSnapshot = persistedSessionSnapshots[persistedSessionSnapshots.length - 1];
+            if (latestSnapshot) {
+              const chunks = extractSessionChunks(latestSnapshot);
+              if (chunks.length > 0) {
+                const sessionIdx = currentSessionOffset + state.sessionCount - 1;
+                client.post("/session-context/index", {
+                  taskName,
+                  sessionIndex: sessionIdx,
+                  chunks
+                }).catch(() => {
+                });
+              }
+            }
+          }
           if (resumeState?.workflowPhase) {
             const displayMilestone = detectedVariant === "external" && resumeState.workflowPhase === "research" && adjustedState.planWritten ? "report" : resumeState.workflowPhase;
             streamRef.current?.updateMilestone(displayMilestone);
@@ -17594,6 +17973,17 @@ Saving state... done. Session saved to ${filePath}`);
               options.model = newPhaseModel;
               modelChangedOnPhaseTransition = true;
             }
+            if (options.fallbackModel || playbookMilestoneFallbackModels) {
+              const newErrorHandling = resolveErrorHandlingForPhase(
+                resumeState.workflowPhase,
+                options.fallbackModel,
+                playbookMilestoneFallbackModels
+              );
+              client.agents.update(agentId, {
+                config: { errorHandling: newErrorHandling ?? null }
+              }).catch(() => {
+              });
+            }
           }
           if (state.recentActionKeys && state.recentActionKeys.length > 0) {
             for (const key of state.recentActionKeys) {
@@ -17939,7 +18329,7 @@ ${details}`);
   }
   return resolved;
 }
-function detectDeployWorkflow(_message, sandboxProvider, resumeState) {
+function detectDeployWorkflow(_message, _sandboxProvider, resumeState) {
   if (resumeState?.workflowVariant === "game") return gameWorkflow;
   if (resumeState?.workflowPhase === "design" || resumeState?.workflowPhase === "build" || resumeState?.workflowPhase === "verify") {
     return gameWorkflow;
@@ -17970,7 +18360,7 @@ function resolveSandboxWorkflowSelection(message, sandboxProvider, resumeState)
   };
 }
 /**
  * Attaches the task command's CLI surface to `cmd` and returns the result of
  * the chained calls: one required `<agent>` argument, the full list of
  * `--option` flags, and `taskAction` as the action handler.
  *
  * In this diff the added (`+`) statement introduces two flags that the
  * removed (`-`) statement does not have: `--session-search` and
  * `--fallback-model <modelId>`.
  *
  * NOTE(review): each `return` statement is shown wrapped onto two lines in
  * the middle of a string literal; presumably a rendering artifact of the
  * diff view rather than a real line break in the bundled file — confirm.
  *
  * @param cmd Command builder exposing chainable `.argument()`, `.option()`
  *   and `.action()` (presumably a Commander `Command` — confirm).
  * @returns The value returned by the final `.action(taskAction)` call.
  */
 function applyTaskOptions(cmd) {
-  return cmd.argument("<agent>", "Agent ID or name").option("-g, --goal <text>", "Goal message for the agent").option("--max-sessions <n>", "Maximum sessions", "50").option("--max-cost <n>", "Budget in USD").option("--model <modelId>", "Model ID to use (overrides agent config)").option("--name <name>", "Task name (used for state file, defaults to agent name)").option("--session <name>", "Resume a specific session by name").option("--state-dir <path>", "Directory for state files (default: ~/.runtype/projects/<hash>/marathons/)").option("--resume [message]", "Resume from existing local state, optionally with a new message").option("--fresh", "Start a new run and ignore any existing local state for this task").option("--compact", "Force compact-summary resume mode instead of replaying full history").option("--compact-strategy <strategy>", "Compaction strategy: auto (default), provider_native, or summary_fallback").option("--compact-threshold <value>", "Auto-compact when estimated context crosses this threshold (default: 80% fallback, 90% native; accepts percent like 90% or absolute token count like 120000)").option("--compact-instructions <text>", "Extra instructions for what a compact summary must preserve").option("--no-auto-compact", "Disable automatic context-aware history compaction").option("--track", "Sync progress to a Runtype record (visible in dashboard)").option("--debug", "Show debug output from each session").option("--json", "Output final result as JSON").option("--sandbox <provider>", "Enable sandbox code execution tool (cloudflare-worker, quickjs, or daytona)").option("--no-local-tools", "Disable built-in local tool execution (read_file, write_file, list_directory)").option("-t, --tools <tools...>", "Enable built-in tools (e.g., exa, firecrawl, dalle, openai_web_search, anthropic_web_search)").option("--plain-text", "Disable markdown rendering in output").option("--no-reasoning", "Disable model reasoning/thinking (enabled by default for supported 
models)").option("--no-checkpoint", "Run all iterations without checkpoint pauses (fully autonomous)").option("--checkpoint-timeout <seconds>", "Auto-continue timeout in seconds (default: 10)", "10").option("--planning-model <modelId>", "Model to use during research/planning phases").option("--execution-model <modelId>", "Model to use during execution phase").option("--playbook <name>", "Load a playbook from .runtype/marathons/playbooks/").option("--offload-threshold <chars>", 'Offload tool outputs larger than this to files (default: 100000; use "off" or "0" to disable guardrails)').option("--tool-context <mode>", "Tool result storage: hot-tail (default), observation-mask, or full-inline").option("--tool-window <window>", 'Compaction window: "session" (default) or a number for last-N tool results (e.g. 10)').option("--runner-char <char>", "Custom runner emoji (default: \u{1F3C3})").option("--finish-char <char>", "Custom finish line emoji (default: \u{1F3C1})").option("--no-runner", "Hide the runner emoji from the header border").option("--no-finish", "Hide the finish line emoji from the header border").action(taskAction);
+  return cmd.argument("<agent>", "Agent ID or name").option("-g, --goal <text>", "Goal message for the agent").option("--max-sessions <n>", "Maximum sessions", "50").option("--max-cost <n>", "Budget in USD").option("--model <modelId>", "Model ID to use (overrides agent config)").option("--name <name>", "Task name (used for state file, defaults to agent name)").option("--session <name>", "Resume a specific session by name").option("--state-dir <path>", "Directory for state files (default: ~/.runtype/projects/<hash>/marathons/)").option("--resume [message]", "Resume from existing local state, optionally with a new message").option("--fresh", "Start a new run and ignore any existing local state for this task").option("--compact", "Force compact-summary resume mode instead of replaying full history").option("--compact-strategy <strategy>", "Compaction strategy: auto (default), provider_native, or summary_fallback").option("--compact-threshold <value>", "Auto-compact when estimated context crosses this threshold (default: 80% fallback, 90% native; accepts percent like 90% or absolute token count like 120000)").option("--compact-instructions <text>", "Extra instructions for what a compact summary must preserve").option("--no-auto-compact", "Disable automatic context-aware history compaction").option("--track", "Sync progress to a Runtype record (visible in dashboard)").option("--debug", "Show debug output from each session").option("--json", "Output final result as JSON").option("--sandbox <provider>", "Enable sandbox code execution tool (cloudflare-worker, quickjs, or daytona)").option("--no-local-tools", "Disable built-in local tool execution (read_file, write_file, list_directory)").option("--session-search", "Enable session context indexing and search_session_history tool").option("-t, --tools <tools...>", "Enable built-in tools (e.g., exa, firecrawl, dalle, openai_web_search, anthropic_web_search)").option("--plain-text", "Disable markdown rendering in 
output").option("--no-reasoning", "Disable model reasoning/thinking (enabled by default for supported models)").option("--no-checkpoint", "Run all iterations without checkpoint pauses (fully autonomous)").option("--checkpoint-timeout <seconds>", "Auto-continue timeout in seconds (default: 10)", "10").option("--planning-model <modelId>", "Model to use during research/planning phases").option("--execution-model <modelId>", "Model to use during execution phase").option("--fallback-model <modelId>", "Model to fall back to when primary model fails").option("--playbook <name>", "Load a playbook from .runtype/marathons/playbooks/").option("--offload-threshold <chars>", 'Offload tool outputs larger than this to files (default: 100000; use "off" or "0" to disable guardrails)').option("--tool-context <mode>", "Tool result storage: hot-tail (default), observation-mask, or full-inline").option("--tool-window <window>", 'Compaction window: "session" (default) or a number for last-N tool results (e.g. 10)').option("--runner-char <char>", "Custom runner emoji (default: \u{1F3C3})").option("--finish-char <char>", "Custom finish line emoji (default: \u{1F3C1})").option("--no-runner", "Hide the runner emoji from the header border").option("--no-finish", "Hide the finish line emoji from the header border").action(taskAction);
 }
 var taskCommand = applyTaskOptions(
   new Command10("task").description("Run a multi-session agent task")