@llmist/cli 15.12.0 → 15.14.0

This diff shows the published contents of these package versions as they appear in their public registry, and is provided for informational purposes only.
package/dist/cli.js CHANGED
@@ -51,7 +51,11 @@ var OPTION_FLAGS = {
  maxRetries: "--max-retries <count>",
  retryMinTimeout: "--retry-min-timeout <ms>",
  retryMaxTimeout: "--retry-max-timeout <ms>",
- noRetry: "--no-retry"
+ noRetry: "--no-retry",
+ // Reasoning options
+ reasoning: "--reasoning [effort]",
+ noReasoning: "--no-reasoning",
+ reasoningBudget: "--reasoning-budget <tokens>"
  };
  var OPTION_DESCRIPTIONS = {
  model: "Model identifier, e.g. openai:gpt-5-nano or anthropic:claude-sonnet-4-5.",
@@ -88,7 +92,11 @@ var OPTION_DESCRIPTIONS = {
  maxRetries: "Maximum retry attempts for failed API calls.",
  retryMinTimeout: "Initial retry delay in milliseconds.",
  retryMaxTimeout: "Maximum retry delay in milliseconds.",
- noRetry: "Disable retry logic for API calls."
+ noRetry: "Disable retry logic for API calls.",
+ // Reasoning descriptions
+ reasoning: "Enable reasoning mode. Optional effort: none, low, medium, high, maximum (default: medium).",
+ noReasoning: "Disable auto-enabled reasoning for reasoning-capable models.",
+ reasoningBudget: "Explicit reasoning token budget (Anthropic/Gemini 2.5). Overrides effort level."
  };
  var SUMMARY_PREFIX = "[llmist]";
 
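
A note on how these flags resolve: `--reasoning [effort]` takes an optional value, and `--no-reasoning` is Commander's negated form of the same option, so both write to a single `reasoning` property. A minimal sketch of the resulting values, assuming Commander's documented optional-value and negation behavior (the wiring below is illustrative, not taken from the package):

import { Command } from "commander";

const program = new Command()
  .option("--reasoning [effort]", "Enable reasoning mode.")
  .option("--no-reasoning", "Disable auto-enabled reasoning.")
  .option("--reasoning-budget <tokens>", "Explicit reasoning token budget.", Number);

program.parse(["--reasoning", "high"], { from: "user" });
console.log(program.opts().reasoning); // "high"

// "--reasoning"             -> opts.reasoning === true  (enable, default effort)
// "--no-reasoning"          -> opts.reasoning === false (explicit disable)
// (neither flag)            -> opts.reasoning === undefined
// "--reasoning-budget 4096" -> opts.reasoningBudget === 4096

This is why the resolution code further down checks `options.reasoning === false` before anything else.
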
@@ -98,7 +106,7 @@ import { Command, InvalidArgumentError as InvalidArgumentError2 } from "commande
  // package.json
  var package_default = {
  name: "@llmist/cli",
- version: "15.12.0",
+ version: "15.14.0",
  description: "CLI for llmist - run LLM agents from the command line",
  type: "module",
  main: "dist/cli.js",
@@ -154,7 +162,7 @@ var package_default = {
  node: ">=22.0.0"
  },
  dependencies: {
- llmist: "^15.12.0",
+ llmist: "^15.14.0",
  "@unblessed/node": "^1.0.0-alpha.23",
  chalk: "^5.6.2",
  commander: "^12.1.0",
@@ -168,7 +176,7 @@ var package_default = {
  zod: "^4.1.12"
  },
  devDependencies: {
- "@llmist/testing": "^15.12.0",
+ "@llmist/testing": "^15.14.0",
  "@types/diff": "^8.0.0",
  "@types/js-yaml": "^4.0.9",
  "@types/marked-terminal": "^6.1.1",
@@ -420,6 +428,7 @@ var COMPLETE_CONFIG_KEYS = /* @__PURE__ */ new Set([
  "log-llm-requests",
  "rate-limits",
  "retry",
+ "reasoning",
  "type"
  // Allowed for inheritance compatibility, ignored for built-in commands
  ]);
@@ -452,6 +461,7 @@ var AGENT_CONFIG_KEYS = /* @__PURE__ */ new Set([
  "log-llm-requests",
  "rate-limits",
  "retry",
+ "reasoning",
  "type"
  // Allowed for inheritance compatibility, ignored for built-in commands
  ]);
@@ -684,6 +694,39 @@ function validateRetryConfig(value, section) {
  }
  return result;
  }
+ var REASONING_CONFIG_KEYS = /* @__PURE__ */ new Set(["enabled", "effort", "budget-tokens"]);
+ var VALID_REASONING_EFFORTS = /* @__PURE__ */ new Set(["none", "low", "medium", "high", "maximum"]);
+ function validateReasoningConfig(value, section) {
+ if (typeof value !== "object" || value === null || Array.isArray(value)) {
+ throw new ConfigError(`[${section}] must be a table`);
+ }
+ const raw = value;
+ const result = {};
+ for (const [key, val] of Object.entries(raw)) {
+ if (!REASONING_CONFIG_KEYS.has(key)) {
+ throw new ConfigError(`[${section}] has unknown key: ${key}`);
+ }
+ switch (key) {
+ case "enabled":
+ result.enabled = validateBoolean(val, key, section);
+ break;
+ case "effort": {
+ const effort = validateString(val, key, section);
+ if (!VALID_REASONING_EFFORTS.has(effort)) {
+ throw new ConfigError(
+ `[${section}].effort must be one of: none, low, medium, high, maximum (got "${effort}")`
+ );
+ }
+ result.effort = effort;
+ break;
+ }
+ case "budget-tokens":
+ result["budget-tokens"] = validateNumber(val, key, section, { integer: true, min: 1 });
+ break;
+ }
+ }
+ return result;
+ }
  function validateGlobalSubagentConfig(value, section) {
  if (typeof value !== "object" || value === null || Array.isArray(value)) {
  throw new ConfigError(`[${section}] must be a table`);
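
The table this validates comes from profile config (e.g. a reasoning section under a complete or agent profile). The hypothetical inputs below illustrate the accept/reject behavior of the validateReasoningConfig added above:

// Accepted: returns { enabled: true, effort: "high", "budget-tokens": 8192 }
validateReasoningConfig({ enabled: true, effort: "high", "budget-tokens": 8192 }, "complete.reasoning");

// Rejected: unknown effort level
// ConfigError: [complete.reasoning].effort must be one of: none, low, medium, high, maximum (got "extreme")
validateReasoningConfig({ effort: "extreme" }, "complete.reasoning");

// Rejected: only enabled, effort, and budget-tokens are allowed keys
// ConfigError: [complete.reasoning] has unknown key: budget
validateReasoningConfig({ budget: 8192 }, "complete.reasoning");
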
@@ -850,6 +893,9 @@ function validateCompleteConfig(raw, section) {
  if ("retry" in rawObj) {
  result.retry = validateRetryConfig(rawObj.retry, `${section}.retry`);
  }
+ if ("reasoning" in rawObj) {
+ result.reasoning = validateReasoningConfig(rawObj.reasoning, `${section}.reasoning`);
+ }
  return result;
  }
  function validateAgentConfig(raw, section) {
@@ -947,6 +993,9 @@ function validateAgentConfig(raw, section) {
  if ("retry" in rawObj) {
  result.retry = validateRetryConfig(rawObj.retry, `${section}.retry`);
  }
+ if ("reasoning" in rawObj) {
+ result.reasoning = validateReasoningConfig(rawObj.reasoning, `${section}.reasoning`);
+ }
  return result;
  }
  function validateImageConfig(raw, section) {
@@ -3164,6 +3213,8 @@ var StreamProgress = class {
  // Cache token tracking for live cost estimation during streaming
  callCachedInputTokens = 0;
  callCacheCreationInputTokens = 0;
+ // Reasoning token tracking for live cost estimation during streaming
+ callReasoningTokens = 0;
  // Cumulative stats (cumulative mode)
  totalStartTime = Date.now();
  totalTokens = 0;
@@ -3282,6 +3333,7 @@ var StreamProgress = class {
  if (info.cachedInputTokens !== void 0) agent.cachedInputTokens = info.cachedInputTokens;
  if (info.cacheCreationInputTokens !== void 0)
  agent.cacheCreationInputTokens = info.cacheCreationInputTokens;
+ if (info.reasoningTokens !== void 0) agent.reasoningTokens = info.reasoningTokens;
  if (info.finishReason !== void 0) agent.finishReason = info.finishReason;
  if (info.cost !== void 0) {
  agent.cost = info.cost;
@@ -3293,7 +3345,8 @@ var StreamProgress = class {
  agent.inputTokens ?? 0,
  agent.outputTokens,
  agent.cachedInputTokens,
- agent.cacheCreationInputTokens
+ agent.cacheCreationInputTokens,
+ agent.reasoningTokens
  );
  agent.cost = costResult?.totalCost;
  } catch {
@@ -3407,6 +3460,7 @@ var StreamProgress = class {
  this.isStreaming = false;
  this.callCachedInputTokens = 0;
  this.callCacheCreationInputTokens = 0;
+ this.callReasoningTokens = 0;
  this.start();
  }
  /**
@@ -3425,7 +3479,8 @@ var StreamProgress = class {
  usage.inputTokens,
  usage.outputTokens,
  usage.cachedInputTokens ?? 0,
- usage.cacheCreationInputTokens ?? 0
+ usage.cacheCreationInputTokens ?? 0,
+ usage.reasoningTokens ?? 0
  );
  if (cost) {
  this.totalCost += cost.totalCost;
@@ -3484,6 +3539,14 @@ var StreamProgress = class {
  this.callCachedInputTokens = cachedInputTokens;
  this.callCacheCreationInputTokens = cacheCreationInputTokens;
  }
+ /**
+ * Sets reasoning token count for the current call (from stream metadata).
+ * Used for live cost estimation during streaming.
+ * @param reasoningTokens - Number of reasoning/thinking tokens (subset of outputTokens)
+ */
+ setReasoningTokens(reasoningTokens) {
+ this.callReasoningTokens = reasoningTokens;
+ }
  /**
  * Get total elapsed time in seconds since the first call started.
  * @returns Elapsed time in seconds with 1 decimal place
@@ -3725,7 +3788,8 @@ var StreamProgress = class {
  this.callInputTokens,
  outputTokens,
  this.callCachedInputTokens,
- this.callCacheCreationInputTokens
+ this.callCacheCreationInputTokens,
+ this.callReasoningTokens
  );
  return cost?.totalCost ?? 0;
  } catch {
@@ -3946,7 +4010,11 @@ function addCompleteOptions(cmd, defaults) {
  OPTION_DESCRIPTIONS.retryMaxTimeout,
  createNumericParser({ label: "Max timeout", integer: true, min: 0 }),
  defaults?.retry?.["max-timeout"]
- ).option(OPTION_FLAGS.noRetry, OPTION_DESCRIPTIONS.noRetry);
+ ).option(OPTION_FLAGS.noRetry, OPTION_DESCRIPTIONS.noRetry).option(OPTION_FLAGS.reasoning, OPTION_DESCRIPTIONS.reasoning).option(OPTION_FLAGS.noReasoning, OPTION_DESCRIPTIONS.noReasoning).option(
+ OPTION_FLAGS.reasoningBudget,
+ OPTION_DESCRIPTIONS.reasoningBudget,
+ createNumericParser({ label: "Reasoning budget", integer: true, min: 1 })
+ );
  }
  function addAgentOptions(cmd, defaults) {
  const gadgetAccumulator = (value, previous = []) => [
@@ -4009,7 +4077,11 @@ function addAgentOptions(cmd, defaults) {
  OPTION_DESCRIPTIONS.retryMaxTimeout,
  createNumericParser({ label: "Max timeout", integer: true, min: 0 }),
  defaults?.retry?.["max-timeout"]
- ).option(OPTION_FLAGS.noRetry, OPTION_DESCRIPTIONS.noRetry);
+ ).option(OPTION_FLAGS.noRetry, OPTION_DESCRIPTIONS.noRetry).option(OPTION_FLAGS.reasoning, OPTION_DESCRIPTIONS.reasoning).option(OPTION_FLAGS.noReasoning, OPTION_DESCRIPTIONS.noReasoning).option(
+ OPTION_FLAGS.reasoningBudget,
+ OPTION_DESCRIPTIONS.reasoningBudget,
+ createNumericParser({ label: "Reasoning budget", integer: true, min: 1 })
+ );
  }
  function configToCompleteOptions(config) {
  const result = {};
@@ -4034,6 +4106,9 @@ function configToCompleteOptions(config) {
  if (r["max-timeout"] !== void 0) result.retryMaxTimeout = r["max-timeout"];
  if (r.enabled === false) result.noRetry = true;
  }
+ if (config.reasoning) {
+ result.profileReasoning = config.reasoning;
+ }
  return result;
  }
  function configToAgentOptions(config) {
@@ -4073,6 +4148,9 @@ function configToAgentOptions(config) {
  if (r["max-timeout"] !== void 0) result.retryMaxTimeout = r["max-timeout"];
  if (r.enabled === false) result.noRetry = true;
  }
+ if (config.reasoning) {
+ result.profileReasoning = config.reasoning;
+ }
  if (config["show-hints"] !== void 0) result.showHints = config["show-hints"];
  return result;
  }
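
Note that the profile table is carried separately as `profileReasoning` rather than merged into the CLI-facing `reasoning` value; the resolution code in the builder and executeComplete hunks further down uses it only when no CLI flag was given. A condensed sketch of that precedence, mirroring the logic in this diff (the function name is hypothetical):

// CLI --no-reasoning > CLI --reasoning / --reasoning-budget > profile table > provider default.
function resolveReasoning(options) {
  if (options.reasoning === false) return { enabled: false };
  if (options.reasoning !== undefined || options.reasoningBudget !== undefined) {
    const effort = typeof options.reasoning === "string" ? options.reasoning : undefined;
    return {
      enabled: true,
      ...(effort && { effort }),
      ...(options.reasoningBudget && { budgetTokens: options.reasoningBudget })
    };
  }
  if (options.profileReasoning) {
    const cfg = options.profileReasoning;
    if (cfg.enabled === false) return { enabled: false };
    return {
      enabled: true,
      ...(cfg.effort && { effort: cfg.effort }),
      // profile config uses kebab-case; the request payload uses camelCase
      ...(cfg["budget-tokens"] && { budgetTokens: cfg["budget-tokens"] })
    };
  }
  return undefined; // fall through to the model's default behavior
}
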
@@ -4327,6 +4405,9 @@ function formatLLMCallCollapsed(node, selected) {
  if (d.outputTokens && d.outputTokens > 0) {
  parts.push(chalk3.dim("\u2193") + chalk3.green(` ${formatTokens(d.outputTokens)}`));
  }
+ if (d.reasoningTokens && d.reasoningTokens > 0) {
+ parts.push(chalk3.dim("\u{1F4AD}") + chalk3.magenta(` ${formatTokens(d.reasoningTokens)}`));
+ }
  if (d.elapsedSeconds !== void 0) {
  parts.push(chalk3.dim(`${d.elapsedSeconds.toFixed(1)}s`));
  }
@@ -4374,6 +4455,11 @@ function formatLLMCallExpanded(node) {
  `${indent}${chalk3.dim(BOX.vertical)} Output: ${chalk3.green(formatTokens(d.outputTokens))} tokens`
  );
  }
+ if (d.reasoningTokens !== void 0 && d.reasoningTokens > 0) {
+ lines.push(
+ `${indent}${chalk3.dim(BOX.vertical)} Reason: ${chalk3.magenta(formatTokens(d.reasoningTokens))} tokens`
+ );
+ }
  if (d.contextPercent !== void 0) {
  let contextColor = chalk3.green;
  if (d.contextPercent >= 80) contextColor = chalk3.red;
@@ -4633,6 +4719,8 @@ var BlockRenderer = class _BlockRenderer {
  nodeIdCounter = 0;
  /** Current LLM call node (for adding gadget children) */
  currentLLMCallId = null;
+ /** Current thinking block (accumulates chunks during streaming) */
+ currentThinkingId = null;
  /** Persisted expanded states (survives rebuildBlocks) */
  expandedStates = /* @__PURE__ */ new Map();
  /** Whether to auto-scroll to bottom on new content ("follow mode") */
@@ -4868,6 +4956,66 @@ var BlockRenderer = class _BlockRenderer {
  this.rebuildBlocks();
  return id;
  }
+ /**
+ * Add thinking content from a reasoning model.
+ * Creates a new thinking block on first chunk, appends to existing on subsequent chunks.
+ * The block lives as a child of the current LLM call.
+ *
+ * @param content - Thinking text chunk
+ * @param thinkingType - Whether this is actual thinking or redacted content
+ */
+ addThinking(content, thinkingType) {
+ if (this.currentThinkingId) {
+ const node2 = this.getNode(this.currentThinkingId);
+ if (node2 && node2.type === "thinking") {
+ node2.content += content;
+ this.updateBlock(this.currentThinkingId);
+ return;
+ }
+ }
+ const id = this.generateId("thinking");
+ const parentLLMCallId = this.currentLLMCallId;
+ let depth = 0;
+ if (parentLLMCallId) {
+ const parent = this.getNode(parentLLMCallId);
+ if (parent) {
+ depth = parent.depth + 1;
+ }
+ }
+ const node = {
+ id,
+ type: "thinking",
+ depth,
+ parentId: parentLLMCallId,
+ sessionId: this.currentSessionId,
+ content,
+ thinkingType,
+ isComplete: false,
+ children: []
+ };
+ this.nodes.set(id, node);
+ if (parentLLMCallId) {
+ const parent = this.getNode(parentLLMCallId);
+ parent.children.push(id);
+ } else {
+ this.rootIds.push(id);
+ }
+ this.currentThinkingId = id;
+ this.rebuildBlocks();
+ }
+ /**
+ * Complete the current thinking block.
+ * Called when the LLM call finishes to mark thinking as complete.
+ */
+ completeThinking() {
+ if (!this.currentThinkingId) return;
+ const node = this.getNode(this.currentThinkingId);
+ if (node && node.type === "thinking") {
+ node.isComplete = true;
+ this.updateBlock(this.currentThinkingId);
+ }
+ this.currentThinkingId = null;
+ }
  /**
  * Add a user message block (for REPL mid-session input).
  *
@@ -4951,6 +5099,7 @@ var BlockRenderer = class _BlockRenderer {
  this.selectableIds = [];
  this.selectedIndex = -1;
  this.currentLLMCallId = null;
+ this.currentThinkingId = null;
  for (const child of [...this.container.children]) {
  child.detach();
  }
@@ -5280,6 +5429,25 @@ ${fullContent}
  }
  return this.abbreviateToLines(fullContent, 2, selected);
  }
+ case "thinking": {
+ const DIM2 = "\x1B[2m";
+ const RED_DIM = "\x1B[2;31m";
+ const RESET3 = "\x1B[0m";
+ const contIndent = getContinuationIndent(node.depth);
+ if (node.thinkingType === "redacted") {
+ const header2 = `${indent}${RED_DIM}\u{1F512} [Redacted thinking block]${RESET3}`;
+ return header2;
+ }
+ if (!expanded) {
+ const firstLine = node.content.split("\n")[0]?.slice(0, 60) ?? "";
+ const suffix = node.isComplete ? "" : "...";
+ return `${indent}${DIM2}\u{1F4AD} Thinking${suffix} ${firstLine}${RESET3}`;
+ }
+ const tokenInfo = node.isComplete ? ` (${Math.ceil(node.content.length / 4)} tokens est.)` : "";
+ const header = `${indent}${DIM2}\u25BC \u{1F4AD} Thinking${tokenInfo}${RESET3}`;
+ const contentLines = node.content.split("\n").map((line) => `${contIndent}${DIM2}${line}${RESET3}`);
+ return [header, ...contentLines].join("\n");
+ }
  case "system_message": {
  const icon = this.getSystemMessageIcon(node.category);
  const color = this.getSystemMessageColor(node.category);
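
Two details worth noting in the thinking renderer above: collapsed blocks preview only the first 60 characters of the first line (with a trailing "..." while still streaming), and the expanded header's "(N tokens est.)" figure is a local character-based estimate, not the provider-reported reasoningTokens that feeds the token summaries elsewhere in this diff. The estimate restated in isolation (the sample string is arbitrary):

// Heuristic used above: roughly four characters per token, rounded up.
const estimateTokens = (content) => Math.ceil(content.length / 4);
estimateTokens("Let me work through the retry budget first."); // 11
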
@@ -5619,6 +5787,8 @@ ${indicator}`;
  return true;
  case "llm_call":
  return false;
+ case "thinking":
+ return false;
  case "gadget": {
  const name = node.name;
  return name === "TellUser" || name === "AskUser" || name === "Finish";
@@ -5680,6 +5850,7 @@ ${indicator}`;
  handleTreeEvent(event, tree) {
  switch (event.type) {
  case "llm_call_start": {
+ this.currentThinkingId = null;
  let parentBlockId;
  if (event.parentId) {
  parentBlockId = this.treeNodeToBlockId.get(event.parentId);
@@ -5698,12 +5869,14 @@
  break;
  }
  case "llm_call_complete": {
+ this.completeThinking();
  const blockId = this.treeNodeToBlockId.get(event.nodeId);
  if (blockId) {
  this.completeLLMCall(blockId, {
  inputTokens: event.usage?.inputTokens,
  cachedInputTokens: event.usage?.cachedInputTokens,
  outputTokens: event.usage?.outputTokens,
+ reasoningTokens: event.usage?.reasoningTokens,
  cost: event.cost,
  finishReason: event.finishReason ?? void 0
  });
@@ -5714,6 +5887,10 @@ ${indicator}`;
  }
  break;
  }
+ case "thinking": {
+ this.addThinking(event.content, event.thinkingType);
+ break;
+ }
  case "gadget_call": {
  let parentBlockId;
  if (event.parentId) {
@@ -7404,6 +7581,7 @@ var StatusBar = class {
  inputTokens: 0,
  outputTokens: 0,
  cachedTokens: 0,
+ reasoningTokens: 0,
  cost: 0,
  startTime: Date.now(),
  iteration: 0,
@@ -7437,10 +7615,11 @@
  * Called when an LLM call completes.
  * Replaces streaming estimates with actual values.
  */
- endCall(inputTokens, outputTokens, cachedTokens, cost) {
+ endCall(inputTokens, outputTokens, cachedTokens, cost, reasoningTokens = 0) {
  this.metrics.inputTokens += inputTokens;
  this.metrics.outputTokens += outputTokens;
  this.metrics.cachedTokens += cachedTokens;
+ this.metrics.reasoningTokens += reasoningTokens;
  this.metrics.cost += cost;
  this.streamingInputTokens = 0;
  this.streamingOutputTokens = 0;
@@ -7640,7 +7819,8 @@ var StatusBar = class {
  event.usage?.inputTokens ?? 0,
  event.usage?.outputTokens ?? 0,
  event.usage?.cachedInputTokens ?? 0,
- event.cost ?? 0
+ event.cost ?? 0,
+ event.usage?.reasoningTokens ?? 0
  );
  }
  this.nodeIdToLabel.delete(event.nodeId);
@@ -7805,6 +7985,9 @@ var StatusBar = class {
  const outputPrefix = this.isStreaming ? "~" : "";
  parts.push(`${GREEN2}\u2193${outputPrefix}${formatTokens(displayOutputTokens)}${RESET3}`);
  }
+ if (this.metrics.reasoningTokens > 0) {
+ parts.push(`${MAGENTA2}\u{1F4AD}${formatTokens(this.metrics.reasoningTokens)}${RESET3}`);
+ }
  const earliestStart = this.getEarliestLLMCallStartTime();
  if (earliestStart !== null) {
  const elapsedSeconds = (Date.now() - earliestStart) / 1e3;
@@ -8048,6 +8231,8 @@ var TUIApp = class _TUIApp {
  handleEvent(event) {
  if (event.type === "text") {
  this.blockRenderer.addText(event.content);
+ } else if (event.type === "thinking") {
+ this.blockRenderer.addThinking(event.content, event.thinkingType);
  }
  }
  /**
@@ -8698,6 +8883,27 @@ ${ctx.gadgetName} requires interactive approval. Run in a terminal to approve.`
  if (options.temperature !== void 0) {
  builder.withTemperature(options.temperature);
  }
+ if (options.reasoning === false) {
+ builder.withoutReasoning();
+ } else if (options.reasoning !== void 0 || options.reasoningBudget !== void 0) {
+ const effort = typeof options.reasoning === "string" ? options.reasoning : void 0;
+ builder.withReasoning({
+ enabled: true,
+ ...effort && { effort },
+ ...options.reasoningBudget && { budgetTokens: options.reasoningBudget }
+ });
+ } else if (options.profileReasoning) {
+ const cfg = options.profileReasoning;
+ if (cfg.enabled === false) {
+ builder.withoutReasoning();
+ } else {
+ builder.withReasoning({
+ enabled: true,
+ ...cfg.effort && { effort: cfg.effort },
+ ...cfg["budget-tokens"] && { budgetTokens: cfg["budget-tokens"] }
+ });
+ }
+ }
  if (tui) {
  builder.onHumanInput(async (question) => {
  return tui.waitForInput(question, "AskUser");
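
The `...expr && { key }` pattern used throughout these hunks relies on object spread treating falsy operands as no-ops: spreading `false` or `undefined` adds nothing, so optional keys appear only when a value is present. A standalone demonstration of that idiom:

const effort = undefined;
const budgetTokens = 4096;
const reasoning = {
  enabled: true,
  ...(effort && { effort }),             // spreading undefined/false adds no key
  ...(budgetTokens && { budgetTokens })  // key added only when truthy
};
console.log(reasoning); // { enabled: true, budgetTokens: 4096 }
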
@@ -8788,6 +8994,11 @@ ${ctx.gadgetName} requires interactive approval. Run in a terminal to approve.`
  } else {
  if (event.type === "text") {
  env.stdout.write(event.content);
+ } else if (event.type === "thinking") {
+ const stderrTTY = env.stderr.isTTY === true;
+ if (stderrTTY && !options.quiet) {
+ env.stderr.write(`\x1B[2m${event.content}\x1B[0m`);
+ }
  } else if (event.type === "gadget_result" && event.result.gadgetName === "TellUser" && event.result.result) {
  env.stdout.write(`${event.result.result}
  `);
@@ -8854,6 +9065,7 @@ function registerAgentCommand(program, env, config, globalSubagents, globalRateL
  globalRetry,
  profileRateLimits: config?.["rate-limits"],
  profileRetry: config?.retry,
+ profileReasoning: config?.reasoning,
  showHints: config?.["show-hints"]
  };
  return executeAgent(prompt, mergedOptions, env, "agent");
@@ -8908,11 +9120,34 @@ async function executeComplete(promptArg, options, env) {
  const content = formatLlmRequest2(messages);
  await writeLogFile(llmLogDir, filename, content);
  }
+ let reasoning;
+ if (options.reasoning === false) {
+ reasoning = { enabled: false };
+ } else if (options.reasoning !== void 0 || options.reasoningBudget !== void 0) {
+ const effort = typeof options.reasoning === "string" ? options.reasoning : void 0;
+ reasoning = {
+ enabled: true,
+ ...effort && { effort },
+ ...options.reasoningBudget && { budgetTokens: options.reasoningBudget }
+ };
+ } else if (options.profileReasoning) {
+ const cfg = options.profileReasoning;
+ if (cfg.enabled === false) {
+ reasoning = { enabled: false };
+ } else {
+ reasoning = {
+ enabled: true,
+ ...cfg.effort && { effort: cfg.effort },
+ ...cfg["budget-tokens"] && { budgetTokens: cfg["budget-tokens"] }
+ };
+ }
+ }
  const stream = client.stream({
  model,
  messages,
  temperature: options.temperature,
- maxTokens: options.maxTokens
+ maxTokens: options.maxTokens,
+ ...reasoning && { reasoning }
  });
  const printer = new StreamPrinter(env.stdout);
  const stderrTTY = env.stderr.isTTY === true;
@@ -8932,6 +9167,12 @@
  progress.setOutputTokens(chunk.usage.outputTokens, false);
  }
  }
+ if (chunk.thinking?.content) {
+ if (stderrTTY && !options.quiet) {
+ progress.pause();
+ env.stderr.write(`\x1B[2m${chunk.thinking.content}\x1B[0m`);
+ }
+ }
  if (chunk.text) {
  progress.pause();
  accumulatedResponse += chunk.text;
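
Because thinking text is written dimmed to stderr only when stderr is a TTY and --quiet is not set, redirecting stdout still captures just the answer. A minimal consumer sketch of the chunk fields the loop above reads (`stream` as returned by client.stream; an enclosing async context is assumed):

// Illustrative consumer of the same chunk shape executeComplete handles:
for await (const chunk of stream) {
  if (chunk.thinking?.content) {
    process.stderr.write(`\x1B[2m${chunk.thinking.content}\x1B[0m`); // thinking: dim, stderr
  }
  if (chunk.text) {
    process.stdout.write(chunk.text); // answer text: stdout
  }
}
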
@@ -8965,7 +9206,8 @@ function registerCompleteCommand(program, env, config, globalRateLimits, globalR
  const mergedOptions = {
  ...options,
  globalRateLimits,
- globalRetry
+ globalRetry,
+ profileReasoning: config?.reasoning
  };
  return executeComplete(prompt, mergedOptions, env);
  }, env)