npm - lynkr - Versions diffs - 9.0.1 → 9.1.2 - Mend

lynkr 9.0.1 → 9.1.2

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (58)

package/README.md +70 -21
package/bin/cli.js +34 -4
package/bin/lynkr-trajectory.js +136 -0
package/bin/lynkr-usage.js +219 -0
package/funding.json +110 -0
package/index.js +7 -3
package/install.sh +3 -3
package/lynkr-skill.tar.gz +0 -0
package/native/Cargo.toml +26 -0
package/native/index.js +29 -0
package/native/lynkr-native.node +0 -0
package/native/src/lib.rs +321 -0
package/package.json +6 -5
package/public/dashboard.html +665 -0
package/src/api/files-multipart.js +30 -0
package/src/api/files-router.js +81 -0
package/src/api/middleware/budget.js +19 -1
package/src/api/middleware/load-shedding.js +17 -0
package/src/api/openai-router.js +353 -301
package/src/api/router.js +275 -40
package/src/cache/prompt.js +13 -0
package/src/clients/databricks.js +42 -18
package/src/clients/ollama-utils.js +21 -17
package/src/clients/openai-format.js +50 -10
package/src/clients/openrouter-utils.js +42 -37
package/src/clients/prompt-cache-injection.js +140 -0
package/src/clients/provider-capabilities.js +41 -0
package/src/clients/responses-format.js +8 -7
package/src/clients/standard-tools.js +1 -1
package/src/clients/xml-tool-extractor.js +307 -0
package/src/cluster.js +82 -0
package/src/config/index.js +16 -0
package/src/context/distill.js +15 -0
package/src/context/tool-result-compressor.js +563 -0
package/src/dashboard/api.js +170 -0
package/src/dashboard/router.js +13 -0
package/src/headroom/client.js +3 -109
package/src/headroom/index.js +0 -14
package/src/memory/extractor.js +22 -0
package/src/memory/search.js +0 -50
package/src/orchestrator/index.js +163 -204
package/src/orchestrator/preflight.js +188 -0
package/src/routing/index.js +64 -32
package/src/routing/interaction.js +183 -0
package/src/routing/risk-analyzer.js +194 -0
package/src/routing/telemetry.js +47 -2
package/src/server.js +15 -0
package/src/stores/file-store.js +104 -0
package/src/stores/response-store.js +25 -0
package/src/tools/index.js +1 -1
package/src/tools/smart-selection.js +11 -2
package/src/tools/web.js +1 -1
package/src/training/trajectory-compressor.js +266 -0
package/src/usage/aggregator.js +206 -0
package/src/utils/markdown-ansi.js +146 -0
package/.lynkr/telemetry.db +0 -0
package/.lynkr/telemetry.db-shm +0 -0
package/.lynkr/telemetry.db-wal +0 -0

package/src/orchestrator/index.js CHANGED Viewed

@@ -17,6 +17,7 @@ const { compressMessages: headroomCompress, isEnabled: isHeadroomEnabled } = req
 const { createAuditLogger } = require("../logger/audit-logger");
 const { getResolvedIp, runWithDnsContext } = require("../clients/dns-logger");
 const { getShuttingDown } = require("../api/health");
+const { tryPreflight, buildSatisfiedResponse: buildPreflightResponse } = require("./preflight");
 const crypto = require("crypto");
 const { asyncClone, asyncTransform, getPoolStats } = require("../workers/helpers");
 const { getSemanticCache, isSemanticCacheEnabled } = require("../cache/semantic");
@@ -68,7 +69,6 @@ const DROP_KEYS = new Set([
   "beta",
   "context_management",
   "stream",
-  "thinking",
   "max_steps",
   "max_duration_ms",
 ]);
@@ -187,7 +187,14 @@ function normaliseMessages(payload, options = {}) {
       const rawContent = message.content;
       let content;
       if (Array.isArray(rawContent)) {
-        content = flattenContent ? flattenBlocks(rawContent) : rawContent.slice();
+        const hasToolBlocks = rawContent.some(
+          (b) => b && (b.type === "tool_use" || b.type === "tool_result" || b.type === "document" || b.type === "image" || b.type === "thinking")
+        );
+        if (hasToolBlocks) {
+          content = rawContent.slice();
+        } else {
+          content = flattenContent ? flattenBlocks(rawContent) : rawContent.slice();
+        }
       } else if (rawContent === undefined || rawContent === null) {
         content = flattenContent ? "" : rawContent;
       } else if (typeof rawContent === "string") {
@@ -197,7 +204,11 @@ function normaliseMessages(payload, options = {}) {
       } else {
         content = rawContent;
       }
-      normalised.push({ role, content });
+      const entry = { role, content };
+      if (Array.isArray(message.tool_calls) && message.tool_calls.length > 0) {
+        entry.tool_calls = message.tool_calls;
+      }
+      normalised.push(entry);
     }
   }
   return normalised;
@@ -470,8 +481,8 @@ function injectToolLoopStopInstruction(messages, threshold = 5) {
 // requests escape it.
 const DEDUP_MAX_SIGNATURES = 50;
-const DEDUP_WARN_THRESHOLD = 2;
-const DEDUP_TERMINATE_THRESHOLD = 3;
+const DEDUP_WARN_THRESHOLD = 5;
+const DEDUP_TERMINATE_THRESHOLD = 8;
 /**
  * Initialise session.metadata.toolCallDedup if missing.
@@ -1021,10 +1032,14 @@ function toAnthropicResponse(openai, requestedModel, wantsThinking) {
   const toolCalls = Array.isArray(message.tool_calls) ? message.tool_calls : [];
   const contentItems = [];
-  if (wantsThinking) {
+  // Pass through real reasoning_content as a thinking block
+  const reasoningContent = typeof message.reasoning_content === "string" ? message.reasoning_content : "";
+  if (reasoningContent && wantsThinking) {
+    contentItems.push({ type: "thinking", thinking: reasoningContent });
+  } else if (wantsThinking) {
     contentItems.push({
       type: "thinking",
-      thinking: "Reasoning not available from the backing Databricks model.",
+      thinking: "Reasoning not available from the backing model.",
     });
   }
@@ -1220,6 +1235,13 @@ function sanitizePayload(payload) {
   }
   DROP_KEYS.forEach((key) => delete clean[key]);
+  // Conditionally keep or strip the `thinking` parameter based on provider
+  const { getThinkingBehavior } = require("../clients/provider-capabilities");
+  const thinkingBehavior = getThinkingBehavior(providerType, clean.model);
+  if (clean.thinking && thinkingBehavior !== "native") {
+    delete clean.thinking;
+  }
   if (Array.isArray(clean.tools) && clean.tools.length === 0) {
     delete clean.tools;
   } else if (providerType === "databricks") {
@@ -1362,7 +1384,9 @@ function sanitizePayload(payload) {
     clean.tools = selectedTools.length > 0 ? selectedTools : undefined;
   }
-  clean.stream = payload?.stream ?? false;
+  // Always false: the agent loop needs buffered JSON to parse tool calls.
+  // Lynkr synthesises SSE back to the client from the buffered response.
+  clean.stream = false;
   if (
     config.modelProvider?.type === "azure-anthropic" &&
@@ -1397,47 +1421,37 @@ function sanitizePayload(payload) {
   applyToonCompression(clean, config.toon, { logger });
   // FIX: Handle consecutive messages with the same role (causes llama.cpp 400 error)
-  // Strategy: Merge all consecutive messages, add instruction to focus on last request
+  // Strategy: Merge consecutive same-role messages, but NEVER merge messages
+  // that contain tool_use or tool_result blocks — they must stay intact for
+  // the provider's tool-call protocol.
   if (Array.isArray(clean.messages) && clean.messages.length > 0) {
     const merged = [];
     const messages = clean.messages;
+    const hasToolContent = (msg) => {
+      if (Array.isArray(msg?.content)) {
+        return msg.content.some(b => b && (b.type === 'tool_use' || b.type === 'tool_result'));
+      }
+      return Array.isArray(msg?.tool_calls) && msg.tool_calls.length > 0;
+    };
     for (let i = 0; i < messages.length; i++) {
       const msg = messages[i];
+      const prev = merged.length > 0 ? merged[merged.length - 1] : null;
-      if (merged.length > 0 && msg.role === merged[merged.length - 1].role) {
-        // Merge content with the previous message of the same role
-        const prevMsg = merged[merged.length - 1];
-        const prevContent = typeof prevMsg.content === 'string' ? prevMsg.content : JSON.stringify(prevMsg.content);
+      if (prev && msg.role === prev.role && !hasToolContent(msg) && !hasToolContent(prev)) {
+        const prevContent = typeof prev.content === 'string' ? prev.content : JSON.stringify(prev.content);
         const currContent = typeof msg.content === 'string' ? msg.content : JSON.stringify(msg.content);
-        prevMsg.content = prevContent + '\n\n' + currContent;
-        logger.debug({
-          mergedRole: msg.role,
-          addedContentPreview: currContent.substring(0, 50)
-        }, 'Merged consecutive message with same role');
+        prev.content = prevContent + '\n\n' + currContent;
       } else {
         merged.push({ ...msg });
       }
     }
-    // If the last message is from user, add instruction to focus on the actual request
-    if (merged.length > 0 && merged[merged.length - 1].role === 'user') {
-      const lastMsg = merged[merged.length - 1];
-      const content = typeof lastMsg.content === 'string' ? lastMsg.content : JSON.stringify(lastMsg.content);
-      // Find the last actual user request (after all the context/instructions)
-      // Add a clear separator to help the model focus
-      if (content.length > 500) {
-        lastMsg.content = content + '\n\n---\nIMPORTANT: Focus on and respond ONLY to my most recent request above. Do not summarize or acknowledge previous instructions.';
-      }
-    }
     if (merged.length !== clean.messages.length) {
       logger.debug({
         originalCount: clean.messages.length,
         mergedCount: merged.length,
-        reduced: clean.messages.length - merged.length
       }, 'Merged consecutive messages with same role');
     }
@@ -1788,9 +1802,11 @@ async function runAgentLoop({
       }
     }
-    // Inject tool termination instructions for non-Claude models
-    // This helps models know when to stop calling tools and provide a text response
-    if (steps === 1 && providerType !== 'databricks' && providerType !== 'azure-anthropic') {
+    const hasRequestTools = Array.isArray(cleanPayload.tools) && cleanPayload.tools.length > 0;
+    // Inject tool termination instructions for non-Claude models — only when tools
+    // are actually in the request. Injecting when there are no tools confuses models
+    // like MiniMax into hallucinating tool_use blocks spontaneously.
+    if (steps === 1 && hasRequestTools && providerType !== 'databricks' && providerType !== 'azure-anthropic') {
       const toolTerminationInstruction = `
 IMPORTANT TOOL USAGE RULES:
@@ -1804,6 +1820,13 @@ IMPORTANT TOOL USAGE RULES:
       logger.debug({ sessionId: session?.id ?? null }, 'Tool termination instructions injected for non-Claude model');
     }
+    // When no tools are in the request, explicitly forbid tool_use output for
+    // Ollama models that have been trained on Claude Code data and tend to emit
+    // tool_use blocks spontaneously (e.g. minimax-m2.5:cloud calling Write).
+    if (steps === 1 && !hasRequestTools && providerType === 'ollama') {
+      cleanPayload.system = (cleanPayload.system || '') + '\n\nCRITICAL: You have NO tools available. Do NOT generate tool_use, function_call, or code_execution blocks. Output ONLY text content directly.';
+    }
     // Compute model-aware token budget thresholds
     const registry = getModelRegistrySync();
     const modelInfo = registry.getCost(requestedModel);
@@ -1882,7 +1905,17 @@ IMPORTANT TOOL USAGE RULES:
         cleanPayload.tools || [],
         {
           mode: config.headroom?.mode,
-          queryContext: cleanPayload.messages[cleanPayload.messages.length - 1]?.content,
+          queryContext: (() => {
+            const last = cleanPayload.messages[cleanPayload.messages.length - 1]?.content;
+            if (typeof last === 'string') return last;
+            if (Array.isArray(last)) {
+              return last
+                .map(b => (b?.type === 'text' ? b.text : b?.type === 'tool_result' ? String(b.content ?? '') : ''))
+                .filter(Boolean)
+                .join('\n') || null;
+            }
+            return null;
+          })(),
           model: requestedModel,
           modelLimit: modelContextWindow,
           tokenBudget: effectiveMax,
@@ -1933,6 +1966,14 @@ IMPORTANT TOOL USAGE RULES:
     cleanPayload._workspace = headers["x-lynkr-workspace"];
   }
+  // RTK-inspired tool result compression: compress large tool_results
+  // before they reach the model (saves 60-90% on test/git/lint output)
+  if (config.toolResultCompression?.enabled !== false) {
+    const { compressToolResults } = require("../context/tool-result-compressor");
+    const tier = cleanPayload._routingTier || "MEDIUM";
+    compressToolResults(cleanPayload.messages, { tier });
+  }
   if (agentTimer) agentTimer.mark("preInvokeModel");
   let databricksResponse;
   try {
@@ -2127,6 +2168,21 @@ IMPORTANT TOOL USAGE RULES:
           _anthropic_block: block,
         }));
+      // Extract tool calls from text blocks that contain XML (some Ollama models)
+      if (toolCalls.length === 0) {
+        const { extractToolCallsFromText } = require("../clients/xml-tool-extractor");
+        for (const block of contentArray) {
+          if (block?.type === "text" && block?.text) {
+            const extracted = extractToolCallsFromText(block.text);
+            if (extracted.toolCalls.length > 0) {
+              toolCalls = extracted.toolCalls;
+              block.text = extracted.cleanedText || "";
+              break;
+            }
+          }
+        }
+      }
       logger.debug(
         {
           sessionId: session?.id ?? null,
@@ -2141,6 +2197,17 @@ IMPORTANT TOOL USAGE RULES:
       const choice = databricksResponse.json?.choices?.[0];
       message = choice?.message ?? {};
       toolCalls = Array.isArray(message.tool_calls) ? message.tool_calls : [];
+      // Extract tool calls embedded as XML/text in content (Minimax, Qwen, GLM, Llama, etc.)
+      if (toolCalls.length === 0 && typeof message.content === "string" && message.content.trim()) {
+        const { extractToolCallsFromText } = require("../clients/xml-tool-extractor");
+        const extracted = extractToolCallsFromText(message.content);
+        if (extracted.toolCalls.length > 0) {
+          toolCalls = extracted.toolCalls;
+          message.tool_calls = toolCalls;
+          message.content = extracted.cleanedText;
+        }
+      }
     }
     // Guard: drop hallucinated tool calls when no tools were sent to the model.
@@ -2155,7 +2222,30 @@ IMPORTANT TOOL USAGE RULES:
         noToolInjection: !!cleanPayload._noToolInjection,
       }, "Dropped hallucinated tool calls (no tools were sent to model)");
       toolCalls = [];
-      // If there's also no text content, treat as empty response (handled below)
+      // Check if there is any text content alongside the hallucinated tool calls.
+      // If not, the response is effectively empty. Inject a redirect message so the
+      // model outputs the artifact directly instead of looping tool-call attempts.
+      const hasTextContent = isAnthropicFormat
+        ? (databricksResponse.json?.content ?? []).some(b => b?.type === "text" && String(b.text || "").trim().length > 0)
+        : (typeof message.content === "string" && message.content.trim().length > 0);
+      if (!hasTextContent && steps < settings.maxSteps - 1) {
+        logger.info({
+          sessionId: session?.id ?? null,
+          step: steps,
+        }, "Hallucinated tool calls with no text content — injecting redirect to force direct output");
+        // Push a phantom assistant turn (thinking only, no tool_use) then a user
+        // redirect message so the model outputs the artifact directly.
+        const redirectUser = {
+          role: "user",
+          content: "You don't have any tools available in this context. Please output the result directly as an <artifact identifier=\"design.html\" type=\"text/html\" title=\"Design\"> block containing complete HTML. Do not attempt to call any tools.",
+        };
+        cleanPayload.messages.push(redirectUser);
+        steps++;
+        continue;
+      }
     }
     if (toolCalls.length > 0) {
@@ -2167,6 +2257,7 @@ IMPORTANT TOOL USAGE RULES:
       } else {
         // Convert OpenAI/OpenRouter format to Anthropic content blocks
         const contentBlocks = [];
+        let toolCallIdx = 0;
         // Add text content if present
         if (message.content && typeof message.content === 'string' && message.content.trim()) {
@@ -2198,7 +2289,7 @@ IMPORTANT TOOL USAGE RULES:
           contentBlocks.push({
             type: "tool_use",
-            id: toolCall.id || `toolu_${Date.now()}_${Math.random().toString(36).substr(2, 9)}`,
+            id: toolCall.id || `toolu_${Date.now()}_${(toolCallIdx++).toString(36)}_${Math.random().toString(36).substr(2, 6)}`,
             name: func.name || toolCall.name || "unknown",
             input
           });
@@ -2262,7 +2353,7 @@ IMPORTANT TOOL USAGE RULES:
       const serverSideToolCalls = [];
       const clientSideToolCalls = [];
-      const SERVER_SIDE_TOOLS = new Set(["task", "web_search", "web_fetch", "websearch", "webfetch", "web_agent"]);
+      const SERVER_SIDE_TOOLS = new Set(["task", "Task", "web_search", "web_fetch", "websearch", "webfetch", "web_agent", "WebSearch", "WebFetch", "WebAgent"]);
       for (const call of toolCalls) {
         const toolName = (call.function?.name ?? call.name ?? "").toLowerCase();
@@ -2285,7 +2376,9 @@ IMPORTANT TOOL USAGE RULES:
             executionMode,
             clientTools: clientSideToolCalls.map((c) => c.function?.name ?? c.name),
           },
-          "Hybrid mode: returning non-Task tools to client, executing Task tools on server"
+          clientSideToolCalls.length > 1
+            ? `Parallel tool passthrough: ${clientSideToolCalls.length} tools → client`
+            : "Hybrid mode: returning non-Task tools to client, executing Task tools on server"
         );
         // Filter sessionContent to only include client-side tool_use blocks
@@ -2322,26 +2415,11 @@ IMPORTANT TOOL USAGE RULES:
         // then continue the conversation loop. For now, let's fall through to execute server-side tools.
         if (serverSideToolCalls.length === 0) {
           // No server-side tools - pure passthrough
-          // Record outbound client-side tool calls into cross-request dedup tracker
-          if (session && clientSideToolCalls.length > 0) {
-            ensureDedupStructure(session);
-            for (const call of clientSideToolCalls) {
-              recordCrossRequestToolCall(session, call);
-            }
-            // Persist dedup state (non-ephemeral sessions only)
-            if (session.id && !session._ephemeral) {
-              try { upsertSession(session.id, { metadata: session.metadata }); } catch (e) {
-                logger.debug({ err: e.message }, "Failed to persist outbound dedup state");
-              }
-            }
-            const { maxCount, toolName: dedupTool } = getMaxDedupCount(session);
-            logger.debug({
-              sessionId: session?.id ?? null,
-              clientToolCount: clientSideToolCalls.length,
-              maxDedupCount: maxCount,
-              maxDedupTool: dedupTool,
-            }, "Cross-request tool dedup: recorded outbound tool calls");
-          }
+          // Do NOT record outbound tool calls here — the inbound recording
+          // on the next request (when the client sends results back) is
+          // enough to detect real loops.  Recording both outbound + inbound
+          // for the same call double-counts and triggers the dedup warning
+          // on the very first normal tool round-trip.
           return {
             response: {
@@ -3646,6 +3724,28 @@ async function processMessage({ payload, headers, session, cwd, options = {} })
     };
   }
+  // === PREFLIGHT CHECK ===
+  // If the request supplied preflight_commands and they all pass in
+  // the workspace, the work is already done — short-circuit with a
+  // synthetic response and never touch the model. No-op when the
+  // feature is disabled or the request didn't opt in.
+  const preflightResult = tryPreflight({ payload, cwd });
+  if (preflightResult?.satisfied) {
+    logger.info({
+      commands: preflightResult.results.length,
+      reason: preflightResult.reason,
+    }, '[Preflight] Satisfied — skipping model call');
+    return buildPreflightResponse({
+      model: requestedModel,
+      preflightResult,
+    });
+  }
+  if (preflightResult && !preflightResult.satisfied) {
+    logger.debug({
+      failedCommand: preflightResult.failedCommand,
+    }, '[Preflight] Not satisfied — proceeding with model call');
+  }
   // === TOOL LOOP GUARD (EARLY CHECK) ===
   // Check BEFORE sanitization since sanitizePayload removes conversation history
   // All providers use threshold 2 to catch loops early
@@ -3787,150 +3887,9 @@ async function processMessage({ payload, headers, session, cwd, options = {} })
       }
     }
-    // Client mode still uses the relaxed per-request threshold for the count-based guard
-    const effectiveThreshold = 10;
-    if (toolResultCount >= effectiveThreshold) {
-      logger.error({
-        toolResultCount,
-        toolUseCount,
-        threshold: effectiveThreshold,
-        sessionId: session?.id ?? null,
-      }, "[ToolLoopGuard] FORCE TERMINATING - too many tool calls in conversation");
-      let toolResultsSummary = "";
-      const messages = payload?.messages || [];
-      let lastUserTextIndex = -1;
-      for (let i = messages.length - 1; i >= 0; i--) {
-        const msg = messages[i];
-        if (msg?.role !== 'user') continue;
-        if (typeof msg.content === 'string' && msg.content.trim().length > 0) {
-          lastUserTextIndex = i;
-          break;
-        }
-        if (Array.isArray(msg.content)) {
-          const hasText = msg.content.some(block =>
-            (block?.type === 'text' && block?.text?.trim?.().length > 0) ||
-            (block?.type === 'input_text' && block?.input_text?.trim?.().length > 0)
-          );
-          if (hasText) {
-            lastUserTextIndex = i;
-            break;
-          }
-        }
-      }
-      const startIndex = lastUserTextIndex >= 0 ? lastUserTextIndex : 0;
-      for (let i = startIndex; i < messages.length; i++) {
-        const msg = messages[i];
-        if (!msg || !Array.isArray(msg.content)) continue;
-        for (const block of msg.content) {
-          if (block?.type === 'tool_result' && block?.content) {
-            const content = typeof block.content === 'string'
-              ? block.content
-              : JSON.stringify(block.content);
-            if (content && !content.includes('Found 0')) {
-              toolResultsSummary += content + "\n";
-            }
-          }
-        }
-      }
-      let responseText = `Based on the tool results, here's what I found:\n\n`;
-      if (toolResultsSummary.trim()) {
-        responseText += toolResultsSummary.trim();
-      } else {
-        responseText += `The tools executed but didn't return clear results. Please check the tool output above or try a different command.`;
-      }
-      const forcedResponse = {
-        id: `msg_forced_${Date.now()}`,
-        type: "message",
-        role: "assistant",
-        content: [{ type: "text", text: responseText }],
-        model: requestedModel || "unknown",
-        stop_reason: "end_turn",
-        stop_sequence: null,
-        usage: { input_tokens: 0, output_tokens: 100 },
-      };
-      return {
-        status: 200,
-        body: forcedResponse,
-        terminationReason: "tool_loop_guard",
-      };
-    }
-  } else {
-    // Server mode: use existing threshold 2 with countToolCallsInHistory
-    const effectiveThreshold = toolLoopThreshold;
-    if (toolResultCount >= effectiveThreshold) {
-      logger.error({
-        toolResultCount,
-        toolUseCount,
-        threshold: effectiveThreshold,
-        sessionId: session?.id ?? null,
-      }, "[ToolLoopGuard] FORCE TERMINATING - too many tool calls in conversation");
-      let toolResultsSummary = "";
-      const messages = payload?.messages || [];
-      let lastUserTextIndex = -1;
-      for (let i = messages.length - 1; i >= 0; i--) {
-        const msg = messages[i];
-        if (msg?.role !== 'user') continue;
-        if (typeof msg.content === 'string' && msg.content.trim().length > 0) {
-          lastUserTextIndex = i;
-          break;
-        }
-        if (Array.isArray(msg.content)) {
-          const hasText = msg.content.some(block =>
-            (block?.type === 'text' && block?.text?.trim?.().length > 0) ||
-            (block?.type === 'input_text' && block?.input_text?.trim?.().length > 0)
-          );
-          if (hasText) {
-            lastUserTextIndex = i;
-            break;
-          }
-        }
-      }
-      const startIndex = lastUserTextIndex >= 0 ? lastUserTextIndex : 0;
-      for (let i = startIndex; i < messages.length; i++) {
-        const msg = messages[i];
-        if (!msg || !Array.isArray(msg.content)) continue;
-        for (const block of msg.content) {
-          if (block?.type === 'tool_result' && block?.content) {
-            const content = typeof block.content === 'string'
-              ? block.content
-              : JSON.stringify(block.content);
-            if (content && !content.includes('Found 0')) {
-              toolResultsSummary += content + "\n";
-            }
-          }
-        }
-      }
-      let responseText = `Based on the tool results, here's what I found:\n\n`;
-      if (toolResultsSummary.trim()) {
-        responseText += toolResultsSummary.trim();
-      } else {
-        responseText += `The tools executed but didn't return clear results. Please check the tool output above or try a different command.`;
-      }
-      const forcedResponse = {
-        id: `msg_forced_${Date.now()}`,
-        type: "message",
-        role: "assistant",
-        content: [{ type: "text", text: responseText }],
-        model: requestedModel || "unknown",
-        stop_reason: "end_turn",
-        stop_sequence: null,
-        usage: { input_tokens: 0, output_tokens: 100 },
-      };
-      return {
-        status: 200,
-        body: forcedResponse,
-        terminationReason: "tool_loop_guard",
-      };
-    }
+    // No count-based tool_loop_guard. Natural limits (maxSteps, maxDurationMs,
+    // provider token/rate limits, client-side loop detection, and the
+    // cross-request dedup above) are sufficient protection.
   }
   const { createTimer } = require("../utils/perf-timer");