npm - @botbotgo/agent-harness - Versions diffs - 0.0.321 → 0.0.323 - Mend

@botbotgo/agent-harness 0.0.321 → 0.0.323

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/dist/package-version.d.ts CHANGED Viewed

	@@ -1 +1 @@
1	- export declare const AGENT_HARNESS_VERSION = "0.0.320";
1	+ export declare const AGENT_HARNESS_VERSION = "0.0.322";

package/dist/package-version.js CHANGED Viewed

	@@ -1 +1 @@
1	- export const AGENT_HARNESS_VERSION = "0.0.320";
1	+ export const AGENT_HARNESS_VERSION = "0.0.322";

package/dist/resource/backend/workspace-scoped-backend.js CHANGED Viewed

@@ -34,6 +34,9 @@ export function normalizeWorkspaceScopedPath(rootDir, inputPath) {
     if (typeof inputPath !== "string" || inputPath.length === 0 || !path.isAbsolute(inputPath)) {
         return inputPath;
     }
+    if (inputPath.startsWith("/large_tool_results/")) {
+        throw new Error(`Path '${inputPath}' is an internal runtime spill path, not a workspace file. Do not read internal runtime spill files such as '/large_tool_results/...'. Use the preview already in context, rerun the producing tool with narrower output, or write the needed data to a workspace-relative file instead.`);
+    }
     if (inputPath === "/") {
         return ".";
     }

package/dist/resources/prompts/runtime/autonomous-investigation-recovery.md ADDED Viewed

@@ -0,0 +1 @@

+ Do not stop at a plan or ask the user to choose the next obvious diagnostic step when the request is for deep investigation, root-cause analysis, or step-by-step execution and tool evidence already exists in the conversation. Continue the investigation yourself with the next concrete tool call. If the task is non-trivial, call write_todos, then keep executing the next diagnostic steps until you can explain the likely causes, impact, and recommended next actions.

package/dist/resources/prompts/runtime/internal-runtime-spill-path.md ADDED Viewed

	@@ -0,0 +1 @@
1	+ The previous tool call tried to read an internal runtime spill path such as '/large_tool_results/...'. Do not read internal runtime spill files. Use the preview already present in the conversation, rerun the producing tool with narrower output if needed, or write the needed data to a workspace-relative file and read that file instead.

package/dist/resources/tools/_runtime_tool_helpers.mjs CHANGED Viewed

@@ -78,6 +78,9 @@ export function normalizeWorkspacePath(context, inputPath, fallback = ".") {
   if (!workspaceRoot || !path.isAbsolute(rawPath)) {
     return rawPath;
   }
+  if (rawPath.startsWith("/large_tool_results/")) {
+    throw new Error(`Path '${rawPath}' is an internal runtime spill path, not a workspace file. Do not read internal runtime spill files such as '/large_tool_results/...'. Use the preview already in context, rerun the producing tool with narrower output, or write the needed data to a workspace-relative file instead.`);
+  }
   const resolvedWorkspaceRoot = path.resolve(workspaceRoot);
   const resolvedInputPath = path.resolve(rawPath);
   if (resolvedInputPath === resolvedWorkspaceRoot || resolvedInputPath.startsWith(`${resolvedWorkspaceRoot}${path.sep}`)) {

package/dist/runtime/adapter/tool/builtin-middleware-tools.js CHANGED Viewed

@@ -97,6 +97,9 @@ function normalizeWorkspacePathOrThrow(backend, inputPath) {
     if (!workspaceRoot || !path.isAbsolute(inputPath)) {
         return inputPath;
     }
+    if (inputPath.startsWith("/large_tool_results/")) {
+        throw new Error(`Path '${inputPath}' is an internal runtime spill path, not a workspace file. Do not read internal runtime spill files such as '/large_tool_results/...'. Use the preview already in context, rerun the producing tool with narrower output, or write the needed data to a workspace-relative file instead.`);
+    }
     const normalizedWorkspaceRoot = path.resolve(workspaceRoot);
     const normalizedInputPath = path.resolve(inputPath);
     if (normalizedInputPath === normalizedWorkspaceRoot || normalizedInputPath.startsWith(`${normalizedWorkspaceRoot}${path.sep}`)) {

package/dist/runtime/parsing/output-recovery.d.ts CHANGED Viewed

@@ -1,5 +1,6 @@
 export declare function isToolCallValidationFailure(error: unknown): boolean;
 export declare function isWorkspacePathScopeFailure(error: unknown): boolean;
+export declare function isInternalRuntimeSpillPathFailure(error: unknown): boolean;
 export declare function isRepairableWriteTodosPlaceholderFailure(error: unknown): boolean;
 export declare function isRepairableWriteTodosContentFailure(error: unknown): boolean;
 export declare function isRepairableWriteTodosEmptyFailure(error: unknown): boolean;
@@ -11,4 +12,4 @@ export declare function resolveExecutionWithoutToolEvidenceTextInstruction(reque
 export declare function resolveToolCallRecoveryInstruction(error: unknown): string | null;
 export declare function appendToolRecoveryInstruction(input: unknown, instruction: string): unknown;
 export declare function wrapResolvedModel<T>(value: T): T;
-export { BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION } from "../prompts/runtime-prompts.js";
+export { AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION, BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION } from "../prompts/runtime-prompts.js";

package/dist/runtime/parsing/output-recovery.js CHANGED Viewed

@@ -1,4 +1,4 @@
-import { BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION, } from "../prompts/runtime-prompts.js";
+import { AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION, BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION, } from "../prompts/runtime-prompts.js";
 import { hasToolCalls, readTextContent, wrapNormalizedMessage } from "./output-content.js";
 function isToolCallParseFailure(error) {
     if (!(error instanceof Error))
@@ -52,6 +52,9 @@ function collectErrorMessages(error) {
 export function isWorkspacePathScopeFailure(error) {
     return collectErrorMessages(error).some((message) => /outside the workspace root|workspace-relative path/i.test(message));
 }
+export function isInternalRuntimeSpillPathFailure(error) {
+    return collectErrorMessages(error).some((message) => /\/large_tool_results\/|internal runtime spill path/i.test(message));
+}
 export function isRepairableWriteTodosPlaceholderFailure(error) {
     if (!(error instanceof Error))
         return false;
@@ -81,6 +84,7 @@ export function isToolCallRecoveryFailure(error) {
         isToolCallValidationFailure(error) ||
         isRepairableWriteTodosEmptyFailure(error) ||
         isRepairableWriteTodosPlaceholderFailure(error) ||
+        isInternalRuntimeSpillPathFailure(error) ||
         isWorkspacePathScopeFailure(error));
 }
 function extractMessageContent(message) {
@@ -123,6 +127,71 @@ function extractLastUserMessageText(input) {
     }
     return "";
 }
+function extractAllUserMessageText(input) {
+    if (!Array.isArray(input) && !(typeof input === "object" && input && Array.isArray(input.messages))) {
+        return "";
+    }
+    const messages = Array.isArray(input) ? input : input.messages;
+    const values = [];
+    for (const message of messages) {
+        if (typeof message !== "object" || !message)
+            continue;
+        const typed = message;
+        if (typed.role === "user") {
+            const text = extractMessageContent(message).trim();
+            if (text)
+                values.push(text);
+            continue;
+        }
+        const ids = Array.isArray(typed.id) ? typed.id.filter((item) => typeof item === "string") : [];
+        const typeName = ids.at(-1);
+        const runtimeType = typeof message._getType === "function"
+            ? message._getType()
+            : typeof message.getType === "function"
+                ? message.getType()
+                : undefined;
+        if (typeName === "HumanMessage" || runtimeType === "human") {
+            const text = extractMessageContent(message).trim();
+            if (text)
+                values.push(text);
+            continue;
+        }
+        if (typeof typed.kwargs === "object" && typed.kwargs && typed.kwargs.role === "user") {
+            const text = extractMessageContent(message).trim();
+            if (text)
+                values.push(text);
+        }
+    }
+    return values.join("\n").trim();
+}
+function hasToolResultEvidence(input) {
+    if (!Array.isArray(input) && !(typeof input === "object" && input && Array.isArray(input.messages))) {
+        return false;
+    }
+    const messages = Array.isArray(input) ? input : input.messages;
+    for (const message of messages) {
+        if (typeof message !== "object" || !message)
+            continue;
+        const typed = message;
+        if (typed.role === "tool") {
+            return true;
+        }
+        const ids = Array.isArray(typed.id) ? typed.id.filter((item) => typeof item === "string") : [];
+        const typeName = ids.at(-1);
+        const runtimeType = typeof message._getType === "function"
+            ? message._getType()
+            : typeof message.getType === "function"
+                ? message.getType()
+                : undefined;
+        if (typeName === "ToolMessage" || runtimeType === "tool") {
+            return true;
+        }
+        if (typeof typed.kwargs === "object" && typed.kwargs && typed.kwargs.role === "tool") {
+            return true;
+        }
+    }
+    return false;
+}
 function isToolRequiredExecutionPrompt(text) {
     if (!text)
         return false;
@@ -130,6 +199,12 @@ function isToolRequiredExecutionPrompt(text) {
         /\b(create|write|edit|read|show|display|append|run|execute|wait|sleep|repeat|loop|file|files|command)\b/i.test(text) ||
         /(创建|写入|读取|显示|追加|执行|运行|等待|重复|文件|命令|步骤)/.test(text));
 }
+function isAutonomousInvestigationPrompt(text) {
+    if (!text)
+        return false;
+    return (/\b(root cause|rca|deep investigation|investigate deeply|investigate fully|step by step|find all (?:issues|problems|causes)|continue investigating|keep digging|until complete|until you find)\b/i.test(text) ||
+        /(根因分析|深度调查|深入调查|一步一步|逐步分析|逐个分析|继续排查|排查到底|找到所有问题|查出所有问题|直到完成|直到找到.*原因)/.test(text));
+}
 function isBrowserOrUrlTask(text) {
     if (!text)
         return false;
@@ -149,6 +224,18 @@ function claimsMissingBrowserCapability(text) {
     return (/\b(i do not have the capability to access external websites|i do not have access to external websites|i cannot access external websites|i can(?:not|'t) browse|i do not have (?:direct )?(?:web|browser|browsing) access|i do not have .*tool.*(?:website|url|browser)|i cannot summarize .* because .*tool.*failed|please provide (?:the )?text content.*i (?:will|can) summarize)\b/i.test(text) ||
         /(我没有直接访问外部网站|我无法直接访问外部网站|我无法访问外部网站|我不能访问外部网站|我无法直接访问外部网站内容|我无法访问网页|请提供文本内容.*我将为您进行总结|我没有.*浏览.*工具|我没有.*网页抓取.*工具|我没有.*访问.*网站.*工具|我无法总结该网页内容，因为.*工具执行失败)/.test(text));
 }
+function asksUserToChooseObviousNextDiagnosticStep(text) {
+    if (!text)
+        return false;
+    return (/\b(which (?:direction|aspect|node|namespace|part)|what would you like me to check|please choose|please tell me (?:which|what|where) .* (?:check|inspect|investigate)|which .* should we start with)\b/i.test(text) ||
+        /(请告诉我.*(哪个|哪一个|什么方向)|请选择.*(方向|项目|节点)|您希望我.*(检查|查看).*(哪个|哪一个|方向)|从哪个方向开始)/.test(text));
+}
+function claimsFutureExecutionWithoutToolEvidence(text) {
+    if (!text)
+        return false;
+    return (/\b(i will|i'll|we will|next i(?:'ll| will)|i am going to)\b.*\b(run|execute|inspect|check|investigate|continue|start)\b/i.test(text) ||
+        /(我将|我会|接下来我会|现在我将|我将继续).*(执行|检查|查看|调查|排查|开始|继续)/.test(text));
+}
 export function isRetrySafeInvalidToolSelectionError(value) {
     const text = readTextContent(value).trim();
     if (!text)
@@ -156,9 +243,9 @@ export function isRetrySafeInvalidToolSelectionError(value) {
     return /is not a valid tool, try one of \[/i.test(text);
 }
 export function shouldValidateExecutionWithoutToolEvidence(request) {
-    const userText = extractLastUserMessageText(request);
+    const userText = extractAllUserMessageText(request);
     const browserOrUrlTask = isBrowserOrUrlTask(userText);
-    return browserOrUrlTask || isToolRequiredExecutionPrompt(userText);
+    return browserOrUrlTask || isToolRequiredExecutionPrompt(userText) || isAutonomousInvestigationPrompt(userText);
 }
 function extractAssistantTextFromResult(result) {
     if (typeof result === "object" && result && "messages" in result) {
@@ -192,14 +279,21 @@ export function resolveExecutionWithoutToolEvidenceInstruction(request, result)
     return resolveExecutionWithoutToolEvidenceTextInstruction(request, assistantText, hasToolCalls(result));
 }
 export function resolveExecutionWithoutToolEvidenceTextInstruction(request, assistantText, toolCallEvidence = false) {
-    const userText = extractLastUserMessageText(request);
+    const userText = extractAllUserMessageText(request);
     const browserOrUrlTask = isBrowserOrUrlTask(userText);
+    const autonomousInvestigationTask = isAutonomousInvestigationPrompt(userText);
+    const toolResultEvidence = hasToolResultEvidence(request);
     if (!shouldValidateExecutionWithoutToolEvidence(request)) {
         return null;
     }
     if (!assistantText || toolCallEvidence) {
         return null;
     }
+    if (autonomousInvestigationTask &&
+        toolResultEvidence &&
+        (asksUserToChooseObviousNextDiagnosticStep(assistantText) || claimsFutureExecutionWithoutToolEvidence(assistantText))) {
+        return AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION;
+    }
     if (browserOrUrlTask && claimsMissingBrowserCapability(assistantText)) {
         return BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION;
     }
@@ -215,6 +309,9 @@ export function resolveToolCallRecoveryInstruction(error) {
     if (isRepairableWriteTodosPlaceholderFailure(error)) {
         return WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION;
     }
+    if (isInternalRuntimeSpillPathFailure(error)) {
+        return INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION;
+    }
     if (isWorkspacePathScopeFailure(error)) {
         return WORKSPACE_RELATIVE_PATH_INSTRUCTION;
     }
@@ -285,4 +382,4 @@ export function wrapResolvedModel(value) {
         },
     });
 }
-export { BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION } from "../prompts/runtime-prompts.js";
+export { AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION, BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION } from "../prompts/runtime-prompts.js";

package/dist/runtime/prompts/runtime-prompts.d.ts CHANGED Viewed

@@ -9,6 +9,8 @@ export declare const WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION: string;
 export declare const WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION: string;
 export declare const EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION: string;
 export declare const EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION: string;
+export declare const AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION: string;
+export declare const INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION: string;
 export declare const WORKSPACE_RELATIVE_PATH_INSTRUCTION: string;
 export declare function renderDurableMemoryContextPrompt(memoryContext: string): string;
 export declare function renderSlashCommandSkillInstruction(input: {

package/dist/runtime/prompts/runtime-prompts.js CHANGED Viewed

@@ -12,6 +12,8 @@ export const WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION = readRuntimePrompt(
 export const WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION = readRuntimePrompt("write-todos-descriptive-content");
 export const EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION = readRuntimePrompt("execution-with-tool-evidence");
 export const EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION = readRuntimePrompt("execution-with-tool-evidence-retry");
+export const AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION = readRuntimePrompt("autonomous-investigation-recovery");
+export const INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION = readRuntimePrompt("internal-runtime-spill-path");
 export const WORKSPACE_RELATIVE_PATH_INSTRUCTION = readRuntimePrompt("workspace-relative-path");
 export function renderDurableMemoryContextPrompt(memoryContext) {
     return renderBundledTemplate("prompts/runtime/durable-memory-context.md", {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@botbotgo/agent-harness",
-  "version": "0.0.321",
+  "version": "0.0.323",
   "description": "Workspace runtime for multi-agent applications",
   "license": "MIT",
   "type": "module",