npm - @botbotgo/agent-harness - Versions diffs - 0.0.324 → 0.0.326 - Mend

@botbotgo/agent-harness 0.0.324 → 0.0.326

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39)

package/README.md +2 -1
package/README.zh.md +2 -1
package/dist/cli/main.js +84 -2
package/dist/cli/managed-service.d.ts +2 -1
package/dist/cli/managed-service.js +78 -2
package/dist/cli/options-serve.d.ts +13 -0
package/dist/cli/options-serve.js +116 -0
package/dist/cli/options.d.ts +1 -1
package/dist/cli/options.js +7 -1
package/dist/cli/server-commands.d.ts +1 -1
package/dist/cli/server-commands.js +28 -8
package/dist/config/knowledge/knowledge-runtime.yaml +3 -2
package/dist/config/prompts/orchestra-system.md +4 -0
package/dist/config/runtime/runtime-memory.yaml +3 -2
package/dist/knowledge/module.js +2 -1
package/dist/package-version.d.ts +2 -2
package/dist/package-version.js +2 -2
package/dist/resource/isolation.js +28 -0
package/dist/resources/prompts/runtime/autonomous-investigation-recovery.md +1 -1
package/dist/resources/prompts/runtime/durable-memory-context.md +2 -0
package/dist/resources/prompts/runtime/execution-with-tool-evidence-retry.md +1 -1
package/dist/resources/prompts/runtime/write-todos-required-plan.md +1 -0
package/dist/runtime/adapter/flow/stream-runtime.js +9 -141
package/dist/runtime/adapter/model/invocation-request.js +1 -1
package/dist/runtime/adapter/tool/builtin-middleware-tools.js +22 -8
package/dist/runtime/harness/run/stream-run.js +17 -0
package/dist/runtime/harness/system/runtime-memory-manager.js +4 -0
package/dist/runtime/harness/system/runtime-memory-policy.d.ts +14 -0
package/dist/runtime/harness/system/runtime-memory-policy.js +19 -0
package/dist/runtime/parsing/output-parsing.d.ts +2 -1
package/dist/runtime/parsing/output-parsing.js +2 -1
package/dist/runtime/parsing/output-recovery.d.ts +4 -2
package/dist/runtime/parsing/output-recovery.js +30 -264
package/dist/runtime/parsing/stream-event-parsing.js +10 -1
package/dist/runtime/prompts/runtime-prompts.d.ts +1 -0
package/dist/runtime/prompts/runtime-prompts.js +1 -0
package/dist/scaffold/init-project.js +6 -4
package/dist/tools.js +25 -2
package/package.json +1 -1

package/dist/runtime/parsing/output-recovery.js CHANGED Viewed

@@ -1,14 +1,11 @@
-import { AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION, BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION, } from "../prompts/runtime-prompts.js";
-import { hasToolCalls, readTextContent, wrapNormalizedMessage } from "./output-content.js";
+import { EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION, } from "../prompts/runtime-prompts.js";
+import { wrapNormalizedMessage, readTextContent } from "./output-content.js";
 function isToolCallParseFailure(error) {
-    if (!(error instanceof Error))
-        return false;
-    return /error parsing tool call:/i.test(error.message);
+    return error instanceof Error && /error parsing tool call:/i.test(error.message);
 }
 function isStructuredValidationIssue(value) {
-    if (typeof value !== "object" || !value || Array.isArray(value)) {
+    if (typeof value !== "object" || !value || Array.isArray(value))
         return false;
-    }
     const typed = value;
     return typeof typed.code === "string" && Array.isArray(typed.path) && (typed.message === undefined || typeof typed.message === "string");
 }
@@ -31,18 +28,16 @@ export function isToolCallValidationFailure(error) {
     return /Received tool input did not match expected schema/i.test(message) && /(?:→\s*at|at)\s+[\w[\].]+/i.test(message);
 }
 function collectErrorMessages(error) {
-    if (!error) {
+    if (!error)
         return [];
-    }
     if (error instanceof Error) {
         const nested = Array.isArray(error.errors)
             ? (error.errors ?? []).flatMap((item) => collectErrorMessages(item))
             : [];
         return [error.message, ...nested].filter((value) => typeof value === "string" && value.trim().length > 0);
     }
-    if (typeof error === "string" && error.trim().length > 0) {
+    if (typeof error === "string" && error.trim().length > 0)
         return [error];
-    }
     if (typeof error === "object") {
         const record = error;
         return [record.message, record.error, record.details].flatMap((item) => collectErrorMessages(item));
@@ -56,28 +51,13 @@ export function isInternalRuntimeSpillPathFailure(error) {
     return collectErrorMessages(error).some((message) => /\/large_tool_results\/|internal runtime spill path/i.test(message));
 }
 export function isRepairableWriteTodosPlaceholderFailure(error) {
-    if (!(error instanceof Error))
-        return false;
-    const message = error.message.trim();
-    if (!message)
-        return false;
-    return /write_todos/i.test(message) && /descriptive task content|placeholder entries/i.test(message);
+    return error instanceof Error && /write_todos/i.test(error.message) && /descriptive task content|placeholder entries/i.test(error.message);
 }
 export function isRepairableWriteTodosContentFailure(error) {
-    if (!(error instanceof Error))
-        return false;
-    const message = error.message.trim();
-    if (!message)
-        return false;
-    return /write_todos/i.test(message) && /todos\[\d+\]\.content/i.test(message);
+    return error instanceof Error && /write_todos/i.test(error.message) && /todos\[\d+\]\.content/i.test(error.message);
 }
 export function isRepairableWriteTodosEmptyFailure(error) {
-    if (!(error instanceof Error))
-        return false;
-    const message = error.message.trim();
-    if (!message)
-        return false;
-    return /write_todos/i.test(message) && /Initial write_todos call cannot use an empty todo list/i.test(message);
+    return error instanceof Error && /write_todos/i.test(error.message) && /Initial write_todos call cannot use an empty todo list/i.test(error.message);
 }
 export function isToolCallRecoveryFailure(error) {
     return (isToolCallParseFailure(error) ||
@@ -87,237 +67,39 @@ export function isToolCallRecoveryFailure(error) {
         isInternalRuntimeSpillPathFailure(error) ||
         isWorkspacePathScopeFailure(error));
 }
-function extractMessageContent(message) {
-    if (typeof message !== "object" || !message)
-        return "";
-    const typed = message;
-    if (typed.content !== undefined)
-        return readTextContent(typed.content);
-    if (typeof typed.kwargs === "object" && typed.kwargs) {
-        return readTextContent(typed.kwargs.content);
-    }
-    return "";
-}
-function extractLastUserMessageText(input) {
-    if (!Array.isArray(input) && !(typeof input === "object" && input && Array.isArray(input.messages))) {
-        return "";
-    }
-    const messages = Array.isArray(input) ? input : input.messages;
-    for (let index = messages.length - 1; index >= 0; index -= 1) {
-        const message = messages[index];
-        if (typeof message !== "object" || !message)
-            continue;
-        const typed = message;
-        if (typed.role === "user") {
-            return extractMessageContent(message).trim();
-        }
-        const ids = Array.isArray(typed.id) ? typed.id.filter((item) => typeof item === "string") : [];
-        const typeName = ids.at(-1);
-        const runtimeType = typeof message._getType === "function"
-            ? message._getType()
-            : typeof message.getType === "function"
-                ? message.getType()
-                : undefined;
-        if (typeName === "HumanMessage" || runtimeType === "human") {
-            return extractMessageContent(message).trim();
-        }
-        if (typeof typed.kwargs === "object" && typed.kwargs && typed.kwargs.role === "user") {
-            return extractMessageContent(message).trim();
-        }
-    }
-    return "";
-}
-function extractAllUserMessageText(input) {
-    if (!Array.isArray(input) && !(typeof input === "object" && input && Array.isArray(input.messages))) {
-        return "";
-    }
-    const messages = Array.isArray(input) ? input : input.messages;
-    const values = [];
-    for (const message of messages) {
-        if (typeof message !== "object" || !message)
-            continue;
-        const typed = message;
-        if (typed.role === "user") {
-            const text = extractMessageContent(message).trim();
-            if (text)
-                values.push(text);
-            continue;
-        }
-        const ids = Array.isArray(typed.id) ? typed.id.filter((item) => typeof item === "string") : [];
-        const typeName = ids.at(-1);
-        const runtimeType = typeof message._getType === "function"
-            ? message._getType()
-            : typeof message.getType === "function"
-                ? message.getType()
-                : undefined;
-        if (typeName === "HumanMessage" || runtimeType === "human") {
-            const text = extractMessageContent(message).trim();
-            if (text)
-                values.push(text);
-            continue;
-        }
-        if (typeof typed.kwargs === "object" && typed.kwargs && typed.kwargs.role === "user") {
-            const text = extractMessageContent(message).trim();
-            if (text)
-                values.push(text);
-        }
-    }
-    return values.join("\n").trim();
-}
-function hasToolResultEvidence(input) {
-    if (!Array.isArray(input) && !(typeof input === "object" && input && Array.isArray(input.messages))) {
-        return false;
-    }
-    const messages = Array.isArray(input) ? input : input.messages;
-    for (const message of messages) {
-        if (typeof message !== "object" || !message)
-            continue;
-        const typed = message;
-        if (typed.role === "tool") {
-            return true;
-        }
-        const ids = Array.isArray(typed.id) ? typed.id.filter((item) => typeof item === "string") : [];
-        const typeName = ids.at(-1);
-        const runtimeType = typeof message._getType === "function"
-            ? message._getType()
-            : typeof message.getType === "function"
-                ? message.getType()
-                : undefined;
-        if (typeName === "ToolMessage" || runtimeType === "tool") {
-            return true;
-        }
-        if (typeof typed.kwargs === "object" && typed.kwargs && typed.kwargs.role === "tool") {
-            return true;
-        }
-    }
-    return false;
-}
-function isToolRequiredExecutionPrompt(text) {
-    if (!text)
-        return false;
-    return (/write_todos/i.test(text) ||
-        /\b(create|write|edit|read|show|display|append|run|execute|wait|sleep|repeat|loop|file|files|command)\b/i.test(text) ||
-        /(创建|写入|读取|显示|追加|执行|运行|等待|重复|文件|命令|步骤)/.test(text));
-}
-function isAutonomousInvestigationPrompt(text) {
-    if (!text)
-        return false;
-    return (/\b(root cause|rca|deep investigation|investigate deeply|investigate fully|step by step|find all (?:issues|problems|causes)|continue investigating|keep digging|until complete|until you find)\b/i.test(text) ||
-        /(根因分析|深度调查|深入调查|一步一步|逐步分析|逐个分析|继续排查|排查到底|找到所有问题|查出所有问题|直到完成|直到找到.*原因)/.test(text));
-}
-function isBrowserOrUrlTask(text) {
-    if (!text)
-        return false;
-    return (/https?:\/\/\S+/i.test(text) ||
-        /\b(url|urls|website|websites|web page|webpage|browser|browse|page summary|summari[sz]e.*page|open.*page)\b/i.test(text) ||
-        /(网址|链接|网页|网站|页面|浏览器|总结.*网页|总结.*页面|打开.*网页)/.test(text));
-}
-function claimsExecutionWithoutToolEvidence(text) {
-    if (!text)
-        return false;
-    return (/\b(completed|done|created|wrote|written|read|displayed|appended|executed|waited|result|results)\b/i.test(text) ||
-        /(已创建|已写入|已读取|已显示|已追加|已执行|已等待|执行结果|状态更新|步骤\s*\d+|文件内容)/.test(text));
-}
-function claimsMissingBrowserCapability(text) {
-    if (!text)
-        return false;
-    return (/\b(i do not have the capability to access external websites|i do not have access to external websites|i cannot access external websites|i can(?:not|'t) browse|i do not have (?:direct )?(?:web|browser|browsing) access|i do not have .*tool.*(?:website|url|browser)|i cannot summarize .* because .*tool.*failed|please provide (?:the )?text content.*i (?:will|can) summarize)\b/i.test(text) ||
-        /(我没有直接访问外部网站|我无法直接访问外部网站|我无法访问外部网站|我不能访问外部网站|我无法直接访问外部网站内容|我无法访问网页|请提供文本内容.*我将为您进行总结|我没有.*浏览.*工具|我没有.*网页抓取.*工具|我没有.*访问.*网站.*工具|我无法总结该网页内容，因为.*工具执行失败)/.test(text));
-}
-function asksUserToChooseObviousNextDiagnosticStep(text) {
-    if (!text)
-        return false;
-    return (/\b(which (?:direction|aspect|node|namespace|part)|what would you like me to check|please choose|please tell me (?:which|what|where) .* (?:check|inspect|investigate)|which .* should we start with)\b/i.test(text) ||
-        /(请告诉我.*(哪个|哪一个|什么方向)|请选择.*(方向|项目|节点)|您希望我.*(检查|查看).*(哪个|哪一个|方向)|从哪个方向开始)/.test(text));
-}
-function claimsFutureExecutionWithoutToolEvidence(text) {
-    if (!text)
-        return false;
-    return (/\b(i will|i'll|we will|next i(?:'ll| will)|i am going to)\b.*\b(run|execute|inspect|check|investigate|continue|start)\b/i.test(text) ||
-        /(我将|我会|接下来我会|现在我将|我将继续).*(执行|检查|查看|调查|排查|开始|继续)/.test(text));
-}
 export function isRetrySafeInvalidToolSelectionError(value) {
     const text = readTextContent(value).trim();
-    if (!text)
-        return false;
-    return /is not a valid tool, try one of \[/i.test(text);
+    return !!text && /is not a valid tool, try one of \[/i.test(text);
 }
 export function shouldValidateExecutionWithoutToolEvidence(request) {
-    const userText = extractAllUserMessageText(request);
-    const browserOrUrlTask = isBrowserOrUrlTask(userText);
-    return browserOrUrlTask || isToolRequiredExecutionPrompt(userText) || isAutonomousInvestigationPrompt(userText);
-}
-function extractAssistantTextFromResult(result) {
-    if (typeof result === "object" && result && "messages" in result) {
-        const messages = result.messages;
-        if (Array.isArray(messages)) {
-            for (let index = messages.length - 1; index >= 0; index -= 1) {
-                const message = messages[index];
-                if (typeof message !== "object" || !message)
-                    continue;
-                const ids = Array.isArray(message.id)
-                    ? message.id.filter((item) => typeof item === "string")
-                    : [];
-                const typeName = ids.at(-1);
-                const runtimeType = typeof message._getType === "function"
-                    ? message._getType()
-                    : typeof message.getType === "function"
-                        ? message.getType()
-                        : undefined;
-                if (typeName === "AIMessage" || runtimeType === "ai") {
-                    return extractMessageContent(message).trim();
-                }
-            }
-        }
-    }
-    return "";
+    void request;
+    return false;
 }
 export function resolveExecutionWithoutToolEvidenceInstruction(request, result) {
-    const assistantText = typeof result === "object" && result && "content" in result
-        ? readTextContent(result.content).trim()
-        : extractAssistantTextFromResult(result);
-    return resolveExecutionWithoutToolEvidenceTextInstruction(request, assistantText, hasToolCalls(result));
+    void request;
+    void result;
+    return null;
 }
-export function resolveExecutionWithoutToolEvidenceTextInstruction(request, assistantText, toolCallEvidence = false) {
-    const userText = extractAllUserMessageText(request);
-    const browserOrUrlTask = isBrowserOrUrlTask(userText);
-    const autonomousInvestigationTask = isAutonomousInvestigationPrompt(userText);
-    const toolResultEvidence = hasToolResultEvidence(request);
-    if (!shouldValidateExecutionWithoutToolEvidence(request)) {
-        return null;
-    }
-    if (!assistantText || toolCallEvidence) {
-        return null;
-    }
-    if (autonomousInvestigationTask &&
-        toolResultEvidence &&
-        (asksUserToChooseObviousNextDiagnosticStep(assistantText) || claimsFutureExecutionWithoutToolEvidence(assistantText))) {
-        return AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION;
-    }
-    if (browserOrUrlTask && claimsMissingBrowserCapability(assistantText)) {
-        return BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION;
-    }
-    return claimsExecutionWithoutToolEvidence(assistantText) ? EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION : null;
+export function resolveExecutionWithoutToolEvidenceTextInstruction(request, assistantText, toolCallEvidence = false, resultEvidence = {}) {
+    void request;
+    void assistantText;
+    void toolCallEvidence;
+    void resultEvidence;
+    return null;
 }
 export function resolveToolCallRecoveryInstruction(error) {
-    if (isRepairableWriteTodosEmptyFailure(error)) {
+    if (isRepairableWriteTodosEmptyFailure(error))
         return WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION;
-    }
-    if (isRepairableWriteTodosContentFailure(error)) {
+    if (isRepairableWriteTodosContentFailure(error))
         return WRITE_TODOS_FULL_ENTRY_INSTRUCTION;
-    }
-    if (isRepairableWriteTodosPlaceholderFailure(error)) {
+    if (isRepairableWriteTodosPlaceholderFailure(error))
         return WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION;
-    }
-    if (isInternalRuntimeSpillPathFailure(error)) {
+    if (isInternalRuntimeSpillPathFailure(error))
         return INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION;
-    }
-    if (isWorkspacePathScopeFailure(error)) {
+    if (isWorkspacePathScopeFailure(error))
         return WORKSPACE_RELATIVE_PATH_INSTRUCTION;
-    }
-    if (isToolCallRecoveryFailure(error)) {
+    if (isToolCallRecoveryFailure(error))
         return STRICT_TOOL_JSON_INSTRUCTION;
-    }
     return null;
 }
 export function appendToolRecoveryInstruction(input, instruction) {
@@ -344,30 +126,15 @@ export function wrapResolvedModel(value) {
                     let activeArgs = [...args];
                     for (let attempt = 0; attempt < 3; attempt += 1) {
                         try {
-                            const normalized = wrapNormalizedMessage(await member.apply(currentTarget, activeArgs));
-                            const executionRecoveryInstruction = resolveExecutionWithoutToolEvidenceInstruction(activeArgs[0], normalized);
-                            if (!executionRecoveryInstruction) {
-                                return normalized;
-                            }
-                            if (attempt === 2) {
-                                throw new Error("Model claimed task execution without any tool calls after repeated recovery attempts. Refusing to treat that response as a successful execution.");
-                            }
-                            const nextInstruction = attempt === 0
-                                ? executionRecoveryInstruction
-                                : EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION;
-                            activeArgs = [...activeArgs];
-                            activeArgs[0] = appendToolRecoveryInstruction(activeArgs[0], nextInstruction);
+                            return wrapNormalizedMessage(await member.apply(currentTarget, activeArgs));
                         }
                         catch (error) {
                             const recoveryInstruction = resolveToolCallRecoveryInstruction(error);
-                            if (!recoveryInstruction) {
-                                throw error;
-                            }
-                            if (attempt === 2) {
+                            if (!recoveryInstruction || attempt === 2) {
                                 throw error;
                             }
                             activeArgs = [...activeArgs];
-                            activeArgs[0] = appendToolRecoveryInstruction(activeArgs[0], recoveryInstruction);
+                            activeArgs[0] = appendToolRecoveryInstruction(activeArgs[0], attempt === 0 ? recoveryInstruction : EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION);
                         }
                     }
                     throw new Error("Model invocation retry loop exited unexpectedly.");
@@ -382,4 +149,3 @@ export function wrapResolvedModel(value) {
         },
     });
 }
-export { AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION, BROWSER_CAPABILITY_DISCLAIMER_RECOVERY_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION, EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION, INTERNAL_RUNTIME_SPILL_PATH_INSTRUCTION, INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION, STRICT_TOOL_JSON_INSTRUCTION, WORKSPACE_RELATIVE_PATH_INSTRUCTION, WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION, WRITE_TODOS_FULL_ENTRY_INSTRUCTION, WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION } from "../prompts/runtime-prompts.js";

package/dist/runtime/parsing/stream-event-parsing.js CHANGED Viewed

@@ -196,7 +196,16 @@ function isErrorLikeToolOutput(value) {
     if (!message) {
         return false;
     }
-    return /(^|\b)(error|exception|failed|failure|denied|timed out|timeout|not permitted|eperm|eacces)(\b|:)/i.test(message);
+    const firstNonEmptyLine = message
+        .split("\n")
+        .map((line) => line.trim())
+        .find((line) => line.length > 0) ?? "";
+    if (!firstNonEmptyLine) {
+        return false;
+    }
+    return /^(error|exception|failed|failure|denied|timed out|timeout|not permitted|eperm|eacces)\b:?/i.test(firstNonEmptyLine)
+        || /^command failed:/i.test(firstNonEmptyLine)
+        || /^stderr:/i.test(firstNonEmptyLine);
 }
 function isEmptyInitialWriteTodosResult(value) {
     if (typeof value !== "object" || !value || Array.isArray(value)) {

package/dist/runtime/prompts/runtime-prompts.d.ts CHANGED Viewed

@@ -7,6 +7,7 @@ export declare const INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION: string;
 export declare const WRITE_TODOS_FULL_ENTRY_INSTRUCTION: string;
 export declare const WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION: string;
 export declare const WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION: string;
+export declare const WRITE_TODOS_REQUIRED_PLAN_INSTRUCTION: string;
 export declare const EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION: string;
 export declare const EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION: string;
 export declare const AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION: string;

package/dist/runtime/prompts/runtime-prompts.js CHANGED Viewed

@@ -10,6 +10,7 @@ export const INVALID_TOOL_SELECTION_RECOVERY_INSTRUCTION = readRuntimePrompt("in
 export const WRITE_TODOS_FULL_ENTRY_INSTRUCTION = readRuntimePrompt("write-todos-full-entry");
 export const WRITE_TODOS_NON_EMPTY_INITIAL_LIST_INSTRUCTION = readRuntimePrompt("write-todos-non-empty-initial-list");
 export const WRITE_TODOS_DESCRIPTIVE_CONTENT_INSTRUCTION = readRuntimePrompt("write-todos-descriptive-content");
+export const WRITE_TODOS_REQUIRED_PLAN_INSTRUCTION = readRuntimePrompt("write-todos-required-plan");
 export const EXECUTION_WITH_TOOL_EVIDENCE_INSTRUCTION = readRuntimePrompt("execution-with-tool-evidence");
 export const EXECUTION_WITH_TOOL_EVIDENCE_RETRY_INSTRUCTION = readRuntimePrompt("execution-with-tool-evidence-retry");
 export const AUTONOMOUS_INVESTIGATION_RECOVERY_INSTRUCTION = readRuntimePrompt("autonomous-investigation-recovery");

package/dist/scaffold/init-project.js CHANGED Viewed

@@ -205,7 +205,8 @@ spec:
         Rules:
         - Store only durable reusable knowledge. Reject transient chatter, scratchpad, or duplication without added value.
         - Reject raw request/session summaries, source-specific page/news recaps, and generic "we learned how to use the tools/workflow" reflections unless they clearly contain reusable preferences, facts, decisions, or procedures.
-        - If transcript evidence shows the user explicitly asked the system to remember or follow a future instruction and the assistant confirmed that intent, store the durable instruction instead of rejecting it as a generic summary.
+        - Never store assistant- or system-authored workflow instructions inferred from a single transcript reflection, such as "how the system should investigate", "what the assistant should ask first", or other generic control-flow recipes for future turns.
+        - If transcript evidence shows the user explicitly asked the system to remember or follow a future instruction and the assistant confirmed that intent, store the durable user instruction instead of rejecting it as a generic summary.
         - Treat durable knowledge as generic mutable records with database-like operations over the same underlying knowledge item.
         - One candidate may yield zero, one, or multiple durable knowledge items. Split it only when the input clearly contains multiple independently mutable knowledge points.
         - When storing a knowledge item, always return a \`knowledgeMutation\` object with a stable \`identity\` and an \`operation\` of \`create\`, \`update\`, or \`delete\`.
@@ -214,7 +215,7 @@ spec:
         - If an existing relevant record already represents the same underlying knowledge item, reuse that record's \`knowledge_identity\` instead of inventing a new one.
         - Do not invent a second identity just because the new statement negates, revokes, deletes, or replaces the old wording. That is usually the same knowledge item with a different mutation operation.
         - The stored \`content\` must be canonical knowledge text, not an assistant acknowledgement such as "已记住" or "I will remember".
-        - You may optionally include \`operationalRule\` when the knowledge is naturally a rule, instruction, or recurring procedure. Treat it as structured metadata, not as the primary identity mechanism.
+        - You may optionally include \`operationalRule\` when the knowledge is a durable user-approved rule, instruction, or recurring procedure. Do not use it for assistant-only workflow guidance inferred from one conversation. Treat it as structured metadata, not as the primary identity mechanism.
         - Prefer semantic/episodic/procedural kinds only.
         - Prefer scopes session/agent/workspace/user/project only.
         - If the candidate should not be stored, return {"store": false, "reason": "..."}
@@ -283,7 +284,8 @@ spec:
         Rules:
         - Store only durable reusable knowledge. Reject transient chatter, scratchpad, or duplication without added value.
         - Reject raw request/session summaries, source-specific page/news recaps, and generic "we learned how to use the tools/workflow" reflections unless they clearly contain reusable preferences, facts, decisions, or procedures.
-        - If transcript evidence shows the user explicitly asked the system to remember or follow a future instruction and the assistant confirmed that intent, store the durable instruction instead of rejecting it as a generic summary.
+        - Never store assistant- or system-authored workflow instructions inferred from a single transcript reflection, such as "how the system should investigate", "what the assistant should ask first", or other generic control-flow recipes for future turns.
+        - If transcript evidence shows the user explicitly asked the system to remember or follow a future instruction and the assistant confirmed that intent, store the durable user instruction instead of rejecting it as a generic summary.
         - Treat durable knowledge as generic mutable records with database-like operations over the same underlying knowledge item.
         - One candidate may yield zero, one, or multiple durable knowledge items. Split it only when the input clearly contains multiple independently mutable knowledge points.
         - When storing a knowledge item, always return a \`knowledgeMutation\` object with a stable \`identity\` and an \`operation\` of \`create\`, \`update\`, or \`delete\`.
@@ -292,7 +294,7 @@ spec:
         - If an existing relevant record already represents the same underlying knowledge item, reuse that record's \`knowledge_identity\` instead of inventing a new one.
         - Do not invent a second identity just because the new statement negates, revokes, deletes, or replaces the old wording. That is usually the same knowledge item with a different mutation operation.
         - The stored \`content\` must be canonical knowledge text, not an assistant acknowledgement such as "已记住" or "I will remember".
-        - You may optionally include \`operationalRule\` when the knowledge is naturally a rule, instruction, or recurring procedure. Treat it as structured metadata, not as the primary identity mechanism.
+        - You may optionally include \`operationalRule\` when the knowledge is a durable user-approved rule, instruction, or recurring procedure. Do not use it for assistant-only workflow guidance inferred from one conversation. Treat it as structured metadata, not as the primary identity mechanism.
         - Prefer semantic/episodic/procedural kinds only.
         - Prefer scopes session/agent/workspace/user/project only.
         - If the candidate should not be stored, return {"store": false, "reason": "..."}

package/dist/tools.js CHANGED Viewed

@@ -1,8 +1,10 @@
-import { z } from "zod";
 export const TOOL_DEFINITION_MARKER = "__agent_harness_tool_definition__";
 function isZodSchema(value) {
     return typeof value === "object" && value !== null && typeof value.parse === "function";
 }
+function isParseableSchema(value) {
+    return typeof value === "object" && value !== null && typeof value.parse === "function";
+}
 function getZodLikeTypeName(value) {
     if (typeof value !== "object" || value === null) {
         return undefined;
@@ -113,7 +115,28 @@ export function normalizeToolSchema(schema) {
     if (isZodSchema(schema)) {
         return schema;
     }
-    return z.object(schema);
+    const rawShape = schema;
+    return {
+        shape: rawShape,
+        parse(input) {
+            const source = typeof input === "object" && input !== null && !Array.isArray(input)
+                ? input
+                : {};
+            const parsed = {};
+            for (const [key, validator] of Object.entries(rawShape)) {
+                if (!isParseableSchema(validator)) {
+                    throw new TypeError(`Tool schema field '${key}' is not parseable.`);
+                }
+                const hasValue = Object.prototype.hasOwnProperty.call(source, key);
+                const value = hasValue ? source[key] : undefined;
+                const parsedValue = validator.parse(value);
+                if (parsedValue !== undefined) {
+                    parsed[key] = parsedValue;
+                }
+            }
+            return parsed;
+        },
+    };
 }
 export function tool(definition) {
     return {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@botbotgo/agent-harness",
-  "version": "0.0.324",
+  "version": "0.0.326",
   "description": "Workspace runtime for multi-agent applications",
   "license": "MIT",
   "type": "module",