npm - botholomew - Versions diffs - 0.11.5 → 0.11.6 - Mend

botholomew 0.11.5 → 0.11.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/package.json +1 -1
package/src/chat/agent.ts +1 -0
package/src/context/embedder-impl.ts +7 -5
package/src/tools/context/pipe.ts +228 -0
package/src/tools/registry.ts +2 -0

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "botholomew",
-  "version": "0.11.5",
+  "version": "0.11.6",
   "description": "An autonomous AI agent for knowledge work — works your task queue while you sleep.",
   "type": "module",
   "bin": {

package/src/chat/agent.ts CHANGED Viewed

@@ -56,6 +56,7 @@ const CHAT_TOOL_NAMES = new Set([
   "mcp_info",
   "mcp_exec",
   "read_large_result",
+  "pipe_to_context",
   "spawn_worker",
   "skill_list",
   "skill_read",

package/src/context/embedder-impl.ts CHANGED Viewed

@@ -47,11 +47,13 @@ function isModelCached(model: string): boolean {
 async function getPipeline(model: string): Promise<FeatureExtractionPipeline> {
   let p = pipelinePromises.get(model);
   if (!p) {
-    logger.info(
-      isModelCached(model)
-        ? `Loading embedding model ${model}`
-        : `Loading embedding model ${model} (first run, downloading weights)`,
-    );
+    if (isModelCached(model)) {
+      logger.debug(`Loading embedding model ${model}`);
+    } else {
+      logger.info(
+        `Loading embedding model ${model} (first run, downloading weights)`,
+      );
+    }
     p = pipeline("feature-extraction", model);
     pipelinePromises.set(model, p);
   }

package/src/tools/context/pipe.ts ADDED Viewed

@@ -0,0 +1,228 @@
+import { isText } from "istextorbinary";
+import { z } from "zod";
+import { formatDriveRef } from "../../context/drives.ts";
+import { ingestByPath } from "../../context/ingest.ts";
+import {
+  createContextItemStrict,
+  PathConflictError,
+  upsertContextItem,
+} from "../../db/context.ts";
+import { getTool, type ToolDefinition } from "../tool.ts";
+// Number of leading characters of the stored content echoed back in the
+// `preview` field of a successful acknowledgment.
+const PREVIEW_CHARS = 200;
+// Character cap passed to truncate() for inner-tool error messages.
+const ERROR_MESSAGE_CAP = 2000;
+// Registered name of this tool; also compared against the inner tool's name
+// so the tool cannot be piped into itself.
+const TOOL_NAME = "pipe_to_context";
+/**
+ * Derive a bare MIME type for `path` from the `type` reported by `Bun.file`,
+ * keeping only the text before the first `;` (i.e. dropping any parameters).
+ *
+ * @param path - Path whose MIME type should be looked up.
+ * @returns The leading type segment, or "application/octet-stream" when that
+ *   segment is missing.
+ */
+function mimeFromPath(path: string): string {
+  const [bareType] = Bun.file(path).type.split(";");
+  return bareType ?? "application/octet-stream";
+}
+/**
+ * Decide whether `path` should be treated as text, judged only by its final
+ * `/`-separated segment (the filename).
+ *
+ * Any `isText` verdict other than an explicit `false` counts as textual, so an
+ * inconclusive answer is treated as text.
+ *
+ * @param path - Path whose last segment is classified.
+ * @returns `false` only when `isText` returns exactly `false`.
+ */
+function isTextualPath(path: string): boolean {
+  const segments = path.split("/");
+  const basename = segments[segments.length - 1] ?? path;
+  const verdict = isText(basename);
+  return verdict !== false;
+}
+/**
+ * Shorten `s` to at most `cap` characters, appending a marker that states how
+ * many characters were dropped.
+ *
+ * @param s - Text to shorten.
+ * @param cap - Maximum number of characters of `s` to keep.
+ * @returns `s` unchanged when it already fits; otherwise the first `cap`
+ *   characters followed by `…[truncated, N more chars]`.
+ */
+function truncate(s: string, cap: number): string {
+  const overflow = s.length - cap;
+  if (overflow <= 0) return s;
+  const head = s.slice(0, cap);
+  return `${head}…[truncated, ${overflow} more chars]`;
+}
+/**
+ * Input accepted by the `pipe_to_context` tool: which inner tool to run
+ * (`tool_name` + `tool_input`) and where to store its output (`drive`, `path`),
+ * plus optional metadata (`title`, `description`) and a conflict policy.
+ *
+ * The `.describe()` strings are runtime text attached to the schema, so they
+ * are part of the tool's behavior rather than documentation.
+ */
+const inputSchema = z.object({
+  tool_name: z
+    .string()
+    .describe(
+      "Name of the tool to dispatch. Its full output is piped into a context item; you (the LLM) will only see the storage acknowledgment, never the raw bytes.",
+    ),
+  // Free-form key/value arguments; validated later against the inner tool's
+  // own input schema inside execute().
+  tool_input: z
+    .record(z.string(), z.unknown())
+    .describe(
+      "Arguments to pass to the inner tool (same shape as a normal call).",
+    ),
+  drive: z
+    .string()
+    .default("agent")
+    .describe(
+      "Drive to write to (defaults to 'agent', the agent's scratch drive).",
+    ),
+  path: z.string().describe("Path within the drive (starts with /)"),
+  title: z
+    .string()
+    .optional()
+    .describe("Title for the file (defaults to filename)"),
+  description: z.string().optional().describe("Description of the file"),
+  // Left optional here (no schema-level default); execute() substitutes
+  // "error" when the field is omitted.
+  on_conflict: z
+    .enum(["error", "overwrite"])
+    .optional()
+    .describe(
+      "What to do if a file already exists at this (drive, path). Defaults to 'error'. Pass 'overwrite' to replace.",
+    ),
+});
+/**
+ * Result returned by the `pipe_to_context` tool. Only `is_error` is required;
+ * every other field is optional because success and failure results populate
+ * different subsets:
+ *  - success: `id`, `drive`, `path`, `ref`, `bytes_written`, `preview`
+ *  - failure: `error_type`, `message`, `next_action_hint` (and, depending on
+ *    the failure, `inner_tool_is_error` or `drive`/`path`/`ref`)
+ */
+const outputSchema = z.object({
+  is_error: z.boolean(),
+  id: z.string().optional(),
+  drive: z.string().optional(),
+  path: z.string().optional(),
+  ref: z.string().optional(),
+  bytes_written: z.number().optional(),
+  preview: z
+    .string()
+    .optional()
+    .describe(
+      `First ${PREVIEW_CHARS} characters of the stored content so you can sanity-check what was captured.`,
+    ),
+  // Set when the failure came from the inner tool itself (it threw or
+  // reported an error), as opposed to a problem with the pipe request.
+  inner_tool_is_error: z.boolean().optional(),
+  // Machine-readable failure category; one value per error path in execute().
+  error_type: z
+    .enum([
+      "unknown_tool",
+      "forbidden_tool",
+      "invalid_input",
+      "inner_tool_error",
+      "path_conflict",
+    ])
+    .optional(),
+  message: z.string().optional(),
+  next_action_hint: z.string().optional(),
+});
+/**
+ * `pipe_to_context` tool: runs another registered tool and stores its full
+ * output as a context item instead of returning it to the conversation.
+ *
+ * Flow of `execute`:
+ *  1. Resolve the inner tool with getTool(); reject unknown tools, tools
+ *     flagged `terminal`, and pipe_to_context itself.
+ *  2. Validate `tool_input` against the inner tool's input schema.
+ *  3. Run the inner tool. A thrown exception, or a truthy `is_error` on the
+ *     returned object, is reported as `inner_tool_error` and nothing is written.
+ *  4. Store the output (strings verbatim, anything else JSON-serialized) at
+ *     (drive, path), then call ingestByPath() for the same target.
+ *
+ * Returns a storage acknowledgment on success, or a structured error object
+ * (`is_error: true` with `error_type`, `message`, `next_action_hint`).
+ * Any error other than PathConflictError raised while writing or ingesting is
+ * rethrown to the caller.
+ */
+export const pipeToContextTool = {
+  name: TOOL_NAME,
+  description:
+    "[[ bash equivalent command: cmd > file ]] Run another tool and pipe its full output directly into a context item, without the result flowing through the conversation. Use this when you need a large tool output (web pages, search dumps, big mcp_exec results) to be searchable/embedded for later but you do NOT need to read the bytes yourself. You'll only see the storage ack (drive, path, id, size, short preview).",
+  group: "context",
+  inputSchema,
+  outputSchema,
+  execute: async (input, ctx) => {
+    const inner = getTool(input.tool_name);
+    if (!inner) {
+      return {
+        is_error: true,
+        error_type: "unknown_tool",
+        message: `No tool named "${input.tool_name}".`,
+        next_action_hint:
+          "Check the tool name spelling, or call the inner tool directly if you do need to see its output.",
+      };
+    }
+    // Refuse self-piping (would recurse) and tools flagged as terminal.
+    if (inner.name === TOOL_NAME || inner.terminal) {
+      return {
+        is_error: true,
+        error_type: "forbidden_tool",
+        message: `Tool "${inner.name}" cannot be piped (terminal tools and pipe_to_context itself are not allowed).`,
+        next_action_hint:
+          "Pipe a non-terminal tool (search_grep, mcp_exec, context_refresh, etc.) instead.",
+      };
+    }
+    // Validate up front so schema problems surface as a structured error
+    // rather than as an exception from inside the inner tool.
+    const parsedInner = inner.inputSchema.safeParse(input.tool_input);
+    if (!parsedInner.success) {
+      const issues = parsedInner.error.issues
+        .map((i) => `${i.path.join(".")}: ${i.message}`)
+        .join("; ");
+      return {
+        is_error: true,
+        error_type: "invalid_input",
+        message: `Invalid input for ${inner.name}: ${issues}.`,
+        next_action_hint:
+          "Fix tool_input to match the inner tool's schema and retry.",
+      };
+    }
+    let innerResult: unknown;
+    try {
+      innerResult = await inner.execute(parsedInner.data, ctx);
+    } catch (err) {
+      return {
+        is_error: true,
+        error_type: "inner_tool_error",
+        inner_tool_is_error: true,
+        message: truncate(
+          `Tool ${inner.name} threw: ${err instanceof Error ? err.message : String(err)}`,
+          ERROR_MESSAGE_CAP,
+        ),
+        next_action_hint:
+          "Retry with different arguments, or call the tool directly to see the full error.",
+      };
+    }
+    // The inner result is untyped here, so treat any truthy `is_error`
+    // property as a failure signal (same truthiness test as before, without
+    // asserting that the property is a boolean).
+    const innerIsError =
+      typeof innerResult === "object" &&
+      innerResult !== null &&
+      "is_error" in innerResult &&
+      Boolean(innerResult.is_error);
+    // JSON.stringify is typed as returning `string`, but at runtime it yields
+    // `undefined` for inputs such as `undefined` or a function. Fall back to
+    // an empty string so an output-less tool produces an empty item (like
+    // `cmd > file` with no output) instead of crashing on `.length`/`.slice`
+    // after the item has already been written.
+    const innerOutput =
+      typeof innerResult === "string"
+        ? innerResult
+        : ((JSON.stringify(innerResult) as string | undefined) ?? "");
+    if (innerIsError) {
+      return {
+        is_error: true,
+        error_type: "inner_tool_error",
+        inner_tool_is_error: true,
+        message: truncate(innerOutput, ERROR_MESSAGE_CAP),
+        next_action_hint:
+          "The inner tool returned an error and nothing was written. Fix the inputs and retry, or pipe a different tool.",
+      };
+    }
+    const onConflict = input.on_conflict ?? "error";
+    const target = { drive: input.drive, path: input.path };
+    // Both write paths take the same payload; build it once.
+    const record = {
+      // Title defaults to the last non-empty path segment, then the raw path.
+      title:
+        input.title ??
+        input.path.split("/").filter(Boolean).pop() ??
+        input.path,
+      description: input.description,
+      content: innerOutput,
+      drive: target.drive,
+      path: target.path,
+      mimeType: mimeFromPath(input.path),
+      isTextual: isTextualPath(input.path),
+    };
+    try {
+      const item =
+        onConflict === "overwrite"
+          ? await upsertContextItem(ctx.conn, record)
+          : await createContextItemStrict(ctx.conn, record);
+      await ingestByPath(ctx.conn, target, ctx.config);
+      return {
+        is_error: false,
+        id: item.id,
+        drive: item.drive,
+        path: item.path,
+        ref: formatDriveRef(item),
+        // Report real bytes, not UTF-16 code units: `string.length`
+        // under-counts any non-ASCII content.
+        // NOTE(review): assumes content is persisted as UTF-8 — confirm.
+        bytes_written: Buffer.byteLength(innerOutput, "utf8"),
+        preview: innerOutput.slice(0, PREVIEW_CHARS),
+      };
+    } catch (err) {
+      if (err instanceof PathConflictError) {
+        const ref = formatDriveRef({ drive: err.drive, path: err.path });
+        return {
+          is_error: true,
+          error_type: "path_conflict",
+          drive: err.drive,
+          path: err.path,
+          ref,
+          message: `A file already exists at ${ref} (id: ${err.existingId}). The inner tool ran but its output was discarded.`,
+          next_action_hint:
+            "Retry with on_conflict='overwrite' to replace, or pick a different path.",
+        };
+      }
+      // Anything else (storage or ingestion failure) is unexpected: propagate.
+      throw err;
+    }
+  },
+} satisfies ToolDefinition<typeof inputSchema, typeof outputSchema>;

package/src/tools/registry.ts CHANGED Viewed

@@ -2,6 +2,7 @@
 import { capabilitiesRefreshTool } from "./capabilities/refresh.ts";
 // Context tools
 import { contextListDrivesTool } from "./context/list-drives.ts";
+import { pipeToContextTool } from "./context/pipe.ts";
 import { readLargeResultTool } from "./context/read-large-result.ts";
 import { contextRefreshTool } from "./context/refresh.ts";
 import { contextSearchTool } from "./context/search.ts";
@@ -85,6 +86,7 @@ export function registerAllTools(): void {
   registerTool(updateBeliefsTool);
   registerTool(updateGoalsTool);
   registerTool(readLargeResultTool);
+  registerTool(pipeToContextTool);
   // Capabilities
   registerTool(capabilitiesRefreshTool);