npm - @crewhaus/tool-catalog - Versions diffs - 0.1.0 - Mend

@crewhaus/tool-catalog 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json ADDED Viewed

@@ -0,0 +1,42 @@
+{
+  "name": "@crewhaus/tool-catalog",
+  "version": "0.1.0",
+  "type": "module",
+  "description": "ToolDefinition interface, RegisteredTool, and ToolCatalog registry",
+  "main": "src/index.ts",
+  "types": "src/index.ts",
+  "exports": {
+    ".": "./src/index.ts"
+  },
+  "scripts": {
+    "test": "bun test src"
+  },
+  "dependencies": {
+    "@crewhaus/errors": "0.0.0",
+    "zod": "^3.23.8"
+  },
+  "license": "Apache-2.0",
+  "author": {
+    "name": "Max Meier",
+    "email": "max@studiomax.io",
+    "url": "https://studiomax.io"
+  },
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/crewhaus/factory.git",
+    "directory": "packages/tool-catalog"
+  },
+  "homepage": "https://github.com/crewhaus/factory/tree/main/packages/tool-catalog#readme",
+  "bugs": {
+    "url": "https://github.com/crewhaus/factory/issues"
+  },
+  "publishConfig": {
+    "access": "restricted"
+  },
+  "files": [
+    "src",
+    "README.md",
+    "LICENSE",
+    "NOTICE"
+  ]
+}

package/src/index.test.ts ADDED Viewed

@@ -0,0 +1,98 @@
+import { beforeEach, describe, expect, test } from "bun:test";
+import { CrewhausError } from "@crewhaus/errors";
+import { z } from "zod";
+import { type RegisteredTool, ToolCatalog, ToolCatalogError, defaultCatalog } from "./index";
+/**
+ * Test fixture: builds a fully populated `RegisteredTool`. Only `name` (and
+ * the description derived from it) varies between calls; every flag is fixed.
+ */
+function makeTool(name: string): RegisteredTool {
+  // The cast erases the concrete `{ value: string }` shape to the catalog's schema type.
+  const inputSchema = z.object({ value: z.string() }) as RegisteredTool["inputSchema"];
+  const execute: RegisteredTool["execute"] = async (_input) => "ok";
+  const fixture: RegisteredTool = {
+    name,
+    description: `${name} tool`,
+    inputSchema,
+    execute,
+    concurrencySafe: false,
+    readOnly: false,
+    destructive: false,
+    requiresSandbox: false,
+    classifyOutput: true,
+    scope: "internal",
+    requireJustification: false,
+  };
+  return fixture;
+}
+describe("ToolCatalog", () => {
+  let catalog: ToolCatalog;
+  beforeEach(() => {
+    catalog = new ToolCatalog(); // fresh, empty catalog per test so registrations never leak between cases
+  });
+  test("register and get round-trip", () => {
+    const tool = makeTool("Bash");
+    catalog.register(tool);
+    expect(catalog.get("Bash")).toBe(tool); // toBe: the catalog returns the very object that was registered
+  });
+  test("has returns true after register, false before", () => {
+    expect(catalog.has("Read")).toBe(false);
+    catalog.register(makeTool("Read"));
+    expect(catalog.has("Read")).toBe(true);
+  });
+  test("list returns tools in insertion order", () => {
+    const bash = makeTool("Bash");
+    const read = makeTool("Read");
+    const write = makeTool("Write");
+    catalog.register(bash);
+    catalog.register(read);
+    catalog.register(write);
+    expect(catalog.list()).toEqual([bash, read, write]); // order follows the backing Map's insertion order
+  });
+  test("list returns empty array when catalog is empty", () => {
+    expect(catalog.list()).toEqual([]);
+  });
+  test("get returns undefined for unknown tool", () => {
+    expect(catalog.get("Unknown")).toBeUndefined(); // a miss is reported as undefined, not as a throw
+  });
+  test("duplicate name throws ToolCatalogError", () => {
+    catalog.register(makeTool("Bash"));
+    expect(() => catalog.register(makeTool("Bash"))).toThrow(ToolCatalogError); // a different object with the same name is still rejected
+    expect(() => catalog.register(makeTool("Bash"))).toThrow(/already registered/); // the failed attempt above left the catalog unchanged, so this throws again
+  });
+  test("ToolCatalogError is instanceof CrewhausError", () => {
+    expect(new ToolCatalogError("x")).toBeInstanceOf(CrewhausError);
+  });
+  test("ToolCatalogError has code 'tool'", () => {
+    expect(new ToolCatalogError("x").code).toBe("tool"); // "tool" is the first argument ToolCatalogError passes to super()
+  });
+});
+describe("defaultCatalog", () => {
+  test("is a ToolCatalog instance", () => {
+    expect(defaultCatalog).toBeInstanceOf(ToolCatalog); // only the type is checked; nothing is registered on the shared instance here
+  });
+});
+describe("RegisteredTool jsonSchema field", () => {
+  test("optional jsonSchema is preserved when set", () => {
+    const catalog = new ToolCatalog(); // local catalog: this suite has no beforeEach of its own
+    const tool: RegisteredTool = {
+      ...makeTool("Mcp"),
+      jsonSchema: { type: "object", properties: { x: { type: "number" } } },
+    };
+    catalog.register(tool);
+    const got = catalog.get("Mcp");
+    expect(got?.jsonSchema).toEqual({ type: "object", properties: { x: { type: "number" } } }); // the schema comes back structurally unchanged
+  });
+  test("absent jsonSchema is undefined", () => {
+    const catalog = new ToolCatalog();
+    const tool = makeTool("Plain"); // makeTool never sets jsonSchema
+    catalog.register(tool);
+    expect(catalog.get("Plain")?.jsonSchema).toBeUndefined();
+  });
+});

package/src/index.ts ADDED Viewed

@@ -0,0 +1,188 @@
+import { CrewhausError } from "@crewhaus/errors";
+import type { ZodType } from "zod";
+/**
+ * Per-call context passed as the second argument to `execute`. Every field
+ * is optional and read-only, and the context argument itself is optional on
+ * `execute`, so a tool must tolerate it being absent altogether.
+ *
+ * `signal` — tools that support cooperative cancellation (e.g. tool-bash
+ * forwarding to Bun.spawn) read it from here; tools that don't care can
+ * ignore it entirely.
+ *
+ * `bridge` (Section 13) — an opaque payload that runtime-core sets once per
+ * run. Framework-aware tools — today only the `Task` tool — cast it back to
+ * the typed `RuntimeBridge` from `@crewhaus/agent-context-isolation`.
+ * Ordinary tools ignore it.
+ *
+ * `onStreamChunk` (Section 18) — invoked by streaming tools (e.g.
+ * tool-code-execution piping container stdout/stderr) so runtime-core can
+ * publish `tool_stream_chunk` trace events. The callback returns `void` and
+ * is fire-and-forget — tools must not block on it. Tools that don't stream
+ * skip it.
+ */
+export interface ToolExecuteContext {
+  readonly signal?: AbortSignal;
+  readonly bridge?: unknown;
+  readonly onStreamChunk?: (stream: "stdout" | "stderr", chunk: string) => void;
+}
+/**
+ * Section 14 — non-string tool result content. Mirrors the subset of
+ * Anthropic's `ToolResultBlockParam.content` we use today: text + base64
+ * image blocks. `runtime-core` forwards arrays of these verbatim into the
+ * API's `tool_result.content` field, so the model sees them as image
+ * inputs rather than as base64 text.
+ *
+ * Tools that don't return rich content (the majority — fs, bash, todo,
+ * mcp, channel, task) keep returning `string` and never construct these.
+ *
+ * The two block shapes are discriminated by their literal `type` field
+ * (`"text"` vs `"image"`). Image blocks carry base64 data only, restricted
+ * to the PNG, JPEG, GIF and WebP media types.
+ */
+export interface ToolResultTextBlock {
+  readonly type: "text";
+  readonly text: string;
+}
+export interface ToolResultImageBlock {
+  readonly type: "image";
+  readonly source: {
+    readonly type: "base64";
+    readonly media_type: "image/png" | "image/jpeg" | "image/gif" | "image/webp";
+    readonly data: string;
+  };
+}
+export type ToolResultContentBlock = ToolResultTextBlock | ToolResultImageBlock; // one rich block of either kind
+export type ToolResultContent = ReadonlyArray<ToolResultContentBlock>; // read-only list of rich blocks
+export type ToolExecuteResult = string | ToolResultContent; // what `execute` resolves to: plain text or rich blocks
+/**
+ * Pillar 3 sink-side fabric — where a tool's effect lands.
+ *
+ * - `"internal"`: the tool reads/writes process-local state only
+ *   (filesystem, sandboxed code execution, memory, todo, code-graph
+ *   index). Egress classifier skips internal tools.
+ * - `"external"`: the tool transmits data to a sink the runtime cannot
+ *   re-classify after the fact — a URL fetched, a channel message sent,
+ *   a federation outbound payload, an MCP tool invocation, an EVM tx
+ *   broadcast, an image upload. Every such call routes through
+ *   `egress-classifier` first.
+ *
+ * Default at normalization is `"internal"` (fails closed). Tools that
+ * cross a process or network boundary MUST set `"external"` explicitly
+ * in their `ToolDefinition`.
+ *
+ * NOTE(review): as described above, the egress classifier skips
+ * `"internal"` tools, so a tool that forgets to declare `"external"` is NOT
+ * routed through the classifier. That reads as the permissive default rather
+ * than "fails closed" — confirm the intended wording, or whether another
+ * layer outside this file enforces the boundary.
+ */
+export type ToolScope = "internal" | "external";
+export interface ToolDefinition<TInput = unknown> { // author-facing tool shape; `TInput` ties `inputSchema` to the `execute` input
+  name: string; // presumably carried through to `RegisteredTool.name`, the key the catalog registers under — confirm in the normalizer
+  description: string;
+  inputSchema: ZodType<TInput>; // Zod schema for the input; still required when `jsonSchema` is set (validator path)
+  execute: (input: TInput, ctx?: ToolExecuteContext) => Promise<ToolExecuteResult>; // `ctx` is optional per call
+  concurrencySafe?: boolean; // this flag and the two below are optional here, required booleans on `RegisteredTool`
+  readOnly?: boolean;
+  destructive?: boolean;
+  /**
+   * Section 18 — declares that the tool MUST run inside a sandbox. The
+   * permission engine refuses to grant `allow` in default mode unless an
+   * `alwaysAllow` rule matches AND a real sandbox backend is available
+   * (see `permission-engine.evaluate`). Tool implementations are
+   * responsible for actually using the sandbox; the flag is the policy
+   * declaration that the floor enforces.
+   */
+  requiresSandbox?: boolean;
+  /**
+   * Section 18 — when explicitly false, the post-tool prompt-injection
+   * classifier in runtime-core is skipped for this tool. Default is true
+   * (run the classifier on every output). Set to false ONLY for tools whose
+   * output is structurally guaranteed not to be attacker-controlled (e.g.
+   * the in-process `Task` sub-agent tool wrapper).
+   */
+  classifyOutput?: boolean;
+  /**
+   * Pillar 3 sink-side — see `ToolScope`. Default `"internal"` at
+   * normalization. Set `"external"` for any tool whose effect leaves the
+   * process boundary unmonitored.
+   */
+  scope?: ToolScope;
+  /**
+   * Pillar 3 intent gate — when true, runtime-core demands the model
+   * supply a `justification` string in the tool's input alongside the
+   * declared schema, and `permission-engine` evaluates the justification
+   * against the session's stated goal via an LLM-as-judge. Failures emit
+   * `permission_justification_evaluated` audit events and deny the call.
+   *
+   * Default at normalization is `false`. Recommended `true` for any tool
+   * with destructive or external side effects (evm-tx, message-channel,
+   * federation outbound). Independent of `scope` — a tool can be
+   * `internal` and still require justification (e.g. a destructive fs
+   * delete), and a tool can be `external` without requiring justification
+   * (e.g. a read-only public-data fetch).
+   */
+  requireJustification?: boolean;
+  /**
+   * Authoritative JSON Schema for the tool's input. When set, runtime-core
+   * forwards this verbatim to the model instead of running
+   * `zodToJsonSchema(inputSchema)`. Used by tools whose canonical schema is
+   * already JSON Schema (e.g. MCP tools), where the Zod round-trip would be
+   * lossy. The `inputSchema` slot is still required for the validator path
+   * (typically `z.unknown()` for MCP).
+   *
+   * Typed `unknown`: this package does not inspect or validate the value.
+   */
+  jsonSchema?: unknown;
+}
+/** Normalized form stored in the catalog. Every optional field of
+ *  `ToolDefinition` except `jsonSchema` is required here — the flags as
+ *  booleans, `scope` as a `ToolScope` — and `inputSchema`/`execute` are typed
+ *  against `unknown` (type-erased) so the registry can hold a homogeneous map. */
+export interface RegisteredTool {
+  name: string;
+  description: string;
+  inputSchema: ZodType<unknown>;
+  execute: (input: unknown, ctx?: ToolExecuteContext) => Promise<ToolExecuteResult>;
+  concurrencySafe: boolean;
+  readOnly: boolean;
+  destructive: boolean;
+  /**
+   * Section 18 — `false` when the definition omits it; the defaulting is
+   * done by `buildTool`, which is not part of this file.
+   * NOTE(review): the original comment called this "fails closed", but
+   * `false` means no sandbox is demanded — confirm the intended wording.
+   */
+  requiresSandbox: boolean;
+  /** Section 18 — defaults to true so post-tool classification runs. */
+  classifyOutput: boolean;
+  /**
+   * Pillar 3 sink-side — `"internal"` when omitted. Tools
+   * that cross a process or network boundary MUST set `"external"`
+   * explicitly in their `ToolDefinition`.
+   * NOTE(review): the original comment called this default "fails closed";
+   * per the `ToolScope` description the egress classifier skips internal
+   * tools, so the default looks permissive — confirm.
+   */
+  scope: ToolScope;
+  /**
+   * Pillar 3 intent gate — `false` when omitted. See
+   * `ToolDefinition.requireJustification`.
+   * NOTE(review): the original comment called this "fails closed", but
+   * `false` means no justification is demanded — confirm the intended wording.
+   */
+  requireJustification: boolean;
+  /** See ToolDefinition.jsonSchema. Optional; runtime-core falls back to
+   *  zodToJsonSchema(inputSchema) when absent. */
+  jsonSchema?: unknown;
+}
+export class ToolCatalogError extends CrewhausError { // thrown by ToolCatalog.register when a name is already taken
+  override readonly name = "ToolCatalogError"; // fixed literal so instances identify themselves by subclass name
+  constructor(message: string, cause?: unknown) {
+    super("tool", message, cause); // "tool" is what the tests read back as `.code`; `cause` is forwarded as-is
+  }
+}
+/**
+ * Name-keyed registry of normalized tools.
+ *
+ * Backed by a `Map`, so `list()` reports tools in the order they were
+ * registered. Names are unique: registering a second tool under an existing
+ * name is rejected rather than overwriting the first.
+ */
+export class ToolCatalog {
+  private readonly _tools = new Map<string, RegisteredTool>();
+  /**
+   * Stores `tool` under `tool.name`.
+   * @throws ToolCatalogError when that name is already registered; the
+   *   catalog is left unchanged in that case.
+   */
+  register(tool: RegisteredTool): void {
+    const taken = this._tools.has(tool.name);
+    if (!taken) {
+      this._tools.set(tool.name, tool);
+      return;
+    }
+    throw new ToolCatalogError(`tool "${tool.name}" is already registered`);
+  }
+  /** Looks a tool up by name; yields `undefined` when nothing is registered under it. */
+  get(name: string): RegisteredTool | undefined {
+    const entry = this._tools.get(name);
+    return entry;
+  }
+  /** Reports whether a tool is registered under `name`. */
+  has(name: string): boolean {
+    const present = this._tools.has(name);
+    return present;
+  }
+  /** Snapshot of every registered tool, in registration order; a new array on each call. */
+  list(): ReadonlyArray<RegisteredTool> {
+    return Array.from(this._tools.values());
+  }
+}
+export const defaultCatalog = new ToolCatalog(); // module-level shared instance, created empty when this module is first evaluated