npm - botholomew - Versions diffs - 0.8.6 → 0.8.8 - Mend

botholomew 0.8.6 → 0.8.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

package/README.md +1 -0
package/package.json +1 -1
package/src/chat/session.ts +19 -0
package/src/cli.ts +2 -0
package/src/commands/capabilities.ts +45 -0
package/src/context/capabilities.ts +512 -0
package/src/init/index.ts +21 -0
package/src/init/templates.ts +22 -0
package/src/skills/commands.ts +12 -0
package/src/tools/capabilities/refresh.ts +53 -0
package/src/tools/registry.ts +5 -1
package/src/tui/App.tsx +46 -2
package/src/tui/components/InputBar.tsx +24 -7
package/src/tui/slashCompletion.ts +16 -2

package/README.md CHANGED Viewed

@@ -139,6 +139,7 @@ Everything the agent can touch is here. No surprises.
 | `botholomew task list\|add\|view\|update\|reset\|delete` | Manage the task queue |
 | `botholomew schedule list\|add\|enable\|trigger\|delete` | Recurring work |
 | `botholomew context add\|list\|view\|search\|refresh\|remove` | Ingest & browse knowledge (files, folders, URLs) |
+| `botholomew capabilities` | Rescan built-in + MCPX tools and rewrite `.botholomew/capabilities.md` |
 | `botholomew mcpx servers\|add\|remove\|info\|search\|exec\|ping\|auth\|import-global` | Configure external MCP servers |
 | `botholomew skill list\|show\|create\|validate` | Manage slash-command skills |
 | `botholomew context ... \| search ...` | Direct access to the agent's virtual filesystem |

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "botholomew",
-  "version": "0.8.6",
+  "version": "0.8.8",
   "description": "An autonomous AI agent for knowledge work — works your task queue while you sleep.",
   "type": "module",
   "bin": {

package/src/chat/session.ts CHANGED Viewed

@@ -140,3 +140,22 @@ export async function endChatSession(session: ChatSession): Promise<void> {
   await withDb(session.dbPath, (conn) => endThread(conn, session.threadId));
   await session.cleanup();
 }
+/**
+ * Rotate the session onto a brand-new thread.
+ *
+ * The thread that was active is ended (it stays persisted and can be resumed
+ * via `botholomew chat --thread-id <id>`), a fresh thread is created, and the
+ * session's in-memory message list is emptied in place.
+ *
+ * @returns Both thread IDs, so the caller can tell the user how to get back
+ *   to the previous conversation.
+ */
+export async function clearChatSession(
+  session: ChatSession,
+): Promise<{ previousThreadId: string; newThreadId: string }> {
+  const endedThreadId = session.threadId;
+  const freshThreadId = await withDb(session.dbPath, async (db) => {
+    await endThread(db, endedThreadId);
+    return createThread(db, "chat_session", undefined, "New chat");
+  });
+  // Truncate in place; the array object itself is kept.
+  session.messages.length = 0;
+  session.threadId = freshThreadId;
+  return { previousThreadId: endedThreadId, newThreadId: freshThreadId };
+}

package/src/cli.ts CHANGED Viewed

@@ -2,6 +2,7 @@
 import ansis from "ansis";
 import { program } from "commander";
+import { registerCapabilitiesCommand } from "./commands/capabilities.ts";
 import { registerChatCommand } from "./commands/chat.ts";
 import { registerCheckUpdateCommand } from "./commands/check-update.ts";
 import { registerContextCommand } from "./commands/context.ts";
@@ -39,6 +40,7 @@ registerThreadCommand(program);
 registerScheduleCommand(program);
 registerChatCommand(program);
 registerContextCommand(program);
+registerCapabilitiesCommand(program);
 registerMcpxCommand(program);
 registerSkillCommand(program);
 registerNukeCommand(program);

package/src/commands/capabilities.ts ADDED Viewed

@@ -0,0 +1,45 @@
+import type { Command } from "commander";
+import { createSpinner } from "nanospinner";
+import { loadConfig } from "../config/loader.ts";
+import { writeCapabilitiesFile } from "../context/capabilities.ts";
+import { createMcpxClient } from "../mcpx/client.ts";
+import { withDb } from "./with-db.ts";
+/**
+ * Register `botholomew capabilities`, which rebuilds
+ * `.botholomew/capabilities.md` from the built-in tools and, unless
+ * `--no-mcp` is passed, the tools exposed by MCPX servers.
+ *
+ * On failure the spinner reports the error and the process exits with
+ * status 1, after the MCPX client (if any) has been closed.
+ */
+export function registerCapabilitiesCommand(program: Command) {
+  program
+    .command("capabilities")
+    .description(
+      "Regenerate .botholomew/capabilities.md by scanning built-in tools and MCPX tools",
+    )
+    .option("--no-mcp", "Skip MCPX tool enumeration (built-in tools only)")
+    .action((opts: { mcp?: boolean }) =>
+      withDb(program, async (_conn, dir) => {
+        // commander sets `mcp` to false only when --no-mcp was given.
+        const includeMcp = opts.mcp !== false;
+        const spinner = createSpinner("Loading config").start();
+        const config = await loadConfig(dir);
+        // Only announce the MCPX connection when one is actually attempted.
+        if (includeMcp) {
+          spinner.update({ text: "Connecting to MCPX servers" });
+        }
+        const mcpxClient = includeMcp ? await createMcpxClient(dir) : null;
+        let failed = false;
+        try {
+          const result = await writeCapabilitiesFile(
+            dir,
+            mcpxClient,
+            config,
+            (phase) => spinner.update({ text: phase }),
+          );
+          const bits = [
+            `${result.counts.internal} built-in`,
+            `${result.counts.mcp} MCPX`,
+          ];
+          if (!includeMcp) bits.push("MCPX skipped");
+          spinner.success({
+            text: `Wrote ${result.path} (${bits.join(", ")})`,
+          });
+        } catch (err) {
+          const reason = err instanceof Error ? err.message : String(err);
+          spinner.error({ text: `Failed: ${reason}` });
+          failed = true;
+        } finally {
+          await mcpxClient?.close();
+        }
+        // Exit only after the client is closed: process.exit() terminates
+        // immediately, so calling it inside the catch would skip the finally.
+        if (failed) process.exit(1);
+      }),
+    );
+}

package/src/context/capabilities.ts ADDED Viewed

@@ -0,0 +1,512 @@
+import { join } from "node:path";
+import Anthropic from "@anthropic-ai/sdk";
+import type { McpxClient } from "@evantahler/mcpx";
+import type { BotholomewConfig } from "../config/schemas.ts";
+import { getBotholomewDir } from "../constants.ts";
+import { getAllTools, type ToolDefinition } from "../tools/tool.ts";
+import {
+  type ContextFileMeta,
+  parseContextFile,
+  serializeContextFile,
+} from "../utils/frontmatter.ts";
+import { logger } from "../utils/logger.ts";
+export const CAPABILITIES_FILENAME = "capabilities.md";
+// LLM config — summarization is one call per refresh, no streaming needed.
+const SUMMARIZE_TIMEOUT_MS = 30_000;
+const SUMMARIZE_MAX_TOKENS = 4096;
+// biome-ignore lint/suspicious/noExplicitAny: Zod-free tool schema for Anthropic SDK
+type AnyTool = ToolDefinition<any, any>;
+/**
+ * Groups rendered for built-in tools when we can't summarize via LLM.
+ * Order here controls rendering order in the fallback.
+ */
+const GROUP_ORDER = [
+  "task",
+  "schedule",
+  "context",
+  "search",
+  "thread",
+  "mcp",
+  "worker",
+  "capabilities",
+] as const;
+const GROUP_HEADINGS: Record<string, string> = {
+  task: "Task management",
+  schedule: "Schedules",
+  context: "Virtual filesystem & self-reflection",
+  search: "Search",
+  thread: "Threads",
+  mcp: "MCPX meta-tools",
+  worker: "Workers",
+  capabilities: "Capabilities",
+  other: "Other",
+};
+/** Tool totals reported back to callers after a scan. */
+export interface CapabilitiesCounts {
+  /** Number of built-in tools found. */
+  internal: number;
+  /** Number of MCPX tools found (0 when MCPX was skipped or listing failed). */
+  mcp: number;
+}
+/** Rendered markdown body plus the tool totals it was built from. */
+export interface GenerateResult {
+  body: string;
+  counts: CapabilitiesCounts;
+}
+/** Called at each phase transition so callers (CLI) can render progress. */
+export type ProgressCallback = (phase: string) => void;
+/** Un-rendered scan result shared by the prompt builder and both renderers. */
+interface RawInventory {
+  /** Built-in tools keyed by group name; unknown groups are filed under "other". */
+  internal: Map<string, AnyTool[]>;
+  /** Total number of built-in tools across all groups. */
+  internalTotal: number;
+  /** MCPX tools keyed by the server that exposes them. */
+  mcpByServer: Map<string, Array<{ name: string; description: string }>>;
+  /** Total number of MCPX tools returned by the listing call. */
+  mcpTotal: number;
+  /** Error message from a failed MCPX listing, or null when none occurred. */
+  mcpError: string | null;
+  /** True when an MCPX client was supplied for the scan. */
+  mcpConfigured: boolean;
+}
+/**
+ * Collect the tool inventory without rendering.
+ *
+ * Built-in tools are bucketed by their `group` (anything not listed in
+ * GROUP_ORDER lands in "other"); MCPX tools are bucketed by the server that
+ * exposes them. A failure while listing MCPX tools is recorded in `mcpError`
+ * instead of being thrown, so the built-in inventory is still returned.
+ *
+ * @param mcpxClient Client used to list MCPX tools, or null to skip MCPX.
+ * @param onPhase Optional progress callback invoked before each scan phase.
+ */
+async function collectInventory(
+  mcpxClient: McpxClient | null,
+  onPhase?: ProgressCallback,
+): Promise<RawInventory> {
+  onPhase?.("Scanning internal tools");
+  const allTools = getAllTools();
+  const internal = new Map<string, AnyTool[]>();
+  for (const tool of allTools) {
+    const key = (GROUP_ORDER as readonly string[]).includes(tool.group)
+      ? tool.group
+      : "other";
+    const list = internal.get(key) ?? [];
+    list.push(tool);
+    internal.set(key, list);
+  }
+  const mcpByServer = new Map<
+    string,
+    Array<{ name: string; description: string }>
+  >();
+  let mcpTotal = 0;
+  let mcpError: string | null = null;
+  if (mcpxClient) {
+    onPhase?.("Querying MCPX servers");
+    try {
+      const mcpTools = await mcpxClient.listTools();
+      mcpTotal = mcpTools.length;
+      for (const entry of mcpTools) {
+        const list = mcpByServer.get(entry.server) ?? [];
+        list.push({
+          name: entry.tool.name,
+          description: (entry.tool.description ?? "").trim(),
+        });
+        mcpByServer.set(entry.server, list);
+      }
+    } catch (err) {
+      // Always store a non-empty string. The renderers test `mcpError` for
+      // truthiness, so an undefined or empty message (non-Error throw, or
+      // `new Error()`) would otherwise be reported as "no tools exposed".
+      const detail = err instanceof Error ? err.message : String(err);
+      mcpError = detail || "unknown error";
+    }
+  }
+  return {
+    internal,
+    internalTotal: allTools.length,
+    mcpByServer,
+    mcpTotal,
+    mcpError,
+    mcpConfigured: mcpxClient !== null,
+  };
+}
+// ---------------------------------------------------------------------------
+// LLM summarization
+// ---------------------------------------------------------------------------
+/** One bullet in the rendered document: a short theme name plus its summary. */
+interface Theme {
+  name: string;
+  summary: string;
+}
+/** Themes belonging to a single MCPX server. */
+interface ServerThemes {
+  server: string;
+  themes: Theme[];
+}
+/** Shape of the summarization tool's input, as described by its input_schema. */
+interface SummarizedCapabilities {
+  internal_themes: Theme[];
+  mcpx_servers: ServerThemes[];
+}
+const SUMMARIZE_TOOL_NAME = "return_capability_summary";
+const SUMMARIZE_TOOL = {
+  name: SUMMARIZE_TOOL_NAME,
+  description:
+    "Return thematic capability summaries for the agent's tool inventory.",
+  input_schema: {
+    type: "object" as const,
+    properties: {
+      internal_themes: {
+        type: "array",
+        description:
+          "Themes covering the agent's built-in tools (task queue, virtual filesystem, search, threads, MCPX meta-tools, workers, self-reflection, etc.).",
+        items: {
+          type: "object",
+          properties: {
+            name: {
+              type: "string",
+              description: "Short theme name (2-4 words).",
+            },
+            summary: {
+              type: "string",
+              description:
+                "One sentence with concrete action verbs. No tool names. No preamble.",
+            },
+          },
+          required: ["name", "summary"],
+        },
+      },
+      mcpx_servers: {
+        type: "array",
+        description:
+          "MCPX tools grouped by their source server. Within each server, split into themes only when the server exposes distinct services (e.g. Gmail + Google Calendar on one server).",
+        items: {
+          type: "object",
+          properties: {
+            server: {
+              type: "string",
+              description: "Server name exactly as given in the inventory.",
+            },
+            themes: {
+              type: "array",
+              items: {
+                type: "object",
+                properties: {
+                  name: {
+                    type: "string",
+                    description: "Theme name (usually the service, e.g. Gmail)",
+                  },
+                  summary: {
+                    type: "string",
+                    description:
+                      "One sentence with concrete action verbs. No tool names.",
+                  },
+                },
+                required: ["name", "summary"],
+              },
+            },
+          },
+          required: ["server", "themes"],
+        },
+      },
+    },
+    required: ["internal_themes", "mcpx_servers"],
+  },
+};
+/**
+ * Flatten the inventory into the markdown listing that is embedded in the
+ * summarization prompt: built-in tools under their group headings, followed
+ * (when present) by MCPX tools under their server names. Tools are listed
+ * alphabetically within each section and servers are sorted by name.
+ */
+function renderInventoryForPrompt(inv: RawInventory): string {
+  const byName = (a: { name: string }, b: { name: string }) =>
+    a.name.localeCompare(b.name);
+  const lines: string[] = ["## Internal tools"];
+  for (const group of [...GROUP_ORDER, "other" as const]) {
+    const members = inv.internal.get(group);
+    if (members === undefined || members.length === 0) continue;
+    lines.push(`\n### ${GROUP_HEADINGS[group] ?? group}`);
+    lines.push(
+      ...[...members].sort(byName).map((t) => `- ${t.name}: ${t.description}`),
+    );
+  }
+  // No MCPX section at all when no server contributed tools.
+  if (inv.mcpByServer.size === 0) return lines.join("\n");
+  lines.push("\n## MCPX tools");
+  for (const server of [...inv.mcpByServer.keys()].sort()) {
+    lines.push(`\n### ${server}`);
+    const exposed = inv.mcpByServer.get(server) ?? [];
+    for (const t of [...exposed].sort(byName)) {
+      lines.push(`- ${t.name}: ${t.description || "(no description)"}`);
+    }
+  }
+  return lines.join("\n");
+}
+const SUMMARIZE_SYSTEM = `You summarize an AI agent's tool inventory into a terse "capabilities" document. The agent loads this document into every system prompt, so it MUST be compact — 1 line per theme.
+Rules:
+- Do NOT list specific tool names. The agent discovers exact names via the MCPX meta-tools (mcp_search, mcp_list_tools, mcp_info) when it actually needs to invoke one.
+- Group tools into natural themes.
+- For MCPX tools, one theme usually = one external service (Gmail, Google Calendar, GitHub, Linear, Slack, Google Docs, Google Drive, Google Sheets, Apple Notes, etc.). Split a single server into multiple themes when it clearly exposes distinct services.
+- For internal tools, use coarse buckets aligned with the provided groups (task management, virtual filesystem, search, threads, MCPX meta-tools, workers, self-reflection, capabilities). Merge overlapping groups if natural.
+- Each summary is ONE sentence with concrete action verbs. Present-tense imperative, no preamble.
+GOOD examples:
+  "Gmail — read, send, draft, search, and reply to emails; manage labels and threads"
+  "Virtual filesystem — read, write, edit, move, copy, delete, and navigate items in the agent's persistent memory store"
+  "GitHub — read and write repositories, branches, files, issues, pull requests, reviews, and labels"
+BAD examples (do not produce):
+  "Provides access to Gmail operations via tools like Gmail_SendEmail..."
+  "Tools for working with email"`;
+/**
+ * Ask Claude for thematic summaries of the inventory via a forced tool call.
+ *
+ * @returns The tool input when it has both top-level arrays, otherwise null.
+ *   Null is returned when no usable API key is configured, the request fails
+ *   or exceeds SUMMARIZE_TIMEOUT_MS, or the response has no tool_use block.
+ *   This function never throws; failures are logged at debug level.
+ */
+async function summarizeViaLLM(
+  inv: RawInventory,
+  config: Required<BotholomewConfig>,
+): Promise<SummarizedCapabilities | null> {
+  if (
+    !config.anthropic_api_key ||
+    config.anthropic_api_key === "your-api-key-here"
+  ) {
+    return null;
+  }
+  const client = new Anthropic({ apiKey: config.anthropic_api_key });
+  const userPrompt = `Summarize this tool inventory. Return via the \`${SUMMARIZE_TOOL_NAME}\` tool.\n\n${renderInventoryForPrompt(inv)}`;
+  // Handle for the timeout timer so it can be cancelled once the race settles.
+  let timer: ReturnType<typeof setTimeout> | undefined;
+  try {
+    const response = await Promise.race([
+      client.messages.create({
+        model: config.chunker_model,
+        max_tokens: SUMMARIZE_MAX_TOKENS,
+        system: SUMMARIZE_SYSTEM,
+        tools: [SUMMARIZE_TOOL],
+        tool_choice: { type: "tool", name: SUMMARIZE_TOOL_NAME },
+        messages: [{ role: "user", content: userPrompt }],
+      }),
+      new Promise<never>((_, reject) => {
+        timer = setTimeout(
+          () => reject(new Error("Capability summarization timeout")),
+          SUMMARIZE_TIMEOUT_MS,
+        );
+      }),
+    ]);
+    const toolBlock = response.content.find((b) => b.type === "tool_use");
+    if (!toolBlock || toolBlock.type !== "tool_use") return null;
+    const input = toolBlock.input as SummarizedCapabilities;
+    if (!Array.isArray(input.internal_themes)) return null;
+    if (!Array.isArray(input.mcpx_servers)) return null;
+    return input;
+  } catch (err) {
+    const reason = err instanceof Error ? err.message : String(err);
+    logger.debug(`Capability summarization failed: ${reason}`);
+    return null;
+  } finally {
+    // Without this, a pending timer outlives a successful call and can keep
+    // the process alive until SUMMARIZE_TIMEOUT_MS elapses.
+    if (timer !== undefined) clearTimeout(timer);
+  }
+}
+// ---------------------------------------------------------------------------
+// Rendering
+// ---------------------------------------------------------------------------
+/**
+ * Build the preamble lines shared by both renderers: the title, a
+ * "generated at" note stamped with `now` in ISO-8601 form, and a short
+ * explanation of how to look up exact tool names. Each text line is followed
+ * by an empty string so the joined output has blank lines between them.
+ */
+function renderHeader(now: Date): string[] {
+  const generatedAt = now.toISOString();
+  const header: string[] = [];
+  header.push("# Capabilities", "");
+  header.push(
+    `*Generated ${generatedAt}. Regenerate with \`botholomew capabilities\`, the \`capabilities_refresh\` tool, or the \`/capabilities\` skill.*`,
+    "",
+  );
+  header.push(
+    "A high-level summary of what this agent can do. Specific tool names are **not** listed — use `mcp_list_tools`, `mcp_search`, or `mcp_info` to find exact names when you need to invoke an external tool.",
+    "",
+  );
+  return header;
+}
+/**
+ * Render capabilities.md from LLM-produced themes.
+ *
+ * Internal themes are always listed. The external section shows, in order of
+ * precedence: a "not configured" note, the MCPX listing error, a "no tools"
+ * note, or one sub-heading per server with its themes as bullets.
+ */
+function renderSummarized(
+  summary: SummarizedCapabilities,
+  inv: RawInventory,
+  now: Date,
+): string {
+  const bullet = (t: Theme) => `- **${t.name}** — ${t.summary}`;
+  const head: string[] = [
+    ...renderHeader(now),
+    "## Internal capabilities",
+    "",
+    ...summary.internal_themes.map(bullet),
+    "",
+    "## External capabilities (via MCPX)",
+    "",
+  ];
+  let external: string[];
+  if (!inv.mcpConfigured) {
+    external = [
+      "_No MCPX servers configured. Add one with `botholomew mcpx add` and rerun `botholomew capabilities`._",
+    ];
+  } else if (inv.mcpError) {
+    external = [
+      `_Failed to list MCPX tools: ${inv.mcpError}. Check your MCPX server configuration._`,
+    ];
+  } else if (summary.mcpx_servers.length === 0) {
+    external = [
+      "_MCPX is configured but no tools are exposed by the connected servers._",
+    ];
+  } else {
+    external = summary.mcpx_servers.flatMap((srv) => [
+      `### ${srv.server}`,
+      "",
+      ...srv.themes.map(bullet),
+      "",
+    ]);
+  }
+  // trimEnd drops the blank line left after the final server block.
+  return [...head, ...external].join("\n").trimEnd();
+}
+/**
+ * Render capabilities.md without any LLM involvement.
+ *
+ * Used when summarization produced nothing (no API key, or the call failed).
+ * Each non-empty built-in group gets one canned sentence; MCPX servers are
+ * listed by name with a tool count only, leaving the agent to drill in with
+ * the MCPX meta-tools when it needs specifics.
+ */
+function renderFallback(inv: RawInventory, now: Date): string {
+  // Canned one-liners per built-in group; groups without an entry (e.g.
+  // "other") fall back to "(no summary)".
+  const internalSummaries: Record<string, string> = {
+    task: "create, list, view, update, complete, fail, and wait on tasks in the agent's work queue",
+    schedule:
+      "create and list recurring schedules that automatically generate tasks",
+    context:
+      "read, write, edit, move, copy, delete, and navigate items in the agent's persistent memory store; update beliefs and goals; read large tool results",
+    search: "keyword and semantic search over the virtual filesystem",
+    thread: "list and view past conversation threads and tool interactions",
+    mcp: "search, list, inspect, and execute tools exposed by configured MCPX servers",
+    worker: "spawn background workers to run tasks asynchronously",
+    capabilities: "refresh this capabilities file (the tool inventory)",
+  };
+  const lines: string[] = [
+    ...renderHeader(now),
+    "## Internal capabilities",
+    "",
+  ];
+  for (const group of [...GROUP_ORDER, "other" as const]) {
+    if ((inv.internal.get(group)?.length ?? 0) === 0) continue;
+    const title = GROUP_HEADINGS[group] ?? group;
+    const blurb = internalSummaries[group] ?? "(no summary)";
+    lines.push(`- **${title}** — ${blurb}`);
+  }
+  lines.push("", "## External capabilities (via MCPX)", "");
+  if (!inv.mcpConfigured) {
+    lines.push(
+      "_No MCPX servers configured. Add one with `botholomew mcpx add` and rerun `botholomew capabilities`._",
+    );
+  } else if (inv.mcpError) {
+    lines.push(
+      `_Failed to list MCPX tools: ${inv.mcpError}. Check your MCPX server configuration._`,
+    );
+  } else if (inv.mcpByServer.size === 0) {
+    lines.push(
+      "_MCPX is configured but no tools are exposed by the connected servers._",
+    );
+  } else {
+    lines.push(
+      "_(LLM summarization unavailable — set `anthropic_api_key` and rerun to generate themed summaries. Until then, use `mcp_list_tools` with each server to see what's exposed.)_",
+      "",
+    );
+    for (const server of [...inv.mcpByServer.keys()].sort()) {
+      const count = (inv.mcpByServer.get(server) ?? []).length;
+      lines.push(`- **${server}** — ${count} tool(s)`);
+    }
+  }
+  return lines.join("\n").trimEnd();
+}
+/**
+ * Produce the markdown body for capabilities.md along with tool totals.
+ *
+ * The inventory is collected first. If it contains anything, summarization
+ * via Claude is attempted; when that yields nothing (no usable API key, or
+ * the call failed) the static fallback rendering is used instead.
+ *
+ * @param now Timestamp stamped into the header; defaults to the current time.
+ * @param onPhase Optional progress callback for the CLI spinner.
+ */
+export async function generateCapabilitiesMarkdown(
+  mcpxClient: McpxClient | null,
+  config: Required<BotholomewConfig>,
+  now: Date = new Date(),
+  onPhase?: ProgressCallback,
+): Promise<GenerateResult> {
+  const inv = await collectInventory(mcpxClient, onPhase);
+  const counts: CapabilitiesCounts = {
+    internal: inv.internalTotal,
+    mcp: inv.mcpTotal,
+  };
+  // An empty inventory gains nothing from an API round trip; the fallback
+  // already says everything there is to say.
+  const inventoryIsEmpty =
+    inv.internalTotal === 0 && inv.mcpByServer.size === 0;
+  let summary: SummarizedCapabilities | null = null;
+  if (!inventoryIsEmpty) {
+    const apiKey = config.anthropic_api_key;
+    // Progress is only announced when a real key means a call will be made.
+    if (apiKey && apiKey !== "your-api-key-here") {
+      onPhase?.(
+        `Summarizing ${inv.internalTotal} internal + ${inv.mcpTotal} MCPX tools with Claude`,
+      );
+    }
+    summary = await summarizeViaLLM(inv, config);
+  }
+  if (summary === null) {
+    return { body: renderFallback(inv, now), counts };
+  }
+  return { body: renderSummarized(summary, inv, now), counts };
+}
+/** Outcome of writing capabilities.md. */
+export interface WriteResult {
+  /** Full path of the file that was written. */
+  path: string;
+  /** Tool totals behind the written document. */
+  counts: CapabilitiesCounts;
+  /** True when the file did not exist before this write. */
+  createdFile: boolean;
+}
+/**
+ * Regenerate `.botholomew/capabilities.md` and write it to disk.
+ *
+ * When the file already exists, its `loading` and `agent-modification`
+ * frontmatter values are carried over (so a human-edited `loading:` flag
+ * survives); any value that is missing falls back to the defaults
+ * `loading: always` and `agent-modification: true`, which are also used on
+ * first write.
+ *
+ * @returns The written path, the tool totals, and whether the file was new.
+ */
+export async function writeCapabilitiesFile(
+  projectDir: string,
+  mcpxClient: McpxClient | null,
+  config: Required<BotholomewConfig>,
+  onPhase?: ProgressCallback,
+): Promise<WriteResult> {
+  const target = join(getBotholomewDir(projectDir), CAPABILITIES_FILENAME);
+  const existing = Bun.file(target);
+  const alreadyThere = await existing.exists();
+  const defaults: ContextFileMeta = {
+    loading: "always",
+    "agent-modification": true,
+  };
+  let meta = defaults;
+  if (alreadyThere) {
+    const { meta: previous } = parseContextFile(await existing.text());
+    if (previous && typeof previous === "object") {
+      meta = {
+        loading: previous.loading ?? defaults.loading,
+        "agent-modification":
+          previous["agent-modification"] ?? defaults["agent-modification"],
+      };
+    }
+  }
+  const { body, counts } = await generateCapabilitiesMarkdown(
+    mcpxClient,
+    config,
+    new Date(),
+    onPhase,
+  );
+  onPhase?.(`Writing ${CAPABILITIES_FILENAME}`);
+  await Bun.write(target, serializeContextFile(meta, body));
+  return { path: target, counts, createdFile: !alreadyThere };
+}

package/src/init/index.ts CHANGED Viewed

@@ -1,16 +1,22 @@
 import { mkdir } from "node:fs/promises";
 import { join } from "node:path";
+import { loadConfig } from "../config/loader.ts";
 import {
   getBotholomewDir,
   getDbPath,
   getMcpxDir,
   getSkillsDir,
 } from "../constants.ts";
+import { writeCapabilitiesFile } from "../context/capabilities.ts";
 import { getConnection } from "../db/connection.ts";
 import { migrate } from "../db/schema.ts";
+import { createMcpxClient } from "../mcpx/client.ts";
+import { registerAllTools } from "../tools/registry.ts";
 import { logger } from "../utils/logger.ts";
 import {
   BELIEFS_MD,
+  CAPABILITIES_MD,
+  CAPABILITIES_SKILL,
   DEFAULT_CONFIG,
   DEFAULT_MCPX_SERVERS,
   GOALS_MD,
@@ -44,10 +50,12 @@ export async function initProject(
   await Bun.write(join(dotDir, "soul.md"), SOUL_MD);
   await Bun.write(join(dotDir, "beliefs.md"), BELIEFS_MD);
   await Bun.write(join(dotDir, "goals.md"), GOALS_MD);
+  await Bun.write(join(dotDir, "capabilities.md"), CAPABILITIES_MD);
   // Write default skills
   await Bun.write(join(skillsDir, "summarize.md"), SUMMARIZE_SKILL);
   await Bun.write(join(skillsDir, "standup.md"), STANDUP_SKILL);
+  await Bun.write(join(skillsDir, "capabilities.md"), CAPABILITIES_SKILL);
   // Write config (with placeholder API key)
   await Bun.write(
@@ -67,6 +75,19 @@ export async function initProject(
   await migrate(conn);
   conn.close();
+  // Populate capabilities.md with the real tool inventory. Seeded mcpx
+  // servers.json has no entries on first init, so this lists only the
+  // built-in tools; running `botholomew capabilities` later after
+  // adding MCPX servers picks those up.
+  registerAllTools();
+  const config = await loadConfig(projectDir);
+  const mcpxClient = await createMcpxClient(projectDir);
+  try {
+    await writeCapabilitiesFile(projectDir, mcpxClient, config);
+  } finally {
+    await mcpxClient?.close();
+  }
   // Update .gitignore
   await updateGitignore(projectDir);

package/src/init/templates.ts CHANGED Viewed

@@ -37,6 +37,28 @@ agent-modification: true
 - Get set up and ready to help.
 `;
+export const CAPABILITIES_MD = `---
+loading: always
+agent-modification: true
+---
+# Capabilities
+*This file is an auto-generated inventory of every tool available to Botholomew — built-in tools and tools exposed via configured MCPX servers.*
+*Regenerate with \`botholomew capabilities\`, the \`capabilities_refresh\` tool, or the \`/capabilities\` slash command.*
+_(Pending first scan. Run \`botholomew capabilities\` to populate.)_
+`;
+export const CAPABILITIES_SKILL = `---
+name: capabilities
+description: "Refresh capabilities.md — rescan internal and MCPX tools"
+arguments: []
+---
+Call \`capabilities_refresh\` to rescan every available tool (built-in and MCPX) and rewrite \`.botholomew/capabilities.md\`. After it finishes, give me a one-line summary of the counts.
+`;
 export const SUMMARIZE_SKILL = `---
 name: summarize
 description: "Summarize the current conversation"

package/src/skills/commands.ts CHANGED Viewed

@@ -4,11 +4,13 @@ import { renderSkill } from "./parser.ts";
 export interface SlashCommand {
   name: string;
   description: string;
+  takesArgs?: boolean;
 }
 export const BUILTIN_SLASH_COMMANDS: SlashCommand[] = [
   { name: "help", description: "Show command reference and shortcuts" },
   { name: "skills", description: "List available skills" },
+  { name: "clear", description: "End current thread and start a new one" },
   { name: "exit", description: "End the chat session" },
 ];
@@ -17,6 +19,7 @@ export interface SlashCommandContext {
   addSystemMessage: (content: string) => void;
   queueUserMessage: (content: string) => void;
   exit: () => void;
+  clearChat?: () => void;
 }
 /**
@@ -38,6 +41,15 @@ export function handleSlashCommand(
     return true;
   }
+  if (name === "clear") {
+    if (ctx.clearChat) {
+      ctx.clearChat();
+    } else {
+      ctx.addSystemMessage("/clear is only available in the chat TUI.");
+    }
+    return true;
+  }
   if (name === "skills") {
     if (ctx.skills.size === 0) {
       ctx.addSystemMessage(

package/src/tools/capabilities/refresh.ts ADDED Viewed

@@ -0,0 +1,53 @@
+import { z } from "zod";
+import { writeCapabilitiesFile } from "../../context/capabilities.ts";
+import type { ToolDefinition } from "../tool.ts";
+const inputSchema = z.object({
+  include_mcp: z
+    .boolean()
+    .optional()
+    .describe(
+      "When false, skip MCPX tool enumeration (internal tools only). Defaults to true.",
+    ),
+});
+const outputSchema = z.object({
+  path: z.string(),
+  internal_tool_count: z.number(),
+  mcp_tool_count: z.number(),
+  created_file: z.boolean(),
+  message: z.string(),
+  is_error: z.boolean(),
+});
+/**
+ * Agent-callable tool that regenerates `.botholomew/capabilities.md`.
+ * Passing `include_mcp: false` scans built-in tools only; otherwise the
+ * context's MCPX client is used as well. The result echoes the written path,
+ * both tool counts, and a human-readable message.
+ */
+export const capabilitiesRefreshTool = {
+  name: "capabilities_refresh",
+  description:
+    "[[ bash equivalent command: which ]] Rescan every available tool (built-in + configured MCPX servers) and rewrite `.botholomew/capabilities.md`. Call this when you think the inventory is stale — new MCP servers were added, tools were renamed, or the capabilities file was deleted. The regenerated file is automatically loaded into every subsequent system prompt.",
+  group: "capabilities",
+  inputSchema,
+  outputSchema,
+  execute: async (input, ctx) => {
+    // Only an explicit `false` disables MCPX; an omitted flag means "include".
+    const skipMcp = input.include_mcp === false;
+    const { path, counts, createdFile } = await writeCapabilitiesFile(
+      ctx.projectDir,
+      skipMcp ? null : ctx.mcpxClient,
+      ctx.config,
+    );
+    const notes = [
+      `${counts.internal} internal tool(s)`,
+      `${counts.mcp} MCPX tool(s)`,
+    ];
+    if (skipMcp) notes.push("MCPX skipped");
+    if (createdFile) notes.push("file created");
+    return {
+      path,
+      internal_tool_count: counts.internal,
+      mcp_tool_count: counts.mcp,
+      created_file: createdFile,
+      message: `Wrote capabilities.md (${notes.join(", ")})`,
+      is_error: false,
+    };
+  },
+} satisfies ToolDefinition<typeof inputSchema, typeof outputSchema>;

package/src/tools/registry.ts CHANGED Viewed

@@ -1,5 +1,6 @@
+// Capabilities tools
+import { capabilitiesRefreshTool } from "./capabilities/refresh.ts";
 // Context tools
 import { readLargeResultTool } from "./context/read-large-result.ts";
 import { contextRefreshTool } from "./context/refresh.ts";
 import { contextSearchTool } from "./context/search.ts";
@@ -76,6 +77,9 @@ export function registerAllTools(): void {
   registerTool(updateGoalsTool);
   registerTool(readLargeResultTool);
+  // Capabilities
+  registerTool(capabilitiesRefreshTool);
   // Schedule
   registerTool(createScheduleTool);
   registerTool(listSchedulesTool);

package/src/tui/App.tsx CHANGED Viewed

@@ -2,6 +2,7 @@ import { Box, Static, Text, useApp, useInput } from "ink";
 import { useCallback, useEffect, useMemo, useRef, useState } from "react";
 import {
   type ChatSession,
+  clearChatSession,
   endChatSession,
   sendMessage,
   startChatSession,
@@ -126,6 +127,7 @@ export function App({
 }: AppProps) {
   const { exit } = useApp();
   const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const [messagesEpoch, setMessagesEpoch] = useState(0);
   const [inputValue, setInputValue] = useState("");
   const [inputHistory, setInputHistory] = useState<string[]>([]);
   const [isLoading, setIsLoading] = useState(false);
@@ -490,7 +492,8 @@ export function App({
             "  ⌥+Enter        Insert newline",
             "  ↑/↓            Browse input history",
             "  /              Open slash-command autocomplete",
-            "  Tab/Enter      Accept highlighted command (popup open)",
+            "  Enter          Run highlighted command / insert if it takes args (popup open)",
+            "  Tab            Insert highlighted command without submitting (popup open)",
             "  ↑/↓            Move highlight (popup open)",
             "  Esc            Close popup",
             "",
@@ -534,6 +537,7 @@ export function App({
             "Commands:",
             "  /help           Show this help",
             "  /skills         List available skills",
+            "  /clear          End current thread and start a new one",
             "  /exit           End the chat session",
             ...skillLines,
           ].join("\n"),
@@ -563,6 +567,42 @@ export function App({
             processQueue();
           },
           exit,
+          clearChat: () => {
+            const session = sessionRef.current;
+            if (!session) return;
+            // Drain any queued messages so they don't leak into the new thread.
+            queueRef.current.length = 0;
+            syncQueue();
+            clearChatSession(session)
+              .then(({ previousThreadId, newThreadId }) => {
+                // Ink's <Static> writes messages to terminal scrollback and
+                // can't un-write them, so setMessages alone leaves the old
+                // lines visible. Clear the terminal (including scrollback)
+                // and bump the epoch key on <Static> to force a fresh mount.
+                process.stdout.write("\x1b[2J\x1b[3J\x1b[H");
+                setMessages([
+                  {
+                    id: msgId(),
+                    role: "system",
+                    content: `Started a new chat thread (${newThreadId}). Previous thread saved — resume with: botholomew chat --thread-id ${previousThreadId}`,
+                    timestamp: new Date(),
+                  },
+                ]);
+                setMessagesEpoch((n) => n + 1);
+                setChatTitle(undefined);
+              })
+              .catch((err) => {
+                setMessages((prev) => [
+                  ...prev,
+                  {
+                    id: msgId(),
+                    role: "system",
+                    content: `Failed to clear chat: ${err}`,
+                    timestamp: new Date(),
+                  },
+                ]);
+              });
+          },
         });
         if (handled) return;
       }
@@ -595,6 +635,10 @@ export function App({
       ? Array.from(sessionSkills.values()).map((s) => ({
           name: s.name,
           description: s.description,
+          takesArgs:
+            s.arguments.length > 0 ||
+            /\$ARGUMENTS\b/.test(s.body) ||
+            /\$[1-9]\b/.test(s.body),
         }))
       : [];
     return buildSlashCommands(BUILTIN_SLASH_COMMANDS, skillList);
@@ -640,7 +684,7 @@ export function App({
           node always has proper terminal width in its Yoga layout.
           Otherwise Ink's border renderer crashes with a negative
           contentWidth when tool-call boxes are rendered at width 0. */}
-      <Static items={messages}>
+      <Static key={messagesEpoch} items={messages}>
         {(msg) => <MessageBubble key={msg.id} message={msg} />}
       </Static>

package/src/tui/components/InputBar.tsx CHANGED Viewed

@@ -9,7 +9,7 @@ import {
   useState,
 } from "react";
 import type { SlashCommand } from "../../skills/commands.ts";
-import { getSlashMatches } from "../slashCompletion.ts";
+import { getSlashMatches, shouldSubmitOnEnter } from "../slashCompletion.ts";
 import { SlashCommandPopup } from "./SlashCommandPopup.tsx";
 interface InputBarProps {
@@ -128,11 +128,23 @@ export const InputBar = memo(function InputBar({
         ? getSlashMatches(val, slashCommandsRef.current ?? [])
         : null;
-      const acceptSelection = () => {
+      const acceptSelection = (mode: "insert" | "submit") => {
         if (!popupOpen) return false;
         const chosen =
           popupOpen[Math.min(selectedIndexRef.current, popupOpen.length - 1)];
         if (!chosen) return false;
+        if (mode === "submit") {
+          const completed = `/${chosen.name}`;
+          valueRef.current = completed;
+          cursorPosRef.current = 0;
+          onChangeRef.current(completed);
+          setCursorPos(0);
+          historyIndexRef.current = -1;
+          setHistoryIndex(-1);
+          savedInput.current = "";
+          onSubmitRef.current(completed);
+          return true;
+        }
         const completed = `/${chosen.name} `;
         valueRef.current = completed;
         cursorPosRef.current = completed.length;
@@ -152,11 +164,16 @@ export const InputBar = memo(function InputBar({
         return;
       }
-      // Enter: if popup is open, accept selection (do not submit).
-      // Otherwise submit as before.
+      // Enter: if popup is open, accept the highlighted entry. No-arg
+      // commands submit in one keystroke; commands that take args insert
+      // `/<name> ` and wait for the user to finish typing.
       if (key.return) {
         if (popupOpen && !key.shift && !key.meta) {
-          acceptSelection();
+          const chosen =
+            popupOpen[Math.min(selectedIndexRef.current, popupOpen.length - 1)];
+          acceptSelection(
+            chosen && shouldSubmitOnEnter(chosen) ? "submit" : "insert",
+          );
           return;
         }
         if (key.shift || key.meta) {
@@ -179,10 +196,10 @@ export const InputBar = memo(function InputBar({
         return;
       }
-      // Tab: accept popup selection if open. No-op otherwise.
+      // Tab: insert the highlighted completion so the user can keep editing.
       if (key.tab) {
         if (popupOpen) {
-          acceptSelection();
+          acceptSelection("insert");
         }
         return;
       }

package/src/tui/slashCompletion.ts CHANGED Viewed

@@ -28,11 +28,25 @@ export function getSlashMatches(
 export function buildSlashCommands(
   builtins: SlashCommand[],
-  skills: Iterable<{ name: string; description: string }>,
+  skills: Iterable<{ name: string; description: string; takesArgs?: boolean }>,
 ): SlashCommand[] {
   const out: SlashCommand[] = [...builtins];
   for (const s of skills) {
-    out.push({ name: s.name, description: s.description });
+    out.push({
+      name: s.name,
+      description: s.description,
+      takesArgs: s.takesArgs,
+    });
   }
   return out;
 }
+/**
+ * Decide whether pressing Enter on a highlighted popup entry should both
+ * accept the completion and immediately submit. True for no-argument
+ * commands (single-Enter runs them); false for commands that take args,
+ * where we insert `/<name> ` and wait for the user to finish typing.
+ */
+export function shouldSubmitOnEnter(cmd: SlashCommand): boolean {
+  return !cmd.takesArgs;
+}