npm - mulmoclaude - Versions diffs - 0.6.2 → 0.6.4 - Mend

mulmoclaude 0.6.2 → 0.6.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (182) hide show

package/README.md +26 -0
package/bin/mulmoclaude.js +11 -1
package/client/assets/JsonEditor-D6WBWLoa.js +10 -0
package/client/assets/JsonEditor-Di5xGeZY.css +1 -0
package/client/assets/_plugin-vue_export-helper-BOai-rQB.js +1 -0
package/client/assets/chunk-D8eiyYIV-LcKZGJv5.js +1 -0
package/client/assets/{html2canvas-CDGcmOD3-Bkf2uOth.js → html2canvas-CDGcmOD3-XVrO-eyz.js} +1 -1
package/client/assets/index-CyBr8Mkr.css +2 -0
package/client/assets/index-zZIqEbNX.js +5106 -0
package/client/assets/{index.es-DqtpmBm8-D9mAh_KQ.js → index.es-DqtpmBm8-DHT6q10o.js} +1 -1
package/client/assets/material-symbols-outlined-DtIK7AQn.woff2 +0 -0
package/client/assets/runtime-protocol-vue-D6kcV0wa.js +1 -0
package/client/assets/{runtime-vue-BVUzgYGA.js → runtime-vue-fFYhnNg3.js} +1 -1
package/client/assets/{vue-C8UuIO9J.js → vue-D4w8THF_.js} +1 -1
package/client/assets/vue-i18n-CQbxVmNs.js +3 -0
package/client/assets/vue.runtime.esm-bundler-BTyIdNAI.js +4 -0
package/client/index.html +10 -10
package/package.json +9 -8
package/server/agent/backend/claude-code.ts +34 -0
package/server/agent/backend/fake-echo.ts +370 -0
package/server/agent/backend/index.ts +16 -1
package/server/agent/config.ts +74 -24
package/server/agent/index.ts +104 -80
package/server/agent/mcpFailureMonitor.ts +167 -0
package/server/agent/mcpPreflight.ts +185 -0
package/server/agent/prompt.ts +50 -359
package/server/agent/stdioHttpShim.ts +171 -0
package/server/agent/stream.ts +12 -1
package/server/api/routes/encore.ts +55 -0
package/server/api/routes/files.ts +22 -0
package/server/api/routes/mulmo-script.ts +19 -1
package/server/api/routes/schedulerHandlers.ts +52 -4
package/server/api/routes/sessions.ts +15 -0
package/server/api/routes/skills.ts +263 -0
package/server/build/dispatcher.mjs +299 -0
package/server/encore/INVARIANTS.md +272 -0
package/server/encore/boot.ts +39 -0
package/server/encore/closure.ts +36 -0
package/server/encore/cycle.ts +276 -0
package/server/encore/dispatch.ts +103 -0
package/server/encore/handlers/amend.ts +99 -0
package/server/encore/handlers/appendNote.ts +74 -0
package/server/encore/handlers/defineEncore.ts +42 -0
package/server/encore/handlers/listTickets.ts +107 -0
package/server/encore/handlers/markStepDone.ts +41 -0
package/server/encore/handlers/markTargetSkipped.ts +33 -0
package/server/encore/handlers/query.ts +138 -0
package/server/encore/handlers/recordValues.ts +44 -0
package/server/encore/handlers/resolveNotification.ts +121 -0
package/server/encore/handlers/setup.ts +81 -0
package/server/encore/handlers/shared.ts +137 -0
package/server/encore/handlers/snooze.ts +87 -0
package/server/encore/handlers/startObligationChat.ts +64 -0
package/server/encore/handlers/startSetupChat.ts +50 -0
package/server/encore/lock.ts +61 -0
package/server/encore/notifier.ts +123 -0
package/server/encore/obligation.ts +25 -0
package/server/encore/paths.ts +78 -0
package/server/encore/reconcile.ts +661 -0
package/server/encore/tick.ts +191 -0
package/server/encore/yaml-fm.ts +63 -0
package/server/events/notifications.ts +19 -91
package/server/index.ts +94 -9
package/server/notifier/engine.ts +102 -1
package/server/notifier/macosReminderAdapter.ts +30 -0
package/server/notifier/runtime-api.ts +41 -1
package/server/notifier/types.ts +15 -2
package/server/plugins/runtime.ts +11 -2
package/server/prompts/index.ts +39 -0
package/server/prompts/system/journal-pointer.md +12 -0
package/server/prompts/system/memory-management-atomic.md +33 -0
package/server/prompts/system/memory-management-topic.md +60 -0
package/server/prompts/system/news-concierge.md +24 -0
package/server/prompts/system/sandbox-tools.md +10 -0
package/server/prompts/system/sources-context.md +16 -0
package/server/prompts/system/system.md +91 -0
package/server/system/announceOptionalDeps.ts +57 -0
package/server/system/appVersion.ts +34 -0
package/server/system/config.ts +17 -1
package/server/system/docker.ts +14 -6
package/server/system/env.ts +18 -5
package/server/system/optionalDeps.ts +129 -0
package/server/utils/cli-flags.d.mts +14 -0
package/server/utils/cli-flags.mjs +53 -0
package/server/utils/files/encore-io.ts +111 -0
package/server/utils/time.ts +6 -0
package/server/workspace/helps/business.md +2 -2
package/server/workspace/helps/encore-dsl.md +482 -0
package/server/workspace/helps/index.md +15 -13
package/server/workspace/helps/mulmoscript.md +3 -3
package/server/workspace/helps/sandbox.md +2 -2
package/server/workspace/hooks/dispatcher.ts +7 -5
package/server/workspace/hooks/provision.ts +6 -3
package/server/workspace/paths.ts +13 -4
package/server/workspace/skills/catalog.ts +355 -0
package/server/workspace/skills/external/catalog.ts +283 -0
package/server/workspace/skills/external/clone.ts +129 -0
package/server/workspace/skills/external/id.ts +194 -0
package/server/workspace/skills/external/install.ts +417 -0
package/server/workspace/skills/external/presets.ts +50 -0
package/server/workspace/skills-preset.ts +29 -17
package/server/workspace/workspace.ts +10 -5
package/src/App.vue +37 -8
package/src/components/FileContentRenderer.vue +102 -9
package/src/components/JsonEditor.vue +160 -0
package/src/components/NotificationBell.vue +35 -3
package/src/components/PluginLauncher.vue +20 -41
package/src/components/RightSidebar.vue +19 -0
package/src/components/SettingsMcpTab.vue +58 -11
package/src/components/SettingsModal.vue +22 -1
package/src/components/StackView.vue +10 -1
package/src/components/TodoExplorer.vue +16 -0
package/src/components/todo/TodoKanbanView.vue +34 -6
package/src/composables/useNotifications.ts +21 -1
package/src/config/apiRoutes.ts +0 -6
package/src/config/mcpCatalog.ts +12 -7
package/src/config/mcpTypes.ts +5 -0
package/src/config/roles.ts +52 -15
package/src/config/systemFileDescriptors.ts +12 -0
package/src/lang/de.ts +108 -12
package/src/lang/en.ts +105 -11
package/src/lang/es.ts +106 -11
package/src/lang/fr.ts +106 -11
package/src/lang/ja.ts +104 -11
package/src/lang/ko.ts +105 -11
package/src/lang/pt-BR.ts +106 -11
package/src/lang/zh.ts +103 -11
package/src/main.ts +1 -0
package/src/plugins/_generated/metas.ts +4 -0
package/src/plugins/_generated/registrations.ts +2 -0
package/src/plugins/_generated/server-bindings.ts +5 -0
package/src/plugins/encore/EncoreDashboard.vue +504 -0
package/src/plugins/encore/EncoreRedirect.vue +116 -0
package/src/plugins/encore/View.vue +36 -0
package/src/plugins/encore/defineEncoreDefinition.ts +74 -0
package/src/plugins/encore/defineEncoreMeta.ts +13 -0
package/src/plugins/encore/index.ts +93 -0
package/src/plugins/encore/manageEncoreDefinition.ts +100 -0
package/src/plugins/encore/manageEncoreMeta.ts +36 -0
package/src/plugins/manageSkills/View.vue +832 -30
package/src/plugins/manageSkills/categories.ts +125 -0
package/src/plugins/manageSkills/meta.ts +30 -0
package/src/plugins/markdown/definition.ts +3 -3
package/src/plugins/meta-types.ts +5 -0
package/src/plugins/presentMulmoScript/Preview.vue +3 -3
package/src/plugins/presentMulmoScript/View.vue +157 -33
package/src/plugins/presentMulmoScript/meta.ts +4 -0
package/src/plugins/scheduler/View.vue +45 -9
package/src/plugins/scheduler/calendarDefinition.ts +6 -2
package/src/plugins/scheduler/multiDayHelpers.ts +95 -0
package/src/plugins/skill/View.vue +1 -5
package/src/plugins/spreadsheet/View.vue +3 -3
package/src/plugins/spreadsheet/definition.ts +1 -1
package/src/plugins/textResponse/Preview.vue +14 -1
package/src/plugins/textResponse/View.vue +39 -24
package/src/plugins/wiki/components/WikiPageBody.vue +4 -0
package/src/router/index.ts +11 -0
package/src/router/pageRoutes.ts +1 -0
package/src/types/encore-dsl/at-expression.ts +120 -0
package/src/types/encore-dsl/at-resolver.ts +32 -0
package/src/types/encore-dsl/cadence.ts +289 -0
package/src/types/encore-dsl/schema.ts +288 -0
package/src/types/notification.ts +2 -1
package/src/types/session.ts +6 -0
package/src/types/sse.ts +5 -0
package/src/types/toolCallHistory.ts +7 -0
package/src/utils/agent/eventDispatch.ts +26 -5
package/src/utils/agent/mcpHint.ts +50 -0
package/src/utils/image/htmlSrcAttrs.ts +117 -13
package/src/utils/session/sessionEntries.ts +8 -32
package/client/assets/PluginScopedRoot-YjvQq0Nn.js +0 -3
package/client/assets/chunk-CernVdwh.js +0 -1
package/client/assets/chunk-D8eiyYIV-CAXpUwLd.js +0 -1
package/client/assets/index-BwrlMMHr.js +0 -5005
package/client/assets/index-CvvNuegU.css +0 -2
package/client/assets/material-symbols-outlined-BOZVWuR3.woff2 +0 -0
package/client/assets/runtime-protocol-vue-C1To4M3t.js +0 -1
package/client/assets/vue.runtime.esm-bundler-DQ8Kjjui.js +0 -4
package/server/api/routes/notifications.ts +0 -195
package/server/notifier/legacy-adapters.ts +0 -76
package/server/workspace/hooks/dispatcher.mjs +0 -300
package/src/composables/useSelectedResult.ts +0 -49

package/server/agent/backend/fake-echo.ts ADDED Viewed

@@ -0,0 +1,370 @@
+// Test-only LLM backend. Loaded by `getActiveBackend()` only when
+// `MULMOCLAUDE_FAKE_AGENT=1` (CI workflow boot wiring), and re-usable
+// from unit tests via `setFakeResponse()` / `resetFakeResponse()`.
+//
+// Default behavior:
+//   - emits a synthesized `claudeSessionId` so the orchestrator's
+//     resume bookkeeping sees the same shape as a real run
+//   - short-circuits `/<slug>` slash-command turns by reading the
+//     seeded SKILL.md and echoing the canary marker line
+//   - emits the concatenated per-session message history as the
+//     assistant text reply, so context-recall tests (session L-12)
+//     see prior turn content
+//
+// Tool dispatch: when the user prompt matches a known shape (see
+// detectToolCalls), fake-echo emits the corresponding tool_call
+// AND posts the args to the same internal plugin endpoint the MCP
+// bridge would use under real Claude (see PLUGIN_ENDPOINTS). The
+// handler runs unmodified, the artifact lands on disk, and the
+// canvas mounts the plugin View — fake at the LLM seam only, real
+// from the tool dispatch downward. Tests that need an LLM that
+// actually reasons (presentForm field design, agent-driven slug
+// choice in skill creation, etc.) still stay gated on
+// `E2E_LIVE_NO_LLM=1`.
+import { randomUUID } from "node:crypto";
+import { readFile } from "node:fs/promises";
+import path from "node:path";
+import { getCurrentToken } from "../../api/auth/token.js";
+import { makeUuid } from "../../utils/id.js";
+import { API_ROUTES } from "../../../src/config/apiRoutes.js";
+import { EVENT_TYPES } from "../../../src/types/events.js";
+import { WORKSPACE_DIRS } from "../../workspace/paths.js";
+import type { AgentEvent } from "../stream.js";
+import type { AgentInput, LLMBackend } from "./types.js";
+/** Loosely-typed JSON body returned by a plugin endpoint. Only the
+ *  three named fields are inspected in this file; the whole object
+ *  is spread into the body pushed to the tool-result route. */
+interface PluginEnvelope {
+  /** When not `undefined`, the envelope is pushed to the internal
+   *  tool-result endpoint. */
+  data?: unknown;
+  /** Used as tool-result text when it is a string. */
+  message?: unknown;
+  /** Appended to the tool-result text when it is a string. */
+  instructions?: unknown;
+  [key: string]: unknown;
+}
+/** One tool round-trip for the fake backend to emit. */
+export interface FakeToolCall {
+  toolName: string;
+  args: unknown;
+  /** Result string emitted in the matching `tool_call_result`.
+   *  When omitted, a tool listed in `PLUGIN_ENDPOINTS` is dispatched
+   *  to its plugin endpoint and the response text is used; any other
+   *  tool gets the literal `{"ok":true}` JSON. */
+  result?: string;
+}
+/** What a response generator asks the fake backend to emit for one
+ *  agent turn. */
+export interface FakeResponse {
+  /** Tool calls emitted before the text block. The default
+   *  generator only emits the ones `detectToolCalls` recognises in
+   *  the prompt — tests that want arbitrary tool events drive them
+   *  through `setFakeResponse()`. */
+  toolCalls?: readonly FakeToolCall[];
+  /** Assistant text. Omit to skip the text event entirely. */
+  text?: string;
+  /** When set, emit a single `error` AgentEvent with this message
+   *  and stop — mirrors what the claude-code backend does when the
+   *  CLI exits non-zero (`readAgentEvents`). Tool calls / text that
+   *  would otherwise follow are suppressed. */
+  error?: string;
+  /** Emit the `tool_call` for each `toolCalls` entry but NOT the
+   *  paired `tool_call_result` — simulates a truncated / partial
+   *  stream where the model died mid tool round-trip. */
+  omitToolResult?: boolean;
+}
+/** Response generator signature. May be synchronous or async; the
+ *  agent loop awaits the result either way. */
+export type FakeResponseFn = (input: AgentInput) => FakeResponse | Promise<FakeResponse>;
+// Per-session conversation memory so context-recall tests see prior
+// turn content in the reply. Keyed by `input.sessionId`; each value
+// is that session's user messages in arrival order. Cleared by
+// `resetFakeResponse()`.
+const sessionTurns = new Map<string, string[]>();
+/** Default response generator for the fake backend. Checks, in
+ *  order: the forced-error marker, then a `/<slug>` slash command
+ *  backed by a seeded SKILL.md, then falls back to echoing the
+ *  session's accumulated messages plus any detected tool calls.
+ *  Only the fallback path appends the message to `sessionTurns`. */
+async function defaultResponse(input: AgentInput): Promise<FakeResponse> {
+  // Prompt-driven error trigger for e2e-live. The in-process
+  // `setFakeResponse()` knob is unreachable from a browser-driven
+  // spec (separate process), so the error-banner UI canary opts in
+  // by sending a message containing this exact marker. Prod never
+  // reaches fake-echo (real Claude backend) so this is inert there.
+  if (input.message.includes("__FAKE_ERROR__")) {
+    // Message text is rendered through marked() in the chat card,
+    // so keep it free of markdown-significant characters (no `__`,
+    // `*`, backticks) — the e2e-live canary asserts on a literal
+    // substring of this string.
+    return { error: "fake-echo forced error for the e2e-live error-banner canary" };
+  }
+  // Slash-command turn shape: the SPA's "Run" button on a skill row
+  // (e2e-live L-22) starts a new chat with `/<slug>` as the only
+  // user message. Real Claude resolves this through its skill
+  // pipeline and uses the SKILL.md body as system prompt; here we
+  // short-circuit to read the seeded body and apply the
+  // "respond with this exact line" heuristic the e2e-live canaries
+  // rely on. Falls through to default echo on no match.
+  const slashMatch = input.message.trim().match(/^\/([a-z0-9][a-z0-9-]*)$/i);
+  if (slashMatch) {
+    const skillReply = await replyFromSeededSkill(input.workspacePath, slashMatch[1]);
+    if (skillReply !== null) return { text: skillReply };
+  }
+  // Default echo: record this turn, then reply with every message
+  // seen so far in the session, separated by blank lines.
+  const history = sessionTurns.get(input.sessionId) ?? [];
+  history.push(input.message);
+  sessionTurns.set(input.sessionId, history);
+  const toolCalls = detectToolCalls(input.message);
+  return {
+    toolCalls,
+    text: history.join("\n\n"),
+  };
+}
+// ── Tool-call pattern detectors ───────────────────────────────────
+//
+// Each detector matches one e2e-live prompt shape. The fake-echo
+// loop below dispatches each detected call to the matching server-
+// side plugin endpoint (see PLUGIN_ENDPOINTS) so the real handler
+// runs, the artifact lands on disk, and the canvas mounts the View.
+// Production never reaches this code path — gated by
+// MULMOCLAUDE_FAKE_AGENT=1 at server boot.
+/** Match a prompt that names `presentMulmoScript` and carries a
+ *  quoted `filePath: "..."` argument. Returns the tool call, or
+ *  `null` when either part is missing. */
+function detectPresentMulmoScript(message: string): FakeToolCall | null {
+  const mentionsTool = /presentMulmoScript/i.test(message);
+  const quotedPath = mentionsTool ? /filePath:\s*["']([^"']+)["']/.exec(message) : null;
+  if (quotedPath === null) return null;
+  const [, filePath] = quotedPath;
+  return { toolName: "presentMulmoScript", args: { filePath } };
+}
+/** Match a prompt that names `presentHtml` and contains markup.
+ *  Everything from the first `<` to the end of the message is taken
+ *  as the HTML payload. Returns `null` when the tool name or any
+ *  markup is absent.
+ *
+ *  The handler expects a self-contained document, so the payload is
+ *  normalised:
+ *   - starts with `<!DOCTYPE` → used verbatim
+ *   - starts with `<html`     → only the doctype is prepended, so
+ *     the document is not nested inside a second `<html><body>`
+ *   - anything else           → wrapped as a fragment */
+function detectPresentHtml(message: string): FakeToolCall | null {
+  if (!/presentHtml/i.test(message)) return null;
+  const idx = message.indexOf("<");
+  if (idx < 0) return null;
+  const fragment = message.slice(idx).trim();
+  let html: string;
+  if (/^<!DOCTYPE/i.test(fragment)) {
+    html = fragment;
+  } else if (/^<html[\s>]/i.test(fragment)) {
+    html = `<!DOCTYPE html>${fragment}`;
+  } else {
+    html = `<!DOCTYPE html><html><body>${fragment}</body></html>`;
+  }
+  return { toolName: "presentHtml", args: { html } };
+}
+/** Match a prompt that names `presentForm` and build a one-field
+ *  text form from it. Title, field id and label are taken from
+ *  quoted `titled '…'`, `id='…'` and `label='…'` clauses when
+ *  present, with fixed fallbacks otherwise; the field is required
+ *  when the prompt mentions "required" anywhere. */
+function detectPresentForm(message: string): FakeToolCall | null {
+  if (!/presentForm/i.test(message)) return null;
+  // First capture group of `pattern`, or `fallback` when it does not match.
+  const quoted = (pattern: RegExp, fallback: string): string => message.match(pattern)?.[1] ?? fallback;
+  const title = quoted(/titled\s+['"]([^'"]+)['"]/i, "Quick check");
+  const field = {
+    id: quoted(/id\s*=\s*['"]([^'"]+)['"]/i, "field1"),
+    type: "text",
+    label: quoted(/label\s*=\s*['"]([^'"]+)['"]/i, "Field"),
+    required: /required/i.test(message),
+    description: "auto-generated by fake-echo",
+  };
+  return { toolName: "presentForm", args: { title, fields: [field] } };
+}
+/** Match a prompt that names `presentChart` and build a single bar
+ *  chart from it.
+ *
+ *  The title comes from a quoted `titled '…'` clause (fallback
+ *  "Untitled"). Data points are every `<word of 3+ letters> <1-6
+ *  digit number>` pair in the prompt; when none are found the chart
+ *  falls back to A/B/C = 1/2/3. Pairs that start inside the title
+ *  clause are ignored so a title such as 'Sales 2024' is not
+ *  misread as a data point. */
+function detectPresentChart(message: string): FakeToolCall | null {
+  if (!/presentChart/i.test(message)) return null;
+  const titleMatch = message.match(/titled\s+['"]([^'"]+)['"]/i);
+  // Half-open span [titleStart, titleEnd) of the title clause; both
+  // are -1 when there is no title, which keeps every pair below.
+  const titleStart = titleMatch?.index ?? -1;
+  const titleEnd = titleMatch ? titleStart + titleMatch[0].length : -1;
+  const pairs = Array.from(message.matchAll(/\b([A-Za-z]{3,})\s+(\d{1,6})\b/g))
+    .filter((match) => {
+      const at = match.index ?? 0;
+      return at < titleStart || at >= titleEnd;
+    })
+    .map(([, label, value]) => ({ label, value: Number(value) }));
+  const labels = pairs.length > 0 ? pairs.map((pair) => pair.label) : ["A", "B", "C"];
+  const values = pairs.length > 0 ? pairs.map((pair) => pair.value) : [1, 2, 3];
+  const title = titleMatch?.[1] ?? "Untitled";
+  return {
+    toolName: "presentChart",
+    args: {
+      document: {
+        title,
+        charts: [
+          {
+            title,
+            type: "bar",
+            option: {
+              xAxis: { type: "category", data: labels },
+              yAxis: { type: "value" },
+              series: [{ type: "bar", data: values }],
+            },
+          },
+        ],
+      },
+    },
+  };
+}
+/** Run every detector against the prompt and collect the tool
+ *  calls that matched, in detector order. Returns `undefined`
+ *  (not an empty array) when nothing matched. */
+function detectToolCalls(message: string): FakeToolCall[] | undefined {
+  const detectors = [detectPresentMulmoScript, detectPresentHtml, detectPresentForm, detectPresentChart];
+  const hits = detectors.map((detect) => detect(message)).filter((hit): hit is FakeToolCall => hit !== null);
+  return hits.length === 0 ? undefined : hits;
+}
+// ── Plugin dispatch ───────────────────────────────────────────────
+//
+// Maps each fake-detected tool to the same internal API the MCP
+// bridge would post to in a real run, so the actual server-side
+// handler runs end-to-end: artifact saved, canvas slug returned.
+// Anything not in this table falls back to a synthesized success
+// envelope (caller can override via FakeToolCall.result).
+// Keys are tool names (looked up by `call.toolName`); values are
+// server-relative paths appended to `http://localhost:<port>`.
+const PLUGIN_ENDPOINTS: Readonly<Record<string, string>> = {
+  presentForm: "/api/form",
+  presentHtml: "/api/html",
+  presentChart: "/api/chart",
+  presentMulmoScript: "/api/mulmoScript/save",
+};
+// Mirrors what server/agent/mcp-server.ts#handleToolCall does for
+// the real MCP bridge:
+//   1. POST to the plugin endpoint to get the envelope back
+//   2. If envelope.data is set, PUSH the envelope to
+//      /api/internal/tool-result — this is what surfaces the result
+//      to the canvas as a ToolResultComplete (toolName + uuid
+//      stamped by the bridge so the plugin can't impersonate).
+//   3. Return the text representation (message + instructions) so
+//      the matching `tool_call_result` event carries something
+//      meaningful for the tool-call history pane.
+/** Resolve the result string for one fake tool call.
+ *
+ *  @param call - Tool call to dispatch; an explicit `call.result` is
+ *    returned as-is without any network traffic.
+ *  @param port - Port of the local server; requests go to
+ *    `http://localhost:<port>`.
+ *  @param chatSessionId - Sent as the `session` query parameter on
+ *    the tool-result push.
+ *  @returns `call.result` when set; `{"ok":true}` for tools with no
+ *    entry in `PLUGIN_ENDPOINTS`; otherwise the envelope's string
+ *    `message` / `instructions` joined by a newline, or "Done" when
+ *    neither is a string. A non-OK response from either request, or
+ *    any error thrown inside the `try`, is returned as a JSON
+ *    `{ error }` string. */
+async function dispatchToPlugin(call: FakeToolCall, port: number, chatSessionId: string): Promise<string> {
+  if (call.result !== undefined) return call.result;
+  const endpoint = PLUGIN_ENDPOINTS[call.toolName];
+  if (!endpoint) return '{"ok":true}';
+  // Bearer header is attached only when a token is currently set.
+  const token = getCurrentToken();
+  const authHeaders: Record<string, string> = token ? { Authorization: `Bearer ${token}` } : {};
+  try {
+    const response = await fetch(`http://localhost:${port}${endpoint}`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", ...authHeaders },
+      body: JSON.stringify(call.args),
+    });
+    if (!response.ok) {
+      // Error body is truncated to 200 characters to keep the tool result short.
+      const errBody = await response.text();
+      return JSON.stringify({ error: `plugin ${call.toolName} returned ${response.status}: ${errBody.slice(0, 200)}` });
+    }
+    const envelope = ((await response.json()) ?? {}) as PluginEnvelope;
+    if (envelope.data !== undefined) {
+      // Query key is `session`, not `chatSessionId` — matches the
+      // `getSessionQuery(req)` reader and what the MCP bridge's
+      // postJson(...) helper passes (`?session=${SESSION_ID}`).
+      const toolResultUrl = `http://localhost:${port}${API_ROUTES.agent.internal.toolResult}?session=${encodeURIComponent(chatSessionId)}`;
+      const pushRes = await fetch(toolResultUrl, {
+        method: "POST",
+        headers: { "Content-Type": "application/json", ...authHeaders },
+        // `toolName` and `uuid` come last so they override any
+        // same-named keys already present in the envelope.
+        body: JSON.stringify({ ...envelope, toolName: call.toolName, uuid: makeUuid() }),
+      });
+      if (!pushRes.ok) {
+        // Fail loudly per codex review — a swallowed publish would
+        // leave the canvas blank while the chat reads "Done", which
+        // masks a real wiring break. Surface the failure as the
+        // tool result so the test fails loud instead of timing out
+        // on an absent View.
+        const errBody = await pushRes.text();
+        return JSON.stringify({
+          error: `tool-result push failed for ${call.toolName}: ${pushRes.status} ${errBody.slice(0, 200)}`,
+        });
+      }
+    }
+    const text: string[] = [];
+    if (typeof envelope.message === "string") text.push(envelope.message);
+    if (typeof envelope.instructions === "string") text.push(envelope.instructions);
+    return text.length > 0 ? text.join("\n") : "Done";
+  } catch (err) {
+    // Don't tear down the chat turn on plugin-dispatch failure —
+    // surface the error in the tool_result so the test sees it.
+    return JSON.stringify({ error: err instanceof Error ? err.message : String(err) });
+  }
+}
+// Look up a project-scope skill seeded by `placeProjectSkill` and
+// extract the canary line the seeded body asks the model to echo
+// back ("respond with this exact line and nothing else: X").
+// Returns null when the file is missing or the marker shape is
+// absent — caller falls through to default echo.
+/** Read `<workspace>/<claudeSkills>/<slug>/SKILL.md` and return the
+ *  trimmed text that follows the first "respond with this exact
+ *  line[ and nothing else]:" marker. Resolves to `null` when the
+ *  file cannot be read or no line carries the marker. */
+async function replyFromSeededSkill(workspacePath: string, slug: string): Promise<string | null> {
+  const skillFile = path.join(workspacePath, WORKSPACE_DIRS.claudeSkills, slug, "SKILL.md");
+  // Any read failure (missing file, permissions, …) means "no seeded skill".
+  const body = await readFile(skillFile, "utf8").catch(() => null);
+  if (body === null) return null;
+  // Matched one line at a time to avoid backtracking surprises.
+  const markerPattern = /respond with this exact line(?: and nothing else)?:\s*(.+)/i;
+  for (const line of body.split(/\r?\n/)) {
+    const canary = markerPattern.exec(line)?.[1];
+    if (canary !== undefined) return canary.trim();
+  }
+  return null;
+}
+// ── Backend wiring ────────────────────────────────────────────────
+// Generator consulted once per agent run. Module-level state:
+// swapped by `setFakeResponse()`, restored by `resetFakeResponse()`.
+let responseFn: FakeResponseFn = defaultResponse;
+/** Replace the default echo + slash-command generator. Useful for
+ *  unit tests that want full control over what the fake backend
+ *  emits. Pair with `resetFakeResponse()` in teardown so the next
+ *  test sees a clean state. */
+export function setFakeResponse(generator: FakeResponseFn): void {
+  responseFn = generator;
+}
+/** Restore the default generator AND clear per-session history. */
+export function resetFakeResponse(): void {
+  responseFn = defaultResponse;
+  sessionTurns.clear();
+}
+// Abort is checked between every yield. Real claude-code kills the
+// subprocess on abort; the echo stub has no subprocess, so the
+// faithful equivalent is "stop emitting immediately".
+/** True only when the input carries an abort signal that has fired. */
+function aborted(input: AgentInput): boolean {
+  const signal = input.abortSignal;
+  return signal != null && signal.aborted === true;
+}
+/** Async generator behind `fakeEchoBackend.runAgent`.
+ *
+ *  Emits, in order: one `claudeSessionId` event with a fresh UUID,
+ *  then either a single `error` event (when the response carries
+ *  `error`) or, per tool call, a `toolCall` event followed by its
+ *  `toolCallResult`, and finally a `text` event when the response
+ *  has text. The abort signal is re-checked before every yield
+ *  after the first; once it has fired the generator returns
+ *  without emitting anything further. */
+async function* runFakeEchoAgent(input: AgentInput): AsyncGenerator<AgentEvent> {
+  if (aborted(input)) return;
+  yield { type: EVENT_TYPES.claudeSessionId, id: randomUUID() };
+  const response = await responseFn(input);
+  // Error short-circuit: surface the error and stop, exactly like
+  // the claude-code backend on a non-zero CLI exit.
+  if (response.error !== undefined) {
+    if (aborted(input)) return;
+    yield { type: EVENT_TYPES.error, message: response.error };
+    return;
+  }
+  for (const call of response.toolCalls ?? []) {
+    if (aborted(input)) return;
+    // One id per call, shared by the toolCall / toolCallResult pair.
+    const toolUseId = `fake-${randomUUID()}`;
+    yield {
+      type: EVENT_TYPES.toolCall,
+      toolUseId,
+      toolName: call.toolName,
+      args: call.args,
+    };
+    // Partial-stream simulation: skip the result half.
+    if (response.omitToolResult) continue;
+    // Run the actual plugin handler AND push the envelope to
+    // /api/internal/tool-result so the canvas mounts the View — same
+    // two-step the MCP bridge does for real Claude.
+    const content = await dispatchToPlugin(call, input.port, input.sessionId);
+    if (aborted(input)) return;
+    yield {
+      type: EVENT_TYPES.toolCallResult,
+      toolUseId,
+      content,
+    };
+  }
+  if (response.text !== undefined && !aborted(input)) {
+    yield { type: EVENT_TYPES.text, message: response.text };
+  }
+}
+/** `LLMBackend` whose `runAgent` is the fake echo generator defined
+ *  in this file. */
+export const fakeEchoBackend: LLMBackend = {
+  id: "fake-echo",
+  // Resume-by-token / MCP aren't meaningfully replayable from a
+  // stub. Flag them unsupported so callers that depend on the real
+  // Claude semantics opt out instead of getting silently wrong
+  // behavior.
+  capabilities: { sessionResume: false, mcp: false },
+  runAgent: runFakeEchoAgent,
+};

package/server/agent/backend/index.ts CHANGED Viewed

@@ -3,12 +3,27 @@
 // env / settings. Callers go through getActiveBackend() rather than
 // importing a concrete adapter so adding a backend doesn't require
 // touching every call site.
+//
+// Tests / CI swap in `fakeEchoBackend` via setActiveBackend() at
+// server bootstrap; the decision is made once and read with zero
+// per-call overhead by the agent orchestrator.
 import { claudeCodeBackend } from "./claude-code.js";
 import type { LLMBackend } from "./types.js";
 export type { AgentInput, BackendCapabilities, LLMBackend } from "./types.js";
+// Module-level selection returned by `getActiveBackend()`; starts
+// as the claude-code backend until `setActiveBackend()` replaces it.
+let activeBackend: LLMBackend = claudeCodeBackend;
+/** Replace the active backend. Intended for server-bootstrap wiring
+ *  (e.g. CI sets `MULMOCLAUDE_FAKE_AGENT=1`, the boot script then
+ *  passes `fakeEchoBackend` here). Not safe to call mid-flight — the
+ *  in-flight agent generators have already captured the previous
+ *  backend reference, and swapping under them would race. */
+export function setActiveBackend(backend: LLMBackend): void {
+  activeBackend = backend;
+}
 export function getActiveBackend(): LLMBackend {
-  return claudeCodeBackend;
+  return activeBackend;
 }

package/server/agent/config.ts CHANGED Viewed

@@ -1,19 +1,28 @@
-import { dirname, join } from "path";
+import { basename, dirname, join } from "path";
 import { homedir, tmpdir } from "os";
 import { createRequire } from "node:module";
 import type { Role } from "../../src/config/roles.js";
 import { mcpTools, isMcpToolEnabled } from "./mcp-tools/index.js";
 import { getActiveToolDescriptors } from "./activeTools.js";
 import type { EffortLevel, McpServerSpec } from "../system/config.js";
+import { startStdioHttpShim, type ShimHandle } from "./stdioHttpShim.js";
 import { getCurrentToken } from "../api/auth/token.js";
 import type { Attachment } from "@mulmobridge/protocol";
 import { isImageMime, isNativeAttachmentMime } from "@mulmobridge/client";
 import { convertAttachment } from "./attachmentConverter.js";
 import { log } from "../system/logger/index.js";
+import { preflightUserServers, logPreflightResult } from "./mcpPreflight.js";
 export const CONTAINER_WORKSPACE_PATH = "/home/node/mulmoclaude";
-const BASE_ALLOWED_TOOLS = ["Bash", "Read", "Write", "Edit", "Glob", "Grep", "WebFetch", "WebSearch"];
+// `Skill` is the tool Claude Code uses to execute a discovered
+// `.claude/skills/<name>/SKILL.md`. Because `--allowedTools` is passed
+// as a strict allowlist, omitting it permission-denies every
+// `Skill({skill:"…"})` call — the harness errors with
+// `Execute skill: <name>` and the model falls back to Glob+Read.
+// Bare `Skill` (no parens) permits all skills. See
+// plans/fix-skill-tool-allowlist.md.
+const BASE_ALLOWED_TOOLS = ["Bash", "Read", "Write", "Edit", "Glob", "Grep", "WebFetch", "WebSearch", "Skill"];
 /** Tool names the agent is allowed to call this session. Drives
  *  `PLUGIN_NAMES` env (the MCP child's filter) and the CLI's
@@ -72,33 +81,65 @@ function prepareUserStdioServer(spec: Extract<McpServerSpec, { type: "stdio" }>,
   return { ...spec, args };
 }
-export function prepareUserServers(userServers: Record<string, McpServerSpec>, useDocker: boolean, hostWorkspacePath: string): Record<string, McpServerSpec> {
+export interface PreparedUserServers {
+  servers: Record<string, McpServerSpec>;
+  /** Host-side stdio→HTTP gateways started for opted-in servers
+   *  (#1421 Phase B). The caller MUST `close()` each one when the
+   *  agent turn ends, or host processes / ports leak. */
+  shims: ShimHandle[];
+}
+// Async because the opt-in stdio→HTTP path spawns a host gateway and
+// waits for it to listen before the spec can be rewritten to http.
+export async function prepareUserServers(
+  userServers: Record<string, McpServerSpec>,
+  useDocker: boolean,
+  hostWorkspacePath: string,
+): Promise<PreparedUserServers> {
+  // Drop catalog-known entries that are missing required config (#1352).
+  // The dedup cache inside `logPreflightResult` keeps per-agent-run
+  // calls quiet so a Settings UI fix only logs once when it transitions
+  // missing → ok.
+  const preflight = preflightUserServers(userServers);
+  logPreflightResult(preflight, "agent-run");
   const out: Record<string, McpServerSpec> = {};
-  for (const [serverId, spec] of Object.entries(userServers)) {
+  const shims: ShimHandle[] = [];
+  for (const [serverId, spec] of Object.entries(preflight.ready)) {
     if (spec.enabled === false) continue;
     if (spec.type === "http") {
       out[serverId] = prepareUserHttpServer(spec, useDocker);
-    } else {
-      // Stay symmetric with `userServerAllowedToolNames`: stdio
-      // servers can't run inside the sandbox image (see
-      // docs/mcp-sandbox.md for the full rationale — #162 / #1334).
-      // Claude CLI 2.1.x silently exits 1 when a stdio MCP fails to
-      // start, so passing the spec through here would mask the
-      // failure as a generic boot error. Drop + log per skipped
-      // entry so an operator scanning the log knows why their MCP
-      // didn't load.
-      if (useDocker) {
-        log.info("mcp", "skipping stdio server in Docker sandbox", {
-          serverId,
-          transport: "stdio",
-          reason: "sandbox image is too minimal to host arbitrary stdio MCP runtimes",
-        });
+      continue;
+    }
+    if (!useDocker) {
+      out[serverId] = prepareUserStdioServer(spec, useDocker, hostWorkspacePath);
+      continue;
+    }
+    // Docker mode + stdio. Default: drop (the sandbox image can't
+    // host arbitrary stdio runtimes — docs/mcp-sandbox.md, #162 /
+    // #1334). Exception: an explicit, UI-acknowledged opt-in
+    // (#1421 Phase B) runs the server on the HOST behind a
+    // stdio↔HTTP gateway and rewrites the spec to http so the
+    // sandboxed agent can still reach it.
+    if (spec.hostExecInDocker === true) {
+      const shim = await startStdioHttpShim(serverId, spec, hostWorkspacePath);
+      if (shim) {
+        shims.push(shim);
+        out[serverId] = { type: "http", url: rewriteLocalhostForDocker(shim.url, useDocker) };
         continue;
       }
-      out[serverId] = prepareUserStdioServer(spec, useDocker, hostWorkspacePath);
+      // Shim failed to come up — fall through to the safe default
+      // (drop + log) rather than wiring a half-broken server.
     }
+    log.info("mcp", "skipping stdio server in Docker sandbox", {
+      serverId,
+      transport: "stdio",
+      reason:
+        spec.hostExecInDocker === true
+          ? "host-exec shim unavailable — see mcp-shim warnings"
+          : "sandbox image is too minimal to host arbitrary stdio MCP runtimes",
+    });
   }
-  return out;
+  return { servers: out, shims };
 }
 // When running in Docker the MCP server subprocess won't inherit the host
@@ -374,13 +415,22 @@ export interface McpConfigPaths {
   argPath: string;
 }
+// Turn an arbitrary `sessionId` into a single filename-safe segment
+// before it is interpolated into a filesystem path (CodeQL
+// js/path-injection). Two steps:
+//   1. `basename` drops any directory components — the recognised
+//      path-traversal barrier, so a crafted `../../x` collapses to `x`.
+//   2. every character outside `[A-Za-z0-9_-]` becomes `_`.
+function safeSessionSegment(sessionId: string): string {
+  const leaf = basename(sessionId);
+  return leaf.replace(/[^A-Za-z0-9_-]/g, "_");
+}
 export function resolveMcpConfigPaths(opts: { workspacePath: string; sessionId: string; useDocker: boolean }): McpConfigPaths {
+  const sid = safeSessionSegment(opts.sessionId);
   if (opts.useDocker) {
-    const hostPath = join(opts.workspacePath, ".mulmoclaude", `mcp-${opts.sessionId}.json`);
-    const argPath = `${CONTAINER_WORKSPACE_PATH}/.mulmoclaude/mcp-${opts.sessionId}.json`;
+    const hostPath = join(opts.workspacePath, ".mulmoclaude", `mcp-${sid}.json`);
+    const argPath = `${CONTAINER_WORKSPACE_PATH}/.mulmoclaude/mcp-${sid}.json`;
     return { hostPath, argPath };
   }
-  const hostPath = join(tmpdir(), `mulmoclaude-mcp-${opts.sessionId}.json`);
+  const hostPath = join(tmpdir(), `mulmoclaude-mcp-${sid}.json`);
   return { hostPath, argPath: hostPath };
 }