npm - @united-workforce/cli - Versions diffs - 0.6.1 → 0.7.0 - Mend

@united-workforce/cli 0.6.1 → 0.7.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (78)

package/README.md +89 -1
package/dist/__tests__/agent-resolution-llm-free.test.js +9 -2
package/dist/__tests__/agent-resolution-llm-free.test.js.map +1 -1
package/dist/__tests__/broker-prompt.test.d.ts +10 -0
package/dist/__tests__/broker-prompt.test.d.ts.map +1 -0
package/dist/__tests__/broker-prompt.test.js +129 -0
package/dist/__tests__/broker-prompt.test.js.map +1 -0
package/dist/__tests__/config.test.js +33 -37
package/dist/__tests__/config.test.js.map +1 -1
package/dist/__tests__/e2e-broker-step.test.d.ts +13 -0
package/dist/__tests__/e2e-broker-step.test.d.ts.map +1 -0
package/dist/__tests__/e2e-broker-step.test.js +278 -0
package/dist/__tests__/e2e-broker-step.test.js.map +1 -0
package/dist/__tests__/e2e-mock-agent.test.js +1 -1
package/dist/__tests__/e2e-mock-agent.test.js.map +1 -1
package/dist/__tests__/setup-agent-discovery.test.js +17 -5
package/dist/__tests__/setup-agent-discovery.test.js.map +1 -1
package/dist/__tests__/setup-no-llm.test.js +5 -2
package/dist/__tests__/setup-no-llm.test.js.map +1 -1
package/dist/__tests__/step-ask.test.js +9 -6
package/dist/__tests__/step-ask.test.js.map +1 -1
package/dist/__tests__/thread-agent-failure-suspended.test.js +3 -3
package/dist/__tests__/thread-agent-failure-suspended.test.js.map +1 -1
package/dist/__tests__/thread-poke.test.js +6 -6
package/dist/__tests__/thread-poke.test.js.map +1 -1
package/dist/__tests__/thread-resume.test.js +2 -2
package/dist/__tests__/thread-resume.test.js.map +1 -1
package/dist/__tests__/thread-suspend-step.test.js +1 -1
package/dist/__tests__/thread-suspend-step.test.js.map +1 -1
package/dist/commands/broker-step.d.ts +110 -0
package/dist/commands/broker-step.d.ts.map +1 -0
package/dist/commands/broker-step.js +450 -0
package/dist/commands/broker-step.js.map +1 -0
package/dist/commands/config.d.ts.map +1 -1
package/dist/commands/config.js +2 -23
package/dist/commands/config.js.map +1 -1
package/dist/commands/prompt.js +3 -3
package/dist/commands/setup.d.ts.map +1 -1
package/dist/commands/setup.js +8 -1
package/dist/commands/setup.js.map +1 -1
package/dist/commands/step.d.ts +6 -5
package/dist/commands/step.d.ts.map +1 -1
package/dist/commands/step.js +11 -154
package/dist/commands/step.js.map +1 -1
package/dist/commands/thread.d.ts +4 -0
package/dist/commands/thread.d.ts.map +1 -1
package/dist/commands/thread.js +77 -151
package/dist/commands/thread.js.map +1 -1
package/package.json +5 -4
package/src/__tests__/agent-resolution-llm-free.test.ts +14 -2
package/src/__tests__/broker-prompt.test.ts +142 -0
package/src/__tests__/config.test.ts +35 -39
package/src/__tests__/e2e-broker-step.test.ts +320 -0
package/src/__tests__/e2e-mock-agent.test.ts +1 -1
package/src/__tests__/setup-agent-discovery.test.ts +17 -5
package/src/__tests__/setup-no-llm.test.ts +5 -2
package/src/__tests__/step-ask.test.ts +9 -6
package/src/__tests__/thread-agent-failure-suspended.test.ts +3 -3
package/src/__tests__/thread-poke.test.ts +6 -6
package/src/__tests__/thread-resume.test.ts +2 -2
package/src/__tests__/thread-suspend-step.test.ts +1 -1
package/src/commands/broker-step.ts +636 -0
package/src/commands/config.ts +2 -24
package/src/commands/prompt.ts +3 -3
package/src/commands/setup.ts +9 -1
package/src/commands/step.ts +21 -204
package/src/commands/thread.ts +87 -192
package/dist/.build-fingerprint +0 -1
package/dist/__tests__/adapter-json-roundtrip.test.d.ts +0 -2
package/dist/__tests__/adapter-json-roundtrip.test.d.ts.map +0 -1
package/dist/__tests__/adapter-json-roundtrip.test.js +0 -160
package/dist/__tests__/adapter-json-roundtrip.test.js.map +0 -1
package/dist/__tests__/spawn-agent-json.test.d.ts +0 -2
package/dist/__tests__/spawn-agent-json.test.d.ts.map +0 -1
package/dist/__tests__/spawn-agent-json.test.js +0 -79
package/dist/__tests__/spawn-agent-json.test.js.map +0 -1
package/src/__tests__/adapter-json-roundtrip.test.ts +0 -193
package/src/__tests__/spawn-agent-json.test.ts +0 -100

package/src/commands/setup.ts CHANGED Viewed

@@ -205,6 +205,14 @@ export async function _promptAgentSelection(
 // ──────────────────────────────────────────────────────────────────────────────
+/**
+ * Default Sumeru host used when seeding a fresh agents.<alias> entry.
+ * Phase 3 (#380) breaking change — agents are routed through the broker via
+ * `host` + `gateway`, replacing the legacy `command` + `args` CLI binary
+ * path.
+ */
+const DEFAULT_SUMERU_HOST = "http://127.0.0.1:7900";
 /**
  * Merge setup args into config.yaml structure. Non-destructive — preserves
  * existing entries (including agentOverrides). Engine config is LLM-free, so
@@ -219,7 +227,7 @@ function mergeConfig(existing: Record<string, unknown>, args: SetupArgs): Record
   const agentName = _agentNameFromBinary(args.agent);
   if (!agents[agentName]) {
-    agents[agentName] = { command: `uwf-${agentName}`, args: [] };
+    agents[agentName] = { host: DEFAULT_SUMERU_HOST, gateway: agentName };
   }
   const merged: Record<string, unknown> = {

package/src/commands/step.ts CHANGED Viewed

@@ -1,8 +1,5 @@
-import { execFileSync } from "node:child_process";
 import type { CasStore } from "@ocas/core";
 import type {
-  AgentAlias,
-  AgentConfig,
   CasRef,
   StartEntry,
   StepEntry,
@@ -10,11 +7,8 @@ import type {
   ThreadForkOutput,
   ThreadId,
   ThreadStepsOutput,
-  WorkflowConfig,
-  WorkflowPayload,
 } from "@united-workforce/protocol";
 import { createLogger, generateUlid } from "@united-workforce/util";
-import { getAskSessionId, loadWorkflowConfig, setAskSessionId } from "@united-workforce/util-agent";
 import { createUwfStore, setThread, type UwfStore } from "../store.js";
 import {
   collectOrderedSteps,
@@ -456,148 +450,13 @@ export async function cmdStepRead(
 }
 // ── step ask ────────────────────────────────────────────────────────────────
-function parseAgentOverride(override: string): AgentConfig {
-  const parts = override
-    .trim()
-    .split(/\s+/)
-    .filter((p) => p.length > 0);
-  const command = parts[0];
-  if (command === undefined) {
-    fail("agent override must not be empty");
-  }
-  return { command, args: parts.slice(1) };
-}
-function resolveAskAgentConfig(
-  config: WorkflowConfig,
-  workflow: WorkflowPayload | null,
-  role: string,
-  agentOverride: string | null,
-  recordedAgent: string,
-): AgentConfig {
-  if (agentOverride !== null) {
-    const fromAlias = config.agents[agentOverride as AgentAlias];
-    if (fromAlias !== undefined) {
-      return fromAlias;
-    }
-    return parseAgentOverride(agentOverride);
-  }
-  // Try to resolve via the recorded agent name as a config alias.
-  const fromRecorded = config.agents[recordedAgent as AgentAlias];
-  if (fromRecorded !== undefined) {
-    return fromRecorded;
-  }
-  // Fall back to default agent for the workflow / role.
-  if (workflow !== null && config.agentOverrides !== null) {
-    const roleOverrides = config.agentOverrides[workflow.name];
-    if (roleOverrides !== undefined && roleOverrides[role] !== undefined) {
-      const alias = roleOverrides[role];
-      const agentConfig = config.agents[alias];
-      if (agentConfig !== undefined) {
-        return agentConfig;
-      }
-    }
-  }
-  // Treat the recorded value as a raw command path.
-  return parseAgentOverride(recordedAgent);
-}
-/**
- * Derive the agent name used for cache file partitioning from an executable
- * path or alias.  Examples:
- *   uwf-hermes        → hermes
- *   uwf-claude-code   → claude-code
- *   /tmp/mock-agent.sh → mock
- *   /usr/bin/agent    → agent
- */
-function deriveAgentName(commandPath: string): string {
-  const basename = commandPath.split(/[/\\]/).pop() ?? commandPath;
-  // Strip a trailing extension (.sh, .js, .mjs, .cjs)
-  const noExt = basename.replace(/\.(sh|js|mjs|cjs|ts)$/i, "");
-  // Strip the `uwf-` prefix introduced by agentLabel().
-  const noPrefix = noExt.startsWith("uwf-") ? noExt.slice(4) : noExt;
-  // Strip the trailing `-agent` suffix used by tests / generic agent shells.
-  const noSuffix = noPrefix.endsWith("-agent") ? noPrefix.slice(0, -"-agent".length) : noPrefix;
-  return noSuffix === "" ? noExt : noSuffix;
-}
-function loadDetailNode(
-  store: CasStore,
-  detailRef: CasRef,
-): { sessionId: string | null; payload: Record<string, unknown> } {
-  const detailNode = store.get(detailRef);
-  if (detailNode === null) {
-    fail(`detail node not found: ${detailRef}`);
-  }
-  const payload = detailNode.payload as Record<string, unknown>;
-  const sessionId = typeof payload.sessionId === "string" ? payload.sessionId : null;
-  return { sessionId, payload };
-}
-function spawnAskAgent(agent: AgentConfig, argv: string[], cwd: string): { stdout: string } {
-  try {
-    const stdout = execFileSync(agent.command, [...agent.args, ...argv], {
-      encoding: "utf8",
-      stdio: ["ignore", "pipe", "pipe"],
-      maxBuffer: 50 * 1024 * 1024,
-      cwd,
-    });
-    return { stdout };
-  } catch (e) {
-    const err = e as NodeJS.ErrnoException & { stderr: Buffer | string | null };
-    if (err.code === "ENOENT") {
-      fail(
-        `"${agent.command}" not found in PATH. Install it or check your PATH config. Run: which ${agent.command}`,
-      );
-    }
-    const stderr =
-      err.stderr == null
-        ? ""
-        : typeof err.stderr === "string"
-          ? err.stderr
-          : err.stderr.toString("utf8");
-    const detail = stderr.trim() !== "" ? `: ${stderr.trim()}` : "";
-    fail(`agent command failed (${agent.command})${detail}`);
-  }
-}
-function resolveAskWorkflow(uwf: UwfStore, payload: StepNodePayload): WorkflowPayload | null {
-  const startNode = uwf.store.cas.get(payload.start);
-  if (startNode === null) {
-    return null;
-  }
-  const start = startNode.payload as { workflow: CasRef };
-  const workflowNode = uwf.store.cas.get(start.workflow);
-  if (workflowNode === null) {
-    return null;
-  }
-  return workflowNode.payload as WorkflowPayload;
-}
-async function performFork(
-  agent: AgentConfig,
-  agentName: string,
-  stepHash: CasRef,
-  sourceSessionId: string,
-  storageRoot: string,
-  cwd: string,
-): Promise<string> {
-  const cached = await getAskSessionId(agentName, stepHash, storageRoot);
-  if (cached !== null) {
-    return cached;
-  }
-  const { stdout } = spawnAskAgent(agent, ["--mode", "fork", "--session", sourceSessionId], cwd);
-  const newSessionId = stdout.trim().split("\n").pop()?.trim() ?? "";
-  if (newSessionId === "") {
-    fail(`agent fork did not return a session id (${agent.command})`);
-  }
-  await setAskSessionId(agentName, stepHash, newSessionId, storageRoot);
-  return newSessionId;
-}
+//
+// Phase 3 (#380) — Option B: `step ask` is disabled while broker integration
+// lands. The pre-broker spawn-agent path depended on the legacy
+// `agents.<alias>: {command, args}` config shape; that shape was replaced by
+// `{host, gateway}` and the equivalent broker `ask`/`fork` primitives are
+// scheduled for Phase 4 (#381). The command exits non-zero with a clear
+// migration pointer so existing scripts fail fast rather than silently.
 export type CmdStepAskOptions = {
   prompt: string;
@@ -607,64 +466,22 @@ export type CmdStepAskOptions = {
 };
 /**
- * Ask a follow-up question to a historical step's agent (read-only).
- *
- * Does NOT write a new StepNode and does NOT mutate thread state.  The agent's
- * raw stdout is returned so the CLI entry point can stream it directly.
+ * `uwf step ask` is unavailable in 0.x while broker integration (#381) is in
+ * progress. The legacy spawn-agent code path was removed alongside the
+ * `agents.<alias>: {command, args}` config shape. Use `uwf thread exec` /
+ * `uwf thread resume` instead — those routes go through `broker.send()` and
+ * preserve the Sumeru session.
  */
 export async function cmdStepAsk(
-  storageRoot: string,
-  stepHash: CasRef,
-  options: CmdStepAskOptions,
+  _storageRoot: string,
+  _stepHash: CasRef,
+  _options: CmdStepAskOptions,
 ): Promise<string> {
-  const uwf = await createUwfStore(storageRoot);
-  const node = uwf.store.cas.get(stepHash);
-  if (node === null) {
-    fail(`CAS node not found: ${stepHash}`);
-  }
-  if (node.type !== uwf.schemas.stepNode) {
-    fail(`node ${stepHash} is not a StepNode`);
-  }
-  const payload = node.payload as StepNodePayload;
-  if (payload.detail === null) {
-    fail(`step ${stepHash} has no detail; cannot ask`);
-  }
-  const detailRef = payload.detail;
-  const { sessionId: sourceSessionId } = loadDetailNode(uwf.store.cas, detailRef);
-  const workflow = resolveAskWorkflow(uwf, payload);
-  const config = await loadWorkflowConfig(storageRoot);
-  const agent = resolveAskAgentConfig(
-    config,
-    workflow,
-    payload.role,
-    options.agentOverride,
-    payload.agent,
+  fail(
+    "step ask is unavailable in 0.x while broker integration (#381) is in progress. " +
+      "The pre-broker spawn-agent path was removed in #380; equivalent ask/fork primitives " +
+      "will return in Phase 4 once the Sumeru broker exposes session-fork APIs. " +
+      "Use `uwf thread resume <id> -p '...'` to continue a suspended thread, or " +
+      "`uwf thread exec <id>` to advance an idle thread.",
   );
-  const agentName = deriveAgentName(agent.command);
-  const cwd = payload.cwd !== "" ? payload.cwd : process.cwd();
-  // Fork path: fork (or reuse cached fork) → ask with that session.
-  if (options.fork && sourceSessionId !== null) {
-    const askSessionId = await performFork(
-      agent,
-      agentName,
-      stepHash,
-      sourceSessionId,
-      storageRoot,
-      cwd,
-    );
-    const argv = ["--mode", "ask", "--session", askSessionId, "--prompt", options.prompt];
-    argv.push("--detail", detailRef);
-    const { stdout } = spawnAskAgent(agent, argv, cwd);
-    return stdout;
-  }
-  // Fallback path: ask without forking; inject detail ref for context.
-  const argv = ["--mode", "ask", "--prompt", options.prompt];
-  argv.push("--detail", detailRef);
-  const { stdout } = spawnAskAgent(agent, argv, cwd);
-  return stdout;
 }

package/src/commands/thread.ts CHANGED Viewed

@@ -1,11 +1,9 @@
-import { execFileSync, spawn } from "node:child_process";
+import { spawn } from "node:child_process";
 import { access, readFile } from "node:fs/promises";
 import { dirname, isAbsolute, join, resolve as resolvePath } from "node:path";
 import type { VarStore } from "@ocas/core";
 import { validate } from "@ocas/core";
 import type {
-  AgentAlias,
-  AgentConfig,
   CasRef,
   StartNodePayload,
   StartOutput,
@@ -31,7 +29,6 @@ import {
   generateUlid,
   type ProcessLogger,
 } from "@united-workforce/util";
-import type { AdapterOutput } from "@united-workforce/util-agent";
 import { getEnvPath, loadWorkflowConfig } from "@united-workforce/util-agent";
 import { config as loadDotenv } from "dotenv";
 import { parse } from "yaml";
@@ -61,6 +58,7 @@ import {
 } from "../store.js";
 import { checkWorkflowFilenameConsistency, isCasRef, parseWorkflowPayload } from "../validate.js";
 import { validateWorkflow } from "../validate-semantic.js";
+import { type BrokerStepResult, executeBrokerStep } from "./broker-step.js";
 import {
   getConfigPath,
   getNestedValue,
@@ -213,7 +211,6 @@ function resolveCurrentRole(uwf: UwfStore, head: CasRef, workflowRef: CasRef): s
 const PL_THREAD_START = "7HNQ4B2X";
 const PL_MODERATOR = "M3K8V9T1";
-const PL_AGENT_SPAWN = "R5J2W8N4";
 const PL_AGENT_DONE = "C6P9E3H7";
 const PL_AGENT_ERROR = "Z3F7K8M2";
 const PL_THREAD_ARCHIVED = "F4D8Q2K5";
@@ -1120,140 +1117,6 @@ function loadWorkflowPayload(uwf: UwfStore, workflowRef: CasRef): WorkflowPayloa
   return node.payload as WorkflowPayload;
 }
-function parseAgentOverride(override: string): AgentConfig {
-  const parts = override
-    .trim()
-    .split(/\s+/)
-    .filter((p) => p.length > 0);
-  const command = parts[0];
-  if (command === undefined) {
-    fail("agent override must not be empty");
-  }
-  return { command, args: parts.slice(1) };
-}
-function resolveAgentConfig(
-  config: WorkflowConfig,
-  workflow: WorkflowPayload,
-  role: string,
-  agentOverride: string | null,
-): AgentConfig {
-  if (agentOverride !== null) {
-    // Try config alias first (e.g. "hermes" → config.agents.hermes),
-    // then fall back to raw command name (e.g. "uwf-hermes" or "/usr/bin/agent").
-    const fromAlias = config.agents[agentOverride as AgentAlias];
-    if (fromAlias !== undefined) {
-      return fromAlias;
-    }
-    return parseAgentOverride(agentOverride);
-  }
-  let alias: AgentAlias = config.defaultAgent;
-  if (config.agentOverrides !== null) {
-    const roleOverrides = config.agentOverrides[workflow.name];
-    if (roleOverrides !== undefined && roleOverrides[role] !== undefined) {
-      alias = roleOverrides[role];
-    }
-  }
-  const agentConfig = config.agents[alias];
-  if (agentConfig === undefined) {
-    fail(`unknown agent alias in config: ${alias}`);
-  }
-  return agentConfig;
-}
-function executeAgentCommand(
-  agent: AgentConfig,
-  argv: readonly string[],
-  cwd: string,
-  plog: ProcessLogger,
-): string {
-  try {
-    return execFileSync(agent.command, argv, {
-      encoding: "utf8",
-      stdio: ["ignore", "pipe", "pipe"],
-      maxBuffer: 50 * 1024 * 1024, // 50 MB — stream-json output can be large
-      cwd,
-    });
-  } catch (e) {
-    const err = e as NodeJS.ErrnoException & { stderr?: Buffer | string | null };
-    if (err.code === "ENOENT") {
-      failStep(
-        plog,
-        `"${agent.command}" not found in PATH. Install it or check your PATH config. Run: which ${agent.command}`,
-      );
-    }
-    const stderr =
-      err.stderr == null
-        ? ""
-        : typeof err.stderr === "string"
-          ? err.stderr
-          : err.stderr.toString("utf8");
-    const detail = stderr.trim() !== "" ? `: ${stderr.trim()}` : "";
-    failStep(plog, `agent command failed (${agent.command})${detail}`);
-  }
-}
-function parseAgentOutput(stdout: string, plog: ProcessLogger): unknown {
-  const line = stdout.trim().split("\n").pop()?.trim() ?? "";
-  try {
-    return JSON.parse(line);
-  } catch {
-    failStep(plog, `agent stdout last line is not valid JSON: ${line || "(empty)"}`);
-  }
-}
-function validateAndNormalizeOutput(
-  parsed: unknown,
-  line: string,
-  plog: ProcessLogger,
-): AdapterOutput {
-  const obj = parsed as Record<string, unknown>;
-  if (
-    typeof obj !== "object" ||
-    obj === null ||
-    typeof obj.stepHash !== "string" ||
-    !isCasRef(obj.stepHash as string)
-  ) {
-    failStep(plog, `agent stdout JSON missing valid stepHash: ${line}`);
-  }
-  // Normalize isError / errorMessage so downstream code can rely on them.
-  // Legacy adapters that don't emit these fields default to isError=false.
-  if (obj.isError !== undefined && typeof obj.isError !== "boolean") {
-    failStep(plog, `agent stdout JSON has non-boolean isError: ${line}`);
-  }
-  if (obj.isError === undefined) {
-    obj.isError = false;
-  }
-  if (
-    obj.errorMessage !== undefined &&
-    obj.errorMessage !== null &&
-    typeof obj.errorMessage !== "string"
-  ) {
-    failStep(plog, `agent stdout JSON has non-string errorMessage: ${line}`);
-  }
-  if (obj.errorMessage === undefined) {
-    obj.errorMessage = null;
-  }
-  return obj as unknown as AdapterOutput;
-}
-function spawnAgent(
-  plog: ProcessLogger,
-  agent: AgentConfig,
-  threadId: ThreadId,
-  role: string,
-  edgePrompt: string,
-  cwd: string,
-): AdapterOutput {
-  const argv = [...agent.args, "--thread", threadId, "--role", role, "--prompt", edgePrompt];
-  const stdout = executeAgentCommand(agent, argv, cwd, plog);
-  const line = stdout.trim().split("\n").pop()?.trim() ?? "";
-  const parsed = parseAgentOutput(stdout, plog);
-  return validateAndNormalizeOutput(parsed, line, plog);
-}
 function archiveThread(uwf: UwfStore, threadId: ThreadId, _workflow: CasRef, _head: CasRef): void {
   completeThread(uwf.varStore, threadId, "end");
 }
@@ -1412,6 +1275,10 @@ function resolveCurrentRoleFromChain(
  * replacing the head step's output. The new step's `prev` points to the OLD head's
  * `prev` — semantically replacing (not appending to) the head. The moderator is NOT
  * re-evaluated for routing; the role of the head step is re-used.
+ *
+ * Phase 3 (#380) — drives the broker via `executeBrokerStep` rather than the
+ * legacy `spawnAgent` path. The replace-semantics StepNode is built directly by
+ * passing `prevHash = oldHeadPayload.prev`, so no post-hoc rewrite is needed.
  */
 export async function cmdThreadPoke(
   storageRoot: string,
@@ -1431,59 +1298,71 @@ export async function cmdThreadPoke(
     context: { thread: threadId, workflow: workflowHash },
   });
-  // Resolve the agent: --agent override wins; otherwise read from old head step's `agent` field.
   const config = await loadWorkflowConfig(storageRoot);
   const workflow = loadWorkflowPayload(uwf, workflowHash);
   const role = oldHeadPayload.role;
-  const agent =
-    agentOverride !== null
-      ? resolveAgentConfig(config, workflow, role, agentOverride)
-      : parseAgentOverride(oldHeadPayload.agent);
   const effectiveCwd = oldHeadPayload.cwd !== "" ? oldHeadPayload.cwd : threadCwd;
-  plog.log(PL_THREAD_POKE, `poke role=${role} agent=${agent.command}`, null);
-  plog.log(PL_AGENT_SPAWN, `spawning agent command=${agent.command}`, {
-    args: [...agent.args, threadId, role].join(" "),
-  });
+  plog.log(PL_THREAD_POKE, `poke role=${role}`, null);
   loadDotenv({ path: getEnvPath(storageRoot) });
-  // Spawn the agent. The agent will create a new StepNode with prev=oldHead (it reads
-  // the active thread head). After the agent returns, we rewrite that node's prev so
-  // that the new head replaces the old head instead of appending after it.
-  let agentResult: AdapterOutput;
+  // Replace semantics: the new step's `prev` is the OLD head's prev, not the
+  // OLD head itself. `executeBrokerStep` writes the StepNode with this prev,
+  // so no post-hoc rewrite is needed.
+  let result: BrokerStepResult;
   try {
-    agentResult = spawnAgent(plog, agent, threadId, role, prompt, effectiveCwd);
+    result = await executeBrokerStep({
+      storageRoot,
+      uwf,
+      config,
+      workflow,
+      threadId,
+      role,
+      edgePrompt: prompt,
+      effectiveCwd,
+      startHash: chain.startHash,
+      prevHash: oldHeadPayload.prev,
+      agentOverride,
+      previousAttempts: null,
+      plog,
+    });
   } catch (e) {
     if (e instanceof StepFailureError) {
-      // Fatal agent failure in poke — persist suspended state before propagating
+      // Fatal broker failure in poke — persist suspended state before propagating
       const uwfErr = await createUwfStore(storageRoot);
       const errEntry = getThread(uwfErr.varStore, threadId) ?? entry;
       setThread(uwfErr.varStore, threadId, markThreadSuspended(errEntry, role, e.message));
     }
     throw e;
   }
-  const agentStepHash = agentResult.stepHash as CasRef;
-  plog.log(PL_AGENT_DONE, `agent returned head=${agentStepHash}`, null);
+  const replacedHash = result.stepHash;
+  plog.log(PL_AGENT_DONE, `broker returned head=${replacedHash}`, null);
   const uwfAfter = await createUwfStore(storageRoot);
-  const agentNode = uwfAfter.store.cas.get(agentStepHash);
-  if (agentNode === null || agentNode.type !== uwfAfter.schemas.stepNode) {
-    failStep(plog, `agent returned hash that is not a StepNode: ${agentStepHash}`);
-  }
-  const agentPayload = agentNode.payload as StepNodePayload;
-  // Rewrite the new step so that its `prev` points to the OLD head's prev (replace semantics).
-  const replacedPayload: StepNodePayload = {
-    ...agentPayload,
-    prev: oldHeadPayload.prev,
-  };
-  const replacedHash = await uwfAfter.store.cas.put(uwfAfter.schemas.stepNode, replacedPayload);
-  const replacedNode = uwfAfter.store.cas.get(replacedHash);
-  if (replacedNode === null || !validate(uwfAfter.store, replacedNode)) {
-    failStep(plog, "rewritten StepNode failed schema validation");
+  // Recoverable broker error: do NOT advance head, persist suspended state.
+  if (result.isError) {
+    const errorMsg = result.errorMessage ?? "broker reported error";
+    plog.log(
+      PL_AGENT_ERROR,
+      `poke recoverable failure stepHash=${replacedHash} message=${errorMsg}`,
+      null,
+    );
+    setThread(uwfAfter.varStore, threadId, markThreadSuspended(entry, role, errorMsg));
+    return {
+      workflow: workflowHash,
+      thread: threadId,
+      head: entry.head,
+      status: "suspended",
+      currentRole: role,
+      suspendedRole: role,
+      suspendMessage: errorMsg,
+      done: false,
+      background: null,
+      error: { stepHash: replacedHash, message: errorMsg },
+    };
   }
   // Update thread head to the replaced step. Status becomes idle (no moderator re-route).
@@ -1928,16 +1807,11 @@ async function cmdThreadStepOnce(
   const { role, edgePrompt, effectiveCwd } = targetOrOutput;
   const config = await loadWorkflowConfig(storageRoot);
-  const agent = resolveAgentConfig(config, workflow, role, agentOverride);
-  plog.log(PL_AGENT_SPAWN, `spawning agent command=${agent.command}`, {
-    args: [...agent.args, threadId, role].join(" "),
-  });
   loadDotenv({ path: getEnvPath(storageRoot) });
-  // Wrap agent execution in a try-catch: when the agent command crashes
-  // (non-zero exit, unparseable output, invalid CAS node, etc.), failStep throws
+  // Wrap broker execution in a try-catch: when the broker raises a fatal
+  // error (HTTP failure, schema validation crash, etc.), failStep throws
   // StepFailureError. We catch it to persist suspended state before re-throwing
   // so the CLI still exits non-zero.
   try {
@@ -1950,7 +1824,10 @@ async function cmdThreadStepOnce(
       role,
       edgePrompt,
       effectiveCwd,
-      agent,
+      uwf,
+      config,
+      chain.startHash,
+      agentOverride,
       plog,
     );
   } catch (e) {
@@ -1965,8 +1842,13 @@ async function cmdThreadStepOnce(
 }
 /**
- * Execute the agent command and process the result. Separated from cmdThreadStepOnce
+ * Execute the broker step and process the result. Separated from cmdThreadStepOnce
  * so that fatal failures (StepFailureError) can be caught and handled by the caller.
+ *
+ * Phase 3 (#380) — drives the broker via `executeBrokerStep` rather than the
+ * legacy `spawnAgent` path. The broker writes the StepNode (including the
+ * frontmatter retry chain) directly into CAS; the CLI only advances the head
+ * pointer afterwards.
  */
 async function executeAndProcessAgentStep(
   storageRoot: string,
@@ -1977,30 +1859,43 @@ async function executeAndProcessAgentStep(
   role: string,
   edgePrompt: string,
   effectiveCwd: string,
-  agent: AgentConfig,
+  uwf: UwfStore,
+  config: WorkflowConfig,
+  startHash: CasRef,
+  agentOverride: string | null,
   plog: ProcessLogger,
 ): Promise<StepOutput> {
-  const agentResult = spawnAgent(plog, agent, threadId, role, edgePrompt, effectiveCwd);
-  const newHead = agentResult.stepHash as CasRef;
+  const result = await executeBrokerStep({
+    storageRoot,
+    uwf,
+    config,
+    workflow,
+    threadId,
+    role,
+    edgePrompt,
+    effectiveCwd,
+    startHash,
+    prevHash: headHash === startHash ? null : headHash,
+    agentOverride,
+    previousAttempts: null,
+    plog,
+  });
-  plog.log(PL_AGENT_DONE, `agent returned head=${newHead}`, null);
+  const newHead = result.stepHash;
+  plog.log(PL_AGENT_DONE, `broker returned head=${newHead}`, null);
   const uwfAfter = await createUwfStore(storageRoot);
-  const newNode = uwfAfter.store.cas.get(newHead);
-  if (newNode === null || newNode.type !== uwfAfter.schemas.stepNode) {
-    failStep(plog, `agent returned hash that is not a StepNode: ${newHead}`);
-  }
-  // Recoverable failure: agent persisted a failed StepNode (e.g. frontmatter
+  // Recoverable failure: broker persisted a failed StepNode (e.g. frontmatter
   // validation exhausted retries) but the engine MUST NOT advance head. The
   // moderator graph is also untouched — the same role will be replayed on the
   // next exec (until eventual success records `previousAttempts` linking the
   // failed step hashes).
-  if (agentResult.isError === true) {
-    const errorMsg = agentResult.errorMessage ?? "agent reported error";
+  if (result.isError === true) {
+    const errorMsg = result.errorMessage ?? "broker reported error";
     plog.log(
       PL_AGENT_ERROR,
-      `agent reported recoverable failure stepHash=${newHead} message=${errorMsg}`,
+      `broker reported recoverable failure stepHash=${newHead} message=${errorMsg}`,
       null,
     );

package/dist/.build-fingerprint DELETED Viewed

	@@ -1 +0,0 @@
1	- 8f6475d4155e0628083a10a7c1b3bc83482b887cdcfd2a704a00492f70553d87

package/dist/__tests__/adapter-json-roundtrip.test.d.ts DELETED Viewed

	@@ -1,2 +0,0 @@
1	- export {};
2	- //# sourceMappingURL=adapter-json-roundtrip.test.d.ts.map

package/dist/__tests__/adapter-json-roundtrip.test.d.ts.map DELETED Viewed

	@@ -1 +0,0 @@
1	- {"version":3,"file":"adapter-json-roundtrip.test.d.ts","sourceRoot":"","sources":["../../src/__tests__/adapter-json-roundtrip.test.ts"],"names":[],"mappings":""}