npm - @desplega.ai/agent-swarm - Versions diffs - 1.87.0 → 1.88.0 - Mend

@desplega.ai/agent-swarm 1.87.0 → 1.88.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

package/README.md +2 -1
package/openapi.json +13 -1
package/package.json +5 -5
package/src/be/db.ts +49 -7
package/src/be/migrations/080_skill_system_defaults.sql +8 -0
package/src/be/modelsdev-cache.json +1123 -1034
package/src/be/seed/registry.ts +3 -2
package/src/be/seed-skills/index.ts +172 -0
package/src/cli.tsx +33 -4
package/src/commands/e2b-stack-wizard.tsx +394 -0
package/src/commands/e2b.ts +1352 -53
package/src/commands/onboard/dashboard-url.ts +29 -0
package/src/commands/onboard/steps/post-dashboard.tsx +3 -1
package/src/commands/onboard.tsx +3 -1
package/src/commands/runner.ts +1 -0
package/src/e2b/dispatch.ts +234 -18
package/src/http/memory.ts +13 -1
package/src/http/skills.ts +53 -0
package/src/http/webhooks.ts +75 -0
package/src/integrations/kapso/client.ts +82 -0
package/src/memory/automatic-task-gate.ts +47 -0
package/src/prompts/base-prompt.ts +16 -1
package/src/prompts/session-templates.ts +51 -0
package/src/providers/claude-adapter.ts +19 -0
package/src/providers/codex-adapter.ts +22 -0
package/src/providers/ctx-mode-env.ts +10 -0
package/src/providers/opencode-adapter.ts +50 -1
package/src/slack/blocks.ts +12 -4
package/src/slack/watcher.ts +3 -3
package/src/telemetry.ts +14 -1
package/src/templates.d.ts +4 -0
package/src/tests/base-prompt.test.ts +41 -0
package/src/tests/claude-adapter.test.ts +86 -1
package/src/tests/codex-adapter.test.ts +89 -0
package/src/tests/e2b-dispatch.test.ts +603 -11
package/src/tests/http-api-integration.test.ts +113 -0
package/src/tests/kapso-client.test.ts +74 -1
package/src/tests/kapso-inbound.test.ts +60 -2
package/src/tests/opencode-adapter.test.ts +95 -0
package/src/tests/prompt-template-session.test.ts +4 -2
package/src/tests/self-improvement.test.ts +89 -0
package/src/tests/skill-update-scope.test.ts +88 -1
package/src/tests/slack-blocks.test.ts +15 -0
package/src/tests/system-default-skills.test.ts +119 -0
package/src/tests/telemetry-init.test.ts +86 -0
package/src/tools/skills/skill-delete.ts +14 -0
package/src/tools/skills/skill-update.ts +14 -0
package/src/tools/store-progress.ts +19 -5
package/src/types.ts +1 -0
package/templates/skills/artifacts/config.json +1 -0
package/templates/skills/kv-storage/config.json +1 -0
package/templates/skills/pages/config.json +1 -0
package/templates/skills/scheduled-task-resilience/config.json +1 -0
package/templates/skills/swarm-scripts/SKILL.md +91 -0
package/templates/skills/swarm-scripts/config.json +14 -0
package/templates/skills/swarm-scripts/content.md +86 -0
package/templates/skills/workflow-iterate/config.json +1 -0
package/templates/skills/workflow-structured-output/config.json +1 -0
package/tsconfig.json +2 -1

package/src/commands/e2b.ts CHANGED Viewed

@@ -1,4 +1,6 @@
 import { dirname, resolve } from "node:path";
+import { render } from "ink";
+import { createElement } from "react";
 import {
   buildImageTemplate,
   buildTemplate,
@@ -8,8 +10,11 @@ import {
   killSandbox,
   listSandboxes,
   sandboxPortUrl,
+  setSandboxTimeout,
   setTemplateVisibility,
   startDetachedProcess,
+  streamSandboxLog,
+  ttlRemaining,
   waitForAgentRegistration,
   waitForHttpOk,
 } from "../e2b/dispatch";
@@ -29,8 +34,20 @@ import {
   selectEnv,
   splitKeys,
 } from "../e2b/env";
-type ParsedFlags = {
+import { getAppUrl } from "../utils/constants";
+import {
+  DEFAULT_STACK_TIMEOUT_SEC,
+  DEFAULT_STACK_WORKERS,
+  STACK_INTEGRATIONS,
+  StackWizard,
+  type StackWizardDefaults,
+  type StackWizardResult,
+  type StackWizardSkips,
+  SwarmPicker,
+  slugify,
+} from "./e2b-stack-wizard.tsx";
+export type ParsedFlags = {
   command?: string;
   positionals: string[];
   values: Map<string, string[]>;
@@ -43,10 +60,110 @@ type StartedRole = {
   url?: string;
 };
-const DEFAULT_API_PORT = 3013;
-const BOOLEAN_FLAGS = new Set(["dry-run", "json", "no-cache", "no-wait"]);
+/**
+ * Env scope for role-scoped secret/env-file layering. A lead is E2B
+ * `SwarmRole === "worker"` but gets its own `"lead"` env scope so lead and
+ * worker env never cross-contaminate.
+ */
+export type EnvScope = "api" | "lead" | "worker";
+/**
+ * The swarm-grouping role stamped onto `metadata.swarmRole`. Distinct from the
+ * E2B `SwarmRole` ("api" | "worker") because a lead runs as E2B `SwarmRole:"worker"`
+ * but is its own grouping role for `e2b swarms`. Used by `swarms info`
+ * to resolve which sandbox is the API vs lead vs workers.
+ */
+export type MetadataSwarmRole = "api" | "lead" | "worker";
+/**
+ * Per-instance launch spec threaded through {@link startRole}. `swarmRole` is
+ * the E2B template/entrypoint dimension (api vs worker). `agentRole` is the
+ * swarm-side role written to `AGENT_ROLE` (a lead is `swarmRole:"worker"` +
+ * `agentRole:"lead"`). `envScope` selects which scoped `--{scope}-env-file` /
+ * `--{scope}-secret` flags layer on top of the shared ones.
+ */
+export type LaunchSpec = {
+  swarmRole: SwarmRole;
+  agentRole?: "worker" | "lead";
+  envScope: EnvScope;
+  /**
+   * The grouping role stamped onto `metadata.swarmRole`. Defaults to a sensible
+   * value derived from `swarmRole`/`agentRole` (api → "api", lead → "lead",
+   * worker → "worker") when omitted. Kept explicit on the spec so the stack's
+   * lead and workers tag distinctly even though both are E2B `SwarmRole:"worker"`.
+   */
+  metadataSwarmRole?: MetadataSwarmRole;
+  /**
+   * Flag the explicit AGENT_ID override is read from (default `"agent-id"`).
+   * The stack's lead reads `"lead-agent-id"` so a single `--agent-id` never
+   * collapses the lead and a worker onto the same agent record.
+   */
+  agentIdFlag?: string;
+  /**
+   * Prefix for the generated default AGENT_ID (`<prefix>-<sandboxID>`). Workers
+   * use `"e2b"` (legacy, unchanged); the stack's lead uses `"e2b-lead"`. The
+   * sandbox ID is unique per sandbox, so every instance still registers
+   * distinctly even without an explicit `--agent-id`.
+   */
+  agentIdPrefix?: string;
+};
+/** The byte-identical specs for the legacy `start-api` / `start-worker` paths. */
+const API_SPEC: LaunchSpec = { swarmRole: "api", envScope: "api", metadataSwarmRole: "api" };
+const WORKER_SPEC: LaunchSpec = {
+  swarmRole: "worker",
+  envScope: "worker",
+  metadataSwarmRole: "worker",
+};
-function parseFlags(argv: string[]): ParsedFlags {
+/**
+ * Stack-specific specs. The lead is E2B `SwarmRole === "worker"` (same template
+ * + entrypoint) but pins `agentRole:"lead"`, its own `"lead"` env scope, a
+ * dedicated `--lead-agent-id` override + `e2b-lead-<sandboxID>` default, and a
+ * `"lead"` grouping role so `e2b swarms` can tell it apart from the workers.
+ */
+const STACK_LEAD_SPEC: LaunchSpec = {
+  swarmRole: "worker",
+  agentRole: "lead",
+  envScope: "lead",
+  agentIdFlag: "lead-agent-id",
+  agentIdPrefix: "e2b-lead",
+  metadataSwarmRole: "lead",
+};
+const STACK_WORKER_SPEC: LaunchSpec = {
+  swarmRole: "worker",
+  agentRole: "worker",
+  envScope: "worker",
+  metadataSwarmRole: "worker",
+};
+const DEFAULT_API_PORT = 3013;
+const BOOLEAN_FLAGS = new Set([
+  "dry-run",
+  "json",
+  "no-cache",
+  "no-wait",
+  "all",
+  "yes",
+  "non-interactive",
+  "no-lead",
+  "reveal-key",
+  // `swarms logs --follow` tails live output. Boolean so it never swallows the
+  // next positional/flag (e.g. the slug or `--role`).
+  "follow",
+  // `swarms add --add-lead` adds a lead to an existing swarm (in addition to or
+  // instead of workers). Boolean so it never swallows the next positional slug.
+  "add-lead",
+  // Integration disable shortcuts: `--no-<integration>` sets the matching
+  // API-side `*_DISABLE=true`. The `--integrations <csv>` allowlist is the
+  // value-bearing alternative (handled separately).
+  "no-slack",
+  "no-github",
+  "no-jira",
+  "no-linear",
+]);
+export function parseFlags(argv: string[]): ParsedFlags {
   const [command, ...rest] = argv;
   const positionals: string[] = [];
   const values = new Map<string, string[]>();
@@ -194,25 +311,80 @@ function e2bApiBase(flags: ParsedFlags, controllerEnv: EnvMap): string {
   return value(flags, "e2b-api-base") || controllerEnv.E2B_API_URL || DEFAULT_E2B_API_BASE;
 }
-async function loadRuntimeEnv(
+/** Read every `--{key}` env-file (repeatable) and merge them left-to-right. */
+async function loadEnvFiles(flags: ParsedFlags, key: string): Promise<EnvMap> {
+  const paths = values(flags, key).map((path) => absolutePath(path));
+  const merged: EnvMap = {};
+  for (const env of await Promise.all(paths.map((path) => readDotenvFile(path)))) {
+    Object.assign(merged, env);
+  }
+  return merged;
+}
+/** Apply every `--{key} KEY=VALUE` secret (repeatable) onto `target`, in order. */
+function applySecrets(flags: ParsedFlags, key: string, target: EnvMap): void {
+  for (const raw of values(flags, key)) {
+    const [secretKey, secretValue] = parseKeyValue(raw, `--${key}`);
+    target[secretKey] = secretValue;
+  }
+}
+/** Integrations toggleable via `--integrations <csv>` / `--no-<integration>`. */
+const E2B_INTEGRATIONS = ["slack", "github", "jira", "linear"] as const;
+type E2BIntegration = (typeof E2B_INTEGRATIONS)[number];
+/**
+ * Resolve which integrations are enabled. Default: all on. `--integrations
+ * <csv>` is an allowlist — anything not listed is disabled. `--no-<integration>`
+ * disables a single one (and stacks on top of the allowlist). Returns a map of
+ * integration → enabled.
+ */
+export function resolveIntegrationToggles(flags: ParsedFlags): Record<E2BIntegration, boolean> {
+  const allowlistRaw = splitKeys(values(flags, "integrations")).map((s) => s.toLowerCase());
+  const hasAllowlist = allowlistRaw.length > 0;
+  const toggles = {} as Record<E2BIntegration, boolean>;
+  for (const integration of E2B_INTEGRATIONS) {
+    // With an allowlist, only listed integrations stay on; without one, all on.
+    let enabled = hasAllowlist ? allowlistRaw.includes(integration) : true;
+    if (booleanFlag(flags, `no-${integration}`)) enabled = false;
+    toggles[integration] = enabled;
+  }
+  return toggles;
+}
+/**
+ * Stamp `*_DISABLE=true` for any integration the operator turned off. These envs
+ * are read API-side, so the caller only applies this to the API runtime scope.
+ */
+function applyIntegrationDisables(flags: ParsedFlags, target: EnvMap): void {
+  const toggles = resolveIntegrationToggles(flags);
+  for (const integration of E2B_INTEGRATIONS) {
+    if (!toggles[integration]) {
+      target[`${integration.toUpperCase()}_DISABLE`] = "true";
+    }
+  }
+}
+export async function loadRuntimeEnv(
   flags: ParsedFlags,
-  role: SwarmRole,
+  spec: LaunchSpec,
   apiUrl?: string,
 ): Promise<EnvMap> {
-  const envFiles = values(flags, "env-file").map((path) => absolutePath(path));
-  const fileEnv: EnvMap = {};
-  for (const env of await Promise.all(envFiles.map((path) => readDotenvFile(path)))) {
-    Object.assign(fileEnv, env);
-  }
+  const role = spec.swarmRole;
+  const scope = spec.envScope;
+  // Precedence (lowest → highest, later overrides earlier):
+  //   forward-keys (process.env) < shared --env-file < scoped --{scope}-env-file
+  //   < shared --secret < scoped --{scope}-secret < forced API_KEY/AGENT_SWARM_API_KEY.
+  // Scoped flags LAYER ON TOP of the shared ones — they never replace them.
   const inheritKeys = [...DEFAULT_E2B_FORWARD_KEYS, ...splitKeys(values(flags, "inherit-env"))];
-  const inherited = selectEnv(process.env, inheritKeys);
-  const runtime: EnvMap = { ...inherited, ...fileEnv };
+  const runtime: EnvMap = selectEnv(process.env, inheritKeys);
-  for (const raw of values(flags, "secret")) {
-    const [key, secretValue] = parseKeyValue(raw, "--secret");
-    runtime[key] = secretValue;
-  }
+  Object.assign(runtime, await loadEnvFiles(flags, "env-file"));
+  Object.assign(runtime, await loadEnvFiles(flags, `${scope}-env-file`));
+  applySecrets(flags, "secret", runtime);
+  applySecrets(flags, `${scope}-secret`, runtime);
   let swarmApiKey: string;
   try {
@@ -242,12 +414,19 @@ async function loadRuntimeEnv(
     runtime.SCRIPT_RUNTIME_DIR = value(flags, "script-runtime-dir", "/app/scripts-runtime");
     runtime.TS_LIB_DIR = value(flags, "ts-lib-dir", "/app/typescript-lib");
     runtime.SCRIPT_TYPES_DIR = value(flags, "script-types-dir", "/app/script-types");
+    // Integration toggles are read API-side, so they only ever apply to the API
+    // sandbox's runtime env. `--no-<integration>` / `--integrations <csv>`
+    // resolve to `*_DISABLE=true` here.
+    applyIntegrationDisables(flags, runtime);
   } else {
     if (!apiUrl) {
       throw new Error("Worker startup requires --api-url, or use start-stack to create API first.");
     }
     runtime.MCP_BASE_URL = apiUrl;
-    runtime.AGENT_ROLE = value(flags, "agent-role", "worker");
+    // AGENT_ROLE comes from the spec (so start-stack can pin lead/worker per
+    // instance); when the spec leaves it unset we fall back to the global
+    // --agent-role flag, keeping start-worker byte-identical to before.
+    runtime.AGENT_ROLE = spec.agentRole ?? value(flags, "agent-role", "worker");
     runtime.HARNESS_PROVIDER = value(flags, "provider", runtime.HARNESS_PROVIDER || "claude");
     runtime.WORKER_YOLO = value(flags, "worker-yolo", "false");
     runtime.WORKER_LOG_DIR = value(flags, "worker-log-dir", "/logs");
@@ -297,19 +476,89 @@ async function loadRuntimeEnv(
   return runtime;
 }
-function parseMetadata(flags: ParsedFlags, role: SwarmRole): Record<string, string> {
+/**
+ * Reserved sandbox-metadata keys this dispatcher stamps on every launch. They
+ * are read back by `e2b list`, `e2b kill --all`, and the `e2b swarms` family to
+ * group/inspect sandboxes — operators should not override them via `--metadata`.
+ *
+ *   app        — "agent-swarm" (provenance; every sandbox we create)
+ *   role       — E2B SwarmRole ("api" | "worker"); template/entrypoint dimension
+ *   launcher   — "agent-swarm-e2b" (the dispatcher tag `kill --all` filters on)
+ *   swarm      — shared slug grouping every sandbox of one launch (Phase 4)
+ *   swarmRole  — grouping role ("api" | "lead" | "worker"); a lead is E2B
+ *                role:"worker" but swarmRole:"lead", so `swarms info` can tell
+ *                the lead apart from the workers
+ *   apiPort    — (API sandbox only) the port the swarm API listens on, so
+ *                `swarms info` reconstructs the API URL without guessing
+ *   agentId    — (lead/worker only) the agent ID it registered under, when known
+ *                pre-create (explicit --agent-id / --lead-agent-id / env). When
+ *                absent (auto `<prefix>-<sandboxID>` default), `swarms info`
+ *                reconstructs it from the sandbox ID + swarmRole.
+ */
+const RESERVED_METADATA_KEYS = [
+  "app",
+  "role",
+  "launcher",
+  "swarm",
+  "swarmRole",
+  "apiPort",
+  "agentId",
+] as const;
+type MetadataTagging = {
+  /** E2B SwarmRole — the template/entrypoint dimension. */
+  role: SwarmRole;
+  /** Shared swarm slug for grouping (Phase 4). Omitted on legacy single-role launches. */
+  swarm?: string;
+  /** Grouping role for `e2b swarms` (api | lead | worker). */
+  swarmRole?: MetadataSwarmRole;
+  /** API port (API sandbox only) so `swarms info` rebuilds the URL deterministically. */
+  apiPort?: number;
+  /** Resolved agent ID (lead/worker only) when known before sandbox creation. */
+  agentId?: string;
+};
+function parseMetadata(flags: ParsedFlags, tagging: MetadataTagging): Record<string, string> {
   const metadata: Record<string, string> = {
     app: "agent-swarm",
-    role,
+    role: tagging.role,
     launcher: "agent-swarm-e2b",
   };
+  if (tagging.swarm) metadata.swarm = tagging.swarm;
+  if (tagging.swarmRole) metadata.swarmRole = tagging.swarmRole;
+  if (tagging.apiPort !== undefined) metadata.apiPort = String(tagging.apiPort);
+  if (tagging.agentId) metadata.agentId = tagging.agentId;
+  const reserved = new Set<string>(RESERVED_METADATA_KEYS);
   for (const raw of values(flags, "metadata")) {
     const [key, metadataValue] = parseKeyValue(raw, "--metadata");
+    if (reserved.has(key)) {
+      // The dispatcher owns these keys (grouping/teardown depend on them); a
+      // user override would silently break `kill --all` / the `swarms` family.
+      console.warn(`e2b: ignoring --metadata ${key}=… (reserved by the dispatcher)`);
+      continue;
+    }
     metadata[key] = metadataValue;
   }
   return metadata;
 }
+/** The grouping role to stamp for a spec (defaults from swarmRole/agentRole). */
+function metadataSwarmRoleForSpec(spec: LaunchSpec): MetadataSwarmRole {
+  if (spec.metadataSwarmRole) return spec.metadataSwarmRole;
+  if (spec.swarmRole === "api") return "api";
+  return spec.agentRole === "lead" ? "lead" : "worker";
+}
+/**
+ * The auto-generated AGENT_ID prefix for a grouping role (mirrors the prefixes
+ * in {@link startRole}). Lets `swarms info` reconstruct an agent ID from a
+ * sandbox ID when `metadata.agentId` is absent (the auto `<prefix>-<sandboxID>`
+ * default was used).
+ */
+function agentIdPrefixForSwarmRole(swarmRole: MetadataSwarmRole): string {
+  return swarmRole === "lead" ? "e2b-lead" : "e2b";
+}
 function roleTemplate(flags: ParsedFlags, role: SwarmRole): string {
   return value(
     flags,
@@ -322,9 +571,24 @@ function localDockerfile(role: SwarmRole): string {
   return role === "api" ? "Dockerfile" : "Dockerfile.worker";
 }
+function formatDuration(secondsLeft: number): string {
+  if (secondsLeft <= 0) return "expired";
+  const hours = Math.floor(secondsLeft / 3600);
+  const minutes = Math.floor((secondsLeft % 3600) / 60);
+  const parts: string[] = [];
+  if (hours > 0) parts.push(`${hours}h`);
+  // Under an hour, always show minutes (even "0m"); alongside hours, show them only when non-zero.
+  if (minutes > 0 || hours === 0) parts.push(`${minutes}m`);
+  return parts.join(" ");
+}
 function printHumanStart(result: StartedRole, env: EnvMap): void {
   console.log(`${result.role} sandbox: ${result.sandbox.sandboxID}`);
   if (result.url) console.log(`${result.role} url: ${result.url}`);
+  const ttl = ttlRemaining(result.sandbox);
+  if (ttl.expiresAt && ttl.secondsLeft !== undefined) {
+    console.log(`${result.role} expires: ${ttl.expiresAt} (in ${formatDuration(ttl.secondsLeft)})`);
+  }
   console.log(
     redactWithEnv(`inspect: e2b sandbox info ${result.sandbox.sandboxID} --format json`, env),
   );
@@ -340,18 +604,37 @@ function publicStartedRole(result: StartedRole, env: EnvMap): StartedRole {
 async function startRole(
   flags: ParsedFlags,
   cwd: string,
-  role: SwarmRole,
+  spec: LaunchSpec,
   apiUrl?: string,
 ): Promise<StartedRole> {
+  const role = spec.swarmRole;
   const controllerEnv = await loadE2BControllerEnv(flags, cwd);
-  const runtimeEnv = await loadRuntimeEnv(flags, role, apiUrl);
+  const runtimeEnv = await loadRuntimeEnv(flags, spec, apiUrl);
   const controllerApiKey = e2bControllerApiKey(controllerEnv);
   const template = roleTemplate(flags, role);
   const timeoutSec = integerFlag(flags, "timeout-sec", 3600);
   const apiBase = e2bApiBase(flags, controllerEnv);
   const dryRun = booleanFlag(flags, "dry-run");
   const port = Number.parseInt(runtimeEnv.PORT || String(DEFAULT_API_PORT), 10);
-  const metadata = parseMetadata(flags, role);
+  const swarmSlug = value(flags, "swarm") || undefined;
+  const metadataSwarmRole = metadataSwarmRoleForSpec(spec);
+  // Resolve the agent ID we can know BEFORE the sandbox exists: an explicit
+  // --agent-id / --lead-agent-id flag, or AGENT_ID from the runtime env. The
+  // auto `<prefix>-<sandboxID>` default depends on the not-yet-created sandbox
+  // ID, so it is NOT stamped here — `swarms info` reconstructs it from the
+  // sandbox ID + swarmRole instead.
+  const preCreateAgentId =
+    role === "worker"
+      ? value(flags, spec.agentIdFlag ?? "agent-id") || runtimeEnv.AGENT_ID || undefined
+      : undefined;
+  const metadata = parseMetadata(flags, {
+    role,
+    swarm: swarmSlug,
+    swarmRole: metadataSwarmRole,
+    apiPort: role === "api" ? port : undefined,
+    agentId: preCreateAgentId,
+  });
   if (dryRun) {
     const fakeSandbox = {
@@ -360,6 +643,7 @@ async function startRole(
       envdAccessToken: "dry-run",
       domain: "e2b.app",
       metadata,
+      expiresAt: new Date(Date.now() + timeoutSec * 1000).toISOString(),
     };
     return {
       role,
@@ -379,7 +663,14 @@ async function startRole(
   try {
     if (role === "worker" && !runtimeEnv.AGENT_ID) {
-      runtimeEnv.AGENT_ID = value(flags, "agent-id", `e2b-${sandbox.sandboxID}`);
+      // Per-instance AGENT_ID. The explicit-override flag and the generated
+      // default prefix come from the spec so the stack's lead never collides
+      // with a worker (lead → --lead-agent-id / e2b-lead-<id>; worker →
+      // --agent-id / e2b-<id>). Sandbox IDs are unique, so each instance
+      // registers distinctly even without an explicit override.
+      const agentIdFlag = spec.agentIdFlag ?? "agent-id";
+      const agentIdPrefix = spec.agentIdPrefix ?? "e2b";
+      runtimeEnv.AGENT_ID = value(flags, agentIdFlag, `${agentIdPrefix}-${sandbox.sandboxID}`);
     }
     const entrypoint = role === "api" ? "/api-entrypoint.sh" : "/docker-entrypoint.sh";
@@ -541,8 +832,8 @@ async function templateVisibilityCommand(
 }
 async function startApiCommand(flags: ParsedFlags, cwd: string): Promise<void> {
-  const result = await startRole(flags, cwd, "api");
-  const runtimeEnv = await loadRuntimeEnv(flags, "api");
+  const result = await startRole(flags, cwd, API_SPEC);
+  const runtimeEnv = await loadRuntimeEnv(flags, API_SPEC);
   if (booleanFlag(flags, "json")) {
     console.log(JSON.stringify(publicStartedRole(result, runtimeEnv), null, 2));
   } else {
@@ -552,8 +843,8 @@ async function startApiCommand(flags: ParsedFlags, cwd: string): Promise<void> {
 async function startWorkerCommand(flags: ParsedFlags, cwd: string): Promise<void> {
   const apiUrl = value(flags, "api-url");
-  const result = await startRole(flags, cwd, "worker", apiUrl);
-  const runtimeEnv = await loadRuntimeEnv(flags, "worker", apiUrl);
+  const result = await startRole(flags, cwd, WORKER_SPEC, apiUrl);
+  const runtimeEnv = await loadRuntimeEnv(flags, WORKER_SPEC, apiUrl);
   if (booleanFlag(flags, "json")) {
     console.log(JSON.stringify(publicStartedRole(result, runtimeEnv), null, 2));
   } else {
@@ -587,39 +878,183 @@ async function cleanupStartedRoles(
   }
 }
+async function resyncStackTimeout(
+  flags: ParsedFlags,
+  cwd: string,
+  started: StartedRole[],
+): Promise<void> {
+  if (booleanFlag(flags, "dry-run") || started.length === 0) return;
+  const timeoutSec = integerFlag(flags, "timeout-sec", 3600);
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  for (const role of started) {
+    try {
+      await setSandboxTimeout({
+        sandboxId: role.sandbox.sandboxID,
+        apiKey: controllerApiKey,
+        apiBase,
+        e2bEnv: controllerEnv,
+        timeoutMs: timeoutSec * 1000,
+      });
+    } catch (err) {
+      // A re-sync failure is non-fatal — the sandbox is still up with its
+      // original (slightly shorter) TTL. setSandboxTimeout already redacts.
+      const message = err instanceof Error ? err.message : String(err);
+      console.warn(
+        redactWithEnv(
+          `e2b: failed to re-sync TTL for ${role.role} sandbox ${role.sandbox.sandboxID}: ${message}`,
+          controllerEnv,
+        ),
+      );
+    }
+  }
+}
+/**
+ * `start-stack` should run headless (no prompts, never read stdin) whenever:
+ *   - `--yes` / `--non-interactive` is passed,
+ *   - `--dry-run` is passed (CI/preview path), or
+ *   - we're not on an interactive TTY (piped / redirected stdin or stdout).
+ * Critically, the piped case (`echo | … start-stack …`) MUST take this path so
+ * it exits without hanging on a prompt that no one can answer.
+ */
+function isStackHeadless(flags: ParsedFlags): boolean {
+  return (
+    booleanFlag(flags, "yes") ||
+    booleanFlag(flags, "non-interactive") ||
+    booleanFlag(flags, "dry-run") ||
+    !isInteractiveTty()
+  );
+}
 async function startStackCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  // `--agent-role` is meaningless for the split topology (API + lead + workers
+  // each get a fixed role). Warn and point the operator at the right tool
+  // rather than silently ignoring an intent to change roles.
+  if (value(flags, "agent-role")) {
+    console.warn(
+      "e2b start-stack: --agent-role is ignored (the stack pins API/lead/worker roles). " +
+        "Use --no-lead for an API + workers topology, or start-worker --agent-role for a single custom-role worker.",
+    );
+  }
+  // Normalize a user-supplied --swarm into a clean slug so the value is
+  // consistent whether it came from a flag or the wizard. We do NOT synthesize
+  // the random fallback here: doing so would mark `swarm` as "set" and make the
+  // wizard skip its Swarm-name step, so a TTY operator without --swarm could
+  // never name the swarm. The `swarm-<short-random>` default is applied AFTER
+  // the wizard (below) — by which point either the operator named it or we fill
+  // it in for the headless / unnamed path.
+  const swarmFlag = value(flags, "swarm");
+  if (swarmFlag) {
+    setFlagValue(flags, "swarm", slugify(swarmFlag));
+  }
+  // Interactive wizard (TTY only). Headless runs (--yes / --non-interactive /
+  // --dry-run / non-TTY) skip it entirely and rely on flags + defaults. The
+  // wizard may set/overwrite the swarm slug if the operator names the swarm.
+  if (!isStackHeadless(flags)) {
+    await runStackWizard(flags);
+  }
+  // Now that the wizard (if any) has run, GENERATE a shared slug when neither
+  // the flag nor the wizard produced one. Every sandbox of this launch then
+  // shares a single grouping slug stamped onto metadata.swarm (read by
+  // `e2b swarms`). This lands on `flags` BEFORE any startRole call so all roles
+  // inherit it.
+  if (!value(flags, "swarm")) {
+    setFlagValue(flags, "swarm", generateSwarmSlug());
+  }
+  // A single explicit --agent-id is reused verbatim for every worker in the loop
+  // below, but the API registration path reuses the row for an existing
+  // X-Agent-ID — so N workers would collapse into one agent record and the wait
+  // loop would poll the same agent N times. Reject the shared explicit ID for
+  // multi-worker stacks; the per-sandbox `e2b-<sandboxID>` default (or a
+  // single-worker stack) stays unaffected. `--workers` is resolved here so a
+  // wizard-chosen count is also covered.
+  const explicitWorkerAgentId = value(flags, STACK_WORKER_SPEC.agentIdFlag ?? "agent-id");
+  if (explicitWorkerAgentId && integerFlag(flags, "workers", 1) > 1) {
+    throw new Error(
+      "e2b start-stack: --agent-id cannot be shared across multiple workers " +
+        "(it collapses them into a single agent record). Drop --agent-id to use " +
+        "the per-sandbox default, or run --workers 1.",
+    );
+  }
+  // Echo the resolved slug up front so the operator can group/inspect/extend the
+  // launch via `e2b swarms <cmd> <slug>` even if a later role fails. Under --json
+  // STDOUT must carry ONLY the final JSON payload, so route this human echo to
+  // STDERR (still visible to the operator, never pollutes `... --json | jq`).
+  const swarmSlug = value(flags, "swarm");
+  if (booleanFlag(flags, "json")) {
+    console.error(`swarm: ${swarmSlug}`);
+  } else {
+    console.log(`swarm: ${swarmSlug}`);
+  }
+  const noLead = booleanFlag(flags, "no-lead");
   const started: StartedRole[] = [];
+  let lead: StartedRole | undefined;
   const workers: StartedRole[] = [];
   try {
-    const api = await startRole(flags, cwd, "api");
+    const api = await startRole(flags, cwd, API_SPEC);
     started.push(api);
     if (!api.url) throw new Error("API sandbox did not produce a public URL");
+    // (2) One lead, unless --no-lead retains the legacy homogeneous topology.
+    if (!noLead) {
+      lead = await startRole(flags, cwd, STACK_LEAD_SPEC, api.url);
+      // The lead MUST be in `started[]` so a mid-launch failure tears it down,
+      // and so the TTL re-sync pass below covers it.
+      started.push(lead);
+    }
+    // (3) N workers.
     const workerCount = integerFlag(flags, "workers", 1);
     for (let i = 0; i < workerCount; i++) {
-      const worker = await startRole(flags, cwd, "worker", api.url);
+      const worker = await startRole(flags, cwd, STACK_WORKER_SPEC, api.url);
       workers.push(worker);
       started.push(worker);
     }
-    const runtimeEnv = await loadRuntimeEnv(flags, "api");
+    // Re-sync the whole stack to a single wall-clock TTL. The API sandbox is
+    // created first, so by the time the last worker is up the API's remaining TTL
+    // is shorter than that worker's. One setSandboxTimeout pass aligns every sandbox
+    // to `timeoutSec` from now (E2B clamps to the tier max as usual). Dry-run
+    // short-circuits — never touches E2B.
+    await resyncStackTimeout(flags, cwd, started);
+    const runtimeEnv = await loadRuntimeEnv(flags, API_SPEC);
     if (booleanFlag(flags, "json")) {
-      console.log(
-        JSON.stringify(
-          {
-            api: publicStartedRole(api, runtimeEnv),
-            workers: workers.map((worker) => publicStartedRole(worker, runtimeEnv)),
-          },
-          null,
-          2,
-        ),
-      );
+      // Legacy shape under --no-lead: {api, workers}. New shape with a lead:
+      // {api, lead, workers}.
+      const payload: Record<string, unknown> = {
+        api: publicStartedRole(api, runtimeEnv),
+      };
+      if (lead) payload.lead = publicStartedRole(lead, runtimeEnv);
+      payload.workers = workers.map((worker) => publicStartedRole(worker, runtimeEnv));
+      console.log(JSON.stringify(payload, null, 2));
     } else {
       printHumanStart(api, runtimeEnv);
+      if (lead) printHumanStart(lead, runtimeEnv);
       for (const worker of workers) {
         printHumanStart(worker, runtimeEnv);
       }
+      // Dashboard deep-link (key hidden unless --reveal-key). Only printed on the
+      // human path — the --json payload is consumed programmatically and the URL
+      // would otherwise embed the swarm key in machine output.
+      printDashboardDeepLink(flags, {
+        apiUrl: api.url,
+        apiKey: runtimeEnv.AGENT_SWARM_API_KEY,
+        name: swarmSlug,
+        env: runtimeEnv,
+      });
     }
   } catch (err) {
     await cleanupStartedRoles(flags, cwd, started);
@@ -627,13 +1062,315 @@ async function startStackCommand(flags: ParsedFlags, cwd: string): Promise<void>
   }
 }
-async function killCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+/**
+ * Overwrite `key` in `flags.values` with a one-element list holding `value`,
+ * discarding whatever was stored before (the in-memory twin of `--key value`).
+ */
+function setFlagValue(flags: ParsedFlags, key: string, value: string): void {
+  const replacement = [value];
+  flags.values.set(key, replacement);
+}
+/**
+ * Decide which wizard steps can be bypassed because the command line already
+ * answers them. Each entry is true when the flag driving that step was given;
+ * the integrations step is also bypassed by any `--no-<integration>` boolean.
+ */
+function stackWizardSkips(flags: ParsedFlags): StackWizardSkips {
+  const supplied = (flag: string): boolean => flags.values.has(flag);
+  const swarm = Boolean(value(flags, "swarm"));
+  const workers = supplied("workers");
+  const provider = supplied("provider");
+  const timeout = supplied("timeout-sec");
+  const envFiles = supplied("env-file");
+  const integrations =
+    supplied("integrations") ||
+    STACK_INTEGRATIONS.some((name) => booleanFlag(flags, `no-${name}`));
+  return { swarm, workers, provider, timeout, envFiles, integrations };
+}
+/**
+ * Build the wizard's starting answers from whatever the flags currently resolve
+ * to, falling back to the stack defaults (and provider "claude") when absent.
+ */
+function stackWizardDefaults(flags: ParsedFlags): StackWizardDefaults {
+  const swarmSlug = value(flags, "swarm") || undefined;
+  const workers = integerFlag(flags, "workers", DEFAULT_STACK_WORKERS);
+  const provider = value(flags, "provider", "claude");
+  const timeoutSec = integerFlag(flags, "timeout-sec", DEFAULT_STACK_TIMEOUT_SEC);
+  const envFiles = values(flags, "env-file");
+  const integrations = resolveIntegrationToggles(flags);
+  const noLead = booleanFlag(flags, "no-lead");
+  return { swarmSlug, workers, provider, timeoutSec, envFiles, integrations, noLead };
+}
+/**
+ * Copy the wizard's answers onto `flags` so the headless launch path reads them
+ * like ordinary command-line input. Swarm, workers, provider and timeout are
+ * always written; env files only when the wizard returned at least one. The
+ * `no-<integration>` and `no-lead` booleans are only ever added, never removed.
+ */
+function applyWizardResultToFlags(flags: ParsedFlags, result: StackWizardResult): void {
+  const singles: Array<[string, string]> = [
+    ["swarm", result.swarmSlug],
+    ["workers", String(result.workers)],
+    ["provider", result.provider],
+    ["timeout-sec", String(result.timeoutSec)],
+  ];
+  for (const [key, answer] of singles) {
+    setFlagValue(flags, key, answer);
+  }
+  if (result.envFiles.length > 0) {
+    flags.values.set("env-file", result.envFiles);
+  }
+  // Every integration the operator switched off is recorded as `--no-<integration>`.
+  for (const integration of STACK_INTEGRATIONS) {
+    if (result.integrations[integration]) continue;
+    flags.booleans.add(`no-${integration}`);
+  }
+  if (result.noLead) flags.booleans.add("no-lead");
+}
+/**
+ * Quote `arg` for a POSIX shell. Strings made only of shell-safe characters are
+ * returned unchanged; anything else is wrapped in single quotes.
+ */
+function quoteOneShotArg(arg: string): string {
+  if (/^[A-Za-z0-9_@%+=:,./-]+$/.test(arg)) return arg;
+  // Close the quote, emit an escaped single quote, reopen it: ' -> '\''
+  return `'${arg.replace(/'/g, "'\\''")}'`;
+}
+/**
+ * Reconstruct the equivalent headless one-shot command from the resolved flags,
+ * so an operator who ran the wizard can copy/paste it for a repeatable run.
+ * Only the flags emitted below are included — no `--secret` / `--api-key`.
+ *
+ * Free-form values (swarm slug, provider, env-file paths) are shell-quoted when
+ * they contain whitespace or shell metacharacters, so the printed command stays
+ * pasteable; values that need no quoting are emitted exactly as before.
+ *
+ * @param flags Parsed flags after the wizard's answers were folded in.
+ * @returns A single-line `agent-swarm e2b start-stack --yes …` command.
+ */
+function buildOneShotCommand(flags: ParsedFlags): string {
+  const parts = ["agent-swarm e2b start-stack --yes"];
+  const slug = value(flags, "swarm");
+  if (slug) parts.push(`--swarm ${quoteOneShotArg(slug)}`);
+  parts.push(`--workers ${integerFlag(flags, "workers", DEFAULT_STACK_WORKERS)}`);
+  const provider = value(flags, "provider");
+  if (provider) parts.push(`--provider ${quoteOneShotArg(provider)}`);
+  parts.push(`--timeout-sec ${integerFlag(flags, "timeout-sec", DEFAULT_STACK_TIMEOUT_SEC)}`);
+  for (const file of values(flags, "env-file")) {
+    parts.push(`--env-file ${quoteOneShotArg(file)}`);
+  }
+  for (const integration of STACK_INTEGRATIONS) {
+    if (booleanFlag(flags, `no-${integration}`)) parts.push(`--no-${integration}`);
+  }
+  if (booleanFlag(flags, "no-lead")) parts.push("--no-lead");
+  return parts.join(" ");
+}
+/**
+ * Run the interactive Ink wizard, merge its answers into `flags`, and print the
+ * matching `--yes` command for later non-interactive reuse. Intended for an
+ * interactive TTY only (see {@link isStackHeadless}).
+ *
+ * @throws Error when the wizard exits before reporting a configuration.
+ */
+async function runStackWizard(flags: ParsedFlags): Promise<void> {
+  const skips = stackWizardSkips(flags);
+  const defaults = stackWizardDefaults(flags);
+  // The wizard reports through a callback; park the answer here until it exits.
+  const answers: { result?: StackWizardResult } = {};
+  const wizard = createElement(StackWizard, {
+    defaults,
+    skips,
+    onComplete: (result: StackWizardResult) => {
+      answers.result = result;
+    },
+  });
+  const app = render(wizard);
+  await app.waitUntilExit();
+  if (!answers.result) {
+    throw new Error("stack wizard exited without producing a configuration");
+  }
+  applyWizardResultToFlags(flags, answers.result);
+  console.log("\nEquivalent one-shot command:");
+  console.log(`  ${buildOneShotCommand(flags)}\n`);
+}
+/**
+ * Generate a fresh swarm slug (`swarm-<6 hex digits>`) for launches where the
+ * operator did not name the swarm. A short hex tail keeps the slug readable
+ * while being unlikely to collide across a handful of concurrent launches; it
+ * is not cryptographically random.
+ *
+ * @returns A slug matching `/^swarm-[0-9a-f]{6}$/`.
+ */
+function generateSwarmSlug(): string {
+  // Draw an integer in [0, 0xffffff] and zero-pad it. Slicing the fractional
+  // digits of `Math.random().toString(16)` is not length-stable: 0.5 renders as
+  // "0.8" (tail "8") and 0 renders as "0" (empty tail → bare "swarm-").
+  const tail = Math.floor(Math.random() * 0x1000000)
+    .toString(16)
+    .padStart(6, "0");
+  return `swarm-${tail}`;
+}
+/**
+ * Mask a swarm API key for display. Keys of 16+ characters keep their first and
+ * last four characters with the middle elided; anything shorter is fully masked
+ * so that the visible part is never more than half of the key.
+ *
+ * @param key The key to mask; an empty string renders as `(none)`.
+ * @returns `(none)`, `****`, or `<first 4>…<last 4>`.
+ */
+function maskKey(key: string): string {
+  if (!key) return "(none)";
+  // Showing 4 + 4 characters of a 9–15 character key would expose most of it
+  // (all but one character at length 9), so partial reveal needs 16+ characters.
+  const minPartialRevealLength = 16;
+  if (key.length < minPartialRevealLength) return "****";
+  return `${key.slice(0, 4)}…${key.slice(-4)}`;
+}
+/**
+ * Describe where the swarm API key came from, for display in `swarms info`.
+ * Returns a human-readable label only — never the key itself.
+ *
+ * The first non-empty candidate wins, in this order: `--api-key`, then
+ * `runtime.AGENT_SWARM_API_KEY`, then `runtime.API_KEY`; otherwise the key is
+ * attributed to the getApiKey() default. This ordering is intended to mirror
+ * {@link resolveSwarmApiKey} — keep the two in step.
+ *
+ * No `process.env` read happens here: the caller passes `runtime`, which it
+ * builds with `selectEnv(process.env, …)`.
+ */
+function swarmApiKeySource(flags: ParsedFlags, runtime: EnvMap): string {
+  const candidates: Array<[string | undefined, string]> = [
+    [value(flags, "api-key"), "from --api-key"],
+    [runtime.AGENT_SWARM_API_KEY, "from AGENT_SWARM_API_KEY"],
+    [runtime.API_KEY, "from API_KEY"],
+  ];
+  const match = candidates.find(([present]) => Boolean(present));
+  return match ? match[1] : "from getApiKey() default";
+}
+/** Optional inputs consumed by {@link buildDashboardDeepLink}. */
+export type DashboardDeepLinkParts = {
+  /** Emitted as the `apiUrl` query parameter when non-empty. */
+  apiUrl?: string;
+  /** Embedded (URI-encoded) as `apiKey` only when the link is built with `reveal` true. */
+  apiKey?: string;
+  /** Emitted as the `name` query parameter when non-empty. */
+  name?: string;
+};
+/**
+ * Assemble the dashboard deep-link from `getAppUrl()` plus query parameters.
+ * Parameter names are deliberately camelCase (`apiUrl`, `apiKey`, `name`): per
+ * the note carried with this code, the SPA (ui/src/hooks/use-config.ts) ignores
+ * snake_case, so do not rename them.
+ *
+ * With `reveal` false the `apiKey` slot carries a literal, un-encoded
+ * placeholder so the real key stays out of logs and scrollback. With `reveal`
+ * true the real key is URI-encoded into the link (or the slot is dropped when
+ * no key is available); the caller owns the secret warning and must not pass
+ * the result through a redactor.
+ */
+export function buildDashboardDeepLink(parts: DashboardDeepLinkParts, reveal: boolean): string {
+  // apiUrl and name go through URLSearchParams for normal percent-encoding.
+  const encoded = new URLSearchParams();
+  if (parts.apiUrl) encoded.set("apiUrl", parts.apiUrl);
+  if (parts.name) encoded.set("name", parts.name);
+  // The key slot is built by hand: URLSearchParams would percent-encode the
+  // placeholder's spaces and em-dash and make the hint unreadable.
+  let keySegment = "apiKey=<hidden — pass --reveal-key>";
+  if (reveal) {
+    keySegment = parts.apiKey ? `apiKey=${encodeURIComponent(parts.apiKey)}` : "";
+  }
+  const segments: string[] = [];
+  if (keySegment) segments.push(keySegment);
+  const rest = encoded.toString();
+  if (rest) segments.push(rest);
+  const base = getAppUrl();
+  return segments.length > 0 ? `${base}?${segments.join("&")}` : `${base}`;
+}
+/**
+ * Print the dashboard deep-link, or nothing at all when no API URL is known.
+ * By default the key is hidden and a hint about `--reveal-key` follows. With
+ * `--reveal-key` a secret warning is printed first and the key-bearing URL is
+ * written raw — deliberately not redacted, since redaction would strip the key
+ * the operator asked for. `opts.env` is accepted but not read here.
+ */
+function printDashboardDeepLink(
+  flags: ParsedFlags,
+  opts: { apiUrl?: string; apiKey?: string; name?: string; env: EnvMap },
+): void {
+  const { apiUrl, apiKey, name } = opts;
+  if (!apiUrl) return;
+  const revealRequested = booleanFlag(flags, "reveal-key");
+  const parts: DashboardDeepLinkParts = { apiUrl, apiKey, name };
+  if (!revealRequested) {
+    console.log(`dashboard: ${buildDashboardDeepLink(parts, false)}`);
+    console.log("  (pass --reveal-key to embed the swarm API key for one-click connect)");
+    return;
+  }
+  console.log("\n⚠ secret: the URL below embeds the swarm API key — do not share or paste it.");
+  // Raw on purpose: the operator explicitly asked for the key to be shown.
+  console.log(`dashboard: ${buildDashboardDeepLink(parts, true)}`);
+}
+/** True only when both stdin and stdout are attached to a terminal. */
+function isInteractiveTty(): boolean {
+  const { stdin, stdout } = process;
+  return Boolean(stdin.isTTY) && Boolean(stdout.isTTY);
+}
+/**
+ * Ask the operator a yes/no question.
+ *
+ * `--yes` answers true without prompting. Without it, a non-interactive context
+ * (CI, piped I/O) answers false because nobody can respond. On a TTY the prompt
+ * is written with a `[y/N]` suffix and the first input line decides: "y" or
+ * "yes" (case-insensitive, trimmed) is true, anything else — or end of input —
+ * is false.
+ *
+ * NOTE(review): reading lines by async-iterating `console` looks runtime
+ * specific (presumably Bun) — confirm before running this under another runtime.
+ */
+async function confirm(prompt: string, flags: ParsedFlags): Promise<boolean> {
+  const preApproved = booleanFlag(flags, "yes");
+  if (preApproved) return true;
+  if (!isInteractiveTty()) return false;
+  process.stdout.write(`${prompt} [y/N] `);
+  const affirmative = new Set(["y", "yes"]);
+  for await (const line of console) {
+    // Only the first line read decides the outcome.
+    return affirmative.has(line.trim().toLowerCase());
+  }
+  return false;
+}
+/**
+ * `e2b extend <sandbox-id...> [--timeout-sec <seconds>]` — set a new TTL on each
+ * listed sandbox via `setSandboxTimeout`.
+ *
+ * `--timeout-sec` defaults to 3600. With `--dry-run` the intended change is
+ * printed per sandbox and the function returns before the controller env is
+ * loaded. Otherwise every ID is attempted even if an earlier one fails; each
+ * failure is logged (redacted) to stderr and counted.
+ *
+ * @throws Error when no sandbox ID is given, or after the loop when at least
+ *   one extension failed.
+ */
+async function extendCommand(flags: ParsedFlags, cwd: string): Promise<void> {
   const ids = flags.positionals;
-  if (ids.length === 0) throw new Error("kill requires at least one sandbox ID");
+  if (ids.length === 0) throw new Error("extend requires at least one sandbox ID");
+  const timeoutSec = integerFlag(flags, "timeout-sec", 3600);
+  const dryRun = booleanFlag(flags, "dry-run");
+  if (dryRun) {
+    // Short-circuit before any SDK/network work so --dry-run never touches E2B.
+    for (const id of ids) {
+      console.log(`would extend ${id} to ${timeoutSec}s TTL`);
+    }
+    return;
+  }
   const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
   const apiBase = e2bApiBase(flags, controllerEnv);
+  // Count failures instead of aborting so one bad ID does not block the rest.
+  let failures = 0;
+  for (const id of ids) {
+    try {
+      const ttl = await setSandboxTimeout({
+        sandboxId: id,
+        apiKey: controllerApiKey,
+        apiBase,
+        e2bEnv: controllerEnv,
+        timeoutMs: timeoutSec * 1000,
+      });
+      // Report the new expiry only when the call returned both fields.
+      if (ttl.expiresAt && ttl.secondsLeft !== undefined) {
+        console.log(
+          `extended ${id} — expires ${ttl.expiresAt} (in ${formatDuration(ttl.secondsLeft)})`,
+        );
+      } else {
+        console.log(`extended ${id}`);
+      }
+    } catch (err) {
+      failures++;
+      // setSandboxTimeout already produces a redacted message.
+      const message = err instanceof Error ? err.message : String(err);
+      console.error(redactWithEnv(`e2b: extend failed: ${message}`, controllerEnv));
+    }
+  }
+  if (failures > 0) {
+    throw new Error(`extend failed for ${failures} of ${ids.length} sandbox(es)`);
+  }
+}
+/**
+ * `e2b kill <sandbox-id...>` / `e2b kill --all` — kill sandboxes one by one.
+ *
+ * With `--all` the positional IDs are replaced by every listed sandbox whose
+ * `metadata.launcher` is "agent-swarm-e2b". If none match, a message is printed
+ * and nothing is killed; if more than one matches, `confirm` must approve
+ * (`--yes` pre-approves). Kills are awaited sequentially with no try/catch, so
+ * the first failure propagates and the remaining IDs are left untouched.
+ *
+ * @throws Error when there is nothing to kill and `--all` was not given.
+ */
+async function killCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  let ids = flags.positionals;
+  if (booleanFlag(flags, "all")) {
+    // Sweep everything this dispatcher launched. The launcher tag is stamped on
+    // every sandbox by parseMetadata, so this never touches unrelated sandboxes.
+    const sandboxes = await listSandboxes(controllerApiKey, apiBase);
+    ids = sandboxes
+      .filter((sandbox) => sandbox.metadata?.launcher === "agent-swarm-e2b")
+      .map((sandbox) => sandbox.sandboxID);
+    if (ids.length === 0) {
+      console.log("no agent-swarm sandboxes to kill");
+      return;
+    }
+    // Guard against an accidental fleet-wide teardown. A single target is
+    // unambiguous; multiple targets require confirmation (or --yes in CI).
+    if (ids.length > 1) {
+      const ok = await confirm(
+        `Kill ${ids.length} agent-swarm sandboxes (${ids.join(", ")})?`,
+        flags,
+      );
+      if (!ok) {
+        console.log("aborted (pass --yes to skip this prompt)");
+        return;
+      }
+    }
+  }
+  // Only reachable with an empty list when --all was not given (the --all path
+  // returns early above when nothing matched).
+  if (ids.length === 0) throw new Error("kill requires at least one sandbox ID (or --all)");
   for (const id of ids) {
-    await killSandbox(id, e2bControllerApiKey(controllerEnv), apiBase);
+    await killSandbox(id, controllerApiKey, apiBase);
     console.log(`killed ${id}`);
   }
 }
@@ -653,6 +1390,504 @@ async function listCommand(flags: ParsedFlags, cwd: string): Promise<void> {
   }
 }
+/**
+ * Map key under which `groupSandboxesBySwarm` collects sandboxes that carry no
+ * (or an empty) `metadata.swarm` tag — e.g. legacy or standalone launches.
+ */
+const UNGROUPED_BUCKET = "(ungrouped)";
+/**
+ * Bucket sandboxes by their `metadata.swarm` slug. A sandbox whose slug is
+ * missing or empty goes into the `(ungrouped)` bucket. The returned map lists
+ * slugs in first-seen order, and each bucket keeps its members in input order.
+ */
+function groupSandboxesBySwarm(sandboxes: E2BSandboxInfo[]): Map<string, E2BSandboxInfo[]> {
+  const bySlug = new Map<string, E2BSandboxInfo[]>();
+  sandboxes.forEach((sandbox) => {
+    const key = sandbox.metadata?.swarm || UNGROUPED_BUCKET;
+    const existing = bySlug.get(key);
+    if (existing === undefined) {
+      bySlug.set(key, [sandbox]);
+    } else {
+      existing.push(sandbox);
+    }
+  });
+  return bySlug;
+}
+/**
+ * Resolve a sandbox's grouping role. A recognised `metadata.swarmRole`
+ * (api | lead | worker) wins; otherwise the role is derived from
+ * `metadata.role`, where "api" maps to api and everything else to worker.
+ */
+function sandboxSwarmRole(sandbox: E2BSandboxInfo): MetadataSwarmRole {
+  switch (sandbox.metadata?.swarmRole) {
+    case "api":
+      return "api";
+    case "lead":
+      return "lead";
+    case "worker":
+      return "worker";
+    default:
+      // No usable swarmRole (e.g. older sandboxes): fall back to the E2B role.
+      return sandbox.metadata?.role === "api" ? "api" : "worker";
+  }
+}
+/**
+ * Agent ID for a sandbox: the stamped `metadata.agentId` when present,
+ * otherwise `<role prefix>-<sandboxID>`. The fallback is meant to reproduce the
+ * auto-generated default (see startRole) so `swarms info` can still name the
+ * agent when no ID was stamped.
+ */
+function sandboxAgentId(sandbox: E2BSandboxInfo): string {
+  const stamped = sandbox.metadata?.agentId;
+  return stamped
+    ? stamped
+    : `${agentIdPrefixForSwarmRole(sandboxSwarmRole(sandbox))}-${sandbox.sandboxID}`;
+}
+/**
+ * Public URL of a swarm's API sandbox. The port comes from `metadata.apiPort`,
+ * or `DEFAULT_API_PORT` when that is missing or empty; URL construction is
+ * delegated to `sandboxPortUrl`.
+ *
+ * NOTE(review): per the note carried with this code, `sandboxPortUrl` prefers
+ * the sandbox's own `domain` over the controller's E2B_DOMAIN/E2B_SANDBOX_URL —
+ * confirm against that helper.
+ */
+function swarmApiUrl(apiSandbox: E2BSandboxInfo, controllerEnv: EnvMap): string {
+  const rawPort = apiSandbox.metadata?.apiPort || String(DEFAULT_API_PORT);
+  const port = Number.parseInt(rawPort, 10);
+  return sandboxPortUrl(apiSandbox, port, controllerEnv);
+}
+/**
+ * Summarise a group as per-role counts in the fixed order api, lead, worker,
+ * omitting roles with no members — e.g. "1 api, 1 lead, 2 worker". An empty
+ * group yields an empty string.
+ */
+function roleCountSummary(sandboxes: E2BSandboxInfo[]): string {
+  // Seeding the map fixes the output order regardless of input order.
+  const tally = new Map<MetadataSwarmRole, number>([
+    ["api", 0],
+    ["lead", 0],
+    ["worker", 0],
+  ]);
+  for (const sandbox of sandboxes) {
+    const role = sandboxSwarmRole(sandbox);
+    tally.set(role, (tally.get(role) ?? 0) + 1);
+  }
+  const pieces: string[] = [];
+  tally.forEach((total, role) => {
+    if (total > 0) pieces.push(`${total} ${role}`);
+  });
+  return pieces.join(", ");
+}
+/**
+ * Describe when a group expires, using the smallest remaining TTL among its
+ * sandboxes. Sandboxes without a known TTL are ignored; if none has one the
+ * result is "ttl unknown".
+ */
+function groupTtlSummary(sandboxes: E2BSandboxInfo[]): string {
+  const soonest = sandboxes.reduce<number | undefined>((lowest, sandbox) => {
+    const remaining = ttlRemaining(sandbox).secondsLeft;
+    if (remaining === undefined) return lowest;
+    return lowest === undefined || remaining < lowest ? remaining : lowest;
+  }, undefined);
+  if (soonest === undefined) return "ttl unknown";
+  return `expires in ${formatDuration(soonest)}`;
+}
+/**
+ * Probe `GET <apiUrl>/health` once, unauthenticated, and never throw.
+ *
+ * The request is aborted after `timeoutMs` so an API that accepts the
+ * connection but never answers cannot hang the caller.
+ *
+ * @param apiUrl Base URL of the API; trailing slashes are stripped.
+ * @param timeoutMs Upper bound for the whole request, in milliseconds.
+ * @returns `up` mirrors `response.ok`; `detail` is the HTTP status line, or the
+ *   error message when the request failed or timed out.
+ */
+async function probeHealth(
+  apiUrl: string,
+  timeoutMs = 5000,
+): Promise<{ up: boolean; detail: string }> {
+  try {
+    const response = await fetch(`${apiUrl.replace(/\/+$/, "")}/health`, {
+      signal: AbortSignal.timeout(timeoutMs),
+    });
+    return { up: response.ok, detail: `${response.status} ${response.statusText}`.trim() };
+  } catch (err) {
+    // Network failure or timeout: report as "down" with the reason.
+    return { up: false, detail: err instanceof Error ? err.message : String(err) };
+  }
+}
+/**
+ * `e2b swarms list [--json]` — list sandboxes grouped by swarm slug.
+ *
+ * With `--json` a redacted array of `{swarm, count, roles, sandboxIDs}` is
+ * printed (an empty array when nothing is running). Otherwise one tab-separated
+ * line per group is printed — slug, sandbox count, role counts, soonest expiry —
+ * or "no swarms found" when there are no groups.
+ */
+async function swarmsListCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  const groups = groupSandboxesBySwarm(await listSandboxes(controllerApiKey, apiBase));
+  if (booleanFlag(flags, "json")) {
+    const payload = Array.from(groups, ([slug, members]) => ({
+      swarm: slug,
+      count: members.length,
+      roles: roleCountSummary(members),
+      sandboxIDs: members.map((member) => member.sandboxID),
+    }));
+    console.log(JSON.stringify(redactObjectWithEnv(payload, controllerEnv), null, 2));
+    return;
+  }
+  if (groups.size === 0) {
+    console.log("no swarms found");
+    return;
+  }
+  groups.forEach((members, slug) => {
+    const columns = [
+      slug,
+      `${members.length} sandbox(es)`,
+      roleCountSummary(members),
+      groupTtlSummary(members),
+    ];
+    console.log(columns.join("\t"));
+  });
+}
+/**
+ * Pick the sandboxes that belong to swarm `slug` AND were launched by this
+ * dispatcher (`metadata.launcher === "agent-swarm-e2b"`).
+ *
+ * The launcher check is an ownership guard, the same one `kill --all` applies:
+ * a foreign sandbox that merely happens to carry a matching `metadata.swarm`
+ * value is excluded, so slug-based commands cannot act on it. No I/O, which
+ * keeps the guarantee unit-testable. Input order is preserved.
+ */
+export function swarmGroupMembers(sandboxes: E2BSandboxInfo[], slug: string): E2BSandboxInfo[] {
+  const owned: E2BSandboxInfo[] = [];
+  for (const sandbox of sandboxes) {
+    const meta = sandbox.metadata;
+    if (meta?.swarm !== slug) continue;
+    if (meta?.launcher !== "agent-swarm-e2b") continue;
+    owned.push(sandbox);
+  }
+  return owned;
+}
+/**
+ * Load the controller env, list sandboxes, and return the dispatcher-owned
+ * members of swarm `slug` together with the env and API base used to find them.
+ *
+ * @throws Error when no owned sandbox carries that slug.
+ */
+async function resolveSwarmGroup(
+  flags: ParsedFlags,
+  cwd: string,
+  slug: string,
+): Promise<{ members: E2BSandboxInfo[]; controllerEnv: EnvMap; apiBase: string }> {
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  const members = swarmGroupMembers(await listSandboxes(controllerApiKey, apiBase), slug);
+  if (members.length > 0) {
+    return { members, controllerEnv, apiBase };
+  }
+  throw new Error(`no swarm found with slug "${slug}" (try: e2b swarms list)`);
+}
+/**
+ * `e2b swarms info <slug> [--api-key <key>] [--reveal-key]` — print a summary
+ * of one swarm.
+ *
+ * Output, in order: slug, sandbox and role counts, API URL (if the group has an
+ * API sandbox), the masked swarm key with its source, one line per sandbox
+ * (api, lead, then workers) with remaining TTL, the health probe result, and
+ * the dashboard deep-link. Failure to resolve the swarm key is not fatal: the
+ * key is shown as unresolved and the authenticated probe is skipped.
+ *
+ * @throws Error when the slug is missing or no owned sandbox carries it.
+ */
+async function swarmsInfoCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  const slug = flags.positionals[1];
+  if (!slug) throw new Error("swarms info requires a slug: e2b swarms info <slug>");
+  const { members, controllerEnv } = await resolveSwarmGroup(flags, cwd, slug);
+  // `find` keeps only the first api / lead member; every worker is kept.
+  const api = members.find((m) => sandboxSwarmRole(m) === "api");
+  const lead = members.find((m) => sandboxSwarmRole(m) === "lead");
+  const workers = members.filter((m) => sandboxSwarmRole(m) === "worker");
+  // Re-resolve the swarm API key LOCALLY (never from the sandbox) so we can build
+  // the deep-link / authed probe. Source is reported; the value is masked.
+  const runtime: EnvMap = selectEnv(process.env, [...DEFAULT_E2B_FORWARD_KEYS]);
+  let resolvedKey = "";
+  let keySource: string;
+  try {
+    resolvedKey = resolveSwarmApiKey(runtime, value(flags, "api-key"));
+    keySource = swarmApiKeySource(flags, runtime);
+  } catch {
+    keySource = "unresolved (set AGENT_SWARM_API_KEY / API_KEY or pass --api-key)";
+  }
+  const apiUrl = api ? swarmApiUrl(api, controllerEnv) : undefined;
+  console.log(`swarm: ${slug}`);
+  console.log(`sandboxes: ${members.length} (${roleCountSummary(members)})`);
+  if (apiUrl) console.log(`api url: ${apiUrl}`);
+  console.log(`api key: ${maskKey(resolvedKey)} (${keySource})`);
+  // Per-sandbox lines, grouped API → lead → workers (resolved by swarmRole), each
+  // with its agent ID (lead/workers) and remaining TTL.
+  const ttlText = (member: E2BSandboxInfo): string => {
+    const { secondsLeft } = ttlRemaining(member);
+    return secondsLeft !== undefined ? `expires in ${formatDuration(secondsLeft)}` : "ttl unknown";
+  };
+  if (api) console.log(`  api    ${api.sandboxID}  ${ttlText(api)}`);
+  if (lead) {
+    console.log(`  lead   ${lead.sandboxID}  ${sandboxAgentId(lead)}  ${ttlText(lead)}`);
+  }
+  for (const worker of workers) {
+    console.log(`  worker ${worker.sandboxID}  ${sandboxAgentId(worker)}  ${ttlText(worker)}`);
+  }
+  // Single-shot unauthenticated health probe.
+  if (apiUrl) {
+    const health = await probeHealth(apiUrl);
+    console.log(`health: ${health.up ? "up" : "down"} (${health.detail})`);
+    // If the key resolved, do one authenticated probe to detect a key mismatch.
+    if (resolvedKey) {
+      try {
+        const authed = await fetch(`${apiUrl.replace(/\/+$/, "")}/api/agents`, {
+          headers: { Authorization: `Bearer ${resolvedKey}` },
+        });
+        // Only a 401 is reported; any other status is ignored here.
+        if (authed.status === 401) {
+          console.warn(
+            "warning: authenticated probe returned 401 — the resolved key may not match the launch key.",
+          );
+        }
+      } catch {
+        // A network error on the authed probe is non-fatal; the unauth health
+        // probe above already reported reachability.
+      }
+    }
+  }
+  // Dashboard deep-link (masked by default; --reveal-key embeds the key raw).
+  printDashboardDeepLink(flags, {
+    apiUrl,
+    apiKey: resolvedKey || undefined,
+    name: slug,
+    env: controllerEnv,
+  });
+}
+/**
+ * `e2b swarms kill <slug>` / `e2b swarms kill --all` — tear down one swarm, or
+ * every swarm this dispatcher launched.
+ *
+ * Within each swarm the API sandbox is killed last so the lead and workers
+ * never lose their API mid-teardown. The operator must confirm (or pass
+ * `--yes`) before anything is killed. Kills run sequentially; the first failure
+ * propagates and stops the sweep.
+ *
+ * @throws Error when neither a slug nor `--all` is given, or the slug matches
+ *   no owned sandbox.
+ */
+async function swarmsKillCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  const killEverything = booleanFlag(flags, "all");
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  // Partition instead of sort: non-API members first, API members last, each
+  // side keeping its listed order.
+  const apiLast = (members: E2BSandboxInfo[]): E2BSandboxInfo[] => {
+    const isApi = (member: E2BSandboxInfo): boolean => sandboxSwarmRole(member) === "api";
+    return [...members.filter((member) => !isApi(member)), ...members.filter(isApi)];
+  };
+  let targets: E2BSandboxInfo[];
+  let label: string;
+  if (!killEverything) {
+    const slug = flags.positionals[1];
+    if (!slug) throw new Error("swarms kill requires a slug (or --all): e2b swarms kill <slug>");
+    const group = await resolveSwarmGroup(flags, cwd, slug);
+    targets = apiLast(group.members);
+    label = `swarm "${slug}" (${targets.length} sandboxes)`;
+  } else {
+    const listed = await listSandboxes(controllerApiKey, apiBase);
+    const launched = listed.filter((s) => s.metadata?.launcher === "agent-swarm-e2b");
+    if (launched.length === 0) {
+      console.log("no agent-swarm swarms to kill");
+      return;
+    }
+    // Each swarm is ordered API-last on its own, then the swarms are chained.
+    const bySwarm = groupSandboxesBySwarm(launched);
+    targets = [];
+    for (const members of bySwarm.values()) {
+      targets.push(...apiLast(members));
+    }
+    label = `all ${bySwarm.size} swarm(s) (${targets.length} sandboxes)`;
+  }
+  const approved = await confirm(`Kill ${label}?`, flags);
+  if (!approved) {
+    console.log("aborted (pass --yes to skip this prompt)");
+    return;
+  }
+  for (const target of targets) {
+    await killSandbox(target.sandboxID, controllerApiKey, apiBase);
+    console.log(`killed ${target.sandboxID} (${sandboxSwarmRole(target)})`);
+  }
+}
+/**
+ * `e2b swarms add [<slug>] [--add-lead] [--workers <n>]` — launch extra members
+ * into an existing swarm and point them at its API.
+ *
+ * Without a slug, an interactive picker is shown on a TTY; off a TTY the slug
+ * is required. `--workers` defaults to 1, or to 0 when `--add-lead` is given.
+ * If any launch fails, the members started by this call are cleaned up and the
+ * error is rethrown. New members are then re-synced (best-effort, skipped under
+ * `--dry-run`) to the shortest remaining TTL in the group.
+ *
+ * @throws Error when no slug is available off a TTY, the swarm is not found, or
+ *   the swarm has no API sandbox.
+ */
+async function swarmsAddCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  let slug = flags.positionals[1];
+  // No slug on a TTY → offer a picker of existing swarms.
+  if (!slug) {
+    if (!isInteractiveTty()) {
+      throw new Error("swarms add requires a slug: e2b swarms add <slug>");
+    }
+    slug = await pickSwarmSlug(flags, cwd);
+    if (!slug) {
+      console.log("aborted (no swarm selected)");
+      return;
+    }
+  }
+  const { members, controllerEnv, apiBase } = await resolveSwarmGroup(flags, cwd, slug);
+  const api = members.find((m) => sandboxSwarmRole(m) === "api");
+  if (!api) {
+    throw new Error(`swarm "${slug}" has no API sandbox — cannot add members to it`);
+  }
+  const apiUrl = swarmApiUrl(api, controllerEnv);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  // Stamp the existing slug + point new members at the existing API. The slug
+  // flows into metadata via parseMetadata; MCP_BASE_URL via the apiUrl arg below.
+  setFlagValue(flags, "swarm", slug);
+  // Compute the group's current end so new members re-sync to the SAME wall-clock
+  // expiry (reuse setSandboxTimeout). The shortest remaining TTL is the group's
+  // true end; new members align to that rather than a fresh full TTL.
+  const groupEndSeconds = members
+    .map((m) => ttlRemaining(m).secondsLeft)
+    .filter((s): s is number => s !== undefined);
+  // Stays undefined when no member reports a TTL; the re-sync is then skipped.
+  const resyncSeconds = groupEndSeconds.length > 0 ? Math.min(...groupEndSeconds) : undefined;
+  const addLead = booleanFlag(flags, "add-lead");
+  const workerCount = integerFlag(flags, "workers", addLead ? 0 : 1);
+  const added: StartedRole[] = [];
+  try {
+    if (addLead) {
+      const lead = await startRole(flags, cwd, STACK_LEAD_SPEC, apiUrl);
+      added.push(lead);
+    }
+    for (let i = 0; i < workerCount; i++) {
+      const worker = await startRole(flags, cwd, STACK_WORKER_SPEC, apiUrl);
+      added.push(worker);
+    }
+  } catch (err) {
+    // Roll back only what this call started; existing members are untouched.
+    await cleanupStartedRoles(flags, cwd, added);
+    throw err;
+  }
+  // Re-sync the freshly-added members to the group's current end (best-effort).
+  if (resyncSeconds !== undefined && !booleanFlag(flags, "dry-run")) {
+    for (const role of added) {
+      try {
+        await setSandboxTimeout({
+          sandboxId: role.sandbox.sandboxID,
+          apiKey: controllerApiKey,
+          apiBase,
+          e2bEnv: controllerEnv,
+          timeoutMs: resyncSeconds * 1000,
+        });
+      } catch (err) {
+        // A failed re-sync only warns; the member keeps the TTL it launched with.
+        const message = err instanceof Error ? err.message : String(err);
+        console.warn(
+          redactWithEnv(
+            `e2b: failed to re-sync TTL for added ${role.role} sandbox ${role.sandbox.sandboxID}: ${message}`,
+            controllerEnv,
+          ),
+        );
+      }
+    }
+  }
+  const runtimeEnv = await loadRuntimeEnv(flags, STACK_WORKER_SPEC, apiUrl);
+  if (booleanFlag(flags, "json")) {
+    console.log(
+      JSON.stringify(
+        { swarm: slug, added: added.map((r) => publicStartedRole(r, runtimeEnv)) },
+        null,
+        2,
+      ),
+    );
+  } else {
+    console.log(`added ${added.length} member(s) to swarm ${slug}:`);
+    for (const role of added) {
+      printHumanStart(role, runtimeEnv);
+    }
+  }
+}
+/**
+ * Render a one-shot Ink picker over the swarms this dispatcher launched and
+ * resolve to the chosen slug, or "" if the picker exits without a selection.
+ *
+ * Only sandboxes tagged `metadata.launcher === "agent-swarm-e2b"` are offered.
+ * The slug picked here is handed to `resolveSwarmGroup`, which applies the same
+ * ownership guard via `swarmGroupMembers`; without the filter the picker could
+ * list a foreign sandbox's slug that is then rejected as "no swarm found", and
+ * the role counts in each label could include sandboxes we do not own.
+ *
+ * @throws Error when there is no owned, slug-tagged swarm to pick from.
+ */
+async function pickSwarmSlug(flags: ParsedFlags, cwd: string): Promise<string> {
+  const controllerEnv = await loadE2BControllerEnv(flags, cwd);
+  const apiBase = e2bApiBase(flags, controllerEnv);
+  const sandboxes = await listSandboxes(e2bControllerApiKey(controllerEnv), apiBase);
+  const launched = sandboxes.filter(
+    (sandbox) => sandbox.metadata?.launcher === "agent-swarm-e2b",
+  );
+  const groups = groupSandboxesBySwarm(launched);
+  // Sandboxes without a swarm tag cannot be targeted by slug, so hide that bucket.
+  const slugs = [...groups.keys()].filter((slug) => slug !== UNGROUPED_BUCKET);
+  if (slugs.length === 0) {
+    throw new Error("no existing swarms to add to (create one with e2b start-stack)");
+  }
+  let chosen = "";
+  const instance = render(
+    createElement(SwarmPicker, {
+      slugs: slugs.map((slug) => {
+        const members = groups.get(slug) ?? [];
+        return { slug, label: `${slug} (${roleCountSummary(members)})` };
+      }),
+      onSelect: (slug: string) => {
+        chosen = slug;
+      },
+    }),
+  );
+  await instance.waitUntilExit();
+  return chosen;
+}
+/**
+ * Map a sandbox's grouping role back to the E2B role (api | worker) its
+ * entrypoint runs under: "api" stays "api", while both "lead" and "worker" map
+ * to "worker". Per the note carried with this code, the entrypoint's log path
+ * is keyed by this E2B role, which is why a lead reads the worker log.
+ */
+function sandboxE2BRole(sandbox: E2BSandboxInfo): "api" | "worker" {
+  if (sandboxSwarmRole(sandbox) === "api") {
+    return "api";
+  }
+  return "worker";
+}
+/**
+ * `e2b swarms logs <slug> [--role api|lead|worker] [--follow]` — stream the
+ * entrypoint log of a swarm's sandbox(es).
+ *
+ * Resolution: filter the swarm's members by `--role` (default: `api`, the most
+ * useful single target — it carries the API boot lines + health). Reading the
+ * deterministic per-role tee'd log path means NO PID bookkeeping is needed.
+ *
+ * Output is UNTRUSTED entrypoint stdout that can embed tokens, so every chunk is
+ * routed through `redactWithEnv` (→ scrubSecrets) at this egress point before it
+ * touches the terminal.
+ *
+ * `--tail` sets how many lines of history are requested (default 200). When
+ * several sandboxes match, their logs are printed one after another, each
+ * preceded by a `==> <role> <sandboxID> <==` header.
+ *
+ * @throws Error when the slug is missing, `--role` is not api|lead|worker, the
+ *   swarm has no sandbox of that role, or `--follow` matches more than one.
+ */
+async function swarmsLogsCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  const slug = flags.positionals[1];
+  if (!slug) throw new Error("swarms logs requires a slug: e2b swarms logs <slug>");
+  const roleFlag = value(flags, "role") || "api";
+  if (roleFlag !== "api" && roleFlag !== "lead" && roleFlag !== "worker") {
+    throw new Error("--role must be one of api|lead|worker");
+  }
+  const { members, controllerEnv, apiBase } = await resolveSwarmGroup(flags, cwd, slug);
+  const targets = members.filter((m) => sandboxSwarmRole(m) === roleFlag);
+  if (targets.length === 0) {
+    throw new Error(`swarm "${slug}" has no ${roleFlag} sandbox`);
+  }
+  // Egress redaction set. `controllerEnv` only carries E2B-controller + locally
+  // resolved values, so launch-time secrets supplied via --secret / --env-file /
+  // --inherit-env / a launch-specific --api-key would NOT be redacted unless the
+  // operator re-supplies them here. Resolve runtime env the SAME way the launch
+  // path does (loadRuntimeEnv with API_SPEC handles --env-file/--secret/
+  // --inherit-env/--api-key + scoped flags) so any re-supplied launch secret is
+  // scrubbed. A missing swarm API key must NOT hard-fail `swarms logs` (the start
+  // path tolerates this only under --dry-run), so degrade to controllerEnv-only.
+  let redactionEnv: EnvMap = controllerEnv;
+  try {
+    // Runtime values are spread last, so they win over same-named controller keys.
+    redactionEnv = { ...controllerEnv, ...(await loadRuntimeEnv(flags, API_SPEC)) };
+  } catch {
+    redactionEnv = controllerEnv;
+  }
+  const follow = booleanFlag(flags, "follow");
+  const tailLines = integerFlag(flags, "tail", 200);
+  const controllerApiKey = e2bControllerApiKey(controllerEnv);
+  // Multi-target follow would interleave two live streams ambiguously; restrict
+  // --follow to a single sandbox and point multi-worker users at --role/history.
+  if (follow && targets.length > 1) {
+    throw new Error(
+      `swarm "${slug}" has ${targets.length} ${roleFlag} sandboxes — --follow needs a single target (omit --follow for history, or there is no per-sandbox selector yet)`,
+    );
+  }
+  // SIGINT (Ctrl-C) cleanly stops a --follow stream by aborting the tail.
+  const controller = new AbortController();
+  if (follow) {
+    // Registered with `once` and not removed afterwards.
+    process.once("SIGINT", () => controller.abort());
+  }
+  // Streams are awaited one at a time, so output from different sandboxes never
+  // interleaves.
+  for (const target of targets) {
+    if (targets.length > 1) {
+      console.log(`==> ${roleFlag} ${target.sandboxID} <==`);
+    }
+    await streamSandboxLog({
+      sandboxId: target.sandboxID,
+      role: sandboxE2BRole(target),
+      apiKey: controllerApiKey,
+      apiBase,
+      e2bEnv: controllerEnv,
+      tailLines,
+      follow,
+      signal: follow ? controller.signal : undefined,
+      // Egress scrub: entrypoint output can embed secrets — redact every chunk.
+      // Scrubbed = known token shapes (scrubSecrets) + the controller env + any
+      // launch secrets re-supplied here via --secret/--env-file/--inherit-env/
+      // --api-key (folded into redactionEnv). Residual limitation: an arbitrary
+      // secret known ONLY to a prior launch (never re-supplied, no known shape)
+      // is NOT recoverable here and can stream raw — re-pass it to `swarms logs`
+      // to scrub it, or treat the logs as sensitive.
+      onChunk: (chunk) => process.stdout.write(redactWithEnv(chunk, redactionEnv)),
+    });
+  }
+}
+/**
+ * Dispatch `e2b swarms <subcommand>`. The subcommand is the first positional;
+ * when it is absent, `list` runs.
+ *
+ * @throws Error for any subcommand other than list|info|kill|add|logs.
+ */
+async function swarmsCommand(flags: ParsedFlags, cwd: string): Promise<void> {
+  type Handler = (flags: ParsedFlags, cwd: string) => Promise<void>;
+  // A Map (not an object literal) so inherited names such as "toString" can
+  // never be mistaken for a subcommand.
+  const handlers = new Map<string, Handler>([
+    ["list", swarmsListCommand],
+    ["info", swarmsInfoCommand],
+    ["kill", swarmsKillCommand],
+    ["add", swarmsAddCommand],
+    ["logs", swarmsLogsCommand],
+  ]);
+  const sub = flags.positionals[0];
+  const handler = handlers.get(sub === undefined ? "list" : sub);
+  if (!handler) {
+    throw new Error(`Unknown e2b swarms subcommand: ${sub} (expected list|info|kill|add|logs)`);
+  }
+  await handler(flags, cwd);
+}
 function printE2BHelp(): void {
   console.log(`
 agent-swarm e2b
@@ -662,20 +1897,78 @@ Usage:
   agent-swarm e2b delete-template <template-name...>
   agent-swarm e2b publish-template <template-name...>
   agent-swarm e2b unpublish-template <template-name...>
-  agent-swarm e2b start-api --template <template> [--env-file .env]
-  agent-swarm e2b start-worker --template <template> --api-url <https-url> [--env-file .env]
-  agent-swarm e2b start-stack --api-template <template> --worker-template <template> [--workers 1]
+  agent-swarm e2b start-api [--template <name>] [--env-file .env]
+  agent-swarm e2b start-worker --api-url <https-url> [--template <name>] [--env-file .env]
+  agent-swarm e2b start-stack [--swarm <slug>] [--workers <n>] [--no-lead] [--yes]
   agent-swarm e2b list [--json]
-  agent-swarm e2b kill <sandbox-id...>
+  agent-swarm e2b swarms list | info <slug> | kill <slug> | add <slug> | logs <slug>
+  agent-swarm e2b extend <sandbox-id...> --timeout-sec <seconds>
+  agent-swarm e2b kill <sandbox-id...> | --all
 Common options:
-  --env-file <path>          Load runtime env/secrets for API or worker (repeatable)
-  --secret KEY=VALUE         Add/override one runtime secret (repeatable)
+  --env-file <path>          Load runtime env/secrets for all roles (repeatable)
+  --secret KEY=VALUE         Add/override one runtime secret for all roles (repeatable)
   --inherit-env KEY[,KEY]    Forward extra local env vars into the sandbox
-  --api-key <key>            Swarm API key passed to API/worker (required unless env provides one)
+  --api-key <key>            Swarm API key for API/worker (required unless env provides one)
+  --api-url <https-url>      Public API URL a worker connects to (start-worker)
   --agent-id <id>            Worker agent ID (default: e2b-<sandbox-id>)
-  --timeout-sec <seconds>    Sandbox TTL (default 3600)
+  --agent-role worker|lead   Role for start-worker (ignored by start-stack)
+  --provider <name>          Harness provider for workers (default claude)
+  --template <name>          Override the E2B template for the role
+  --api-template / --worker-template <name>   Per-role E2B template overrides
+  --timeout-sec <seconds>    Sandbox TTL (default 3600); for extend, the new TTL from now
+  --no-wait                  Skip waiting for API health / worker registration
   --e2b-api-key-file <path>  Read the E2B controller API key from a file
+start-stack (API + lead + N workers):
+  Provisions an API, one lead, and N workers. Interactive wizard on a TTY;
+  headless under --yes / --non-interactive / --dry-run / a non-TTY.
+  --swarm <slug>             Swarm name/slug (used for the wizard + echoed command)
+  --workers <n>              Worker count (default 1)
+  --no-lead                  Legacy topology: API + N workers, no lead
+  --lead-agent-id <id>       Lead agent ID (default: e2b-lead-<sandbox-id>)
+  --yes                      Skip the wizard; use flags + defaults (CI/headless)
+  --non-interactive          Same as --yes for prompting (never reads stdin)
+  --integrations <csv>       Allowlist of integrations to keep on (slack,github,jira,linear)
+  --no-slack / --no-github / --no-jira / --no-linear
+                             Disable an integration (sets the API's <NAME>_DISABLE=true)
+  JSON shape: {api, lead, workers:[...]} — or {api, workers:[...]} with --no-lead.
+Role-scoped env (layer ON TOP of the shared --env-file/--secret, never replace):
+  --api-env-file <path>      Env file applied only to the API sandbox (repeatable)
+  --lead-env-file <path>     Env file applied only to the lead sandbox (repeatable)
+  --worker-env-file <path>   Env file applied only to worker sandboxes (repeatable)
+  --api-secret KEY=VALUE     Secret applied only to the API sandbox (repeatable)
+  --lead-secret KEY=VALUE    Secret applied only to the lead sandbox (repeatable)
+  --worker-secret KEY=VALUE  Secret applied only to worker sandboxes (repeatable)
+  Precedence (highest wins): forward-keys < --env-file < --<scope>-env-file
+    < --secret < --<scope>-secret < forced API_KEY/AGENT_SWARM_API_KEY.
+swarms (group by metadata.swarm slug):
+  list                       Group sandboxes by swarm (ungrouped → "(ungrouped)")
+  info <slug>                API URL, key source (masked), roles, per-sandbox TTL,
+                             a one-shot /health probe, and the dashboard deep-link
+  kill <slug> | --all        Tear down a swarm (API last) or every swarm (--all)
+  add <slug>                 Add worker(s)/--add-lead to an existing swarm, TTL
+                             re-synced to the group's current end. No slug on a
+                             TTY → swarm picker. --workers <n> sets the count.
+  logs <slug>                Stream a sandbox's entrypoint log (envd-tracked +
+                             tee'd to file). --role api|lead|worker (default api),
+                             --follow to tail live, --tail <n> history lines
+                             (default 200). Output is scrubbed for secrets.
+  --reveal-key               Embed the swarm API key in the dashboard deep-link
+                             (printed RAW — the URL is a secret; hidden otherwise)
+extend:
+  Extend (or reduce) a live sandbox's TTL. E2B clamps to your tier max, so the
+  printed expiry reflects what was actually applied. --dry-run never contacts E2B.
+kill:
+  --all                      Kill every sandbox launched by this dispatcher
+                             (metadata.launcher === agent-swarm-e2b)
+  --yes                      Skip the multi-sandbox confirmation prompt (required in CI)
+Global:
   --json                     Print machine-readable output
   --dry-run                  Print/derive planned work without touching E2B
 `);
@@ -714,6 +2007,12 @@ export async function runE2BCommand(argv: string[]): Promise<void> {
       case "list":
         await listCommand(flags, cwd);
         return;
+      case "swarms":
+        await swarmsCommand(flags, cwd);
+        return;
+      case "extend":
+        await extendCommand(flags, cwd);
+        return;
       case "kill":
         await killCommand(flags, cwd);
         return;