npm - @desplega.ai/agent-swarm - Versions diffs - 1.87.0 → 1.88.0 - Mend

@desplega.ai/agent-swarm 1.87.0 → 1.88.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59)

package/README.md +2 -1
package/openapi.json +13 -1
package/package.json +5 -5
package/src/be/db.ts +49 -7
package/src/be/migrations/080_skill_system_defaults.sql +8 -0
package/src/be/modelsdev-cache.json +1123 -1034
package/src/be/seed/registry.ts +3 -2
package/src/be/seed-skills/index.ts +172 -0
package/src/cli.tsx +33 -4
package/src/commands/e2b-stack-wizard.tsx +394 -0
package/src/commands/e2b.ts +1352 -53
package/src/commands/onboard/dashboard-url.ts +29 -0
package/src/commands/onboard/steps/post-dashboard.tsx +3 -1
package/src/commands/onboard.tsx +3 -1
package/src/commands/runner.ts +1 -0
package/src/e2b/dispatch.ts +234 -18
package/src/http/memory.ts +13 -1
package/src/http/skills.ts +53 -0
package/src/http/webhooks.ts +75 -0
package/src/integrations/kapso/client.ts +82 -0
package/src/memory/automatic-task-gate.ts +47 -0
package/src/prompts/base-prompt.ts +16 -1
package/src/prompts/session-templates.ts +51 -0
package/src/providers/claude-adapter.ts +19 -0
package/src/providers/codex-adapter.ts +22 -0
package/src/providers/ctx-mode-env.ts +10 -0
package/src/providers/opencode-adapter.ts +50 -1
package/src/slack/blocks.ts +12 -4
package/src/slack/watcher.ts +3 -3
package/src/telemetry.ts +14 -1
package/src/templates.d.ts +4 -0
package/src/tests/base-prompt.test.ts +41 -0
package/src/tests/claude-adapter.test.ts +86 -1
package/src/tests/codex-adapter.test.ts +89 -0
package/src/tests/e2b-dispatch.test.ts +603 -11
package/src/tests/http-api-integration.test.ts +113 -0
package/src/tests/kapso-client.test.ts +74 -1
package/src/tests/kapso-inbound.test.ts +60 -2
package/src/tests/opencode-adapter.test.ts +95 -0
package/src/tests/prompt-template-session.test.ts +4 -2
package/src/tests/self-improvement.test.ts +89 -0
package/src/tests/skill-update-scope.test.ts +88 -1
package/src/tests/slack-blocks.test.ts +15 -0
package/src/tests/system-default-skills.test.ts +119 -0
package/src/tests/telemetry-init.test.ts +86 -0
package/src/tools/skills/skill-delete.ts +14 -0
package/src/tools/skills/skill-update.ts +14 -0
package/src/tools/store-progress.ts +19 -5
package/src/types.ts +1 -0
package/templates/skills/artifacts/config.json +1 -0
package/templates/skills/kv-storage/config.json +1 -0
package/templates/skills/pages/config.json +1 -0
package/templates/skills/scheduled-task-resilience/config.json +1 -0
package/templates/skills/swarm-scripts/SKILL.md +91 -0
package/templates/skills/swarm-scripts/config.json +14 -0
package/templates/skills/swarm-scripts/content.md +86 -0
package/templates/skills/workflow-iterate/config.json +1 -0
package/templates/skills/workflow-structured-output/config.json +1 -0
package/tsconfig.json +2 -1

package/src/tests/e2b-dispatch.test.ts CHANGED

@@ -1,13 +1,28 @@
-import { describe, expect, test } from "bun:test";
+import { afterEach, beforeEach, describe, expect, test } from "bun:test";
+import { mkdtempSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import {
+  buildDashboardDeepLink,
+  type LaunchSpec,
+  loadRuntimeEnv,
+  parseFlags,
+  resolveIntegrationToggles,
+  runE2BCommand,
+  swarmGroupMembers,
+} from "../commands/e2b";
+import { buildOnboardDashboardUrl } from "../commands/onboard/dashboard-url";
 import {
-  buildDetachedShell,
   buildImageTemplate,
   buildTemplateArgs,
+  buildTrackedShell,
   deleteTemplate,
   type E2BSandboxInfo,
   e2bSdkConnectionOptions,
+  sandboxLogPath,
   sandboxPortHost,
   setTemplateVisibility,
+  ttlRemaining,
   waitForAgentRegistration,
 } from "../e2b/dispatch";
 import {
@@ -144,16 +159,74 @@ describe("E2B dispatch helpers", () => {
     ).toBe("3013-sbx123.sandboxes.internal:8443");
   });
-  test("buildDetachedShell backgrounds command and captures pid without invalid shell chaining", () => {
-    const shell = buildDetachedShell("/api-entrypoint.sh", "/tmp/api.log", "/tmp/api.pid");
+  test("ttlRemaining reads authoritative endAt when present", () => {
+    const expiresAt = new Date(Date.now() + 1800 * 1000).toISOString();
+    const sandbox: E2BSandboxInfo = {
+      sandboxID: "sbx123",
+      templateID: "tpl",
+      endAt: expiresAt,
+    };
+    const ttl = ttlRemaining(sandbox);
+    expect(ttl.expiresAt).toBe(expiresAt);
+    // ~1800s remaining; allow a small window for wall-clock drift during the test.
+    expect(ttl.secondsLeft).toBeGreaterThan(1790);
+    expect(ttl.secondsLeft).toBeLessThanOrEqual(1800);
+  });
+  test("ttlRemaining falls back to client-side expiresAt and prefers endAt over it", () => {
+    const fallback = new Date(Date.now() + 600 * 1000).toISOString();
+    const fallbackOnly: E2BSandboxInfo = {
+      sandboxID: "sbx456",
+      templateID: "tpl",
+      expiresAt: fallback,
+    };
+    const fallbackTtl = ttlRemaining(fallbackOnly);
+    expect(fallbackTtl.expiresAt).toBe(fallback);
+    expect(fallbackTtl.secondsLeft).toBeGreaterThan(590);
+    expect(fallbackTtl.secondsLeft).toBeLessThanOrEqual(600);
+    // endAt is authoritative and wins over the client-side fallback.
+    const authoritative = new Date(Date.now() + 3600 * 1000).toISOString();
+    const both = ttlRemaining({ ...fallbackOnly, endAt: authoritative });
+    expect(both.expiresAt).toBe(authoritative);
+    expect(both.secondsLeft).toBeGreaterThan(3590);
+  });
+  test("ttlRemaining returns empty for absent endAt/expiresAt and clamps expired to zero", () => {
+    expect(ttlRemaining({ sandboxID: "none", templateID: "tpl" })).toEqual({});
+    const expired = ttlRemaining({
+      sandboxID: "old",
+      templateID: "tpl",
+      endAt: new Date(Date.now() - 60 * 1000).toISOString(),
+    });
+    expect(expired.secondsLeft).toBe(0);
+  });
+  test("buildTrackedShell pipes the entrypoint through tee to the log path (Phase 5)", () => {
+    const logPath = sandboxLogPath("api");
+    const shell = buildTrackedShell("/api-entrypoint.sh", logPath);
+    // Phase 5: the entrypoint runs as the SDK BACKGROUND command itself (envd
+    // owns/streams it), no longer a detached `nohup … &` grandchild.
+    expect(logPath).toBe("/tmp/agent-swarm-e2b-api.log");
+    expect(shell).toBe(
+      "set -o pipefail; /api-entrypoint.sh 2>&1 | tee /tmp/agent-swarm-e2b-api.log",
+    );
+    // Must tee to the deterministic file so `swarms logs` can read full history.
+    expect(shell).toContain(`tee ${logPath}`);
+    // pipefail makes the pipeline exit reflect the entrypoint (not tee) for the
+    // early-failure poll in startDetachedProcess.
+    expect(shell).toContain("set -o pipefail");
+    // The old detach primitives are gone.
+    expect(shell).not.toContain("nohup");
+    expect(shell).not.toContain("kill -0");
+    expect(shell).not.toContain("sleep 2");
+  });
-    expect(shell).toContain("nohup /api-entrypoint.sh >/tmp/api.log 2>&1 </dev/null & pid=$!");
-    expect(shell).toContain("sleep 2");
-    expect(shell).toContain('kill -0 "$pid"');
-    expect(shell).toContain("cat /tmp/api.log >&2");
-    expect(shell).toContain("pid=$!");
-    expect(shell).not.toContain("&;");
-    expect(shell).not.toContain("& &&");
+  test("sandboxLogPath is deterministic per E2B role", () => {
+    expect(sandboxLogPath("api")).toBe("/tmp/agent-swarm-e2b-api.log");
+    expect(sandboxLogPath("worker")).toBe("/tmp/agent-swarm-e2b-worker.log");
   });
   test("E2B SDK connection options preserve loaded controller endpoints", () => {
@@ -328,3 +401,522 @@ describe("E2B dispatch helpers", () => {
     });
   });
 });
+describe("E2B namespaced env scoping", () => {
+  const API_SPEC: LaunchSpec = { swarmRole: "api", envScope: "api" };
+  const LEAD_SPEC: LaunchSpec = { swarmRole: "worker", agentRole: "lead", envScope: "lead" };
+  const WORKER_SPEC: LaunchSpec = { swarmRole: "worker", agentRole: "worker", envScope: "worker" };
+  // A dummy MCP base URL — loadRuntimeEnv requires one for non-api roles.
+  const API_URL = "https://api.example.com";
+  // Phase 2 layering is precedence-only; --dry-run keeps the swarm-API-key
+  // resolution from throwing without touching E2B. We snapshot/restore the
+  // forward-key env vars so ambient values can't leak into the assertions.
+  const previous: Record<string, string | undefined> = {};
+  beforeEach(() => {
+    for (const key of ["AGENT_SWARM_API_KEY", "API_KEY", "HARNESS_PROVIDER"]) {
+      previous[key] = process.env[key];
+      delete process.env[key];
+    }
+  });
+  afterEach(() => {
+    for (const [key, value] of Object.entries(previous)) {
+      if (value === undefined) delete process.env[key];
+      else process.env[key] = value;
+    }
+  });
+  async function resolveAllScopes(argv: string[]) {
+    const flags = parseFlags(["start-stack", ...argv, "--dry-run"]);
+    const [api, lead, worker] = await Promise.all([
+      loadRuntimeEnv(flags, API_SPEC),
+      loadRuntimeEnv(flags, LEAD_SPEC, API_URL),
+      loadRuntimeEnv(flags, WORKER_SPEC, API_URL),
+    ]);
+    return { api, lead, worker };
+  }
+  test("--worker-secret lands only in the worker scope", async () => {
+    const { api, lead, worker } = await resolveAllScopes(["--worker-secret", "FOO=x"]);
+    expect(worker.FOO).toBe("x");
+    expect(lead.FOO).toBeUndefined();
+    expect(api.FOO).toBeUndefined();
+  });
+  test("--lead-secret lands only in the lead scope", async () => {
+    const { api, lead, worker } = await resolveAllScopes(["--lead-secret", "K=v"]);
+    expect(lead.K).toBe("v");
+    expect(worker.K).toBeUndefined();
+    expect(api.K).toBeUndefined();
+  });
+  test("--api-secret lands only in the api scope", async () => {
+    const { api, lead, worker } = await resolveAllScopes(["--api-secret", "ZED=q"]);
+    expect(api.ZED).toBe("q");
+    expect(lead.ZED).toBeUndefined();
+    expect(worker.ZED).toBeUndefined();
+  });
+  test("shared --secret applies to all three scopes", async () => {
+    const { api, lead, worker } = await resolveAllScopes(["--secret", "BAR=y"]);
+    expect(api.BAR).toBe("y");
+    expect(lead.BAR).toBe("y");
+    expect(worker.BAR).toBe("y");
+  });
+  test("scoped --secret layers on top of the shared --secret without replacing it", async () => {
+    // Shared sets SHARED + OVERRIDE; worker scope overrides OVERRIDE and adds
+    // WORKER_ONLY. The shared value must survive in the non-overridden scopes.
+    const { api, lead, worker } = await resolveAllScopes([
+      "--secret",
+      "SHARED=shared",
+      "--secret",
+      "OVERRIDE=shared-val",
+      "--worker-secret",
+      "OVERRIDE=worker-val",
+      "--worker-secret",
+      "WORKER_ONLY=w",
+    ]);
+    expect(api.SHARED).toBe("shared");
+    expect(lead.SHARED).toBe("shared");
+    expect(worker.SHARED).toBe("shared");
+    expect(worker.OVERRIDE).toBe("worker-val");
+    expect(lead.OVERRIDE).toBe("shared-val");
+    expect(api.OVERRIDE).toBe("shared-val");
+    expect(worker.WORKER_ONLY).toBe("w");
+    expect(lead.WORKER_ONLY).toBeUndefined();
+    expect(api.WORKER_ONLY).toBeUndefined();
+  });
+  test("scoped --{scope}-env-file layers over the shared --env-file", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "e2b-env-scope-"));
+    const sharedFile = join(dir, "shared.env");
+    const workerFile = join(dir, "worker.env");
+    writeFileSync(sharedFile, "SHARED_FILE=base\nFROM_SHARED=keep\n");
+    writeFileSync(workerFile, "SHARED_FILE=override\nWORKER_FILE_ONLY=w\n");
+    const { api, lead, worker } = await resolveAllScopes([
+      "--env-file",
+      sharedFile,
+      "--worker-env-file",
+      workerFile,
+    ]);
+    // Shared file is visible everywhere.
+    expect(api.FROM_SHARED).toBe("keep");
+    expect(lead.FROM_SHARED).toBe("keep");
+    expect(worker.FROM_SHARED).toBe("keep");
+    // Worker-scoped file overrides the shared value only in the worker scope.
+    expect(worker.SHARED_FILE).toBe("override");
+    expect(lead.SHARED_FILE).toBe("base");
+    expect(api.SHARED_FILE).toBe("base");
+    // Worker-only key never bleeds into the other scopes.
+    expect(worker.WORKER_FILE_ONLY).toBe("w");
+    expect(lead.WORKER_FILE_ONLY).toBeUndefined();
+    expect(api.WORKER_FILE_ONLY).toBeUndefined();
+  });
+  test("scoped --secret wins over both shared and scoped env-files (precedence order)", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "e2b-env-prec-"));
+    const sharedFile = join(dir, "shared.env");
+    const workerFile = join(dir, "worker.env");
+    writeFileSync(sharedFile, "PREC=from-shared-file\n");
+    writeFileSync(workerFile, "PREC=from-worker-file\n");
+    const { worker } = await resolveAllScopes([
+      "--env-file",
+      sharedFile,
+      "--worker-env-file",
+      workerFile,
+      "--secret",
+      "PREC=from-shared-secret",
+      "--worker-secret",
+      "PREC=from-worker-secret",
+    ]);
+    // Highest-precedence non-forced layer wins.
+    expect(worker.PREC).toBe("from-worker-secret");
+  });
+  test("AGENT_ROLE comes from the spec; lead spec yields AGENT_ROLE=lead", async () => {
+    const { lead, worker } = await resolveAllScopes([]);
+    expect(lead.AGENT_ROLE).toBe("lead");
+    expect(worker.AGENT_ROLE).toBe("worker");
+  });
+  test("worker spec without an agentRole falls back to the global --agent-role", async () => {
+    // start-worker stays identical: WORKER_SPEC carries agentRole:"worker" only
+    // in start-stack; the legacy path uses a spec with no agentRole and relies
+    // on --agent-role. Mirror that here with an agentRole-less worker spec.
+    const flags = parseFlags(["start-worker", "--agent-role", "lead", "--dry-run"]);
+    const legacyWorkerSpec: LaunchSpec = { swarmRole: "worker", envScope: "worker" };
+    const env = await loadRuntimeEnv(flags, legacyWorkerSpec, API_URL);
+    expect(env.AGENT_ROLE).toBe("lead");
+  });
+  test("forced API_KEY/AGENT_SWARM_API_KEY win over a user --secret API_KEY", async () => {
+    // A user must not be able to break swarm auth by overriding API_KEY via a
+    // scoped or shared secret — the forced resolution always applies last.
+    const flags = parseFlags([
+      "start-api",
+      "--api-key",
+      "forced-key",
+      "--secret",
+      "API_KEY=attacker",
+      "--dry-run",
+    ]);
+    const env = await loadRuntimeEnv(flags, API_SPEC);
+    expect(env.API_KEY).toBe("forced-key");
+    expect(env.AGENT_SWARM_API_KEY).toBe("forced-key");
+  });
+});
+describe("E2B start-stack topology (Phase 3)", () => {
+  const previous: Record<string, string | undefined> = {};
+  beforeEach(() => {
+    for (const key of ["AGENT_SWARM_API_KEY", "API_KEY", "HARNESS_PROVIDER"]) {
+      previous[key] = process.env[key];
+      delete process.env[key];
+    }
+  });
+  afterEach(() => {
+    for (const [key, value] of Object.entries(previous)) {
+      if (value === undefined) delete process.env[key];
+      else process.env[key] = value;
+    }
+  });
+  /** Run `e2b <argv>` capturing stdout, then parse the JSON it printed. */
+  async function runStackJson(argv: string[]): Promise<Record<string, unknown>> {
+    const originalLog = console.log;
+    const lines: string[] = [];
+    console.log = (...args: unknown[]) => {
+      lines.push(args.map(String).join(" "));
+    };
+    const previousExitCode = process.exitCode;
+    try {
+      await runE2BCommand(argv);
+    } finally {
+      console.log = originalLog;
+    }
+    // A clean dry-run must not set a failure exit code.
+    expect(process.exitCode ?? 0).toBe(previousExitCode ?? 0);
+    // Phase 4 prepends a "swarm: <slug>" echo before the JSON; parse from the
+    // first line that opens the JSON object so the preamble is skipped.
+    const jsonStart = lines.findIndex((l) => l.trim().startsWith("{"));
+    return JSON.parse(lines.slice(Math.max(jsonStart, 0)).join("\n")) as Record<string, unknown>;
+  }
+  test("dry-run stack provisions api + lead + N workers", async () => {
+    const payload = await runStackJson([
+      "start-stack",
+      "--dry-run",
+      "--yes",
+      "--workers",
+      "2",
+      "--swarm",
+      "test",
+      "--json",
+    ]);
+    expect(payload.api).toBeDefined();
+    expect(payload.lead).toBeDefined();
+    expect(Array.isArray(payload.workers)).toBe(true);
+    expect((payload.workers as unknown[]).length).toBe(2);
+    // The lead is E2B SwarmRole "worker" with AGENT_ROLE lead.
+    expect((payload.lead as { role: string }).role).toBe("worker");
+    expect((payload.api as { role: string }).role).toBe("api");
+  });
+  test("--no-lead keeps the legacy api + workers topology (no lead key)", async () => {
+    const payload = await runStackJson([
+      "start-stack",
+      "--dry-run",
+      "--yes",
+      "--no-lead",
+      "--workers",
+      "2",
+      "--swarm",
+      "test",
+      "--json",
+    ]);
+    expect(payload.api).toBeDefined();
+    expect(payload.lead).toBeUndefined();
+    expect(Array.isArray(payload.workers)).toBe(true);
+    expect((payload.workers as unknown[]).length).toBe(2);
+  });
+  test("rejects a shared explicit --agent-id across multiple workers", async () => {
+    // A single explicit --agent-id reused for N>1 workers would collapse them
+    // into one agent record (the API reuses the row for an existing X-Agent-ID).
+    // The guard must fire before any sandbox is provisioned, even on dry-run.
+    // runE2BCommand swallows the throw into a stderr line + exitCode=1, so assert
+    // on those rather than on a propagated exception.
+    const originalError = console.error;
+    const errLines: string[] = [];
+    console.error = (...args: unknown[]) => {
+      errLines.push(args.map(String).join(" "));
+    };
+    const previousExitCode = process.exitCode;
+    try {
+      await runE2BCommand([
+        "start-stack",
+        "--dry-run",
+        "--yes",
+        "--workers",
+        "2",
+        "--swarm",
+        "test",
+        "--agent-id",
+        "fixed-worker",
+        "--json",
+      ]);
+    } finally {
+      console.error = originalError;
+    }
+    expect(process.exitCode).toBe(1);
+    process.exitCode = previousExitCode ?? 0;
+    expect(errLines.join("\n")).toContain("--agent-id cannot be shared across multiple workers");
+  });
+  test("allows an explicit --agent-id for a single-worker stack", async () => {
+    // One worker + explicit ID is unambiguous — no collision, so it must pass.
+    const payload = await runStackJson([
+      "start-stack",
+      "--dry-run",
+      "--yes",
+      "--workers",
+      "1",
+      "--swarm",
+      "test",
+      "--agent-id",
+      "fixed-worker",
+      "--json",
+    ]);
+    expect((payload.workers as unknown[]).length).toBe(1);
+  });
+  test("integration toggles disable only the unlisted/--no-<x> integrations", () => {
+    // Default: all on.
+    expect(resolveIntegrationToggles(parseFlags(["start-stack"]))).toEqual({
+      slack: true,
+      github: true,
+      jira: true,
+      linear: true,
+    });
+    // --no-slack flips just slack off.
+    expect(resolveIntegrationToggles(parseFlags(["start-stack", "--no-slack"]))).toMatchObject({
+      slack: false,
+      github: true,
+    });
+    // --integrations is an allowlist: only github stays on.
+    expect(
+      resolveIntegrationToggles(parseFlags(["start-stack", "--integrations", "github"])),
+    ).toEqual({
+      slack: false,
+      github: true,
+      jira: false,
+      linear: false,
+    });
+  });
+  test("integration disables land only on the API runtime scope", async () => {
+    const flags = parseFlags([
+      "start-stack",
+      "--no-slack",
+      "--integrations",
+      "github",
+      "--dry-run",
+      "--api-key",
+      "k",
+    ]);
+    const api = await loadRuntimeEnv(flags, { swarmRole: "api", envScope: "api" });
+    const worker = await loadRuntimeEnv(
+      flags,
+      { swarmRole: "worker", agentRole: "worker", envScope: "worker" },
+      "https://api.example.com",
+    );
+    expect(api.SLACK_DISABLE).toBe("true");
+    expect(api.JIRA_DISABLE).toBe("true");
+    expect(api.LINEAR_DISABLE).toBe("true");
+    // github stayed on via the allowlist.
+    expect(api.GITHUB_DISABLE).toBeUndefined();
+    // The worker scope never carries these API-side toggles.
+    expect(worker.SLACK_DISABLE).toBeUndefined();
+  });
+});
+describe("E2B swarm grouping + deep-link (Phase 4)", () => {
+  const previous: Record<string, string | undefined> = {};
+  beforeEach(() => {
+    for (const key of ["AGENT_SWARM_API_KEY", "API_KEY", "HARNESS_PROVIDER", "APP_URL"]) {
+      previous[key] = process.env[key];
+      delete process.env[key];
+    }
+  });
+  afterEach(() => {
+    for (const [key, value] of Object.entries(previous)) {
+      if (value === undefined) delete process.env[key];
+      else process.env[key] = value;
+    }
+  });
+  /** Run `e2b <argv>` capturing stdout lines (no JSON parse). */
+  async function runStackLines(argv: string[]): Promise<string[]> {
+    const originalLog = console.log;
+    const lines: string[] = [];
+    console.log = (...args: unknown[]) => {
+      lines.push(args.map(String).join(" "));
+    };
+    try {
+      await runE2BCommand(argv);
+    } finally {
+      console.log = originalLog;
+    }
+    return lines;
+  }
+  test("dry-run stack stamps swarm + swarmRole onto every sandbox's metadata", async () => {
+    const lines = await runStackLines([
+      "start-stack",
+      "--dry-run",
+      "--yes",
+      "--workers",
+      "1",
+      "--swarm",
+      "demo",
+      "--json",
+    ]);
+    // The "swarm: demo" echo precedes the JSON; parse only the JSON tail.
+    const jsonStart = lines.findIndex((l) => l.trim().startsWith("{"));
+    const payload = JSON.parse(lines.slice(jsonStart).join("\n")) as {
+      api: { sandbox: { metadata: Record<string, string> } };
+      lead: { sandbox: { metadata: Record<string, string> } };
+      workers: { sandbox: { metadata: Record<string, string> } }[];
+    };
+    // Shared slug across all roles.
+    expect(payload.api.sandbox.metadata.swarm).toBe("demo");
+    expect(payload.lead.sandbox.metadata.swarm).toBe("demo");
+    expect(payload.workers[0]?.sandbox.metadata.swarm).toBe("demo");
+    // Distinct grouping roles (lead is E2B role:"worker" but swarmRole:"lead").
+    expect(payload.api.sandbox.metadata.swarmRole).toBe("api");
+    expect(payload.lead.sandbox.metadata.swarmRole).toBe("lead");
+    expect(payload.workers[0]?.sandbox.metadata.swarmRole).toBe("worker");
+    // API carries its port; lead/worker do not (they carry agentId reconstruction-ready data).
+    expect(payload.api.sandbox.metadata.apiPort).toBe("3013");
+  });
+  test("a stack with no --swarm generates a shared slug and echoes it", async () => {
+    const lines = await runStackLines(["start-stack", "--dry-run", "--yes", "--workers", "1"]);
+    const swarmLine = lines.find((l) => l.startsWith("swarm: "));
+    expect(swarmLine).toBeDefined();
+    const slug = swarmLine?.slice("swarm: ".length).trim() ?? "";
+    expect(slug).toMatch(/^swarm-[0-9a-f]{6}$/);
+  });
+  test("e2b dashboard deep-link uses camelCase params and hides the key by default", () => {
+    const masked = buildDashboardDeepLink(
+      { apiUrl: "https://api.example.com", apiKey: "super-secret-key", name: "demo" },
+      false,
+    );
+    // camelCase params the SPA reads.
+    expect(masked).toContain("apiUrl=https%3A%2F%2Fapi.example.com");
+    expect(masked).toContain("name=demo");
+    // Key hidden — the real value MUST NOT appear.
+    expect(masked).toContain("apiKey=<hidden — pass --reveal-key>");
+    expect(masked).not.toContain("super-secret-key");
+    // Never snake_case.
+    expect(masked).not.toContain("api_url");
+    expect(masked).not.toContain("api_key");
+  });
+  test("e2b dashboard deep-link embeds the real key only when revealed", () => {
+    const revealed = buildDashboardDeepLink(
+      { apiUrl: "https://api.example.com", apiKey: "super-secret-key", name: "demo" },
+      true,
+    );
+    expect(revealed).toContain("apiKey=super-secret-key");
+    expect(revealed).not.toContain("<hidden");
+    expect(revealed).toContain("apiUrl=https%3A%2F%2Fapi.example.com");
+  });
+  test("--reveal-key gating: default masks the key in stack output, flag reveals it", async () => {
+    process.env.APP_URL = "https://dash.example.com";
+    const baseArgs = [
+      "start-stack",
+      "--dry-run",
+      "--yes",
+      "--workers",
+      "1",
+      "--api-key",
+      "k3y-s3cr3t-value",
+    ];
+    const maskedLines = await runStackLines(baseArgs);
+    const maskedDash = maskedLines.find((l) => l.startsWith("dashboard: ")) ?? "";
+    expect(maskedDash).toContain("apiKey=<hidden — pass --reveal-key>");
+    expect(maskedDash).not.toContain("k3y-s3cr3t-value");
+    const revealedLines = await runStackLines([...baseArgs, "--reveal-key"]);
+    const revealedDash = revealedLines.find((l) => l.startsWith("dashboard: ")) ?? "";
+    expect(revealedDash).toContain("apiKey=k3y-s3cr3t-value");
+    expect(revealedDash).not.toContain("<hidden");
+  });
+  test("onboarding dashboard builder emits camelCase apiUrl/apiKey (not snake_case)", () => {
+    const url = buildOnboardDashboardUrl({
+      apiUrl: "http://localhost:3013",
+      apiKey: "onboard-key",
+    });
+    expect(url).toContain("apiUrl=http%3A%2F%2Flocalhost%3A3013");
+    expect(url).toContain("apiKey=onboard-key");
+    // The bug we fixed: snake_case is silently ignored by the SPA.
+    expect(url).not.toContain("api_url");
+    expect(url).not.toContain("api_key");
+    expect(url.startsWith("https://app.agent-swarm.dev?")).toBe(true);
+  });
+  test("swarmGroupMembers restricts a named swarm to dispatcher-owned sandboxes", () => {
+    const sandboxes: E2BSandboxInfo[] = [
+      // Ours: matching slug + our launcher tag.
+      {
+        sandboxID: "ours-api",
+        templateID: "tpl",
+        metadata: { swarm: "myswarm", launcher: "agent-swarm-e2b", swarmRole: "api" },
+      },
+      {
+        sandboxID: "ours-worker",
+        templateID: "tpl",
+        metadata: { swarm: "myswarm", launcher: "agent-swarm-e2b", swarmRole: "worker" },
+      },
+      // Foreign: same slug, but NOT launched by us — must be excluded so
+      // `swarms kill/info/logs/add` can never touch it.
+      {
+        sandboxID: "foreign-collision",
+        templateID: "tpl",
+        metadata: { swarm: "myswarm" },
+      },
+      // Ours, but a different swarm — excluded by the slug filter.
+      {
+        sandboxID: "ours-other",
+        templateID: "tpl",
+        metadata: { swarm: "otherswarm", launcher: "agent-swarm-e2b" },
+      },
+    ];
+    const members = swarmGroupMembers(sandboxes, "myswarm");
+    expect(members.map((m) => m.sandboxID).sort()).toEqual(["ours-api", "ours-worker"]);
+    // The foreign sandbox with a colliding generic `metadata.swarm` is dropped.
+    expect(members.some((m) => m.sandboxID === "foreign-collision")).toBe(false);
+  });
+});