npm - @vellumai/cli - Versions diffs - 0.6.6 → 0.7.1 - Mend

@vellumai/cli 0.6.6 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61)

package/AGENTS.md +8 -2
package/README.md +49 -0
package/package.json +1 -1
package/src/__tests__/assistant-config.test.ts +1 -7
package/src/__tests__/backup.test.ts +475 -0
package/src/__tests__/config-utils.test.ts +146 -0
package/src/__tests__/env-drift.test.ts +10 -32
package/src/__tests__/llm-provider-env-var-parity.test.ts +1 -21
package/src/__tests__/multi-local.test.ts +0 -5
package/src/__tests__/sleep.test.ts +1 -2
package/src/__tests__/teleport.test.ts +988 -1266
package/src/commands/backup.ts +117 -71
package/src/commands/client.ts +10 -9
package/src/commands/env.ts +93 -0
package/src/commands/events.ts +2 -0
package/src/commands/exec.ts +58 -13
package/src/commands/login.ts +77 -12
package/src/commands/logs.ts +2 -7
package/src/commands/ps.ts +144 -25
package/src/commands/restore.ts +26 -47
package/src/commands/sleep.ts +5 -2
package/src/commands/ssh.ts +17 -7
package/src/commands/teleport.ts +462 -584
package/src/commands/terminal.ts +9 -221
package/src/commands/tunnel.ts +2 -7
package/src/commands/upgrade.ts +108 -7
package/src/commands/wake.ts +2 -1
package/src/components/DefaultMainScreen.tsx +328 -154
package/src/index.ts +5 -7
package/src/lib/__tests__/docker.test.ts +50 -74
package/src/lib/__tests__/job-polling.test.ts +278 -0
package/src/lib/__tests__/local-runtime-client.test.ts +480 -0
package/src/lib/__tests__/platform-client-signed-url.test.ts +405 -0
package/src/lib/__tests__/runtime-url.test.ts +87 -0
package/src/lib/__tests__/terminal-session.test.ts +202 -0
package/src/lib/assistant-client.ts +5 -21
package/src/lib/assistant-config.ts +46 -24
package/src/lib/cli-error.ts +1 -0
package/src/lib/client-identity.ts +67 -0
package/src/lib/docker.ts +75 -77
package/src/lib/environments/__tests__/paths.test.ts +2 -0
package/src/lib/environments/resolve.ts +89 -7
package/src/lib/environments/seeds.ts +8 -5
package/src/lib/environments/types.ts +10 -0
package/src/lib/hatch-local.ts +15 -120
package/src/lib/health-check.ts +98 -0
package/src/lib/job-polling.ts +195 -0
package/src/lib/local-runtime-client.ts +231 -0
package/src/lib/local.ts +165 -72
package/src/lib/orphan-detection.ts +2 -35
package/src/lib/platform-client.ts +190 -194
package/src/lib/platform-releases.ts +23 -0
package/src/lib/retire-local.ts +6 -2
package/src/lib/runtime-url.ts +30 -0
package/src/lib/sync-cloud-assistants.ts +126 -0
package/src/lib/terminal-client.ts +6 -1
package/src/lib/terminal-session.ts +536 -0
package/src/lib/tui-log.ts +60 -0
package/src/lib/xdg-log.ts +10 -4
package/src/shared/provider-env-vars.ts +2 -3
package/src/__tests__/orphan-detection.test.ts +0 -214

package/AGENTS.md CHANGED Viewed

@@ -41,6 +41,12 @@ Every command must have high-quality `--help` output. Follow the same standards
    AI agents parse help text to decide which command to run and how. Avoid vague
    language — say exactly what the command does and where state is stored.
+## Boundary: No integration-specific references
+The CLI is a generic lifecycle manager. It must **never** contain references to specific skills, integrations, or features (e.g. "Meet", "Slack", "Telegram"). Environment variables, volume mounts, and device passthroughs defined here must use generic names (e.g. `VELLUM_AVATAR_DEVICE`, not `VELLUM_MEET_AVATAR_DEVICE`). The skill that uses a resource decides how to interpret it — the CLI just passes it through.
+Cross-package imports into `skills/` are forbidden. The CLI is distributed as an npm package; anything outside `cli/` is not included in the tarball and will fail to resolve at runtime.
 ## Boundary: No `.vellum/` directory access
 The CLI must **never** read from or write to the `.vellum/` directory (e.g. `~/.vellum/protected/`, `<instanceDir>/.vellum/`). That directory structure is an **assistant daemon / gateway implementation detail**. The CLI's job is to spawn those processes and pass configuration via environment variables — not to reach into their internal storage.
@@ -62,9 +68,9 @@ The CLI creates and manages Docker volumes for containerized instances. See the
 **Meet Docker-in-Docker support** (assistant container only): The assistant container runs an inner `dockerd` that hosts the Meet-bot containers as nested children. The CLI supports this by:
 - Creating a dedicated `<name>-dockerd-data` volume mounted at `/var/lib/docker` so pulled images and container state persist across assistant restarts.
-- Running the assistant container with `--privileged` (or `CAP_SYS_ADMIN` + `CAP_NET_ADMIN`) so the inner dockerd can configure cgroups, overlay mounts, and container networking.
+- Running the assistant container with `CAP_SYS_ADMIN` + `CAP_NET_ADMIN` plus `--security-opt seccomp=unconfined` + `--security-opt apparmor=unconfined` so the inner dockerd can configure cgroups, overlay mounts, and container networking without the default seccomp profile blocking clone/unshare/pivot_root syscalls or the default AppArmor profile denying its mount operations. `--privileged` is deliberately avoided — dropping it shrinks the escape surface by withholding the rest of the host capability set and access to host device nodes.
 - No longer bind-mounting the host's `/var/run/docker.sock`; Meet-bot spawning happens entirely inside the assistant container.
 Both are wired in `serviceDockerRunArgs()` in `lib/docker.ts`.
-The privileged assistant container is acceptable for single-user local deployments. Managed/multi-tenant mode needs a different spawn model (e.g. a Kubernetes job runner) and is out of scope for this CLI.
+This capability + security-opt set is acceptable for single-user local deployments. Managed/multi-tenant mode needs a different spawn model (e.g. a Kubernetes job runner) and is out of scope for this CLI.

package/README.md CHANGED Viewed

@@ -97,6 +97,55 @@ VELLUM_CUSTOM_HOST=user@10.0.0.1 vellum hatch --remote custom
 When hatching on GCP in interactive mode (without `-d`), the CLI displays an animated progress TUI that polls the instance's startup script output in real time. Press `Ctrl+C` to detach -- the instance will continue running in the background.
+### `terminal`
+Open an interactive shell into a managed assistant container. Useful for debugging, inspecting state, or working alongside the assistant in a shared `tmux` session.
+```bash
+vellum terminal [name] [options]
+vellum terminal attach <session> [name] [options]
+vellum terminal list [name] [options]
+```
+Only available for managed assistants (those running in a Vellum Cloud container). Local assistants don't have a container to terminal into.
+#### Subcommands
+| Subcommand         | Description                                                              |
+| ------------------ | ------------------------------------------------------------------------ |
+| _(none)_           | Open an interactive shell session inside the container.                  |
+| `attach <session>` | Attach to an existing `tmux` session by name inside the container.       |
+| `list`             | List the `tmux` sessions currently running inside the container.         |
+#### Options
+| Option               | Description                                                                                  |
+| -------------------- | -------------------------------------------------------------------------------------------- |
+| `[name]`             | Positional. Name of the assistant to target. Defaults to the active assistant set via `vellum use`. |
+| `--assistant <name>` | Explicit form of the assistant name. Equivalent to the positional argument.                  |
+If no assistant is named and no active assistant is set, the CLI uses the only managed assistant in the lockfile -- or errors out if there's more than one. Use `vellum ps` to see your assistants and `vellum use <name>` to set the active one.
+#### Examples
+```bash
+# Open a shell in the active managed assistant
+vellum terminal
+# Target a specific assistant by name
+vellum terminal my-assistant
+vellum terminal --assistant my-assistant
+# List running tmux sessions inside the container
+vellum terminal list
+# Attach to a named tmux session
+vellum terminal attach my-session
+vellum terminal attach my-session my-assistant
+```
+This pairs well with the [`terminal-sessions` skill](https://github.com/vellum-ai/vellum-assistant/tree/main/skills/terminal-sessions), which lets the assistant create and manage its own `tmux` sessions. You can `vellum terminal attach` into one of those sessions to watch the assistant work in real time -- for example, pairing on a long-running Claude Code run.
 ### `retire`
 Delete a provisioned assistant instance. The cloud provider and connection details are automatically resolved from the saved assistant config (written during `hatch`).

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@vellumai/cli",
-  "version": "0.6.6",
+  "version": "0.7.1",
   "description": "CLI tools for vellum-assistant",
   "type": "module",
   "exports": {

package/src/__tests__/assistant-config.test.ts CHANGED Viewed

@@ -216,7 +216,7 @@ describe("migrateLegacyEntry", () => {
   test("synthesises full resources when none exist", () => {
     /**
      * Tests that a legacy local entry with no resources object gets a
-     * complete resources object synthesised with default ports and pidFile.
+     * complete resources object synthesised with default ports.
      */
     // GIVEN a local entry with no resources
@@ -239,7 +239,6 @@ describe("migrateLegacyEntry", () => {
     expect(resources.gatewayPort).toBe(7830);
     expect(resources.qdrantPort).toBe(6333);
     expect(resources.cesPort).toBe(8090);
-    expect(resources.pidFile).toContain("vellum.pid");
   });
   test("infers gateway port from runtimeUrl", () => {
@@ -312,7 +311,6 @@ describe("migrateLegacyEntry", () => {
     expect(resources.gatewayPort).toBe(7830);
     expect(resources.qdrantPort).toBe(6333);
     expect(resources.cesPort).toBe(8090);
-    expect(resources.pidFile).toBe("/custom/path/.vellum/vellum.pid");
   });
   test("does not overwrite existing resources fields", () => {
@@ -331,7 +329,6 @@ describe("migrateLegacyEntry", () => {
         gatewayPort: 8001,
         qdrantPort: 8002,
         cesPort: 8003,
-        pidFile: "/my/path/.vellum/vellum.pid",
       },
     };
@@ -366,7 +363,6 @@ describe("migrateLegacyEntry", () => {
         daemonPort: 7821,
         gatewayPort: 7830,
         qdrantPort: 6333,
-        pidFile: "/new/path/.vellum/vellum.pid",
       },
     };
@@ -393,7 +389,6 @@ describe("migrateLegacyEntry", () => {
         daemonPort: 7821,
         gatewayPort: 7830,
         qdrantPort: 6333,
-        pidFile: "/custom/path/.vellum/vellum.pid",
       },
     };
     // WHEN we migrate the entry
@@ -415,7 +410,6 @@ describe("migrateLegacyEntry", () => {
         gatewayPort: 8001,
         qdrantPort: 8002,
         cesPort: 9090,
-        pidFile: "/my/path/.vellum/vellum.pid",
       },
     };
     const changed = migrateLegacyEntry(entry);

package/src/__tests__/backup.test.ts ADDED Viewed

@@ -0,0 +1,475 @@
+import {
+  afterAll,
+  afterEach,
+  beforeEach,
+  describe,
+  expect,
+  mock,
+  spyOn,
+  test,
+} from "bun:test";
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+// ---------------------------------------------------------------------------
+// Lockfile isolation (mirrors teleport.test.ts)
+// ---------------------------------------------------------------------------
+const testDir = mkdtempSync(join(tmpdir(), "cli-backup-test-"));
+process.env.VELLUM_LOCKFILE_DIR = testDir;
+// ---------------------------------------------------------------------------
+// Mocks set up before importing the module under test
+// ---------------------------------------------------------------------------
+import * as fs from "node:fs";
+import * as assistantConfig from "../lib/assistant-config.js";
+import * as backupOps from "../lib/backup-ops.js";
+import * as guardianToken from "../lib/guardian-token.js";
+import * as localRuntimeClient from "../lib/local-runtime-client.js";
+import { MigrationInProgressError } from "../lib/local-runtime-client.js";
+import * as platformClient from "../lib/platform-client.js";
+const findAssistantByNameMock = spyOn(
+  assistantConfig,
+  "findAssistantByName",
+).mockReturnValue(null);
+const readPlatformTokenMock = spyOn(
+  platformClient,
+  "readPlatformToken",
+).mockReturnValue("platform-token");
+const getPlatformUrlMock = spyOn(
+  platformClient,
+  "getPlatformUrl",
+).mockReturnValue("https://platform.vellum.ai");
+const platformRequestSignedUrlMock = spyOn(
+  platformClient,
+  "platformRequestSignedUrl",
+).mockImplementation(async (params) => ({
+  url:
+    params.operation === "upload"
+      ? "https://storage.googleapis.com/bucket/signed-upload"
+      : "https://storage.googleapis.com/bucket/signed-download",
+  bundleKey: params.bundleKey ?? "uploads/org-1/bundle-abc.vbundle",
+  expiresAt: new Date(Date.now() + 3600_000).toISOString(),
+}));
+const localRuntimeExportToGcsMock = spyOn(
+  localRuntimeClient,
+  "localRuntimeExportToGcs",
+).mockResolvedValue({ jobId: "platform-export-job-1" });
+const localRuntimePollJobStatusMock = spyOn(
+  localRuntimeClient,
+  "localRuntimePollJobStatus",
+).mockResolvedValue({
+  jobId: "platform-export-job-1",
+  type: "export",
+  status: "complete",
+  result: { manifest_sha256: "abc123def456" },
+});
+// Mode 1 (runtime-direct local backup) uses guardian tokens. These tests do
+// not exercise that mode, but the guardian-token spies still need to exist
+// so the module under test can import them without surprises.
+spyOn(guardianToken, "loadGuardianToken").mockReturnValue({
+  accessToken: "local-token",
+  accessTokenExpiresAt: new Date(Date.now() + 60_000).toISOString(),
+} as unknown as ReturnType<typeof guardianToken.loadGuardianToken>);
+spyOn(guardianToken, "leaseGuardianToken").mockResolvedValue({
+  accessToken: "leased-token",
+  accessTokenExpiresAt: new Date(Date.now() + 60_000).toISOString(),
+} as unknown as Awaited<ReturnType<typeof guardianToken.leaseGuardianToken>>);
+const getBackupsDirMock = spyOn(backupOps, "getBackupsDir").mockReturnValue(
+  "/tmp/backups-default",
+);
+const mkdirSyncMock = spyOn(fs, "mkdirSync").mockImplementation(
+  (() => undefined) as never,
+);
+const writeFileSyncMock = spyOn(fs, "writeFileSync").mockImplementation(
+  () => undefined,
+);
+let originalFetch: typeof globalThis.fetch;
+let exitMock: ReturnType<typeof mock>;
+const VELLUM_ENTRY = {
+  assistantId: "11111111-2222-3333-4444-555555555555",
+  runtimeUrl: "https://platform.vellum.ai",
+  cloud: "vellum",
+  species: "vellum",
+  hatchedAt: new Date().toISOString(),
+} satisfies assistantConfig.AssistantEntry;
+/**
+ * Point `process.argv` at a simulated `vellum backup` invocation.
+ *
+ * @param rest - Arguments that follow the `backup` subcommand (assistant
+ *   name, flags, flag values), appended in the order given.
+ */
+function setArgv(...rest: string[]) {
+  const invocation = ["bun", "vellum", "backup"];
+  process.argv = invocation.concat(rest);
+}
+// Real `process.exit`, captured before each test swaps in the throwing mock
+// so that `afterEach` can put it back. Without this the mock would stay
+// installed after the last test and leak into whatever runs next.
+let originalExit: typeof process.exit;
+/**
+ * Per-test setup: remember the real `fetch` and `process.exit`, install a
+ * `process.exit` replacement that throws `process.exit:<code>` (so tests can
+ * assert on exit paths with `rejects.toThrow`), and reset every module-level
+ * spy back to its default stubbed behaviour.
+ */
+beforeEach(() => {
+  originalFetch = globalThis.fetch;
+  originalExit = process.exit;
+  exitMock = mock((code?: number) => {
+    throw new Error(`process.exit:${code}`);
+  });
+  process.exit = exitMock as unknown as typeof process.exit;
+  findAssistantByNameMock.mockReset();
+  findAssistantByNameMock.mockReturnValue(null);
+  readPlatformTokenMock.mockReset();
+  readPlatformTokenMock.mockReturnValue("platform-token");
+  getPlatformUrlMock.mockReset();
+  getPlatformUrlMock.mockReturnValue("https://platform.vellum.ai");
+  platformRequestSignedUrlMock.mockReset();
+  platformRequestSignedUrlMock.mockImplementation(async (params) => ({
+    url:
+      params.operation === "upload"
+        ? "https://storage.googleapis.com/bucket/signed-upload"
+        : "https://storage.googleapis.com/bucket/signed-download",
+    bundleKey: params.bundleKey ?? "uploads/org-1/bundle-abc.vbundle",
+    expiresAt: new Date(Date.now() + 3600_000).toISOString(),
+  }));
+  localRuntimeExportToGcsMock.mockReset();
+  localRuntimeExportToGcsMock.mockResolvedValue({
+    jobId: "platform-export-job-1",
+  });
+  localRuntimePollJobStatusMock.mockReset();
+  localRuntimePollJobStatusMock.mockResolvedValue({
+    jobId: "platform-export-job-1",
+    type: "export",
+    status: "complete",
+    result: { manifest_sha256: "abc123def456" },
+  });
+  getBackupsDirMock.mockReset();
+  getBackupsDirMock.mockReturnValue("/tmp/backups-default");
+  mkdirSyncMock.mockReset();
+  mkdirSyncMock.mockImplementation((() => undefined) as never);
+  writeFileSyncMock.mockReset();
+  writeFileSyncMock.mockImplementation(() => undefined);
+});
+/**
+ * Per-test teardown: undo the two global replacements made for the test —
+ * `globalThis.fetch` (possibly swapped by `mockGcsDownload`) and
+ * `process.exit` (swapped in `beforeEach`).
+ */
+afterEach(() => {
+  globalThis.fetch = originalFetch;
+  process.exit = originalExit;
+});
+/**
+ * File-level teardown: restore every spy installed at module scope and
+ * delete the temporary lockfile directory created for this file.
+ */
+afterAll(() => {
+  // Restore module-level spies so they don't bleed into other test files
+  // when bun test runs the whole suite.
+  findAssistantByNameMock.mockRestore();
+  readPlatformTokenMock.mockRestore();
+  getPlatformUrlMock.mockRestore();
+  platformRequestSignedUrlMock.mockRestore();
+  localRuntimeExportToGcsMock.mockRestore();
+  localRuntimePollJobStatusMock.mockRestore();
+  getBackupsDirMock.mockRestore();
+  mkdirSyncMock.mockRestore();
+  writeFileSyncMock.mockRestore();
+  // The guardian-token spies were created without keeping a handle, so they
+  // cannot be restored one by one; `mock.restore()` reverts every remaining
+  // `spyOn` patch in a single call.
+  mock.restore();
+  rmSync(testDir, { recursive: true, force: true });
+});
+import { backup } from "../commands/backup.js";
+// ---------------------------------------------------------------------------
+// Helper: simulated GCS download response
+// ---------------------------------------------------------------------------
+/**
+ * Replace `globalThis.fetch` with a mock that answers every call with a
+ * canned response standing in for the GCS download.
+ *
+ * @param body - Bytes served as the response body when `ok` is true.
+ * @param ok - When false, the body is the literal string "boom" and the
+ *   status text is "Error" instead of "OK".
+ * @param status - HTTP status code placed on the response.
+ */
+function mockGcsDownload(body: Uint8Array, ok = true, status = 200) {
+  const fakeFetch = mock(async () => {
+    let payload: BodyInit;
+    let statusText: string;
+    if (ok) {
+      payload = new Blob([body as unknown as ArrayBuffer]);
+      statusText = "OK";
+    } else {
+      payload = "boom";
+      statusText = "Error";
+    }
+    return new Response(payload, { status, statusText });
+  });
+  globalThis.fetch = fakeFetch as unknown as typeof globalThis.fetch;
+}
+describe("vellum backup <platform-managed>: GCS happy path", () => {
+  test("requests upload URL → kicks off runtime export → polls → downloads from GCS → writes file", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    const bytes = new Uint8Array([1, 2, 3, 4]);
+    mockGcsDownload(bytes);
+    await backup();
+    // Upload-URL request to the platform.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "upload" }),
+      "platform-token",
+      "https://platform.vellum.ai",
+    );
+    // Runtime export-to-gcs kicked off via the entry-aware helper. URL
+    // construction is exercised in `local-runtime-client.test.ts`; here we
+    // assert the helper got the right entry + token + params.
+    expect(localRuntimeExportToGcsMock).toHaveBeenCalledWith(
+      expect.objectContaining({
+        cloud: "vellum",
+        runtimeUrl: "https://platform.vellum.ai",
+        assistantId: "11111111-2222-3333-4444-555555555555",
+      }),
+      "platform-token",
+      expect.objectContaining({
+        uploadUrl: "https://storage.googleapis.com/bucket/signed-upload",
+        description: "CLI backup",
+      }),
+    );
+    // Poll uses the entry-aware helper (wildcard URL, NOT the dedicated
+    // platform jobs/{id}/ endpoint).
+    expect(localRuntimePollJobStatusMock).toHaveBeenCalledWith(
+      expect.objectContaining({ cloud: "vellum" }),
+      "platform-token",
+      "platform-export-job-1",
+    );
+    // Download URL keyed off the upload's bundleKey.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      {
+        operation: "download",
+        bundleKey: "uploads/org-1/bundle-abc.vbundle",
+      },
+      "platform-token",
+      "https://platform.vellum.ai",
+    );
+    // GCS fetch went directly to the signed download URL with no auth.
+    const gcsFetch = globalThis.fetch as unknown as ReturnType<typeof mock>;
+    expect(gcsFetch).toHaveBeenCalledWith(
+      "https://storage.googleapis.com/bucket/signed-download",
+    );
+    // File written to disk with the bytes from GCS.
+    expect(writeFileSyncMock).toHaveBeenCalledTimes(1);
+    const [outputPath, written] = writeFileSyncMock.mock.calls[0]!;
+    expect(written).toEqual(bytes);
+    expect(typeof outputPath).toBe("string");
+    expect(outputPath as string).toMatch(
+      /\/tmp\/backups-default\/my-platform-.*\.vbundle$/,
+    );
+    expect(mkdirSyncMock).toHaveBeenCalled();
+  });
+  test("--output override is respected", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform", "--output", "/custom/path/backup.vbundle");
+    mockGcsDownload(new Uint8Array([7, 7, 7]));
+    await backup();
+    expect(writeFileSyncMock).toHaveBeenCalledTimes(1);
+    expect(writeFileSyncMock.mock.calls[0]![0]).toBe(
+      "/custom/path/backup.vbundle",
+    );
+  });
+  test("default output path is getBackupsDir() + name-timestamp.vbundle", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array([1]));
+    await backup();
+    const [outputPath] = writeFileSyncMock.mock.calls[0]!;
+    expect(outputPath as string).toMatch(
+      /^\/tmp\/backups-default\/my-platform-/,
+    );
+    expect(outputPath as string).toMatch(/\.vbundle$/);
+  });
+  test("signed-URL requests target entry.runtimeUrl, not getPlatformUrl() — regression for staging/dev assistants", async () => {
+    // Assistant lives on a non-default platform instance (e.g. staging).
+    // `getPlatformUrl()` still returns the default — picking it up for
+    // signed URLs would target the wrong GCS bucket.
+    const stagingEntry = {
+      ...VELLUM_ENTRY,
+      runtimeUrl: "https://staging-platform.vellum.ai",
+    };
+    findAssistantByNameMock.mockReturnValue(stagingEntry);
+    getPlatformUrlMock.mockReturnValue("https://platform.vellum.ai");
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array([9]));
+    await backup();
+    // Both upload and download URL requests are pinned to the entry's
+    // runtimeUrl. The signed URLs returned by the platform target the
+    // GCS bucket the runtime can reach, not the default platform's.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "upload" }),
+      "platform-token",
+      "https://staging-platform.vellum.ai",
+    );
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "download" }),
+      "platform-token",
+      "https://staging-platform.vellum.ai",
+    );
+    // No call should have used the default platform URL.
+    const calls = platformRequestSignedUrlMock.mock.calls;
+    for (const call of calls) {
+      expect(call[2]).toBe("https://staging-platform.vellum.ai");
+    }
+  });
+  test("download-URL request uses the refreshed platform token if polling re-authed mid-export", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    // Stub the poll helper so its first call already resolves to a
+    // terminal "complete" status with an empty result. The stub never
+    // invokes a refresh hook, so no poll-loop re-auth happens here.
+    localRuntimePollJobStatusMock.mockReset();
+    localRuntimePollJobStatusMock.mockImplementation(async () => ({
+      jobId: "platform-export-job-1",
+      type: "export",
+      status: "complete",
+      result: {},
+    }));
+    // readPlatformToken returns "platform-token-old" on its first call
+    // and "platform-token-new" on every later call, mimicking the "user
+    // re-ran `vellum login` in another terminal" scenario. The test
+    // does not assert which of the two values backup ends up using;
+    // the assertions below only require that the upload, kickoff, poll
+    // and download steps all receive the same one.
+    readPlatformTokenMock.mockReset();
+    readPlatformTokenMock.mockReturnValueOnce("platform-token-old");
+    readPlatformTokenMock.mockReturnValue("platform-token-new");
+    // This test does not drive a real mid-export refresh. According to
+    // the original author's notes, backup only re-reads the platform
+    // token inside pollJobUntilDone's `refreshOn401` hook, and the poll
+    // stub above bypasses that path entirely (TODO confirm against
+    // backup.ts). What is pinned here instead is a structural
+    // regression guard: the download signed-URL request must use the
+    // same token as the upload, kickoff and poll steps — i.e. backup
+    // threads one variable (`exportPlatformToken`, per those notes)
+    // through all four calls, so a refreshed value would reach the
+    // download step too.
+    mockGcsDownload(new Uint8Array([1]));
+    await backup();
+    // All four token-bearing platform calls (upload signed-URL, runtime
+    // export-to-gcs kickoff, poll, download signed-URL) must use the
+    // same token string. If the download step fell back to the captured
+    // `platformToken` parameter instead of `exportPlatformToken`, a
+    // future poll-loop refresh would silently break this invariant.
+    const uploadCallToken = platformRequestSignedUrlMock.mock.calls.find(
+      (c) => (c[0] as { operation: string }).operation === "upload",
+    )![1];
+    const downloadCallToken = platformRequestSignedUrlMock.mock.calls.find(
+      (c) => (c[0] as { operation: string }).operation === "download",
+    )![1];
+    expect(downloadCallToken).toBe(uploadCallToken);
+    const kickoffToken = localRuntimeExportToGcsMock.mock.calls[0]![1];
+    expect(downloadCallToken).toBe(kickoffToken);
+    const pollToken = localRuntimePollJobStatusMock.mock.calls[0]![1];
+    expect(downloadCallToken).toBe(pollToken);
+  });
+});
+describe("vellum backup <platform-managed>: failure cases", () => {
+  test("not logged in (no platform token) exits with 'Run vellum login'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    readPlatformTokenMock.mockReturnValue(null);
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      expect(consoleErrorSpy).toHaveBeenCalledWith(
+        expect.stringContaining("Not logged in"),
+      );
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("MigrationInProgressError on kickoff exits with 'Another backup or teleport export'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    localRuntimeExportToGcsMock.mockRejectedValue(
+      new MigrationInProgressError("export_in_progress", "existing-job-99"),
+    );
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      const calls = consoleErrorSpy.mock.calls.map((c) => c[0]);
+      expect(
+        calls.some(
+          (m) =>
+            typeof m === "string" &&
+            m.includes("Another backup or teleport export") &&
+            m.includes("existing-job-99"),
+        ),
+      ).toBe(true);
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("terminal=failed exits with 'Export failed: <reason>'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    localRuntimePollJobStatusMock.mockResolvedValue({
+      jobId: "platform-export-job-1",
+      type: "export",
+      status: "failed",
+      error: "vbundle build crashed",
+    });
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      expect(consoleErrorSpy).toHaveBeenCalledWith(
+        expect.stringContaining("Export failed: vbundle build crashed"),
+      );
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("GCS fetch !ok exits with 'Failed to fetch bundle from GCS (<status>)'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array(), false, 403);
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      const calls = consoleErrorSpy.mock.calls.map((c) => c[0]);
+      expect(
+        calls.some(
+          (m) =>
+            typeof m === "string" &&
+            m.includes("Failed to fetch bundle from GCS") &&
+            m.includes("403"),
+        ),
+      ).toBe(true);
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+});