npm - @vellumai/cli - Versions diffs - 0.7.0 → 0.7.1 - Mend

@vellumai/cli 0.7.0 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (40)

package/README.md +49 -0
package/package.json +1 -1
package/src/__tests__/backup.test.ts +475 -0
package/src/__tests__/config-utils.test.ts +35 -48
package/src/__tests__/teleport.test.ts +86 -28
package/src/commands/backup.ts +117 -71
package/src/commands/client.ts +10 -9
package/src/commands/exec.ts +21 -8
package/src/commands/hatch.ts +2 -6
package/src/commands/login.ts +15 -33
package/src/commands/logs.ts +2 -7
package/src/commands/ps.ts +41 -6
package/src/commands/restore.ts +26 -47
package/src/commands/ssh.ts +2 -5
package/src/commands/teleport.ts +38 -24
package/src/commands/tunnel.ts +2 -7
package/src/commands/upgrade.ts +108 -7
package/src/components/DefaultMainScreen.tsx +25 -3
package/src/index.ts +2 -7
package/src/lib/__tests__/local-runtime-client.test.ts +122 -25
package/src/lib/__tests__/platform-client-signed-url.test.ts +2 -2
package/src/lib/__tests__/runtime-url.test.ts +87 -0
package/src/lib/__tests__/terminal-session.test.ts +202 -0
package/src/lib/assistant-client.ts +5 -21
package/src/lib/assistant-config.ts +34 -16
package/src/lib/cli-error.ts +1 -0
package/src/lib/client-identity.ts +1 -1
package/src/lib/config-utils.ts +1 -97
package/src/lib/docker.ts +2 -2
package/src/lib/job-polling.ts +1 -1
package/src/lib/local-runtime-client.ts +81 -28
package/src/lib/local.ts +27 -58
package/src/lib/platform-client.ts +1 -220
package/src/lib/platform-releases.ts +23 -0
package/src/lib/runtime-url.ts +30 -0
package/src/lib/sync-cloud-assistants.ts +126 -0
package/src/lib/terminal-client.ts +6 -1
package/src/lib/terminal-session.ts +127 -48
package/src/lib/tui-log.ts +60 -0
package/src/lib/xdg-log.ts +10 -4

package/README.md CHANGED Viewed

@@ -97,6 +97,55 @@ VELLUM_CUSTOM_HOST=user@10.0.0.1 vellum hatch --remote custom
 When hatching on GCP in interactive mode (without `-d`), the CLI displays an animated progress TUI that polls the instance's startup script output in real time. Press `Ctrl+C` to detach -- the instance will continue running in the background.
+### `terminal`
+Open an interactive shell into a managed assistant container. Useful for debugging, inspecting state, or working alongside the assistant in a shared `tmux` session.
+```bash
+vellum terminal [name] [options]
+vellum terminal attach <session> [name] [options]
+vellum terminal list [name] [options]
+```
+Only available for managed assistants (those running in a Vellum Cloud container). Local assistants don't have a container to terminal into.
+#### Subcommands
+| Subcommand         | Description                                                              |
+| ------------------ | ------------------------------------------------------------------------ |
+| _(none)_           | Open an interactive shell session inside the container.                  |
+| `attach <session>` | Attach to an existing `tmux` session by name inside the container.       |
+| `list`             | List the `tmux` sessions currently running inside the container.         |
+#### Options
+| Option               | Description                                                                                  |
+| -------------------- | -------------------------------------------------------------------------------------------- |
+| `[name]`             | Positional. Name of the assistant to target. Defaults to the active assistant set via `vellum use`. |
+| `--assistant <name>` | Explicit form of the assistant name. Equivalent to the positional argument.                  |
+If no assistant is named and no active assistant is set, the CLI uses the only managed assistant in the lockfile -- or errors out if there's more than one. Use `vellum ps` to see your assistants and `vellum use <name>` to set the active one.
+#### Examples
+```bash
+# Open a shell in the active managed assistant
+vellum terminal
+# Target a specific assistant by name
+vellum terminal my-assistant
+vellum terminal --assistant my-assistant
+# List running tmux sessions inside the container
+vellum terminal list
+# Attach to a named tmux session
+vellum terminal attach my-session
+vellum terminal attach my-session my-assistant
+```
+This pairs well with the [`terminal-sessions` skill](https://github.com/vellum-ai/vellum-assistant/tree/main/skills/terminal-sessions), which lets the assistant create and manage its own `tmux` sessions. You can `vellum terminal attach` into one of those sessions to watch the assistant work in real time -- for example, pairing on a long-running Claude Code run.
 ### `retire`
 Delete a provisioned assistant instance. The cloud provider and connection details are automatically resolved from the saved assistant config (written during `hatch`).

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@vellumai/cli",
-  "version": "0.7.0",
+  "version": "0.7.1",
   "description": "CLI tools for vellum-assistant",
   "type": "module",
   "exports": {

package/src/__tests__/backup.test.ts ADDED Viewed

@@ -0,0 +1,475 @@
+import {
+  afterAll,
+  afterEach,
+  beforeEach,
+  describe,
+  expect,
+  mock,
+  spyOn,
+  test,
+} from "bun:test";
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+// ---------------------------------------------------------------------------
+// Lockfile isolation (mirrors teleport.test.ts)
+// ---------------------------------------------------------------------------
+const testDir = mkdtempSync(join(tmpdir(), "cli-backup-test-"));
+process.env.VELLUM_LOCKFILE_DIR = testDir;
+// ---------------------------------------------------------------------------
+// Mocks set up before importing the module under test
+// ---------------------------------------------------------------------------
+import * as fs from "node:fs";
+import * as assistantConfig from "../lib/assistant-config.js";
+import * as backupOps from "../lib/backup-ops.js";
+import * as guardianToken from "../lib/guardian-token.js";
+import * as localRuntimeClient from "../lib/local-runtime-client.js";
+import { MigrationInProgressError } from "../lib/local-runtime-client.js";
+import * as platformClient from "../lib/platform-client.js";
+const findAssistantByNameMock = spyOn(
+  assistantConfig,
+  "findAssistantByName",
+).mockReturnValue(null);
+const readPlatformTokenMock = spyOn(
+  platformClient,
+  "readPlatformToken",
+).mockReturnValue("platform-token");
+const getPlatformUrlMock = spyOn(
+  platformClient,
+  "getPlatformUrl",
+).mockReturnValue("https://platform.vellum.ai");
+const platformRequestSignedUrlMock = spyOn(
+  platformClient,
+  "platformRequestSignedUrl",
+).mockImplementation(async (params) => ({
+  url:
+    params.operation === "upload"
+      ? "https://storage.googleapis.com/bucket/signed-upload"
+      : "https://storage.googleapis.com/bucket/signed-download",
+  bundleKey: params.bundleKey ?? "uploads/org-1/bundle-abc.vbundle",
+  expiresAt: new Date(Date.now() + 3600_000).toISOString(),
+}));
+const localRuntimeExportToGcsMock = spyOn(
+  localRuntimeClient,
+  "localRuntimeExportToGcs",
+).mockResolvedValue({ jobId: "platform-export-job-1" });
+const localRuntimePollJobStatusMock = spyOn(
+  localRuntimeClient,
+  "localRuntimePollJobStatus",
+).mockResolvedValue({
+  jobId: "platform-export-job-1",
+  type: "export",
+  status: "complete",
+  result: { manifest_sha256: "abc123def456" },
+});
+// Mode 1 (runtime-direct local backup) uses guardian tokens. We don't exercise
+// that mode here, but the spies still need to exist so the module under test
+// can import the guardian-token functions without surprises.
+spyOn(guardianToken, "loadGuardianToken").mockReturnValue({
+  accessToken: "local-token",
+  accessTokenExpiresAt: new Date(Date.now() + 60_000).toISOString(),
+} as unknown as ReturnType<typeof guardianToken.loadGuardianToken>);
+spyOn(guardianToken, "leaseGuardianToken").mockResolvedValue({
+  accessToken: "leased-token",
+  accessTokenExpiresAt: new Date(Date.now() + 60_000).toISOString(),
+} as unknown as Awaited<ReturnType<typeof guardianToken.leaseGuardianToken>>);
+const getBackupsDirMock = spyOn(backupOps, "getBackupsDir").mockReturnValue(
+  "/tmp/backups-default",
+);
+const mkdirSyncMock = spyOn(fs, "mkdirSync").mockImplementation(
+  (() => undefined) as never,
+);
+const writeFileSyncMock = spyOn(fs, "writeFileSync").mockImplementation(
+  () => undefined,
+);
+let originalFetch: typeof globalThis.fetch;
+let exitMock: ReturnType<typeof mock>;
+const VELLUM_ENTRY = {
+  assistantId: "11111111-2222-3333-4444-555555555555",
+  runtimeUrl: "https://platform.vellum.ai",
+  cloud: "vellum",
+  species: "vellum",
+  hatchedAt: new Date().toISOString(),
+} satisfies assistantConfig.AssistantEntry;
+function setArgv(...rest: string[]) {
+  process.argv = ["bun", "vellum", "backup", ...rest];
+}
+beforeEach(() => {
+  originalFetch = globalThis.fetch;
+  exitMock = mock((code?: number) => {
+    throw new Error(`process.exit:${code}`);
+  });
+  process.exit = exitMock as unknown as typeof process.exit;
+  findAssistantByNameMock.mockReset();
+  findAssistantByNameMock.mockReturnValue(null);
+  readPlatformTokenMock.mockReset();
+  readPlatformTokenMock.mockReturnValue("platform-token");
+  getPlatformUrlMock.mockReset();
+  getPlatformUrlMock.mockReturnValue("https://platform.vellum.ai");
+  platformRequestSignedUrlMock.mockReset();
+  platformRequestSignedUrlMock.mockImplementation(async (params) => ({
+    url:
+      params.operation === "upload"
+        ? "https://storage.googleapis.com/bucket/signed-upload"
+        : "https://storage.googleapis.com/bucket/signed-download",
+    bundleKey: params.bundleKey ?? "uploads/org-1/bundle-abc.vbundle",
+    expiresAt: new Date(Date.now() + 3600_000).toISOString(),
+  }));
+  localRuntimeExportToGcsMock.mockReset();
+  localRuntimeExportToGcsMock.mockResolvedValue({
+    jobId: "platform-export-job-1",
+  });
+  localRuntimePollJobStatusMock.mockReset();
+  localRuntimePollJobStatusMock.mockResolvedValue({
+    jobId: "platform-export-job-1",
+    type: "export",
+    status: "complete",
+    result: { manifest_sha256: "abc123def456" },
+  });
+  getBackupsDirMock.mockReset();
+  getBackupsDirMock.mockReturnValue("/tmp/backups-default");
+  mkdirSyncMock.mockReset();
+  mkdirSyncMock.mockImplementation((() => undefined) as never);
+  writeFileSyncMock.mockReset();
+  writeFileSyncMock.mockImplementation(() => undefined);
+});
+afterEach(() => {
+  globalThis.fetch = originalFetch;
+});
+afterAll(() => {
+  // Restore module-level spies so they don't bleed into other test files
+  // when bun test runs the whole suite.
+  findAssistantByNameMock.mockRestore();
+  readPlatformTokenMock.mockRestore();
+  getPlatformUrlMock.mockRestore();
+  platformRequestSignedUrlMock.mockRestore();
+  localRuntimeExportToGcsMock.mockRestore();
+  localRuntimePollJobStatusMock.mockRestore();
+  getBackupsDirMock.mockRestore();
+  mkdirSyncMock.mockRestore();
+  writeFileSyncMock.mockRestore();
+  rmSync(testDir, { recursive: true, force: true });
+});
+import { backup } from "../commands/backup.js";
+// ---------------------------------------------------------------------------
+// Helper: simulated GCS download response
+// ---------------------------------------------------------------------------
+function mockGcsDownload(body: Uint8Array, ok = true, status = 200) {
+  globalThis.fetch = mock(async () => {
+    const responseBody: BodyInit = ok
+      ? new Blob([body as unknown as ArrayBuffer])
+      : "boom";
+    return new Response(responseBody, {
+      status,
+      statusText: ok ? "OK" : "Error",
+    });
+  }) as unknown as typeof globalThis.fetch;
+}
+describe("vellum backup <platform-managed>: GCS happy path", () => {
+  test("requests upload URL → kicks off runtime export → polls → downloads from GCS → writes file", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    const bytes = new Uint8Array([1, 2, 3, 4]);
+    mockGcsDownload(bytes);
+    await backup();
+    // Upload-URL request to the platform.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "upload" }),
+      "platform-token",
+      "https://platform.vellum.ai",
+    );
+    // Runtime export-to-gcs kicked off via the entry-aware helper. URL
+    // construction is exercised in `local-runtime-client.test.ts`; here we
+    // assert the helper got the right entry + token + params.
+    expect(localRuntimeExportToGcsMock).toHaveBeenCalledWith(
+      expect.objectContaining({
+        cloud: "vellum",
+        runtimeUrl: "https://platform.vellum.ai",
+        assistantId: "11111111-2222-3333-4444-555555555555",
+      }),
+      "platform-token",
+      expect.objectContaining({
+        uploadUrl: "https://storage.googleapis.com/bucket/signed-upload",
+        description: "CLI backup",
+      }),
+    );
+    // Poll uses the entry-aware helper (wildcard URL, NOT the dedicated
+    // platform jobs/{id}/ endpoint).
+    expect(localRuntimePollJobStatusMock).toHaveBeenCalledWith(
+      expect.objectContaining({ cloud: "vellum" }),
+      "platform-token",
+      "platform-export-job-1",
+    );
+    // Download URL keyed off the upload's bundleKey.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      {
+        operation: "download",
+        bundleKey: "uploads/org-1/bundle-abc.vbundle",
+      },
+      "platform-token",
+      "https://platform.vellum.ai",
+    );
+    // GCS fetch went directly to the signed download URL with no auth.
+    const gcsFetch = globalThis.fetch as unknown as ReturnType<typeof mock>;
+    expect(gcsFetch).toHaveBeenCalledWith(
+      "https://storage.googleapis.com/bucket/signed-download",
+    );
+    // File written to disk with the bytes from GCS.
+    expect(writeFileSyncMock).toHaveBeenCalledTimes(1);
+    const [outputPath, written] = writeFileSyncMock.mock.calls[0]!;
+    expect(written).toEqual(bytes);
+    expect(typeof outputPath).toBe("string");
+    expect(outputPath as string).toMatch(
+      /\/tmp\/backups-default\/my-platform-.*\.vbundle$/,
+    );
+    expect(mkdirSyncMock).toHaveBeenCalled();
+  });
+  test("--output override is respected", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform", "--output", "/custom/path/backup.vbundle");
+    mockGcsDownload(new Uint8Array([7, 7, 7]));
+    await backup();
+    expect(writeFileSyncMock).toHaveBeenCalledTimes(1);
+    expect(writeFileSyncMock.mock.calls[0]![0]).toBe(
+      "/custom/path/backup.vbundle",
+    );
+  });
+  test("default output path is getBackupsDir() + name-timestamp.vbundle", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array([1]));
+    await backup();
+    const [outputPath] = writeFileSyncMock.mock.calls[0]!;
+    expect(outputPath as string).toMatch(
+      /^\/tmp\/backups-default\/my-platform-/,
+    );
+    expect(outputPath as string).toMatch(/\.vbundle$/);
+  });
+  test("signed-URL requests target entry.runtimeUrl, not getPlatformUrl() — regression for staging/dev assistants", async () => {
+    // Assistant lives on a non-default platform instance (e.g. staging).
+    // `getPlatformUrl()` still returns the default — picking it up for
+    // signed URLs would target the wrong GCS bucket.
+    const stagingEntry = {
+      ...VELLUM_ENTRY,
+      runtimeUrl: "https://staging-platform.vellum.ai",
+    };
+    findAssistantByNameMock.mockReturnValue(stagingEntry);
+    getPlatformUrlMock.mockReturnValue("https://platform.vellum.ai");
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array([9]));
+    await backup();
+    // Both upload and download URL requests are pinned to the entry's
+    // runtimeUrl. The signed URLs returned by the platform target the
+    // GCS bucket the runtime can reach, not the default platform's.
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "upload" }),
+      "platform-token",
+      "https://staging-platform.vellum.ai",
+    );
+    expect(platformRequestSignedUrlMock).toHaveBeenCalledWith(
+      expect.objectContaining({ operation: "download" }),
+      "platform-token",
+      "https://staging-platform.vellum.ai",
+    );
+    // No call should have used the default platform URL.
+    const calls = platformRequestSignedUrlMock.mock.calls;
+    for (const call of calls) {
+      expect(call[2]).toBe("https://staging-platform.vellum.ai");
+    }
+  });
+  test("download-URL request uses the refreshed platform token if polling re-authed mid-export", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    // Stub the poll helper so it resolves straight to a terminal "complete"
+    // status. Note that this stub does not invoke any `refreshOn401` hook, so
+    // no mid-export token refresh is actually simulated by this test.
+    localRuntimePollJobStatusMock.mockReset();
+    localRuntimePollJobStatusMock.mockImplementation(async () => ({
+      jobId: "platform-export-job-1",
+      type: "export",
+      status: "complete",
+      result: {},
+    }));
+    // Make readPlatformToken return "platform-token-old" on its first call
+    // and "platform-token-new" on every later call, mimicking the "user
+    // re-ran `vellum login` in another terminal" scenario. The helper's
+    // pollJobUntilDone calls refreshOn401 only when its own request 401s,
+    // which the stubbed poll never does, so the assertions below check
+    // token consistency across calls rather than a specific token value.
+    readPlatformTokenMock.mockReset();
+    readPlatformTokenMock.mockReturnValueOnce("platform-token-old");
+    readPlatformTokenMock.mockReturnValue("platform-token-new");
+    // What this test actually pins is a structural invariant: backup threads
+    // one token variable (`exportPlatformToken`, the closure variable) through
+    // the upload signed-URL request, the export kickoff, the poll, AND the
+    // download signed-URL request. The current implementation only re-reads
+    // the token inside pollJobUntilDone's `refreshOn401`, which is not
+    // triggered here, so all four calls are expected to carry the same token.
+    mockGcsDownload(new Uint8Array([1]));
+    await backup();
+    // All four token-bearing platform calls (upload signed-URL, runtime
+    // export-to-gcs kickoff, poll, download signed-URL) must use the
+    // same token string. If the download step fell back to the captured
+    // `platformToken` parameter instead of `exportPlatformToken`, a
+    // future poll-loop refresh would silently break this invariant.
+    const uploadCallToken = platformRequestSignedUrlMock.mock.calls.find(
+      (c) => (c[0] as { operation: string }).operation === "upload",
+    )![1];
+    const downloadCallToken = platformRequestSignedUrlMock.mock.calls.find(
+      (c) => (c[0] as { operation: string }).operation === "download",
+    )![1];
+    expect(downloadCallToken).toBe(uploadCallToken);
+    const kickoffToken = localRuntimeExportToGcsMock.mock.calls[0]![1];
+    expect(downloadCallToken).toBe(kickoffToken);
+    const pollToken = localRuntimePollJobStatusMock.mock.calls[0]![1];
+    expect(downloadCallToken).toBe(pollToken);
+  });
+});
+describe("vellum backup <platform-managed>: failure cases", () => {
+  test("not logged in (no platform token) exits with 'Run vellum login'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    readPlatformTokenMock.mockReturnValue(null);
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      expect(consoleErrorSpy).toHaveBeenCalledWith(
+        expect.stringContaining("Not logged in"),
+      );
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("MigrationInProgressError on kickoff exits with 'Another backup or teleport export'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    localRuntimeExportToGcsMock.mockRejectedValue(
+      new MigrationInProgressError("export_in_progress", "existing-job-99"),
+    );
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      const calls = consoleErrorSpy.mock.calls.map((c) => c[0]);
+      expect(
+        calls.some(
+          (m) =>
+            typeof m === "string" &&
+            m.includes("Another backup or teleport export") &&
+            m.includes("existing-job-99"),
+        ),
+      ).toBe(true);
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("terminal=failed exits with 'Export failed: <reason>'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    localRuntimePollJobStatusMock.mockResolvedValue({
+      jobId: "platform-export-job-1",
+      type: "export",
+      status: "failed",
+      error: "vbundle build crashed",
+    });
+    setArgv("my-platform");
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      expect(consoleErrorSpy).toHaveBeenCalledWith(
+        expect.stringContaining("Export failed: vbundle build crashed"),
+      );
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+  test("GCS fetch !ok exits with 'Failed to fetch bundle from GCS (<status>)'", async () => {
+    findAssistantByNameMock.mockReturnValue(VELLUM_ENTRY);
+    setArgv("my-platform");
+    mockGcsDownload(new Uint8Array(), false, 403);
+    const consoleErrorSpy = spyOn(console, "error").mockImplementation(
+      () => undefined,
+    );
+    try {
+      await expect(backup()).rejects.toThrow("process.exit:1");
+      const calls = consoleErrorSpy.mock.calls.map((c) => c[0]);
+      expect(
+        calls.some(
+          (m) =>
+            typeof m === "string" &&
+            m.includes("Failed to fetch bundle from GCS") &&
+            m.includes("403"),
+        ),
+      ).toBe(true);
+    } finally {
+      consoleErrorSpy.mockRestore();
+    }
+  });
+});

package/src/__tests__/config-utils.test.ts CHANGED Viewed

@@ -1,6 +1,19 @@
+import { readFileSync, rmSync } from "fs";
 import { describe, expect, test } from "bun:test";
-import { buildInitialConfig, buildNestedConfig } from "../lib/config-utils.js";
+import { buildNestedConfig, writeInitialConfig } from "../lib/config-utils.js";
+function readInitialConfig(
+  configValues: Record<string, string>,
+): Record<string, unknown> {
+  const path = writeInitialConfig(configValues);
+  expect(path).toBeDefined();
+  try {
+    return JSON.parse(readFileSync(path!, "utf-8")) as Record<string, unknown>;
+  } finally {
+    if (path !== undefined) rmSync(path, { force: true });
+  }
+}
 describe("config-utils", () => {
   test("buildNestedConfig only converts dot-notation values", () => {
@@ -19,9 +32,9 @@ describe("config-utils", () => {
     });
   });
-  test("buildInitialConfig seeds mainAgent callSite for Anthropic default", () => {
+  test("writeInitialConfig does not add a mainAgent callSite for Anthropic defaults", () => {
     expect(
-      buildInitialConfig({
+      readInitialConfig({
         "llm.default.provider": "anthropic",
         "llm.default.model": "claude-opus-4-7",
       }),
@@ -31,41 +44,35 @@ describe("config-utils", () => {
           provider: "anthropic",
           model: "claude-opus-4-7",
         },
-        callSites: {
-          mainAgent: {
-            model: "claude-opus-4-7",
-            maxTokens: 32000,
-          },
-        },
       },
     });
   });
-  test("buildInitialConfig seeds Opus when provider falls back to Anthropic", () => {
+  test("writeInitialConfig preserves profile-based Anthropic model selection", () => {
     expect(
-      buildInitialConfig({
-        "services.inference.mode": "managed",
+      readInitialConfig({
+        "llm.activeProfile": "quality-optimized",
+        "llm.profiles.quality-optimized.provider": "anthropic",
+        "llm.profiles.quality-optimized.model": "claude-opus-4-7",
+        "llm.profiles.quality-optimized.maxTokens": "32000",
       }),
     ).toEqual({
-      services: {
-        inference: {
-          mode: "managed",
-        },
-      },
       llm: {
-        callSites: {
-          mainAgent: {
+        activeProfile: "quality-optimized",
+        profiles: {
+          "quality-optimized": {
+            provider: "anthropic",
             model: "claude-opus-4-7",
-            maxTokens: 32000,
+            maxTokens: "32000",
           },
         },
       },
     });
   });
-  test("buildInitialConfig preserves explicit mainAgent overrides", () => {
+  test("writeInitialConfig preserves explicit mainAgent overrides without rewriting them", () => {
     expect(
-      buildInitialConfig({
+      readInitialConfig({
         "llm.default.provider": "anthropic",
         "llm.default.model": "claude-opus-4-7",
         "llm.callSites.mainAgent.model": "claude-haiku-4-5-20251001",
@@ -85,9 +92,9 @@ describe("config-utils", () => {
     });
   });
-  test("buildInitialConfig respects explicit non-default Anthropic models", () => {
+  test("writeInitialConfig respects explicit non-default Anthropic models", () => {
     expect(
-      buildInitialConfig({
+      readInitialConfig({
         "llm.default.provider": "anthropic",
         "llm.default.model": "claude-haiku-4-5-20251001",
       }),
@@ -101,9 +108,9 @@ describe("config-utils", () => {
     });
   });
-  test("buildInitialConfig respects active profile provider overrides", () => {
+  test("writeInitialConfig leaves active OpenAI profile config unchanged", () => {
     expect(
-      buildInitialConfig({
+      readInitialConfig({
         "llm.activeProfile": "fast",
         "llm.profiles.fast.provider": "openai",
         "llm.profiles.fast.model": "gpt-5.5",
@@ -121,29 +128,9 @@ describe("config-utils", () => {
     });
   });
-  test("buildInitialConfig uses active profile model when deciding to seed", () => {
-    expect(
-      buildInitialConfig({
-        "llm.activeProfile": "fast",
-        "llm.profiles.fast.provider": "anthropic",
-        "llm.profiles.fast.model": "claude-haiku-4-5-20251001",
-      }),
-    ).toEqual({
-      llm: {
-        activeProfile: "fast",
-        profiles: {
-          fast: {
-            provider: "anthropic",
-            model: "claude-haiku-4-5-20251001",
-          },
-        },
-      },
-    });
-  });
-  test("buildInitialConfig does not seed Opus for non-Anthropic providers", () => {
+  test("writeInitialConfig does not add Opus for non-Anthropic providers", () => {
     expect(
-      buildInitialConfig({
+      readInitialConfig({
         "llm.default.provider": "openai",
         "llm.default.model": "gpt-5.5",
       }),