npm - @vellumai/assistant - Versions diffs - 0.8.2 → 0.8.3 - Mend

@vellumai/assistant 0.8.2 → 0.8.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (231) hide show

package/ARCHITECTURE.md +11 -12
package/docker-entrypoint.sh +13 -1
package/docker-init-apt-root.sh +79 -6
package/openapi.yaml +336 -21
package/package.json +1 -1
package/src/__tests__/agent-loop-exit-reason.test.ts +272 -0
package/src/__tests__/agent-loop-provider-error-recording.test.ts +195 -0
package/src/__tests__/compactor-tail-resolution.test.ts +107 -1
package/src/__tests__/config-get-vision-flag.test.ts +136 -0
package/src/__tests__/config-loader-backfill.test.ts +115 -18
package/src/__tests__/context-token-estimator.test.ts +30 -65
package/src/__tests__/conversation-agent-loop.test.ts +57 -1
package/src/__tests__/conversation-media-retry.test.ts +19 -8
package/src/__tests__/conversation-runtime-assembly.test.ts +26 -4
package/src/__tests__/date-context.test.ts +45 -0
package/src/__tests__/external-plugin-loader.test.ts +91 -19
package/src/__tests__/guardian-action-no-hardcoded-copy.test.ts +0 -1
package/src/__tests__/guardian-dispatch.test.ts +1 -0
package/src/__tests__/heartbeat-service.test.ts +24 -164
package/src/__tests__/helpers/channel-test-adapter.ts +0 -2
package/src/__tests__/host-app-control-proxy.test.ts +241 -0
package/src/__tests__/host-proxy-preactivation.test.ts +200 -13
package/src/__tests__/injector-background-turn.test.ts +153 -0
package/src/__tests__/injector-chain.test.ts +5 -0
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +9 -2
package/src/__tests__/llm-callsite-catalog.test.ts +25 -0
package/src/__tests__/llm-catalog-parity.test.ts +3 -0
package/src/__tests__/llm-request-log-agent-loop-exit-reason.test.ts +116 -0
package/src/__tests__/llm-request-log-error-payload.test.ts +138 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +2 -0
package/src/__tests__/llm-resolver.test.ts +255 -2
package/src/__tests__/managed-profile-guard.test.ts +10 -0
package/src/__tests__/notification-decision-fallback.test.ts +0 -91
package/src/__tests__/notification-decision-strategy.test.ts +14 -31
package/src/__tests__/notification-deep-link.test.ts +15 -0
package/src/__tests__/notification-guardian-path.test.ts +1 -2
package/src/__tests__/notification-platform-adapter.test.ts +5 -4
package/src/__tests__/notification-telegram-adapter.test.ts +1 -0
package/src/__tests__/notification-vellum-adapter.test.ts +113 -0
package/src/__tests__/openai-provider.test.ts +218 -3
package/src/__tests__/openai-responses-cutover-guard.test.ts +3 -3
package/src/__tests__/openrouter-provider-only.test.ts +51 -3
package/src/__tests__/openrouter-token-estimation.test.ts +34 -25
package/src/__tests__/platform-proxy-context.test.ts +6 -1
package/src/__tests__/plugin-tool-contribution.test.ts +3 -3
package/src/__tests__/plugin-types.test.ts +2 -2
package/src/__tests__/provider-catalog-visibility.test.ts +16 -0
package/src/__tests__/provider-platform-proxy-integration.test.ts +27 -25
package/src/__tests__/secret-routes-platform-proxy.test.ts +1 -1
package/src/__tests__/system-prompt.test.ts +6 -73
package/src/__tests__/workspace-migration-087-memory-router-balanced-profile.test.ts +228 -0
package/src/a2a/__tests__/agent-card.test.ts +98 -0
package/src/a2a/__tests__/e2e-a2a-channel.test.ts +597 -0
package/src/a2a/__tests__/protocol-helpers.test.ts +113 -0
package/src/a2a/__tests__/task-store.test.ts +246 -0
package/src/a2a/agent-card.ts +58 -0
package/src/a2a/feature-gate.ts +8 -0
package/src/a2a/protocol-constants.ts +21 -0
package/src/a2a/protocol-errors.ts +50 -0
package/src/a2a/protocol-types.ts +162 -0
package/src/a2a/task-store.ts +168 -0
package/src/agent/loop.ts +167 -18
package/src/channels/config.ts +9 -0
package/src/channels/types.ts +14 -0
package/src/cli/{__tests__ → commands/__tests__}/notifications.test.ts +201 -28
package/src/cli/commands/__tests__/schedules.test.ts +469 -0
package/src/cli/commands/notifications.ts +65 -35
package/src/cli/commands/plugins.ts +67 -0
package/src/cli/commands/schedules.ts +297 -5
package/src/cli/lib/__tests__/search-plugins.test.ts +261 -0
package/src/cli/lib/install-from-github.ts +8 -9
package/src/cli/lib/search-plugins.ts +163 -0
package/src/cli/program.ts +14 -0
package/src/config/assistant-feature-flags.ts +24 -54
package/src/config/bundled-skills/app-builder/SKILL.md +117 -1
package/src/config/bundled-skills/phone-calls/SKILL.md +1 -1
package/src/config/call-site-defaults.ts +105 -0
package/src/config/feature-flag-registry.json +21 -29
package/src/config/llm-resolver.ts +52 -1
package/src/config/schema.ts +2 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +3 -3
package/src/config/schemas/channels.ts +9 -0
package/src/config/schemas/conversations.ts +10 -0
package/src/config/schemas/heartbeat.ts +14 -0
package/src/config/schemas/llm.ts +1 -3
package/src/config/schemas/memory-retrospective.ts +1 -1
package/src/config/schemas/memory-v2.ts +4 -4
package/src/config/schemas/memory.ts +3 -1
package/src/config/seed-inference-profiles.ts +99 -29
package/src/context/compactor.ts +72 -12
package/src/context/token-estimator.ts +32 -34
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -22
package/src/daemon/conversation-agent-loop-handlers.ts +78 -0
package/src/daemon/conversation-agent-loop.ts +29 -2
package/src/daemon/conversation-runtime-assembly.ts +9 -0
package/src/daemon/conversation.ts +0 -7
package/src/daemon/date-context.ts +40 -0
package/src/daemon/guardian-action-generators.ts +1 -125
package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +248 -0
package/src/daemon/handlers/__tests__/config-a2a-invite.test.ts +154 -0
package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +133 -0
package/src/daemon/handlers/__tests__/config-a2a.test.ts +95 -0
package/src/daemon/handlers/config-a2a.ts +289 -0
package/src/daemon/handlers/conversations.ts +1 -0
package/src/daemon/host-app-control-proxy.ts +69 -18
package/src/daemon/host-proxy-preactivation.ts +85 -18
package/src/daemon/lifecycle.ts +49 -61
package/src/daemon/memory-v2-startup.ts +49 -13
package/src/daemon/message-types/notifications.ts +21 -0
package/src/daemon/pkb-reminder-builder.test.ts +10 -53
package/src/daemon/pkb-reminder-builder.ts +4 -19
package/src/daemon/process-message.ts +3 -0
package/src/daemon/skill-memory-refresh.ts +5 -1
package/src/daemon/wake-target-adapter.ts +2 -0
package/src/export/__tests__/transcript-formatter.test.ts +121 -0
package/src/export/transcript-formatter.ts +54 -20
package/src/heartbeat/__tests__/heartbeat-service.test.ts +44 -0
package/src/heartbeat/heartbeat-service.ts +34 -191
package/src/home/__tests__/feed-types.test.ts +40 -0
package/src/home/feed-types.ts +14 -2
package/src/ipc/cli-client.ts +147 -45
package/src/memory/__tests__/conversation-queries.test.ts +220 -0
package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +2 -50
package/src/memory/__tests__/memory-retrospective-job.test.ts +87 -4
package/src/memory/conversation-queries.ts +87 -1
package/src/memory/conversation-title-service.ts +26 -4
package/src/memory/db-init.ts +6 -0
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +84 -3
package/src/memory/graph/conversation-graph-memory.ts +18 -6
package/src/memory/graph/tools.ts +6 -37
package/src/memory/invite-store.ts +53 -0
package/src/memory/llm-request-log-source-clickhouse.ts +7 -2
package/src/memory/llm-request-log-store.ts +92 -1
package/src/memory/memory-retrospective-enqueue.ts +1 -20
package/src/memory/memory-retrospective-job.ts +33 -6
package/src/memory/migrations/250-provider-connection-base-url-and-models.ts +28 -0
package/src/memory/migrations/251-a2a-tasks.ts +49 -0
package/src/memory/migrations/252-llm-request-log-agent-loop-exit-reason.ts +32 -0
package/src/memory/migrations/index.ts +3 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/a2a.ts +15 -0
package/src/memory/schema/index.ts +1 -0
package/src/memory/schema/inference.ts +2 -0
package/src/memory/schema/infrastructure.ts +1 -0
package/src/memory/v2/__tests__/activation-store.test.ts +25 -23
package/src/memory/v2/__tests__/cli-command-store.test.ts +404 -0
package/src/memory/v2/__tests__/frontmatter-sweep.test.ts +25 -4
package/src/memory/v2/__tests__/injection.test.ts +190 -3
package/src/memory/v2/__tests__/static-context.test.ts +12 -1
package/src/memory/v2/activation-store.ts +14 -16
package/src/memory/v2/cli-command-content.ts +19 -0
package/src/memory/v2/cli-command-store.ts +304 -0
package/src/memory/v2/frontmatter-sweep.ts +7 -1
package/src/memory/v2/injection.ts +49 -20
package/src/memory/v2/page-index.ts +38 -13
package/src/memory/v2/static-context.ts +4 -4
package/src/memory/v2/types.ts +23 -0
package/src/messaging/providers/a2a/__tests__/deliver.test.ts +274 -0
package/src/messaging/providers/a2a/deliver.ts +156 -0
package/src/messaging/providers/gmail/client.ts +9 -2
package/src/messaging/providers/index.ts +11 -2
package/src/notifications/__tests__/broadcaster.test.ts +203 -0
package/src/notifications/__tests__/decision-engine.test.ts +283 -0
package/src/notifications/__tests__/deterministic-checks.test.ts +286 -0
package/src/notifications/__tests__/emit-signal-home-feed.test.ts +1 -0
package/src/notifications/__tests__/home-feed-side-effect.test.ts +430 -7
package/src/notifications/adapters/macos.ts +12 -2
package/src/notifications/broadcaster.ts +29 -4
package/src/notifications/copy-composer.ts +17 -64
package/src/notifications/decision-engine.ts +111 -44
package/src/notifications/deterministic-checks.ts +96 -0
package/src/notifications/emit-signal.ts +1 -0
package/src/notifications/home-feed-side-effect.ts +85 -6
package/src/notifications/signal.ts +0 -4
package/src/notifications/types.ts +8 -0
package/src/oauth/platform-connection.test.ts +43 -3
package/src/oauth/platform-connection.ts +13 -4
package/src/plugins/defaults/injectors.ts +38 -19
package/src/plugins/external-plugin-loader.ts +82 -10
package/src/plugins/types.ts +16 -7
package/src/prompts/__tests__/system-prompt.test.ts +6 -51
package/src/prompts/__tests__/task-progress-hint-section.test.ts +4 -8
package/src/prompts/system-prompt.ts +0 -8
package/src/prompts/templates/BOOTSTRAP.md +5 -5
package/src/prompts/templates/system-sections.ts +0 -9
package/src/providers/__tests__/inference.test.ts +2 -0
package/src/providers/call-site-routing.ts +24 -6
package/src/providers/connection-resolution.ts +63 -13
package/src/providers/inference/__tests__/adapter-factory-openai-compatible.test.ts +74 -0
package/src/providers/inference/__tests__/connections-openai-compatible.test.ts +175 -0
package/src/providers/inference/__tests__/connections-status-label.test.ts +15 -0
package/src/providers/inference/adapter-factory.ts +9 -20
package/src/providers/inference/auth.ts +12 -0
package/src/providers/inference/backfill.ts +14 -1
package/src/providers/inference/connections.ts +85 -5
package/src/providers/inference/resolve-auth.ts +2 -0
package/src/providers/model-catalog.ts +199 -244
package/src/providers/model-intents.ts +3 -3
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +235 -0
package/src/providers/openai/chat-completions-provider.ts +159 -6
package/src/providers/openrouter/client.ts +42 -4
package/src/providers/platform-proxy/constants.ts +3 -4
package/src/providers/provider-catalog-visibility.ts +3 -1
package/src/providers/provider-send-message.ts +27 -12
package/src/providers/registry.ts +30 -1
package/src/runtime/agent-wake.ts +61 -1
package/src/runtime/auth/route-policy.ts +13 -0
package/src/runtime/http-server.ts +7 -16
package/src/runtime/http-types.ts +0 -47
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +258 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +66 -4
package/src/runtime/routes/__tests__/inference-provider-connection-routes.test.ts +275 -44
package/src/runtime/routes/__tests__/llm-call-sites-routes.test.ts +12 -0
package/src/runtime/routes/channel-availability-routes.ts +5 -0
package/src/runtime/routes/consolidation-routes.ts +100 -0
package/src/runtime/routes/conversation-query-routes.ts +70 -11
package/src/runtime/routes/conversation-routes.ts +7 -0
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/inference-provider-connection-routes.ts +134 -1
package/src/runtime/routes/integrations/a2a.ts +235 -0
package/src/runtime/routes/llm-call-sites-routes.ts +11 -1
package/src/runtime/routes/subagents-routes.ts +41 -0
package/src/subagent/manager.ts +2 -0
package/src/tools/memory/register.ts +1 -9
package/src/tools/registry.ts +2 -2
package/src/tools/types.ts +37 -2
package/src/workspace/migrations/087-memory-router-balanced-profile.ts +91 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/guardian-action-conversation-turn.test.ts +0 -441
package/src/memory/graph/__tests__/remember-description.test.ts +0 -55
package/src/runtime/guardian-action-conversation-turn.ts +0 -99

package/src/__tests__/config-get-vision-flag.test.ts ADDED Viewed

@@ -0,0 +1,136 @@
+/**
+ * Verifies that `GET /v1/config` enriches each profile in `llm.profiles`
+ * with `supportsVision` resolved from the model catalog.
+ */
+import { describe, expect, mock, test } from "bun:test";
+import { makeMockLogger } from "./helpers/mock-logger.js";
+mock.module("../util/logger.js", () => ({
+  getLogger: () => makeMockLogger(),
+}));
+// ---------------------------------------------------------------------------
+// Mocks for handleGetConfig's transitive deps
+// ---------------------------------------------------------------------------
+let rawConfig: Record<string, unknown> = {};
+mock.module("../config/loader.js", () => ({
+  loadRawConfig: () => structuredClone(rawConfig),
+  saveRawConfig: () => {},
+  deepMergeOverwrite: () => {},
+  getConfig: () => rawConfig,
+  getDeploymentContextDefaults: () => ({}),
+  fillContextDefaultsForMissingKeys: () => {},
+  invalidateConfigCache: () => {},
+  setNestedValue: () => {},
+}));
+mock.module("../providers/registry.js", () => ({
+  initializeProviders: async () => {},
+}));
+mock.module("../memory/embedding-backend.js", () => ({
+  clearEmbeddingBackendCache: () => {},
+}));
+mock.module("../security/secret-allowlist.js", () => ({
+  validateAllowlistFile: () => null,
+}));
+import { ROUTES } from "../runtime/routes/conversation-query-routes.js";
+const configGetRoute = ROUTES.find((r) => r.operationId === "config_get")!;
+// ---------------------------------------------------------------------------
+// Tests
+// ---------------------------------------------------------------------------
+describe("GET /v1/config profile vision enrichment", () => {
+  test("profile with a non-vision model gets supportsVision: false", () => {
+    rawConfig = {
+      llm: {
+        profiles: {
+          "test-no-vision": {
+            provider: "fireworks",
+            model: "accounts/fireworks/models/kimi-k2p5",
+          },
+        },
+      },
+    };
+    const result = configGetRoute.handler({}) as {
+      llm?: {
+        profiles?: Record<string, { supportsVision?: boolean }>;
+      };
+    };
+    expect(result?.llm?.profiles?.["test-no-vision"]?.supportsVision).toBe(
+      false,
+    );
+  });
+  test("profile with a vision-capable model gets supportsVision: true", () => {
+    rawConfig = {
+      llm: {
+        profiles: {
+          "test-vision": {
+            provider: "anthropic",
+            model: "claude-opus-4-6",
+          },
+        },
+      },
+    };
+    const result = configGetRoute.handler({}) as {
+      llm?: {
+        profiles?: Record<string, { supportsVision?: boolean }>;
+      };
+    };
+    expect(result?.llm?.profiles?.["test-vision"]?.supportsVision).toBe(true);
+  });
+  test("profile with an unknown model defaults supportsVision to true (fail-open)", () => {
+    rawConfig = {
+      llm: {
+        profiles: {
+          "test-unknown": {
+            provider: "anthropic",
+            model: "some-unknown-model-xyz",
+          },
+        },
+      },
+    };
+    const result = configGetRoute.handler({}) as {
+      llm?: {
+        profiles?: Record<string, { supportsVision?: boolean }>;
+      };
+    };
+    expect(result?.llm?.profiles?.["test-unknown"]?.supportsVision).toBe(true);
+  });
+  test("profile without provider/model is left without supportsVision", () => {
+    rawConfig = {
+      llm: {
+        profiles: {
+          "test-empty": {},
+        },
+      },
+    };
+    const result = configGetRoute.handler({}) as {
+      llm?: {
+        profiles?: Record<string, { supportsVision?: boolean }>;
+      };
+    };
+    expect(
+      result?.llm?.profiles?.["test-empty"]?.supportsVision,
+    ).toBeUndefined();
+  });
+});

package/src/__tests__/config-loader-backfill.test.ts CHANGED Viewed

@@ -7,6 +7,7 @@ import {
   writeFileSync,
 } from "node:fs";
 import { join } from "node:path";
+import { Database } from "bun:sqlite";
 import {
   afterAll,
   afterEach,
@@ -17,6 +18,8 @@ import {
   test,
 } from "bun:test";
+import { drizzle } from "drizzle-orm/bun-sqlite";
 // ---------------------------------------------------------------------------
 // Mocks — declared before imports that depend on platform/logger
 // ---------------------------------------------------------------------------
@@ -73,6 +76,12 @@ import {
   mergeDefaultWorkspaceConfig,
 } from "../config/loader.js";
 import { seedInferenceProfiles } from "../config/seed-inference-profiles.js";
+import type { DrizzleDb } from "../memory/db-connection.js";
+import { migrateCreateProviderConnections } from "../memory/migrations/243-provider-connections.js";
+import { migrateProviderConnectionStatusLabel } from "../memory/migrations/244-provider-connection-status-label.js";
+import { migrateProviderConnectionBaseUrlAndModels } from "../memory/migrations/250-provider-connection-base-url-and-models.js";
+import * as schema from "../memory/schema.js";
+import { getConnection } from "../providers/inference/connections.js";
 import { _setStorePath } from "../security/encrypted-store.js";
 // ---------------------------------------------------------------------------
@@ -83,15 +92,26 @@ function writeConfig(obj: unknown): void {
   writeFileSync(CONFIG_PATH, JSON.stringify(obj, null, 2) + "\n");
 }
-function mergeDefaultConfigAndSeedInferenceProfiles(): void {
+function mergeDefaultConfigAndSeedInferenceProfiles(db?: DrizzleDb): void {
   const defaultConfigMerge = mergeDefaultWorkspaceConfig();
   seedInferenceProfiles({
     preserveProfileNames: defaultConfigMerge.providedLlmProfileNames,
     preserveActiveProfile: defaultConfigMerge.providedLlmActiveProfile,
     isHatch: defaultConfigMerge.hadOverlay,
+    db,
   });
 }
+function createProviderConnectionsDb(): DrizzleDb {
+  const sqlite = new Database(":memory:");
+  sqlite.exec("PRAGMA journal_mode=WAL");
+  const db = drizzle(sqlite, { schema });
+  migrateCreateProviderConnections(db);
+  migrateProviderConnectionStatusLabel(db);
+  migrateProviderConnectionBaseUrlAndModels(db);
+  return db;
+}
 // ---------------------------------------------------------------------------
 // Tests: deepMergeOverwrite (unit) — JSON-null-as-deletion semantics
 //
@@ -523,7 +543,7 @@ describe("loadConfig startup behavior", () => {
     expect(raw.llm.profiles["custom-balanced"].provider_connection).toBe(
       "anthropic-personal",
     );
-    // Managed profiles are also seeded for anthropic-managed.
+    // Managed balanced profile is seeded for anthropic-managed.
     expect(raw.llm.profiles.balanced.provider).toBe("anthropic");
     expect(raw.llm.profiles.balanced.provider_connection).toBe(
       "anthropic-managed",
@@ -589,11 +609,8 @@ describe("loadConfig startup behavior", () => {
     const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
     writeFileSync(
       overlayPath,
-      JSON.stringify(
-        { llm: { default: { provider: "openai" } } },
-        null,
-        2,
-      ) + "\n",
+      JSON.stringify({ llm: { default: { provider: "openai" } } }, null, 2) +
+        "\n",
     );
     process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;
@@ -617,7 +634,7 @@ describe("loadConfig startup behavior", () => {
       "gpt-5.4-nano",
     );
-    // Managed anthropic profiles are also seeded.
+    // Managed profiles are also seeded (balanced uses Anthropic).
     expect(raw.llm.profiles.balanced.provider).toBe("anthropic");
     expect(raw.llm.profiles.balanced.provider_connection).toBe(
       "anthropic-managed",
@@ -981,11 +998,8 @@ describe("seedInferenceProfiles BYOK-mode managed profile labels", () => {
     const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
     writeFileSync(
       overlayPath,
-      JSON.stringify(
-        { llm: { default: { provider: "anthropic" } } },
-        null,
-        2,
-      ) + "\n",
+      JSON.stringify({ llm: { default: { provider: "anthropic" } } }, null, 2) +
+        "\n",
     );
     process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;
@@ -997,6 +1011,92 @@ describe("seedInferenceProfiles BYOK-mode managed profile labels", () => {
     expect(config.llm.profiles["cost-optimized"]?.status).toBe("disabled");
   });
+  test("off-platform managed-inference hatch keeps selected managed connection active", () => {
+    const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
+    writeFileSync(
+      overlayPath,
+      JSON.stringify(
+        {
+          llm: {
+            default: { provider: "anthropic" },
+            activeProfile: "balanced",
+          },
+        },
+        null,
+        2,
+      ) + "\n",
+    );
+    process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;
+    const db = createProviderConnectionsDb();
+    mergeDefaultConfigAndSeedInferenceProfiles(db);
+    const raw = JSON.parse(readFileSync(CONFIG_PATH, "utf-8"));
+    expect(raw.llm.activeProfile).toBe("balanced");
+    expect(raw.llm.profiles.balanced.provider_connection).toBe(
+      "anthropic-managed",
+    );
+    expect("status" in raw.llm.profiles.balanced).toBe(false);
+    expect(getConnection(db, "anthropic-managed")?.status).toBe("active");
+    expect(getConnection(db, "openai-managed")?.status).toBe("disabled");
+    expect(getConnection(db, "gemini-managed")?.status).toBe("disabled");
+  });
+  test("off-platform managed-inference hatch respects explicit non-managed active connection", () => {
+    const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
+    writeFileSync(
+      overlayPath,
+      JSON.stringify(
+        {
+          llm: {
+            default: { provider: "anthropic" },
+            profiles: {
+              balanced: {
+                source: "managed",
+                provider: "anthropic",
+                provider_connection: "anthropic-personal",
+                model: "claude-sonnet-4-6",
+              },
+            },
+            activeProfile: "balanced",
+          },
+        },
+        null,
+        2,
+      ) + "\n",
+    );
+    process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;
+    const db = createProviderConnectionsDb();
+    mergeDefaultConfigAndSeedInferenceProfiles(db);
+    const raw = JSON.parse(readFileSync(CONFIG_PATH, "utf-8"));
+    expect(raw.llm.activeProfile).toBe("balanced");
+    expect(raw.llm.profiles.balanced.provider_connection).toBe(
+      "anthropic-personal",
+    );
+    expect(getConnection(db, "anthropic-managed")?.status).toBe("disabled");
+    expect(getConnection(db, "openai-managed")?.status).toBe("disabled");
+    expect(getConnection(db, "gemini-managed")?.status).toBe("disabled");
+  });
+  test("off-platform BYOK hatch still disables managed connections", () => {
+    const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
+    writeFileSync(
+      overlayPath,
+      JSON.stringify({ llm: { default: { provider: "anthropic" } } }, null, 2) +
+        "\n",
+    );
+    process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;
+    const db = createProviderConnectionsDb();
+    mergeDefaultConfigAndSeedInferenceProfiles(db);
+    expect(getConnection(db, "anthropic-managed")?.status).toBe("disabled");
+    expect(getConnection(db, "openai-managed")?.status).toBe("disabled");
+    expect(getConnection(db, "gemini-managed")?.status).toBe("disabled");
+  });
   test("non-hatch off-platform boot does NOT auto-disable freshly-materialized managed profiles", () => {
     // Existing installs that upgrade to a version where the managed
     // profile didn't previously exist (e.g. a new template added later)
@@ -1029,11 +1129,8 @@ describe("seedInferenceProfiles BYOK-mode managed profile labels", () => {
     const overlayPath = join(WORKSPACE_DIR, "hatch-overlay.json");
     writeFileSync(
       overlayPath,
-      JSON.stringify(
-        { llm: { default: { provider: "anthropic" } } },
-        null,
-        2,
-      ) + "\n",
+      JSON.stringify({ llm: { default: { provider: "anthropic" } } }, null, 2) +
+        "\n",
     );
     process.env.VELLUM_DEFAULT_WORKSPACE_CONFIG_PATH = overlayPath;

package/src/__tests__/context-token-estimator.test.ts CHANGED Viewed

@@ -219,36 +219,7 @@ describe("token estimator", () => {
     expect(largeFileTokens).toBe(smallFileTokens);
   });
-  // Non-Anthropic providers use base64 payload size for image estimation
-  test("scales image token estimate with base64 payload size (non-Anthropic)", () => {
-    const smallImageTokens = estimateContentBlockTokens(
-      {
-        type: "image",
-        source: {
-          type: "base64",
-          media_type: "image/png",
-          data: "a".repeat(64),
-        },
-      },
-      { providerName: "openai" },
-    );
-    const largeImageTokens = estimateContentBlockTokens(
-      {
-        type: "image",
-        source: {
-          type: "base64",
-          media_type: "image/png",
-          data: "a".repeat(60_000),
-        },
-      },
-      { providerName: "openai" },
-    );
-    expect(largeImageTokens).toBeGreaterThan(smallImageTokens);
-    expect(largeImageTokens - smallImageTokens).toBeGreaterThan(1000);
-  });
-  test("estimates Anthropic image tokens from dimensions, not base64 size", () => {
+  test("estimates image tokens from dimensions, not base64 size", () => {
     // Build a minimal valid PNG header encoding 1920x1080 dimensions.
     // PNG header: 8-byte signature + 4-byte IHDR length + 4-byte "IHDR" + 4-byte width + 4-byte height = 24 bytes minimum
     const pngHeader = Buffer.alloc(24);
@@ -278,55 +249,49 @@ describe("token estimator", () => {
     const fullPayload = Buffer.concat([pngHeader, padding]);
     const base64Data = fullPayload.toString("base64");
-    const anthropicTokens = estimateContentBlockTokens(
-      {
-        type: "image",
-        source: { type: "base64", media_type: "image/png", data: base64Data },
-      },
-      { providerName: "anthropic" },
-    );
     // 1920x1080 scaled to fit 1568px bounding box: dimScale = 1568/1920 = 0.8167
     // scaledWidth = round(1920 * 0.8167) = 1568, scaledHeight = round(1080 * 0.8167) = 882
     // pixels = 1568 * 882 = 1,382,976 > 1,200,000 → mpScale = sqrt(1200000/1382976) = 0.9315
     // scaledWidth = round(1568 * 0.9315) = 1461, scaledHeight = round(882 * 0.9315) = 822
     // tokens = ceil(1461 * 822 / 750) = ceil(1601.26) = ~1,602
-    // With IMAGE_BLOCK_OVERHEAD_TOKENS and media_type overhead, still well under 5000
-    expect(anthropicTokens).toBeLessThan(5_000);
-    // Verify it's NOT using base64 size (which would be ~50,000+ tokens)
-    const nonAnthropicTokens = estimateContentBlockTokens(
-      {
-        type: "image",
-        source: { type: "base64", media_type: "image/png", data: base64Data },
-      },
-      { providerName: "openai" },
-    );
-    expect(nonAnthropicTokens).toBeGreaterThan(50_000);
+    // With IMAGE_BLOCK_OVERHEAD_TOKENS and media_type overhead, still well under 5000.
+    // Same result for every provider — dimension-based estimate is universal.
+    for (const providerName of ["anthropic", "openai", "openrouter"]) {
+      const tokens = estimateContentBlockTokens(
+        {
+          type: "image",
+          source: { type: "base64", media_type: "image/png", data: base64Data },
+        },
+        { providerName },
+      );
+      expect(tokens).toBeLessThan(5_000);
+    }
   });
-  test("falls back to max tokens when Anthropic image dimensions can't be parsed", () => {
+  test("falls back to max tokens when image dimensions can't be parsed", () => {
     // Corrupted base64 that won't parse as a valid image header
     const corruptedData = Buffer.from(
       "not-a-valid-image-header-at-all",
     ).toString("base64");
-    const tokens = estimateContentBlockTokens(
-      {
-        type: "image",
-        source: {
-          type: "base64",
-          media_type: "image/png",
-          data: corruptedData,
+    for (const providerName of ["anthropic", "openai", "openrouter"]) {
+      const tokens = estimateContentBlockTokens(
+        {
+          type: "image",
+          source: {
+            type: "base64",
+            media_type: "image/png",
+            data: corruptedData,
+          },
         },
-      },
-      { providerName: "anthropic" },
-    );
+        { providerName },
+      );
-    // Should fall back to ANTHROPIC_IMAGE_MAX_TOKENS (1,600)
-    // Total = 16 (block overhead) + ceil(9/4) (media_type) + 1600 = 1619
-    expect(tokens).toBeGreaterThanOrEqual(1_600);
-    expect(tokens).toBeLessThan(2_000);
+      // Falls back to the per-image cap (1,600 tokens). Total = 16 (block
+      // overhead) + ceil(9/4) (media_type) + 1600 = 1619.
+      expect(tokens).toBeGreaterThanOrEqual(1_600);
+      expect(tokens).toBeLessThan(2_000);
+    }
   });
   test("Anthropic image tokens are the same for same-dimension images regardless of payload size", () => {

package/src/__tests__/conversation-agent-loop.test.ts CHANGED Viewed

@@ -386,6 +386,7 @@ mock.module("../daemon/history-repair.js", () => ({
 const recordUsageMock = mock(() => {});
 const recordRequestLogMock = mock(() => {});
+const backfillMessageIdOnLogsMock = mock(() => {});
 mock.module("../daemon/conversation-usage.js", () => ({
   recordUsage: recordUsageMock,
 }));
@@ -482,7 +483,7 @@ mock.module("../memory/archive-store.js", () => ({
 mock.module("../memory/llm-request-log-store.js", () => ({
   recordRequestLog: recordRequestLogMock,
-  backfillMessageIdOnLogs: () => {},
+  backfillMessageIdOnLogs: backfillMessageIdOnLogsMock,
 }));
 let mockHasProactiveArtifactCompleted = true;
@@ -658,6 +659,7 @@ beforeEach(() => {
   mockInjectionBlocks = {};
   recordUsageMock.mockClear();
   recordRequestLogMock.mockClear();
+  backfillMessageIdOnLogsMock.mockClear();
   syncMessageToDiskMock.mockClear();
   rebuildConversationDiskViewFromDbStateMock.mockClear();
   updateMessageMetadataMock.mockClear();
@@ -2855,6 +2857,60 @@ describe("session-agent-loop", () => {
       );
       expect(conversationErrors.length).toBeGreaterThanOrEqual(1);
     });
+    test("pipes synthetic assistant message id into provider-error log rows via backfill", async () => {
+      // Codex P1 regression test: the provider-failure turn must not leave
+      // its `llm_request_logs` row orphaned. Without the backfill call in
+      // the synthetic-message branch, a later turn's `handleMessageComplete`
+      // sweep would attach this row to the wrong assistant message.
+      const events: ServerMessage[] = [];
+      const agentLoopRun: AgentLoopRun = async (messages, onEvent) => {
+        // 1) handleProviderError -> writes an `llm_request_logs` row with
+        //    no messageId yet (the orphan we are trying to link).
+        onEvent({
+          type: "provider_error",
+          error: new Error("upstream 500"),
+          rawRequest: { model: "gpt-4.1", messages: [] },
+          actualProvider: "openai",
+        });
+        // 2) handleError -> sets `state.providerErrorUserMessage`, which
+        //    activates the synthetic-message branch below the loop.
+        onEvent({
+          type: "error",
+          error: new Error("upstream 500"),
+        });
+        // Provider returned no assistant content — same messages back.
+        return messages;
+      };
+      const ctx = makeCtx({ agentLoopRun });
+      await runAgentLoopImpl(ctx, "hello", "msg-1", (msg) => events.push(msg));
+      // The orphan was written with messageId=undefined.
+      expect(recordRequestLogMock).toHaveBeenCalledTimes(1);
+      const recordCall = recordRequestLogMock.mock.calls[0] as unknown as [
+        string,
+        string,
+        string,
+        string | undefined,
+        string | undefined,
+      ];
+      expect(recordCall[0]).toBe("test-conv");
+      expect(recordCall[3]).toBeUndefined();
+      // The synthetic-message branch then piped the assigned message id
+      // (from the mocked `addMessage` -> `{ id: "mock-msg-id" }`) into the
+      // backfill primitive, scoped to this conversation.
+      expect(backfillMessageIdOnLogsMock).toHaveBeenCalledTimes(1);
+      const backfillCall =
+        backfillMessageIdOnLogsMock.mock.calls[0] as unknown as [
+          string,
+          string,
+        ];
+      expect(backfillCall[0]).toBe("test-conv");
+      expect(backfillCall[1]).toBe("mock-msg-id");
+    });
   });
   describe("pkbSystemReminderBlock metadata persistence", () => {

package/src/__tests__/conversation-media-retry.test.ts CHANGED Viewed

@@ -23,7 +23,11 @@ function makeImageBlockWithSize(
 ): Extract<ContentBlock, { type: "image" }> {
   return {
     type: "image",
-    source: { type: "base64", media_type: "image/png", data: "A".repeat(dataLength) },
+    source: {
+      type: "base64",
+      media_type: "image/png",
+      data: "A".repeat(dataLength),
+    },
   };
 }
@@ -103,16 +107,19 @@ describe("stripMediaPayloadsForRetry", () => {
   // ---------------------------------------------------------------------------
   test("budget-aware: keeps images that fit within token budget", () => {
-    // Non-Anthropic estimation: estimateTextTokens(base64Data) + overhead (~19 tokens).
-    // Data length 4000 → 1000 data tokens + 19 overhead ≈ 1019 tokens/image.
-    // Budget of 3500 allows 3 images (3 * 1019 = 3057 <= 3500) but not 4.
-    const images = Array.from({ length: 5 }, () => makeImageBlockWithSize(4000));
+    // Dimension-based estimation: when the base64 data has no parseable image
+    // header, the estimate falls back to IMAGE_MAX_TOKENS (1600) + overhead
+    // (~19 tokens) ≈ 1619 tokens/image. Budget of 5000 allows 3 images
+    // (3 * 1619 = 4857 <= 5000) but not 4 (4 * 1619 = 6476 > 5000).
+    const images = Array.from({ length: 5 }, () =>
+      makeImageBlockWithSize(4000),
+    );
     const messages: Message[] = [
       makeUserMessage({ type: "text", text: "describe these" }, ...images),
     ];
     const result = stripMediaPayloadsForRetry(messages, {
-      mediaTokenBudget: 3500,
+      mediaTokenBudget: 5000,
       providerName: "mock",
     });
     expect(result.modified).toBe(true);
@@ -120,7 +127,9 @@ describe("stripMediaPayloadsForRetry", () => {
     const content = result.messages[0].content;
     const keptImages = content.filter((b) => b.type === "image");
     const stubs = content.filter(
-      (b) => b.type === "text" && (b as { text: string }).text.includes("Image omitted"),
+      (b) =>
+        b.type === "text" &&
+        (b as { text: string }).text.includes("Image omitted"),
     );
     expect(keptImages.length).toBe(3);
     expect(stubs.length).toBe(2);
@@ -174,7 +183,9 @@ describe("stripMediaPayloadsForRetry", () => {
     const content = result.messages[0].content;
     const keptImages = content.filter((b) => b.type === "image");
     const stubs = content.filter(
-      (b) => b.type === "text" && (b as { text: string }).text.includes("Image omitted"),
+      (b) =>
+        b.type === "text" &&
+        (b as { text: string }).text.includes("Image omitted"),
     );
     expect(keptImages.length).toBe(3);
     expect(stubs.length).toBe(2);

package/src/__tests__/conversation-runtime-assembly.test.ts CHANGED Viewed

@@ -930,6 +930,28 @@ describe("stripInjectionsForCompaction with NOW.md", () => {
       "Hello",
     );
   });
+  test("strips <background_turn> blocks", () => {
+    const messages: Message[] = [
+      {
+        role: "user",
+        content: [
+          {
+            type: "text",
+            text: "<background_turn>\nGuardian isn't watching — notify on anything noteworthy.\n</background_turn>",
+          },
+          { type: "text", text: "Hello" },
+        ],
+      },
+    ];
+    const result = stripInjectionsForCompaction(messages);
+    expect(result.length).toBe(1);
+    expect(result[0].content.length).toBe(1);
+    expect((result[0].content[0] as { type: "text"; text: string }).text).toBe(
+      "Hello",
+    );
+  });
 });
 // ---------------------------------------------------------------------------
@@ -1880,7 +1902,7 @@ describe("applyRuntimeInjections — PKB relevance hints", () => {
     },
   ];
-  const FLAT_REMINDER = buildPkbReminder([], false);
+  const FLAT_REMINDER = buildPkbReminder([]);
   // Use a platform-agnostic absolute workspace root so the tests work on
   // macOS and Linux runners alike. `pkbRoot` sits under `pkbWorkingDir` to
@@ -2136,7 +2158,7 @@ describe("applyRuntimeInjections — PKB relevance hints", () => {
       role: "user",
       content: [
         { type: "text", text: "hello" },
-        { type: "text", text: buildPkbReminder([], false) },
+        { type: "text", text: buildPkbReminder([]) },
       ],
     };
     const hintedMessage: Message = {
@@ -2145,7 +2167,7 @@ describe("applyRuntimeInjections — PKB relevance hints", () => {
         { type: "text", text: "hello" },
         {
           type: "text",
-          text: buildPkbReminder(["topics/alpha.md", "topics/beta.md"], false),
+          text: buildPkbReminder(["topics/alpha.md", "topics/beta.md"]),
         },
       ],
     };
@@ -4827,7 +4849,7 @@ describe("applyRuntimeInjections blocks.pkbSystemReminder", () => {
       mode: "full",
     });
-    const expected = buildPkbReminder([], false);
+    const expected = buildPkbReminder([]);
     expect(blocks.pkbSystemReminder).toBe(expected);
   });