npm - @vellumai/assistant - Versions diffs - 0.8.2 → 0.8.3 - Mend

@vellumai/assistant 0.8.2 → 0.8.3

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.

Files changed (231)

package/ARCHITECTURE.md +11 -12
package/docker-entrypoint.sh +13 -1
package/docker-init-apt-root.sh +79 -6
package/openapi.yaml +336 -21
package/package.json +1 -1
package/src/__tests__/agent-loop-exit-reason.test.ts +272 -0
package/src/__tests__/agent-loop-provider-error-recording.test.ts +195 -0
package/src/__tests__/compactor-tail-resolution.test.ts +107 -1
package/src/__tests__/config-get-vision-flag.test.ts +136 -0
package/src/__tests__/config-loader-backfill.test.ts +115 -18
package/src/__tests__/context-token-estimator.test.ts +30 -65
package/src/__tests__/conversation-agent-loop.test.ts +57 -1
package/src/__tests__/conversation-media-retry.test.ts +19 -8
package/src/__tests__/conversation-runtime-assembly.test.ts +26 -4
package/src/__tests__/date-context.test.ts +45 -0
package/src/__tests__/external-plugin-loader.test.ts +91 -19
package/src/__tests__/guardian-action-no-hardcoded-copy.test.ts +0 -1
package/src/__tests__/guardian-dispatch.test.ts +1 -0
package/src/__tests__/heartbeat-service.test.ts +24 -164
package/src/__tests__/helpers/channel-test-adapter.ts +0 -2
package/src/__tests__/host-app-control-proxy.test.ts +241 -0
package/src/__tests__/host-proxy-preactivation.test.ts +200 -13
package/src/__tests__/injector-background-turn.test.ts +153 -0
package/src/__tests__/injector-chain.test.ts +5 -0
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +9 -2
package/src/__tests__/llm-callsite-catalog.test.ts +25 -0
package/src/__tests__/llm-catalog-parity.test.ts +3 -0
package/src/__tests__/llm-request-log-agent-loop-exit-reason.test.ts +116 -0
package/src/__tests__/llm-request-log-error-payload.test.ts +138 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +2 -0
package/src/__tests__/llm-resolver.test.ts +255 -2
package/src/__tests__/managed-profile-guard.test.ts +10 -0
package/src/__tests__/notification-decision-fallback.test.ts +0 -91
package/src/__tests__/notification-decision-strategy.test.ts +14 -31
package/src/__tests__/notification-deep-link.test.ts +15 -0
package/src/__tests__/notification-guardian-path.test.ts +1 -2
package/src/__tests__/notification-platform-adapter.test.ts +5 -4
package/src/__tests__/notification-telegram-adapter.test.ts +1 -0
package/src/__tests__/notification-vellum-adapter.test.ts +113 -0
package/src/__tests__/openai-provider.test.ts +218 -3
package/src/__tests__/openai-responses-cutover-guard.test.ts +3 -3
package/src/__tests__/openrouter-provider-only.test.ts +51 -3
package/src/__tests__/openrouter-token-estimation.test.ts +34 -25
package/src/__tests__/platform-proxy-context.test.ts +6 -1
package/src/__tests__/plugin-tool-contribution.test.ts +3 -3
package/src/__tests__/plugin-types.test.ts +2 -2
package/src/__tests__/provider-catalog-visibility.test.ts +16 -0
package/src/__tests__/provider-platform-proxy-integration.test.ts +27 -25
package/src/__tests__/secret-routes-platform-proxy.test.ts +1 -1
package/src/__tests__/system-prompt.test.ts +6 -73
package/src/__tests__/workspace-migration-087-memory-router-balanced-profile.test.ts +228 -0
package/src/a2a/__tests__/agent-card.test.ts +98 -0
package/src/a2a/__tests__/e2e-a2a-channel.test.ts +597 -0
package/src/a2a/__tests__/protocol-helpers.test.ts +113 -0
package/src/a2a/__tests__/task-store.test.ts +246 -0
package/src/a2a/agent-card.ts +58 -0
package/src/a2a/feature-gate.ts +8 -0
package/src/a2a/protocol-constants.ts +21 -0
package/src/a2a/protocol-errors.ts +50 -0
package/src/a2a/protocol-types.ts +162 -0
package/src/a2a/task-store.ts +168 -0
package/src/agent/loop.ts +167 -18
package/src/channels/config.ts +9 -0
package/src/channels/types.ts +14 -0
package/src/cli/{__tests__ → commands/__tests__}/notifications.test.ts +201 -28
package/src/cli/commands/__tests__/schedules.test.ts +469 -0
package/src/cli/commands/notifications.ts +65 -35
package/src/cli/commands/plugins.ts +67 -0
package/src/cli/commands/schedules.ts +297 -5
package/src/cli/lib/__tests__/search-plugins.test.ts +261 -0
package/src/cli/lib/install-from-github.ts +8 -9
package/src/cli/lib/search-plugins.ts +163 -0
package/src/cli/program.ts +14 -0
package/src/config/assistant-feature-flags.ts +24 -54
package/src/config/bundled-skills/app-builder/SKILL.md +117 -1
package/src/config/bundled-skills/phone-calls/SKILL.md +1 -1
package/src/config/call-site-defaults.ts +105 -0
package/src/config/feature-flag-registry.json +21 -29
package/src/config/llm-resolver.ts +52 -1
package/src/config/schema.ts +2 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +3 -3
package/src/config/schemas/channels.ts +9 -0
package/src/config/schemas/conversations.ts +10 -0
package/src/config/schemas/heartbeat.ts +14 -0
package/src/config/schemas/llm.ts +1 -3
package/src/config/schemas/memory-retrospective.ts +1 -1
package/src/config/schemas/memory-v2.ts +4 -4
package/src/config/schemas/memory.ts +3 -1
package/src/config/seed-inference-profiles.ts +99 -29
package/src/context/compactor.ts +72 -12
package/src/context/token-estimator.ts +32 -34
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -22
package/src/daemon/conversation-agent-loop-handlers.ts +78 -0
package/src/daemon/conversation-agent-loop.ts +29 -2
package/src/daemon/conversation-runtime-assembly.ts +9 -0
package/src/daemon/conversation.ts +0 -7
package/src/daemon/date-context.ts +40 -0
package/src/daemon/guardian-action-generators.ts +1 -125
package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +248 -0
package/src/daemon/handlers/__tests__/config-a2a-invite.test.ts +154 -0
package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +133 -0
package/src/daemon/handlers/__tests__/config-a2a.test.ts +95 -0
package/src/daemon/handlers/config-a2a.ts +289 -0
package/src/daemon/handlers/conversations.ts +1 -0
package/src/daemon/host-app-control-proxy.ts +69 -18
package/src/daemon/host-proxy-preactivation.ts +85 -18
package/src/daemon/lifecycle.ts +49 -61
package/src/daemon/memory-v2-startup.ts +49 -13
package/src/daemon/message-types/notifications.ts +21 -0
package/src/daemon/pkb-reminder-builder.test.ts +10 -53
package/src/daemon/pkb-reminder-builder.ts +4 -19
package/src/daemon/process-message.ts +3 -0
package/src/daemon/skill-memory-refresh.ts +5 -1
package/src/daemon/wake-target-adapter.ts +2 -0
package/src/export/__tests__/transcript-formatter.test.ts +121 -0
package/src/export/transcript-formatter.ts +54 -20
package/src/heartbeat/__tests__/heartbeat-service.test.ts +44 -0
package/src/heartbeat/heartbeat-service.ts +34 -191
package/src/home/__tests__/feed-types.test.ts +40 -0
package/src/home/feed-types.ts +14 -2
package/src/ipc/cli-client.ts +147 -45
package/src/memory/__tests__/conversation-queries.test.ts +220 -0
package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +2 -50
package/src/memory/__tests__/memory-retrospective-job.test.ts +87 -4
package/src/memory/conversation-queries.ts +87 -1
package/src/memory/conversation-title-service.ts +26 -4
package/src/memory/db-init.ts +6 -0
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +84 -3
package/src/memory/graph/conversation-graph-memory.ts +18 -6
package/src/memory/graph/tools.ts +6 -37
package/src/memory/invite-store.ts +53 -0
package/src/memory/llm-request-log-source-clickhouse.ts +7 -2
package/src/memory/llm-request-log-store.ts +92 -1
package/src/memory/memory-retrospective-enqueue.ts +1 -20
package/src/memory/memory-retrospective-job.ts +33 -6
package/src/memory/migrations/250-provider-connection-base-url-and-models.ts +28 -0
package/src/memory/migrations/251-a2a-tasks.ts +49 -0
package/src/memory/migrations/252-llm-request-log-agent-loop-exit-reason.ts +32 -0
package/src/memory/migrations/index.ts +3 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/a2a.ts +15 -0
package/src/memory/schema/index.ts +1 -0
package/src/memory/schema/inference.ts +2 -0
package/src/memory/schema/infrastructure.ts +1 -0
package/src/memory/v2/__tests__/activation-store.test.ts +25 -23
package/src/memory/v2/__tests__/cli-command-store.test.ts +404 -0
package/src/memory/v2/__tests__/frontmatter-sweep.test.ts +25 -4
package/src/memory/v2/__tests__/injection.test.ts +190 -3
package/src/memory/v2/__tests__/static-context.test.ts +12 -1
package/src/memory/v2/activation-store.ts +14 -16
package/src/memory/v2/cli-command-content.ts +19 -0
package/src/memory/v2/cli-command-store.ts +304 -0
package/src/memory/v2/frontmatter-sweep.ts +7 -1
package/src/memory/v2/injection.ts +49 -20
package/src/memory/v2/page-index.ts +38 -13
package/src/memory/v2/static-context.ts +4 -4
package/src/memory/v2/types.ts +23 -0
package/src/messaging/providers/a2a/__tests__/deliver.test.ts +274 -0
package/src/messaging/providers/a2a/deliver.ts +156 -0
package/src/messaging/providers/gmail/client.ts +9 -2
package/src/messaging/providers/index.ts +11 -2
package/src/notifications/__tests__/broadcaster.test.ts +203 -0
package/src/notifications/__tests__/decision-engine.test.ts +283 -0
package/src/notifications/__tests__/deterministic-checks.test.ts +286 -0
package/src/notifications/__tests__/emit-signal-home-feed.test.ts +1 -0
package/src/notifications/__tests__/home-feed-side-effect.test.ts +430 -7
package/src/notifications/adapters/macos.ts +12 -2
package/src/notifications/broadcaster.ts +29 -4
package/src/notifications/copy-composer.ts +17 -64
package/src/notifications/decision-engine.ts +111 -44
package/src/notifications/deterministic-checks.ts +96 -0
package/src/notifications/emit-signal.ts +1 -0
package/src/notifications/home-feed-side-effect.ts +85 -6
package/src/notifications/signal.ts +0 -4
package/src/notifications/types.ts +8 -0
package/src/oauth/platform-connection.test.ts +43 -3
package/src/oauth/platform-connection.ts +13 -4
package/src/plugins/defaults/injectors.ts +38 -19
package/src/plugins/external-plugin-loader.ts +82 -10
package/src/plugins/types.ts +16 -7
package/src/prompts/__tests__/system-prompt.test.ts +6 -51
package/src/prompts/__tests__/task-progress-hint-section.test.ts +4 -8
package/src/prompts/system-prompt.ts +0 -8
package/src/prompts/templates/BOOTSTRAP.md +5 -5
package/src/prompts/templates/system-sections.ts +0 -9
package/src/providers/__tests__/inference.test.ts +2 -0
package/src/providers/call-site-routing.ts +24 -6
package/src/providers/connection-resolution.ts +63 -13
package/src/providers/inference/__tests__/adapter-factory-openai-compatible.test.ts +74 -0
package/src/providers/inference/__tests__/connections-openai-compatible.test.ts +175 -0
package/src/providers/inference/__tests__/connections-status-label.test.ts +15 -0
package/src/providers/inference/adapter-factory.ts +9 -20
package/src/providers/inference/auth.ts +12 -0
package/src/providers/inference/backfill.ts +14 -1
package/src/providers/inference/connections.ts +85 -5
package/src/providers/inference/resolve-auth.ts +2 -0
package/src/providers/model-catalog.ts +199 -244
package/src/providers/model-intents.ts +3 -3
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +235 -0
package/src/providers/openai/chat-completions-provider.ts +159 -6
package/src/providers/openrouter/client.ts +42 -4
package/src/providers/platform-proxy/constants.ts +3 -4
package/src/providers/provider-catalog-visibility.ts +3 -1
package/src/providers/provider-send-message.ts +27 -12
package/src/providers/registry.ts +30 -1
package/src/runtime/agent-wake.ts +61 -1
package/src/runtime/auth/route-policy.ts +13 -0
package/src/runtime/http-server.ts +7 -16
package/src/runtime/http-types.ts +0 -47
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +258 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +66 -4
package/src/runtime/routes/__tests__/inference-provider-connection-routes.test.ts +275 -44
package/src/runtime/routes/__tests__/llm-call-sites-routes.test.ts +12 -0
package/src/runtime/routes/channel-availability-routes.ts +5 -0
package/src/runtime/routes/consolidation-routes.ts +100 -0
package/src/runtime/routes/conversation-query-routes.ts +70 -11
package/src/runtime/routes/conversation-routes.ts +7 -0
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/inference-provider-connection-routes.ts +134 -1
package/src/runtime/routes/integrations/a2a.ts +235 -0
package/src/runtime/routes/llm-call-sites-routes.ts +11 -1
package/src/runtime/routes/subagents-routes.ts +41 -0
package/src/subagent/manager.ts +2 -0
package/src/tools/memory/register.ts +1 -9
package/src/tools/registry.ts +2 -2
package/src/tools/types.ts +37 -2
package/src/workspace/migrations/087-memory-router-balanced-profile.ts +91 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/guardian-action-conversation-turn.test.ts +0 -441
package/src/memory/graph/__tests__/remember-description.test.ts +0 -55
package/src/runtime/guardian-action-conversation-turn.ts +0 -99

package/src/context/compactor.ts CHANGED Viewed

@@ -439,6 +439,44 @@ function resolveTailStartIndex(
   return null;
 }
+/**
+ * Walk a model-chosen tail index backward until it lands on a user message
+ * that does not contain client-side `tool_result` blocks. Prevents the
+ * orphan-`tool_result` failure where the matching assistant `tool_use` sits
+ * in the discarded prefix and Anthropic rejects the next call with
+ * `unexpected tool_use_id found in tool_result blocks`.
+ *
+ * Walking back (rather than forward) preserves the recent context the model
+ * deliberately chose to keep; the tail just expands by the few messages
+ * needed to re-anchor the orphaned `tool_result` against its `tool_use`.
+ *
+ * Returns 0 when the walk falls off the front — the caller treats this as
+ * "nothing to compact" via the existing `tailIndex === 0` branch.
+ *
+ * Only `type === "tool_result"` blocks count. Server-side tools
+ * (`server_tool_use` / `web_search_tool_result`) are self-paired inside an
+ * assistant message and never trigger an adjustment.
+ */
+export function adjustTailIndexForToolPairing(
+  messages: Message[],
+  tailIndex: number,
+): number {
+  let k = tailIndex;
+  while (k > 0) {
+    const m = messages[k];
+    if (
+      m.role === "user" &&
+      // guard:allow-tool-result-only — server-side web_search_tool_result is
+      // self-paired inside its assistant message and never spans user turns.
+      !m.content.some((block) => block.type === "tool_result")
+    ) {
+      return k;
+    }
+    k--;
+  }
+  return 0;
+}
 // ---------------------------------------------------------------------------
 // Retained-image hydration
 // ---------------------------------------------------------------------------
@@ -655,8 +693,12 @@ export async function runAssistantDrivenCompaction(
   }
   const timestamps = buildTimestampIndex(args.messages);
-  const tailIndex = resolveTailStartIndex(args.messages, timestamps, parsed);
-  if (tailIndex == null) {
+  const resolvedTailIndex = resolveTailStartIndex(
+    args.messages,
+    timestamps,
+    parsed,
+  );
+  if (resolvedTailIndex == null) {
     log.warn(
       {
         timestamp: parsed.tailStartTimestamp,
@@ -680,6 +722,22 @@ export async function runAssistantDrivenCompaction(
     };
   }
+  const tailIndex = adjustTailIndexForToolPairing(
+    args.messages,
+    resolvedTailIndex,
+  );
+  if (tailIndex !== resolvedTailIndex) {
+    log.info(
+      {
+        conversationId: args.conversationId,
+        originalTailIndex: resolvedTailIndex,
+        tailIndex,
+        walkedBy: resolvedTailIndex - tailIndex,
+      },
+      "Adjusted compaction tail backward to preserve tool_use/tool_result pairing",
+    );
+  }
   if (tailIndex === 0) {
     return {
       ...emptyResult(
@@ -762,6 +820,9 @@ export async function runAssistantDrivenCompaction(
       compactedMessages: compactableMessages.length,
       compactedPersistedMessages,
       tailIndex,
+      ...(tailIndex !== resolvedTailIndex
+        ? { originalTailIndex: resolvedTailIndex }
+        : {}),
       retainedImages: resolved.length,
       summaryChars: summaryText.length,
     },
@@ -885,10 +946,12 @@ export async function runEmergencyCompaction(
   const splitIndex = findLastToolPairStart(args.messages);
   if (splitIndex == null || splitIndex === 0) {
-    log.info(
-      "Emergency compaction: no tool pair found — falling through",
+    log.info("Emergency compaction: no tool pair found — falling through");
+    return emptyResult(
+      args,
+      thresholdTokens,
+      "no tool pair for emergency split",
     );
-    return emptyResult(args, thresholdTokens, "no tool pair for emergency split");
   }
   const keptTail = stripInjectionsForCompaction(
@@ -904,8 +967,7 @@ export async function runEmergencyCompaction(
   const prefixBudget = args.maxInputTokens - instructionBudget - outputBudget;
   let prefixEstimate = estimatePromptTokens(prefix, args.systemPrompt, {
-    providerName:
-      args.provider.tokenEstimationProvider ?? args.provider.name,
+    providerName: args.provider.tokenEstimationProvider ?? args.provider.name,
   });
   if (prefixEstimate > prefixBudget && prefix.length > 1) {
@@ -920,10 +982,7 @@ export async function runEmergencyCompaction(
     // Drop messages from the front until we fit. Keep at least the first
     // message (may be an existing summary) and try to preserve recent context.
     let dropCount = 0;
-    while (
-      prefixEstimate > prefixBudget &&
-      dropCount < prefix.length - 1
-    ) {
+    while (prefixEstimate > prefixBudget && dropCount < prefix.length - 1) {
       dropCount++;
       const truncated = prefix.slice(dropCount);
       prefixEstimate = estimatePromptTokens(truncated, args.systemPrompt, {
@@ -1015,7 +1074,8 @@ export async function runEmergencyCompaction(
       compactedMessages: compactedCount,
       keptTailMessages: keptTail.length,
       summaryChars: summaryText.length,
-      prefixTruncated: prefix[0]?.content?.[0]?.type === "text" &&
+      prefixTruncated:
+        prefix[0]?.content?.[0]?.type === "text" &&
         (prefix[0].content[0] as { text: string }).text.includes("truncated"),
     },
     "Applied emergency mid-turn compaction",

package/src/context/token-estimator.ts CHANGED Viewed

@@ -33,18 +33,24 @@ const OTHER_BLOCK_TOKENS = 16;
 const SYSTEM_PROMPT_OVERHEAD_TOKENS = 8;
 const GEMINI_INLINE_FILE_MIME_TYPES = new Set(["application/pdf"]);
-// Anthropic scales images to fit within 1568x1568 maintaining aspect ratio,
-// then charges ~(width * height) / 750 tokens.
-const ANTHROPIC_IMAGE_MAX_DIMENSION = 1568;
-// Anthropic caps images at ~1.2 megapixels in addition to the 1568px dimension limit.
-// Images exceeding this are further scaled down. The docs state images above ~1,600 tokens
-// are resized. 1,200,000 / 750 = 1,600 tokens, matching the documented threshold.
-// Reference table (max sizes that won't be resized):
+// Dimension-based image token estimate, used as a universal default for every
+// provider. The formula and constants below come from Anthropic's published
+// vision spec — scale to a 1568x1568 bounding box, then charge
+// ~(width * height) / 750 tokens, with a ~1.2-megapixel cap that lands at
+// ~1,600 tokens per image. Reference table (max sizes that won't be resized):
 //   1:1 → 1092x1092 (~1,590 tokens)   1:2 → 784x1568 (~1,639 tokens)
 // See: https://platform.claude.com/docs/en/build-with-claude/vision#evaluate-image-size
-const ANTHROPIC_IMAGE_MAX_PIXELS = 1_200_000;
-const ANTHROPIC_IMAGE_TOKENS_PER_PIXEL = 1 / 750;
-const ANTHROPIC_IMAGE_MAX_TOKENS = 1_600;
+//
+// Other multimodal providers (OpenAI/GPT-4V tile pricing, Moonshot/Kimi,
+// Gemini fixed-cost, OpenRouter pass-through) price differently in detail,
+// but every published rate lands in the same hundreds-to-low-thousands range
+// per image. Using this formula as the default gets compaction within ~2-3x
+// of reality instead of the ~30-100x over-counting produced by treating the
+// raw base64 payload as if it were text.
+const IMAGE_MAX_DIMENSION = 1568;
+const IMAGE_MAX_PIXELS = 1_200_000;
+const IMAGE_TOKENS_PER_PIXEL = 1 / 750;
+const IMAGE_MAX_TOKENS = 1_600;
 // Anthropic renders each PDF page as an image (~1,568 tokens at standard
 // resolution) plus any extracted text. Typical PDF pages are 50-150 KB.
@@ -103,45 +109,37 @@ function estimateFileDataTokens(
   return 0;
 }
-function estimateAnthropicImageTokens(width: number, height: number): number {
+function estimateImageTokensByDimensions(
+  width: number,
+  height: number,
+): number {
   // Step 1: Scale to fit within 1568px bounding box
-  const dimScale = Math.min(
-    1,
-    ANTHROPIC_IMAGE_MAX_DIMENSION / Math.max(width, height),
-  );
+  const dimScale = Math.min(1, IMAGE_MAX_DIMENSION / Math.max(width, height));
   let scaledWidth = Math.round(width * dimScale);
   let scaledHeight = Math.round(height * dimScale);
   // Step 2: Scale further if exceeds megapixel budget
   const pixels = scaledWidth * scaledHeight;
-  if (pixels > ANTHROPIC_IMAGE_MAX_PIXELS) {
-    const mpScale = Math.sqrt(ANTHROPIC_IMAGE_MAX_PIXELS / pixels);
+  if (pixels > IMAGE_MAX_PIXELS) {
+    const mpScale = Math.sqrt(IMAGE_MAX_PIXELS / pixels);
     scaledWidth = Math.round(scaledWidth * mpScale);
     scaledHeight = Math.round(scaledHeight * mpScale);
   }
-  return Math.ceil(
-    scaledWidth * scaledHeight * ANTHROPIC_IMAGE_TOKENS_PER_PIXEL,
-  );
+  return Math.ceil(scaledWidth * scaledHeight * IMAGE_TOKENS_PER_PIXEL);
 }
 function estimateImageTokens(
   block: Extract<ContentBlock, { type: "image" }>,
-  options?: TokenEstimatorOptions,
 ): number {
-  if (options?.providerName === "anthropic") {
-    const dims = parseImageDimensions(
-      block.source.data,
-      block.source.media_type,
-    );
-    if (dims) {
-      return estimateAnthropicImageTokens(dims.width, dims.height);
-    }
-    // Fallback: if dimensions can't be parsed, use Anthropic's max
-    return ANTHROPIC_IMAGE_MAX_TOKENS;
+  const dims = parseImageDimensions(block.source.data, block.source.media_type);
+  if (dims) {
+    return estimateImageTokensByDimensions(dims.width, dims.height);
   }
-  // Non-Anthropic: keep existing base64-size heuristic
-  return estimateTextTokens(block.source.data);
+  // Dimensions unparseable (corrupt header, exotic format): use the per-image
+  // cap rather than the raw base64 length, which over-counts by 30-100x for
+  // non-Anthropic providers and trips spurious compaction.
+  return IMAGE_MAX_TOKENS;
 }
 export function estimateContentBlockTokens(
@@ -188,7 +186,7 @@ export function estimateContentBlockTokens(
       return (
         IMAGE_BLOCK_OVERHEAD_TOKENS +
         estimateTextTokens(block.source.media_type) +
-        estimateImageTokens(block, options)
+        estimateImageTokens(block)
       );
     case "file":
       return (

package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts CHANGED Viewed

@@ -97,7 +97,6 @@ mock.module("../../memory/auto-analysis-enqueue.js", () => ({
   },
 }));
-let memoryRetroEnabled = false;
 const memoryRetroCalls: Array<{
   conversationId: string;
   trigger: string;
@@ -108,7 +107,6 @@ mock.module("../../memory/memory-retrospective-enqueue.js", () => ({
     conversationId: string;
     trigger: string;
   }) => {
-    if (!memoryRetroEnabled) return;
     memoryRetroCalls.push(args);
   },
   // Also export sibling functions other modules import from this file, so
@@ -205,7 +203,6 @@ describe("disposeConversation — auto-analysis enqueue", () => {
     autoAnalyzeCalls.length = 0;
     memoryRetroCalls.length = 0;
     autoAnalyzeEnabled = true;
-    memoryRetroEnabled = false;
     autoAnalysisConversations.clear();
     v2Enabled = false;
   });
@@ -390,13 +387,11 @@ describe("disposeConversation — memory-retrospective lifecycle safety net", ()
     autoAnalyzeCalls.length = 0;
     memoryRetroCalls.length = 0;
     autoAnalyzeEnabled = false;
-    memoryRetroEnabled = false;
     autoAnalysisConversations.clear();
     v2Enabled = false;
   });
-  test("guardian conversation + flag on — enqueues memory-retrospective with trigger 'lifecycle'", () => {
-    memoryRetroEnabled = true;
+  test("guardian conversation — enqueues memory-retrospective with trigger 'lifecycle'", () => {
     const ctx = makeDisposeContext({
       conversationId: "conv-retro",
       trustClass: "guardian",
@@ -411,20 +406,7 @@ describe("disposeConversation — memory-retrospective lifecycle safety net", ()
     });
   });
-  test("flag off — no memory-retrospective enqueue", () => {
-    memoryRetroEnabled = false;
-    const ctx = makeDisposeContext({
-      conversationId: "conv-retro-off",
-      trustClass: "guardian",
-    });
-    disposeConversation(ctx);
-    expect(memoryRetroCalls).toHaveLength(0);
-  });
-  test("untrusted actor — no memory-retrospective enqueue even when flag is on", () => {
-    memoryRetroEnabled = true;
+  test("untrusted actor — no memory-retrospective enqueue", () => {
     const ctx = makeDisposeContext({
       conversationId: "conv-retro-untrusted",
       trustClass: "unknown",
@@ -443,8 +425,7 @@ describe("disposeConversation — memory-retrospective lifecycle safety net", ()
   // outside the `!isAutoAnalysis` guard, so it fired even for auto-analysis
   // conversations. Mirrors the indexer-time gate in `indexer.ts` and
   // matches the existing graph_extract recursion-guard semantics.
-  test("auto-analysis conversation — does NOT enqueue memory-retrospective even with flag on", () => {
-    memoryRetroEnabled = true;
+  test("auto-analysis conversation — does NOT enqueue memory-retrospective", () => {
     autoAnalysisConversations.add("conv-auto-retro");
     const ctx = makeDisposeContext({
       conversationId: "conv-auto-retro",

package/src/daemon/conversation-agent-loop-handlers.ts CHANGED Viewed

@@ -23,7 +23,9 @@ import {
 } from "../memory/conversation-crud.js";
 import {
   backfillMessageIdOnLogs,
+  buildProviderErrorResponsePayload,
   recordRequestLog,
+  setAgentLoopExitReasonOnLatestLog,
 } from "../memory/llm-request-log-store.js";
 import { backfillMemoryRecallLogMessageId } from "../memory/memory-recall-log-store.js";
 import { backfillMemoryV2ActivationMessageId } from "../memory/memory-v2-activation-log-store.js";
@@ -1166,6 +1168,52 @@ function handleUsage(
   state.llmCallStartedEmitted = false;
 }
+/**
+ * Persist a provider-rejected LLM call as an `llm_request_logs` row.
+ *
+ * Mirrors `handleUsage`'s recording side-effect for the failure path: the
+ * loop only reaches the success branch (and emits `usage`) when the
+ * provider returns a response, so without this handler a rejected call
+ * leaves nothing in the inspector — only a pino line saying "The AI
+ * provider rejected the request." The row's `messageId` is left null
+ * here and linked via one of two backfill paths, depending on how the
+ * turn unwinds:
+ *
+ *   - Multi-call turn where a later call also produces a real assistant
+ *     response: `handleMessageComplete` -> `backfillMessageIdOnLogs`
+ *     sweeps this row with the rest, same as a successful-call row.
+ *   - Pure provider-failure turn (no real assistant response): the
+ *     synthetic error-message branch in `conversation-agent-loop.ts`
+ *     persists a stand-in assistant message and calls
+ *     `backfillMessageIdOnLogs` itself, since `message_complete` is
+ *     never emitted on that path. Closing the orphan window inside the
+ *     same synchronous turn prevents a later turn's sweep from wrong-
+ *     attaching this row to an unrelated assistant message.
+ *
+ * Failures inside the recording itself are logged and swallowed — this
+ * mirrors `handleUsage`'s non-fatal stance so a DB hiccup never escalates
+ * a provider rejection into a dispatcher-level throw.
+ */
+function handleProviderError(
+  deps: EventHandlerDeps,
+  event: Extract<AgentEvent, { type: "provider_error" }>,
+): void {
+  try {
+    recordRequestLog(
+      deps.ctx.conversationId,
+      JSON.stringify(event.rawRequest),
+      JSON.stringify(buildProviderErrorResponsePayload(event.error)),
+      undefined,
+      event.actualProvider,
+    );
+  } catch (err) {
+    deps.rlog.warn(
+      { err },
+      "Failed to persist provider-error LLM request log (non-fatal)",
+    );
+  }
+}
 // ── Dispatcher ───────────────────────────────────────────────────────
 /** Routes an AgentEvent to the appropriate handler. */
@@ -1254,12 +1302,42 @@ export async function dispatchAgentEvent(
       case "error":
         handleError(state, deps, event);
         break;
+      case "provider_error":
+        handleProviderError(deps, event);
+        break;
       case "message_complete":
         await handleMessageComplete(state, deps, event);
         break;
       case "usage":
         handleUsage(state, deps, event);
         break;
+      case "agent_loop_exit":
+        // Stamp the exit reason onto the most-recent llm_request_logs
+        // row for this conversation. The final `usage` event of the run
+        // lands its row immediately before this event arrives (in the
+        // normal-dispatch path; the wake path handles ordering
+        // explicitly via `pendingExitReason`).
+        //
+        // Wrapped in try/catch so a DB hiccup here can't tear down the
+        // surrounding dispatch — the outer try/catch already swallows
+        // errors, but logging here gives the diagnosis hook a clear
+        // attribution to the exit handler specifically.
+        try {
+          setAgentLoopExitReasonOnLatestLog(
+            deps.ctx.conversationId,
+            event.reason,
+          );
+        } catch (err) {
+          log.warn(
+            {
+              err,
+              conversationId: deps.ctx.conversationId,
+              reason: event.reason,
+            },
+            "Failed to persist agent_loop_exit_reason (non-fatal)",
+          );
+        }
+        break;
     }
   } catch (err) {
     log.error(

package/src/daemon/conversation-agent-loop.ts CHANGED Viewed

@@ -71,7 +71,9 @@ import {
   isReplaceableTitle,
   queueRegenerateConversationTitle,
 } from "../memory/conversation-title-service.js";
+import { isBackgroundConversationType } from "../memory/conversation-types.js";
 import type { ConversationGraphMemory } from "../memory/graph/conversation-graph-memory.js";
+import { backfillMessageIdOnLogs } from "../memory/llm-request-log-store.js";
 import { recordMemoryRecallLog } from "../memory/memory-recall-log-store.js";
 import { enqueueMemoryRetrospectiveOnCompaction } from "../memory/memory-retrospective-enqueue.js";
 import { PKB_WORKSPACE_SCOPE } from "../memory/pkb/types.js";
@@ -109,6 +111,7 @@ import type {
   MemoryResult,
   OverflowReduceArgs,
   OverflowReduceResult,
+  PersistAddResult,
   PersistArgs,
   PersistResult,
   TurnContext as PluginTurnContext,
@@ -1616,6 +1619,9 @@ export async function runAgentLoopImpl(
       transportHints: ctx.transportHints ?? null,
       slackRuntimeContextNotice: ctx.slackRuntimeContextNotice ?? null,
       isNonInteractive: !isInteractiveResolved,
+      isBackgroundConversation: isBackgroundConversationType(
+        turnStartConversation?.conversationType,
+      ),
       subagentStatusBlock,
       slackChronologicalMessages,
       slackActiveThreadFocusBlock,
@@ -2942,7 +2948,7 @@ export async function runAgentLoopImpl(
       const errorAssistantMessage = createAssistantMessage(
         state.providerErrorUserMessage,
       );
-      await runPipeline<PersistArgs, PersistResult>(
+      const errorPersistResult = (await runPipeline<PersistArgs, PersistResult>(
         "persistence",
         getMiddlewaresFor("persistence"),
         defaultPersistenceTerminal,
@@ -2955,9 +2961,30 @@ export async function runAgentLoopImpl(
         },
         buildPluginTurnContext(ctx, reqId),
         DEFAULT_TIMEOUTS.persistence,
-      );
+      )) as PersistAddResult;
       persistedErrorAssistantMessage = true;
       newMessages.push(errorAssistantMessage);
+      // Pipe the just-assigned message id into any orphaned LLM request log
+      // row(s) for this turn. The success path links rows via
+      // `handleMessageComplete` -> `backfillMessageIdOnLogs`, but provider-
+      // failure turns never fire `message_complete` (the synthetic assistant
+      // message is persisted directly above), so without this call the rows
+      // from `handleProviderError` stay with `message_id IS NULL` and a
+      // later turn's backfill sweep would wrongly attach them to that turn's
+      // assistant message. Scope is per-conversation, so concurrent runs on
+      // other conversations cannot collide. Non-fatal — a DB hiccup must
+      // not escalate a provider rejection into a turn-level throw.
+      try {
+        backfillMessageIdOnLogs(
+          ctx.conversationId,
+          errorPersistResult.message.id,
+        );
+      } catch (err) {
+        rlog.warn(
+          { err },
+          "Failed to backfill message_id on provider-error LLM request logs (non-fatal)",
+        );
+      }
       // Do NOT send assistant_text_delta here — handleProviderError already
       // emitted a conversation_error event for this same error text, and the
       // client renders it as an InlineChatErrorAlert. Sending a text delta

package/src/daemon/conversation-runtime-assembly.ts CHANGED Viewed

@@ -1652,6 +1652,7 @@ const RUNTIME_INJECTION_PREFIXES = [
   "<interface_turn_context>", // backward-compat: strip legacy separate interface blocks
   // NOTE: <turn_context> is intentionally NOT stripped — unified turn context
   // blocks persist in history so the assistant retains temporal/actor grounding.
+  "<background_turn>",
   "<memory_context __injected>",
   "<memory_context>", // backward-compat: strip legacy blocks from pre-__injected history
   // The static `memory-v2-static` block (opens `<memory>\n…`) IS stripped
@@ -1966,6 +1967,13 @@ export interface RuntimeInjectionOptions {
   nowScratchpad?: string | null;
   subagentStatusBlock?: string | null;
   isNonInteractive?: boolean;
+  /**
+   * True when the active conversation's type is "background" or "scheduled".
+   * Forwarded to {@link TurnInjectionInputs.isBackgroundConversation} so the
+   * `background-turn` injector can wrap the tail user message with the
+   * configured reminder.
+   */
+  isBackgroundConversation?: boolean;
   transportHints?: string[] | null;
   slackRuntimeContextNotice?: string | null;
   /**
@@ -2056,6 +2064,7 @@ function buildTurnInjectionInputs(
     voiceCallControlPrompt: options.voiceCallControlPrompt,
     transportHints: options.transportHints,
     isNonInteractive: options.isNonInteractive,
+    isBackgroundConversation: options.isBackgroundConversation,
     activeDocuments: options.activeDocuments,
   };
 }

package/src/daemon/conversation.ts CHANGED Viewed

@@ -54,7 +54,6 @@ import {
   getConversationOriginChannel,
   getConversationOverrideProfileFromRow,
 } from "../memory/conversation-crud.js";
-import { isBackgroundConversationType } from "../memory/conversation-types.js";
 import { ConversationGraphMemory } from "../memory/graph/conversation-graph-memory.js";
 import { shouldExposePersonalMemory } from "../memory/v2/static-context.js";
 import { PermissionPrompter } from "../permissions/prompter.js";
@@ -489,9 +488,6 @@ export class Conversation {
                 channelPersona: persona.channelPersona,
                 userSlug: persona.userSlug,
                 onboardingContext: this.getOnboardingContext(),
-                isBackgroundConversation: isBackgroundConversationType(
-                  getConversation(this.conversationId)?.conversationType,
-                ),
               });
             })(),
       };
@@ -583,9 +579,6 @@ export class Conversation {
             channelPersona: persona.channelPersona,
             userSlug: persona.userSlug,
             onboardingContext: this.getOnboardingContext(),
-            isBackgroundConversation: isBackgroundConversationType(
-              getConversation(this.conversationId)?.conversationType,
-            ),
           });
         })();
     const tools = buildToolDefinitions();

package/src/daemon/date-context.ts CHANGED Viewed

@@ -326,6 +326,46 @@ function formatLocalDate(date: Date, timeZone: string): string {
   ).padStart(2, "0")}`;
 }
+const localTimestampFormatterCache = new Map<string, Intl.DateTimeFormat>(); // one formatter per timeZone string, filled lazily
+function getLocalTimestampFormatter(timeZone: string): Intl.DateTimeFormat { // returns the cached formatter for timeZone, building it on first use
+  let fmt = localTimestampFormatterCache.get(timeZone); // undefined on the first request for this zone
+  if (!fmt) {
+    fmt = new Intl.DateTimeFormat("en-CA", {
+      timeZone,
+      year: "numeric",
+      month: "2-digit",
+      day: "2-digit",
+      hour: "2-digit",
+      minute: "2-digit",
+      second: "2-digit",
+      hourCycle: "h23", // 24-hour clock with hours 00-23
+    });
+    localTimestampFormatterCache.set(timeZone, fmt); // reached only if the constructor above did not throw
+  }
+  return fmt;
+}
+/**
+ * Format an epoch-millis instant as `YYYY-MM-DD HH:MM:SS` in the given
+ * IANA timezone. When `timeZone` is omitted or `"UTC"`, falls back to a
+ * pure-UTC `toISOString` slice so callers can opt in incrementally.
+ *
+ * The internal `Intl.DateTimeFormat` is memoized by `timeZone` because
+ * constructing it is ~1ms in V8 — material when rendering long transcripts.
+ *
+ * @param ms - Instant to format, in milliseconds since the Unix epoch.
+ * @param timeZone - Timezone handed to `Intl.DateTimeFormat`. An empty
+ *   string is treated the same as omitted, i.e. the UTC path is taken.
+ * @returns The timestamp as `YYYY-MM-DD HH:MM:SS`, with no fractional
+ *   seconds and no zone suffix.
+ * @throws RangeError when `ms` does not map to a valid Date (both
+ *   `toISOString` and `formatToParts` reject an invalid time value), or
+ *   when `Intl.DateTimeFormat` rejects `timeZone`.
+ */
+export function formatLocalTimestamp(ms: number, timeZone?: string): string {
+  if (!timeZone || timeZone === "UTC") {
+    return new Date(ms).toISOString().replace("T", " ").slice(0, 19); // "2024-01-02T03:04:05.678Z" -> "2024-01-02 03:04:05"
+  }
+  const parts = getLocalTimestampFormatter(timeZone).formatToParts(
+    new Date(ms),
+  );
+  const v: Record<string, string> = {};
+  for (const p of parts) v[p.type] = p.value; // index values by part type; "literal" separators land here too but are never read
+  return `${v.year}-${v.month}-${v.day} ${v.hour}:${v.minute}:${v.second}`;
+}
 export function resolveTurnTimezoneContext(
   options: TemporalContextOptions = {},
 ): TurnTimezoneContext {