npm - @vellumai/assistant - Versions diffs - 0.4.23 → 0.4.26 - Mend

@vellumai/assistant 0.4.23 → 0.4.26

This diff shows the differences between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions exactly as they appear in their respective public registries.

Files changed (63)

package/bun.lock +3 -0
package/package.json +2 -1
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +0 -15
package/src/__tests__/assistant-events-sse-hardening.test.ts +9 -3
package/src/__tests__/call-controller.test.ts +80 -0
package/src/__tests__/config-schema.test.ts +38 -178
package/src/__tests__/conversation-routes-guardian-reply.test.ts +4 -1
package/src/__tests__/credential-security-invariants.test.ts +0 -2
package/src/__tests__/guardian-verify-setup-skill-regression.test.ts +2 -2
package/src/__tests__/ipc-snapshot.test.ts +0 -9
package/src/__tests__/onboarding-template-contract.test.ts +10 -20
package/src/__tests__/relay-server.test.ts +3 -3
package/src/__tests__/runtime-events-sse-parity.test.ts +10 -0
package/src/__tests__/runtime-events-sse.test.ts +7 -0
package/src/__tests__/session-runtime-assembly.test.ts +34 -8
package/src/__tests__/system-prompt.test.ts +7 -1
package/src/__tests__/trusted-contact-approval-notifier.test.ts +12 -8
package/src/__tests__/twilio-routes-twiml.test.ts +2 -2
package/src/__tests__/twilio-routes.test.ts +2 -3
package/src/__tests__/voice-quality.test.ts +21 -132
package/src/calls/call-controller.ts +34 -29
package/src/calls/relay-server.ts +11 -5
package/src/calls/twilio-routes.ts +4 -38
package/src/calls/voice-quality.ts +7 -63
package/src/config/bundled-skills/guardian-verify-setup/SKILL.md +7 -10
package/src/config/bundled-skills/messaging/SKILL.md +3 -5
package/src/config/bundled-skills/phone-calls/SKILL.md +144 -83
package/src/config/bundled-skills/sms-setup/SKILL.md +0 -20
package/src/config/bundled-skills/twilio-setup/SKILL.md +9 -17
package/src/config/bundled-skills/voice-setup/SKILL.md +36 -1
package/src/config/bundled-skills/voice-setup/icon.svg +20 -0
package/src/config/calls-schema.ts +3 -53
package/src/config/elevenlabs-schema.ts +33 -0
package/src/config/schema.ts +183 -137
package/src/config/types.ts +0 -1
package/src/daemon/handlers/browser.ts +1 -6
package/src/daemon/ipc-contract/browser.ts +5 -14
package/src/daemon/ipc-contract-inventory.json +0 -2
package/src/daemon/session-agent-loop-handlers.ts +3 -0
package/src/daemon/session-runtime-assembly.ts +9 -7
package/src/mcp/client.ts +2 -1
package/src/memory/conversation-crud.ts +339 -166
package/src/runtime/auth/middleware.ts +87 -26
package/src/runtime/routes/events-routes.ts +7 -0
package/src/runtime/routes/inbound-message-handler.ts +3 -4
package/src/schedule/scheduler.ts +159 -45
package/src/security/secure-keys.ts +3 -3
package/src/tools/browser/browser-manager.ts +72 -228
package/src/tools/browser/browser-screencast.ts +0 -5
package/src/tools/network/script-proxy/certs.ts +7 -237
package/src/tools/network/script-proxy/connect-tunnel.ts +1 -82
package/src/tools/network/script-proxy/http-forwarder.ts +2 -151
package/src/tools/network/script-proxy/logging.ts +12 -196
package/src/tools/network/script-proxy/mitm-handler.ts +2 -270
package/src/tools/network/script-proxy/policy.ts +4 -152
package/src/tools/network/script-proxy/router.ts +2 -60
package/src/tools/network/script-proxy/server.ts +5 -137
package/src/tools/network/script-proxy/types.ts +19 -125
package/src/tools/system/voice-config.ts +23 -1
package/src/util/logger.ts +4 -1
package/src/__tests__/elevenlabs-config.test.ts +0 -95
package/src/__tests__/twilio-routes-elevenlabs.test.ts +0 -407
package/src/calls/elevenlabs-config.ts +0 -32

package/src/__tests__/runtime-events-sse-parity.test.ts CHANGED Viewed

@@ -106,6 +106,11 @@ async function publishAndReadFrame(
   await assistantEventHub.publish(event);
   const reader = response.body!.getReader();
+  // The first chunk is the immediate heartbeat comment enqueued in start().
+  await reader.read();
+  // The second chunk is the actual assistant event.
   const { value } = await reader.read();
   ac.abort();
@@ -366,6 +371,11 @@ describe("SSE IPC parity — streaming/delta message types", () => {
     await assistantEventHub.publish(published);
     const reader = response.body!.getReader();
+    // The first chunk is the immediate heartbeat comment enqueued in start().
+    await reader.read();
+    // The second chunk is the actual assistant event.
     const { value } = await reader.read();
     ac.abort();

package/src/__tests__/runtime-events-sse.test.ts CHANGED Viewed

@@ -168,6 +168,13 @@ describe("SSE assistant-events endpoint", () => {
     // Read the first frame directly from the response body stream.
     const reader = response.body!.getReader();
+    // The first chunk is the immediate heartbeat comment enqueued in start().
+    const initial = await reader.read();
+    expect(initial.done).toBe(false);
+    expect(new TextDecoder().decode(initial.value)).toBe(": heartbeat\n\n");
+    // The second chunk is the actual assistant event.
     const { value, done } = await reader.read();
     ac.abort();

package/src/__tests__/session-runtime-assembly.test.ts CHANGED Viewed

@@ -44,6 +44,14 @@ describe("resolveChannelCapabilities", () => {
     expect(caps.supportsVoiceInput).toBe(true);
   });
+  test("vellum channel with vellum interface supports dynamic UI", () => {
+    const caps = resolveChannelCapabilities("vellum", "vellum");
+    expect(caps.channel).toBe("vellum");
+    expect(caps.dashboardCapable).toBe(false);
+    expect(caps.supportsDynamicUi).toBe(true);
+    expect(caps.supportsVoiceInput).toBe(false);
+  });
   test("defaults to vellum for null source channel", () => {
     const caps = resolveChannelCapabilities(null);
     expect(caps.channel).toBe("vellum");
@@ -407,6 +415,24 @@ describe("trust-gating via channel capabilities", () => {
     expect(injected).toContain("Present information as well-formatted text");
     expect(injected).toContain("desktop app");
   });
+  test("vellum web interface allows dynamic UI but constrains dashboard references", () => {
+    const caps = resolveChannelCapabilities("vellum", "vellum");
+    const message: Message = {
+      role: "user",
+      content: [{ type: "text", text: "Show me a form" }],
+    };
+    const result = injectChannelCapabilityContext(message, caps);
+    const injected = (result.content[0] as { type: "text"; text: string }).text;
+    expect(injected).toContain("CHANNEL CONSTRAINTS");
+    expect(injected).toContain("Do NOT reference the dashboard UI");
+    expect(injected).not.toContain("Do NOT use ui_show");
+    expect(injected).not.toContain("Present information as well-formatted text");
+    expect(injected).toContain("supports_dynamic_ui: true");
+    expect(injected).toContain("dashboard_capable: false");
+  });
 });
 // ---------------------------------------------------------------------------
@@ -994,12 +1020,12 @@ describe("sanitizePttActivationKey", () => {
     expect(sanitizePttActivationKey("none")).toBe("none");
   });
-  test('returns "unknown" for invalid keys', () => {
-    expect(sanitizePttActivationKey("malicious\nprompt injection")).toBe(
-      "unknown",
-    );
-    expect(sanitizePttActivationKey("arbitrary_value")).toBe("unknown");
-    expect(sanitizePttActivationKey("")).toBe("unknown");
+  test("returns undefined for invalid keys", () => {
+    expect(
+      sanitizePttActivationKey("malicious\nprompt injection"),
+    ).toBeUndefined();
+    expect(sanitizePttActivationKey("arbitrary_value")).toBeUndefined();
+    expect(sanitizePttActivationKey("")).toBeUndefined();
   });
 });
@@ -1015,11 +1041,11 @@ describe("resolveChannelCapabilities with PTT metadata", () => {
     expect(caps.pttActivationKey).toBe("fn");
   });
-  test("sanitizes invalid pttActivationKey to unknown", () => {
+  test("sanitizes invalid pttActivationKey to undefined", () => {
     const caps = resolveChannelCapabilities("macos", "macos", {
       pttActivationKey: "evil\nprompt",
     });
-    expect(caps.pttActivationKey).toBe("unknown");
+    expect(caps.pttActivationKey).toBeUndefined();
   });
   test("passes through microphonePermissionGranted", () => {

package/src/__tests__/system-prompt.test.ts CHANGED Viewed

@@ -75,9 +75,15 @@ const {
   buildPhoneCallsRoutingSection,
 } = await import("../config/system-prompt.js");
-/** Strip the Configuration and Skills sections so base-prompt tests stay focused. */
+/** Strip the Configuration, Skills, and hardcoded preamble sections so base-prompt tests stay focused. */
 function basePrompt(result: string): string {
   let s = result;
+  // Strip the hardcoded em-dash instruction preamble
+  const emDashLine =
+    "IMPORTANT: Never use em dashes (\u2014) in your messages. Use commas, periods, or just start a new sentence instead.";
+  if (s.startsWith(emDashLine)) {
+    s = s.slice(emDashLine.length).replace(/^\n\n/, "");
+  }
   for (const heading of [
     "## Configuration",
     "## Skills Catalog",

package/src/__tests__/trusted-contact-approval-notifier.test.ts CHANGED Viewed

@@ -120,8 +120,14 @@ mock.module("../config/env.js", () => ({
   getGatewayInternalBaseUrl: () => "http://localhost:3000",
 }));
+// ── User reference mock ──
+mock.module("../config/user-reference.js", () => ({
+  resolveUserReference: () => "my human",
+}));
 // Import module under test AFTER mocks are set up
 import type { ChannelId } from "../channels/types.js";
+import { resolveUserReference } from "../config/user-reference.js";
 import type { GuardianContext } from "../runtime/guardian-context-resolver.js";
 // We need to test the private functions by importing the module.
@@ -220,9 +226,7 @@ async function simulateNotifierPoll(params: {
     }
   }
-  const waitingText = guardianName
-    ? `Waiting for ${guardianName}'s approval...`
-    : "Waiting for your guardian's approval...";
+  const waitingText = `Waiting for ${guardianName ?? resolveUserReference()}'s approval...`;
   try {
     await deliverChannelReply(
@@ -330,7 +334,7 @@ describe("trusted-contact pending-approval notifier", () => {
     );
   });
-  test("uses generic phrasing when no guardian name is available", async () => {
+  test("falls back to user reference when no guardian name is available", async () => {
     mockPendingApprovals = [
       {
         requestId: "req-3",
@@ -359,11 +363,11 @@ describe("trusted-contact pending-approval notifier", () => {
     expect(deliveredReplies).toHaveLength(1);
     expect(deliveredReplies[0].payload.text).toBe(
-      "Waiting for your guardian's approval...",
+      "Waiting for my human's approval...",
     );
   });
-  test("uses generic phrasing when no guardian binding exists", async () => {
+  test("falls back to user reference when no guardian binding exists", async () => {
     mockPendingApprovals = [
       {
         requestId: "req-4",
@@ -388,7 +392,7 @@ describe("trusted-contact pending-approval notifier", () => {
     expect(deliveredReplies).toHaveLength(1);
     expect(deliveredReplies[0].payload.text).toBe(
-      "Waiting for your guardian's approval...",
+      "Waiting for my human's approval...",
     );
   });
@@ -736,7 +740,7 @@ describe("trusted-contact pending-approval notifier", () => {
     expect(deliveredReplies).toHaveLength(1);
     // Falls back to generic phrasing
     expect(deliveredReplies[0].payload.text).toBe(
-      "Waiting for your guardian's approval...",
+      "Waiting for my human's approval...",
     );
   });
 });

package/src/__tests__/twilio-routes-twiml.test.ts CHANGED Viewed

@@ -46,7 +46,7 @@ describe("generateTwiML with voice quality profile", () => {
     expect(twiml).toContain('voice="voice123-turbo_v2_5-1_0.5_0.75"');
   });
-  test("voice attribute reflects configured voice for twilio_standard mode", () => {
+  test("voice attribute reflects configured Google voice", () => {
     const twiml = generateTwiML(callSessionId, relayUrl, welcomeGreeting, {
       language: "en-US",
       transcriptionProvider: "Deepgram",
@@ -57,7 +57,7 @@ describe("generateTwiML with voice quality profile", () => {
     expect(twiml).toContain('voice="Google.en-US-Journey-O"');
   });
-  test("voice attribute reflects configured voice for twilio_elevenlabs_tts mode", () => {
+  test("voice attribute reflects configured ElevenLabs voice", () => {
     const twiml = generateTwiML(callSessionId, relayUrl, welcomeGreeting, {
       language: "en-US",
       transcriptionProvider: "Deepgram",

package/src/__tests__/twilio-routes.test.ts CHANGED Viewed

@@ -60,13 +60,12 @@ const mockConfigObj = {
   memory: { enabled: false },
   rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
   secretDetection: { enabled: false },
+  elevenlabs: { voiceId: "21m00Tcm4TlvDq8ikWAM" },
   calls: {
     voice: {
-      mode: "twilio_standard",
       language: "en-US",
       transcriptionProvider: "Deepgram",
-      fallbackToStandardOnError: true,
-      elevenlabs: { voiceId: "" },
+      elevenlabs: {},
     },
   },
 };

package/src/__tests__/voice-quality.test.ts CHANGED Viewed

@@ -8,7 +8,6 @@ mock.module("../config/loader.js", () => ({
 import {
   buildElevenLabsVoiceSpec,
-  isVoiceProfileValid,
   resolveVoiceQualityProfile,
 } from "../calls/voice-quality.js";
@@ -62,176 +61,66 @@ describe("buildElevenLabsVoiceSpec", () => {
 });
 describe("resolveVoiceQualityProfile", () => {
-  test("returns standard profile for twilio_standard mode", () => {
+  test("always returns ElevenLabs ttsProvider", () => {
     mockConfig = {
+      elevenlabs: { voiceId: "21m00Tcm4TlvDq8ikWAM" },
       calls: {
         voice: {
-          mode: "twilio_standard",
           language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: {},
-        },
-      },
-    };
-    const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_standard");
-    expect(profile.ttsProvider).toBe("Google");
-    expect(profile.voice).toBe("Google.en-US-Journey-O");
-    expect(profile.validationErrors).toHaveLength(0);
-  });
-  test("returns elevenlabs profile for twilio_elevenlabs_tts mode", () => {
-    mockConfig = {
-      calls: {
-        voice: {
-          mode: "twilio_elevenlabs_tts",
-          language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: { voiceId: "elvoice1" },
+          transcriptionProvider: "Deepgram",
         },
       },
     };
     const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_elevenlabs_tts");
     expect(profile.ttsProvider).toBe("ElevenLabs");
-    expect(profile.voice).toBe("elvoice1");
-    expect(profile.validationErrors).toHaveLength(0);
-  });
-  test("falls back to standard when voiceId missing and fallback enabled", () => {
-    mockConfig = {
-      calls: {
-        voice: {
-          mode: "twilio_elevenlabs_tts",
-          language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: true,
-          elevenlabs: { voiceId: "" },
-        },
-      },
-    };
-    const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_standard");
-    expect(profile.validationErrors.length).toBeGreaterThan(0);
-    expect(profile.validationErrors[0]).toContain("falling back");
-  });
-  test("returns validation error when voiceId missing and fallback disabled", () => {
-    mockConfig = {
-      calls: {
-        voice: {
-          mode: "twilio_elevenlabs_tts",
-          language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: { voiceId: "" },
-        },
-      },
-    };
-    const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_elevenlabs_tts");
-    expect(profile.validationErrors.length).toBeGreaterThan(0);
-    expect(profile.validationErrors[0]).toContain("voiceId is required");
   });
-  test("returns elevenlabs_agent profile with agentId", () => {
+  test("voice ID comes from elevenlabs.voiceId", () => {
     mockConfig = {
+      elevenlabs: { voiceId: "custom-voice-123" },
       calls: {
         voice: {
-          mode: "elevenlabs_agent",
           language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: { voiceId: "voice1", agentId: "agent123" },
+          transcriptionProvider: "Deepgram",
         },
       },
     };
     const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("elevenlabs_agent");
-    expect(profile.agentId).toBe("agent123");
-    expect(profile.validationErrors).toHaveLength(0);
+    expect(profile.voice).toBe("custom-voice-123");
   });
-  test("falls back to standard when agentId missing and fallback enabled", () => {
+  test("uses language from calls.voice config", () => {
     mockConfig = {
+      elevenlabs: { voiceId: "abc" },
       calls: {
         voice: {
-          mode: "elevenlabs_agent",
-          language: "en-US",
+          language: "es-MX",
           transcriptionProvider: "Google",
-          fallbackToStandardOnError: true,
-          elevenlabs: { voiceId: "voice1", agentId: "" },
         },
       },
     };
     const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_standard");
-    expect(profile.validationErrors[0]).toContain("falling back");
+    expect(profile.language).toBe("es-MX");
+    expect(profile.transcriptionProvider).toBe("Google");
   });
-  test("returns validation error when agentId missing and fallback disabled", () => {
+  test("builds voice spec with model and tuning params", () => {
     mockConfig = {
-      calls: {
-        voice: {
-          mode: "elevenlabs_agent",
-          language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: { voiceId: "voice1", agentId: "" },
-        },
+      elevenlabs: {
+        voiceId: "voice1",
+        voiceModelId: "turbo_v2_5",
+        speed: 0.9,
+        stability: 0.8,
+        similarityBoost: 0.9,
       },
-    };
-    const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("elevenlabs_agent");
-    expect(profile.validationErrors.length).toBeGreaterThan(0);
-    expect(profile.validationErrors[0]).toContain("agentId is required");
-  });
-  test("returns standard profile for unknown mode", () => {
-    mockConfig = {
       calls: {
         voice: {
-          mode: "unknown_mode",
           language: "en-US",
-          transcriptionProvider: "Google",
-          fallbackToStandardOnError: false,
-          elevenlabs: {},
+          transcriptionProvider: "Deepgram",
         },
       },
     };
     const profile = resolveVoiceQualityProfile();
-    expect(profile.mode).toBe("twilio_standard");
-  });
-});
-describe("isVoiceProfileValid", () => {
-  test("returns true for profile with no errors", () => {
-    expect(
-      isVoiceProfileValid({
-        mode: "twilio_standard",
-        language: "en-US",
-        transcriptionProvider: "Google",
-        ttsProvider: "Google",
-        voice: "Google.en-US-Journey-O",
-        fallbackToStandardOnError: false,
-        validationErrors: [],
-      }),
-    ).toBe(true);
-  });
-  test("returns false for profile with errors", () => {
-    expect(
-      isVoiceProfileValid({
-        mode: "twilio_elevenlabs_tts",
-        language: "en-US",
-        transcriptionProvider: "Google",
-        ttsProvider: "ElevenLabs",
-        voice: "",
-        fallbackToStandardOnError: false,
-        validationErrors: ["voiceId is required"],
-      }),
-    ).toBe(false);
+    expect(profile.voice).toBe("voice1-turbo_v2_5-0.9_0.8_0.9");
   });
 });

package/src/calls/call-controller.ts CHANGED Viewed

@@ -44,11 +44,13 @@ const log = getLogger('call-controller');
 type ControllerState = 'idle' | 'processing' | 'speaking';
 /**
- * Tracks a pending guardian consultation independently of the controller's
+ * Tracks a pending guardian input request independently of the controller's
  * turn state. This allows the call to continue normal turn processing
- * (idle -> processing -> speaking) while a consultation is outstanding.
+ * (idle -> processing -> speaking) while a guardian consultation is outstanding.
+ * Also used to suppress the silence nudge ("Are you still there?") while
+ * the caller is waiting on a guardian decision.
  */
-interface PendingConsultation {
+interface PendingGuardianInput {
   questionText: string;
   questionId: string;
   toolApprovalMeta: { toolName: string; inputDigest: string } | null;
@@ -191,16 +193,17 @@ export class CallController {
   private durationTimer: ReturnType<typeof setTimeout> | null = null;
   private durationWarningTimer: ReturnType<typeof setTimeout> | null = null;
   /**
-   * Tracks the currently pending guardian consultation, if any. Decoupled
+   * Tracks the currently pending guardian input request, if any. Decoupled
    * from the controller's turn state so callers can continue to trigger
-   * normal turns while consultation is outstanding.
+   * normal turns while a guardian consultation is outstanding. Also
+   * suppresses the silence nudge while non-null.
    */
-  private pendingConsultation: PendingConsultation | null = null;
+  private pendingGuardianInput: PendingGuardianInput | null = null;
   private durationEndTimer: ReturnType<typeof setTimeout> | null = null;
   private task: string | null;
   /** True when the call session was created via the inbound path (no outbound task). */
   private isInbound: boolean;
-  /** Instructions queued while an LLM turn is in-flight or during pending consultation */
+  /** Instructions queued while an LLM turn is in-flight or during pending guardian input */
   private pendingInstructions: string[] = [];
   /** Ensures the call opener is triggered at most once per call. */
   private initialGreetingStarted = false;
@@ -271,7 +274,7 @@ export class CallController {
    * incoming answers to the correct consultation record.
    */
   getPendingConsultationQuestionId(): string | null {
-    return this.pendingConsultation?.questionId ?? null;
+    return this.pendingGuardianInput?.questionId ?? null;
   }
   /**
@@ -357,7 +360,7 @@ export class CallController {
    * speaking.
    */
   async handleUserAnswer(answerText: string): Promise<boolean> {
-    if (!this.pendingConsultation) {
+    if (!this.pendingGuardianInput) {
       log.warn(
         { callSessionId: this.callSessionId, state: this.state },
         'handleUserAnswer called but no pending consultation exists',
@@ -366,8 +369,8 @@ export class CallController {
     }
     // Clear the consultation timeout and record
-    clearTimeout(this.pendingConsultation.timer);
-    this.pendingConsultation = null;
+    clearTimeout(this.pendingGuardianInput.timer);
+    this.pendingGuardianInput = null;
     updateCallSession(this.callSessionId, { status: 'in_progress' });
@@ -436,7 +439,7 @@ export class CallController {
     if (this.silenceTimer) clearTimeout(this.silenceTimer);
     if (this.durationTimer) clearTimeout(this.durationTimer);
     if (this.durationWarningTimer) clearTimeout(this.durationWarningTimer);
-    if (this.pendingConsultation) { clearTimeout(this.pendingConsultation.timer); this.pendingConsultation = null; }
+    if (this.pendingGuardianInput) { clearTimeout(this.pendingGuardianInput.timer); this.pendingGuardianInput = null; }
     if (this.durationEndTimer) { clearTimeout(this.durationEndTimer); this.durationEndTimer = null; }
     this.llmRunVersion++;
     this.abortCurrentTurn();
@@ -713,30 +716,30 @@ export class CallController {
           // the prior pending consultation (preserves tool scope on re-asks).
           const effectiveToolMeta = toolApprovalMeta
             ? { toolName: toolApprovalMeta.toolName, inputDigest: toolApprovalMeta.inputDigest }
-            : this.pendingConsultation?.toolApprovalMeta ?? null;
+            : this.pendingGuardianInput?.toolApprovalMeta ?? null;
           // Coalesce repeated identical asks: if a consultation is already
           // pending for the same tool/action (or same informational question),
           // avoid churning requests and just keep the existing one.
-          if (this.pendingConsultation) {
+          if (this.pendingGuardianInput) {
             const isSameToolAction =
-              effectiveToolMeta && this.pendingConsultation.toolApprovalMeta
-                ? effectiveToolMeta.toolName === this.pendingConsultation.toolApprovalMeta.toolName
-                  && effectiveToolMeta.inputDigest === this.pendingConsultation.toolApprovalMeta.inputDigest
-                : !effectiveToolMeta && !this.pendingConsultation.toolApprovalMeta;
+              effectiveToolMeta && this.pendingGuardianInput.toolApprovalMeta
+                ? effectiveToolMeta.toolName === this.pendingGuardianInput.toolApprovalMeta.toolName
+                  && effectiveToolMeta.inputDigest === this.pendingGuardianInput.toolApprovalMeta.inputDigest
+                : !effectiveToolMeta && !this.pendingGuardianInput.toolApprovalMeta;
             if (isSameToolAction) {
               // Same tool/action — coalesce. Keep the existing consultation
               // alive and skip creating a new request.
               log.info(
-                { callSessionId: this.callSessionId, questionId: this.pendingConsultation.questionId },
+                { callSessionId: this.callSessionId, questionId: this.pendingGuardianInput.questionId },
                 'Coalescing repeated ASK_GUARDIAN — same tool/action already pending',
               );
               recordCallEvent(this.callSessionId, 'guardian_consult_coalesced', { question: questionText });
               // Fall through to normal turn completion (idle + flushPendingInstructions)
             } else {
               // Materially different intent — supersede the old consultation.
-              clearTimeout(this.pendingConsultation.timer);
+              clearTimeout(this.pendingGuardianInput.timer);
               // Expire the previous consultation's storage records so stale
               // guardian answers cannot match the old request.
@@ -752,7 +755,7 @@ export class CallController {
                 );
               }
-              this.pendingConsultation = null;
+              this.pendingGuardianInput = null;
               // Dispatch the new consultation with effective tool metadata.
               // The previous request ID is passed through so the dispatch
@@ -773,10 +776,10 @@ export class CallController {
         // Without this, the consultation timeout can fire on an already-ended
         // call, overwriting 'completed' status back to 'in_progress' and
         // starting a new LLM turn on a dead session. Similarly, a late
-        // handleUserAnswer could be accepted since pendingConsultation is
+        // handleUserAnswer could be accepted since pendingGuardianInput is
         // still non-null.
-        if (this.pendingConsultation) {
-          clearTimeout(this.pendingConsultation.timer);
+        if (this.pendingGuardianInput) {
+          clearTimeout(this.pendingGuardianInput.timer);
           // Expire store-side consultation records so clients don't observe
           // a completed call with a dangling pendingQuestion, and guardian
@@ -787,7 +790,7 @@ export class CallController {
             expireCanonicalGuardianRequest(previousRequest.id);
           }
-          this.pendingConsultation = null;
+          this.pendingGuardianInput = null;
         }
         const currentSession = getCallSession(this.callSessionId);
@@ -928,7 +931,7 @@ export class CallController {
     // record, not the global controller state.
     const consultationTimer = setTimeout(() => {
       // Only fire if this consultation is still the active one
-      if (!this.pendingConsultation || this.pendingConsultation.questionId !== pendingQuestion.id) return;
+      if (!this.pendingGuardianInput || this.pendingGuardianInput.questionId !== pendingQuestion.id) return;
       log.info({ callSessionId: this.callSessionId }, 'Guardian consultation timed out');
@@ -960,7 +963,7 @@ export class CallController {
       // Expire pending questions and update call state
       expirePendingQuestions(this.callSessionId);
-      this.pendingConsultation = null;
+      this.pendingGuardianInput = null;
       updateCallSession(this.callSessionId, { status: 'in_progress' });
       this.guardianUnavailableForCall = true;
       recordCallEvent(this.callSessionId, 'guardian_consultation_timed_out', { question: questionText });
@@ -982,7 +985,7 @@ export class CallController {
       }
     }, getUserConsultationTimeoutMs());
-    this.pendingConsultation = {
+    this.pendingGuardianInput = {
       questionText,
       questionId: pendingQuestion.id,
       toolApprovalMeta: effectiveToolMeta,
@@ -1067,7 +1070,9 @@ export class CallController {
       // During guardian wait states, the relay heartbeat timer handles
       // periodic updates — suppress the generic "Are you still there?"
       // which is confusing when the caller is waiting on a decision.
-      if (this.relay.getConnectionState() === 'awaiting_guardian_decision') {
+      // Two paths: in-call consultation (pendingGuardianInput) and
+      // inbound access-request wait (relay state).
+      if (this.pendingGuardianInput || this.relay.getConnectionState() === 'awaiting_guardian_decision') {
         log.debug({ callSessionId: this.callSessionId }, 'Silence timeout suppressed during guardian wait');
         return;
       }

package/src/calls/relay-server.ts CHANGED Viewed

@@ -11,6 +11,7 @@ import { randomInt } from 'node:crypto';
 import type { ServerWebSocket } from 'bun';
 import { getConfig } from '../config/loader.js';
+import { resolveUserReference } from '../config/user-reference.js';
 import { getAssistantName } from '../daemon/identity-helpers.js';
 import { getCanonicalGuardianRequest } from '../memory/canonical-guardian-store.js';
 import { listActiveBindingsByAssistant } from '../memory/channel-guardian-store.js';
@@ -1214,10 +1215,14 @@ export class RelayConnection {
     updateCallSession(this.callSessionId, { status: 'waiting_on_user' });
-    // Start the heartbeat timer for periodic progress updates
-    this.accessRequestWaitStartedAt = Date.now();
+    // Start the heartbeat timer for periodic progress updates.
+    // Delay the first heartbeat by the estimated TTS playback duration so
+    // the initial hold message finishes before any heartbeat fires.
     this.heartbeatSequence = 0;
-    this.scheduleNextHeartbeat();
+    this.accessRequestHeartbeatTimer = setTimeout(() => {
+      this.accessRequestWaitStartedAt = Date.now();
+      this.scheduleNextHeartbeat();
+    }, getTtsPlaybackDelayMs());
     // Poll the canonical request status
     this.accessRequestPollTimer = setInterval(() => {
@@ -1658,7 +1663,7 @@ export class RelayConnection {
   /**
    * Resolve a human-readable guardian label for voice wait copy.
    * Prefers displayName from the guardian binding metadata, falls back
-   * to @username, then "my guardian".
+   * to @username, then the user's preferred name from USER.md.
    */
   private resolveGuardianLabel(): string {
     const assistantId = this.accessRequestAssistantId ?? DAEMON_INTERNAL_ASSISTANT_ID;
@@ -1690,7 +1695,8 @@ export class RelayConnection {
         // ignore malformed metadata
       }
     }
-    return 'my guardian';
+    return resolveUserReference();
   }
   /**