npm - @vellumai/assistant - Versions diffs - 0.3.16 → 0.3.19 - Mend

@vellumai/assistant 0.3.16 → 0.3.19

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (114)

package/ARCHITECTURE.md +74 -13
package/README.md +6 -0
package/docs/architecture/http-token-refresh.md +23 -1
package/docs/architecture/security.md +80 -0
package/package.json +1 -1
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +4 -0
package/src/__tests__/access-request-decision.test.ts +4 -7
package/src/__tests__/call-controller.test.ts +170 -0
package/src/__tests__/channel-guardian.test.ts +3 -1
package/src/__tests__/checker.test.ts +139 -48
package/src/__tests__/config-watcher.test.ts +11 -13
package/src/__tests__/conversation-pairing.test.ts +103 -3
package/src/__tests__/guardian-action-conversation-turn.test.ts +1 -1
package/src/__tests__/guardian-action-followup-executor.test.ts +1 -1
package/src/__tests__/guardian-action-grant-mint-consume.test.ts +511 -0
package/src/__tests__/guardian-action-late-reply.test.ts +131 -0
package/src/__tests__/guardian-action-store.test.ts +182 -0
package/src/__tests__/guardian-dispatch.test.ts +180 -0
package/src/__tests__/guardian-grant-minting.test.ts +543 -0
package/src/__tests__/ipc-snapshot.test.ts +22 -0
package/src/__tests__/non-member-access-request.test.ts +1 -2
package/src/__tests__/notification-broadcaster.test.ts +115 -4
package/src/__tests__/notification-decision-strategy.test.ts +2 -1
package/src/__tests__/notification-deep-link.test.ts +44 -1
package/src/__tests__/notification-guardian-path.test.ts +157 -0
package/src/__tests__/notification-thread-candidate-validation.test.ts +215 -0
package/src/__tests__/remote-skill-policy.test.ts +215 -0
package/src/__tests__/scoped-approval-grants.test.ts +521 -0
package/src/__tests__/scoped-grant-security-matrix.test.ts +443 -0
package/src/__tests__/slack-channel-config.test.ts +3 -3
package/src/__tests__/trust-store.test.ts +23 -21
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +5 -7
package/src/__tests__/trusted-contact-multichannel.test.ts +2 -6
package/src/__tests__/trusted-contact-verification.test.ts +9 -9
package/src/__tests__/update-bulletin-state.test.ts +1 -1
package/src/__tests__/update-bulletin.test.ts +66 -3
package/src/__tests__/update-template-contract.test.ts +6 -11
package/src/__tests__/voice-scoped-grant-consumer.test.ts +571 -0
package/src/__tests__/voice-session-bridge.test.ts +109 -9
package/src/calls/call-controller.ts +150 -8
package/src/calls/call-domain.ts +12 -0
package/src/calls/guardian-action-sweep.ts +1 -1
package/src/calls/guardian-dispatch.ts +16 -0
package/src/calls/relay-server.ts +13 -0
package/src/calls/voice-session-bridge.ts +46 -5
package/src/cli/core-commands.ts +41 -1
package/src/config/bundled-skills/notifications/SKILL.md +18 -0
package/src/config/schema.ts +6 -0
package/src/config/skills-schema.ts +27 -0
package/src/config/templates/UPDATES.md +5 -6
package/src/config/update-bulletin-format.ts +2 -0
package/src/config/update-bulletin-state.ts +1 -1
package/src/config/update-bulletin-template-path.ts +6 -0
package/src/config/update-bulletin.ts +21 -6
package/src/daemon/config-watcher.ts +3 -2
package/src/daemon/daemon-control.ts +64 -10
package/src/daemon/handlers/config-channels.ts +18 -0
package/src/daemon/handlers/config-slack-channel.ts +1 -1
package/src/daemon/handlers/identity.ts +45 -25
package/src/daemon/handlers/sessions.ts +1 -1
package/src/daemon/handlers/skills.ts +45 -2
package/src/daemon/ipc-contract/sessions.ts +1 -1
package/src/daemon/ipc-contract/skills.ts +1 -0
package/src/daemon/ipc-contract/workspace.ts +12 -1
package/src/daemon/ipc-contract-inventory.json +1 -0
package/src/daemon/lifecycle.ts +8 -0
package/src/daemon/server.ts +25 -3
package/src/daemon/session-process.ts +450 -184
package/src/daemon/tls-certs.ts +17 -12
package/src/daemon/tool-side-effects.ts +1 -1
package/src/memory/channel-delivery-store.ts +18 -20
package/src/memory/channel-guardian-store.ts +39 -42
package/src/memory/conversation-crud.ts +2 -2
package/src/memory/conversation-queries.ts +2 -2
package/src/memory/conversation-store.ts +24 -25
package/src/memory/db-init.ts +17 -1
package/src/memory/embedding-local.ts +16 -7
package/src/memory/fts-reconciler.ts +41 -26
package/src/memory/guardian-action-store.ts +65 -7
package/src/memory/guardian-verification.ts +1 -0
package/src/memory/jobs-worker.ts +2 -2
package/src/memory/migrations/032-guardian-delivery-conversation-index.ts +15 -0
package/src/memory/migrations/032-notification-delivery-thread-decision.ts +20 -0
package/src/memory/migrations/033-scoped-approval-grants.ts +51 -0
package/src/memory/migrations/034-guardian-action-tool-metadata.ts +12 -0
package/src/memory/migrations/index.ts +6 -2
package/src/memory/schema-migration.ts +1 -0
package/src/memory/schema.ts +36 -1
package/src/memory/scoped-approval-grants.ts +509 -0
package/src/memory/search/semantic.ts +3 -3
package/src/notifications/README.md +158 -17
package/src/notifications/broadcaster.ts +68 -50
package/src/notifications/conversation-pairing.ts +96 -18
package/src/notifications/decision-engine.ts +6 -3
package/src/notifications/deliveries-store.ts +12 -0
package/src/notifications/emit-signal.ts +1 -0
package/src/notifications/thread-candidates.ts +60 -25
package/src/notifications/types.ts +2 -1
package/src/permissions/checker.ts +28 -16
package/src/permissions/defaults.ts +14 -4
package/src/runtime/guardian-action-followup-executor.ts +1 -1
package/src/runtime/guardian-action-grant-minter.ts +97 -0
package/src/runtime/http-server.ts +11 -11
package/src/runtime/routes/access-request-decision.ts +1 -1
package/src/runtime/routes/debug-routes.ts +4 -4
package/src/runtime/routes/guardian-approval-interception.ts +120 -4
package/src/runtime/routes/inbound-message-handler.ts +100 -33
package/src/runtime/routes/integration-routes.ts +2 -2
package/src/security/tool-approval-digest.ts +67 -0
package/src/skills/remote-skill-policy.ts +131 -0
package/src/tools/permission-checker.ts +1 -2
package/src/tools/secret-detection-handler.ts +1 -1
package/src/tools/system/voice-config.ts +1 -1
package/src/version.ts +29 -2

package/src/notifications/README.md CHANGED Viewed

@@ -5,22 +5,51 @@ Signal-driven notification architecture where producers emit free-form events an
 ## Lifecycle
 ```
-Producer → NotificationSignal → Decision Engine (LLM) → Deterministic Checks → Broadcaster → Conversation Pairing → Adapters → Delivery
-                                       ↑                                                            ↓
-                               Preference Summary                                    notification_thread_created IPC
+Producer → NotificationSignal → Candidate Generation → Decision Engine (LLM) → Deterministic Checks → Broadcaster → Conversation Pairing → Adapters → Delivery
+                                                              ↑                                                            ↓
+                                                      Preference Summary                                    notification_thread_created IPC
+                                                      Thread Candidates                                     (creation-only — not emitted on reuse)
 ```
 ### 1. Signal
 A producer calls `emitNotificationSignal()` with a free-form event name, attention hints (urgency, requiresAction, deadlineAt), and a context payload. The signal is persisted as a `notification_events` row.
-### 2. Decision
+### 2. Candidate Generation
-The decision engine (`decision-engine.ts`) sends the signal to an LLM (configured via `notifications.decisionModelIntent`) along with available channels and the user's preference summary. The LLM responds with a structured decision: whether to notify, which channels, rendered copy per channel, and a deduplication key.
+Before the decision engine runs, the system builds a **thread candidate set** per channel (`thread-candidates.ts`). This is a compact snapshot of recent notification-sourced conversations that the decision engine can choose to reuse instead of starting a new thread.
-When the LLM is unavailable or returns invalid output, a deterministic fallback fires: high-urgency + requires-action signals notify on all channels; everything else is suppressed.
+**How candidates are generated:**
-### 3. Deterministic Checks
+- For each selected channel, the system queries `notification_deliveries` joined with `notification_decisions` and `notification_events` to find conversations that were created by the notification pipeline within the last 24 hours.
+- Up to 5 candidates per channel are returned, deduplicated by conversation ID, most-recent first.
+- Each candidate includes: `conversationId`, `title`, `updatedAt`, `latestSourceEventName`, and `channel`.
+- **Guardian context enrichment**: When candidates exist, a batch query counts pending (unresolved) guardian approval requests per conversation. Candidates with `pendingUnresolvedRequestCount > 0` carry a `guardianContext` field so the LLM can make informed reuse decisions for threads with active guardian questions.
+- **Candidate-affinity hints**: Guardian dispatch (`guardian-dispatch.ts`) includes `activeGuardianRequestCount` in the signal's `contextPayload`. When multiple guardian questions arise in the same call session, this hint nudges the decision engine toward reusing the existing thread rather than creating a new one for each question.
+The candidate set is serialized into a compact `<thread-candidates>` block in the decision engine's system prompt. Candidate generation is wrapped in try/catch — a failure does not block the decision path; the engine simply proceeds without candidates (all channels default to `start_new`).
+### 3. Decision
+The decision engine (`decision-engine.ts`) sends the signal to an LLM (configured via `notifications.decisionModelIntent`) along with available channels, the user's preference summary, and the thread candidate set. The LLM responds with a structured decision: whether to notify, which channels, rendered copy per channel, a deduplication key, and **per-channel thread actions**.
+**Thread actions:** For each selected channel, the LLM decides:
+- `start_new` — create a fresh conversation thread for this delivery.
+- `reuse_existing` — append to an existing candidate thread (must provide a `conversationId` from the candidate set).
+The LLM is guided to prefer `reuse_existing` when the signal is a continuation or update of an existing notification thread (same event type, related context), and `start_new` when the signal is a distinct event deserving its own thread.
+**Validation and fallback:** Thread actions are strictly validated against the candidate set (`validateThreadActions` in `decision-engine.ts`):
+- A `reuse_existing` action with an empty or missing `conversationId` is downgraded to `start_new` with a warning.
+- A `reuse_existing` action referencing a conversation ID not in the candidate set is downgraded to `start_new` with a warning.
+- Unknown action values are silently ignored; the channel defaults to `start_new` downstream.
+- Channels with no thread action in the decision output default to `start_new`.
+When the LLM is unavailable or returns invalid output, a deterministic fallback fires: high-urgency + requires-action signals notify on all channels; everything else is suppressed. The fallback path does not produce thread actions (all channels use `start_new`).
+### 4. Deterministic Checks
 Hard invariants that the LLM cannot override (`deterministic-checks.ts`):
@@ -29,11 +58,11 @@ Hard invariants that the LLM cannot override (`deterministic-checks.ts`):
 - **Channel availability** -- at least one selected channel must be connected
 - **Deduplication** -- same `dedupeKey` within the dedupe window (1 hour default) is suppressed
-### 4. Dispatch
+### 5. Dispatch
 `runtime-dispatch.ts` handles two early-exit cases (shouldNotify=false, no channels), then delegates to the broadcaster.
-### 5. Broadcast, Conversation Pairing, and Delivery
+### 6. Broadcast, Conversation Pairing, and Delivery
 The broadcaster (`broadcaster.ts`) iterates over selected channels (vellum first for fast IPC push), resolves destinations via `destination-resolver.ts`, pairs each delivery with a conversation via `conversation-pairing.ts`, pulls rendered copy from the decision (falling back to `copy-composer.ts` templates), and dispatches through channel adapters. Each delivery attempt is recorded in `notification_deliveries` with `conversation_id`, `message_id`, and `conversation_strategy` columns.
@@ -73,9 +102,19 @@ Each policy defines:
 ## Conversation Pairing Invariant
-**Every notification delivery gets a conversation.** Before the adapter sends a notification, `pairDeliveryWithConversation()` (in `conversation-pairing.ts`) materializes a conversation and seed message based on the channel's conversation strategy:
+**Every notification delivery gets a conversation.** Before the adapter sends a notification, `pairDeliveryWithConversation()` (in `conversation-pairing.ts`) materializes a conversation and seed message based on the channel's conversation strategy and the decision engine's per-channel thread action:
+### Thread Reuse Path (`reuse_existing`)
+When the decision engine selects `reuse_existing` for a channel with a valid candidate `conversationId`:
-- **`start_new_conversation`**: Creates a new conversation with `threadType: 'standard'` and `source: 'notification'`, plus an assistant message containing the thread seed. Memory indexing is skipped on the seed message to prevent notification copy from polluting conversational recall.
+1. The pairing function looks up the target conversation.
+2. If the conversation exists and has `source: 'notification'`, the seed message is **appended** to the existing thread and no new conversation is created. The result has `createdNewConversation: false`.
+3. If the target is invalid (does not exist, or has a different `source`), the function falls back to creating a new conversation and sets `threadDecisionFallbackUsed: true` on the result. A warning is logged with the invalid target details.
+### New Thread Path (`start_new` / default)
+- **`start_new_conversation`**: Creates a new conversation with `threadType: 'standard'` and `source: 'notification'`, plus an assistant message containing the thread seed. Memory indexing is skipped on the seed message to prevent notification copy from polluting conversational recall. The result has `createdNewConversation: true`.
 - **`continue_existing_conversation`**: Currently materializes a background audit conversation per delivery (true continuation via binding key lookup is planned for a future PR). The audit trail records the intended strategy without adding visible sidebar threads.
 - **`not_deliverable`**: Returns `{ conversationId: null, messageId: null }`.
@@ -133,9 +172,22 @@ Take out the trash
 Reminder. Take out the trash. Action required.
 ```
-## Thread Surfacing via `notification_thread_created` IPC
+## Thread Surfacing via `notification_thread_created` IPC (Creation-Only)
-When a vellum notification thread is paired with a conversation (strategy `start_new_conversation`), the broadcaster emits a `notification_thread_created` IPC event **immediately**, before waiting for slower channel deliveries (e.g. Telegram). This avoids a race where a slow Telegram delivery delays the IPC push past the macOS deep-link retry window.
+The `notification_thread_created` IPC event is emitted **only when a brand-new conversation is actually created** by the broadcaster. Reused threads do not trigger this event — the macOS/iOS client already knows about the conversation from the original creation.
+This is enforced in `broadcaster.ts` by gating the IPC emission on both `pairing.createdNewConversation === true` and `pairing.strategy === 'start_new_conversation'`:
+```ts
+// Emit notification_thread_created only when a NEW conversation was
+// actually created. Reusing an existing thread should not fire the IPC
+// event — the client already knows about the conversation.
+if (pairing.createdNewConversation && pairing.strategy === 'start_new_conversation') {
+  // ... emit IPC event
+}
+```
+When a vellum notification thread **is** newly created (strategy `start_new_conversation`), the broadcaster emits the IPC event **immediately**, before waiting for slower channel deliveries (e.g. Telegram). This avoids a race where a slow Telegram delivery delays the IPC push past the macOS deep-link retry window.
 The IPC event payload:
@@ -152,7 +204,12 @@ The macOS/iOS client listens for this event and surfaces the thread in the sideb
 ### Per-Dispatch Thread Callback
-`emitNotificationSignal()` accepts an optional `onThreadCreated` callback. This lets producers run domain side effects (for example, creating cross-channel guardian delivery rows) as soon as vellum pairing occurs, without introducing a second thread-creation path.
+`emitNotificationSignal()` accepts an optional `onThreadCreated` callback (`options.onThreadCreated`). This lets producers run domain side effects (for example, creating cross-channel guardian delivery rows) as soon as vellum pairing occurs, without introducing a second thread-creation path.
+**Important distinction between the two callbacks:**
+- **Per-dispatch `options.onThreadCreated`**: Fires for **both** new and reused vellum conversation pairings. Callers like `dispatchGuardianQuestion` rely on this to create delivery bookkeeping rows before `emitNotificationSignal()` returns, regardless of whether the conversation was newly created or reused.
+- **Class-level `this.onThreadCreated` (IPC)**: Fires **only** when a brand-new conversation is created (`createdNewConversation === true && strategy === 'start_new_conversation'`). This emits the `notification_thread_created` IPC event so macOS/iOS clients surface the new thread in the sidebar. Reused threads do not trigger this event because the client already knows about the conversation.
 ## Reminder Routing Metadata and Trigger-Time Enforcement
@@ -248,8 +305,8 @@ Connected channels are resolved at signal emission time by `getConnectedChannels
 The system uses a single conversation materialization path for **all** notifications -- there are no legacy bypass paths or dual-broadcast mechanisms. Every notification, including guardian questions and ingress escalation alerts, flows through `emitNotificationSignal()`:
 1. `emitNotificationSignal()` evaluates the signal and dispatches to channels.
-2. `NotificationBroadcaster` pairs each delivery with a conversation via `pairDeliveryWithConversation()`.
-3. For vellum deliveries, the broadcaster merges `conversationId` into `deepLinkMetadata` and emits `notification_thread_created`.
+2. `NotificationBroadcaster` pairs each delivery with a conversation via `pairDeliveryWithConversation()`, executing the per-channel thread action (start_new or reuse_existing).
+3. For vellum deliveries, the broadcaster merges `conversationId` into `deepLinkMetadata` and emits `notification_thread_created` only when a new conversation was created (not on reuse).
 Guardian dispatch follows this same path and uses the optional `onThreadCreated` callback to attach guardian-delivery bookkeeping to the canonical vellum conversation.
@@ -257,6 +314,89 @@ Guardian dispatch follows this same path and uses the optional `onThreadCreated`
 For notification flows that create conversations, the conversation must be created **before** the IPC event is emitted. This ensures the macOS client can immediately fetch the conversation contents when it receives the thread-created event.
+## Thread Decision Audit Trail
+Every thread routing decision is persisted for observability:
+### Decision-Level Audit (`notification_decisions`)
+When the decision is persisted, a `threadActions` summary is included in `validationResults`:
+```json
+{
+  "threadActions": {
+    "vellum": "start_new",
+    "telegram": "reuse:conv-abc-123"
+  }
+}
+```
+### Delivery-Level Audit (`notification_deliveries`)
+Three columns on `notification_deliveries` record the per-channel thread decision:
+| Column | Type | Description |
+|--------|------|-------------|
+| `thread_action` | TEXT | `'start_new'` or `'reuse_existing'` — what the model decided |
+| `thread_target_conversation_id` | TEXT | The candidate `conversationId` when action is `reuse_existing` |
+| `thread_decision_fallback_used` | INTEGER | `1` if `reuse_existing` was attempted but the target was invalid, so a new conversation was created instead |
+### Query Examples
+```sql
+-- Thread reuse decisions with fallback tracking
+SELECT d.channel, d.thread_action, d.thread_target_conversation_id,
+       d.thread_decision_fallback_used, d.conversation_id
+FROM notification_deliveries d
+WHERE d.thread_action IS NOT NULL
+ORDER BY d.created_at DESC
+LIMIT 20;
+-- Reuse fallbacks (the reuse target no longer existed or was not a notification-sourced conversation)
+SELECT d.channel, d.thread_target_conversation_id, d.conversation_id
+FROM notification_deliveries d
+WHERE d.thread_decision_fallback_used = 1
+ORDER BY d.created_at DESC;
+```
+## Guardian Multi-Request Disambiguation in Reused Threads
+When the decision engine routes multiple guardian questions to the **same** conversation (via `reuse_existing`), those questions share a single thread. The guardian needs a way to indicate which question they are answering. This is handled via **request-code disambiguation**.
+### How Request Codes Work
+Each `guardian_action_request` is assigned a unique 6-character hex code (e.g. `A1B2C3`) at creation time by `generateRequestCode()` in `guardian-action-store.ts`. The code is included in the notification copy delivered to the guardian.
+### Disambiguation Flow
+The disambiguation logic is identical on all channels — mac/vellum (`session-process.ts`), Telegram, and SMS (`inbound-message-handler.ts`):
+1. **Single pending delivery in the thread**: The guardian's reply is matched to the sole pending request automatically. No request code prefix is needed. This is the **single-match fast path**.
+2. **Multiple pending deliveries in the thread**: The guardian must prefix their reply with the request code of the question they are answering (e.g. `A1B2C3 yes, allow it`). Matching is case-insensitive.
+3. **No code match**: If the guardian's reply does not start with any active request code, a **disambiguation message** is sent back listing all active request codes so the guardian can retry with the correct prefix.
+### Channel Parity
+The disambiguation invariant is enforced identically across:
+- **Mac/Vellum** (`session-process.ts`): Intercepts user messages in conversations with pending guardian action deliveries before the agent loop runs.
+- **Telegram** (`inbound-message-handler.ts`): Intercepts inbound messages matched to conversations with pending guardian action deliveries.
+- **SMS** (`inbound-message-handler.ts`): Same codepath as Telegram.
+All three paths use the same pattern: look up pending deliveries by conversation, apply single-match fast path or request-code prefix matching, and send disambiguation messages via the guardian action message composer when ambiguous.
+### Disambiguation Message Generation
+All disambiguation messages are generated through `composeGuardianActionMessageGenerative()` in `guardian-action-message-composer.ts`, which uses a 2-tier priority chain (LLM generator with deterministic fallback). Three disambiguation scenarios exist:
+| Scenario | When triggered |
+|----------|---------------|
+| `guardian_disambiguation` | Multiple pending approval requests in a thread |
+| `guardian_expired_disambiguation` | Multiple expired requests with late replies |
+| `guardian_followup_disambiguation` | Multiple follow-up deliveries awaiting guardian action |
 ## Key Files
 | File | Purpose |
@@ -264,7 +404,8 @@ For notification flows that create conversations, the conversation must be creat
 | `../channels/config.ts` | Channel policy registry -- single source of truth for per-channel notification behavior |
 | `emit-signal.ts` | Single entry point for producers; orchestrates the full pipeline |
 | `signal.ts` | `NotificationSignal` and `AttentionHints` type definitions |
-| `types.ts` | Channel adapter interfaces, delivery types, decision output contract |
+| `types.ts` | Channel adapter interfaces, delivery types, decision output contract, `ThreadAction` union |
+| `thread-candidates.ts` | Builds per-channel candidate set of recent notification conversations for the decision engine |
 | `conversation-pairing.ts` | Materializes conversation + message per delivery based on channel strategy |
 | `decision-engine.ts` | LLM-based routing with forced tool_choice; deterministic fallback |
 | `deterministic-checks.ts` | Pre-send gate checks (dedupe, source-active, channel availability) |

package/src/notifications/broadcaster.ts CHANGED Viewed

@@ -24,6 +24,7 @@ import type {
   NotificationDecision,
   NotificationDeliveryResult,
   RenderedChannelCopy,
+  ThreadAction,
 } from './types.js';
 const log = getLogger('notif-broadcaster');
@@ -125,8 +126,36 @@ export class NotificationBroadcaster {
         copy = fallbackCopy[channel] ?? { title: 'Notification', body: signal.sourceEventName };
       }
-      // Pair the delivery with a conversation before sending
-      const pairing = await pairDeliveryWithConversation(signal, channel, copy);
+      // Resolve the per-channel thread action from the decision (default: start_new)
+      const threadAction: ThreadAction | undefined = decision.threadActions?.[channel];
+      // Check for duplicate delivery BEFORE pairing to avoid side effects
+      // (e.g. appending seed messages to existing threads) on retry paths
+      // where a delivery row already exists.
+      const persistedDecisionId = decision.persistedDecisionId;
+      const hasPersistedDecision = typeof persistedDecisionId === 'string';
+      if (hasPersistedDecision) {
+        const existingDelivery = findDeliveryByDecisionAndChannel(persistedDecisionId, channel);
+        if (existingDelivery) {
+          log.info(
+            { channel, signalId: signal.signalId, existingDeliveryId: existingDelivery.id },
+            'Delivery already exists for this decision+channel — skipping duplicate',
+          );
+          results.push({
+            channel,
+            destination: destination.endpoint ?? channel,
+            status: 'skipped',
+            errorMessage: 'Duplicate delivery skipped',
+            conversationId: existingDelivery.conversationId ?? undefined,
+            messageId: existingDelivery.messageId ?? undefined,
+            conversationStrategy: existingDelivery.conversationStrategy ?? undefined,
+          });
+          continue;
+        }
+      }
+      // Pair the delivery with a conversation before sending, passing the thread action
+      const pairing = await pairDeliveryWithConversation(signal, channel, copy, { threadAction });
       // For the vellum channel, merge the conversationId into deep-link metadata
       // so the macOS/iOS client can navigate directly to the notification thread.
@@ -134,20 +163,36 @@ export class NotificationBroadcaster {
       if (channel === 'vellum' && pairing.conversationId) {
         deepLinkTarget = { ...deepLinkTarget, conversationId: pairing.conversationId };
-        // Emit notification_thread_created immediately when the vellum
-        // conversation is paired, BEFORE waiting for adapter send or other
-        // channel deliveries. This avoids a race where slow Telegram delivery
-        // delays the IPC push past the macOS deep-link retry window.
-        if (pairing.strategy === 'start_new_conversation') {
-          const threadTitle =
-            copy.threadTitle ??
-            copy.title ??
-            signal.sourceEventName;
-          const info: ThreadCreatedInfo = {
-            conversationId: pairing.conversationId,
-            title: threadTitle,
-            sourceEventName: signal.sourceEventName,
-          };
+        const threadTitle =
+          copy.threadTitle ??
+          copy.title ??
+          signal.sourceEventName;
+        const info: ThreadCreatedInfo = {
+          conversationId: pairing.conversationId,
+          title: threadTitle,
+          sourceEventName: signal.sourceEventName,
+        };
+        // The per-dispatch onThreadCreated callback fires whenever a vellum
+        // conversation is paired (new or reused) because callers like
+        // dispatchGuardianQuestion rely on it to create delivery bookkeeping
+        // rows before emitNotificationSignal() returns.
+        if (options?.onThreadCreated) {
+          try {
+            options.onThreadCreated(info);
+          } catch (err) {
+            log.error(
+              { err, signalId: signal.signalId },
+              'per-dispatch onThreadCreated callback failed — continuing broadcast',
+            );
+          }
+        }
+        // Emit notification_thread_created IPC event only when a NEW
+        // conversation was actually created. Reusing an existing thread
+        // should not fire the IPC event — the client already knows about
+        // the conversation.
+        if (pairing.createdNewConversation && pairing.strategy === 'start_new_conversation') {
           if (this.onThreadCreated) {
             try {
               this.onThreadCreated(info);
@@ -155,16 +200,6 @@ export class NotificationBroadcaster {
               log.error({ err, signalId: signal.signalId }, 'onThreadCreated callback failed — continuing broadcast');
             }
           }
-          if (options?.onThreadCreated) {
-            try {
-              options.onThreadCreated(info);
-            } catch (err) {
-              log.error(
-                { err, signalId: signal.signalId },
-                'per-dispatch onThreadCreated callback failed — continuing broadcast',
-              );
-            }
-          }
         }
       }
@@ -179,33 +214,15 @@ export class NotificationBroadcaster {
         deepLinkTarget,
       };
-      // Only create a delivery audit record when we have a persisted decision ID
-      // for the FK. If decision persistence failed (persistedDecisionId is
-      // undefined), we still dispatch via the adapter but skip the delivery
-      // record — using dedupeKey would violate the FK constraint.
-      const persistedDecisionId = decision.persistedDecisionId;
-      const hasPersistedDecision = typeof persistedDecisionId === 'string';
+      // Compute thread decision audit fields for the delivery record
+      const threadAudit = {
+        threadAction: threadAction?.action ?? 'start_new',
+        threadTargetConversationId: threadAction?.action === 'reuse_existing' ? threadAction.conversationId : undefined,
+        threadDecisionFallbackUsed: pairing.threadDecisionFallbackUsed,
+      };
       try {
         if (hasPersistedDecision) {
-          const existingDelivery = findDeliveryByDecisionAndChannel(persistedDecisionId, channel);
-          if (existingDelivery) {
-            log.info(
-              { channel, signalId: signal.signalId, existingDeliveryId: existingDelivery.id },
-              'Delivery already exists for this decision+channel — skipping duplicate',
-            );
-            results.push({
-              channel,
-              destination: destinationLabel,
-              status: 'skipped',
-              errorMessage: 'Duplicate delivery skipped',
-              conversationId: existingDelivery.conversationId ?? undefined,
-              messageId: existingDelivery.messageId ?? undefined,
-              conversationStrategy: existingDelivery.conversationStrategy ?? undefined,
-            });
-            continue;
-          }
           createDelivery({
             id: deliveryId,
             notificationDecisionId: persistedDecisionId,
@@ -219,6 +236,7 @@ export class NotificationBroadcaster {
             conversationId: pairing.conversationId ?? undefined,
             messageId: pairing.messageId ?? undefined,
             conversationStrategy: pairing.strategy,
+            ...threadAudit,
           });
         } else {
           log.warn(

package/src/notifications/conversation-pairing.ts CHANGED Viewed

@@ -5,16 +5,20 @@
  * before the adapter sends it. This ensures every delivery has an
  * auditable conversation trail and enables the macOS/iOS client to
  * deep-link directly into the notification thread.
+ *
+ * When the decision engine selects `reuse_existing` for a channel and
+ * the target conversation is valid, the seed message is appended to the
+ * existing thread instead of creating a new one.
  */
 import type { ConversationStrategy } from '../channels/config.js';
 import { getConversationStrategy } from '../channels/config.js';
 import type { ChannelId } from '../channels/types.js';
-import { addMessage,createConversation } from '../memory/conversation-store.js';
+import { addMessage, createConversation, getConversation } from '../memory/conversation-store.js';
 import { getLogger } from '../util/logger.js';
 import type { NotificationSignal } from './signal.js';
 import { composeThreadSeed, isThreadSeedSane } from './thread-seed-composer.js';
-import type { NotificationChannel } from './types.js';
+import type { NotificationChannel, ThreadAction } from './types.js';
 import type { RenderedChannelCopy } from './types.js';
 const log = getLogger('notification-conversation-pairing');
@@ -23,6 +27,15 @@ export interface PairingResult {
   conversationId: string | null;
   messageId: string | null;
   strategy: ConversationStrategy;
+  /** True when a brand-new conversation was created; false when an existing one was reused. */
+  createdNewConversation: boolean;
+  /** When the model requested reuse_existing but the target was invalid, this is true. */
+  threadDecisionFallbackUsed: boolean;
+}
+export interface PairingOptions {
+  /** Per-channel thread action from the decision engine. */
+  threadAction?: ThreadAction;
 }
 /**
@@ -31,6 +44,12 @@ export interface PairingResult {
  * Looks up the channel's conversation strategy from the policy registry
  * and materializes a conversation + assistant message accordingly.
  *
+ * When `options.threadAction` is `reuse_existing`, the function attempts
+ * to look up the target conversation. If it exists and has the right source,
+ * the seed message is appended to it. If the target is invalid or stale,
+ * a new conversation is created instead (with `threadDecisionFallbackUsed`
+ * set to true on the result).
+ *
  * Errors are caught and logged — this function never throws so the
  * notification pipeline is not disrupted by pairing failures.
  */
@@ -38,22 +57,15 @@ export async function pairDeliveryWithConversation(
   signal: NotificationSignal,
   channel: NotificationChannel,
   copy: RenderedChannelCopy,
+  options?: PairingOptions,
 ): Promise<PairingResult> {
   try {
     const strategy = getConversationStrategy(channel as ChannelId);
     if (strategy === 'not_deliverable') {
-      return { conversationId: null, messageId: null, strategy: 'not_deliverable' };
+      return { conversationId: null, messageId: null, strategy: 'not_deliverable', createdNewConversation: false, threadDecisionFallbackUsed: false };
     }
-    // For both start_new_conversation and continue_existing_conversation,
-    // we create a new conversation per notification delivery for now.
-    //
-    // True conversation continuation (reusing an existing conversation scoped
-    // to channel + assistant via a key like `notif:{assistantId}:{channel}:ongoing`)
-    // requires external chat binding lookup which is complex. A future PR will
-    // add that capability. For this milestone we materialize conversations and
-    // record the intended strategy so the audit trail is complete.
     const title = copy.threadTitle ?? copy.title ?? signal.sourceEventName;
     // Only start_new_conversation threads should be user-visible. For channels
@@ -62,6 +74,75 @@ export async function pairDeliveryWithConversation(
     // true continuation-by-key is implemented.
     const threadType = strategy === 'start_new_conversation' ? 'standard' : 'background';
+    // Prefer model-provided threadSeedMessage when present and sane;
+    // fall back to the runtime composer which adapts verbosity to the
+    // delivery surface (vellum/macos = richer, telegram = compact).
+    const messageContent = isThreadSeedSane(copy.threadSeedMessage)
+      ? copy.threadSeedMessage
+      : composeThreadSeed(signal, channel, copy);
+    const threadAction = options?.threadAction;
+    // Attempt to reuse an existing conversation when the model requests it
+    if (threadAction?.action === 'reuse_existing') {
+      const targetId = threadAction.conversationId;
+      const existing = getConversation(targetId);
+      if (existing && existing.source === 'notification') {
+        // Append the seed message to the existing conversation thread
+        const message = await addMessage(existing.id, 'assistant', messageContent, undefined, { skipIndexing: true });
+        log.info(
+          {
+            signalId: signal.signalId,
+            channel,
+            strategy,
+            conversationId: existing.id,
+            messageId: message.id,
+            threadAction: 'reuse_existing',
+          },
+          'Reused existing notification conversation for delivery',
+        );
+        return {
+          conversationId: existing.id,
+          messageId: message.id,
+          strategy,
+          createdNewConversation: false,
+          threadDecisionFallbackUsed: false,
+        };
+      }
+      // Target is invalid/stale — fall back to creating a new conversation
+      log.warn(
+        {
+          signalId: signal.signalId,
+          channel,
+          targetConversationId: targetId,
+          targetExists: !!existing,
+          targetSource: existing?.source,
+        },
+        'Thread reuse target invalid — falling back to new conversation',
+      );
+      const conversation = createConversation({
+        title,
+        threadType,
+        source: 'notification',
+      });
+      const message = await addMessage(conversation.id, 'assistant', messageContent, undefined, { skipIndexing: true });
+      return {
+        conversationId: conversation.id,
+        messageId: message.id,
+        strategy,
+        createdNewConversation: true,
+        threadDecisionFallbackUsed: true,
+      };
+    }
+    // Default path: create a new conversation
     // Memory indexing is skipped on the seed message below to prevent
     // notification copy from polluting conversational recall.
     const conversation = createConversation({
@@ -70,12 +151,6 @@ export async function pairDeliveryWithConversation(
       source: 'notification',
     });
-    // Prefer model-provided threadSeedMessage when present and sane;
-    // fall back to the runtime composer which adapts verbosity to the
-    // delivery surface (vellum/macos = richer, telegram = compact).
-    const messageContent = isThreadSeedSane(copy.threadSeedMessage)
-      ? copy.threadSeedMessage
-      : composeThreadSeed(signal, channel, copy);
     // Skip memory indexing — notification audit messages are not conversational
     // memory and should not pollute recall or incur embedding/extraction overhead.
     const message = await addMessage(conversation.id, 'assistant', messageContent, undefined, { skipIndexing: true });
@@ -87,6 +162,7 @@ export async function pairDeliveryWithConversation(
         strategy,
         conversationId: conversation.id,
         messageId: message.id,
+        threadAction: threadAction?.action ?? 'start_new',
       },
       'Paired notification delivery with conversation',
     );
@@ -95,6 +171,8 @@ export async function pairDeliveryWithConversation(
       conversationId: conversation.id,
       messageId: message.id,
       strategy,
+      createdNewConversation: true,
+      threadDecisionFallbackUsed: false,
     };
   } catch (err) {
     log.error(
@@ -108,6 +186,6 @@ export async function pairDeliveryWithConversation(
         return 'not_deliverable' as const;
       }
     })();
-    return { conversationId: null, messageId: null, strategy: fallbackStrategy };
+    return { conversationId: null, messageId: null, strategy: fallbackStrategy, createdNewConversation: false, threadDecisionFallbackUsed: false };
   }
 }

package/src/notifications/decision-engine.ts CHANGED Viewed

@@ -19,7 +19,7 @@ import { getLogger } from '../util/logger.js';
 import { createDecision } from './decisions-store.js';
 import { getPreferenceSummary } from './preference-summary.js';
 import type { NotificationSignal, RoutingIntent } from './signal.js';
-import { type ThreadCandidateSet, buildThreadCandidates, serializeCandidatesForPrompt } from './thread-candidates.js';
+import { buildThreadCandidates, serializeCandidatesForPrompt,type ThreadCandidateSet } from './thread-candidates.js';
 import type { NotificationChannel, NotificationDecision, RenderedChannelCopy, ThreadAction } from './types.js';
 const log = getLogger('notification-decision-engine');
@@ -385,13 +385,16 @@ export function validateThreadActions(
     if (action.action === 'start_new') {
       result[channel] = { action: 'start_new' };
     } else if (action.action === 'reuse_existing') {
-      const conversationId = action.conversationId;
-      if (typeof conversationId !== 'string' || !conversationId.trim()) {
+      const rawConversationId = action.conversationId;
+      if (typeof rawConversationId !== 'string' || !rawConversationId.trim()) {
         log.warn({ channel }, 'LLM returned reuse_existing without conversationId — downgrading to start_new');
         result[channel] = { action: 'start_new' };
         continue;
       }
+      // Normalize: the LLM may return a valid ID with leading/trailing whitespace
+      const conversationId = rawConversationId.trim();
       // Strict validation: the conversationId must exist in the candidate set
       const candidateIds = validCandidateIds.get(channel);
       if (!candidateIds || !candidateIds.has(conversationId)) {