npm - @vellumai/assistant - Versions diffs - 0.5.13 → 0.5.15 - Mend

@vellumai/assistant 0.5.13 → 0.5.15

This diff shows the changes between publicly available versions of the package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (425)

package/.env.example +1 -6
package/AGENTS.md +4 -0
package/ARCHITECTURE.md +0 -1
package/bunfig.toml +1 -0
package/docs/architecture/memory.md +3 -3
package/openapi.yaml +127 -22
package/package.json +1 -1
package/src/__tests__/access-request-decision.test.ts +2 -32
package/src/__tests__/actor-token-service.test.ts +1 -31
package/src/__tests__/anthropic-provider.test.ts +53 -40
package/src/__tests__/app-git-history.test.ts +9 -17
package/src/__tests__/app-git-service.test.ts +14 -20
package/src/__tests__/app-store-dir-names.test.ts +10 -20
package/src/__tests__/approval-cascade.test.ts +2 -19
package/src/__tests__/approval-primitive.test.ts +2 -27
package/src/__tests__/approval-routes-http.test.ts +2 -30
package/src/__tests__/assistant-events-sse-hardening.test.ts +2 -28
package/src/__tests__/assistant-feature-flags-integration.test.ts +2 -45
package/src/__tests__/attachments-store.test.ts +5 -32
package/src/__tests__/audit-log-rotation.test.ts +5 -36
package/src/__tests__/avatar-e2e.test.ts +1 -9
package/src/__tests__/avatar-generator.test.ts +1 -7
package/src/__tests__/browser-fill-credential.test.ts +0 -4
package/src/__tests__/browser-manager.test.ts +0 -6
package/src/__tests__/call-controller.test.ts +1 -22
package/src/__tests__/call-conversation-messages.test.ts +0 -21
package/src/__tests__/call-domain.test.ts +0 -25
package/src/__tests__/call-pointer-messages.test.ts +0 -21
package/src/__tests__/call-recovery.test.ts +0 -22
package/src/__tests__/call-routes-http.test.ts +0 -24
package/src/__tests__/call-store.test.ts +0 -21
package/src/__tests__/cancel-resolves-conversation-key.test.ts +0 -24
package/src/__tests__/canonical-guardian-store.test.ts +48 -21
package/src/__tests__/channel-approval-routes.test.ts +6 -26
package/src/__tests__/channel-approvals.test.ts +1 -38
package/src/__tests__/channel-delivery-store.test.ts +0 -21
package/src/__tests__/channel-guardian.test.ts +0 -26
package/src/__tests__/channel-reply-delivery.test.ts +5 -0
package/src/__tests__/channel-retry-sweep.test.ts +0 -21
package/src/__tests__/checker.test.ts +26 -61
package/src/__tests__/clawhub.test.ts +9 -25
package/src/__tests__/cli-command-risk-guard.test.ts +0 -18
package/src/__tests__/config-loader-backfill.test.ts +9 -28
package/src/__tests__/config-schema-cmd.test.ts +5 -25
package/src/__tests__/config-schema.test.ts +21 -40
package/src/__tests__/config-watcher.test.ts +4 -91
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -21
package/src/__tests__/contacts-tools.test.ts +0 -21
package/src/__tests__/context-memory-e2e.test.ts +0 -21
package/src/__tests__/context-window-manager.test.ts +130 -3
package/src/__tests__/conversation-abort-tool-results.test.ts +0 -4
package/src/__tests__/conversation-agent-loop-overflow.test.ts +0 -4
package/src/__tests__/conversation-agent-loop.test.ts +0 -4
package/src/__tests__/conversation-attachments.test.ts +1 -24
package/src/__tests__/conversation-attention-store.test.ts +0 -21
package/src/__tests__/conversation-attention-telegram.test.ts +0 -22
package/src/__tests__/conversation-clear-safety.test.ts +0 -22
package/src/__tests__/conversation-confirmation-signals.test.ts +2 -21
package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +0 -24
package/src/__tests__/conversation-disk-view-integration.test.ts +1 -23
package/src/__tests__/conversation-disk-view.test.ts +5 -27
package/src/__tests__/conversation-error.test.ts +1 -1
package/src/__tests__/conversation-fork-crud.test.ts +1 -33
package/src/__tests__/conversation-fork-route.test.ts +0 -27
package/src/__tests__/conversation-history-web-search.test.ts +23 -16
package/src/__tests__/conversation-init.benchmark.test.ts +22 -43
package/src/__tests__/conversation-key-store-disk-view.test.ts +8 -34
package/src/__tests__/conversation-load-history-repair.test.ts +0 -4
package/src/__tests__/conversation-pre-run-repair.test.ts +0 -4
package/src/__tests__/conversation-provider-retry-repair.test.ts +0 -4
package/src/__tests__/conversation-queue.test.ts +8 -8
package/src/__tests__/conversation-routes-disk-view.test.ts +13 -51
package/src/__tests__/conversation-runtime-assembly.test.ts +64 -38
package/src/__tests__/conversation-slash-commands.test.ts +5 -0
package/src/__tests__/conversation-slash-queue.test.ts +0 -4
package/src/__tests__/conversation-slash-unknown.test.ts +0 -4
package/src/__tests__/conversation-speed-override.test.ts +326 -0
package/src/__tests__/conversation-starter-routes.test.ts +0 -23
package/src/__tests__/conversation-store.test.ts +0 -21
package/src/__tests__/conversation-unread-route.test.ts +0 -24
package/src/__tests__/conversation-usage.test.ts +56 -21
package/src/__tests__/conversation-wipe.test.ts +0 -21
package/src/__tests__/conversation-workspace-cache-state.test.ts +0 -4
package/src/__tests__/conversation-workspace-injection.test.ts +0 -4
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +0 -4
package/src/__tests__/credential-execution-shell-lockdown.test.ts +8 -5
package/src/__tests__/credential-vault-unit.test.ts +9 -428
package/src/__tests__/credentials-cli.test.ts +10 -10
package/src/__tests__/daemon-assistant-events.test.ts +0 -19
package/src/__tests__/date-context.test.ts +77 -97
package/src/__tests__/db-conversation-fork-lineage-migration.test.ts +7 -24
package/src/__tests__/db-llm-request-log-provider-migration.test.ts +29 -42
package/src/__tests__/delete-managed-skill-tool.test.ts +2 -10
package/src/__tests__/deterministic-verification-control-plane.test.ts +1 -26
package/src/__tests__/docker-signing-key-bootstrap.test.ts +61 -15
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +2 -36
package/src/__tests__/email-cli.test.ts +6 -6
package/src/__tests__/ephemeral-permissions.test.ts +5 -17
package/src/__tests__/first-greeting.test.ts +4 -32
package/src/__tests__/followup-tools.test.ts +0 -21
package/src/__tests__/gateway-only-enforcement.test.ts +0 -20
package/src/__tests__/guardian-action-conversation-turn.test.ts +0 -23
package/src/__tests__/guardian-action-followup-executor.test.ts +0 -23
package/src/__tests__/guardian-action-followup-store.test.ts +0 -21
package/src/__tests__/guardian-action-grant-mint-consume.test.ts +0 -21
package/src/__tests__/guardian-action-late-reply.test.ts +0 -21
package/src/__tests__/guardian-action-store.test.ts +0 -21
package/src/__tests__/guardian-action-sweep.test.ts +0 -21
package/src/__tests__/guardian-binding-drift-heal.test.ts +0 -23
package/src/__tests__/guardian-decision-primitive-canonical.test.ts +172 -22
package/src/__tests__/guardian-dispatch.test.ts +0 -21
package/src/__tests__/guardian-grant-minting.test.ts +0 -22
package/src/__tests__/guardian-outbound-http.test.ts +0 -22
package/src/__tests__/guardian-principal-id-roundtrip.test.ts +0 -23
package/src/__tests__/guardian-routing-invariants.test.ts +0 -22
package/src/__tests__/guardian-routing-state.test.ts +0 -22
package/src/__tests__/guardian-verification-voice-binding.test.ts +0 -24
package/src/__tests__/headless-browser-interactions.test.ts +0 -4
package/src/__tests__/headless-browser-navigate.test.ts +0 -4
package/src/__tests__/headless-browser-read-tools.test.ts +0 -4
package/src/__tests__/headless-browser-snapshot.test.ts +0 -4
package/src/__tests__/heartbeat-service.test.ts +99 -26
package/src/__tests__/hooks-blocking.test.ts +3 -3
package/src/__tests__/hooks-config.test.ts +7 -7
package/src/__tests__/hooks-discovery.test.ts +3 -3
package/src/__tests__/hooks-integration.test.ts +5 -5
package/src/__tests__/hooks-manager.test.ts +3 -3
package/src/__tests__/hooks-runner.test.ts +5 -23
package/src/__tests__/hooks-settings.test.ts +3 -3
package/src/__tests__/hooks-templates.test.ts +3 -3
package/src/__tests__/http-conversation-lineage.test.ts +0 -27
package/src/__tests__/identity-intro-cache.test.ts +0 -4
package/src/__tests__/inbound-invite-redemption.test.ts +0 -22
package/src/__tests__/inline-skill-load-permissions.test.ts +5 -16
package/src/__tests__/intent-routing.test.ts +2 -55
package/src/__tests__/invite-redemption-service.test.ts +0 -21
package/src/__tests__/invite-routes-http.test.ts +0 -21
package/src/__tests__/jobs-store-qdrant-breaker.test.ts +0 -17
package/src/__tests__/journal-context.test.ts +8 -75
package/src/__tests__/list-messages-attachments.test.ts +0 -22
package/src/__tests__/llm-context-route-provider.test.ts +0 -21
package/src/__tests__/llm-request-log-turn-query.test.ts +46 -28
package/src/__tests__/llm-usage-store.test.ts +0 -21
package/src/__tests__/log-export-workspace.test.ts +1 -1
package/src/__tests__/managed-skill-lifecycle.test.ts +1 -1
package/src/__tests__/managed-store.test.ts +1 -1
package/src/__tests__/mcp-cli.test.ts +7 -10
package/src/__tests__/memory-context-benchmark.benchmark.test.ts +0 -21
package/src/__tests__/memory-jobs-worker-backoff.test.ts +0 -11
package/src/__tests__/memory-lifecycle-e2e.test.ts +0 -21
package/src/__tests__/memory-recall-log-store.test.ts +0 -27
package/src/__tests__/memory-recall-quality.test.ts +0 -21
package/src/__tests__/memory-regressions.experimental.test.ts +31 -30
package/src/__tests__/memory-regressions.test.ts +282 -70
package/src/__tests__/memory-retrieval.benchmark.test.ts +0 -21
package/src/__tests__/memory-upsert-concurrency.test.ts +0 -21
package/src/__tests__/messaging-send-tool.test.ts +201 -0
package/src/__tests__/migration-cross-version-compatibility.test.ts +18 -13
package/src/__tests__/migration-export-http.test.ts +7 -1
package/src/__tests__/migration-import-commit-http.test.ts +16 -14
package/src/__tests__/migration-import-preflight-http.test.ts +27 -44
package/src/__tests__/migration-validate-http.test.ts +1 -28
package/src/__tests__/native-web-search.test.ts +25 -22
package/src/__tests__/non-member-access-request.test.ts +0 -22
package/src/__tests__/notification-guardian-path.test.ts +0 -21
package/src/__tests__/notification-schedule-dedup.test.ts +1 -25
package/src/__tests__/oauth-apps-routes.test.ts +103 -2
package/src/__tests__/oauth-cli.test.ts +52 -0
package/src/__tests__/oauth-provider-profiles.test.ts +0 -16
package/src/__tests__/oauth-provider-serializer.test.ts +232 -0
package/src/__tests__/oauth-providers-routes.test.ts +257 -0
package/src/__tests__/oauth-store.test.ts +0 -21
package/src/__tests__/onboarding-template-contract.test.ts +2 -2
package/src/__tests__/openai-provider.test.ts +261 -0
package/src/__tests__/pairing-concurrent.test.ts +6 -6
package/src/__tests__/pairing-routes.test.ts +7 -1
package/src/__tests__/path-policy.test.ts +1 -1
package/src/__tests__/platform.test.ts +64 -88
package/src/__tests__/playbook-execution.test.ts +0 -21
package/src/__tests__/playbook-tools.test.ts +0 -21
package/src/__tests__/pricing.test.ts +100 -0
package/src/__tests__/relay-server.test.ts +1 -25
package/src/__tests__/runtime-attachment-metadata.test.ts +0 -24
package/src/__tests__/runtime-events-sse-parity.test.ts +2 -24
package/src/__tests__/runtime-events-sse.test.ts +0 -24
package/src/__tests__/sandbox-diagnostics.test.ts +2 -1
package/src/__tests__/scaffold-managed-skill-tool.test.ts +1 -1
package/src/__tests__/schedule-store.test.ts +0 -21
package/src/__tests__/schedule-tools.test.ts +0 -21
package/src/__tests__/scheduler-recurrence.test.ts +0 -21
package/src/__tests__/scoped-approval-grants.test.ts +0 -21
package/src/__tests__/scoped-grant-security-matrix.test.ts +0 -21
package/src/__tests__/secret-allowlist.test.ts +1 -1
package/src/__tests__/secret-ingress-channel.test.ts +0 -5
package/src/__tests__/secret-ingress-cli.test.ts +0 -6
package/src/__tests__/secret-ingress-http.test.ts +0 -5
package/src/__tests__/secret-ingress.test.ts +0 -5
package/src/__tests__/send-endpoint-busy.test.ts +0 -24
package/src/__tests__/sequence-store.test.ts +0 -21
package/src/__tests__/server-history-render.test.ts +0 -24
package/src/__tests__/shell-tool-proxy-mode.test.ts +0 -4
package/src/__tests__/skill-load-inline-command.test.ts +9 -0
package/src/__tests__/skill-load-inline-includes.test.ts +9 -0
package/src/__tests__/skill-load-tool.test.ts +11 -0
package/src/__tests__/skills-uninstall.test.ts +10 -8
package/src/__tests__/skills.test.ts +1 -1
package/src/__tests__/slack-channel-config.test.ts +1 -1
package/src/__tests__/slack-inbound-verification.test.ts +0 -22
package/src/__tests__/starter-bundle.test.ts +4 -1
package/src/__tests__/suggestion-routes.test.ts +2 -0
package/src/__tests__/system-prompt.test.ts +1 -1
package/src/__tests__/terminal-tools.test.ts +1 -1
package/src/__tests__/test-preload.ts +31 -0
package/src/__tests__/tool-execution-abort-cleanup.test.ts +1 -1
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +1 -1
package/src/__tests__/tool-executor.test.ts +0 -20
package/src/__tests__/tool-input-summary.test.ts +124 -0
package/src/__tests__/tool-preview-lifecycle.test.ts +2 -1
package/src/__tests__/trust-store.test.ts +7 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -1
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +1 -1
package/src/__tests__/trusted-contact-multichannel.test.ts +1 -1
package/src/__tests__/trusted-contact-verification.test.ts +1 -1
package/src/__tests__/turn-boundary-resolution.test.ts +1 -1
package/src/__tests__/twilio-routes.test.ts +1 -1
package/src/__tests__/update-bulletin.test.ts +1 -1
package/src/__tests__/vbundle-pax-and-symlink.test.ts +1 -1
package/src/__tests__/vellum-self-knowledge-inline-command.test.ts +1 -0
package/src/__tests__/voice-scoped-grant-consumer.test.ts +1 -1
package/src/__tests__/voice-session-bridge.test.ts +1 -1
package/src/__tests__/workspace-migration-009-backfill-conversation-disk-view.test.ts +4 -4
package/src/__tests__/workspace-migration-013-repair-conversation-disk-view.test.ts +1 -1
package/src/__tests__/workspace-migration-down-functions.test.ts +15 -3
package/src/__tests__/workspace-migration-seed-device-id.test.ts +40 -4
package/src/agent/loop.ts +6 -9
package/src/approvals/guardian-decision-primitive.ts +46 -18
package/src/approvals/guardian-request-resolvers.ts +19 -2
package/src/calls/active-call-lease.ts +2 -2
package/src/cli/AGENTS.md +1 -1
package/src/cli/commands/doctor.ts +9 -9
package/src/cli/commands/memory.ts +142 -0
package/src/cli/commands/oauth/__tests__/connect.test.ts +13 -11
package/src/cli/commands/oauth/__tests__/ping.test.ts +1 -1
package/src/cli/commands/oauth/connect.ts +13 -12
package/src/cli/commands/oauth/index.ts +1 -1
package/src/cli/commands/oauth/providers.ts +47 -62
package/src/cli/commands/platform/__tests__/connect.test.ts +72 -46
package/src/cli/commands/platform/__tests__/disconnect.test.ts +54 -1
package/src/cli/commands/platform/__tests__/status.test.ts +36 -0
package/src/cli/commands/platform/connect.ts +17 -7
package/src/cli/commands/platform/disconnect.ts +28 -3
package/src/cli/commands/platform/index.ts +3 -3
package/src/cli.ts +1 -299
package/src/config/assistant-feature-flags.ts +23 -15
package/src/config/bundled-skills/app-builder/TOOLS.json +16 -0
package/src/config/bundled-skills/app-builder/tools/app-create.ts +4 -0
package/src/config/bundled-skills/app-builder/tools/app-delete.ts +5 -1
package/src/config/bundled-skills/app-builder/tools/app-generate-icon.ts +9 -1
package/src/config/bundled-skills/app-builder/tools/app-refresh.ts +5 -1
package/src/config/bundled-skills/contacts/TOOLS.json +8 -0
package/src/config/bundled-skills/contacts/tools/contact-search.ts +10 -1
package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +16 -2
package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +1 -0
package/src/config/bundled-skills/messaging/SKILL.md +7 -7
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +37 -0
package/src/config/bundled-skills/slack/SKILL.md +18 -0
package/src/config/env-registry.ts +15 -11
package/src/config/env.ts +1 -11
package/src/config/feature-flag-registry.json +16 -0
package/src/config/schema.ts +4 -0
package/src/config/schemas/heartbeat.ts +6 -1
package/src/config/schemas/inference.ts +14 -3
package/src/config/schemas/memory-processing.ts +16 -8
package/src/config/schemas/memory-retrieval.ts +3 -3
package/src/config/skills.ts +1 -1
package/src/context/window-manager.ts +174 -51
package/src/credential-execution/executable-discovery.ts +2 -2
package/src/daemon/approved-devices-store.ts +2 -2
package/src/daemon/assistant-attachments.ts +2 -0
package/src/daemon/config-watcher.ts +4 -50
package/src/daemon/conversation-agent-loop-handlers.ts +9 -1
package/src/daemon/conversation-agent-loop.ts +12 -0
package/src/daemon/conversation-error.ts +3 -5
package/src/daemon/conversation-history.ts +7 -3
package/src/daemon/conversation-lifecycle.ts +16 -0
package/src/daemon/conversation-messaging.ts +1 -0
package/src/daemon/conversation-notifiers.ts +67 -30
package/src/daemon/conversation-process.ts +161 -2
package/src/daemon/conversation-queue-manager.ts +2 -0
package/src/daemon/conversation-runtime-assembly.ts +33 -11
package/src/daemon/conversation-slash.ts +14 -3
package/src/daemon/conversation-tool-setup.ts +2 -0
package/src/daemon/conversation-usage.ts +32 -4
package/src/daemon/conversation.ts +33 -1
package/src/daemon/daemon-control.ts +32 -16
package/src/daemon/date-context.ts +47 -45
package/src/daemon/dictation-profile-store.ts +2 -2
package/src/daemon/handlers/conversations.ts +19 -0
package/src/daemon/handlers/shared.ts +14 -21
package/src/daemon/lifecycle.ts +5 -7
package/src/daemon/message-types/conversations.ts +2 -0
package/src/daemon/message-types/guardian-actions.ts +3 -17
package/src/daemon/message-types/integrations.ts +11 -1
package/src/daemon/message-types/messages.ts +1 -0
package/src/daemon/pairing-store.ts +2 -79
package/src/daemon/server.ts +154 -8
package/src/daemon/watch-handler.ts +65 -21
package/src/email/guardrails.ts +3 -3
package/src/heartbeat/heartbeat-service.ts +14 -7
package/src/hooks/cli.ts +2 -2
package/src/hooks/config.ts +2 -2
package/src/hooks/discovery.ts +2 -2
package/src/hooks/manager.ts +2 -2
package/src/hooks/runner.ts +5 -2
package/src/hooks/templates.ts +2 -2
package/src/memory/admin.ts +181 -2
package/src/memory/app-git-service.ts +61 -4
package/src/memory/attachments-store.ts +2 -0
package/src/memory/canonical-guardian-store.ts +16 -0
package/src/memory/db-init.ts +8 -0
package/src/memory/embedding-local.ts +5 -2
package/src/memory/indexer.ts +44 -26
package/src/memory/items-extractor.ts +34 -82
package/src/memory/job-handlers/batch-extraction.ts +741 -0
package/src/memory/job-handlers/journal-carry-forward.test.ts +383 -0
package/src/memory/job-handlers/journal-carry-forward.ts +255 -0
package/src/memory/jobs-store.ts +28 -0
package/src/memory/jobs-worker.ts +56 -9
package/src/memory/lifecycle-events-store.ts +4 -2
package/src/memory/llm-request-log-store.ts +40 -2
package/src/memory/llm-usage-store.ts +4 -3
package/src/memory/migrations/199-guardian-request-enrichment-columns.ts +71 -0
package/src/memory/migrations/200-usage-llm-call-count.ts +20 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/query-expansion.ts +83 -0
package/src/memory/retriever.test.ts +119 -0
package/src/memory/retriever.ts +513 -105
package/src/memory/schema/guardian.ts +4 -0
package/src/memory/schema/infrastructure.ts +1 -0
package/src/memory/search/formatting.test.ts +140 -0
package/src/memory/search/formatting.ts +143 -198
package/src/memory/search/mmr.ts +136 -0
package/src/memory/search/staleness.ts +0 -15
package/src/memory/search/tier-classifier.ts +10 -21
package/src/memory/search/types.ts +17 -0
package/src/messaging/providers/slack/adapter.ts +51 -5
package/src/notifications/broadcaster.ts +13 -0
package/src/notifications/copy-composer.ts +8 -0
package/src/oauth/connect-orchestrator.ts +1 -1
package/src/oauth/connection-resolver.ts +2 -2
package/src/oauth/provider-serializer.ts +116 -0
package/src/permissions/trust-store.ts +24 -7
package/src/prompts/__tests__/build-cli-reference-section.test.ts +5 -0
package/src/prompts/journal-context.ts +50 -35
package/src/prompts/persona-resolver.ts +1 -1
package/src/prompts/system-prompt.ts +27 -28
package/src/prompts/templates/BOOTSTRAP.md +14 -1
package/src/prompts/templates/HEARTBEAT.md +10 -0
package/src/prompts/templates/NOW.md +19 -25
package/src/prompts/templates/SOUL.md +13 -1
package/src/prompts/templates/UPDATES.md +12 -0
package/src/prompts/update-bulletin.ts +1 -1
package/src/providers/anthropic/client.ts +89 -18
package/src/providers/model-catalog.ts +22 -2
package/src/providers/model-intents.ts +2 -2
package/src/providers/openai/client.ts +40 -1
package/src/providers/retry.ts +23 -4
package/src/providers/types.ts +2 -0
package/src/runtime/assistant-scope.ts +1 -1
package/src/runtime/auth/__tests__/credential-service.test.ts +1 -0
package/src/runtime/auth/route-policy.ts +1 -0
package/src/runtime/auth/token-service.ts +51 -29
package/src/runtime/confirmation-request-guardian-bridge.ts +3 -1
package/src/runtime/guardian-decision-types.ts +16 -10
package/src/runtime/http-server.ts +3 -14
package/src/runtime/http-types.ts +1 -0
package/src/runtime/migrations/vbundle-builder.ts +7 -4
package/src/runtime/migrations/vbundle-import-analyzer.ts +0 -4
package/src/runtime/migrations/vbundle-importer.ts +1 -1
package/src/runtime/routes/conversation-query-routes.ts +40 -8
package/src/runtime/routes/conversation-routes.ts +125 -3
package/src/runtime/routes/guardian-action-routes.ts +9 -3
package/src/runtime/routes/identity-routes.ts +25 -4
package/src/runtime/routes/llm-context-normalization.ts +1 -0
package/src/runtime/routes/log-export-routes.ts +34 -12
package/src/runtime/routes/migration-routes.ts +6 -10
package/src/runtime/routes/oauth-apps.ts +2 -9
package/src/runtime/routes/oauth-providers.ts +60 -0
package/src/runtime/routes/pairing-routes.ts +0 -8
package/src/runtime/routes/settings-routes.ts +0 -1
package/src/runtime/routes/telemetry-routes.ts +16 -4
package/src/security/encrypted-store.ts +2 -2
package/src/security/secret-allowlist.ts +3 -3
package/src/signals/emit-event.ts +42 -0
package/src/signals/user-message.ts +37 -0
package/src/telemetry/usage-telemetry-reporter.test.ts +83 -19
package/src/telemetry/usage-telemetry-reporter.ts +23 -17
package/src/tools/browser/runtime-check.ts +2 -2
package/src/tools/credentials/vault.ts +2 -249
package/src/tools/memory/definitions.ts +1 -1
package/src/tools/memory/handlers.test.ts +50 -8
package/src/tools/memory/handlers.ts +3 -1
package/src/tools/side-effects.ts +1 -6
package/src/tools/terminal/safe-env.ts +3 -2
package/src/tools/terminal/shell.ts +11 -14
package/src/tools/tool-approval-handler.ts +20 -1
package/src/tools/tool-input-summary.ts +66 -0
package/src/tools/types.ts +4 -0
package/src/usage/types.ts +4 -0
package/src/util/device-id.ts +10 -10
package/src/util/platform.ts +71 -33
package/src/util/pricing.ts +19 -6
package/src/util/strip-comment-lines.ts +28 -0
package/src/workspace/git-service.ts +8 -18
package/src/workspace/migrations/003-seed-device-id.ts +6 -4
package/src/workspace/migrations/016-extract-feature-flags-to-protected.ts +7 -1
package/src/workspace/migrations/017-seed-persona-dirs.ts +2 -4
package/src/workspace/migrations/021-move-signals-to-workspace.ts +84 -0
package/src/workspace/migrations/022-move-hooks-to-workspace.ts +94 -0
package/src/workspace/migrations/023-move-config-files-to-workspace.ts +86 -0
package/src/workspace/migrations/024-move-runtime-files-to-workspace.ts +126 -0
package/src/workspace/migrations/migrate-to-workspace-volume.ts +3 -6
package/src/workspace/migrations/registry.ts +8 -0
package/src/signals/confirm.ts +0 -82
package/src/signals/trust-rule.ts +0 -174

package/src/memory/retriever.ts CHANGED

@@ -1,4 +1,4 @@
-import { asc, eq, inArray, sql } from "drizzle-orm";
+import { and, asc, eq, inArray, notInArray, sql } from "drizzle-orm";
 import type { AssistantConfig } from "../config/types.js";
 import { estimateTextTokens } from "../context/token-estimator.js";
@@ -9,6 +9,7 @@ import {
   computeRetryDelay,
   isRetryableNetworkError,
 } from "../util/retry.js";
+import { getConversationDirName } from "./conversation-directories.js";
 import { getDb } from "./db.js";
 import {
   embedWithBackend,
@@ -17,22 +18,19 @@ import {
   logMemoryEmbeddingWarning,
 } from "./embedding-backend.js";
 import { isQdrantBreakerOpen } from "./qdrant-circuit-breaker.js";
+import { expandQueryWithHyDE } from "./query-expansion.js";
 import {
   conversations,
   memoryItems,
   memoryItemSources,
   messages,
 } from "./schema.js";
-import {
-  buildTwoLayerInjection,
-  CAPABILITY_KINDS,
-  IDENTITY_KINDS,
-  PREFERENCE_KINDS,
-} from "./search/formatting.js";
+import { buildMemoryInjection } from "./search/formatting.js";
+import { applyMMR } from "./search/mmr.js";
 import { isQdrantConnectionError, semanticSearch } from "./search/semantic.js";
-import { applyStaleDemotion, computeStaleness } from "./search/staleness.js";
+import { computeStaleness } from "./search/staleness.js";
 import {
-  classifyTiers,
+  filterByMinScore,
   type TieredCandidate,
 } from "./search/tier-classifier.js";
 import type {
@@ -50,6 +48,7 @@ export {
   escapeXmlTags,
   formatAbsoluteTime,
   formatRelativeTime,
+  lookupSupersessionChain,
 } from "./search/formatting.js";
 export type {
   DegradationReason,
@@ -64,6 +63,10 @@ const log = getLogger("memory-retriever");
 const EMBED_MAX_RETRIES = 3;
 const EMBED_BASE_DELAY_MS = 500;
+/** MMR diversity penalty applied to near-duplicate items after score filtering.
+ *  0 = no penalty, 1 = maximum penalty. */
+const MMR_PENALTY = 0.6;
 /**
  * Wrap embedWithBackend with retry + exponential backoff for transient failures
  * (network errors, 429s, 5xx). Aborts immediately if the caller's signal fires.
@@ -234,20 +237,141 @@ async function generateQueryEmbedding(
   return { queryVector, provider, model, degraded, degradation, reason };
 }
+/** Result from HyDE-expanded search. */
+interface HyDESearchResult {
+  candidates: Candidate[];
+  hydeExpanded: boolean;
+  hydeDocCount: number;
+}
 /**
- * Memory recall pipeline: hybrid search → tier classification →
- * staleness annotation → two-layer XML injection.
+ * Run HyDE-expanded search: generate hypothetical documents, embed them
+ * alongside the raw query in parallel, run parallel semantic searches,
+ * and merge all candidate arrays.
+ *
+ * Falls back to raw-query-only search on any HyDE failure (expansion
+ * error, embedding error for hypothetical docs). The raw query search
+ * always runs regardless of HyDE success.
+ */
+async function runHyDESearch(
+  query: string,
+  rawQueryVector: number[],
+  config: AssistantConfig,
+  signal: AbortSignal | undefined,
+  provider: string,
+  model: string,
+  limit: number,
+  excludeMessageIds: string[],
+  scopeIds: string[] | undefined,
+  sparseVector: { indices: number[]; values: number[] } | undefined,
+): Promise<HyDESearchResult> {
+  // Always search with the raw query — this is our baseline
+  const rawSearchPromise = semanticSearch(
+    rawQueryVector,
+    provider,
+    model,
+    limit,
+    excludeMessageIds,
+    scopeIds,
+    sparseVector,
+  );
+  // Suppress unhandled rejection if Qdrant rejects before we await
+  rawSearchPromise.catch(() => {});
+  // Attempt HyDE expansion — returns [] on any failure
+  let hypotheticalDocs: string[];
+  try {
+    hypotheticalDocs = await expandQueryWithHyDE(query, config, signal);
+  } catch {
+    // expandQueryWithHyDE already catches internally, but be defensive
+    hypotheticalDocs = [];
+  }
+  if (hypotheticalDocs.length === 0) {
+    // No hypothetical docs — fall back to raw query only
+    const rawResults = await rawSearchPromise;
+    return {
+      candidates: rawResults,
+      hydeExpanded: false,
+      hydeDocCount: 0,
+    };
+  }
+  log.debug(
+    { hydeDocCount: hypotheticalDocs.length },
+    "HyDE expansion produced hypothetical documents",
+  );
+  // Embed all hypothetical docs in parallel with the raw search
+  let hydeVectors: number[][] = [];
+  try {
+    const hydeEmbedResult = await embedWithRetry(config, hypotheticalDocs, {
+      signal,
+    });
+    hydeVectors = hydeEmbedResult.vectors;
+  } catch (err) {
+    log.warn(
+      { err: err instanceof Error ? err.message : String(err) },
+      "Failed to embed HyDE hypothetical docs; falling back to raw query",
+    );
+    const rawResults = await rawSearchPromise;
+    return {
+      candidates: rawResults,
+      hydeExpanded: false,
+      hydeDocCount: 0,
+    };
+  }
+  // Run parallel semantic searches for each hypothetical doc embedding,
+  // generating per-doc sparse embeddings so sparse and dense components match.
+  const hydeSearchPromises = hydeVectors.map((vector, i) => {
+    const docSparseVector = generateSparseEmbedding(hypotheticalDocs[i]!);
+    return semanticSearch(
+      vector,
+      provider,
+      model,
+      limit,
+      excludeMessageIds,
+      scopeIds,
+      docSparseVector,
+    ).catch((err) => {
+      log.warn(
+        { err: err instanceof Error ? err.message : String(err) },
+        "HyDE hypothetical doc search failed; skipping",
+      );
+      return [] as Candidate[];
+    });
+  });
+  // Await all searches in parallel (raw + hypothetical)
+  const [rawResults, ...hydeResults] = await Promise.all([
+    rawSearchPromise,
+    ...hydeSearchPromises,
+  ]);
+  // Merge all candidate arrays into a single flat array
+  const allCandidates = [rawResults, ...hydeResults].flat();
+  return {
+    candidates: allCandidates,
+    hydeExpanded: true,
+    hydeDocCount: hypotheticalDocs.length,
+  };
+}
+/**
+ * Memory recall pipeline: hybrid search → score filtering →
+ * staleness annotation → unified XML injection.
  *
  * Pipeline steps:
  *   1. Build query text (caller provides via buildMemoryQuery)
  *   2. Generate dense + sparse embeddings
  *   3. Hybrid search on Qdrant (dense + sparse RRF fusion)
  *   4. Deduplicate results
- *   5. Classify tiers (score > 0.6 → tier 1, > 0.4 → tier 2)
- *   6. Enrich item candidates with metadata for staleness
- *   7. Compute staleness per item
- *   8. Demote very_stale tier 1 → tier 2
- *   9. Build two-layer XML injection with budget allocation
+ *   5. Filter by minimum score threshold
+ *   6. Enrich candidates with source labels and item metadata
+ *   7. Compute staleness per item (for debugging/logging)
+ *   8. Build unified XML injection with budget allocation
  */
 export async function buildMemoryRecall(
   query: string,
@@ -300,26 +424,49 @@ export async function buildMemoryRecall(
     options?.scopePolicyOverride,
   );
-  const HYBRID_LIMIT = 20;
+  const HYBRID_LIMIT = 40;
   let hybridCandidates: Candidate[] = [];
   let semanticSearchFailed = false;
   let sparseVectorUsed = false;
+  let hydeExpanded = false;
+  let hydeDocCount = 0;
   const hybridSearchStart = Date.now();
   const qdrantBreakerOpen = isQdrantBreakerOpen();
   if (queryVector && !qdrantBreakerOpen) {
     try {
-      hybridCandidates = await semanticSearch(
-        queryVector,
-        provider ?? "unknown",
-        model ?? "unknown",
-        HYBRID_LIMIT,
-        excludeMessageIds,
-        scopeIds,
-        sparseVectorAvailable ? sparseVector : undefined,
-      );
-      sparseVectorUsed = sparseVectorAvailable;
+      if (options?.hydeEnabled) {
+        // ── HyDE path: expand query into hypothetical docs and search in parallel ──
+        const hydeCandidates = await runHyDESearch(
+          query,
+          queryVector,
+          config,
+          signal,
+          provider ?? "unknown",
+          model ?? "unknown",
+          HYBRID_LIMIT,
+          excludeMessageIds,
+          scopeIds,
+          sparseVectorAvailable ? sparseVector : undefined,
+        );
+        hybridCandidates = hydeCandidates.candidates;
+        hydeExpanded = hydeCandidates.hydeExpanded;
+        hydeDocCount = hydeCandidates.hydeDocCount;
+        sparseVectorUsed = sparseVectorAvailable || hydeExpanded;
+      } else {
+        // ── Standard path: single raw query search ──
+        hybridCandidates = await semanticSearch(
+          queryVector,
+          provider ?? "unknown",
+          model ?? "unknown",
+          HYBRID_LIMIT,
+          excludeMessageIds,
+          scopeIds,
+          sparseVectorAvailable ? sparseVector : undefined,
+        );
+        sparseVectorUsed = sparseVectorAvailable;
+      }
     } catch (err) {
       semanticSearchFailed = true;
       if (isQdrantConnectionError(err)) {
@@ -363,8 +510,9 @@ export async function buildMemoryRecall(
   // from messages that were removed by context compaction should be kept —
   // those messages are no longer in the conversation history and memory is
   // the only way they can influence the response.
+  let inContextMessageIds: Set<string> | null = null;
   if (conversationId) {
-    const inContextMessageIds = getEffectiveInContextMessageIds(conversationId);
+    inContextMessageIds = getEffectiveInContextMessageIds(conversationId);
     if (inContextMessageIds) {
       for (const [key, c] of candidateMap) {
         if (c.type === "segment") {
@@ -413,11 +561,12 @@ export async function buildMemoryRecall(
           }
           // Filter items whose ALL sources are in-context
+          const contextIds = inContextMessageIds;
           for (const [key, c] of candidateMap) {
             if (c.type !== "item") continue;
             const sourceMessageIds = itemSourceMap.get(c.id);
             if (!sourceMessageIds || sourceMessageIds.length === 0) continue;
-            if (sourceMessageIds.every((mid) => inContextMessageIds.has(mid))) {
+            if (sourceMessageIds.every((mid) => contextIds.has(mid))) {
               candidateMap.delete(key);
             }
           }
@@ -436,26 +585,78 @@ export async function buildMemoryRecall(
   for (const c of allCandidates) {
     // Multiplicative scoring: importance, confidence, and recency amplify semantic
     // relevance but can't substitute for it. An irrelevant item (semantic ≈ 0)
-    // stays low regardless of metadata. Multiplier range: 0.4 (all zero) to 1.0.
+    // stays low regardless of metadata. Multiplier range: 0.35 (all zero) to 1.0.
     const metadataMultiplier =
-      0.4 + c.importance * 0.25 + c.confidence * 0.15 + c.recency * 0.2;
+      0.35 + c.importance * 0.3 + c.confidence * 0.1 + c.recency * 0.25;
     c.finalScore = c.semantic * metadataMultiplier;
   }
   allCandidates.sort((a, b) => b.finalScore - a.finalScore);
-  // ── Step 5: Tier classification ─────────────────────────────────
-  const tiered = classifyTiers(allCandidates);
+  // ── Step 5: Filter by minimum score threshold ───────────────────
+  const filtered = filterByMinScore(allCandidates);
+  // ── Step 5b: MMR diversity ranking ─────────────────────────────
+  const mmrRanked = applyMMR(filtered, MMR_PENALTY);
+  // MMR rewrites finalScore, so re-enforce the min-score threshold to
+  // drop candidates whose adjusted score fell below the cutoff.
+  const diversified = filterByMinScore(mmrRanked);
+  // ── Step 5c: Enrich candidates with source labels ──────────────
+  enrichSourceLabels(diversified);
+  // ── Serendipity: sample random memories for unexpected connections ──
+  const SERENDIPITY_COUNT = 3;
+  const serendipityCandidates = sampleSerendipityItems(
+    diversified,
+    SERENDIPITY_COUNT,
+    scopeIds,
+  );
+  // Filter serendipity items whose ALL sources are in-context (same logic
+  // as Step 4b) to prevent current-turn content leaking via random sampling.
+  if (inContextMessageIds && serendipityCandidates.length > 0) {
+    filterInContextItems(serendipityCandidates, inContextMessageIds);
+  }
-  // ── Step 5b: Enrich candidates with source labels ──────────────
-  enrichSourceLabels(tiered);
+  enrichSourceLabels(serendipityCandidates);
   // ── Step 6: Enrich with item metadata for staleness ─────────────
-  const itemIds = tiered.filter((c) => c.type === "item").map((c) => c.id);
+  const itemIds = diversified.filter((c) => c.type === "item").map((c) => c.id);
   const itemMetadataMap = enrichItemMetadata(itemIds);
-  // ── Step 7: Compute staleness per item ──────────────────────────
+  // ── Step 6b: Enrich item candidates with supersedes data ────────
+  const itemCandidatesForSupersedes = diversified.filter(
+    (c) => c.type === "item",
+  );
+  if (itemCandidatesForSupersedes.length > 0) {
+    try {
+      const db = getDb();
+      const supersedesRows = db
+        .select({ id: memoryItems.id, supersedes: memoryItems.supersedes })
+        .from(memoryItems)
+        .where(
+          inArray(
+            memoryItems.id,
+            itemCandidatesForSupersedes.map((c) => c.id),
+          ),
+        )
+        .all();
+      const supersedesMap = new Map(
+        supersedesRows.map((r) => [r.id, r.supersedes]),
+      );
+      for (const c of itemCandidatesForSupersedes) {
+        const sup = supersedesMap.get(c.id);
+        if (sup) c.supersedes = sup;
+      }
+    } catch (err) {
+      log.warn({ err }, "Failed to enrich candidates with supersedes data");
+    }
+  }
+  // ── Step 7: Compute staleness per item (for debugging/logging) ─
   const now = Date.now();
-  for (const c of tiered) {
+  for (const c of diversified) {
     if (c.type !== "item") continue;
     const meta = itemMetadataMap.get(c.id);
     if (!meta) continue;
@@ -470,10 +671,7 @@ export async function buildMemoryRecall(
     c.staleness = level;
   }
-  // ── Step 8: Demote very_stale tier 1 → tier 2 ──────────────────
-  const afterDemotion = applyStaleDemotion(tiered);
-  // ── Step 9: Budget allocation and two-layer injection ──────────
+  // ── Step 8: Budget allocation and unified injection ────────────
   const maxInjectTokens = Math.max(
     1,
     Math.floor(
@@ -482,53 +680,24 @@ export async function buildMemoryRecall(
     ),
   );
-  // Split into sections for two-layer injection
-  const identityItems = afterDemotion.filter(
-    (c) => c.tier === 1 && IDENTITY_KINDS.has(c.kind),
-  );
-  const preferences = afterDemotion.filter(
-    (c) => c.tier === 1 && PREFERENCE_KINDS.has(c.kind),
-  );
-  const capabilities = afterDemotion.filter(
-    (c) => c.tier === 1 && CAPABILITY_KINDS.has(c.kind),
-  );
-  const tier1Candidates = afterDemotion.filter(
-    (c) =>
-      c.tier === 1 &&
-      !IDENTITY_KINDS.has(c.kind) &&
-      !PREFERENCE_KINDS.has(c.kind) &&
-      !CAPABILITY_KINDS.has(c.kind),
-  );
-  const tier2Candidates = afterDemotion.filter((c) => c.tier === 2);
-  const injectedText = buildTwoLayerInjection({
-    identityItems,
-    tier1Candidates,
-    tier2Candidates,
-    preferences,
-    capabilities,
+  const injectedText = buildMemoryInjection({
+    candidates: diversified,
+    serendipityItems: serendipityCandidates,
     totalBudgetTokens: maxInjectTokens,
   });
   // ── Assemble result ─────────────────────────────────────────────
-  const selectedCount =
-    identityItems.length +
-    tier1Candidates.length +
-    tier2Candidates.length +
-    preferences.length +
-    capabilities.length;
-  const tier1Count = afterDemotion.filter((c) => c.tier === 1).length;
-  const tier2Count = afterDemotion.filter((c) => c.tier === 2).length;
+  const selectedCount = diversified.length + serendipityCandidates.length;
   const stalenessStats = {
-    fresh: afterDemotion.filter((c) => c.staleness === "fresh").length,
-    aging: afterDemotion.filter((c) => c.staleness === "aging").length,
-    stale: afterDemotion.filter((c) => c.staleness === "stale").length,
-    very_stale: afterDemotion.filter((c) => c.staleness === "very_stale")
-      .length,
+    fresh: diversified.filter((c) => c.staleness === "fresh").length,
+    aging: diversified.filter((c) => c.staleness === "aging").length,
+    stale: diversified.filter((c) => c.staleness === "stale").length,
+    very_stale: diversified.filter((c) => c.staleness === "very_stale").length,
   };
-  const topCandidates: MemoryRecallCandiateDebug[] = afterDemotion
+  const topCandidates: MemoryRecallCandiateDebug[] = [...diversified]
+    .sort((a, b) => b.finalScore - a.finalScore)
     .slice(0, 10)
     .map((c) => ({
       key: c.key,
@@ -537,6 +706,7 @@ export async function buildMemoryRecall(
       finalScore: c.finalScore,
       semantic: c.semantic,
       recency: c.recency,
+      ...(c.sourceLabel ? { sourceLabel: c.sourceLabel } : {}),
     }));
   const latencyMs = Date.now() - start;
@@ -560,13 +730,12 @@ export async function buildMemoryRecall(
       query: truncate(query, 120),
       hybridHits: hybridCandidates.length,
       mergedCount: allCandidates.length,
-      tier1Count,
-      tier2Count,
       stalenessStats,
       selectedCount,
       maxInjectTokens,
       injectedTokens: estimateTextTokens(injectedText),
       latencyMs,
+      ...(hydeExpanded ? { hydeExpanded, hydeDocCount } : {}),
     },
     "Memory recall completed",
   );
@@ -585,10 +754,13 @@ export async function buildMemoryRecall(
     injectedText,
     latencyMs,
     topCandidates,
-    tier1Count,
-    tier2Count,
+    tier1Count: 0,
+    tier2Count: 0,
     hybridSearchMs,
     sparseVectorUsed,
+    hydeExpanded,
+    hydeDocCount,
+    mmrApplied: true,
   };
   return result;
@@ -758,17 +930,17 @@ function enrichSourceLabels(candidates: TieredCandidate[]): void {
   try {
     const db = getDb();
-    // Collect item IDs for items that need source label lookup
+    // ── Items: find conversation via memoryItemSources → messages → conversations ──
     const itemCandidates = candidates.filter((c) => c.type === "item");
     const itemIds = itemCandidates.map((c) => c.id);
     if (itemIds.length > 0) {
-      // For items: find conversation titles via memoryItemSources → messages → conversations.
-      // Pick the most recent conversation title per item.
       const rows = db
         .select({
           memoryItemId: memoryItemSources.memoryItemId,
+          conversationId: conversations.id,
           title: conversations.title,
+          conversationCreatedAt: conversations.createdAt,
           conversationUpdatedAt: conversations.updatedAt,
         })
         .from(memoryItemSources)
@@ -783,36 +955,272 @@ function enrichSourceLabels(candidates: TieredCandidate[]): void {
         .where(inArray(memoryItemSources.memoryItemId, itemIds))
         .all();
-      // Group by item ID and pick the most recently updated conversation title
-      const titleMap = new Map<string, string>();
-      const updatedAtMap = new Map<string, number>();
+      // Group by item ID and pick the most recently updated conversation
+      const bestConvMap = new Map<
+        string,
+        {
+          title: string | null;
+          conversationId: string;
+          createdAt: number;
+          updatedAt: number;
+        }
+      >();
       for (const row of rows) {
-        if (!row.title) continue;
-        const existing = updatedAtMap.get(row.memoryItemId);
-        if (existing === undefined || row.conversationUpdatedAt > existing) {
-          titleMap.set(row.memoryItemId, row.title);
-          updatedAtMap.set(row.memoryItemId, row.conversationUpdatedAt);
+        const existing = bestConvMap.get(row.memoryItemId);
+        if (
+          existing === undefined ||
+          row.conversationUpdatedAt > existing.updatedAt
+        ) {
+          bestConvMap.set(row.memoryItemId, {
+            title: row.title,
+            conversationId: row.conversationId,
+            createdAt: row.conversationCreatedAt,
+            updatedAt: row.conversationUpdatedAt,
+          });
         }
       }
       for (const c of itemCandidates) {
-        const title = titleMap.get(c.id);
-        if (title) {
-          c.sourceLabel = title;
+        const conv = bestConvMap.get(c.id);
+        if (conv) {
+          if (conv.title) c.sourceLabel = conv.title;
+          const dirName = getConversationDirName(
+            conv.conversationId,
+            conv.createdAt,
+          );
+          c.sourcePath = `conversations/${dirName}/messages.jsonl`;
         }
       }
     }
-    // For segment candidates: the key format is "seg:<segmentId>" and the id is the segment's id.
-    // We can look up the conversation title via the segment's conversationId in memory_segments.
-    // However, segments already reference a conversationId in the schema — but the Candidate type
-    // doesn't carry it. For now, skip segment source labels as the join path would require
-    // importing memorySegments and an additional query. The primary value is item source labels.
+    // ── Segments: look up conversation via conversationId on the candidate ──
+    const segmentCandidates = candidates.filter(
+      (c) => (c.type === "segment" || c.type === "summary") && c.conversationId,
+    );
+    if (segmentCandidates.length > 0) {
+      const convIds = [
+        ...new Set(segmentCandidates.map((c) => c.conversationId!)),
+      ];
+      const convRows = db
+        .select({
+          id: conversations.id,
+          title: conversations.title,
+          createdAt: conversations.createdAt,
+        })
+        .from(conversations)
+        .where(inArray(conversations.id, convIds))
+        .all();
+      const convMap = new Map(convRows.map((r) => [r.id, r]));
+      for (const c of segmentCandidates) {
+        const conv = convMap.get(c.conversationId!);
+        if (conv) {
+          if (conv.title) c.sourceLabel = conv.title;
+          const dirName = getConversationDirName(conv.id, conv.createdAt);
+          c.sourcePath = `conversations/${dirName}/messages.jsonl`;
+        }
+      }
+    }
   } catch (err) {
     log.warn({ err }, "Failed to enrich candidates with source labels");
   }
 }
+/**
+ * Remove items from the array (in-place) whose ALL source messages are
+ * in the given in-context set. This prevents current-turn content from
+ * leaking into the injection via serendipity or other DB-sourced paths.
+ *
+ * Only candidates with `type === "item"` are examined; candidates of any
+ * other type are never removed. An item with no rows in
+ * `memoryItemSources` is also kept, because there is nothing to compare
+ * against the in-context set.
+ *
+ * Filtering is best-effort: if the lookup throws, a warning is logged and
+ * the function returns without removing anything further.
+ *
+ * @param candidates - Array to prune. It is mutated via `splice`; no copy
+ *   is made and nothing is returned.
+ * @param inContextMessageIds - Message IDs to test each item's source
+ *   messages against.
+ */
+function filterInContextItems(
+  candidates: TieredCandidate[],
+  inContextMessageIds: Set<string>,
+): void {
+  const itemIds = candidates.filter((c) => c.type === "item").map((c) => c.id);
+  if (itemIds.length === 0) return; // no item candidates, so skip the DB query
+  try {
+    const db = getDb();
+    const allSources = db
+      .select({
+        memoryItemId: memoryItemSources.memoryItemId,
+        messageId: memoryItemSources.messageId,
+      })
+      .from(memoryItemSources)
+      .where(inArray(memoryItemSources.memoryItemId, itemIds))
+      .all();
+    const itemSourceMap = new Map<string, string[]>(); // item id -> its source message ids
+    for (const s of allSources) {
+      const existing = itemSourceMap.get(s.memoryItemId);
+      if (existing) existing.push(s.messageId);
+      else itemSourceMap.set(s.memoryItemId, [s.messageId]);
+    }
+    for (let i = candidates.length - 1; i >= 0; i--) { // walk backwards so splice() never shifts an unvisited index
+      const c = candidates[i];
+      if (c.type !== "item") continue;
+      const sourceMessageIds = itemSourceMap.get(c.id);
+      if (!sourceMessageIds || sourceMessageIds.length === 0) continue; // no known sources: keep the item
+      if (sourceMessageIds.every((mid) => inContextMessageIds.has(mid))) {
+        candidates.splice(i, 1);
+      }
+    }
+  } catch (err) {
+    log.warn(
+      { err },
+      "Failed to filter in-context serendipity items; skipping",
+    );
+  }
+}
+/**
+ * Sample random active memory items for serendipitous recall — items
+ * the user didn't ask about but might spark unexpected connections.
+ *
+ * Queries SQLite for a pool of random active items not already in the
+ * candidate pool, then keeps up to `count` of them ranked by
+ * `importance * Math.random()`. This biases selection toward higher
+ * importance but is not strictly probability-proportional sampling. A
+ * NULL importance is treated as 0.5 for ranking and in the result.
+ *
+ * Items with importance >= MIN_SERENDIPITY_IMPORTANCE are eligible, as are
+ * legacy items with NULL importance (not yet backfilled). This ensures
+ * genuinely significant memories and pre-importance-era items can both
+ * surface as echoes.
+ *
+ * The returned candidates carry no relevance signal: `semantic`,
+ * `recency` and `finalScore` are all 0, `confidence` is fixed at 1 and
+ * `source` is "semantic". Any error thrown while sampling is logged as a
+ * warning and yields an empty array.
+ *
+ * @param existingCandidates - Candidates already selected; the IDs of
+ *   those with `type === "item"` are excluded from sampling.
+ * @param count - Maximum number of items to return; values <= 0 return
+ *   an empty array without touching the database.
+ * @param scopeIds - Scope IDs to sample from. When omitted, only the
+ *   "default" scope is sampled.
+ * @returns Up to `count` item candidates, possibly fewer or none.
+ */
+const MIN_SERENDIPITY_IMPORTANCE = 0.7;
+function sampleSerendipityItems(
+  existingCandidates: TieredCandidate[],
+  count: number,
+  scopeIds?: string[],
+): TieredCandidate[] {
+  if (count <= 0) return [];
+  try {
+    const db = getDb();
+    // Collect IDs of item candidates already in the filtered set to exclude them
+    const existingItemIds = existingCandidates
+      .filter((c) => c.type === "item")
+      .map((c) => c.id);
+    const RANDOM_POOL_SIZE = 10; // upper bound on rows fetched before the weighted pick
+    // Build scope condition: match allowed scopes, or default to 'default'
+    // when no scope filter is set (prevents leaking private-scope items).
+    // NOTE(review): the check is on truthiness, so an empty array takes the inArray branch — confirm how the query builder treats an empty list.
+    const scopeCondition = scopeIds
+      ? inArray(memoryItems.scopeId, scopeIds)
+      : eq(memoryItems.scopeId, "default");
+    const importanceFloor = sql`(${memoryItems.importance} >= ${MIN_SERENDIPITY_IMPORTANCE} OR ${memoryItems.importance} IS NULL)`;
+    const baseConditions =
+      existingItemIds.length > 0
+        ? and(
+            eq(memoryItems.status, "active"),
+            scopeCondition,
+            importanceFloor,
+            notInArray(memoryItems.id, existingItemIds),
+          )
+        : and(
+            eq(memoryItems.status, "active"),
+            scopeCondition,
+            importanceFloor,
+          ); // the notInArray clause is omitted when there is nothing to exclude
+    // Use rowid-probe sampling instead of ORDER BY RANDOM() to avoid a
+    // full-table sort whose cost grows linearly with memory_items size.
+    // Strategy: get the rowid range, generate random rowids, and probe for
+    // the nearest eligible row with `rowid >= ?`. Each probe is O(log n)
+    // via B-tree lookup, so total cost is O(k·log n) instead of O(n·log n).
+    const range = db
+      .select({
+        minRowid: sql<number>`MIN(rowid)`,
+        maxRowid: sql<number>`MAX(rowid)`,
+        total: sql<number>`COUNT(*)`,
+      })
+      .from(memoryItems)
+      .where(baseConditions)
+      .get();
+    if (!range || range.total === 0) return []; // no eligible rows
+    const columns = {
+      id: memoryItems.id,
+      kind: memoryItems.kind,
+      subject: memoryItems.subject, // NOTE(review): selected but not read when building the result below
+      statement: memoryItems.statement,
+      importance: memoryItems.importance,
+      firstSeenAt: memoryItems.firstSeenAt,
+    };
+    let rows;
+    if (range.total <= RANDOM_POOL_SIZE) {
+      // Few enough eligible rows — fetch all, no randomness needed at DB level
+      rows = db
+        .select(columns)
+        .from(memoryItems)
+        .where(baseConditions)
+        .all();
+    } else {
+      // Probe random rowids in the eligible range. Each probe returns the
+      // first eligible row at or after the random rowid, so a row that follows
+      // a larger gap of ineligible rowids is picked more often (not uniform).
+      const seen = new Set<string>(); // item ids already collected, so repeated hits are dropped
+      rows = [];
+      const rowidSpan = range.maxRowid - range.minRowid + 1;
+      const maxAttempts = RANDOM_POOL_SIZE * 5; // cap on probes so repeated duplicates cannot loop forever
+      for (let i = 0; i < maxAttempts && rows.length < RANDOM_POOL_SIZE; i++) {
+        const randomRowid =
+          range.minRowid + Math.floor(Math.random() * rowidSpan);
+        const row = db
+          .select(columns)
+          .from(memoryItems)
+          .where(and(baseConditions, sql`rowid >= ${randomRowid}`))
+          .orderBy(sql`rowid`)
+          .limit(1)
+          .get();
+        if (row && !seen.has(row.id)) {
+          seen.add(row.id);
+          rows.push(row);
+        }
+      }
+    }
+    if (rows.length === 0) return [];
+    // Importance-biased pick: sort by importance * random() descending
+    // and take the top `count` items (NULL importance counts as 0.5)
+    const weighted = rows
+      .map((row) => ({
+        row,
+        score: (row.importance ?? 0.5) * Math.random(),
+      }))
+      .sort((a, b) => b.score - a.score)
+      .slice(0, count);
+    // Convert to Candidate-compatible objects; the score fields are zeroed because these rows never went through semantic search
+    return weighted.map(
+      ({ row }): TieredCandidate => ({
+        type: "item",
+        id: row.id,
+        key: `item:${row.id}`,
+        kind: row.kind,
+        text: row.statement,
+        source: "semantic",
+        importance: row.importance ?? 0.5,
+        confidence: 1,
+        semantic: 0,
+        recency: 0,
+        finalScore: 0,
+        createdAt: row.firstSeenAt,
+      }),
+    );
+  } catch (err) {
+    log.warn({ err }, "Failed to sample serendipity items");
+    return [];
+  }
+}
 /**
  * Inject memory recall as a text content block prepended to the last user
  * message. This follows the same pattern as workspace, temporal, and other