@vellumai/assistant 0.4.17 → 0.4.19
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/docs/runbook-trusted-contacts.md +5 -3
- package/eslint.config.mjs +2 -2
- package/package.json +1 -1
- package/src/__tests__/access-request-decision.test.ts +128 -120
- package/src/__tests__/account-registry.test.ts +121 -110
- package/src/__tests__/active-skill-tools.test.ts +200 -172
- package/src/__tests__/actor-token-service.test.ts +341 -274
- package/src/__tests__/agent-loop-thinking.test.ts +28 -19
- package/src/__tests__/agent-loop.test.ts +798 -378
- package/src/__tests__/anthropic-provider.test.ts +405 -247
- package/src/__tests__/app-builder-tool-scripts.test.ts +97 -97
- package/src/__tests__/app-bundler.test.ts +112 -79
- package/src/__tests__/app-executors.test.ts +205 -178
- package/src/__tests__/app-git-history.test.ts +90 -73
- package/src/__tests__/app-git-service.test.ts +67 -53
- package/src/__tests__/app-open-proxy.test.ts +29 -25
- package/src/__tests__/approval-conversation-turn.test.ts +100 -81
- package/src/__tests__/approval-hardcoded-copy-guard.test.ts +45 -17
- package/src/__tests__/approval-message-composer.test.ts +119 -119
- package/src/__tests__/approval-primitive.test.ts +264 -233
- package/src/__tests__/approval-routes-http.test.ts +4 -3
- package/src/__tests__/asset-materialize-tool.test.ts +250 -178
- package/src/__tests__/asset-search-tool.test.ts +251 -191
- package/src/__tests__/assistant-attachment-directive.test.ts +187 -142
- package/src/__tests__/assistant-attachments.test.ts +254 -186
- package/src/__tests__/assistant-event-hub.test.ts +105 -63
- package/src/__tests__/assistant-event.test.ts +66 -58
- package/src/__tests__/assistant-events-sse-hardening.test.ts +113 -73
- package/src/__tests__/assistant-feature-flag-guard.test.ts +78 -52
- package/src/__tests__/assistant-feature-flag-guardrails.test.ts +48 -45
- package/src/__tests__/assistant-feature-flags-integration.test.ts +118 -77
- package/src/__tests__/assistant-id-boundary-guard.test.ts +158 -104
- package/src/__tests__/attachments-store.test.ts +240 -183
- package/src/__tests__/attachments.test.ts +70 -62
- package/src/__tests__/audit-log-rotation.test.ts +50 -35
- package/src/__tests__/browser-fill-credential.test.ts +169 -101
- package/src/__tests__/browser-manager.test.ts +97 -75
- package/src/__tests__/browser-runtime-check.test.ts +16 -15
- package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +12 -10
- package/src/__tests__/browser-skill-endstate.test.ts +97 -72
- package/src/__tests__/bundle-scanner.test.ts +47 -22
- package/src/__tests__/bundled-asset.test.ts +74 -47
- package/src/__tests__/call-constants.test.ts +19 -19
- package/src/__tests__/call-controller.test.ts +0 -1
- package/src/__tests__/call-conversation-messages.test.ts +90 -65
- package/src/__tests__/call-domain.test.ts +149 -121
- package/src/__tests__/call-pointer-message-composer.test.ts +113 -83
- package/src/__tests__/call-pointer-messages.test.ts +213 -154
- package/src/__tests__/call-pointer-no-hardcoded-copy.guard.test.ts +9 -10
- package/src/__tests__/call-recovery.test.ts +232 -212
- package/src/__tests__/call-routes-http.test.ts +0 -1
- package/src/__tests__/call-start-guardian-guard.test.ts +32 -30
- package/src/__tests__/call-state-machine.test.ts +62 -51
- package/src/__tests__/call-state.test.ts +89 -75
- package/src/__tests__/call-store.test.ts +387 -316
- package/src/__tests__/callback-handoff-copy.test.ts +84 -82
- package/src/__tests__/canonical-guardian-store.test.ts +331 -280
- package/src/__tests__/channel-approval-routes.test.ts +1643 -1115
- package/src/__tests__/channel-approval.test.ts +139 -137
- package/src/__tests__/channel-approvals.test.ts +7 -2
- package/src/__tests__/channel-delivery-store.test.ts +232 -194
- package/src/__tests__/channel-guardian.test.ts +5 -3
- package/src/__tests__/channel-invite-transport.test.ts +107 -92
- package/src/__tests__/channel-policy.test.ts +42 -38
- package/src/__tests__/channel-readiness-service.test.ts +119 -102
- package/src/__tests__/channel-reply-delivery.test.ts +147 -118
- package/src/__tests__/channel-retry-sweep.test.ts +153 -110
- package/src/__tests__/checker.test.ts +3309 -1850
- package/src/__tests__/clarification-resolver.test.ts +91 -79
- package/src/__tests__/classifier.test.ts +64 -54
- package/src/__tests__/claude-code-skill-regression.test.ts +42 -37
- package/src/__tests__/claude-code-tool-profiles.test.ts +31 -29
- package/src/__tests__/clawhub.test.ts +92 -82
- package/src/__tests__/cli.test.ts +30 -30
- package/src/__tests__/clipboard.test.ts +53 -46
- package/src/__tests__/commit-guarantee.test.ts +59 -52
- package/src/__tests__/commit-message-enrichment-service.test.ts +203 -75
- package/src/__tests__/compaction.benchmark.test.ts +33 -31
- package/src/__tests__/computer-use-session-compaction.test.ts +60 -50
- package/src/__tests__/computer-use-session-lifecycle.test.ts +145 -117
- package/src/__tests__/computer-use-session-working-dir.test.ts +62 -48
- package/src/__tests__/computer-use-skill-baseline.test.ts +22 -19
- package/src/__tests__/computer-use-skill-endstate.test.ts +45 -31
- package/src/__tests__/computer-use-skill-lifecycle-cleanup.test.ts +121 -88
- package/src/__tests__/computer-use-skill-manifest-regression.test.ts +65 -42
- package/src/__tests__/computer-use-skill-proxy-bridge.test.ts +33 -18
- package/src/__tests__/computer-use-tools.test.ts +121 -98
- package/src/__tests__/config-schema.test.ts +443 -347
- package/src/__tests__/config-watcher.test.ts +96 -81
- package/src/__tests__/confirmation-request-guardian-bridge.test.ts +148 -133
- package/src/__tests__/conflict-intent-tokenization.test.ts +96 -78
- package/src/__tests__/conflict-policy.test.ts +151 -80
- package/src/__tests__/conflict-store.test.ts +203 -157
- package/src/__tests__/connection-policy.test.ts +89 -59
- package/src/__tests__/contacts-tools.test.ts +247 -178
- package/src/__tests__/context-memory-e2e.test.ts +306 -214
- package/src/__tests__/context-token-estimator.test.ts +114 -74
- package/src/__tests__/context-window-manager.test.ts +269 -167
- package/src/__tests__/contradiction-checker.test.ts +161 -135
- package/src/__tests__/conversation-attention-store.test.ts +350 -290
- package/src/__tests__/conversation-attention-telegram.test.ts +0 -1
- package/src/__tests__/conversation-pairing.test.ts +220 -113
- package/src/__tests__/conversation-routes-guardian-reply.test.ts +8 -0
- package/src/__tests__/conversation-store.test.ts +390 -235
- package/src/__tests__/credential-broker-browser-fill.test.ts +325 -250
- package/src/__tests__/credential-broker-server-use.test.ts +283 -243
- package/src/__tests__/credential-broker.test.ts +128 -74
- package/src/__tests__/credential-host-pattern-match.test.ts +64 -44
- package/src/__tests__/credential-metadata-store.test.ts +360 -311
- package/src/__tests__/credential-policy-validate.test.ts +81 -65
- package/src/__tests__/credential-resolve.test.ts +212 -145
- package/src/__tests__/credential-security-e2e.test.ts +144 -103
- package/src/__tests__/credential-security-invariants.test.ts +253 -208
- package/src/__tests__/credential-selection.test.ts +254 -146
- package/src/__tests__/credential-vault-unit.test.ts +531 -341
- package/src/__tests__/credential-vault.test.ts +761 -484
- package/src/__tests__/daemon-assistant-events.test.ts +91 -66
- package/src/__tests__/daemon-lifecycle.test.ts +258 -190
- package/src/__tests__/daemon-server-session-init.test.ts +2 -1
- package/src/__tests__/date-context.test.ts +314 -249
- package/src/__tests__/db-migration-rollback.test.ts +259 -130
- package/src/__tests__/db-schedule-syntax-migration.test.ts +78 -41
- package/src/__tests__/delete-managed-skill-tool.test.ts +77 -53
- package/src/__tests__/deterministic-verification-control-plane.test.ts +0 -1
- package/src/__tests__/dictation-mode-detection.test.ts +77 -55
- package/src/__tests__/dictation-profile-store.test.ts +70 -56
- package/src/__tests__/dictation-text-processing.test.ts +53 -35
- package/src/__tests__/diff.test.ts +102 -98
- package/src/__tests__/domain-normalize.test.ts +54 -54
- package/src/__tests__/domain-policy.test.ts +71 -55
- package/src/__tests__/dynamic-page-surface.test.ts +31 -33
- package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +69 -69
- package/src/__tests__/edit-engine.test.ts +56 -56
- package/src/__tests__/elevenlabs-client.test.ts +117 -91
- package/src/__tests__/elevenlabs-config.test.ts +32 -31
- package/src/__tests__/email-classifier.test.ts +15 -12
- package/src/__tests__/email-cli.test.ts +121 -108
- package/src/__tests__/emit-signal-routing-intent.test.ts +76 -69
- package/src/__tests__/encrypted-store.test.ts +180 -154
- package/src/__tests__/entity-extractor.test.ts +108 -87
- package/src/__tests__/entity-search.test.ts +664 -258
- package/src/__tests__/ephemeral-permissions.test.ts +224 -188
- package/src/__tests__/event-bus.test.ts +81 -77
- package/src/__tests__/extract-email.test.ts +29 -20
- package/src/__tests__/file-edit-tool.test.ts +62 -44
- package/src/__tests__/file-ops-service.test.ts +131 -114
- package/src/__tests__/file-read-tool.test.ts +48 -31
- package/src/__tests__/file-write-tool.test.ts +43 -37
- package/src/__tests__/filesystem-tools.test.ts +238 -209
- package/src/__tests__/followup-tools.test.ts +237 -162
- package/src/__tests__/forbidden-legacy-symbols.test.ts +19 -20
- package/src/__tests__/frontmatter.test.ts +96 -81
- package/src/__tests__/fuzzy-match-property.test.ts +75 -81
- package/src/__tests__/fuzzy-match.test.ts +71 -65
- package/src/__tests__/gateway-client-managed-outbound.test.ts +76 -57
- package/src/__tests__/gateway-only-enforcement.test.ts +0 -1
- package/src/__tests__/gateway-only-guard.test.ts +0 -1
- package/src/__tests__/gemini-image-service.test.ts +113 -100
- package/src/__tests__/gemini-provider.test.ts +297 -220
- package/src/__tests__/get-weather.test.ts +188 -114
- package/src/__tests__/gmail-integration.test.ts +13 -5
- package/src/__tests__/guardian-action-conversation-turn.test.ts +226 -171
- package/src/__tests__/guardian-action-copy-generator.test.ts +111 -93
- package/src/__tests__/guardian-action-followup-executor.test.ts +0 -1
- package/src/__tests__/guardian-action-followup-store.test.ts +199 -167
- package/src/__tests__/guardian-action-grant-mint-consume.test.ts +297 -250
- package/src/__tests__/guardian-action-late-reply.test.ts +462 -316
- package/src/__tests__/guardian-action-no-hardcoded-copy.test.ts +23 -18
- package/src/__tests__/guardian-action-store.test.ts +158 -109
- package/src/__tests__/guardian-action-sweep.test.ts +114 -100
- package/src/__tests__/guardian-actions-endpoint.test.ts +440 -256
- package/src/__tests__/guardian-control-plane-policy.test.ts +497 -331
- package/src/__tests__/guardian-decision-primitive-canonical.test.ts +217 -215
- package/src/__tests__/guardian-dispatch.test.ts +316 -256
- package/src/__tests__/guardian-grant-minting.test.ts +247 -178
- package/src/__tests__/guardian-outbound-http.test.ts +5 -3
- package/src/__tests__/guardian-principal-id-roundtrip.test.ts +99 -96
- package/src/__tests__/guardian-question-copy.test.ts +17 -17
- package/src/__tests__/guardian-question-mode.test.ts +134 -100
- package/src/__tests__/guardian-routing-invariants.test.ts +0 -1
- package/src/__tests__/guardian-routing-state.test.ts +0 -1
- package/src/__tests__/guardian-verification-intent-routing.test.ts +94 -88
- package/src/__tests__/guardian-verification-voice-binding.test.ts +0 -1
- package/src/__tests__/guardian-verify-setup-skill-regression.test.ts +0 -1
- package/src/__tests__/handle-user-message-secret-resume.test.ts +7 -2
- package/src/__tests__/handlers-add-trust-rule-metadata.test.ts +92 -76
- package/src/__tests__/handlers-cu-observation-blob.test.ts +103 -70
- package/src/__tests__/handlers-ipc-blob-probe.test.ts +77 -51
- package/src/__tests__/handlers-slack-config.test.ts +63 -54
- package/src/__tests__/handlers-task-submit-slash.test.ts +18 -18
- package/src/__tests__/handlers-telegram-config.test.ts +662 -329
- package/src/__tests__/handlers-twitter-config.test.ts +525 -298
- package/src/__tests__/handlers-user-message-approval-consumption.test.ts +5 -2
- package/src/__tests__/headless-browser-interactions.test.ts +444 -280
- package/src/__tests__/headless-browser-navigate.test.ts +116 -79
- package/src/__tests__/headless-browser-read-tools.test.ts +123 -86
- package/src/__tests__/headless-browser-snapshot.test.ts +71 -56
- package/src/__tests__/heartbeat-service.test.ts +76 -58
- package/src/__tests__/history-repair-observability.test.ts +14 -14
- package/src/__tests__/history-repair.test.ts +171 -167
- package/src/__tests__/home-base-bootstrap.test.ts +30 -27
- package/src/__tests__/hooks-blocking.test.ts +86 -37
- package/src/__tests__/hooks-cli.test.ts +104 -68
- package/src/__tests__/hooks-config.test.ts +81 -43
- package/src/__tests__/hooks-discovery.test.ts +106 -96
- package/src/__tests__/hooks-integration.test.ts +78 -72
- package/src/__tests__/hooks-manager.test.ts +99 -61
- package/src/__tests__/hooks-runner.test.ts +94 -71
- package/src/__tests__/hooks-settings.test.ts +69 -64
- package/src/__tests__/hooks-templates.test.ts +85 -54
- package/src/__tests__/hooks-ts-runner.test.ts +82 -45
- package/src/__tests__/hooks-watch.test.ts +32 -22
- package/src/__tests__/host-file-edit-tool.test.ts +190 -148
- package/src/__tests__/host-file-read-tool.test.ts +86 -63
- package/src/__tests__/host-file-write-tool.test.ts +98 -64
- package/src/__tests__/host-shell-tool.test.ts +342 -233
- package/src/__tests__/inbound-invite-redemption.test.ts +0 -1
- package/src/__tests__/ingress-member-store.test.ts +163 -159
- package/src/__tests__/ingress-reconcile.test.ts +13 -6
- package/src/__tests__/ingress-routes-http.test.ts +441 -356
- package/src/__tests__/ingress-url-consistency.test.ts +125 -64
- package/src/__tests__/integration-status.test.ts +93 -73
- package/src/__tests__/intent-routing.test.ts +148 -118
- package/src/__tests__/invite-redemption-service.test.ts +163 -121
- package/src/__tests__/ipc-blob-store.test.ts +104 -91
- package/src/__tests__/ipc-contract-inventory.test.ts +27 -15
- package/src/__tests__/ipc-contract.test.ts +24 -23
- package/src/__tests__/ipc-protocol.test.ts +52 -46
- package/src/__tests__/ipc-roundtrip.benchmark.test.ts +61 -50
- package/src/__tests__/ipc-snapshot.test.ts +1135 -1056
- package/src/__tests__/ipc-validate.test.ts +240 -179
- package/src/__tests__/key-migration.test.ts +123 -90
- package/src/__tests__/keychain.test.ts +150 -123
- package/src/__tests__/lifecycle-docs-guard.test.ts +65 -64
- package/src/__tests__/llm-usage-store.test.ts +112 -87
- package/src/__tests__/managed-skill-lifecycle.test.ts +147 -108
- package/src/__tests__/managed-store.test.ts +411 -360
- package/src/__tests__/mcp-cli.test.ts +190 -124
- package/src/__tests__/mcp-health-check.test.ts +26 -21
- package/src/__tests__/media-generate-image.test.ts +122 -99
- package/src/__tests__/media-reuse-story.e2e.test.ts +282 -214
- package/src/__tests__/media-visibility-policy.test.ts +86 -38
- package/src/__tests__/memory-context-benchmark.benchmark.test.ts +146 -100
- package/src/__tests__/memory-lifecycle-e2e.test.ts +385 -297
- package/src/__tests__/memory-query-builder.test.ts +32 -33
- package/src/__tests__/memory-recall-quality.test.ts +761 -407
- package/src/__tests__/memory-regressions.experimental.test.ts +443 -380
- package/src/__tests__/memory-regressions.test.ts +3725 -2642
- package/src/__tests__/memory-retrieval-budget.test.ts +7 -8
- package/src/__tests__/memory-retrieval.benchmark.test.ts +144 -109
- package/src/__tests__/memory-upsert-concurrency.test.ts +292 -201
- package/src/__tests__/messaging-send-tool.test.ts +36 -29
- package/src/__tests__/migration-cli-flows.test.ts +69 -53
- package/src/__tests__/migration-ordering.test.ts +103 -86
- package/src/__tests__/mime-builder.test.ts +55 -32
- package/src/__tests__/mock-signup-server.test.ts +384 -246
- package/src/__tests__/model-intents.test.ts +61 -37
- package/src/__tests__/no-direct-anthropic-sdk-imports.test.ts +9 -12
- package/src/__tests__/no-is-trusted-guard.test.ts +24 -21
- package/src/__tests__/non-member-access-request.test.ts +3 -2
- package/src/__tests__/notification-broadcaster.test.ts +99 -81
- package/src/__tests__/notification-decision-fallback.test.ts +223 -178
- package/src/__tests__/notification-decision-strategy.test.ts +375 -337
- package/src/__tests__/notification-deep-link.test.ts +67 -61
- package/src/__tests__/notification-guardian-path.test.ts +248 -206
- package/src/__tests__/notification-routing-intent.test.ts +166 -93
- package/src/__tests__/notification-thread-candidate-validation.test.ts +78 -75
- package/src/__tests__/notification-thread-candidates.test.ts +64 -61
- package/src/__tests__/oauth-callback-registry.test.ts +40 -30
- package/src/__tests__/oauth-connect-handler.test.ts +109 -89
- package/src/__tests__/oauth-scope-policy.test.ts +63 -55
- package/src/__tests__/oauth2-gateway-transport.test.ts +252 -174
- package/src/__tests__/onboarding-starter-tasks.test.ts +93 -89
- package/src/__tests__/onboarding-template-contract.test.ts +93 -94
- package/src/__tests__/openai-provider.test.ts +366 -274
- package/src/__tests__/pairing-concurrent.test.ts +18 -12
- package/src/__tests__/pairing-routes.test.ts +45 -41
- package/src/__tests__/parallel-tool.benchmark.test.ts +108 -58
- package/src/__tests__/parser.test.ts +316 -226
- package/src/__tests__/path-classifier.test.ts +24 -25
- package/src/__tests__/path-policy.test.ts +187 -147
- package/src/__tests__/phone.test.ts +36 -36
- package/src/__tests__/platform-move-helper.test.ts +48 -40
- package/src/__tests__/platform-socket-path.test.ts +23 -24
- package/src/__tests__/platform-workspace-migration.test.ts +464 -414
- package/src/__tests__/platform.test.ts +61 -53
- package/src/__tests__/playbook-execution.test.ts +397 -265
- package/src/__tests__/playbook-tools.test.ts +267 -196
- package/src/__tests__/prebuilt-home-base-seed.test.ts +30 -27
- package/src/__tests__/pricing.test.ts +316 -136
- package/src/__tests__/profile-compiler.test.ts +206 -188
- package/src/__tests__/provider-commit-message-generator.test.ts +114 -106
- package/src/__tests__/provider-error-scenarios.test.ts +212 -158
- package/src/__tests__/provider-fail-open-selection.test.ts +51 -44
- package/src/__tests__/provider-registry-ollama.test.ts +13 -9
- package/src/__tests__/provider-streaming.benchmark.test.ts +232 -183
- package/src/__tests__/proxy-approval-callback.test.ts +180 -119
- package/src/__tests__/public-ingress-urls.test.ts +112 -94
- package/src/__tests__/qdrant-manager.test.ts +147 -98
- package/src/__tests__/ratelimit.test.ts +152 -82
- package/src/__tests__/recording-handler.test.ts +273 -151
- package/src/__tests__/recording-intent-fallback.test.ts +94 -75
- package/src/__tests__/recording-intent-handler.test.ts +9 -2
- package/src/__tests__/recording-intent.test.ts +578 -379
- package/src/__tests__/recording-state-machine.test.ts +530 -316
- package/src/__tests__/recurrence-engine-rruleset.test.ts +150 -92
- package/src/__tests__/recurrence-engine.test.ts +81 -41
- package/src/__tests__/recurrence-types.test.ts +63 -44
- package/src/__tests__/relay-server.test.ts +2131 -1602
- package/src/__tests__/reminder-store.test.ts +158 -80
- package/src/__tests__/reminder.test.ts +113 -109
- package/src/__tests__/remote-skill-policy.test.ts +96 -72
- package/src/__tests__/request-file-tool.test.ts +74 -67
- package/src/__tests__/response-tier.test.ts +131 -74
- package/src/__tests__/runtime-attachment-metadata.test.ts +0 -1
- package/src/__tests__/runtime-events-sse-parity.test.ts +167 -145
- package/src/__tests__/runtime-events-sse.test.ts +0 -1
- package/src/__tests__/sandbox-diagnostics.test.ts +66 -56
- package/src/__tests__/sandbox-host-parity.test.ts +377 -301
- package/src/__tests__/scaffold-managed-skill-tool.test.ts +213 -161
- package/src/__tests__/schedule-store.test.ts +268 -205
- package/src/__tests__/schedule-tools.test.ts +702 -524
- package/src/__tests__/scheduler-recurrence.test.ts +240 -130
- package/src/__tests__/scoped-approval-grants.test.ts +258 -168
- package/src/__tests__/scoped-grant-security-matrix.test.ts +160 -146
- package/src/__tests__/script-proxy-certs.test.ts +38 -35
- package/src/__tests__/script-proxy-connect-tunnel.test.ts +71 -46
- package/src/__tests__/script-proxy-decision-trace.test.ts +161 -84
- package/src/__tests__/script-proxy-http-forwarder.test.ts +146 -129
- package/src/__tests__/script-proxy-injection-runtime.test.ts +139 -113
- package/src/__tests__/script-proxy-mitm-handler.test.ts +226 -142
- package/src/__tests__/script-proxy-policy-runtime.test.ts +126 -86
- package/src/__tests__/script-proxy-policy.test.ts +308 -153
- package/src/__tests__/script-proxy-rewrite-specificity.test.ts +74 -62
- package/src/__tests__/script-proxy-router.test.ts +111 -77
- package/src/__tests__/script-proxy-session-manager.test.ts +156 -113
- package/src/__tests__/script-proxy-session-runtime.test.ts +28 -24
- package/src/__tests__/secret-allowlist.test.ts +105 -90
- package/src/__tests__/secret-ingress-handler.test.ts +41 -30
- package/src/__tests__/secret-onetime-send.test.ts +67 -50
- package/src/__tests__/secret-prompt-log-hygiene.test.ts +35 -31
- package/src/__tests__/secret-response-routing.test.ts +50 -41
- package/src/__tests__/secret-scanner-executor.test.ts +152 -111
- package/src/__tests__/secret-scanner.test.ts +495 -413
- package/src/__tests__/secure-keys.test.ts +132 -121
- package/src/__tests__/send-endpoint-busy.test.ts +8 -3
- package/src/__tests__/send-notification-tool.test.ts +43 -42
- package/src/__tests__/sensitive-output-placeholders.test.ts +72 -64
- package/src/__tests__/sequence-store.test.ts +335 -167
- package/src/__tests__/server-history-render.test.ts +341 -202
- package/src/__tests__/session-abort-tool-results.test.ts +133 -70
- package/src/__tests__/session-confirmation-signals.test.ts +252 -160
- package/src/__tests__/session-conflict-gate.test.ts +775 -585
- package/src/__tests__/session-error.test.ts +222 -191
- package/src/__tests__/session-evictor.test.ts +79 -62
- package/src/__tests__/session-init.benchmark.test.ts +170 -108
- package/src/__tests__/session-load-history-repair.test.ts +273 -139
- package/src/__tests__/session-messaging-secret-redirect.test.ts +130 -90
- package/src/__tests__/session-pre-run-repair.test.ts +106 -59
- package/src/__tests__/session-profile-injection.test.ts +198 -130
- package/src/__tests__/session-provider-retry-repair.test.ts +223 -141
- package/src/__tests__/session-queue.test.ts +624 -321
- package/src/__tests__/session-runtime-assembly.test.ts +425 -329
- package/src/__tests__/session-runtime-workspace.test.ts +69 -61
- package/src/__tests__/session-skill-tools.test.ts +973 -678
- package/src/__tests__/session-slash-known.test.ts +185 -133
- package/src/__tests__/session-slash-queue.test.ts +147 -81
- package/src/__tests__/session-slash-unknown.test.ts +135 -90
- package/src/__tests__/session-surfaces-task-progress.test.ts +122 -87
- package/src/__tests__/session-tool-setup-app-refresh.test.ts +338 -177
- package/src/__tests__/session-tool-setup-memory-scope.test.ts +63 -40
- package/src/__tests__/session-tool-setup-side-effect-flag.test.ts +60 -37
- package/src/__tests__/session-tool-setup-tools-disabled.test.ts +28 -26
- package/src/__tests__/session-undo.test.ts +43 -30
- package/src/__tests__/session-workspace-cache-state.test.ts +108 -67
- package/src/__tests__/session-workspace-injection.test.ts +245 -117
- package/src/__tests__/session-workspace-tool-tracking.test.ts +260 -93
- package/src/__tests__/shared-filesystem-errors.test.ts +47 -47
- package/src/__tests__/shell-credential-ref.test.ts +126 -90
- package/src/__tests__/shell-identity.test.ts +134 -111
- package/src/__tests__/shell-parser-fuzz.test.ts +263 -179
- package/src/__tests__/shell-parser-property.test.ts +435 -288
- package/src/__tests__/shell-tool-proxy-mode.test.ts +142 -70
- package/src/__tests__/size-guard.test.ts +42 -44
- package/src/__tests__/skill-feature-flags-integration.test.ts +79 -52
- package/src/__tests__/skill-feature-flags.test.ts +75 -47
- package/src/__tests__/skill-include-graph.test.ts +143 -148
- package/src/__tests__/skill-load-feature-flag.test.ts +94 -59
- package/src/__tests__/skill-load-tool.test.ts +371 -199
- package/src/__tests__/skill-projection-feature-flag.test.ts +131 -88
- package/src/__tests__/skill-projection.benchmark.test.ts +93 -65
- package/src/__tests__/skill-script-runner-host.test.ts +460 -250
- package/src/__tests__/skill-script-runner-sandbox.test.ts +168 -108
- package/src/__tests__/skill-script-runner.test.ts +115 -74
- package/src/__tests__/skill-tool-factory.test.ts +140 -96
- package/src/__tests__/skill-tool-manifest.test.ts +306 -210
- package/src/__tests__/skill-version-hash.test.ts +70 -56
- package/src/__tests__/skills.test.ts +0 -1
- package/src/__tests__/slack-channel-config.test.ts +127 -84
- package/src/__tests__/slack-skill.test.ts +60 -47
- package/src/__tests__/slash-commands-catalog.test.ts +37 -31
- package/src/__tests__/slash-commands-parser.test.ts +71 -64
- package/src/__tests__/slash-commands-resolver.test.ts +143 -107
- package/src/__tests__/slash-commands-rewrite.test.ts +22 -22
- package/src/__tests__/sms-messaging-provider.test.ts +4 -0
- package/src/__tests__/speaker-identification.test.ts +28 -25
- package/src/__tests__/starter-bundle.test.ts +27 -23
- package/src/__tests__/starter-task-flow.test.ts +67 -52
- package/src/__tests__/subagent-manager-notify.test.ts +154 -108
- package/src/__tests__/subagent-tools.test.ts +311 -270
- package/src/__tests__/subagent-types.test.ts +40 -40
- package/src/__tests__/surface-mutex-cleanup.test.ts +42 -30
- package/src/__tests__/swarm-dag-pathological.test.ts +122 -111
- package/src/__tests__/swarm-orchestrator.test.ts +135 -101
- package/src/__tests__/swarm-plan-validator.test.ts +125 -73
- package/src/__tests__/swarm-recursion.test.ts +58 -46
- package/src/__tests__/swarm-router-planner.test.ts +99 -74
- package/src/__tests__/swarm-session-integration.test.ts +148 -91
- package/src/__tests__/swarm-tool.test.ts +65 -45
- package/src/__tests__/swarm-worker-backend.test.ts +59 -45
- package/src/__tests__/swarm-worker-runner.test.ts +133 -118
- package/src/__tests__/system-prompt.test.ts +311 -256
- package/src/__tests__/task-compiler.test.ts +176 -120
- package/src/__tests__/task-management-tools.test.ts +561 -456
- package/src/__tests__/task-memory-cleanup.test.ts +627 -362
- package/src/__tests__/task-runner.test.ts +117 -94
- package/src/__tests__/task-scheduler.test.ts +113 -84
- package/src/__tests__/task-tools.test.ts +349 -264
- package/src/__tests__/terminal-sandbox.test.ts +138 -108
- package/src/__tests__/terminal-tools.test.ts +350 -305
- package/src/__tests__/thread-seed-composer.test.ts +307 -180
- package/src/__tests__/tool-approval-handler.test.ts +238 -137
- package/src/__tests__/tool-audit-listener.test.ts +69 -69
- package/src/__tests__/tool-domain-event-publisher.test.ts +142 -132
- package/src/__tests__/tool-execution-abort-cleanup.test.ts +155 -146
- package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +136 -105
- package/src/__tests__/tool-executor-lifecycle-events.test.ts +355 -239
- package/src/__tests__/tool-executor-redaction.test.ts +112 -109
- package/src/__tests__/tool-executor-shell-integration.test.ts +130 -79
- package/src/__tests__/tool-executor.test.ts +1274 -674
- package/src/__tests__/tool-grant-request-escalation.test.ts +401 -283
- package/src/__tests__/tool-metrics-listener.test.ts +97 -85
- package/src/__tests__/tool-notification-listener.test.ts +42 -25
- package/src/__tests__/tool-permission-simulate-handler.test.ts +137 -113
- package/src/__tests__/tool-policy.test.ts +44 -25
- package/src/__tests__/tool-profiling-listener.test.ts +99 -93
- package/src/__tests__/tool-result-truncation.test.ts +5 -4
- package/src/__tests__/tool-trace-listener.test.ts +131 -111
- package/src/__tests__/top-level-renderer.test.ts +62 -58
- package/src/__tests__/top-level-scanner.test.ts +68 -64
- package/src/__tests__/trace-emitter.test.ts +56 -56
- package/src/__tests__/trust-context-guards.test.ts +65 -65
- package/src/__tests__/trust-store.test.ts +1239 -806
- package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
- package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +0 -1
- package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +3 -2
- package/src/__tests__/trusted-contact-multichannel.test.ts +3 -2
- package/src/__tests__/trusted-contact-verification.test.ts +251 -231
- package/src/__tests__/turn-commit.test.ts +259 -200
- package/src/__tests__/twilio-provider.test.ts +140 -126
- package/src/__tests__/twilio-rest.test.ts +22 -18
- package/src/__tests__/twilio-routes-elevenlabs.test.ts +0 -1
- package/src/__tests__/twilio-routes-twiml.test.ts +55 -55
- package/src/__tests__/twilio-routes.test.ts +0 -1
- package/src/__tests__/twitter-auth-handler.test.ts +184 -139
- package/src/__tests__/twitter-cli-error-shaping.test.ts +88 -73
- package/src/__tests__/twitter-cli-routing.test.ts +146 -99
- package/src/__tests__/twitter-oauth-client.test.ts +82 -65
- package/src/__tests__/update-bulletin-format.test.ts +69 -66
- package/src/__tests__/update-bulletin-state.test.ts +66 -60
- package/src/__tests__/update-bulletin.test.ts +150 -114
- package/src/__tests__/update-template-contract.test.ts +15 -10
- package/src/__tests__/url-safety.test.ts +288 -265
- package/src/__tests__/user-reference.test.ts +32 -32
- package/src/__tests__/view-image-tool.test.ts +118 -96
- package/src/__tests__/voice-invite-redemption.test.ts +111 -106
- package/src/__tests__/voice-quality.test.ts +117 -102
- package/src/__tests__/voice-scoped-grant-consumer.test.ts +204 -146
- package/src/__tests__/voice-session-bridge.test.ts +351 -216
- package/src/__tests__/weather-skill-regression.test.ts +170 -120
- package/src/__tests__/web-fetch.test.ts +664 -526
- package/src/__tests__/web-search.test.ts +379 -213
- package/src/__tests__/work-item-output.test.ts +90 -53
- package/src/__tests__/workspace-git-service.test.ts +437 -356
- package/src/__tests__/workspace-heartbeat-service.test.ts +125 -91
- package/src/__tests__/workspace-lifecycle.test.ts +98 -64
- package/src/__tests__/workspace-policy.test.ts +139 -71
- package/src/cli/mcp.ts +81 -28
- package/src/commands/__tests__/cc-command-registry.test.ts +142 -134
- package/src/config/__tests__/feature-flag-registry-guard.test.ts +48 -39
- package/src/config/bundled-skills/chatgpt-import/tools/chatgpt-import.ts +25 -10
- package/src/config/bundled-skills/doordash/__tests__/doordash-session.test.ts +0 -1
- package/src/config/bundled-skills/guardian-verify-setup/SKILL.md +6 -11
- package/src/config/bundled-skills/messaging/SKILL.md +4 -3
- package/src/config/bundled-skills/messaging/tools/gmail-outreach-scan.ts +15 -5
- package/src/config/bundled-skills/messaging/tools/gmail-sender-digest.ts +16 -5
- package/src/config/bundled-skills/phone-calls/SKILL.md +1 -2
- package/src/config/bundled-skills/slack/tools/slack-scan-digest.ts +34 -32
- package/src/config/bundled-skills/sms-setup/SKILL.md +8 -16
- package/src/config/bundled-skills/telegram-setup/SKILL.md +3 -3
- package/src/config/bundled-skills/trusted-contacts/SKILL.md +13 -25
- package/src/config/bundled-skills/twilio-setup/SKILL.md +13 -23
- package/src/config/bundled-tool-registry.ts +2 -0
- package/src/config/env.ts +3 -4
- package/src/config/system-prompt.ts +32 -0
- package/src/mcp/client.ts +2 -7
- package/src/memory/db-connection.ts +16 -10
- package/src/messaging/providers/gmail/adapter.ts +10 -3
- package/src/messaging/providers/gmail/client.ts +280 -72
- package/src/runtime/auth/__tests__/context.test.ts +75 -65
- package/src/runtime/auth/__tests__/credential-service.test.ts +137 -114
- package/src/runtime/auth/__tests__/guard-tests.test.ts +84 -90
- package/src/runtime/auth/__tests__/ipc-auth-context.test.ts +40 -40
- package/src/runtime/auth/__tests__/middleware.test.ts +80 -74
- package/src/runtime/auth/__tests__/policy.test.ts +9 -9
- package/src/runtime/auth/__tests__/route-policy.test.ts +76 -65
- package/src/runtime/auth/__tests__/scopes.test.ts +68 -60
- package/src/runtime/auth/__tests__/subject.test.ts +54 -54
- package/src/runtime/auth/__tests__/token-service.test.ts +115 -108
- package/src/runtime/auth/scopes.ts +3 -0
- package/src/runtime/auth/token-service.ts +4 -1
- package/src/runtime/auth/types.ts +2 -1
- package/src/runtime/http-server.ts +2 -1
- package/src/security/secure-keys.ts +120 -54
- package/src/tools/browser/__tests__/auth-cache.test.ts +69 -63
- package/src/tools/browser/__tests__/auth-detector.test.ts +218 -157
- package/src/tools/browser/__tests__/jit-auth.test.ts +83 -99
- package/src/tools/terminal/safe-env.ts +7 -0
|
@@ -1,16 +1,23 @@
|
|
|
1
|
-
import { mkdtempSync, rmSync } from
|
|
2
|
-
import { tmpdir } from
|
|
3
|
-
import { join } from
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
1
|
+
import { mkdtempSync, rmSync } from "node:fs";
|
|
2
|
+
import { tmpdir } from "node:os";
|
|
3
|
+
import { join } from "node:path";
|
|
4
|
+
import {
|
|
5
|
+
afterAll,
|
|
6
|
+
beforeAll,
|
|
7
|
+
beforeEach,
|
|
8
|
+
describe,
|
|
9
|
+
expect,
|
|
10
|
+
mock,
|
|
11
|
+
test,
|
|
12
|
+
} from "bun:test";
|
|
13
|
+
|
|
14
|
+
import { DEFAULT_CONFIG } from "../config/defaults.js";
|
|
15
|
+
import { estimatePromptTokens } from "../context/token-estimator.js";
|
|
16
|
+
import { ContextWindowManager } from "../context/window-manager.js";
|
|
17
|
+
import { getDb, initializeDb, resetDb } from "../memory/db.js";
|
|
18
|
+
import { buildMemoryQuery } from "../memory/query-builder.js";
|
|
19
|
+
import { computeRecallBudget } from "../memory/retrieval-budget.js";
|
|
20
|
+
import { buildMemoryRecall } from "../memory/retriever.js";
|
|
14
21
|
import {
|
|
15
22
|
conversations,
|
|
16
23
|
memoryEntities,
|
|
@@ -19,30 +26,31 @@ import {
|
|
|
19
26
|
memoryItems,
|
|
20
27
|
memoryItemSources,
|
|
21
28
|
messages,
|
|
22
|
-
} from
|
|
23
|
-
import type { Message, Provider } from
|
|
29
|
+
} from "../memory/schema.js";
|
|
30
|
+
import type { Message, Provider } from "../providers/types.js";
|
|
24
31
|
|
|
25
|
-
const testDir = mkdtempSync(join(tmpdir(),
|
|
32
|
+
const testDir = mkdtempSync(join(tmpdir(), "context-memory-e2e-"));
|
|
26
33
|
|
|
27
|
-
mock.module(
|
|
34
|
+
mock.module("../util/platform.js", () => ({
|
|
28
35
|
getDataDir: () => testDir,
|
|
29
|
-
isMacOS: () => process.platform ===
|
|
30
|
-
isLinux: () => process.platform ===
|
|
31
|
-
isWindows: () => process.platform ===
|
|
32
|
-
getSocketPath: () => join(testDir,
|
|
33
|
-
getPidPath: () => join(testDir,
|
|
34
|
-
getDbPath: () => join(testDir,
|
|
35
|
-
getLogPath: () => join(testDir,
|
|
36
|
+
isMacOS: () => process.platform === "darwin",
|
|
37
|
+
isLinux: () => process.platform === "linux",
|
|
38
|
+
isWindows: () => process.platform === "win32",
|
|
39
|
+
getSocketPath: () => join(testDir, "test.sock"),
|
|
40
|
+
getPidPath: () => join(testDir, "test.pid"),
|
|
41
|
+
getDbPath: () => join(testDir, "test.db"),
|
|
42
|
+
getLogPath: () => join(testDir, "test.log"),
|
|
36
43
|
ensureDataDir: () => {},
|
|
37
44
|
}));
|
|
38
45
|
|
|
39
|
-
mock.module(
|
|
40
|
-
getLogger: () =>
|
|
41
|
-
|
|
42
|
-
|
|
46
|
+
mock.module("../util/logger.js", () => ({
|
|
47
|
+
getLogger: () =>
|
|
48
|
+
new Proxy({} as Record<string, unknown>, {
|
|
49
|
+
get: () => () => {},
|
|
50
|
+
}),
|
|
43
51
|
}));
|
|
44
52
|
|
|
45
|
-
mock.module(
|
|
53
|
+
mock.module("../memory/qdrant-client.js", () => ({
|
|
46
54
|
getQdrantClient: () => ({
|
|
47
55
|
searchWithFilter: async () => [],
|
|
48
56
|
upsertPoints: async () => {},
|
|
@@ -53,14 +61,19 @@ mock.module('../memory/qdrant-client.js', () => ({
|
|
|
53
61
|
|
|
54
62
|
function makeSummaryProvider(counter: { calls: number }): Provider {
|
|
55
63
|
return {
|
|
56
|
-
name:
|
|
64
|
+
name: "mock",
|
|
57
65
|
async sendMessage() {
|
|
58
66
|
counter.calls += 1;
|
|
59
67
|
return {
|
|
60
|
-
content: [
|
|
61
|
-
|
|
68
|
+
content: [
|
|
69
|
+
{
|
|
70
|
+
type: "text",
|
|
71
|
+
text: "## Goals\n- Keep memory stable\n## Decisions\n- Use progressive rollouts",
|
|
72
|
+
},
|
|
73
|
+
],
|
|
74
|
+
model: "mock-context-model",
|
|
62
75
|
usage: { inputTokens: 300, outputTokens: 60 },
|
|
63
|
-
stopReason:
|
|
76
|
+
stopReason: "end_turn",
|
|
64
77
|
};
|
|
65
78
|
},
|
|
66
79
|
};
|
|
@@ -70,28 +83,51 @@ function makeLongHistory(turns: number, finalUserText: string): Message[] {
|
|
|
70
83
|
const rows: Message[] = [];
|
|
71
84
|
for (let i = 0; i < turns; i++) {
|
|
72
85
|
rows.push({
|
|
73
|
-
role:
|
|
74
|
-
content: [
|
|
86
|
+
role: "user",
|
|
87
|
+
content: [
|
|
88
|
+
{
|
|
89
|
+
type: "text",
|
|
90
|
+
text: `[U${i}] Apollo planning thread ${i}: discuss rollout safeguards and runbooks.`,
|
|
91
|
+
},
|
|
92
|
+
],
|
|
75
93
|
});
|
|
76
94
|
rows.push({
|
|
77
|
-
role:
|
|
78
|
-
content: [
|
|
95
|
+
role: "assistant",
|
|
96
|
+
content: [
|
|
97
|
+
{
|
|
98
|
+
type: "text",
|
|
99
|
+
text: `[A${i}] Captured safeguards ${i}: staged rollout, monitoring, and rollback readiness.`,
|
|
100
|
+
},
|
|
101
|
+
],
|
|
79
102
|
});
|
|
80
103
|
}
|
|
81
104
|
rows.push({
|
|
82
|
-
role:
|
|
83
|
-
content: [{ type:
|
|
105
|
+
role: "user",
|
|
106
|
+
content: [{ type: "text", text: finalUserText }],
|
|
84
107
|
});
|
|
85
108
|
return rows;
|
|
86
109
|
}
|
|
87
110
|
|
|
88
|
-
function insertSegment(
|
|
111
|
+
function insertSegment(
|
|
112
|
+
id: string,
|
|
113
|
+
messageId: string,
|
|
114
|
+
conversationId: string,
|
|
115
|
+
role: string,
|
|
116
|
+
text: string,
|
|
117
|
+
createdAt: number,
|
|
118
|
+
): void {
|
|
89
119
|
const db = getDb();
|
|
90
120
|
db.run(`
|
|
91
121
|
INSERT INTO memory_segments (
|
|
92
122
|
id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at
|
|
93
123
|
) VALUES (
|
|
94
|
-
'${id}', '${messageId}', '${conversationId}', '${role}', 0, '${text.replace(
|
|
124
|
+
'${id}', '${messageId}', '${conversationId}', '${role}', 0, '${text.replace(
|
|
125
|
+
/'/g,
|
|
126
|
+
"''",
|
|
127
|
+
)}', ${Math.max(
|
|
128
|
+
6,
|
|
129
|
+
Math.ceil(text.split(/\s+/).length * 1.3),
|
|
130
|
+
)}, 'default', ${createdAt}, ${createdAt}
|
|
95
131
|
)
|
|
96
132
|
`);
|
|
97
133
|
}
|
|
@@ -107,42 +143,44 @@ function insertMemoryItem(opts: {
|
|
|
107
143
|
lastSeenAt: number;
|
|
108
144
|
}): void {
|
|
109
145
|
const db = getDb();
|
|
110
|
-
db.insert(memoryItems)
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
|
|
123
|
-
|
|
146
|
+
db.insert(memoryItems)
|
|
147
|
+
.values({
|
|
148
|
+
id: opts.id,
|
|
149
|
+
kind: opts.kind,
|
|
150
|
+
subject: opts.subject,
|
|
151
|
+
statement: opts.statement,
|
|
152
|
+
status: "active",
|
|
153
|
+
confidence: opts.confidence,
|
|
154
|
+
importance: opts.importance,
|
|
155
|
+
fingerprint: `fp-${opts.id}`,
|
|
156
|
+
firstSeenAt: opts.firstSeenAt,
|
|
157
|
+
lastSeenAt: opts.lastSeenAt,
|
|
158
|
+
lastUsedAt: null,
|
|
159
|
+
scopeId: "default",
|
|
160
|
+
})
|
|
161
|
+
.run();
|
|
124
162
|
}
|
|
125
163
|
|
|
126
|
-
describe(
|
|
164
|
+
describe("Context + Memory E2E regression", () => {
|
|
127
165
|
beforeAll(() => {
|
|
128
166
|
initializeDb();
|
|
129
167
|
});
|
|
130
168
|
|
|
131
169
|
beforeEach(() => {
|
|
132
170
|
const db = getDb();
|
|
133
|
-
db.run(
|
|
134
|
-
db.run(
|
|
135
|
-
db.run(
|
|
136
|
-
db.run(
|
|
137
|
-
db.run(
|
|
138
|
-
db.run(
|
|
139
|
-
db.run(
|
|
140
|
-
db.run(
|
|
141
|
-
db.run(
|
|
142
|
-
db.run(
|
|
143
|
-
db.run(
|
|
144
|
-
db.run(
|
|
145
|
-
db.run(
|
|
171
|
+
db.run("DELETE FROM memory_item_sources");
|
|
172
|
+
db.run("DELETE FROM memory_item_entities");
|
|
173
|
+
db.run("DELETE FROM memory_entity_relations");
|
|
174
|
+
db.run("DELETE FROM memory_entities");
|
|
175
|
+
db.run("DELETE FROM memory_embeddings");
|
|
176
|
+
db.run("DELETE FROM memory_summaries");
|
|
177
|
+
db.run("DELETE FROM memory_items");
|
|
178
|
+
db.run("DELETE FROM memory_segment_fts");
|
|
179
|
+
db.run("DELETE FROM memory_segments");
|
|
180
|
+
db.run("DELETE FROM messages");
|
|
181
|
+
db.run("DELETE FROM conversations");
|
|
182
|
+
db.run("DELETE FROM memory_jobs");
|
|
183
|
+
db.run("DELETE FROM memory_checkpoints");
|
|
146
184
|
});
|
|
147
185
|
|
|
148
186
|
afterAll(() => {
|
|
@@ -154,193 +192,237 @@ describe('Context + Memory E2E regression', () => {
|
|
|
154
192
|
}
|
|
155
193
|
});
|
|
156
194
|
|
|
157
|
-
test(
|
|
195
|
+
test("one-turn flow compacts context, enforces dynamic budget, and recalls relation-linked memory", async () => {
|
|
158
196
|
const db = getDb();
|
|
159
|
-
const conversationId =
|
|
197
|
+
const conversationId = "conv-context-memory-e2e";
|
|
160
198
|
const now = 1_700_900_000_000;
|
|
161
|
-
const currentMessageId =
|
|
162
|
-
const currentUserText =
|
|
163
|
-
|
|
164
|
-
|
|
165
|
-
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
199
|
+
const currentMessageId = "msg-e2e-current";
|
|
200
|
+
const currentUserText =
|
|
201
|
+
"For Apollo, what rollout should we use this week? Also tracking note: Apollo secret code 123XYZ.";
|
|
202
|
+
|
|
203
|
+
db.insert(conversations)
|
|
204
|
+
.values({
|
|
205
|
+
id: conversationId,
|
|
206
|
+
title: null,
|
|
207
|
+
createdAt: now,
|
|
208
|
+
updatedAt: now,
|
|
209
|
+
totalInputTokens: 0,
|
|
210
|
+
totalOutputTokens: 0,
|
|
211
|
+
totalEstimatedCost: 0,
|
|
212
|
+
contextSummary: null,
|
|
213
|
+
contextCompactedMessageCount: 0,
|
|
214
|
+
contextCompactedAt: null,
|
|
215
|
+
})
|
|
216
|
+
.run();
|
|
176
217
|
|
|
177
218
|
const seededMessages = [
|
|
178
219
|
{
|
|
179
|
-
id:
|
|
180
|
-
role:
|
|
181
|
-
text:
|
|
220
|
+
id: "msg-e2e-user-2",
|
|
221
|
+
role: "user",
|
|
222
|
+
text: "Historical deployment note kept for audit context.",
|
|
182
223
|
createdAt: now + 2_000,
|
|
183
224
|
},
|
|
184
225
|
{
|
|
185
|
-
id:
|
|
186
|
-
role:
|
|
187
|
-
text:
|
|
226
|
+
id: "msg-e2e-user-10",
|
|
227
|
+
role: "user",
|
|
228
|
+
text: "Sprint review confirmed Apollo rollout policy and guardrails.",
|
|
188
229
|
createdAt: now + 10_000,
|
|
189
230
|
},
|
|
190
231
|
{
|
|
191
|
-
id:
|
|
192
|
-
role:
|
|
193
|
-
text:
|
|
232
|
+
id: "msg-e2e-user-12",
|
|
233
|
+
role: "user",
|
|
234
|
+
text: "Playbook update captured HermesGate ramp guidance.",
|
|
194
235
|
createdAt: now + 12_000,
|
|
195
236
|
},
|
|
196
237
|
{
|
|
197
|
-
id:
|
|
198
|
-
role:
|
|
199
|
-
text:
|
|
238
|
+
id: "msg-e2e-assistant-12",
|
|
239
|
+
role: "assistant",
|
|
240
|
+
text: "Acknowledged rollout notes and linked them to operations memory.",
|
|
200
241
|
createdAt: now + 12_001,
|
|
201
242
|
},
|
|
202
243
|
] as const;
|
|
203
244
|
|
|
204
245
|
for (const row of seededMessages) {
|
|
205
|
-
db.insert(messages)
|
|
206
|
-
|
|
246
|
+
db.insert(messages)
|
|
247
|
+
.values({
|
|
248
|
+
id: row.id,
|
|
249
|
+
conversationId,
|
|
250
|
+
role: row.role,
|
|
251
|
+
content: JSON.stringify([{ type: "text", text: row.text }]),
|
|
252
|
+
createdAt: row.createdAt,
|
|
253
|
+
})
|
|
254
|
+
.run();
|
|
255
|
+
insertSegment(
|
|
256
|
+
`seg-${row.id}`,
|
|
257
|
+
row.id,
|
|
207
258
|
conversationId,
|
|
208
|
-
|
|
209
|
-
|
|
210
|
-
|
|
211
|
-
|
|
212
|
-
insertSegment(`seg-${row.id}`, row.id, conversationId, row.role, row.text, row.createdAt);
|
|
259
|
+
row.role,
|
|
260
|
+
row.text,
|
|
261
|
+
row.createdAt,
|
|
262
|
+
);
|
|
213
263
|
}
|
|
214
264
|
|
|
215
|
-
db.insert(messages)
|
|
216
|
-
|
|
265
|
+
db.insert(messages)
|
|
266
|
+
.values({
|
|
267
|
+
id: currentMessageId,
|
|
268
|
+
conversationId,
|
|
269
|
+
role: "user",
|
|
270
|
+
content: JSON.stringify([{ type: "text", text: currentUserText }]),
|
|
271
|
+
createdAt: now + 100_000,
|
|
272
|
+
})
|
|
273
|
+
.run();
|
|
274
|
+
insertSegment(
|
|
275
|
+
"seg-e2e-current",
|
|
276
|
+
currentMessageId,
|
|
217
277
|
conversationId,
|
|
218
|
-
|
|
219
|
-
|
|
220
|
-
|
|
221
|
-
|
|
222
|
-
insertSegment('seg-e2e-current', currentMessageId, conversationId, 'user', currentUserText, now + 100_000);
|
|
278
|
+
"user",
|
|
279
|
+
currentUserText,
|
|
280
|
+
now + 100_000,
|
|
281
|
+
);
|
|
223
282
|
|
|
224
|
-
db.insert(memoryEntities)
|
|
225
|
-
|
|
226
|
-
|
|
227
|
-
|
|
228
|
-
|
|
229
|
-
|
|
230
|
-
|
|
231
|
-
|
|
232
|
-
|
|
233
|
-
|
|
234
|
-
|
|
235
|
-
|
|
236
|
-
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
240
|
-
|
|
283
|
+
db.insert(memoryEntities)
|
|
284
|
+
.values([
|
|
285
|
+
{
|
|
286
|
+
id: "entity-apollo",
|
|
287
|
+
name: "Apollo",
|
|
288
|
+
type: "project",
|
|
289
|
+
aliases: JSON.stringify(["project-apollo"]),
|
|
290
|
+
description: null,
|
|
291
|
+
firstSeenAt: now,
|
|
292
|
+
lastSeenAt: now + 100_000,
|
|
293
|
+
mentionCount: 6,
|
|
294
|
+
},
|
|
295
|
+
{
|
|
296
|
+
id: "entity-hermes",
|
|
297
|
+
name: "HermesGate",
|
|
298
|
+
type: "strategy",
|
|
299
|
+
aliases: JSON.stringify(["hermes-gate"]),
|
|
300
|
+
description: null,
|
|
301
|
+
firstSeenAt: now,
|
|
302
|
+
lastSeenAt: now + 100_000,
|
|
303
|
+
mentionCount: 4,
|
|
304
|
+
},
|
|
305
|
+
])
|
|
306
|
+
.run();
|
|
307
|
+
|
|
308
|
+
db.insert(memoryEntityRelations)
|
|
309
|
+
.values({
|
|
310
|
+
id: "rel-apollo-hermes",
|
|
311
|
+
sourceEntityId: "entity-apollo",
|
|
312
|
+
targetEntityId: "entity-hermes",
|
|
313
|
+
relation: "uses",
|
|
314
|
+
evidence: "Apollo uses HermesGate for risky changes",
|
|
241
315
|
firstSeenAt: now,
|
|
242
|
-
lastSeenAt: now +
|
|
243
|
-
|
|
244
|
-
|
|
245
|
-
]).run();
|
|
246
|
-
|
|
247
|
-
db.insert(memoryEntityRelations).values({
|
|
248
|
-
id: 'rel-apollo-hermes',
|
|
249
|
-
sourceEntityId: 'entity-apollo',
|
|
250
|
-
targetEntityId: 'entity-hermes',
|
|
251
|
-
relation: 'uses',
|
|
252
|
-
evidence: 'Apollo uses HermesGate for risky changes',
|
|
253
|
-
firstSeenAt: now,
|
|
254
|
-
lastSeenAt: now + 50_000,
|
|
255
|
-
}).run();
|
|
316
|
+
lastSeenAt: now + 50_000,
|
|
317
|
+
})
|
|
318
|
+
.run();
|
|
256
319
|
|
|
257
320
|
insertMemoryItem({
|
|
258
|
-
id:
|
|
259
|
-
kind:
|
|
260
|
-
subject:
|
|
261
|
-
statement:
|
|
321
|
+
id: "item-apollo-direct",
|
|
322
|
+
kind: "preference",
|
|
323
|
+
subject: "apollo rollout policy",
|
|
324
|
+
statement:
|
|
325
|
+
"Apollo rollout policy favors staged canary releases with guarded traffic ramps.",
|
|
262
326
|
confidence: 0.95,
|
|
263
327
|
importance: 0.95,
|
|
264
328
|
firstSeenAt: now + 10_000,
|
|
265
329
|
lastSeenAt: now + 50_000,
|
|
266
330
|
});
|
|
267
|
-
db.insert(memoryItemSources)
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
|
|
275
|
-
|
|
276
|
-
|
|
331
|
+
db.insert(memoryItemSources)
|
|
332
|
+
.values({
|
|
333
|
+
memoryItemId: "item-apollo-direct",
|
|
334
|
+
messageId: "msg-e2e-user-10",
|
|
335
|
+
evidence: "User confirmed policy in sprint review",
|
|
336
|
+
createdAt: now + 10_000,
|
|
337
|
+
})
|
|
338
|
+
.run();
|
|
339
|
+
db.insert(memoryItemEntities)
|
|
340
|
+
.values({
|
|
341
|
+
memoryItemId: "item-apollo-direct",
|
|
342
|
+
entityId: "entity-apollo",
|
|
343
|
+
})
|
|
344
|
+
.run();
|
|
277
345
|
|
|
278
346
|
insertMemoryItem({
|
|
279
|
-
id:
|
|
280
|
-
kind:
|
|
281
|
-
subject:
|
|
282
|
-
statement:
|
|
347
|
+
id: "item-hermes-relation",
|
|
348
|
+
kind: "fact",
|
|
349
|
+
subject: "hermes rollout execution",
|
|
350
|
+
statement:
|
|
351
|
+
"HermesGate rollout guidance: start at 5% traffic and promote only after error budget checks pass.",
|
|
283
352
|
confidence: 0.8,
|
|
284
353
|
importance: 0.6,
|
|
285
354
|
firstSeenAt: now + 12_000,
|
|
286
355
|
lastSeenAt: now + 52_000,
|
|
287
356
|
});
|
|
288
|
-
db.insert(memoryItemSources)
|
|
289
|
-
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
|
|
294
|
-
|
|
295
|
-
|
|
296
|
-
|
|
297
|
-
|
|
357
|
+
db.insert(memoryItemSources)
|
|
358
|
+
.values({
|
|
359
|
+
memoryItemId: "item-hermes-relation",
|
|
360
|
+
messageId: "msg-e2e-user-12",
|
|
361
|
+
evidence: "Rollout playbook notes",
|
|
362
|
+
createdAt: now + 12_000,
|
|
363
|
+
})
|
|
364
|
+
.run();
|
|
365
|
+
db.insert(memoryItemEntities)
|
|
366
|
+
.values({
|
|
367
|
+
memoryItemId: "item-hermes-relation",
|
|
368
|
+
entityId: "entity-hermes",
|
|
369
|
+
})
|
|
370
|
+
.run();
|
|
298
371
|
|
|
299
372
|
insertMemoryItem({
|
|
300
|
-
id:
|
|
301
|
-
kind:
|
|
302
|
-
subject:
|
|
303
|
-
statement:
|
|
373
|
+
id: "item-apollo-stale",
|
|
374
|
+
kind: "event",
|
|
375
|
+
subject: "legacy deploy process",
|
|
376
|
+
statement:
|
|
377
|
+
"Legacy note from years ago: Apollo deployments were manual and unmonitored.",
|
|
304
378
|
confidence: 0.6,
|
|
305
379
|
importance: 0.3,
|
|
306
380
|
firstSeenAt: now - 400 * 24 * 60 * 60 * 1000,
|
|
307
381
|
lastSeenAt: now - 390 * 24 * 60 * 60 * 1000,
|
|
308
382
|
});
|
|
309
|
-
db.insert(memoryItemSources)
|
|
310
|
-
|
|
311
|
-
|
|
312
|
-
|
|
313
|
-
|
|
314
|
-
|
|
315
|
-
|
|
316
|
-
|
|
317
|
-
|
|
318
|
-
|
|
383
|
+
db.insert(memoryItemSources)
|
|
384
|
+
.values({
|
|
385
|
+
memoryItemId: "item-apollo-stale",
|
|
386
|
+
messageId: "msg-e2e-user-2",
|
|
387
|
+
evidence: "Historical note",
|
|
388
|
+
createdAt: now - 390 * 24 * 60 * 60 * 1000,
|
|
389
|
+
})
|
|
390
|
+
.run();
|
|
391
|
+
db.insert(memoryItemEntities)
|
|
392
|
+
.values({
|
|
393
|
+
memoryItemId: "item-apollo-stale",
|
|
394
|
+
entityId: "entity-apollo",
|
|
395
|
+
})
|
|
396
|
+
.run();
|
|
319
397
|
|
|
320
398
|
insertMemoryItem({
|
|
321
|
-
id:
|
|
322
|
-
kind:
|
|
323
|
-
subject:
|
|
324
|
-
statement:
|
|
399
|
+
id: "item-apollo-secret",
|
|
400
|
+
kind: "fact",
|
|
401
|
+
subject: "apollo secret",
|
|
402
|
+
statement: "Current-turn secret: Apollo code is 123XYZ.",
|
|
325
403
|
confidence: 0.99,
|
|
326
404
|
importance: 0.99,
|
|
327
405
|
firstSeenAt: now + 100_000,
|
|
328
406
|
lastSeenAt: now + 100_000,
|
|
329
407
|
});
|
|
330
|
-
db.insert(memoryItemSources)
|
|
331
|
-
|
|
332
|
-
|
|
333
|
-
|
|
334
|
-
|
|
335
|
-
|
|
336
|
-
|
|
337
|
-
|
|
338
|
-
|
|
339
|
-
|
|
408
|
+
db.insert(memoryItemSources)
|
|
409
|
+
.values({
|
|
410
|
+
memoryItemId: "item-apollo-secret",
|
|
411
|
+
messageId: currentMessageId,
|
|
412
|
+
evidence: "Current turn only",
|
|
413
|
+
createdAt: now + 100_000,
|
|
414
|
+
})
|
|
415
|
+
.run();
|
|
416
|
+
db.insert(memoryItemEntities)
|
|
417
|
+
.values({
|
|
418
|
+
memoryItemId: "item-apollo-secret",
|
|
419
|
+
entityId: "entity-apollo",
|
|
420
|
+
})
|
|
421
|
+
.run();
|
|
340
422
|
|
|
341
423
|
const summaryCounter = { calls: 0 };
|
|
342
424
|
const provider = makeSummaryProvider(summaryCounter);
|
|
343
|
-
const systemPrompt =
|
|
425
|
+
const systemPrompt = "System prompt for context + memory e2e";
|
|
344
426
|
const history = makeLongHistory(60, currentUserText);
|
|
345
427
|
const manager = new ContextWindowManager(provider, systemPrompt, {
|
|
346
428
|
...DEFAULT_CONFIG.contextWindow,
|
|
@@ -354,7 +436,9 @@ describe('Context + Memory E2E regression', () => {
|
|
|
354
436
|
const compacted = await manager.maybeCompact(history);
|
|
355
437
|
expect(compacted.compacted).toBe(true);
|
|
356
438
|
expect(compacted.summaryCalls).toBe(summaryCounter.calls);
|
|
357
|
-
expect(compacted.estimatedInputTokens).toBeLessThan(
|
|
439
|
+
expect(compacted.estimatedInputTokens).toBeLessThan(
|
|
440
|
+
compacted.previousEstimatedInputTokens,
|
|
441
|
+
);
|
|
358
442
|
|
|
359
443
|
const recallConfig = {
|
|
360
444
|
...DEFAULT_CONFIG,
|
|
@@ -363,7 +447,7 @@ describe('Context + Memory E2E regression', () => {
|
|
|
363
447
|
...DEFAULT_CONFIG.memory,
|
|
364
448
|
embeddings: {
|
|
365
449
|
...DEFAULT_CONFIG.memory.embeddings,
|
|
366
|
-
provider:
|
|
450
|
+
provider: "openai" as const,
|
|
367
451
|
required: false,
|
|
368
452
|
},
|
|
369
453
|
retrieval: {
|
|
@@ -405,16 +489,24 @@ describe('Context + Memory E2E regression', () => {
|
|
|
405
489
|
const recallBudget = computeRecallBudget({
|
|
406
490
|
estimatedPromptTokens,
|
|
407
491
|
maxInputTokens: recallConfig.contextWindow.maxInputTokens,
|
|
408
|
-
targetHeadroomTokens:
|
|
409
|
-
|
|
410
|
-
|
|
492
|
+
targetHeadroomTokens:
|
|
493
|
+
recallConfig.memory.retrieval.dynamicBudget.targetHeadroomTokens,
|
|
494
|
+
minInjectTokens:
|
|
495
|
+
recallConfig.memory.retrieval.dynamicBudget.minInjectTokens,
|
|
496
|
+
maxInjectTokens:
|
|
497
|
+
recallConfig.memory.retrieval.dynamicBudget.maxInjectTokens,
|
|
411
498
|
});
|
|
412
499
|
|
|
413
500
|
const recallQuery = buildMemoryQuery(currentUserText, compacted.messages);
|
|
414
|
-
const recall = await buildMemoryRecall(
|
|
415
|
-
|
|
416
|
-
|
|
417
|
-
|
|
501
|
+
const recall = await buildMemoryRecall(
|
|
502
|
+
recallQuery,
|
|
503
|
+
conversationId,
|
|
504
|
+
recallConfig,
|
|
505
|
+
{
|
|
506
|
+
excludeMessageIds: [currentMessageId],
|
|
507
|
+
maxInjectTokensOverride: recallBudget,
|
|
508
|
+
},
|
|
509
|
+
);
|
|
418
510
|
|
|
419
511
|
expect(recall.injectedTokens).toBeLessThanOrEqual(recallBudget);
|
|
420
512
|
expect(recall.relationSeedEntityCount).toBeGreaterThan(0);
|
|
@@ -422,12 +514,12 @@ describe('Context + Memory E2E regression', () => {
|
|
|
422
514
|
expect(recall.relationNeighborEntityCount).toBeGreaterThan(0);
|
|
423
515
|
expect(recall.relationExpandedItemCount).toBeGreaterThan(0);
|
|
424
516
|
|
|
425
|
-
expect(recall.injectedText).toContain(
|
|
426
|
-
expect(recall.injectedText).toContain(
|
|
427
|
-
expect(recall.injectedText).not.toContain(
|
|
517
|
+
expect(recall.injectedText).toContain("staged canary releases");
|
|
518
|
+
expect(recall.injectedText).toContain("start at 5% traffic");
|
|
519
|
+
expect(recall.injectedText).not.toContain("123XYZ");
|
|
428
520
|
|
|
429
|
-
const directIndex = recall.injectedText.indexOf(
|
|
430
|
-
const relationIndex = recall.injectedText.indexOf(
|
|
521
|
+
const directIndex = recall.injectedText.indexOf("staged canary releases");
|
|
522
|
+
const relationIndex = recall.injectedText.indexOf("start at 5% traffic");
|
|
431
523
|
expect(directIndex).toBeGreaterThanOrEqual(0);
|
|
432
524
|
expect(relationIndex).toBeGreaterThanOrEqual(0);
|
|
433
525
|
expect(directIndex).toBeLessThan(relationIndex);
|