@vellumai/assistant 0.6.4 → 0.6.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.prettierignore +5 -0
- package/AGENTS.md +9 -1
- package/ARCHITECTURE.md +43 -49
- package/Dockerfile +17 -3
- package/README.md +3 -4
- package/__tests__/permissions/gateway-threshold-reader.test.ts +283 -0
- package/bun.lock +8 -3
- package/docs/architecture/integrations.md +33 -59
- package/docs/architecture/memory.md +25 -30
- package/docs/architecture/security.md +19 -18
- package/docs/browser-use-architecture-phase2.md +63 -20
- package/docs/error-handling.md +111 -0
- package/docs/plugins.md +761 -0
- package/docs/skills.md +10 -10
- package/docs/stt-provider-onboarding.md +2 -1
- package/examples/plugins/echo/README.md +132 -0
- package/examples/plugins/echo/package.json +17 -0
- package/examples/plugins/echo/register.ts +187 -0
- package/knip.json +9 -2
- package/node_modules/@vellumai/ces-contracts/package.json +2 -1
- package/node_modules/@vellumai/ces-contracts/src/__tests__/trust-rules.test.ts +471 -0
- package/node_modules/@vellumai/ces-contracts/src/trust-rules.ts +398 -4
- package/node_modules/@vellumai/credential-storage/bun.lock +2 -2
- package/node_modules/@vellumai/credential-storage/package.json +2 -2
- package/node_modules/@vellumai/credential-storage/src/oauth-runtime.ts +20 -2
- package/node_modules/@vellumai/egress-proxy/bun.lock +2 -2
- package/node_modules/@vellumai/egress-proxy/package.json +2 -2
- package/node_modules/@vellumai/egress-proxy/src/types.ts +19 -0
- package/openapi.yaml +334 -78
- package/package.json +6 -3
- package/scripts/generate-openapi.ts +50 -11
- package/src/__tests__/agent-loop-callsite-precedence.test.ts +318 -0
- package/src/__tests__/agent-loop-sentry-hygiene.test.ts +137 -0
- package/src/__tests__/agent-loop.test.ts +112 -1
- package/src/__tests__/anthropic-error-formatting.test.ts +98 -0
- package/src/__tests__/anthropic-provider.test.ts +171 -2
- package/src/__tests__/app-compiler.test.ts +57 -0
- package/src/__tests__/approval-cascade.test.ts +36 -10
- package/src/__tests__/approval-routes-http.test.ts +134 -10
- package/src/__tests__/assistant-attachments.test.ts +44 -0
- package/src/__tests__/assistant-feature-flags-integration.test.ts +29 -0
- package/src/__tests__/auto-analysis-end-to-end.test.ts +1 -0
- package/src/__tests__/avatar-generator.test.ts +4 -2
- package/src/__tests__/browser-fill-credential.test.ts +1 -1
- package/src/__tests__/browser-identifier-parity-guard.test.ts +53 -0
- package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +23 -33
- package/src/__tests__/browser-skill-endstate.test.ts +51 -182
- package/src/__tests__/btw-routes.test.ts +47 -1
- package/src/__tests__/bundled-asset.test.ts +6 -6
- package/src/__tests__/call-controller.test.ts +1 -2
- package/src/__tests__/call-site-routing-provider.test.ts +214 -0
- package/src/__tests__/catalog-cache.test.ts +96 -4
- package/src/__tests__/channel-approval-routes.test.ts +4 -4
- package/src/__tests__/channel-reply-delivery.test.ts +300 -2
- package/src/__tests__/checker.test.ts +870 -655
- package/src/__tests__/circuit-breaker-pipeline.test.ts +406 -0
- package/src/__tests__/cli-command-risk-guard.test.ts +30 -33
- package/src/__tests__/compaction-events.test.ts +501 -0
- package/src/__tests__/compaction-pipeline.test.ts +210 -0
- package/src/__tests__/compaction-strip-metadata-clear.test.ts +181 -0
- package/src/__tests__/compaction-timeout-recovery.test.ts +262 -0
- package/src/__tests__/compaction.benchmark.test.ts +1 -1
- package/src/__tests__/config-analysis.test.ts +11 -28
- package/src/__tests__/config-loader-backfill.test.ts +174 -0
- package/src/__tests__/config-loader-corrupt.test.ts +183 -0
- package/src/__tests__/config-loader-quarantine-bulletin.test.ts +202 -0
- package/src/__tests__/config-model-image-provider.test.ts +110 -0
- package/src/__tests__/config-schema-cmd.test.ts +11 -5
- package/src/__tests__/config-schema.test.ts +440 -114
- package/src/__tests__/config-watcher-cleanup-throttle.test.ts +0 -4
- package/src/__tests__/config-watcher.test.ts +2 -2
- package/src/__tests__/contact-store-user-file.test.ts +72 -73
- package/src/__tests__/contacts-tools.test.ts +26 -0
- package/src/__tests__/contacts-write.test.ts +4 -4
- package/src/__tests__/context-overflow-policy.test.ts +7 -7
- package/src/__tests__/context-token-estimator.test.ts +191 -1
- package/src/__tests__/context-window-manager.test.ts +883 -4
- package/src/__tests__/conversation-abort-tool-results.test.ts +32 -15
- package/src/__tests__/conversation-agent-loop-overflow.test.ts +86 -46
- package/src/__tests__/conversation-agent-loop.test.ts +435 -216
- package/src/__tests__/conversation-attachments.test.ts +1 -1
- package/src/__tests__/conversation-confirmation-signals.test.ts +36 -10
- package/src/__tests__/conversation-error.test.ts +37 -6
- package/src/__tests__/conversation-history-web-search.test.ts +7 -0
- package/src/__tests__/conversation-init.benchmark.test.ts +34 -12
- package/src/__tests__/conversation-lifecycle.test.ts +336 -0
- package/src/__tests__/conversation-load-history-repair.test.ts +27 -10
- package/src/__tests__/conversation-pairing.test.ts +174 -10
- package/src/__tests__/conversation-pre-run-repair.test.ts +32 -15
- package/src/__tests__/conversation-process-callsite.test.ts +309 -0
- package/src/__tests__/conversation-provider-retry-repair.test.ts +44 -21
- package/src/__tests__/conversation-queue.test.ts +68 -38
- package/src/__tests__/conversation-routes-disk-view.test.ts +36 -7
- package/src/__tests__/conversation-routes-slash-commands.test.ts +31 -3
- package/src/__tests__/conversation-runtime-assembly.test.ts +2877 -152
- package/src/__tests__/conversation-runtime-workspace.test.ts +35 -50
- package/src/__tests__/conversation-seed-composer.test.ts +2 -2
- package/src/__tests__/conversation-skill-tools.test.ts +12 -146
- package/src/__tests__/conversation-slash-queue.test.ts +39 -19
- package/src/__tests__/conversation-slash-unknown.test.ts +53 -16
- package/src/__tests__/conversation-speed-override.test.ts +36 -12
- package/src/__tests__/conversation-surfaces-standalone-payloads.test.ts +1035 -0
- package/src/__tests__/conversation-surfaces-standalone.test.ts +630 -0
- package/src/__tests__/conversation-title-service.test.ts +118 -2
- package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +41 -2
- package/src/__tests__/conversation-tool-setup-batch-authorized.test.ts +1 -1
- package/src/__tests__/conversation-unread-route.test.ts +2 -2
- package/src/__tests__/conversation-usage.test.ts +4 -2
- package/src/__tests__/conversation-workspace-cache-state.test.ts +33 -9
- package/src/__tests__/conversation-workspace-injection.test.ts +46 -15
- package/src/__tests__/conversation-workspace-tool-tracking.test.ts +46 -15
- package/src/__tests__/credential-broker-browser-fill.test.ts +110 -0
- package/src/__tests__/credential-health-service.test.ts +78 -9
- package/src/__tests__/credential-security-invariants.test.ts +5 -2
- package/src/__tests__/credential-storage-oauth-compat.test.ts +18 -0
- package/src/__tests__/credential-storage-static-compat.test.ts +28 -0
- package/src/__tests__/credential-vault-unit.test.ts +135 -19
- package/src/__tests__/credentials-cli.test.ts +1 -9
- package/src/__tests__/cross-provider-web-search.test.ts +84 -0
- package/src/__tests__/daemon-server-persist-and-process-callsite.test.ts +92 -0
- package/src/__tests__/db-schedule-syntax-migration.test.ts +1 -0
- package/src/__tests__/delete-propagation.test.ts +437 -0
- package/src/__tests__/dm-backfill.test.ts +417 -0
- package/src/__tests__/dm-persistence.test.ts +227 -0
- package/src/__tests__/edit-propagation.test.ts +280 -0
- package/src/__tests__/empty-response-pipeline.test.ts +305 -0
- package/src/__tests__/ephemeral-permissions.test.ts +93 -3
- package/src/__tests__/estimator-calibration-integration.test.ts +208 -0
- package/src/__tests__/estimator-calibration.test.ts +213 -0
- package/src/__tests__/extension-id-sync-guard.test.ts +29 -10
- package/src/__tests__/file-write-tool.test.ts +151 -1
- package/src/__tests__/filing-service.test.ts +255 -0
- package/src/__tests__/first-greeting.test.ts +247 -5
- package/src/__tests__/gemini-provider.test.ts +0 -3
- package/src/__tests__/guardian-grant-minting.test.ts +8 -0
- package/src/__tests__/headless-browser-interactions.test.ts +1 -1
- package/src/__tests__/headless-browser-mode.test.ts +57 -0
- package/src/__tests__/heartbeat-service.test.ts +96 -15
- package/src/__tests__/history-repair-pipeline.test.ts +399 -0
- package/src/__tests__/host-browser-e2e-cloud.test.ts +307 -0
- package/src/__tests__/host-browser-e2e-self-hosted.test.ts +3 -3
- package/src/__tests__/host-proxy-interface.test.ts +36 -2
- package/src/__tests__/host-shell-tool.test.ts +124 -18
- package/src/__tests__/http-user-message-parity.test.ts +29 -1
- package/src/__tests__/image-credentials.test.ts +137 -0
- package/src/__tests__/image-service-dispatcher.test.ts +186 -0
- package/src/__tests__/inbound-slack-persistence.test.ts +340 -0
- package/src/__tests__/injector-chain.test.ts +526 -0
- package/src/__tests__/intent-routing.test.ts +1 -66
- package/src/__tests__/llm-call-pipeline.test.ts +285 -0
- package/src/__tests__/llm-catalog-parity.test.ts +174 -0
- package/src/__tests__/llm-context-normalization.test.ts +121 -0
- package/src/__tests__/llm-resolver.test.ts +214 -0
- package/src/__tests__/llm-schema.test.ts +223 -0
- package/src/__tests__/managed-proxy-context.test.ts +6 -2
- package/src/__tests__/media-generate-image.test.ts +119 -13
- package/src/__tests__/memory-retrieval-pipeline.test.ts +401 -0
- package/src/__tests__/memory-upsert-concurrency.test.ts +1 -0
- package/src/__tests__/messaging-skill-split.test.ts +3 -34
- package/src/__tests__/migration-import-from-url.test.ts +621 -0
- package/src/__tests__/model-intents.test.ts +11 -83
- package/src/__tests__/notification-broadcaster.test.ts +3 -3
- package/src/__tests__/notification-decision-fallback.test.ts +0 -10
- package/src/__tests__/notification-decision-identity.test.ts +0 -9
- package/src/__tests__/notification-decision-recipient-context.test.ts +0 -9
- package/src/__tests__/notification-decision-strategy.test.ts +0 -11
- package/src/__tests__/notification-schedule-notify-dedup.test.ts +108 -0
- package/src/__tests__/oauth-apps-routes.test.ts +1 -1
- package/src/__tests__/oauth-cli.test.ts +14 -12
- package/src/__tests__/oauth-connect-orchestrator.test.ts +4 -13
- package/src/__tests__/oauth-provider-serializer.test.ts +6 -4
- package/src/__tests__/oauth-provider-visibility.test.ts +3 -5
- package/src/__tests__/oauth-providers-routes.test.ts +3 -2
- package/src/__tests__/oauth-store.test.ts +46 -78
- package/src/__tests__/oauth2-gateway-transport.test.ts +8 -3
- package/src/__tests__/oauth2-refresh-retry.test.ts +279 -0
- package/src/__tests__/onboarding-template-contract.test.ts +16 -64
- package/src/__tests__/openai-image-service.test.ts +368 -0
- package/src/__tests__/openai-provider.test.ts +7 -0
- package/src/__tests__/openai-responses-provider.test.ts +396 -0
- package/src/__tests__/openrouter-provider-only.test.ts +135 -0
- package/src/__tests__/outbound-slack-persistence.test.ts +293 -0
- package/src/__tests__/overflow-reduce-pipeline.test.ts +676 -0
- package/src/__tests__/permission-checker-host-gate.test.ts +1 -25
- package/src/__tests__/permission-mode.test.ts +16 -0
- package/src/__tests__/permission-types.test.ts +0 -1
- package/src/__tests__/persist-onboarding-artifacts.test.ts +266 -0
- package/src/__tests__/persistence-pipeline.test.ts +377 -0
- package/src/__tests__/persona-resolver.test.ts +13 -13
- package/src/__tests__/pipeline-runner.test.ts +565 -0
- package/src/__tests__/pkb-autoinject.test.ts +37 -1
- package/src/__tests__/platform-bash-auto-approve.test.ts +1 -1
- package/src/__tests__/platform.test.ts +5 -2
- package/src/__tests__/plugin-bootstrap.test.ts +483 -0
- package/src/__tests__/plugin-registry.test.ts +273 -0
- package/src/__tests__/plugin-route-contribution.test.ts +288 -0
- package/src/__tests__/plugin-skill-contribution.test.ts +367 -0
- package/src/__tests__/plugin-tool-contribution.test.ts +286 -0
- package/src/__tests__/plugin-types.test.ts +320 -0
- package/src/__tests__/pricing.test.ts +93 -14
- package/src/__tests__/profiler-routes.test.ts +1 -1
- package/src/__tests__/provider-commit-message-generator.test.ts +14 -84
- package/src/__tests__/provider-env-vars-scope.test.ts +52 -0
- package/src/__tests__/provider-error-scenarios.test.ts +135 -6
- package/src/__tests__/provider-managed-proxy-integration.test.ts +42 -11
- package/src/__tests__/provider-registry-ollama.test.ts +1 -2
- package/src/__tests__/proxy-approval-callback.test.ts +69 -9
- package/src/__tests__/reaction-persistence.test.ts +561 -0
- package/src/__tests__/regenerate-fire-and-forget-trace.test.ts +1 -0
- package/src/__tests__/registry.test.ts +0 -2
- package/src/__tests__/relay-server.test.ts +1 -1
- package/src/__tests__/require-fresh-approval.test.ts +1 -1
- package/src/__tests__/retry-openrouter-only-normalization.test.ts +136 -0
- package/src/__tests__/retry-thinking-tool-choice.test.ts +226 -0
- package/src/__tests__/risk-classifier-parity.test.ts +230 -0
- package/src/__tests__/sanitize-config-for-transfer.test.ts +78 -1
- package/src/__tests__/schedule-routes.test.ts +131 -1
- package/src/__tests__/scheduler-recurrence.test.ts +14 -70
- package/src/__tests__/scheduler-reuse-conversation.test.ts +10 -50
- package/src/__tests__/secret-detection-handler.test.ts +0 -10
- package/src/__tests__/secret-ingress-http.test.ts +28 -0
- package/src/__tests__/secret-prompter-channel-fallback.test.ts +125 -0
- package/src/__tests__/secret-routes-managed-proxy.test.ts +2 -3
- package/src/__tests__/secret-scanner-executor.test.ts +1 -1
- package/src/__tests__/send-endpoint-busy.test.ts +29 -1
- package/src/__tests__/server-history-render.test.ts +31 -0
- package/src/__tests__/shell-identity.test.ts +0 -134
- package/src/__tests__/shell-parser-property.test.ts +13 -13
- package/src/__tests__/skill-cache-store.test.ts +182 -0
- package/src/__tests__/skills.test.ts +19 -33
- package/src/__tests__/slack-app-setup-skill-regression.test.ts +3 -1
- package/src/__tests__/slack-skill.test.ts +3 -8
- package/src/__tests__/starter-bundle.test.ts +35 -0
- package/src/__tests__/subagent-call-site-routing.test.ts +280 -0
- package/src/__tests__/suggestion-routes.test.ts +259 -3
- package/src/__tests__/system-prompt.test.ts +22 -35
- package/src/__tests__/task-memory-cleanup.test.ts +1 -0
- package/src/__tests__/task-runner.test.ts +3 -1
- package/src/__tests__/task-scheduler.test.ts +3 -15
- package/src/__tests__/tcc-sandbox-deny.test.ts +198 -0
- package/src/__tests__/terminal-tools.test.ts +8 -0
- package/src/__tests__/test-preload.ts +11 -0
- package/src/__tests__/test-support/browser-skill-harness.ts +2 -52
- package/src/__tests__/thread-backfill.test.ts +941 -0
- package/src/__tests__/title-generate-pipeline.test.ts +224 -0
- package/src/__tests__/token-estimate-pipeline.test.ts +431 -0
- package/src/__tests__/tool-error-pipeline.test.ts +244 -0
- package/src/__tests__/tool-execute-pipeline.test.ts +431 -0
- package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -8
- package/src/__tests__/tool-executor-lifecycle-events.test.ts +2 -2
- package/src/__tests__/tool-executor-shell-integration.test.ts +7 -10
- package/src/__tests__/tool-executor.test.ts +201 -94
- package/src/__tests__/tool-result-truncate-pipeline.test.ts +356 -0
- package/src/__tests__/tool-result-truncation.test.ts +0 -110
- package/src/__tests__/trust-store.test.ts +442 -109
- package/src/__tests__/update-bulletin-job.test.ts +389 -0
- package/src/__tests__/usage-cache-backfill-migration.test.ts +3 -1
- package/src/__tests__/user-plugin-loader.test.ts +191 -0
- package/src/__tests__/verification-control-plane-policy.test.ts +1 -22
- package/src/__tests__/voice-session-bridge.test.ts +39 -0
- package/src/__tests__/volume-security-guard.test.ts +3 -2
- package/src/__tests__/web-search-history.test.ts +337 -0
- package/src/__tests__/workspace-migration-039-drop-legacy-llm-keys.test.ts +343 -0
- package/src/__tests__/workspace-migration-043-release-notes-latex-rendering.test.ts +202 -0
- package/src/__tests__/workspace-migration-045-release-notes-meet-avatar.test.ts +210 -0
- package/src/__tests__/workspace-migration-046-seed-conversation-starters-callsite.test.ts +185 -0
- package/src/__tests__/workspace-migration-049-release-notes-default-sonnet.test.ts +100 -0
- package/src/__tests__/workspace-migration-050-seed-main-agent-opus-callsite.test.ts +171 -0
- package/src/__tests__/workspace-migration-051-seed-conversation-summarization-callsite.test.ts +252 -0
- package/src/__tests__/workspace-migration-drop-user-md.test.ts +11 -11
- package/src/__tests__/workspace-migration-remove-hooks.test.ts +99 -0
- package/src/__tests__/workspace-migration-unify-llm-callsite-configs.test.ts +841 -0
- package/src/__tests__/workspace-policy.test.ts +22 -16
- package/src/acp/client-handler.ts +1 -2
- package/src/agent/loop.ts +545 -115
- package/src/approvals/__tests__/guardian-feed-event.test.ts +304 -0
- package/src/approvals/guardian-request-resolvers.ts +80 -0
- package/src/avatar/resvg-lazy.test.ts +136 -0
- package/src/avatar/resvg-lazy.ts +82 -9
- package/src/avatar/traits-png-sync.ts +21 -1
- package/src/backup/__tests__/backup-worker.test.ts +2 -13
- package/src/backup/backup-worker.ts +3 -15
- package/src/browser/__tests__/operations.test.ts +163 -0
- package/src/browser/identifiers.ts +51 -0
- package/src/browser/operations.ts +660 -0
- package/src/browser/types.ts +81 -0
- package/src/bundler/app-compiler.ts +84 -1
- package/src/calls/call-state.ts +2 -2
- package/src/calls/guardian-question-copy.ts +2 -2
- package/src/calls/telephony-stt-routing.ts +1 -1
- package/src/calls/voice-session-bridge.ts +1 -0
- package/src/channels/__tests__/types.test.ts +3 -3
- package/src/channels/types.ts +6 -4
- package/src/cli/AGENTS.md +1 -1
- package/src/cli/__tests__/notifications.test.ts +87 -211
- package/src/cli/commands/__tests__/attachment.test.ts +438 -0
- package/src/cli/commands/__tests__/backup.test.ts +1 -1
- package/src/cli/commands/__tests__/browser.test.ts +554 -0
- package/src/cli/commands/__tests__/cache.test.ts +623 -0
- package/src/cli/commands/__tests__/email-list.test.ts +6 -0
- package/src/cli/commands/__tests__/email-send.test.ts +93 -1
- package/src/cli/commands/__tests__/image-generation.test.ts +886 -0
- package/src/cli/commands/__tests__/inference-send.test.ts +463 -0
- package/src/cli/commands/__tests__/stt-transcribe.test.ts +454 -0
- package/src/cli/commands/__tests__/task.test.ts +913 -0
- package/src/cli/commands/__tests__/tts-synthesize.test.ts +606 -0
- package/src/cli/commands/__tests__/ui-confirm.test.ts +650 -0
- package/src/cli/commands/__tests__/ui.test.ts +1215 -0
- package/src/cli/commands/__tests__/watchers.test.ts +716 -0
- package/src/cli/commands/attachment.ts +182 -0
- package/src/cli/commands/backup.ts +2 -2
- package/src/cli/commands/browser.ts +350 -0
- package/src/cli/commands/cache.ts +341 -0
- package/src/cli/commands/clients.ts +138 -0
- package/src/cli/commands/completions.ts +2 -12
- package/src/cli/commands/config.ts +6 -6
- package/src/cli/commands/conversations-import.ts +347 -0
- package/src/cli/commands/conversations.ts +69 -8
- package/src/cli/commands/email.ts +234 -194
- package/src/cli/commands/image-generation.ts +299 -0
- package/src/cli/commands/inference.ts +200 -0
- package/src/cli/commands/memory.ts +127 -17
- package/src/cli/commands/notifications.ts +68 -103
- package/src/cli/commands/oauth/__tests__/providers-register.test.ts +1 -1
- package/src/cli/commands/oauth/__tests__/providers-update.test.ts +1 -1
- package/src/cli/commands/oauth/connect.ts +2 -2
- package/src/cli/commands/oauth/providers.ts +176 -8
- package/src/cli/commands/oauth/status.ts +46 -36
- package/src/cli/commands/platform/__tests__/callback-routes-list.test.ts +0 -1
- package/src/cli/commands/platform/__tests__/connect.test.ts +0 -1
- package/src/cli/commands/platform/__tests__/disconnect.test.ts +0 -1
- package/src/cli/commands/platform/__tests__/status.test.ts +0 -1
- package/src/cli/commands/skills.ts +3 -4
- package/src/cli/commands/stt.ts +339 -0
- package/src/cli/commands/task.ts +795 -0
- package/src/cli/commands/trust.ts +50 -19
- package/src/cli/commands/tts.ts +273 -0
- package/src/cli/commands/ui.ts +670 -0
- package/src/cli/commands/watchers.ts +509 -0
- package/src/cli/lib/daemon-credential-client.ts +0 -19
- package/src/cli/program.ts +39 -24
- package/src/cli.ts +0 -37
- package/src/config/__tests__/backup-schema.test.ts +7 -2
- package/src/config/bundled-skills/app-builder/SKILL.md +2 -2
- package/src/config/bundled-skills/app-builder/references/WIDGETS.md +10 -10
- package/src/config/bundled-skills/contacts/tools/contact-merge.ts +66 -87
- package/src/config/bundled-skills/contacts/tools/contact-search.ts +28 -51
- package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +22 -40
- package/src/config/bundled-skills/image-studio/SKILL.md +2 -1
- package/src/config/bundled-skills/image-studio/TOOLS.json +2 -1
- package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +23 -39
- package/src/config/bundled-skills/media-processing/services/reduce.ts +1 -1
- package/src/config/bundled-skills/messaging/SKILL.md +5 -5
- package/src/config/bundled-skills/messaging/TOOLS.json +4 -0
- package/src/config/bundled-skills/messaging/tools/__tests__/messaging-feed-events.test.ts +207 -0
- package/src/config/bundled-skills/messaging/tools/messaging-archive-by-sender.ts +20 -1
- package/src/config/bundled-skills/messaging/tools/messaging-read.ts +15 -1
- package/src/config/bundled-skills/messaging/tools/messaging-search.ts +21 -1
- package/src/config/bundled-skills/messaging/tools/messaging-send.ts +69 -12
- package/src/config/bundled-skills/phone-calls/references/CONFIG.md +9 -8
- package/src/config/bundled-skills/schedule/SKILL.md +8 -3
- package/src/config/bundled-skills/schedule/TOOLS.json +15 -7
- package/src/config/bundled-skills/schedule/references/SCRIPT_MODE_PATTERNS.md +59 -0
- package/src/config/bundled-skills/settings/TOOLS.json +3 -3
- package/src/config/bundled-tool-registry.ts +0 -190
- package/src/config/env.ts +7 -2
- package/src/config/feature-flag-registry.json +42 -10
- package/src/config/llm-resolver.ts +128 -0
- package/src/config/loader.ts +194 -10
- package/src/config/raw-config-utils.ts +30 -2
- package/src/config/sanitize-for-transfer.ts +35 -0
- package/src/config/schema.ts +49 -41
- package/src/config/schemas/analysis.ts +3 -22
- package/src/config/schemas/backup.ts +1 -1
- package/src/config/schemas/calls.ts +0 -4
- package/src/config/schemas/conversations.ts +16 -0
- package/src/config/schemas/filing.ts +2 -7
- package/src/config/schemas/heartbeat.ts +0 -5
- package/src/config/schemas/inference.ts +3 -23
- package/src/config/schemas/llm.ts +317 -0
- package/src/config/schemas/memory-processing.ts +1 -9
- package/src/config/schemas/notifications.ts +4 -11
- package/src/config/schemas/platform.ts +3 -9
- package/src/config/schemas/security.ts +33 -0
- package/src/config/schemas/services.ts +9 -4
- package/src/config/schemas/stt.ts +1 -0
- package/src/config/schemas/tts.ts +64 -0
- package/src/config/schemas/updates.ts +1 -1
- package/src/config/schemas/workspace-git.ts +3 -40
- package/src/config/skill-state.ts +6 -2
- package/src/config/skills.ts +96 -7
- package/src/context/__tests__/compact-prompt.test.ts +63 -0
- package/src/context/__tests__/microcompact.test.ts +805 -0
- package/src/context/estimator-calibration.ts +136 -0
- package/src/context/microcompact.ts +443 -0
- package/src/context/prompts/compact.md +26 -0
- package/src/context/token-estimator.ts +61 -3
- package/src/context/tool-result-truncation.ts +3 -63
- package/src/context/window-manager.ts +417 -39
- package/src/credential-execution/approval-bridge.ts +0 -1
- package/src/credential-execution/executable-discovery.ts +19 -8
- package/src/credential-execution/process-manager.test.ts +109 -0
- package/src/credential-execution/process-manager.ts +65 -2
- package/src/credential-health/credential-health-service.ts +19 -6
- package/src/daemon/__tests__/conversation-feed-event.test.ts +317 -0
- package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +4 -12
- package/src/daemon/__tests__/conversation-tool-setup.test.ts +14 -15
- package/src/daemon/approval-generators.ts +29 -4
- package/src/daemon/assistant-attachments.ts +24 -13
- package/src/daemon/classifier.ts +2 -2
- package/src/daemon/config-watcher.ts +0 -3
- package/src/daemon/context-overflow-policy.ts +4 -13
- package/src/daemon/context-overflow-reducer.ts +4 -1
- package/src/daemon/conversation-agent-loop-handlers.ts +162 -34
- package/src/daemon/conversation-agent-loop.ts +1282 -599
- package/src/daemon/conversation-attachments.ts +2 -6
- package/src/daemon/conversation-error.ts +36 -1
- package/src/daemon/conversation-history.ts +10 -19
- package/src/daemon/conversation-lifecycle.ts +59 -17
- package/src/daemon/conversation-messaging.ts +73 -4
- package/src/daemon/conversation-notifiers.ts +2 -110
- package/src/daemon/conversation-process.ts +24 -11
- package/src/daemon/conversation-queue-manager.ts +3 -0
- package/src/daemon/conversation-runtime-assembly.ts +1063 -211
- package/src/daemon/conversation-slash.ts +2 -2
- package/src/daemon/conversation-surfaces.ts +389 -1
- package/src/daemon/conversation-tool-setup.ts +51 -9
- package/src/daemon/conversation-usage.ts +1 -1
- package/src/daemon/conversation.ts +197 -64
- package/src/daemon/external-plugins-bootstrap.ts +478 -0
- package/src/daemon/external-skills-bootstrap.ts +41 -0
- package/src/daemon/first-greeting.ts +191 -14
- package/src/daemon/guardian-action-generators.ts +34 -14
- package/src/daemon/handlers/config-model.test.ts +86 -0
- package/src/daemon/handlers/config-model.ts +65 -12
- package/src/daemon/handlers/conversations.ts +9 -2
- package/src/daemon/handlers/shared.ts +39 -11
- package/src/daemon/handlers/skills.ts +7 -3
- package/src/daemon/handlers/slack-channel-oauth-install.ts +197 -0
- package/src/daemon/lifecycle.ts +109 -82
- package/src/daemon/message-types/computer-use.ts +2 -34
- package/src/daemon/message-types/conversations.ts +63 -0
- package/src/daemon/message-types/messages.ts +21 -1
- package/src/daemon/message-types/trust.ts +0 -2
- package/src/daemon/parse-actual-tokens-from-error.test.ts +57 -1
- package/src/daemon/parse-actual-tokens-from-error.ts +66 -0
- package/src/daemon/pkb-context-tracker.test.ts +169 -0
- package/src/daemon/pkb-context-tracker.ts +125 -0
- package/src/daemon/pkb-reminder-builder.test.ts +70 -0
- package/src/daemon/pkb-reminder-builder.ts +31 -0
- package/src/daemon/providers-setup.ts +6 -0
- package/src/daemon/server.ts +122 -12
- package/src/daemon/shutdown-handlers.ts +2 -12
- package/src/daemon/tool-side-effects.ts +14 -65
- package/src/daemon/web-search-history.ts +126 -0
- package/src/events/domain-events.ts +0 -1
- package/src/filing/filing-service.ts +9 -10
- package/src/heartbeat/__tests__/heartbeat-feed-event.test.ts +160 -0
- package/src/heartbeat/heartbeat-service.ts +99 -28
- package/src/home/__tests__/feed-population-integration.test.ts +312 -0
- package/src/home/__tests__/feed-scheduler.test.ts +39 -11
- package/src/home/__tests__/rollup-producer.test.ts +44 -0
- package/src/home/assistant-feed-authoring.ts +4 -0
- package/src/home/emit-feed-event.ts +11 -0
- package/src/home/feed-scheduler.ts +20 -4
- package/src/home/feed-types.ts +97 -4
- package/src/home/relationship-state-writer.ts +2 -2
- package/src/home/rewrite-command-preview.ts +66 -0
- package/src/home/rollup-producer.ts +34 -5
- package/src/home/suggested-prompts.ts +101 -0
- package/src/ipc/__tests__/attachment-ipc.test.ts +213 -0
- package/src/ipc/__tests__/browser-ipc.test.ts +339 -0
- package/src/ipc/__tests__/cache-ipc.test.ts +266 -0
- package/src/ipc/__tests__/socket-path.test.ts +34 -0
- package/src/ipc/__tests__/task-ipc.test.ts +577 -0
- package/src/ipc/__tests__/ui-request-route.test.ts +495 -0
- package/src/ipc/__tests__/watcher-ipc.test.ts +295 -0
- package/src/ipc/cli-client.ts +2 -1
- package/src/ipc/cli-server.ts +26 -8
- package/src/ipc/gateway-client.ts +6 -3
- package/src/ipc/routes/attachment.ts +114 -0
- package/src/ipc/routes/browser-context.ts +63 -0
- package/src/ipc/routes/browser.ts +97 -0
- package/src/ipc/routes/cache.ts +96 -0
- package/src/ipc/routes/get-contact.ts +16 -0
- package/src/ipc/routes/index.ts +31 -1
- package/src/ipc/routes/list-clients.ts +31 -0
- package/src/ipc/routes/merge-contacts.ts +17 -0
- package/src/ipc/routes/notification.ts +133 -0
- package/src/ipc/routes/rename-conversation.ts +59 -0
- package/src/ipc/routes/search-contacts.ts +19 -0
- package/src/ipc/routes/task-queue.ts +226 -0
- package/src/ipc/routes/task.ts +173 -0
- package/src/ipc/routes/ui-request.ts +50 -0
- package/src/ipc/routes/upsert-contact.ts +25 -0
- package/src/ipc/routes/watcher.ts +203 -0
- package/src/ipc/socket-path.ts +76 -0
- package/src/media/app-icon-generator.ts +23 -46
- package/src/media/avatar-router.ts +26 -41
- package/src/media/gemini-image-service.ts +8 -41
- package/src/media/image-credentials.ts +73 -0
- package/src/media/image-service.ts +85 -0
- package/src/media/openai-image-service.ts +131 -0
- package/src/media/types.ts +46 -0
- package/src/memory/__tests__/conversation-analyze-job.test.ts +9 -8
- package/src/memory/__tests__/conversation-group-migration.test.ts +99 -0
- package/src/memory/admin.ts +18 -0
- package/src/memory/conversation-analyze-job.ts +14 -13
- package/src/memory/conversation-attention-store.ts +13 -6
- package/src/memory/conversation-crud.ts +133 -3
- package/src/memory/conversation-group-migration.ts +38 -6
- package/src/memory/conversation-queries.ts +57 -4
- package/src/memory/conversation-title-service.ts +32 -4
- package/src/memory/db-init.ts +10 -0
- package/src/memory/embedding-backend.ts +1 -1
- package/src/memory/embedding-gemini.test.ts +41 -2
- package/src/memory/embedding-gemini.ts +6 -1
- package/src/memory/graph/bootstrap.test.ts +282 -0
- package/src/memory/graph/bootstrap.ts +8 -5
- package/src/memory/graph/compaction.ts +299 -0
- package/src/memory/graph/consolidation.ts +4 -4
- package/src/memory/graph/conversation-graph-memory.ts +89 -29
- package/src/memory/graph/extraction.test.ts +272 -2
- package/src/memory/graph/extraction.ts +183 -53
- package/src/memory/graph/graph-search.test.ts +93 -0
- package/src/memory/graph/graph-search.ts +4 -1
- package/src/memory/graph/inspect.ts +2 -2
- package/src/memory/graph/narrative.ts +2 -2
- package/src/memory/graph/pattern-scan.ts +2 -2
- package/src/memory/graph/retriever.test.ts +459 -0
- package/src/memory/graph/retriever.ts +237 -48
- package/src/memory/graph/store.ts +41 -0
- package/src/memory/graph/tool-handlers.ts +27 -0
- package/src/memory/graph/tools.ts +6 -1
- package/src/memory/indexer.ts +5 -5
- package/src/memory/job-handlers/conversation-starters.ts +23 -20
- package/src/memory/job-handlers/summarization.ts +2 -2
- package/src/memory/job-utils.ts +7 -1
- package/src/memory/jobs/embed-pkb-file.test.ts +168 -0
- package/src/memory/jobs/embed-pkb-file.ts +54 -0
- package/src/memory/jobs-store.ts +44 -3
- package/src/memory/jobs-worker.ts +4 -0
- package/src/memory/migrations/041-approval-prompt-ts-tracker.ts +26 -0
- package/src/memory/migrations/140-backfill-usage-cache-accounting.ts +1 -1
- package/src/memory/migrations/149-oauth-tables.ts +1 -0
- package/src/memory/migrations/220-normalize-user-file-by-principal.ts +2 -2
- package/src/memory/migrations/222-strip-placeholder-sentinels-from-messages.ts +82 -0
- package/src/memory/migrations/223-schedule-script-column.ts +11 -0
- package/src/memory/migrations/224-oauth-providers-managed-service-is-paid.ts +24 -0
- package/src/memory/migrations/225-oauth-providers-available-scopes.ts +13 -0
- package/src/memory/migrations/index.ts +5 -0
- package/src/memory/pkb/pkb-index.test.ts +369 -0
- package/src/memory/pkb/pkb-index.ts +255 -0
- package/src/memory/pkb/pkb-reconcile.test.ts +252 -0
- package/src/memory/pkb/pkb-reconcile.ts +148 -0
- package/src/memory/pkb/pkb-search.test.ts +499 -0
- package/src/memory/pkb/pkb-search.ts +159 -0
- package/src/memory/pkb/types.ts +53 -0
- package/src/memory/qdrant-client.test.ts +60 -0
- package/src/memory/qdrant-client.ts +147 -1
- package/src/memory/schema/infrastructure.ts +1 -0
- package/src/memory/schema/oauth.ts +4 -1
- package/src/memory/slack-thread-store.ts +37 -0
- package/src/messaging/providers/gmail/adapter.ts +6 -16
- package/src/messaging/providers/gmail/client.ts +22 -0
- package/src/messaging/providers/gmail/types.ts +7 -0
- package/src/messaging/providers/slack/adapter.ts +14 -2
- package/src/messaging/providers/slack/backfill.test.ts +257 -0
- package/src/messaging/providers/slack/backfill.ts +101 -0
- package/src/messaging/providers/slack/message-metadata.test.ts +316 -0
- package/src/messaging/providers/slack/message-metadata.ts +123 -0
- package/src/messaging/providers/slack/render-transcript.test.ts +1421 -0
- package/src/messaging/providers/slack/render-transcript.ts +501 -0
- package/src/messaging/style-analyzer.ts +5 -2
- package/src/notifications/README.md +9 -5
- package/src/notifications/conversation-pairing.ts +78 -19
- package/src/notifications/copy-composer.ts +0 -5
- package/src/notifications/decision-engine.ts +3 -9
- package/src/notifications/emit-signal.ts +1 -1
- package/src/notifications/preference-extractor.ts +2 -6
- package/src/notifications/signal.ts +1 -2
- package/src/oauth/AGENTS.md +1 -1
- package/src/oauth/__tests__/identity-verifier.test.ts +2 -1
- package/src/oauth/connect-orchestrator.ts +8 -34
- package/src/oauth/connect-types.ts +6 -10
- package/src/oauth/manual-token-connection.ts +23 -0
- package/src/oauth/oauth-store.ts +31 -14
- package/src/oauth/platform-connection.test.ts +47 -0
- package/src/oauth/platform-connection.ts +15 -5
- package/src/oauth/provider-serializer.ts +6 -1
- package/src/oauth/seed-providers.ts +56 -106
- package/src/outbound-proxy/http-forwarder.ts +9 -0
- package/src/permissions/approval-policy.test.ts +1223 -0
- package/src/permissions/approval-policy.ts +309 -0
- package/src/permissions/arg-parser.test.ts +161 -0
- package/src/permissions/arg-parser.ts +141 -0
- package/src/permissions/bash-risk-classifier.test.ts +1620 -0
- package/src/permissions/bash-risk-classifier.ts +950 -0
- package/src/permissions/checker.ts +348 -711
- package/src/permissions/command-registry.test.ts +774 -0
- package/src/permissions/command-registry.ts +1005 -0
- package/src/permissions/defaults.ts +28 -79
- package/src/permissions/file-risk-classifier.test.ts +535 -0
- package/src/permissions/file-risk-classifier.ts +274 -0
- package/src/permissions/gateway-threshold-reader.ts +196 -0
- package/src/permissions/prompter.ts +4 -0
- package/src/permissions/risk-types.ts +262 -0
- package/src/permissions/schedule-risk-classifier.test.ts +129 -0
- package/src/permissions/schedule-risk-classifier.ts +85 -0
- package/src/permissions/secret-prompter.ts +53 -2
- package/src/permissions/shell-identity.ts +2 -42
- package/src/permissions/skill-risk-classifier.test.ts +311 -0
- package/src/permissions/skill-risk-classifier.ts +214 -0
- package/src/permissions/trust-client.ts +52 -25
- package/src/permissions/trust-store-interface.ts +1 -6
- package/src/permissions/trust-store.ts +161 -62
- package/src/permissions/types.ts +25 -14
- package/src/permissions/web-risk-classifier.test.ts +170 -0
- package/src/permissions/web-risk-classifier.ts +89 -0
- package/src/permissions/workspace-policy.ts +9 -19
- package/src/platform/client.ts +19 -1
- package/src/plugins/defaults/circuit-breaker.ts +146 -0
- package/src/plugins/defaults/compaction.ts +145 -0
- package/src/plugins/defaults/empty-response.ts +126 -0
- package/src/plugins/defaults/history-repair.ts +85 -0
- package/src/plugins/defaults/index.ts +116 -0
- package/src/plugins/defaults/injectors.ts +491 -0
- package/src/plugins/defaults/llm-call.ts +82 -0
- package/src/plugins/defaults/memory-retrieval.ts +226 -0
- package/src/plugins/defaults/overflow-reduce.ts +181 -0
- package/src/plugins/defaults/persistence.ts +129 -0
- package/src/plugins/defaults/title-generate.ts +95 -0
- package/src/plugins/defaults/token-estimate.ts +104 -0
- package/src/plugins/defaults/tool-error.ts +126 -0
- package/src/plugins/defaults/tool-execute.ts +89 -0
- package/src/plugins/defaults/tool-result-truncate.ts +88 -0
- package/src/plugins/pipeline.ts +316 -0
- package/src/plugins/plugin-skill-contributions.ts +292 -0
- package/src/plugins/registry.ts +241 -0
- package/src/plugins/types.ts +1134 -0
- package/src/plugins/user-loader.ts +177 -0
- package/src/prompts/persona-resolver.ts +3 -3
- package/src/prompts/system-prompt.ts +19 -20
- package/src/prompts/templates/BOOTSTRAP.md +27 -77
- package/src/prompts/templates/SOUL.md +2 -2
- package/src/prompts/update-bulletin-job.ts +190 -0
- package/src/providers/__tests__/context-overflow-error.test.ts +328 -0
- package/src/providers/__tests__/provider-env-vars.test.ts +102 -0
- package/src/providers/__tests__/retry-callsite.test.ts +424 -0
- package/src/providers/anthropic/client.ts +183 -14
- package/src/providers/call-site-routing.ts +71 -0
- package/src/providers/gemini/client.ts +65 -2
- package/src/providers/managed-proxy/constants.ts +2 -1
- package/src/providers/model-catalog.ts +524 -33
- package/src/providers/model-intents.ts +4 -4
- package/src/providers/openai/chat-completions-provider.ts +57 -1
- package/src/providers/openai/responses-provider.ts +86 -9
- package/src/providers/openrouter/client.ts +80 -9
- package/src/providers/provider-env-vars.ts +56 -0
- package/src/providers/provider-send-message.ts +22 -5
- package/src/providers/ratelimit.ts +4 -0
- package/src/providers/registry.ts +19 -8
- package/src/providers/retry.ts +174 -39
- package/src/providers/speech-to-text/__tests__/resolve.test.ts +55 -0
- package/src/providers/speech-to-text/deepgram-realtime.test.ts +61 -0
- package/src/providers/speech-to-text/deepgram-realtime.ts +57 -0
- package/src/providers/speech-to-text/google-gemini-live-stream.ts +4 -4
- package/src/providers/speech-to-text/provider-catalog.ts +17 -0
- package/src/providers/speech-to-text/resolve.ts +7 -0
- package/src/providers/speech-to-text/xai-realtime.test.ts +646 -0
- package/src/providers/speech-to-text/xai-realtime.ts +821 -0
- package/src/providers/speech-to-text/xai.test.ts +155 -0
- package/src/providers/speech-to-text/xai.ts +97 -0
- package/src/providers/types.ts +93 -3
- package/src/runtime/AGENTS.md +27 -18
- package/src/runtime/__tests__/agent-wake.test.ts +43 -2
- package/src/runtime/__tests__/browser-extension-pair-routes.test.ts +3 -3
- package/src/runtime/__tests__/client-registry.test.ts +293 -0
- package/src/runtime/__tests__/interactive-ui.test.ts +673 -0
- package/src/runtime/agent-wake.ts +63 -22
- package/src/runtime/auth/route-policy.ts +4 -0
- package/src/runtime/btw-sidechain.ts +13 -3
- package/src/runtime/channel-reply-delivery.ts +106 -2
- package/src/runtime/client-registry.ts +261 -0
- package/src/runtime/decision-token.ts +116 -0
- package/src/runtime/gateway-client.ts +2 -2
- package/src/runtime/http-router.ts +32 -0
- package/src/runtime/http-server.ts +129 -9
- package/src/runtime/http-types.ts +23 -3
- package/src/runtime/interactive-ui.ts +362 -0
- package/src/runtime/invite-instruction-generator.ts +2 -2
- package/src/runtime/migrations/__tests__/gcs-signed-url.test.ts +176 -0
- package/src/runtime/migrations/__tests__/vbundle-metadata-merge-integration.test.ts +390 -0
- package/src/runtime/migrations/__tests__/vbundle-metadata-merge.test.ts +221 -0
- package/src/runtime/migrations/__tests__/vbundle-streaming-importer.test.ts +1540 -0
- package/src/runtime/migrations/__tests__/vbundle-streaming-validator.test.ts +453 -0
- package/src/runtime/migrations/__tests__/vbundle-tar-stream.test.ts +222 -0
- package/src/runtime/migrations/gcs-signed-url.ts +162 -0
- package/src/runtime/migrations/vbundle-builder.ts +1 -22
- package/src/runtime/migrations/vbundle-importer.ts +154 -9
- package/src/runtime/migrations/vbundle-metadata-merge.ts +124 -0
- package/src/runtime/migrations/vbundle-streaming-importer.ts +2522 -0
- package/src/runtime/migrations/vbundle-streaming-validator.ts +244 -0
- package/src/runtime/migrations/vbundle-tar-stream.ts +217 -0
- package/src/runtime/migrations/vbundle-validator.ts +15 -6
- package/src/runtime/routes/__tests__/home-feed-routes.test.ts +111 -0
- package/src/runtime/routes/__tests__/migration-import-credential-filter.test.ts +114 -75
- package/src/runtime/routes/__tests__/migration-vellum-metadata-reconcile.test.ts +246 -0
- package/src/runtime/routes/approval-prompt-ts-tracker.ts +78 -0
- package/src/runtime/routes/approval-routes.ts +29 -17
- package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +9 -0
- package/src/runtime/routes/avatar-routes.ts +20 -4
- package/src/runtime/routes/browser-extension-pair-routes.ts +27 -8
- package/src/runtime/routes/btw-routes.ts +1 -4
- package/src/runtime/routes/conversation-management-routes.ts +20 -2
- package/src/runtime/routes/conversation-routes.ts +351 -138
- package/src/runtime/routes/debug-routes.ts +1 -1
- package/src/runtime/routes/diagnostics-routes.ts +6 -4
- package/src/runtime/routes/events-routes.ts +16 -0
- package/src/runtime/routes/guardian-approval-interception.ts +33 -3
- package/src/runtime/routes/guardian-approval-prompt.ts +13 -3
- package/src/runtime/routes/home-feed-routes.ts +120 -2
- package/src/runtime/routes/inbound-message-handler.ts +987 -2
- package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +113 -2
- package/src/runtime/routes/inbound-stages/background-dispatch.ts +61 -3
- package/src/runtime/routes/inbound-stages/edit-intercept.ts +129 -6
- package/src/runtime/routes/integrations/slack/channel.ts +25 -3
- package/src/runtime/routes/llm-context-normalization.ts +23 -1
- package/src/runtime/routes/memory-item-routes.test.ts +1 -0
- package/src/runtime/routes/migration-routes.ts +720 -127
- package/src/runtime/routes/playground/__tests__/force-compact.test.ts +284 -0
- package/src/runtime/routes/playground/__tests__/guard.test.ts +80 -0
- package/src/runtime/routes/playground/__tests__/inject-failures.test.ts +294 -0
- package/src/runtime/routes/playground/__tests__/reset-circuit.test.ts +271 -0
- package/src/runtime/routes/playground/__tests__/seed-conversation.test.ts +202 -0
- package/src/runtime/routes/playground/__tests__/seeded-conversations.test.ts +309 -0
- package/src/runtime/routes/playground/__tests__/state.test.ts +224 -0
- package/src/runtime/routes/playground/conversation-not-found.ts +29 -0
- package/src/runtime/routes/playground/deps.ts +56 -0
- package/src/runtime/routes/playground/force-compact.ts +73 -0
- package/src/runtime/routes/playground/guard.ts +37 -0
- package/src/runtime/routes/playground/index.ts +28 -0
- package/src/runtime/routes/playground/inject-failures.ts +159 -0
- package/src/runtime/routes/playground/reset-circuit.ts +115 -0
- package/src/runtime/routes/playground/seed-conversation.ts +139 -0
- package/src/runtime/routes/playground/seeded-conversations.ts +78 -0
- package/src/runtime/routes/playground/state.ts +78 -0
- package/src/runtime/routes/schedule-routes.ts +89 -8
- package/src/runtime/routes/settings-routes.ts +4 -2
- package/src/runtime/routes/trust-rules-routes.ts +30 -14
- package/src/runtime/routes/work-items-routes.test.ts +1 -1
- package/src/runtime/routes/work-items-routes.ts +3 -2
- package/src/runtime/services/__tests__/analyze-conversation.test.ts +25 -43
- package/src/runtime/services/analyze-conversation.ts +12 -16
- package/src/runtime/skill-route-registry.ts +97 -15
- package/src/schedule/run-script.ts +68 -0
- package/src/schedule/schedule-store.ts +7 -1
- package/src/schedule/scheduler.ts +56 -8
- package/src/security/__tests__/provider-key-env-fallback.test.ts +119 -0
- package/src/security/__tests__/untrusted-content.test.ts +109 -0
- package/src/security/oauth2.ts +98 -35
- package/src/security/secure-keys.ts +7 -8
- package/src/security/token-manager.ts +27 -13
- package/src/security/untrusted-content.ts +102 -0
- package/src/skills/catalog-cache.ts +35 -9
- package/src/skills/catalog-install.ts +31 -3
- package/src/skills/skill-cache-store.ts +97 -0
- package/src/stt/__tests__/daemon-batch-transcriber.test.ts +76 -0
- package/src/stt/daemon-batch-transcriber.ts +33 -0
- package/src/stt/stt-stream-session.ts +8 -1
- package/src/stt/types.ts +5 -1
- package/src/subagent/manager.ts +41 -13
- package/src/tasks/ephemeral-permissions.ts +9 -4
- package/src/telemetry/usage-telemetry-reporter.ts +27 -5
- package/src/tools/browser/__tests__/browser-status.test.ts +234 -2
- package/src/tools/browser/browser-execution.ts +150 -54
- package/src/tools/browser/cdp-client/__tests__/extension-cdp-client.test.ts +230 -0
- package/src/tools/browser/cdp-client/__tests__/factory.test.ts +146 -3
- package/src/tools/browser/cdp-client/cdp-inspect/discovery.ts +22 -0
- package/src/tools/browser/cdp-client/extension-cdp-client.ts +54 -3
- package/src/tools/browser/cdp-client/factory.ts +15 -4
- package/src/tools/credentials/tool-policy.ts +39 -5
- package/src/tools/credentials/vault.ts +9 -4
- package/src/tools/executor.ts +129 -73
- package/src/tools/filesystem/write.ts +52 -0
- package/src/tools/host-terminal/host-shell.ts +45 -5
- package/src/tools/memory/register.test.ts +185 -0
- package/src/tools/memory/register.ts +3 -1
- package/src/tools/network/script-proxy/session-manager.ts +37 -1
- package/src/tools/network/web-fetch.ts +20 -10
- package/src/tools/network/web-search.ts +19 -4
- package/src/tools/permission-checker.ts +116 -46
- package/src/tools/policy-context.ts +29 -8
- package/src/tools/registry.ts +195 -6
- package/src/tools/schedule/create.ts +23 -8
- package/src/tools/schedule/update.ts +3 -1
- package/src/tools/secret-detection-handler.ts +0 -51
- package/src/tools/side-effects.ts +0 -11
- package/src/tools/skills/execute.ts +2 -2
- package/src/tools/skills/sandbox-runner.ts +5 -2
- package/src/tools/system/avatar-generator.ts +6 -2
- package/src/tools/terminal/backends/native.ts +51 -2
- package/src/tools/terminal/safe-env.ts +3 -2
- package/src/tools/terminal/shell.ts +1 -0
- package/src/tools/tool-manifest.ts +6 -21
- package/src/tools/types.ts +40 -5
- package/src/tools/verification-control-plane-policy.ts +1 -1
- package/src/tts/__tests__/provider-adapters.test.ts +240 -13
- package/src/tts/provider-catalog.ts +18 -0
- package/src/tts/providers/index.ts +2 -0
- package/src/tts/providers/xai-provider.ts +224 -0
- package/src/tts/types.ts +46 -0
- package/src/types/tar-stream.d.ts +66 -0
- package/src/util/json.ts +17 -0
- package/src/util/platform.ts +9 -4
- package/src/util/pricing.ts +41 -8
- package/src/watcher/engine.ts +1 -1
- package/src/watcher/providers/google-calendar.ts +134 -8
- package/src/watcher/providers/outlook-calendar.ts +42 -2
- package/src/workspace/git-service.ts +23 -4
- package/src/workspace/migrations/006-services-config.ts +2 -4
- package/src/workspace/migrations/022-move-hooks-to-workspace.ts +2 -3
- package/src/workspace/migrations/038-unify-llm-callsite-configs.ts +516 -0
- package/src/workspace/migrations/039-drop-legacy-llm-keys.ts +171 -0
- package/src/workspace/migrations/040-seed-latency-callsite-defaults.ts +154 -0
- package/src/workspace/migrations/041-backfill-google-gmail-settings-scope.ts +56 -0
- package/src/workspace/migrations/042-fix-backfill-google-gmail-settings-scope.ts +70 -0
- package/src/workspace/migrations/043-release-notes-latex-rendering.ts +75 -0
- package/src/workspace/migrations/044-bump-stale-provider-stream-timeout.ts +51 -0
- package/src/workspace/migrations/045-release-notes-meet-avatar.ts +130 -0
- package/src/workspace/migrations/046-seed-conversation-starters-callsite.ts +108 -0
- package/src/workspace/migrations/047-remove-watch-callsites.ts +54 -0
- package/src/workspace/migrations/048-remove-workspace-hooks.ts +81 -0
- package/src/workspace/migrations/049-release-notes-default-sonnet.ts +80 -0
- package/src/workspace/migrations/050-seed-main-agent-opus-callsite.ts +86 -0
- package/src/workspace/migrations/051-seed-conversation-summarization-callsite.ts +128 -0
- package/src/workspace/migrations/AGENTS.md +1 -1
- package/src/workspace/migrations/registry.ts +28 -0
- package/src/workspace/provider-commit-message-generator.ts +19 -38
- package/tsconfig.json +1 -1
- package/hook-templates/debug-prompt-logger/hook.json +0 -7
- package/hook-templates/debug-prompt-logger/run.sh +0 -66
- package/src/__tests__/context-overflow-approval.test.ts +0 -156
- package/src/__tests__/gmail-archive-fallback.test.ts +0 -193
- package/src/__tests__/gmail-archive-gate.test.ts +0 -246
- package/src/__tests__/gmail-preferences.test.ts +0 -117
- package/src/__tests__/hooks-blocking.test.ts +0 -178
- package/src/__tests__/hooks-cli.test.ts +0 -182
- package/src/__tests__/hooks-config.test.ts +0 -108
- package/src/__tests__/hooks-discovery.test.ts +0 -211
- package/src/__tests__/hooks-integration.test.ts +0 -196
- package/src/__tests__/hooks-manager.test.ts +0 -226
- package/src/__tests__/hooks-runner.test.ts +0 -175
- package/src/__tests__/hooks-settings.test.ts +0 -160
- package/src/__tests__/hooks-templates.test.ts +0 -169
- package/src/__tests__/hooks-ts-runner.test.ts +0 -170
- package/src/__tests__/hooks-watch.test.ts +0 -112
- package/src/__tests__/notification-schedule-dedup.test.ts +0 -213
- package/src/__tests__/oauth-scope-policy.test.ts +0 -180
- package/src/__tests__/outlook-attachments.test.ts +0 -301
- package/src/__tests__/outlook-automation-tools.test.ts +0 -425
- package/src/__tests__/outlook-categories.test.ts +0 -212
- package/src/__tests__/outlook-compose-tools.test.ts +0 -325
- package/src/__tests__/outlook-declutter-tools.test.ts +0 -585
- package/src/__tests__/outlook-follow-up.test.ts +0 -196
- package/src/__tests__/outlook-trash.test.ts +0 -77
- package/src/__tests__/outlook-unsubscribe.test.ts +0 -279
- package/src/__tests__/send-notification-tool.test.ts +0 -83
- package/src/__tests__/update-bulletin-format.test.ts +0 -181
- package/src/__tests__/update-bulletin-state.test.ts +0 -135
- package/src/__tests__/update-bulletin.test.ts +0 -478
- package/src/__tests__/update-template-contract.test.ts +0 -29
- package/src/cli/commands/doctor.ts +0 -341
- package/src/cli/commands/shotgun.ts +0 -266
- package/src/config/bundled-skills/browser/SKILL.md +0 -88
- package/src/config/bundled-skills/browser/TOOLS.json +0 -516
- package/src/config/bundled-skills/browser/tools/browser-attach.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-click.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-close.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-detach.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-extract.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-fill-credential.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-hover.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-navigate.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-press-key.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-screenshot.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-scroll.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-select-option.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-snapshot.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-status.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-type.ts +0 -12
- package/src/config/bundled-skills/browser/tools/browser-wait-for-download.ts +0 -49
- package/src/config/bundled-skills/browser/tools/browser-wait-for.ts +0 -12
- package/src/config/bundled-skills/chatgpt-import/SKILL.md +0 -27
- package/src/config/bundled-skills/chatgpt-import/TOOLS.json +0 -27
- package/src/config/bundled-skills/chatgpt-import/tools/chatgpt-import.ts +0 -378
- package/src/config/bundled-skills/conversations/SKILL.md +0 -20
- package/src/config/bundled-skills/conversations/TOOLS.json +0 -23
- package/src/config/bundled-skills/conversations/tools/rename-conversation.ts +0 -66
- package/src/config/bundled-skills/gmail/SKILL.md +0 -221
- package/src/config/bundled-skills/gmail/TOOLS.json +0 -588
- package/src/config/bundled-skills/gmail/tools/gmail-archive.ts +0 -256
- package/src/config/bundled-skills/gmail/tools/gmail-attachments.ts +0 -112
- package/src/config/bundled-skills/gmail/tools/gmail-draft.ts +0 -44
- package/src/config/bundled-skills/gmail/tools/gmail-filters.ts +0 -81
- package/src/config/bundled-skills/gmail/tools/gmail-follow-up.ts +0 -108
- package/src/config/bundled-skills/gmail/tools/gmail-forward.ts +0 -146
- package/src/config/bundled-skills/gmail/tools/gmail-label.ts +0 -53
- package/src/config/bundled-skills/gmail/tools/gmail-outreach-scan.ts +0 -347
- package/src/config/bundled-skills/gmail/tools/gmail-preferences-tool.ts +0 -59
- package/src/config/bundled-skills/gmail/tools/gmail-preferences.ts +0 -82
- package/src/config/bundled-skills/gmail/tools/gmail-send-draft.ts +0 -26
- package/src/config/bundled-skills/gmail/tools/gmail-sender-digest.ts +0 -347
- package/src/config/bundled-skills/gmail/tools/gmail-trash.ts +0 -29
- package/src/config/bundled-skills/gmail/tools/gmail-unsubscribe.ts +0 -122
- package/src/config/bundled-skills/gmail/tools/gmail-vacation.ts +0 -67
- package/src/config/bundled-skills/gmail/tools/scan-result-store.ts +0 -100
- package/src/config/bundled-skills/gmail/tools/shared.ts +0 -47
- package/src/config/bundled-skills/google-calendar/SKILL.md +0 -51
- package/src/config/bundled-skills/google-calendar/TOOLS.json +0 -226
- package/src/config/bundled-skills/google-calendar/calendar-client.ts +0 -223
- package/src/config/bundled-skills/google-calendar/tools/calendar-check-availability.ts +0 -27
- package/src/config/bundled-skills/google-calendar/tools/calendar-create-event.ts +0 -48
- package/src/config/bundled-skills/google-calendar/tools/calendar-get-event.ts +0 -19
- package/src/config/bundled-skills/google-calendar/tools/calendar-list-events.ts +0 -36
- package/src/config/bundled-skills/google-calendar/tools/calendar-rsvp.ts +0 -58
- package/src/config/bundled-skills/google-calendar/tools/shared.ts +0 -17
- package/src/config/bundled-skills/google-calendar/types.ts +0 -97
- package/src/config/bundled-skills/heartbeat/SKILL.md +0 -43
- package/src/config/bundled-skills/notifications/SKILL.md +0 -40
- package/src/config/bundled-skills/notifications/TOOLS.json +0 -80
- package/src/config/bundled-skills/notifications/tools/send-notification.ts +0 -152
- package/src/config/bundled-skills/notifications/tools/shared.ts +0 -13
- package/src/config/bundled-skills/outlook/SKILL.md +0 -196
- package/src/config/bundled-skills/outlook/TOOLS.json +0 -530
- package/src/config/bundled-skills/outlook/tools/outlook-attachments.ts +0 -85
- package/src/config/bundled-skills/outlook/tools/outlook-categories.ts +0 -77
- package/src/config/bundled-skills/outlook/tools/outlook-draft.ts +0 -84
- package/src/config/bundled-skills/outlook/tools/outlook-follow-up.ts +0 -94
- package/src/config/bundled-skills/outlook/tools/outlook-forward.ts +0 -49
- package/src/config/bundled-skills/outlook/tools/outlook-outreach-scan.ts +0 -237
- package/src/config/bundled-skills/outlook/tools/outlook-rules.ts +0 -161
- package/src/config/bundled-skills/outlook/tools/outlook-send-draft.ts +0 -32
- package/src/config/bundled-skills/outlook/tools/outlook-sender-digest.ts +0 -272
- package/src/config/bundled-skills/outlook/tools/outlook-trash.ts +0 -29
- package/src/config/bundled-skills/outlook/tools/outlook-unsubscribe.ts +0 -129
- package/src/config/bundled-skills/outlook/tools/outlook-vacation.ts +0 -87
- package/src/config/bundled-skills/outlook/tools/shared.ts +0 -20
- package/src/config/bundled-skills/outlook-calendar/SKILL.md +0 -51
- package/src/config/bundled-skills/outlook-calendar/TOOLS.json +0 -221
- package/src/config/bundled-skills/outlook-calendar/calendar-client.ts +0 -252
- package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-check-availability.ts +0 -53
- package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-create-event.ts +0 -74
- package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-get-event.ts +0 -18
- package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-list-events.ts +0 -46
- package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-rsvp.ts +0 -36
- package/src/config/bundled-skills/outlook-calendar/tools/shared.ts +0 -17
- package/src/config/bundled-skills/outlook-calendar/types.ts +0 -120
- package/src/config/bundled-skills/screen-watch/SKILL.md +0 -27
- package/src/config/bundled-skills/screen-watch/TOOLS.json +0 -35
- package/src/config/bundled-skills/screen-watch/tools/start-screen-watch.ts +0 -12
- package/src/config/bundled-skills/skills-catalog/SKILL.md +0 -84
- package/src/config/bundled-skills/slack/SKILL.md +0 -108
- package/src/config/bundled-skills/tasks/SKILL.md +0 -37
- package/src/config/bundled-skills/tasks/TOOLS.json +0 -353
- package/src/config/bundled-skills/tasks/icon.svg +0 -34
- package/src/config/bundled-skills/tasks/tools/task-delete.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-list-add.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-list-remove.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-list-show.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-list-update.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-list.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-queue-run.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-run.ts +0 -12
- package/src/config/bundled-skills/tasks/tools/task-save.ts +0 -12
- package/src/config/bundled-skills/watcher/SKILL.md +0 -31
- package/src/config/bundled-skills/watcher/TOOLS.json +0 -167
- package/src/config/bundled-skills/watcher/tools/watcher-create.ts +0 -12
- package/src/config/bundled-skills/watcher/tools/watcher-delete.ts +0 -12
- package/src/config/bundled-skills/watcher/tools/watcher-digest.ts +0 -12
- package/src/config/bundled-skills/watcher/tools/watcher-list.ts +0 -12
- package/src/config/bundled-skills/watcher/tools/watcher-update.ts +0 -12
- package/src/daemon/context-overflow-approval.ts +0 -52
- package/src/daemon/watch-handler.ts +0 -399
- package/src/hooks/cli.ts +0 -253
- package/src/hooks/config.ts +0 -100
- package/src/hooks/discovery.ts +0 -135
- package/src/hooks/manager.ts +0 -179
- package/src/hooks/runner.ts +0 -117
- package/src/hooks/templates.ts +0 -77
- package/src/hooks/types.ts +0 -75
- package/src/oauth/scope-policy.ts +0 -89
- package/src/prompts/templates/UPDATES.md +0 -50
- package/src/prompts/update-bulletin-format.ts +0 -85
- package/src/prompts/update-bulletin-state.ts +0 -58
- package/src/prompts/update-bulletin-template-path.ts +0 -13
- package/src/prompts/update-bulletin.ts +0 -139
- package/src/runtime/gateway-internal-client.ts +0 -94
- package/src/runtime/routes/watch-routes.ts +0 -156
- package/src/shared/provider-env-vars.ts +0 -19
- package/src/signals/shotgun.ts +0 -203
- package/src/tools/watch/screen-watch.ts +0 -144
- package/src/tools/watch/watch-state.ts +0 -142
- package/src/tools/watcher/create.ts +0 -86
- package/src/tools/watcher/delete.ts +0 -36
- package/src/tools/watcher/digest.ts +0 -54
- package/src/tools/watcher/list.ts +0 -83
- package/src/tools/watcher/update.ts +0 -71
|
@@ -0,0 +1,208 @@
|
|
|
1
|
+
import { beforeEach, describe, expect, test } from "bun:test";
|
|
2
|
+
|
|
3
|
+
import {
|
|
4
|
+
getCalibrationSnapshot,
|
|
5
|
+
getCorrection,
|
|
6
|
+
recordEstimate,
|
|
7
|
+
resetCalibrations,
|
|
8
|
+
} from "../context/estimator-calibration.js";
|
|
9
|
+
import {
|
|
10
|
+
estimatePromptTokens,
|
|
11
|
+
getCalibrationProviderKey,
|
|
12
|
+
} from "../context/token-estimator.js";
|
|
13
|
+
import type { Message, Provider } from "../providers/types.js";
|
|
14
|
+
|
|
15
|
+
/**
|
|
16
|
+
* Integration-style tests that exercise the full self-calibration loop end
|
|
17
|
+
* to end:
|
|
18
|
+
* 1. Estimate is recorded for a `(provider, model)` pair via
|
|
19
|
+
* `handleUsage` (the record side still threads the provider-echoed
|
|
20
|
+
* model through `recordEstimate`).
|
|
21
|
+
* 2. A subsequent `estimatePromptTokens` lookup picks up the learned
|
|
22
|
+
* correction via the per-provider aggregate key `(provider, "")`.
|
|
23
|
+
* Lookup always uses the aggregate — model-specific keys are only
|
|
24
|
+
* read as a fallback inside `getCorrection`.
|
|
25
|
+
*
|
|
26
|
+
* Since the `modelId` lookup option has been removed from the public
|
|
27
|
+
* token-estimator API, the lookup side always converges to the aggregate.
|
|
28
|
+
* `recordEstimate` still updates both the specific `(provider, model)`
|
|
29
|
+
* key AND the `(provider, "")` aggregate on every sample, so the
|
|
30
|
+
* aggregate stays accurate even as per-model data accumulates.
|
|
31
|
+
*/
|
|
32
|
+
describe("estimator calibration — end-to-end recording → lookup", () => {
|
|
33
|
+
beforeEach(() => {
|
|
34
|
+
resetCalibrations();
|
|
35
|
+
});
|
|
36
|
+
|
|
37
|
+
/**
|
|
38
|
+
* Build a representative message history with enough content to clear the
|
|
39
|
+
* MIN_SAMPLE_MAGNITUDE floor (500 tokens). Each message repeats a block of
|
|
40
|
+
* text large enough to make the heuristic estimator produce a substantial
|
|
41
|
+
* token count so the calibration machinery actually runs.
|
|
42
|
+
*/
|
|
43
|
+
function largeHistory(): Message[] {
|
|
44
|
+
const body = "lorem ipsum dolor sit amet ".repeat(500);
|
|
45
|
+
return [
|
|
46
|
+
{ role: "user", content: [{ type: "text", text: body }] },
|
|
47
|
+
{ role: "assistant", content: [{ type: "text", text: body }] },
|
|
48
|
+
{ role: "user", content: [{ type: "text", text: body }] },
|
|
49
|
+
];
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
test("subsequent estimate picks up the aggregate-key correction", () => {
|
|
53
|
+
const provider: Provider = {
|
|
54
|
+
name: "anthropic",
|
|
55
|
+
async sendMessage() {
|
|
56
|
+
throw new Error("not used in this test");
|
|
57
|
+
},
|
|
58
|
+
};
|
|
59
|
+
const model = "claude-sonnet-4-5";
|
|
60
|
+
const history = largeHistory();
|
|
61
|
+
|
|
62
|
+
// 1. Raw estimate (what agent/loop.ts computes pre-send).
|
|
63
|
+
const preSend = estimatePromptTokens(history, "system", {
|
|
64
|
+
providerName: getCalibrationProviderKey(provider),
|
|
65
|
+
});
|
|
66
|
+
expect(preSend).toBeGreaterThan(0);
|
|
67
|
+
|
|
68
|
+
// Baseline: no correction recorded yet.
|
|
69
|
+
expect(getCorrection("anthropic", "")).toBe(1.0);
|
|
70
|
+
|
|
71
|
+
// 2. Provider returns ground truth (simulating `handleUsage`, which
|
|
72
|
+
// still records under (provider, event.model) and folds into the
|
|
73
|
+
// aggregate). Simulate a systematic 30% underestimate.
|
|
74
|
+
const groundTruth = Math.ceil(preSend * 1.3);
|
|
75
|
+
recordEstimate(
|
|
76
|
+
getCalibrationProviderKey(provider),
|
|
77
|
+
model,
|
|
78
|
+
preSend,
|
|
79
|
+
groundTruth,
|
|
80
|
+
);
|
|
81
|
+
|
|
82
|
+
// 3. Lookup under the aggregate key now returns the learned ratio.
|
|
83
|
+
expect(getCorrection("anthropic", "")).toBeCloseTo(1.3, 3);
|
|
84
|
+
|
|
85
|
+
// And the corrected estimate moves toward the ground truth.
|
|
86
|
+
const corrected = estimatePromptTokens(history, "system", {
|
|
87
|
+
providerName: getCalibrationProviderKey(provider),
|
|
88
|
+
});
|
|
89
|
+
// With correction factor ≈1.3, corrected estimate is within 1 token of
|
|
90
|
+
// the ground truth (Math.ceil rounding).
|
|
91
|
+
expect(corrected).toBeGreaterThan(preSend);
|
|
92
|
+
expect(Math.abs(corrected - groundTruth)).toBeLessThanOrEqual(1);
|
|
93
|
+
});
|
|
94
|
+
|
|
95
|
+
test("record with model writes both the specific and aggregate keys", () => {
|
|
96
|
+
// Simulate a preflight site that records against (anthropic, sonnet).
|
|
97
|
+
// `recordEstimate` also folds the sample into the `(anthropic, "")`
|
|
98
|
+
// aggregate so aggregate-key callers see the correction.
|
|
99
|
+
const provider: Provider = {
|
|
100
|
+
name: "anthropic",
|
|
101
|
+
async sendMessage() {
|
|
102
|
+
throw new Error("not used");
|
|
103
|
+
},
|
|
104
|
+
};
|
|
105
|
+
const history = largeHistory();
|
|
106
|
+
|
|
107
|
+
const preSend = estimatePromptTokens(history, "system", {
|
|
108
|
+
providerName: getCalibrationProviderKey(provider),
|
|
109
|
+
});
|
|
110
|
+
const groundTruth = Math.ceil(preSend * 1.25);
|
|
111
|
+
|
|
112
|
+
recordEstimate(
|
|
113
|
+
getCalibrationProviderKey(provider),
|
|
114
|
+
"claude-sonnet-4-5",
|
|
115
|
+
preSend,
|
|
116
|
+
groundTruth,
|
|
117
|
+
);
|
|
118
|
+
|
|
119
|
+
// A subsequent lookup via the token-estimator uses the per-provider
|
|
120
|
+
// aggregate (the only key the public API reads).
|
|
121
|
+
const correctedAggregate = estimatePromptTokens(history, "system", {
|
|
122
|
+
providerName: getCalibrationProviderKey(provider),
|
|
123
|
+
});
|
|
124
|
+
// Aggregate ratio ≈ 1.25 (first sample snaps to exact ratio).
|
|
125
|
+
expect(correctedAggregate).toBe(Math.ceil(preSend * 1.25));
|
|
126
|
+
});
|
|
127
|
+
|
|
128
|
+
test("wrapper provider (OpenRouter → Anthropic) uses the canonical key on both sides", () => {
|
|
129
|
+
// This is the Devin scenario: OpenRouter wraps Anthropic. If the record
|
|
130
|
+
// site used `name` ("openrouter") and the lookup site used
|
|
131
|
+
// `tokenEstimationProvider` ("anthropic"), the data would be scattered
|
|
132
|
+
// across mismatched keys and calibration would silently fail.
|
|
133
|
+
// `getCalibrationProviderKey` gives us one source of truth.
|
|
134
|
+
const openrouter: Provider = {
|
|
135
|
+
name: "openrouter",
|
|
136
|
+
tokenEstimationProvider: "anthropic",
|
|
137
|
+
async sendMessage() {
|
|
138
|
+
throw new Error("not used");
|
|
139
|
+
},
|
|
140
|
+
};
|
|
141
|
+
const model = "anthropic/claude-sonnet-4-5";
|
|
142
|
+
const history = largeHistory();
|
|
143
|
+
|
|
144
|
+
// Pre-send estimate via the canonical key.
|
|
145
|
+
const preSend = estimatePromptTokens(history, "system", {
|
|
146
|
+
providerName: getCalibrationProviderKey(openrouter),
|
|
147
|
+
});
|
|
148
|
+
expect(preSend).toBeGreaterThan(0);
|
|
149
|
+
|
|
150
|
+
// Provider returns ground truth. `handleUsage` uses the same helper
|
|
151
|
+
// to pick the calibration key, so the record and lookup sides agree.
|
|
152
|
+
const groundTruth = Math.ceil(preSend * 1.2);
|
|
153
|
+
recordEstimate(
|
|
154
|
+
getCalibrationProviderKey(openrouter),
|
|
155
|
+
model,
|
|
156
|
+
preSend,
|
|
157
|
+
groundTruth,
|
|
158
|
+
);
|
|
159
|
+
|
|
160
|
+
// Lookup under "anthropic" — the canonical upstream key — returns the
|
|
161
|
+
// ratio. `precision=3` gives ~0.0005 tolerance, which covers the Math.ceil rounding noise in groundTruth.
|
|
162
|
+
expect(getCorrection("anthropic", model)).toBeCloseTo(1.2, 3);
|
|
163
|
+
// Aggregate under the canonical upstream key is also populated.
|
|
164
|
+
expect(getCorrection("anthropic", "")).toBeCloseTo(1.2, 3);
|
|
165
|
+
// And under the bare wrapper name stays at the default, because NOTHING
|
|
166
|
+
// was recorded under "openrouter".
|
|
167
|
+
expect(getCorrection("openrouter", "")).toBe(1.0);
|
|
168
|
+
|
|
169
|
+
// The snapshot reflects a single (provider, model) key + aggregate under
|
|
170
|
+
// the canonical upstream key — never under the wrapper name.
|
|
171
|
+
const keys = getCalibrationSnapshot().map(
|
|
172
|
+
(e) => `${e.provider}::${e.model}`,
|
|
173
|
+
);
|
|
174
|
+
expect(keys).toContain(`anthropic::${model}`);
|
|
175
|
+
expect(keys).toContain("anthropic::");
|
|
176
|
+
expect(keys).not.toContain(`openrouter::${model}`);
|
|
177
|
+
});
|
|
178
|
+
|
|
179
|
+
test("a run of consistent samples pulls the estimate toward ground truth", () => {
|
|
180
|
+
// The EWMA should converge quickly. After five consistent 1.3 samples
|
|
181
|
+
// the correction should be within 1% of 1.3, and the corrected estimate
|
|
182
|
+
// should be within 1% of the ground truth.
|
|
183
|
+
const model = "claude-sonnet-4-5";
|
|
184
|
+
const history = largeHistory();
|
|
185
|
+
|
|
186
|
+
const preSend = estimatePromptTokens(history, "system", {
|
|
187
|
+
providerName: "anthropic",
|
|
188
|
+
});
|
|
189
|
+
const groundTruth = Math.ceil(preSend * 1.3);
|
|
190
|
+
|
|
191
|
+
for (let i = 0; i < 5; i++) {
|
|
192
|
+
recordEstimate("anthropic", model, preSend, groundTruth);
|
|
193
|
+
}
|
|
194
|
+
|
|
195
|
+
const finalCorrection = getCorrection("anthropic", "");
|
|
196
|
+
// EWMA with alpha=0.2 on constant 1.3 stays at 1.3 from the first sample
|
|
197
|
+
// onward (all deltas are 0 after the initial snap). `precision=3` gives
|
|
198
|
+
// us ~0.0005 tolerance which covers the Math.ceil rounding noise.
|
|
199
|
+
expect(finalCorrection).toBeCloseTo(1.3, 3);
|
|
200
|
+
|
|
201
|
+
const corrected = estimatePromptTokens(history, "system", {
|
|
202
|
+
providerName: "anthropic",
|
|
203
|
+
});
|
|
204
|
+
// Corrected should be very close to the ground truth (within 1 token
|
|
205
|
+
// because of the Math.ceil rounding at the end of estimatePromptTokens).
|
|
206
|
+
expect(Math.abs(corrected - groundTruth)).toBeLessThanOrEqual(1);
|
|
207
|
+
});
|
|
208
|
+
});
|
|
@@ -0,0 +1,213 @@
|
|
|
1
|
+
import { beforeEach, describe, expect, test } from "bun:test";
|
|
2
|
+
|
|
3
|
+
import {
|
|
4
|
+
getCalibrationSnapshot,
|
|
5
|
+
getCorrection,
|
|
6
|
+
recordEstimate,
|
|
7
|
+
resetCalibrations,
|
|
8
|
+
} from "../context/estimator-calibration.js";
|
|
9
|
+
|
|
10
|
+
describe("estimator calibration", () => {
|
|
11
|
+
beforeEach(() => {
|
|
12
|
+
resetCalibrations();
|
|
13
|
+
});
|
|
14
|
+
|
|
15
|
+
test("default correction is 1.0 for unseen (provider, model)", () => {
|
|
16
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
17
|
+
expect(getCorrection("openai", "gpt-5")).toBe(1.0);
|
|
18
|
+
});
|
|
19
|
+
|
|
20
|
+
test("first sample yields the exact ratio", () => {
|
|
21
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
22
|
+
const ratio = getCorrection("anthropic", "claude-sonnet-4-5");
|
|
23
|
+
expect(ratio).toBeCloseTo(1.3, 5);
|
|
24
|
+
});
|
|
25
|
+
|
|
26
|
+
test("EWMA converges to the target ratio given consistent samples", () => {
|
|
27
|
+
// Seed with a ratio far from the target so the first sample is off,
|
|
28
|
+
// then hammer with consistent 1.3 samples and watch EWMA close the gap.
|
|
29
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 100_000);
|
|
30
|
+
for (let i = 0; i < 20; i++) {
|
|
31
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
32
|
+
}
|
|
33
|
+
const ratio = getCorrection("anthropic", "claude-sonnet-4-5");
|
|
34
|
+
expect(ratio).toBeGreaterThan(1.25);
|
|
35
|
+
expect(ratio).toBeLessThan(1.35);
|
|
36
|
+
});
|
|
37
|
+
|
|
38
|
+
test("ten consistent 1.3 samples land within 0.05 of 1.3", () => {
|
|
39
|
+
for (let i = 0; i < 10; i++) {
|
|
40
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
41
|
+
}
|
|
42
|
+
const ratio = getCorrection("anthropic", "claude-sonnet-4-5");
|
|
43
|
+
expect(Math.abs(ratio - 1.3)).toBeLessThan(0.05);
|
|
44
|
+
});
|
|
45
|
+
|
|
46
|
+
test("values below MIN_SAMPLE_MAGNITUDE are ignored", () => {
|
|
47
|
+
// Both below the floor
|
|
48
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 200, 400);
|
|
49
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
50
|
+
|
|
51
|
+
// Estimated below the floor
|
|
52
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 200, 100_000);
|
|
53
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
54
|
+
|
|
55
|
+
// Actual below the floor
|
|
56
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 200);
|
|
57
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
58
|
+
});
|
|
59
|
+
|
|
60
|
+
test("ratios outside [1/3, 3] are discarded as outliers", () => {
|
|
61
|
+
// 4x too high
|
|
62
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 400_000);
|
|
63
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
64
|
+
|
|
65
|
+
// 4x too low
|
|
66
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 25_000);
|
|
67
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
68
|
+
|
|
69
|
+
// Just above the 3x edge — still discarded
|
|
70
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 300_001);
|
|
71
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
72
|
+
|
|
73
|
+
// Exactly at the 3x edge — accepted (ratio === 3, not > 3)
|
|
74
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 300_000);
|
|
75
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(3, 5);
|
|
76
|
+
});
|
|
77
|
+
|
|
78
|
+
test("resetCalibrations clears all state", () => {
|
|
79
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
80
|
+
recordEstimate("openai", "gpt-5", 100_000, 90_000);
|
|
81
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(1.3);
|
|
82
|
+
expect(getCorrection("openai", "gpt-5")).toBeCloseTo(0.9);
|
|
83
|
+
|
|
84
|
+
resetCalibrations();
|
|
85
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBe(1.0);
|
|
86
|
+
expect(getCorrection("openai", "gpt-5")).toBe(1.0);
|
|
87
|
+
expect(getCalibrationSnapshot()).toHaveLength(0);
|
|
88
|
+
});
|
|
89
|
+
|
|
90
|
+
test("distinct (provider, model) keys are independent", () => {
|
|
91
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
92
|
+
recordEstimate("anthropic", "claude-opus-4-7", 100_000, 110_000);
|
|
93
|
+
recordEstimate("openai", "gpt-5", 100_000, 90_000);
|
|
94
|
+
recordEstimate("openai", "gpt-5", 100_000, 90_000);
|
|
95
|
+
recordEstimate("openai", "gpt-5", 100_000, 90_000);
|
|
96
|
+
|
|
97
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(1.3, 5);
|
|
98
|
+
expect(getCorrection("anthropic", "claude-opus-4-7")).toBeCloseTo(1.1, 5);
|
|
99
|
+
// openai::gpt-5: after 3 EWMA steps of ratio 0.9, still exactly 0.9
|
|
100
|
+
// because the first sample snaps to ratio and subsequent deltas are 0.
|
|
101
|
+
expect(getCorrection("openai", "gpt-5")).toBeCloseTo(0.9, 5);
|
|
102
|
+
|
|
103
|
+
// Model separation: ensure a sample to one (provider, model) pair does
|
|
104
|
+
// not pollute another model under the same provider.
|
|
105
|
+
expect(getCorrection("anthropic", "claude-opus-4-7")).not.toBe(
|
|
106
|
+
getCorrection("anthropic", "claude-sonnet-4-5"),
|
|
107
|
+
);
|
|
108
|
+
});
|
|
109
|
+
|
|
110
|
+
test("snapshot reports current calibrations", () => {
|
|
111
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
112
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
113
|
+
recordEstimate("openai", "gpt-5", 100_000, 90_000);
|
|
114
|
+
|
|
115
|
+
const snap = getCalibrationSnapshot();
|
|
116
|
+
// Every non-empty-model sample also updates the per-provider aggregate
|
|
117
|
+
// key (provider, ""). Two providers × {specific model, aggregate} = 4.
|
|
118
|
+
expect(snap).toHaveLength(4);
|
|
119
|
+
|
|
120
|
+
const anthropicEntry = snap.find(
|
|
121
|
+
(e) => e.provider === "anthropic" && e.model === "claude-sonnet-4-5",
|
|
122
|
+
);
|
|
123
|
+
expect(anthropicEntry).toBeDefined();
|
|
124
|
+
expect(anthropicEntry?.samples).toBe(2);
|
|
125
|
+
expect(anthropicEntry?.ratio).toBeCloseTo(1.3, 5);
|
|
126
|
+
|
|
127
|
+
const openaiEntry = snap.find(
|
|
128
|
+
(e) => e.provider === "openai" && e.model === "gpt-5",
|
|
129
|
+
);
|
|
130
|
+
expect(openaiEntry).toBeDefined();
|
|
131
|
+
expect(openaiEntry?.samples).toBe(1);
|
|
132
|
+
expect(openaiEntry?.ratio).toBeCloseTo(0.9, 5);
|
|
133
|
+
|
|
134
|
+
// Per-provider aggregates are present and track the specific samples.
|
|
135
|
+
const anthropicAggregate = snap.find(
|
|
136
|
+
(e) => e.provider === "anthropic" && e.model === "",
|
|
137
|
+
);
|
|
138
|
+
expect(anthropicAggregate?.samples).toBe(2);
|
|
139
|
+
expect(anthropicAggregate?.ratio).toBeCloseTo(1.3, 5);
|
|
140
|
+
|
|
141
|
+
const openaiAggregate = snap.find(
|
|
142
|
+
(e) => e.provider === "openai" && e.model === "",
|
|
143
|
+
);
|
|
144
|
+
expect(openaiAggregate?.samples).toBe(1);
|
|
145
|
+
expect(openaiAggregate?.ratio).toBeCloseTo(0.9, 5);
|
|
146
|
+
});
|
|
147
|
+
|
|
148
|
+
test("specific-model lookup falls back to the per-provider aggregate when no model-specific samples exist", () => {
|
|
149
|
+
// Writing only to the aggregate simulates the case where callers without
|
|
150
|
+
// a resolved modelId have been recording, and then a model-specific
|
|
151
|
+
// caller asks for its correction.
|
|
152
|
+
recordEstimate("anthropic", "", 100_000, 130_000);
|
|
153
|
+
expect(getCorrection("anthropic", "")).toBeCloseTo(1.3, 5);
|
|
154
|
+
// The specific model has no own samples, but gets the aggregate.
|
|
155
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(1.3, 5);
|
|
156
|
+
// An unseen provider still defaults to 1.0.
|
|
157
|
+
expect(getCorrection("gemini", "gemini-2.5-pro")).toBe(1.0);
|
|
158
|
+
});
|
|
159
|
+
|
|
160
|
+
test("specific-model samples take precedence over the aggregate", () => {
|
|
161
|
+
recordEstimate("anthropic", "", 100_000, 130_000); // aggregate = 1.3
|
|
162
|
+
recordEstimate("anthropic", "claude-opus-4-7", 100_000, 110_000); // specific = 1.1
|
|
163
|
+
expect(getCorrection("anthropic", "claude-opus-4-7")).not.toBeCloseTo(
|
|
164
|
+
1.3,
|
|
165
|
+
5,
|
|
166
|
+
);
|
|
167
|
+
// A different model under the same provider still falls back to the
|
|
168
|
+
// aggregate (which now reflects both samples via EWMA).
|
|
169
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).not.toBe(1.0);
|
|
170
|
+
});
|
|
171
|
+
|
|
172
|
+
test("recording with a specific model also updates the per-provider aggregate", () => {
|
|
173
|
+
// The calibration writes `(provider, model)` and every caller of
|
|
174
|
+
// `estimatePromptTokens` that cannot resolve a model falls back to
|
|
175
|
+
// `(provider, "")`. Without the aggregate update, those callers would
|
|
176
|
+
// stay at the 1.0 default forever, defeating the whole mechanism.
|
|
177
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 130_000);
|
|
178
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(1.3, 5);
|
|
179
|
+
expect(getCorrection("anthropic", "")).toBeCloseTo(1.3, 5);
|
|
180
|
+
// A different provider is unaffected.
|
|
181
|
+
expect(getCorrection("openai", "")).toBe(1.0);
|
|
182
|
+
});
|
|
183
|
+
|
|
184
|
+
test("the per-provider aggregate tracks a rolling EWMA across models", () => {
|
|
185
|
+
// Samples across two models for one provider should each feed the
|
|
186
|
+
// aggregate EWMA, so a generic lookup reflects recent activity from
|
|
187
|
+
// any model on that provider.
|
|
188
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 120_000);
|
|
189
|
+
recordEstimate("anthropic", "claude-opus-4-7", 100_000, 120_000);
|
|
190
|
+
recordEstimate("anthropic", "claude-sonnet-4-5", 100_000, 120_000);
|
|
191
|
+
recordEstimate("anthropic", "claude-opus-4-7", 100_000, 120_000);
|
|
192
|
+
|
|
193
|
+
// After four consistent 1.2 samples (two per model-specific key, all four
|
|
194
|
+
// folded into the aggregate key) the EWMA for each sits very close to 1.2.
|
|
195
|
+
expect(getCorrection("anthropic", "")).toBeCloseTo(1.2, 1);
|
|
196
|
+
expect(getCorrection("anthropic", "claude-sonnet-4-5")).toBeCloseTo(1.2, 1);
|
|
197
|
+
expect(getCorrection("anthropic", "claude-opus-4-7")).toBeCloseTo(1.2, 1);
|
|
198
|
+
});
|
|
199
|
+
|
|
200
|
+
test("explicit empty-model recording does not double-count the aggregate", () => {
|
|
201
|
+
// When a caller passes an empty model string (degenerate case), the
|
|
202
|
+
// aggregate update path must not run — otherwise the sample would be
|
|
203
|
+
// folded into the EWMA twice and the ratio would be wrong.
|
|
204
|
+
recordEstimate("anthropic", "", 100_000, 120_000);
|
|
205
|
+
// Exactly one sample applied.
|
|
206
|
+
const snap = getCalibrationSnapshot().filter(
|
|
207
|
+
(e) => e.provider === "anthropic" && e.model === "",
|
|
208
|
+
);
|
|
209
|
+
expect(snap).toHaveLength(1);
|
|
210
|
+
expect(snap[0].samples).toBe(1);
|
|
211
|
+
expect(snap[0].ratio).toBeCloseTo(1.2, 5);
|
|
212
|
+
});
|
|
213
|
+
});
|
|
@@ -16,7 +16,7 @@ import { homedir } from "node:os";
|
|
|
16
16
|
import { join, resolve } from "node:path";
|
|
17
17
|
import { describe, expect, test } from "bun:test";
|
|
18
18
|
|
|
19
|
-
import {
|
|
19
|
+
import { getAllowedExtensionOrigins } from "../runtime/routes/browser-extension-pair-routes.js";
|
|
20
20
|
|
|
21
21
|
const repoRoot = resolve(__dirname, "..", "..", "..");
|
|
22
22
|
const CANONICAL_CONFIG_REL_PATH =
|
|
@@ -41,11 +41,15 @@ function parseCanonicalConfig(): AllowlistConfig {
|
|
|
41
41
|
const parsed = JSON.parse(raw) as Partial<AllowlistConfig>;
|
|
42
42
|
|
|
43
43
|
if (!Number.isInteger(parsed.version) || (parsed.version ?? 0) <= 0) {
|
|
44
|
-
throw new Error(
|
|
44
|
+
throw new Error(
|
|
45
|
+
"Invalid canonical config: version must be a positive integer",
|
|
46
|
+
);
|
|
45
47
|
}
|
|
46
48
|
|
|
47
49
|
if (!Array.isArray(parsed.allowedExtensionIds)) {
|
|
48
|
-
throw new Error(
|
|
50
|
+
throw new Error(
|
|
51
|
+
"Invalid canonical config: allowedExtensionIds must be an array",
|
|
52
|
+
);
|
|
49
53
|
}
|
|
50
54
|
|
|
51
55
|
if (parsed.allowedExtensionIds.length === 0) {
|
|
@@ -95,6 +99,7 @@ function listTextFilesRecursively(root: string): string[] {
|
|
|
95
99
|
".turbo",
|
|
96
100
|
".idea",
|
|
97
101
|
".vscode",
|
|
102
|
+
".codex-worktrees",
|
|
98
103
|
]);
|
|
99
104
|
|
|
100
105
|
const allowedExtensions = new Set([
|
|
@@ -171,7 +176,7 @@ describe("Chrome extension allowlist guard", () => {
|
|
|
171
176
|
const config = parseCanonicalConfig();
|
|
172
177
|
for (const id of config.allowedExtensionIds) {
|
|
173
178
|
const origin = `chrome-extension://${id}/`;
|
|
174
|
-
expect(
|
|
179
|
+
expect(getAllowedExtensionOrigins().has(origin)).toBe(true);
|
|
175
180
|
}
|
|
176
181
|
});
|
|
177
182
|
|
|
@@ -193,15 +198,23 @@ describe("Chrome extension allowlist guard", () => {
|
|
|
193
198
|
const expectedOrigins = new Set(
|
|
194
199
|
config.allowedExtensionIds.map((id) => `chrome-extension://${id}/`),
|
|
195
200
|
);
|
|
196
|
-
expect(new Set(
|
|
201
|
+
expect(new Set(getAllowedExtensionOrigins())).toEqual(expectedOrigins);
|
|
197
202
|
});
|
|
198
203
|
|
|
199
|
-
test("concrete extension IDs appear only in canonical config", () => {
|
|
204
|
+
test("concrete extension IDs appear only in canonical config or CWS URLs", () => {
|
|
205
|
+
// The canonical extension ID may also appear inside Chrome Web Store URLs
|
|
206
|
+
// (e.g. chromewebstore.google.com/detail/.../ID), such as links in
|
|
207
|
+
// documentation for the published extension. Those are acceptable — they
|
|
208
|
+
// point at the published extension rather than duplicating config. We flag
|
|
209
|
+
// files where the ID appears outside of a CWS URL context.
|
|
200
210
|
const config = parseCanonicalConfig();
|
|
201
211
|
const allFiles = listTextFilesRecursively(repoRoot);
|
|
202
212
|
|
|
213
|
+
const CWS_URL_PATTERN =
|
|
214
|
+
/chromewebstore\.google\.com\/detail\/[^/]+\/[a-p]{32}/g;
|
|
215
|
+
|
|
203
216
|
for (const extensionId of config.allowedExtensionIds) {
|
|
204
|
-
const
|
|
217
|
+
const unexpectedMatches: string[] = [];
|
|
205
218
|
for (const absPath of allFiles) {
|
|
206
219
|
const relPath = absPath.replace(`${repoRoot}/`, "");
|
|
207
220
|
let content: string;
|
|
@@ -212,11 +225,17 @@ describe("Chrome extension allowlist guard", () => {
|
|
|
212
225
|
if ((err as NodeJS.ErrnoException).code === "ENOENT") continue;
|
|
213
226
|
throw err;
|
|
214
227
|
}
|
|
215
|
-
if (content.includes(extensionId))
|
|
216
|
-
|
|
228
|
+
if (!content.includes(extensionId)) continue;
|
|
229
|
+
if (relPath === CANONICAL_CONFIG_REL_PATH) continue;
|
|
230
|
+
|
|
231
|
+
// Strip all CWS URLs and check if the ID still appears — if it
|
|
232
|
+
// does, the file is using the ID as a standalone config value.
|
|
233
|
+
const stripped = content.replace(CWS_URL_PATTERN, "");
|
|
234
|
+
if (stripped.includes(extensionId)) {
|
|
235
|
+
unexpectedMatches.push(relPath);
|
|
217
236
|
}
|
|
218
237
|
}
|
|
219
|
-
expect(
|
|
238
|
+
expect(unexpectedMatches).toEqual([]);
|
|
220
239
|
}
|
|
221
240
|
});
|
|
222
241
|
});
|
|
@@ -1,5 +1,6 @@
|
|
|
1
1
|
import {
|
|
2
2
|
existsSync,
|
|
3
|
+
mkdirSync,
|
|
3
4
|
mkdtempSync,
|
|
4
5
|
readFileSync,
|
|
5
6
|
realpathSync,
|
|
@@ -8,8 +9,47 @@ import {
|
|
|
8
9
|
} from "node:fs";
|
|
9
10
|
import { tmpdir } from "node:os";
|
|
10
11
|
import { join } from "node:path";
|
|
11
|
-
import {
|
|
12
|
+
import {
|
|
13
|
+
afterEach,
|
|
14
|
+
beforeAll,
|
|
15
|
+
beforeEach,
|
|
16
|
+
describe,
|
|
17
|
+
expect,
|
|
18
|
+
mock,
|
|
19
|
+
test,
|
|
20
|
+
} from "bun:test";
|
|
21
|
+
|
|
22
|
+
// Track calls to enqueuePkbIndexJob across tests. Captured via mock.module
|
|
23
|
+
// below; individual tests clear and inspect the array.
|
|
24
|
+
const enqueueCalls: Array<{
|
|
25
|
+
pkbRoot: string;
|
|
26
|
+
absPath: string;
|
|
27
|
+
memoryScopeId: string;
|
|
28
|
+
}> = [];
|
|
29
|
+
let enqueueThrows = false;
|
|
12
30
|
|
|
31
|
+
mock.module("../memory/jobs/embed-pkb-file.js", () => ({
|
|
32
|
+
enqueuePkbIndexJob: (input: {
|
|
33
|
+
pkbRoot: string;
|
|
34
|
+
absPath: string;
|
|
35
|
+
memoryScopeId: string;
|
|
36
|
+
}) => {
|
|
37
|
+
if (enqueueThrows) {
|
|
38
|
+
throw new Error("simulated enqueue failure");
|
|
39
|
+
}
|
|
40
|
+
enqueueCalls.push(input);
|
|
41
|
+
return "job-id";
|
|
42
|
+
},
|
|
43
|
+
}));
|
|
44
|
+
|
|
45
|
+
// Override workspace dir via VELLUM_WORKSPACE_DIR so PKB-root detection
|
|
46
|
+
// targets a temp directory without having to mock platform.js wholesale
|
|
47
|
+
// (which would destabilize the rest of the tool registry's dependency tree).
|
|
48
|
+
function setWorkspaceDir(dir: string): void {
|
|
49
|
+
process.env.VELLUM_WORKSPACE_DIR = dir;
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
import { PKB_WORKSPACE_SCOPE } from "../memory/pkb/types.js";
|
|
13
53
|
import { getTool } from "../tools/registry.js";
|
|
14
54
|
import type { Tool, ToolContext } from "../tools/types.js";
|
|
15
55
|
|
|
@@ -35,6 +75,24 @@ afterEach(() => {
|
|
|
35
75
|
}
|
|
36
76
|
});
|
|
37
77
|
|
|
78
|
+
const originalWorkspaceDirEnv = process.env.VELLUM_WORKSPACE_DIR;
|
|
79
|
+
|
|
80
|
+
beforeEach(() => {
|
|
81
|
+
enqueueCalls.length = 0;
|
|
82
|
+
enqueueThrows = false;
|
|
83
|
+
// Reset to a stable tmp path so the sandbox tests (which don't use pkb/)
|
|
84
|
+
// deterministically land outside any configured PKB root.
|
|
85
|
+
process.env.VELLUM_WORKSPACE_DIR = tmpdir();
|
|
86
|
+
});
|
|
87
|
+
|
|
88
|
+
afterEach(() => {
|
|
89
|
+
if (originalWorkspaceDirEnv === undefined) {
|
|
90
|
+
delete process.env.VELLUM_WORKSPACE_DIR;
|
|
91
|
+
} else {
|
|
92
|
+
process.env.VELLUM_WORKSPACE_DIR = originalWorkspaceDirEnv;
|
|
93
|
+
}
|
|
94
|
+
});
|
|
95
|
+
|
|
38
96
|
function makeTempDir(): string {
|
|
39
97
|
const dir = realpathSync(mkdtempSync(join(tmpdir(), "file-write-test-")));
|
|
40
98
|
testDirs.push(dir);
|
|
@@ -118,3 +176,95 @@ describe("file_write tool (sandbox)", () => {
|
|
|
118
176
|
expect(result.content).toContain("exceeds");
|
|
119
177
|
});
|
|
120
178
|
});
|
|
179
|
+
|
|
180
|
+
describe("file_write tool PKB re-index hook", () => {
|
|
181
|
+
test("enqueues a PKB re-index job when writing under pkb/", async () => {
|
|
182
|
+
const workingDir = makeTempDir();
|
|
183
|
+
setWorkspaceDir(workingDir);
|
|
184
|
+
mkdirSync(join(workingDir, "pkb"), { recursive: true });
|
|
185
|
+
|
|
186
|
+
const result = await fileWriteTool.execute(
|
|
187
|
+
{ path: "pkb/note.md", content: "# hello\nworld\n" },
|
|
188
|
+
makeContext(workingDir),
|
|
189
|
+
);
|
|
190
|
+
|
|
191
|
+
expect(result.isError).toBe(false);
|
|
192
|
+
expect(enqueueCalls).toHaveLength(1);
|
|
193
|
+
expect(enqueueCalls[0]).toEqual({
|
|
194
|
+
pkbRoot: join(workingDir, "pkb"),
|
|
195
|
+
absPath: join(workingDir, "pkb", "note.md"),
|
|
196
|
+
memoryScopeId: PKB_WORKSPACE_SCOPE,
|
|
197
|
+
});
|
|
198
|
+
});
|
|
199
|
+
|
|
200
|
+
test("always uses PKB_WORKSPACE_SCOPE regardless of context.memoryScopeId", async () => {
|
|
201
|
+
const workingDir = makeTempDir();
|
|
202
|
+
setWorkspaceDir(workingDir);
|
|
203
|
+
mkdirSync(join(workingDir, "pkb"), { recursive: true });
|
|
204
|
+
|
|
205
|
+
const ctx: ToolContext = {
|
|
206
|
+
...makeContext(workingDir),
|
|
207
|
+
memoryScopeId: "private:abc123",
|
|
208
|
+
};
|
|
209
|
+
|
|
210
|
+
const result = await fileWriteTool.execute(
|
|
211
|
+
{ path: "pkb/private.md", content: "secret\n" },
|
|
212
|
+
ctx,
|
|
213
|
+
);
|
|
214
|
+
|
|
215
|
+
expect(result.isError).toBe(false);
|
|
216
|
+
expect(enqueueCalls).toHaveLength(1);
|
|
217
|
+
// PKB files are workspace-level — the per-conversation scopeId is NOT
|
|
218
|
+
// threaded through so different conversations can't overwrite each
|
|
219
|
+
// other's Qdrant points via target_id upsert deduplication.
|
|
220
|
+
expect(enqueueCalls[0]?.memoryScopeId).toBe(PKB_WORKSPACE_SCOPE);
|
|
221
|
+
});
|
|
222
|
+
|
|
223
|
+
test("does NOT enqueue when writing outside pkb/", async () => {
|
|
224
|
+
const workingDir = makeTempDir();
|
|
225
|
+
setWorkspaceDir(workingDir);
|
|
226
|
+
|
|
227
|
+
const result = await fileWriteTool.execute(
|
|
228
|
+
{ path: "notes.md", content: "# not pkb\n" },
|
|
229
|
+
makeContext(workingDir),
|
|
230
|
+
);
|
|
231
|
+
|
|
232
|
+
expect(result.isError).toBe(false);
|
|
233
|
+
expect(enqueueCalls).toHaveLength(0);
|
|
234
|
+
});
|
|
235
|
+
|
|
236
|
+
test("does NOT enqueue for a sibling directory whose name is a pkb prefix", async () => {
|
|
237
|
+
// Guard against `<root>/pkbsomethingelse` being treated as inside `<root>/pkb`.
|
|
238
|
+
const workingDir = makeTempDir();
|
|
239
|
+
setWorkspaceDir(workingDir);
|
|
240
|
+
mkdirSync(join(workingDir, "pkbsibling"), { recursive: true });
|
|
241
|
+
|
|
242
|
+
const result = await fileWriteTool.execute(
|
|
243
|
+
{ path: "pkbsibling/file.md", content: "not pkb\n" },
|
|
244
|
+
makeContext(workingDir),
|
|
245
|
+
);
|
|
246
|
+
|
|
247
|
+
expect(result.isError).toBe(false);
|
|
248
|
+
expect(enqueueCalls).toHaveLength(0);
|
|
249
|
+
});
|
|
250
|
+
|
|
251
|
+
test("enqueue failure is swallowed and write result stays successful", async () => {
|
|
252
|
+
const workingDir = makeTempDir();
|
|
253
|
+
setWorkspaceDir(workingDir);
|
|
254
|
+
mkdirSync(join(workingDir, "pkb"), { recursive: true });
|
|
255
|
+
enqueueThrows = true;
|
|
256
|
+
|
|
257
|
+
const result = await fileWriteTool.execute(
|
|
258
|
+
{ path: "pkb/oops.md", content: "still writes\n" },
|
|
259
|
+
makeContext(workingDir),
|
|
260
|
+
);
|
|
261
|
+
|
|
262
|
+
expect(result.isError).toBe(false);
|
|
263
|
+
// The mock throws, so nothing gets pushed to enqueueCalls. The critical
|
|
264
|
+
// behavior is that the thrown error never surfaces through execute().
|
|
265
|
+
expect(enqueueCalls).toHaveLength(0);
|
|
266
|
+
expect(
|
|
267
|
+
existsSync(join(workingDir, "pkb", "oops.md")),
|
|
268
|
+
).toBe(true);
|
|
269
|
+
});
|
|
270
|
+
});
|