@vellumai/assistant 0.8.4 → 0.8.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/ARCHITECTURE.md +2 -2
- package/docs/browser-use-architecture-phase2.md +1 -1
- package/knip.json +2 -1
- package/openapi.yaml +809 -11
- package/package.json +1 -1
- package/src/__tests__/anthropic-provider.test.ts +34 -37
- package/src/__tests__/assistant-event-hub-self-exclusion.test.ts +293 -0
- package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -3
- package/src/__tests__/audit-log-rotation.test.ts +70 -16
- package/src/__tests__/background-workers-disk-pressure.test.ts +3 -3
- package/src/__tests__/btw-routes.test.ts +2 -3
- package/src/__tests__/call-controller.test.ts +0 -1
- package/src/__tests__/cancel-resolves-conversation-key.test.ts +1 -1
- package/src/__tests__/channel-guardian.test.ts +3 -3
- package/src/__tests__/checker.test.ts +6 -15
- package/src/__tests__/compaction-events.test.ts +1 -0
- package/src/__tests__/compactor-call-site-logging.test.ts +214 -0
- package/src/__tests__/computer-use-skill-manifest-regression.test.ts +5 -11
- package/src/__tests__/computer-use-tools.test.ts +2 -4
- package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
- package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +1 -1
- package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
- package/src/__tests__/conversation-agent-loop-overflow.test.ts +197 -2
- package/src/__tests__/conversation-agent-loop.test.ts +163 -122
- package/src/__tests__/conversation-app-control-instantiation.test.ts +2 -5
- package/src/__tests__/conversation-clear-safety.test.ts +25 -25
- package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +1 -1
- package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
- package/src/__tests__/conversation-error.test.ts +31 -0
- package/src/__tests__/conversation-fork-crud.test.ts +178 -15
- package/src/__tests__/conversation-lifecycle.test.ts +52 -11
- package/src/__tests__/{conversation-load-cleaned-at.test.ts → conversation-load-history-stripped.test.ts} +13 -13
- package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
- package/src/__tests__/conversation-routes-disk-view.test.ts +109 -0
- package/src/__tests__/conversation-routes-slash-commands.test.ts +35 -0
- package/src/__tests__/conversation-skill-tools.test.ts +2 -5
- package/src/__tests__/conversation-store.test.ts +1 -1
- package/src/__tests__/conversation-sync-tags.test.ts +99 -32
- package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -0
- package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
- package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
- package/src/__tests__/credential-execution-feature-gates.test.ts +9 -7
- package/src/__tests__/credential-execution-tools.test.ts +6 -6
- package/src/__tests__/credential-security-invariants.test.ts +1 -0
- package/src/__tests__/credential-vault-unit.test.ts +2 -2
- package/src/__tests__/dynamic-page-surface.test.ts +2 -2
- package/src/__tests__/email-html-renderer.test.ts +12 -0
- package/src/__tests__/gateway-flag-listener.test.ts +237 -0
- package/src/__tests__/gemini-provider.test.ts +78 -0
- package/src/__tests__/guardian-dispatch.test.ts +0 -1
- package/src/__tests__/guardian-outbound-http.test.ts +7 -5
- package/src/__tests__/handlers-user-message-approval-consumption.test.ts +1 -1
- package/src/__tests__/heartbeat-disk-pressure.test.ts +4 -0
- package/src/__tests__/heartbeat-service.test.ts +4 -0
- package/src/__tests__/host-shell-tool.test.ts +1 -1
- package/src/__tests__/init-feature-flag-overrides.test.ts +5 -6
- package/src/__tests__/list-messages-tool-merge.test.ts +70 -11
- package/src/__tests__/llm-request-log-call-site.test.ts +136 -0
- package/src/__tests__/llm-request-log-source-clickhouse.test.ts +26 -0
- package/src/__tests__/llm-resolver.test.ts +77 -9
- package/src/__tests__/llm-usage-store.test.ts +66 -0
- package/src/__tests__/logger.test.ts +89 -0
- package/src/__tests__/mcp-abort-signal.test.ts +2 -2
- package/src/__tests__/media-generate-image.test.ts +31 -0
- package/src/__tests__/memory-v2-static-injector.test.ts +7 -7
- package/src/__tests__/model-intents.test.ts +2 -4
- package/src/__tests__/notification-guardian-path.test.ts +0 -1
- package/src/__tests__/onboarding-template-contract.test.ts +1 -1
- package/src/__tests__/openai-provider.test.ts +46 -0
- package/src/__tests__/openai-responses-provider.test.ts +114 -12
- package/src/__tests__/pending-interactions-resolved-event.test.ts +0 -1
- package/src/__tests__/platform-bash-auto-approve.test.ts +2 -2
- package/src/__tests__/platform.test.ts +2 -2
- package/src/__tests__/plugin-api-tool-definition.test.ts +92 -0
- package/src/__tests__/plugin-bootstrap.test.ts +2 -2
- package/src/__tests__/plugin-tool-contribution.test.ts +13 -6
- package/src/__tests__/plugin-types.test.ts +3 -2
- package/src/__tests__/prechat-onboarding-contract.test.ts +131 -98
- package/src/__tests__/pricing.test.ts +12 -0
- package/src/__tests__/prune-jobs-changes-parser.test.ts +61 -0
- package/src/__tests__/registry.test.ts +2 -8
- package/src/__tests__/require-fresh-approval.test.ts +2 -2
- package/src/__tests__/runtime-events-sse-bilingual.test.ts +154 -0
- package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -1
- package/src/__tests__/skill-feature-flags.test.ts +2 -2
- package/src/__tests__/skill-projection-feature-flag.test.ts +4 -7
- package/src/__tests__/skill-projection.benchmark.test.ts +2 -6
- package/src/__tests__/skill-tool-factory.test.ts +1 -1
- package/src/__tests__/subagent-notify-parent.test.ts +1 -1
- package/src/__tests__/suggestion-routes.test.ts +1 -0
- package/src/__tests__/sync-message-contract.test.ts +59 -0
- package/src/__tests__/system-prompt.test.ts +145 -131
- package/src/__tests__/terminal-tools.test.ts +1 -1
- package/src/__tests__/tool-approval-handler.test.ts +1 -5
- package/src/__tests__/tool-execute-pipeline.test.ts +2 -2
- package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -5
- package/src/__tests__/tool-executor-lifecycle-events.test.ts +15 -5
- package/src/__tests__/tool-executor.test.ts +9 -62
- package/src/__tests__/tool-grant-request-escalation.test.ts +1 -6
- package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
- package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -6
- package/src/__tests__/trusted-contact-multichannel.test.ts +0 -1
- package/src/__tests__/ui-file-upload-surface.test.ts +2 -2
- package/src/__tests__/usage-routes.test.ts +3 -0
- package/src/__tests__/verification-control-plane-policy.test.ts +2 -2
- package/src/__tests__/workspace-git-service.test.ts +6 -5
- package/src/__tests__/workspace-migration-089-move-memory-tree-out-of-v3.test.ts +86 -0
- package/src/acp/__tests__/prepare-agent-env.test.ts +146 -0
- package/src/acp/prepare-agent-env.ts +78 -0
- package/src/acp/session-manager.ts +1 -1
- package/src/agent/loop.ts +8 -0
- package/src/api/README.md +5 -0
- package/src/api/index.ts +4 -0
- package/src/api/package.json +10 -0
- package/src/background-wake/background-wake-routes.test.ts +233 -0
- package/src/background-wake/runtime-registry.ts +24 -0
- package/src/cli/commands/__tests__/browser.test.ts +23 -5
- package/src/cli/commands/__tests__/domain-register.test.ts +110 -0
- package/src/cli/commands/__tests__/domain-status.test.ts +33 -33
- package/src/cli/commands/__tests__/inference-send.test.ts +108 -5
- package/src/cli/commands/__tests__/memory-v2-compare-render.test.ts +98 -0
- package/src/cli/commands/__tests__/memory-v2.test.ts +1 -0
- package/src/cli/commands/__tests__/memory-v3-render.test.ts +340 -0
- package/src/cli/commands/browser.ts +247 -0
- package/src/cli/commands/domain.ts +91 -41
- package/src/cli/commands/inference.ts +93 -40
- package/src/cli/commands/memory-v2-compare-render.ts +115 -0
- package/src/cli/commands/memory-v2.ts +176 -1
- package/src/cli/commands/memory-v3-render.ts +344 -0
- package/src/cli/commands/memory-v3.ts +316 -0
- package/src/cli/program.ts +2 -0
- package/src/config/assistant-feature-flags.ts +21 -9
- package/src/config/bundled-skills/document-editor/SKILL.md +11 -2
- package/src/config/bundled-skills/document-editor/TOOLS.json +18 -0
- package/src/config/bundled-skills/document-editor/tools/document-open.ts +12 -0
- package/src/config/bundled-skills/image-studio/SKILL.md +4 -0
- package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -2
- package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +13 -8
- package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +10 -3
- package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +16 -14
- package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +7 -2
- package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +7 -2
- package/src/config/bundled-tool-registry.ts +2 -0
- package/src/config/call-site-defaults.ts +7 -6
- package/src/config/feature-flag-registry.json +16 -0
- package/src/config/schemas/__tests__/memory-v2.test.ts +213 -1
- package/src/config/schemas/call-site-catalog.ts +21 -7
- package/src/config/schemas/llm.ts +12 -1
- package/src/config/schemas/memory-v2.ts +246 -0
- package/src/config/schemas/memory.ts +2 -1
- package/src/context/compactor.ts +52 -0
- package/src/conversations/__tests__/message-consolidation.test.ts +350 -0
- package/src/conversations/message-consolidation.ts +404 -0
- package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +1 -1
- package/src/daemon/__tests__/meet-manifest-loader.test.ts +1 -1
- package/src/daemon/conversation-agent-loop-handlers.ts +2 -13
- package/src/daemon/conversation-agent-loop.ts +126 -76
- package/src/daemon/conversation-error.ts +31 -1
- package/src/daemon/conversation-lifecycle.ts +27 -22
- package/src/daemon/conversation-runtime-assembly.ts +10 -9
- package/src/daemon/conversation-tool-setup.ts +63 -3
- package/src/daemon/conversation-usage.ts +2 -0
- package/src/daemon/conversation.ts +14 -29
- package/src/daemon/disk-pressure-guard.ts +14 -2
- package/src/daemon/handlers/config-model.test.ts +1 -0
- package/src/daemon/handlers/conversations.ts +11 -3
- package/src/daemon/host-browser-proxy.ts +5 -5
- package/src/daemon/host-cu-proxy.ts +4 -4
- package/src/daemon/host-file-proxy.ts +4 -4
- package/src/daemon/host-proxy-base.ts +4 -4
- package/src/daemon/host-transfer-proxy.ts +10 -10
- package/src/daemon/lifecycle.ts +23 -20
- package/src/daemon/meet-manifest-loader.ts +1 -7
- package/src/daemon/message-types/conversations.ts +6 -9
- package/src/daemon/message-types/home.ts +1 -13
- package/src/daemon/message-types/messages.ts +6 -14
- package/src/daemon/message-types/sync.ts +14 -0
- package/src/daemon/shutdown-handlers.ts +24 -5
- package/src/daemon/switch-inference-profile-tool.ts +52 -0
- package/src/daemon/tool-setup-types.ts +13 -0
- package/src/events/relationship-state-updated.ts +25 -0
- package/src/heartbeat/__tests__/heartbeat-service.test.ts +1 -1
- package/src/home/home-greeting.ts +0 -9
- package/src/home/suggested-prompts.ts +0 -9
- package/src/ipc/gateway-flag-listener.ts +123 -0
- package/src/ipc/skill-routes/registries.ts +8 -12
- package/src/memory/__tests__/db-async-query.test.ts +165 -0
- package/src/memory/__tests__/db-maintenance.test.ts +115 -0
- package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +241 -0
- package/src/memory/__tests__/jobs-store-job-classes.test.ts +28 -1
- package/src/memory/__tests__/memory-retrospective-job.test.ts +7 -0
- package/src/memory/auto-analysis-enqueue.ts +5 -1
- package/src/memory/conversation-crud.ts +71 -70
- package/src/memory/conversation-starters-cadence.ts +3 -1
- package/src/memory/conversation-title-service.ts +19 -3
- package/src/memory/db-async-query.ts +214 -0
- package/src/memory/db-init.ts +10 -0
- package/src/memory/db-maintenance.ts +30 -21
- package/src/memory/graph/bootstrap.ts +8 -1
- package/src/memory/graph/capability-seed.ts +7 -3
- package/src/memory/graph/conversation-graph-memory.ts +100 -17
- package/src/memory/graph/extraction.ts +1 -5
- package/src/memory/graph/graph-search.ts +7 -1
- package/src/memory/indexer.ts +28 -18
- package/src/memory/job-handlers/cleanup.ts +76 -18
- package/src/memory/job-handlers/conversation-starters.ts +1 -4
- package/src/memory/jobs/embed-pkb-file.ts +6 -1
- package/src/memory/jobs-store.ts +14 -0
- package/src/memory/jobs-worker.ts +55 -22
- package/src/memory/llm-request-log-source-clickhouse.ts +42 -2
- package/src/memory/llm-request-log-source-local.ts +7 -0
- package/src/memory/llm-request-log-source.ts +9 -2
- package/src/memory/llm-request-log-store.ts +43 -1
- package/src/memory/llm-usage-store.ts +24 -0
- package/src/memory/memory-retrospective-enqueue.ts +8 -1
- package/src/memory/memory-retrospective-job.ts +5 -0
- package/src/memory/memory-v2-activation-log-store.ts +15 -6
- package/src/memory/migrations/260-rename-cleaned-at.ts +44 -0
- package/src/memory/migrations/261-llm-usage-add-raw-usage.ts +36 -0
- package/src/memory/migrations/262-memory-v3-coactivation.ts +57 -0
- package/src/memory/migrations/263-memory-v3-auto-edges.ts +50 -0
- package/src/memory/migrations/264-llm-request-log-call-site.ts +29 -0
- package/src/memory/migrations/index.ts +17 -0
- package/src/memory/migrations/registry.ts +33 -0
- package/src/memory/schema/conversations.ts +1 -1
- package/src/memory/schema/infrastructure.ts +21 -0
- package/src/memory/tool-usage-store.ts +36 -8
- package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -0
- package/src/memory/v2/__tests__/harness-compare.test.ts +186 -0
- package/src/memory/v2/__tests__/harness-metrics.test.ts +74 -0
- package/src/memory/v2/__tests__/harness-oracle.test.ts +257 -0
- package/src/memory/v2/__tests__/harness-replay-input.test.ts +225 -0
- package/src/memory/v2/__tests__/harness-runner.test.ts +109 -0
- package/src/memory/v2/__tests__/injection.test.ts +127 -98
- package/src/memory/v2/__tests__/qdrant.test.ts +36 -0
- package/src/memory/v2/__tests__/router.test.ts +171 -3
- package/src/memory/v2/harness/compare.ts +57 -0
- package/src/memory/v2/harness/metrics.ts +124 -0
- package/src/memory/v2/harness/oracle.ts +145 -0
- package/src/memory/v2/harness/replay-input.ts +224 -0
- package/src/memory/v2/harness/retriever.ts +74 -0
- package/src/memory/v2/harness/router-retriever.ts +43 -0
- package/src/memory/v2/harness/runner.ts +106 -0
- package/src/memory/v2/harness/trace.ts +58 -0
- package/src/memory/v2/injection.ts +21 -15
- package/src/memory/v2/prompts/router.ts +26 -1
- package/src/memory/v2/qdrant.ts +14 -2
- package/src/memory/v2/router.ts +171 -18
- package/src/memory/v3/__tests__/coactivation-store.test.ts +422 -0
- package/src/memory/v3/__tests__/consolidation-job.test.ts +468 -0
- package/src/memory/v3/__tests__/edge-learning-job.test.ts +324 -0
- package/src/memory/v3/__tests__/edges.test.ts +563 -0
- package/src/memory/v3/__tests__/filter.test.ts +512 -0
- package/src/memory/v3/__tests__/gate.test.ts +574 -0
- package/src/memory/v3/__tests__/index-composition.test.ts +233 -0
- package/src/memory/v3/__tests__/loop.test.ts +530 -0
- package/src/memory/v3/__tests__/retriever.test.ts +226 -0
- package/src/memory/v3/__tests__/scouts.test.ts +440 -0
- package/src/memory/v3/__tests__/shadow-middleware.test.ts +312 -0
- package/src/memory/v3/__tests__/system-prompts.test.ts +154 -0
- package/src/memory/v3/__tests__/traversal.test.ts +469 -0
- package/src/memory/v3/__tests__/tree-index.test.ts +280 -0
- package/src/memory/v3/__tests__/tree-store.test.ts +529 -0
- package/src/memory/v3/__tests__/tree-walk.test.ts +707 -0
- package/src/memory/v3/__tests__/validate.test.ts +245 -0
- package/src/memory/v3/auto-edges.ts +223 -0
- package/src/memory/v3/coactivation-store.ts +124 -0
- package/src/memory/v3/consolidation-job.ts +323 -0
- package/src/memory/v3/edge-learning-job.ts +160 -0
- package/src/memory/v3/edges.ts +249 -0
- package/src/memory/v3/filter.ts +281 -0
- package/src/memory/v3/gate.ts +334 -0
- package/src/memory/v3/index-composition.ts +113 -0
- package/src/memory/v3/llm-capture.ts +46 -0
- package/src/memory/v3/loop.ts +382 -0
- package/src/memory/v3/maintenance.ts +144 -0
- package/src/memory/v3/prompt-context.ts +33 -0
- package/src/memory/v3/prompts/consolidation.ts +458 -0
- package/src/memory/v3/prompts/system-prompts.ts +196 -0
- package/src/memory/v3/retriever.ts +33 -0
- package/src/memory/v3/scouts.ts +420 -0
- package/src/memory/v3/shadow-middleware.ts +305 -0
- package/src/memory/v3/traversal.ts +206 -0
- package/src/memory/v3/tree-index.ts +237 -0
- package/src/memory/v3/tree-store.ts +394 -0
- package/src/memory/v3/tree-walk.ts +351 -0
- package/src/memory/v3/types.ts +65 -0
- package/src/memory/v3/validate.ts +300 -0
- package/src/notifications/adapters/macos.ts +18 -1
- package/src/notifications/adapters/platform.ts +1 -1
- package/src/notifications/decision-engine.ts +1 -4
- package/src/notifications/emit-signal.ts +29 -49
- package/src/permissions/prompter.ts +3 -3
- package/src/permissions/question-prompter.ts +5 -2
- package/src/permissions/secret-prompter.ts +2 -2
- package/src/plugin-api/index.ts +4 -0
- package/src/plugin-api/types.ts +7 -33
- package/src/plugins/defaults/index.ts +6 -0
- package/src/plugins/defaults/injectors.ts +18 -11
- package/src/plugins/external-plugin-loader.ts +5 -68
- package/src/plugins/types.ts +11 -16
- package/src/proactive-artifact/aux-message-injector.ts +17 -4
- package/src/prompts/__tests__/task-progress-hint-section.test.ts +3 -9
- package/src/prompts/persona-resolver.ts +36 -21
- package/src/prompts/sections.ts +39 -7
- package/src/prompts/system-prompt.ts +50 -185
- package/src/prompts/templates/BOOTSTRAP.md +2 -2
- package/src/prompts/templates/system-sections.ts +230 -8
- package/src/providers/__tests__/connection-model-compat.test.ts +234 -0
- package/src/providers/__tests__/retry-callsite.test.ts +85 -5
- package/src/providers/anthropic/client.ts +32 -66
- package/src/providers/call-site-routing.ts +14 -2
- package/src/providers/connection-model-compat.ts +38 -0
- package/src/providers/connection-resolution.ts +16 -2
- package/src/providers/gemini/client.ts +49 -6
- package/src/providers/inference/adapter-factory.ts +3 -0
- package/src/providers/minimax/client.ts +106 -0
- package/src/providers/model-catalog.ts +43 -0
- package/src/providers/model-intents.ts +1 -1
- package/src/providers/openai/chat-completions-provider.ts +6 -3
- package/src/providers/openai/codex-models.ts +18 -0
- package/src/providers/openai/responses-provider.ts +78 -21
- package/src/providers/provider-send-message.ts +7 -1
- package/src/providers/retry.ts +34 -3
- package/src/providers/thinking-config.ts +26 -1
- package/src/providers/usage-tracking.ts +2 -0
- package/src/runtime/AGENTS.md +2 -2
- package/src/runtime/agent-wake.ts +1 -0
- package/src/runtime/assistant-event-hub.ts +76 -6
- package/src/runtime/auth/route-policy.ts +36 -0
- package/src/runtime/btw-sidechain.ts +0 -6
- package/src/runtime/http-types.ts +0 -2
- package/src/runtime/migrations/vbundle-builder.ts +10 -3
- package/src/runtime/pending-interactions.ts +0 -1
- package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +106 -0
- package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +25 -6
- package/src/runtime/routes/__tests__/plugins-routes.test.ts +512 -0
- package/src/runtime/routes/acp-routes.test.ts +255 -6
- package/src/runtime/routes/acp-routes.ts +8 -1
- package/src/runtime/routes/avatar-routes.ts +10 -10
- package/src/runtime/routes/background-wake-routes.ts +188 -0
- package/src/runtime/routes/browser-tabs-routes.ts +200 -0
- package/src/runtime/routes/btw-routes.ts +0 -6
- package/src/runtime/routes/conversation-cli-routes.ts +1 -1
- package/src/runtime/routes/conversation-list-routes.ts +12 -4
- package/src/runtime/routes/conversation-management-routes.ts +77 -20
- package/src/runtime/routes/conversation-query-routes.ts +142 -36
- package/src/runtime/routes/conversation-routes.ts +252 -410
- package/src/runtime/routes/conversation-starter-routes.ts +6 -3
- package/src/runtime/routes/disk-pressure-routes.ts +1 -1
- package/src/runtime/routes/domain-routes.ts +60 -10
- package/src/runtime/routes/email-routes.ts +5 -2
- package/src/runtime/routes/events-routes.ts +54 -10
- package/src/runtime/routes/group-routes.ts +24 -8
- package/src/runtime/routes/host-browser-routes.ts +10 -2
- package/src/runtime/routes/host-cu-routes.ts +2 -2
- package/src/runtime/routes/inbound-stages/acl-enforcement.ts +96 -3
- package/src/runtime/routes/index.ts +8 -0
- package/src/runtime/routes/inference-profile-session-handler.ts +22 -12
- package/src/runtime/routes/inference-profile-session-routes.ts +7 -1
- package/src/runtime/routes/llm-call-sites-routes.ts +32 -5
- package/src/runtime/routes/memory-item-routes.ts +8 -3
- package/src/runtime/routes/memory-v2-routes.ts +215 -5
- package/src/runtime/routes/memory-v3-routes.ts +316 -0
- package/src/runtime/routes/migration-routes.ts +21 -24
- package/src/runtime/routes/plugins-routes.ts +337 -0
- package/src/runtime/routes/rename-conversation-routes.ts +6 -2
- package/src/runtime/routes/secret-routes.ts +25 -5
- package/src/runtime/routes/settings-routes.ts +12 -11
- package/src/runtime/routes/slack-channel-routes.ts +5 -4
- package/src/runtime/routes/workspace-routes.ts +25 -10
- package/src/runtime/sync/resource-sync-events.ts +106 -38
- package/src/runtime/sync/sync-publisher.test.ts +49 -0
- package/src/runtime/sync/sync-publisher.ts +2 -1
- package/src/runtime/verification-outbound-actions.ts +73 -1
- package/src/telemetry/types.ts +12 -0
- package/src/telemetry/usage-telemetry-reporter.test.ts +48 -0
- package/src/telemetry/usage-telemetry-reporter.ts +1 -0
- package/src/tools/acp/spawn.test.ts +119 -0
- package/src/tools/acp/spawn.ts +15 -2
- package/src/tools/apps/definitions.ts +2 -8
- package/src/tools/ask-question/ask-question-tool.test.ts +3 -3
- package/src/tools/ask-question/ask-question-tool.ts +38 -45
- package/src/tools/browser/__tests__/pinned-tabs.test.ts +70 -0
- package/src/tools/browser/browser-execution.ts +16 -3
- package/src/tools/browser/cdp-client/__tests__/browser-tabs-factory.test.ts +402 -0
- package/src/tools/browser/cdp-client/__tests__/types.test.ts +3 -0
- package/src/tools/browser/cdp-client/cdp-inspect-client.ts +12 -0
- package/src/tools/browser/cdp-client/extension-cdp-client.ts +27 -1
- package/src/tools/browser/cdp-client/factory.ts +100 -17
- package/src/tools/browser/cdp-client/local-cdp-client.ts +12 -0
- package/src/tools/browser/cdp-client/types.ts +65 -0
- package/src/tools/browser/pinned-tabs.ts +96 -40
- package/src/tools/computer-use/definitions.ts +22 -78
- package/src/tools/credential-execution/make-authenticated-request.ts +3 -9
- package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -9
- package/src/tools/credential-execution/run-authenticated-command.ts +3 -9
- package/src/tools/credentials/vault.ts +3 -9
- package/src/tools/document/document-tool.ts +59 -0
- package/src/tools/execution-target.ts +21 -23
- package/src/tools/executor.ts +6 -1
- package/src/tools/filesystem/edit.ts +3 -9
- package/src/tools/filesystem/list.ts +3 -9
- package/src/tools/filesystem/read.ts +3 -9
- package/src/tools/filesystem/write.ts +3 -9
- package/src/tools/host-filesystem/edit.ts +3 -9
- package/src/tools/host-filesystem/read.ts +3 -9
- package/src/tools/host-filesystem/transfer.ts +3 -9
- package/src/tools/host-filesystem/write.ts +3 -9
- package/src/tools/host-terminal/host-shell.ts +3 -9
- package/src/tools/mcp/mcp-tool-factory.ts +1 -8
- package/src/tools/memory/register.test.ts +1 -1
- package/src/tools/memory/register.ts +4 -9
- package/src/tools/network/web-fetch.ts +3 -9
- package/src/tools/network/web-search.ts +25 -32
- package/src/tools/registry.ts +7 -23
- package/src/tools/schema-transforms.ts +1 -1
- package/src/tools/skills/execute.ts +3 -9
- package/src/tools/skills/load.ts +3 -9
- package/src/tools/skills/skill-tool-factory.ts +1 -8
- package/src/tools/subagent/notify-parent.ts +3 -9
- package/src/tools/system/request-permission.ts +3 -9
- package/src/tools/terminal/shell.ts +3 -9
- package/src/tools/tool-defaults.ts +94 -0
- package/src/tools/types.ts +27 -98
- package/src/tools/ui-surface/definitions.ts +6 -22
- package/src/usage/pricing.ts +23 -0
- package/src/usage/types.ts +12 -0
- package/src/util/logger.ts +16 -7
- package/src/util/platform.ts +7 -2
- package/src/util/sqlite3-runtime.ts +65 -0
- package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +1 -0
- package/src/workspace/migrations/089-move-memory-tree-out-of-v3.ts +86 -0
- package/src/workspace/migrations/registry.ts +2 -0
- package/src/__tests__/compaction-strip-metadata-clear.test.ts +0 -206
- package/src/__tests__/message-complete-display-id.test.ts +0 -175
- package/src/daemon/query-complexity-router.ts +0 -75
- package/src/prompts/cache-boundary.ts +0 -8
|
@@ -6,8 +6,8 @@
|
|
|
6
6
|
* rendering, argument validation, and the no-message guard. They run
|
|
7
7
|
* entirely inside the CLI process and need no daemon stub.
|
|
8
8
|
*
|
|
9
|
-
*
|
|
10
|
-
*
|
|
9
|
+
* The IPC client is mocked with canned responses so tests can assert the
|
|
10
|
+
* request contract without opening an assistant socket.
|
|
11
11
|
*/
|
|
12
12
|
|
|
13
13
|
import {
|
|
@@ -23,6 +23,34 @@ import { Command } from "commander";
|
|
|
23
23
|
// ---------------------------------------------------------------------------
|
|
24
24
|
|
|
25
25
|
let mockStdinContent: string | null = null;
|
|
26
|
+
let lastIpcCall: {
|
|
27
|
+
method: string;
|
|
28
|
+
params?: Record<string, unknown>;
|
|
29
|
+
options?: { timeoutMs?: number };
|
|
30
|
+
} | null = null;
|
|
31
|
+
let mockIpcResult: {
|
|
32
|
+
ok: boolean;
|
|
33
|
+
result?: unknown;
|
|
34
|
+
error?: string;
|
|
35
|
+
} = {
|
|
36
|
+
ok: true,
|
|
37
|
+
result: {
|
|
38
|
+
response: "Hello from the model.",
|
|
39
|
+
model: "test-model",
|
|
40
|
+
usage: { inputTokens: 3, outputTokens: 4 },
|
|
41
|
+
},
|
|
42
|
+
};
|
|
43
|
+
|
|
44
|
+
mock.module("../../../ipc/cli-client.js", () => ({
|
|
45
|
+
cliIpcCall: async (
|
|
46
|
+
method: string,
|
|
47
|
+
params?: Record<string, unknown>,
|
|
48
|
+
options?: { timeoutMs?: number },
|
|
49
|
+
) => {
|
|
50
|
+
lastIpcCall = { method, params, options };
|
|
51
|
+
return mockIpcResult;
|
|
52
|
+
},
|
|
53
|
+
}));
|
|
26
54
|
|
|
27
55
|
mock.module("../../../providers/provider-send-message.js", () => ({
|
|
28
56
|
// The handler under test calls getConfiguredProvider before any of the
|
|
@@ -30,7 +58,10 @@ mock.module("../../../providers/provider-send-message.js", () => ({
|
|
|
30
58
|
// loads cleanly even though no test actually drives a request.
|
|
31
59
|
getConfiguredProvider: async () => null,
|
|
32
60
|
extractAllText: () => "",
|
|
33
|
-
userMessage: (text: string) => ({
|
|
61
|
+
userMessage: (text: string) => ({
|
|
62
|
+
role: "user",
|
|
63
|
+
content: [{ type: "text", text }],
|
|
64
|
+
}),
|
|
34
65
|
}));
|
|
35
66
|
|
|
36
67
|
mock.module("../../../config/loader.js", () => ({
|
|
@@ -44,8 +75,18 @@ mock.module("../../../config/loader.js", () => ({
|
|
|
44
75
|
}));
|
|
45
76
|
|
|
46
77
|
mock.module("../../../util/logger.js", () => ({
|
|
47
|
-
getLogger: () => ({
|
|
48
|
-
|
|
78
|
+
getLogger: () => ({
|
|
79
|
+
info: () => {},
|
|
80
|
+
warn: () => {},
|
|
81
|
+
error: () => {},
|
|
82
|
+
debug: () => {},
|
|
83
|
+
}),
|
|
84
|
+
getCliLogger: () => ({
|
|
85
|
+
info: () => {},
|
|
86
|
+
warn: () => {},
|
|
87
|
+
error: () => {},
|
|
88
|
+
debug: () => {},
|
|
89
|
+
}),
|
|
49
90
|
}));
|
|
50
91
|
|
|
51
92
|
mock.module("node:fs", () => ({
|
|
@@ -127,6 +168,15 @@ async function runCommand(
|
|
|
127
168
|
|
|
128
169
|
beforeEach(() => {
|
|
129
170
|
mockStdinContent = null;
|
|
171
|
+
lastIpcCall = null;
|
|
172
|
+
mockIpcResult = {
|
|
173
|
+
ok: true,
|
|
174
|
+
result: {
|
|
175
|
+
response: "Hello from the model.",
|
|
176
|
+
model: "test-model",
|
|
177
|
+
usage: { inputTokens: 3, outputTokens: 4 },
|
|
178
|
+
},
|
|
179
|
+
};
|
|
130
180
|
process.exitCode = 0;
|
|
131
181
|
});
|
|
132
182
|
|
|
@@ -142,6 +192,7 @@ describe("help text", () => {
|
|
|
142
192
|
expect(stdout).toContain("--model");
|
|
143
193
|
expect(stdout).toContain("--profile");
|
|
144
194
|
expect(stdout).toContain("--max-tokens");
|
|
195
|
+
expect(stdout).toContain("--timeout-seconds");
|
|
145
196
|
expect(stdout).toContain("--json");
|
|
146
197
|
expect(stdout).toContain("[message...]");
|
|
147
198
|
});
|
|
@@ -153,6 +204,7 @@ describe("help text", () => {
|
|
|
153
204
|
expect(stdout).toContain("--model");
|
|
154
205
|
expect(stdout).toContain("--profile");
|
|
155
206
|
expect(stdout).toContain("--max-tokens");
|
|
207
|
+
expect(stdout).toContain("--timeout-seconds");
|
|
156
208
|
expect(stdout).toContain("--json");
|
|
157
209
|
expect(stdout).toContain("[message...]");
|
|
158
210
|
});
|
|
@@ -225,3 +277,54 @@ describe("--max-tokens", () => {
|
|
|
225
277
|
expect(parsed.error).toContain("Invalid --max-tokens");
|
|
226
278
|
});
|
|
227
279
|
});
|
|
280
|
+
|
|
281
|
+
// ---------------------------------------------------------------------------
|
|
282
|
+
// IPC timeout
|
|
283
|
+
// ---------------------------------------------------------------------------
|
|
284
|
+
|
|
285
|
+
describe("--timeout-seconds", () => {
|
|
286
|
+
test("uses a long default IPC timeout for inference calls", async () => {
|
|
287
|
+
const { exitCode, stdout } = await runCommand([
|
|
288
|
+
"inference",
|
|
289
|
+
"send",
|
|
290
|
+
"--json",
|
|
291
|
+
"Hello",
|
|
292
|
+
]);
|
|
293
|
+
|
|
294
|
+
expect(exitCode).toBe(0);
|
|
295
|
+
expect(JSON.parse(stdout).ok).toBe(true);
|
|
296
|
+
expect(lastIpcCall!.method).toBe("inference_send");
|
|
297
|
+
expect(lastIpcCall!.options!.timeoutMs).toBe(32 * 60 * 1000);
|
|
298
|
+
});
|
|
299
|
+
|
|
300
|
+
test("passes custom timeout to IPC call", async () => {
|
|
301
|
+
const { exitCode } = await runCommand([
|
|
302
|
+
"llm",
|
|
303
|
+
"send",
|
|
304
|
+
"--timeout-seconds",
|
|
305
|
+
"300",
|
|
306
|
+
"Hello",
|
|
307
|
+
]);
|
|
308
|
+
|
|
309
|
+
expect(exitCode).toBe(0);
|
|
310
|
+
expect(lastIpcCall!.method).toBe("inference_send");
|
|
311
|
+
expect(lastIpcCall!.options!.timeoutMs).toBe(300_000);
|
|
312
|
+
});
|
|
313
|
+
|
|
314
|
+
test("errors on invalid timeout value", async () => {
|
|
315
|
+
const { exitCode, stdout } = await runCommand([
|
|
316
|
+
"inference",
|
|
317
|
+
"send",
|
|
318
|
+
"--timeout-seconds",
|
|
319
|
+
"0",
|
|
320
|
+
"--json",
|
|
321
|
+
"Hello",
|
|
322
|
+
]);
|
|
323
|
+
|
|
324
|
+
expect(exitCode).toBe(1);
|
|
325
|
+
expect(lastIpcCall).toBeNull();
|
|
326
|
+
const parsed = JSON.parse(stdout);
|
|
327
|
+
expect(parsed.ok).toBe(false);
|
|
328
|
+
expect(parsed.error).toContain("Invalid --timeout-seconds");
|
|
329
|
+
});
|
|
330
|
+
});
|
|
@@ -0,0 +1,98 @@
|
|
|
1
|
+
import { describe, expect, test } from "bun:test";
|
|
2
|
+
|
|
3
|
+
import type { ComparisonReport } from "../../../memory/v2/harness/runner.js";
|
|
4
|
+
import {
|
|
5
|
+
renderComparisonReport,
|
|
6
|
+
renderTurnTrace,
|
|
7
|
+
} from "../memory-v2-compare-render.js";
|
|
8
|
+
|
|
9
|
+
/**
 * Builds a new comparison-report fixture on every call (tests mutate it).
 *
 * The fixture has three turns considered, one scored and two skipped. The
 * single scored turn is conversation "c1", turn 7, evaluated by one
 * retriever named "router".
 */
function sampleReport(): ComparisonReport {
  const retrievers: ComparisonReport["retrievers"] = [
    {
      name: "router",
      aggregate: {
        turns: 1,
        meanRecallAtK: { 5: 0.5, 10: 0.5 },
        failureRate: 0,
      },
    },
  ];

  const report: ComparisonReport = {
    ks: [5, 10],
    turnsConsidered: 3,
    turnsScored: 1,
    turnsSkipped: 2,
    perTurn: [
      {
        conversationId: "c1",
        turn: 7,
        byRetriever: {
          // One hit ("a"), one miss ("b"), one extra ("x").
          router: {
            groundTruth: ["a", "b"],
            selected: ["a", "x"],
            hits: ["a"],
            misses: ["b"],
            extras: ["x"],
            recallAtK: { 5: 0.5, 10: 0.5 },
            hitsByLane: { tier1: 1 },
            failureReason: null,
          },
        },
      },
    ],
    retrievers,
  };
  return report;
}
|
|
45
|
+
|
|
46
|
+
// Checks the text produced by renderComparisonReport for the sample fixture,
// for a fixture with a mean cost set, and for a report with zero scored turns.
describe("memory v2 compare — renderComparisonReport", () => {
  test("renders turn counts, recall@k, and per-lane attribution", () => {
    const rendered = renderComparisonReport(sampleReport());
    const expectedFragments = [
      "considered 3, scored 1, skipped 2",
      "Retriever: router",
      "recall@5: 0.500",
      "recall@10: 0.500",
      "failures: 0.0%",
      "hits by lane: tier1=1",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });

  test("renders mean cost when present", () => {
    const report = sampleReport();
    const [router] = report.retrievers;
    router!.aggregate.meanCostUsd = 0.0123;

    const rendered = renderComparisonReport(report);
    expect(rendered).toContain("mean cost: $0.0123");
  });

  test("handles a report with no scored turns", () => {
    // Every considered turn was skipped, so nothing was scored.
    const unscored: ComparisonReport = {
      ks: [5],
      turnsConsidered: 4,
      turnsScored: 0,
      turnsSkipped: 4,
      perTurn: [],
      retrievers: [
        {
          name: "router",
          aggregate: { turns: 0, meanRecallAtK: { 5: 0 }, failureRate: 0 },
        },
      ],
    };

    const rendered = renderComparisonReport(unscored);
    expect(rendered).toContain("No turns scored");
  });
});
|
|
80
|
+
|
|
81
|
+
// Checks renderTurnTrace output for a turn present in the sample fixture
// ("c1", 7) and for a turn number that is absent from it (999).
describe("memory v2 compare — renderTurnTrace", () => {
  test("renders the per-retriever breakdown for a scored turn", () => {
    const rendered = renderTurnTrace(sampleReport(), "c1", 7);
    const expectedFragments = [
      "Turn c1:7",
      "Retriever: router",
      "selected (2): a, x",
      "hits (1): a",
      "misses (1): b",
      "extras (1): x",
      "(no descent trace — tier-based retriever)",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });

  test("explains when the requested turn was not scored", () => {
    const rendered = renderTurnTrace(sampleReport(), "c1", 999);
    for (const fragment of ["not found", "turnsSkipped=2"]) {
      expect(rendered).toContain(fragment);
    }
  });
});
|
|
@@ -0,0 +1,340 @@
|
|
|
1
|
+
import { describe, expect, test } from "bun:test";
|
|
2
|
+
|
|
3
|
+
import type {
|
|
4
|
+
LlmCallRecord,
|
|
5
|
+
MemoryV3SimulateResult,
|
|
6
|
+
MemoryV3TreeResult,
|
|
7
|
+
MemoryV3ValidateResult,
|
|
8
|
+
} from "../../../runtime/routes/memory-v3-routes.js";
|
|
9
|
+
import {
|
|
10
|
+
renderLlmCalls,
|
|
11
|
+
renderSimulation,
|
|
12
|
+
renderTree,
|
|
13
|
+
renderValidationReport,
|
|
14
|
+
reportHasDefects,
|
|
15
|
+
} from "../memory-v3-render.js";
|
|
16
|
+
|
|
17
|
+
/**
 * Builds a new validation result with every defect list empty and every
 * matching count set to zero. A fresh object is returned on each call so
 * callers can mutate it freely.
 */
function cleanReport(): MemoryV3ValidateResult {
  const report: MemoryV3ValidateResult = {
    // Each category is a list plus its count.
    danglingChildRefs: [],
    danglingChildRefCount: 0,

    orphanPages: [],
    orphanPageCount: 0,

    cycles: [],
    cycleCount: 0,

    staleIndex: [],
    staleIndexCount: 0,

    unknownEdgeTargets: [],
    unknownEdgeTargetCount: 0,
  };
  return report;
}
|
|
31
|
+
|
|
32
|
+
// Checks renderValidationReport output for a report with no defects and for
// a report carrying exactly one entry in each of the five defect categories.
describe("memory v3 — renderValidationReport", () => {
  test("renders 'none' for every empty category", () => {
    const rendered = renderValidationReport(cleanReport());
    const expectedFragments = [
      "Memory v3 Tree Validation",
      "Dangling child refs: none",
      "Orphan pages: none",
      "Cycles: none",
      "Stale index: none",
      "Unknown edge targets: none",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });

  test("renders counts and offending ids for each defect category", () => {
    const defective: MemoryV3ValidateResult = {
      danglingChildRefs: [{ node: "people", ref: "ghost", kind: "node" }],
      danglingChildRefCount: 1,
      orphanPages: ["stray-page"],
      orphanPageCount: 1,
      cycles: [{ from: "a", to: "b" }],
      cycleCount: 1,
      staleIndex: [
        { node: "root", child: "people", nodeMtimeMs: 1, childMtimeMs: 2 },
      ],
      staleIndexCount: 1,
      unknownEdgeTargets: [{ from: "p1", to: "missing" }],
      unknownEdgeTargetCount: 1,
    };

    const rendered = renderValidationReport(defective);

    // Each category contributes a count line followed by its detail line.
    const expectedFragments = [
      "Dangling child refs: 1",
      "people → node:ghost",
      "Orphan pages: 1",
      "- stray-page",
      "Cycles: 1",
      "a → b",
      "Stale index: 1",
      "root (older than child people)",
      "Unknown edge targets: 1",
      "p1 → missing",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });
});
|
|
71
|
+
|
|
72
|
+
// Checks reportHasDefects against a defect-free report and against a report
// whose only defect is a single orphan page.
describe("memory v3 — reportHasDefects", () => {
  test("false for a clean report", () => {
    const verdict = reportHasDefects(cleanReport());
    expect(verdict).toBe(false);
  });

  test("true when any single category is non-empty", () => {
    // Only the orphan-page category is populated; the rest stay empty.
    const withOrphan: MemoryV3ValidateResult = {
      ...cleanReport(),
      orphanPageCount: 1,
      orphanPages: ["x"],
    };
    const verdict = reportHasDefects(withOrphan);
    expect(verdict).toBe(true);
  });
});
|
|
84
|
+
|
|
85
|
+
// Checks renderTree output for: a plain tree, a node reachable through two
// parents, a cycle back to the root, a child ref with no matching node, and a
// node that the root never references.
describe("memory v3 — renderTree", () => {
  test("renders an indented tree descending node and page children", () => {
    const tree: MemoryV3TreeResult = {
      root: "_root",
      nodes: [
        {
          id: "_root",
          children: [
            { kind: "node", ref: "people" },
            { kind: "page", ref: "overview" },
          ],
        },
        { id: "people", children: [{ kind: "page", ref: "alice" }] },
      ],
    };

    // The whole output is compared, not just fragments of it.
    const expectedLines = [
      "node:_root",
      " node:people",
      " page:alice",
      " page:overview",
    ];
    expect(renderTree(tree)).toBe(expectedLines.join("\n"));
  });

  test("marks a shared DAG sub-node as a re-entry rather than re-expanding", () => {
    const tree: MemoryV3TreeResult = {
      root: "_root",
      nodes: [
        {
          id: "_root",
          children: [
            { kind: "node", ref: "a" },
            { kind: "node", ref: "b" },
          ],
        },
        // Both `a` and `b` point at the same `shared` node.
        { id: "a", children: [{ kind: "node", ref: "shared" }] },
        { id: "b", children: [{ kind: "node", ref: "shared" }] },
        { id: "shared", children: [{ kind: "page", ref: "leaf" }] },
      ],
    };

    const rendered = renderTree(tree);

    // Reached first via `a`, `shared` is expanded in full there ...
    expect(rendered).toContain(" node:a\n node:shared\n page:leaf");
    // ... and the second reach via `b` is only marked as a re-entry.
    expect(rendered).toContain("node:shared (↑ already shown)");

    // So the leaf page appears exactly once in the whole output.
    const leafMatches = rendered.match(/page:leaf/g);
    expect(leafMatches?.length).toBe(1);
  });

  test("bounds output on a cycle instead of looping forever", () => {
    // `_root` -> `a` -> `_root` forms a two-node cycle.
    const tree: MemoryV3TreeResult = {
      root: "_root",
      nodes: [
        { id: "_root", children: [{ kind: "node", ref: "a" }] },
        { id: "a", children: [{ kind: "node", ref: "_root" }] },
      ],
    };

    const rendered = renderTree(tree);
    expect(rendered).toContain("node:_root (↑ already shown)");
  });

  test("flags a child ref whose target node is missing", () => {
    // `ghost` is referenced by the root but never declared in `nodes`.
    const tree: MemoryV3TreeResult = {
      root: "_root",
      nodes: [{ id: "_root", children: [{ kind: "node", ref: "ghost" }] }],
    };

    const rendered = renderTree(tree);
    expect(rendered).toContain("node:ghost (missing)");
  });

  test("lists nodes unreachable from the root", () => {
    // `floating` is declared but nothing references it.
    const tree: MemoryV3TreeResult = {
      root: "_root",
      nodes: [
        { id: "_root", children: [] },
        { id: "floating", children: [] },
      ],
    };

    const rendered = renderTree(tree);
    for (const fragment of ["Unreachable nodes (1):", "- node:floating"]) {
      expect(rendered).toContain(fragment);
    }
  });
});
|
|
169
|
+
|
|
170
|
+
/**
 * Builds a new simulation-result fixture on every call (tests mutate it).
 *
 * The fixture selects three pages, one each attributed to the "hot", "tree"
 * and "edge" sources. It records two passes: pass 1 carries scouts, one tree
 * level, one edge expansion and a "more" gate; pass 2 carries a single scout
 * and a "ready" gate. The effective config has the `edges` lane switched off.
 */
function simResult(): MemoryV3SimulateResult {
  const effectiveConfig: MemoryV3SimulateResult["effectiveConfig"] = {
    passCap: 3,
    lanes: { hot: true, sparse: true, dense: true, tree: true, edges: false },
  };

  const result: MemoryV3SimulateResult = {
    query: "what should we ship next",
    selectedSlugs: ["page-tree", "page-hot", "page-edge"],
    sourceBySlug: {
      "page-hot": "hot",
      "page-tree": "tree",
      "page-edge": "edge",
    },
    trace: {
      passes: [
        {
          passNumber: 1,
          scouts: [
            { lane: "hot", slugs: ["page-hot"] },
            { lane: "sparse", slugs: [] },
            { lane: "dense", slugs: ["d1", "d2"] },
          ],
          treeLevels: [
            {
              // The empty node id is the level the tests expect as "[root]".
              node: "",
              considered: ["people", "frames", "objects"],
              descended: ["people", "frames"],
              skipped: ["objects"],
              reasoning: "query is about planning",
            },
          ],
          edgeExpansions: [{ from: "page-tree", pulled: ["page-edge"] }],
          gate: { decision: "more", questions: ["narrow to roadmap?"] },
        },
        {
          passNumber: 2,
          scouts: [{ lane: "hot", slugs: [] }],
          gate: { decision: "ready" },
        },
      ],
    },
    cost: { ms: 1234 },
    failureReason: null,
    llmCalls: [],
    effectiveConfig,
  };
  return result;
}
|
|
216
|
+
|
|
217
|
+
// Checks renderSimulation output for the simulation fixture: header and
// config lines, per-pass trace lines, grouping of selected pages by lane, the
// lane list when nothing is disabled, and the failure line.
describe("memory v3 — renderSimulation", () => {
  test("renders query, effective config, per-pass trace, and grouped selection", () => {
    const rendered = renderSimulation(simResult());

    const expectedFragments = [
      "Memory v3 Retrieval Simulation",
      'Query: "what should we ship next"',
      "passCap: 3",
      // A disabled lane is surfaced in an `(off: …)` suffix.
      "lanes: hot, sparse, dense, tree (off: edges)",

      "Passes: 2",
      "Pass 1",
      "scouts: hot=1 sparse=0 dense=2",
      // The root tree level ("" node) prints as [root] with branch counts.
      "[root]: considered 3, descended 2, skipped 1",
      "→ people, frames",
      "reason: query is about planning",
      "edges: 1 seed(s) expanded, 1 pulled",
      "gate: more",
      "? narrow to roadmap?",
      "gate: ready",

      "Selected: 3 page(s)",
      "Cost: 1234 ms",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });

  test("groups selected slugs by provenance lane in fanout order", () => {
    const rendered = renderSimulation(simResult());
    const positionOf = (label: string) => rendered.indexOf(label);

    const hotAt = positionOf("hot (1)");
    const treeAt = positionOf("tree (1)");
    const edgeAt = positionOf("edge (1)");

    // All three group headings must be present ...
    for (const position of [hotAt, treeAt, edgeAt]) {
      expect(position).toBeGreaterThan(-1);
    }

    // ... in SIMULATE_LANE_ORDER: hot precedes tree precedes edge.
    expect(hotAt).toBeLessThan(treeAt);
    expect(treeAt).toBeLessThan(edgeAt);
  });

  test("renders all lanes inline when none are disabled", () => {
    const allLanesOn = simResult();
    allLanesOn.effectiveConfig.lanes.edges = true;

    const rendered = renderSimulation(allLanesOn);

    expect(rendered).toContain("lanes: hot, sparse, dense, tree, edges");
    expect(rendered).not.toContain("(off:");
  });

  test("surfaces a failure reason when the loop degraded", () => {
    const degraded = simResult();
    degraded.failureReason = "dense filter failed open";

    const rendered = renderSimulation(degraded);

    expect(rendered).toContain("Failure: dense filter failed open");
  });
});
|
|
270
|
+
|
|
271
|
+
/**
 * Builds an LLM call record fixture, with any fields in `over` replacing the
 * defaults.
 *
 * The default record is a pass-1 "gate" call from call site "memoryV3Gate".
 * Its request holds one system prompt, one user text message and one
 * `decide_selection` tool; its response holds a single `decide_selection`
 * tool_use block. The call took 42 ms.
 *
 * @param over - Fields to override on the default record; applied last.
 * @returns A newly built record.
 */
function llmCall(over: Partial<LlmCallRecord> = {}): LlmCallRecord {
  const defaults: LlmCallRecord = {
    pass: 1,
    lane: "gate",
    callSite: "memoryV3Gate",
    request: {
      systemPrompt: "SYS-PROMPT",
      messages: [
        { role: "user", content: [{ type: "text", text: "USER-MSG" }] },
      ],
      tools: [
        {
          name: "decide_selection",
          description: "decide",
          input_schema: { type: "object", properties: {} },
        },
      ],
    },
    response: {
      model: "stub-model",
      stopReason: "tool_use",
      usage: { inputTokens: 0, outputTokens: 0 },
      content: [
        {
          type: "tool_use",
          id: "tu-1",
          name: "decide_selection",
          input: { decision: "ready", selected_slugs: ["a"] },
        },
      ],
    },
    ms: 42,
  };

  // Overrides are spread last so they win over the defaults.
  return { ...defaults, ...over };
}
|
|
306
|
+
|
|
307
|
+
// Checks renderLlmCalls in compact mode (`full: false`), in full mode
// (`full: true`), and for an empty list of calls.
describe("memory v3 — renderLlmCalls", () => {
  test("compact: one line per call with lane, node, and tool summary", () => {
    const calls = [
      llmCall(),
      llmCall({
        lane: "descent",
        callSite: "memoryV3Descent",
        node: "people",
      }),
    ];

    const rendered = renderLlmCalls(calls, { full: false });

    const expectedFragments = [
      "LLM calls (2):",
      "pass1 · gate",
      "pass1 · descent · node=people",
      "decide_selection",
      "42ms",
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }

    // Compact mode must not dump the full system prompt.
    expect(rendered).not.toContain("SYS-PROMPT");
  });

  test("full: includes system prompt, messages, tools, and tool_use input", () => {
    const rendered = renderLlmCalls([llmCall()], { full: true });

    const expectedFragments = [
      "SYS-PROMPT",
      "USER-MSG",
      "decide_selection",
      '"decision"',
    ];
    for (const fragment of expectedFragments) {
      expect(rendered).toContain(fragment);
    }
  });

  test("renders 'none' when there are no calls", () => {
    const rendered = renderLlmCalls([], { full: false });
    expect(rendered).toBe("LLM calls: none");
  });
});
|