npm - @vellumai/assistant - Versions diffs - 0.5.15 → 0.5.16 - Mend

@vellumai/assistant 0.5.15 → 0.5.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (175) hide show

package/ARCHITECTURE.md +2 -2
package/docs/architecture/integrations.md +15 -14
package/knip.json +3 -1
package/openapi.yaml +11 -43
package/package.json +1 -1
package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -375
package/src/__tests__/ces-rpc-credential-backend.test.ts +4 -1
package/src/__tests__/checker.test.ts +59 -0
package/src/__tests__/cli-command-risk-guard.test.ts +98 -10
package/src/__tests__/cli-memory.test.ts +372 -0
package/src/__tests__/computer-use-skill-manifest-regression.test.ts +12 -2
package/src/__tests__/config-schema.test.ts +0 -2
package/src/__tests__/config-watcher-feature-flags.test.ts +211 -0
package/src/__tests__/conversation-runtime-assembly.test.ts +7 -4
package/src/__tests__/conversation-slash-commands.test.ts +2 -6
package/src/__tests__/conversation-usage.test.ts +1 -0
package/src/__tests__/credential-security-e2e.test.ts +4 -1
package/src/__tests__/docker-signing-key-bootstrap.test.ts +7 -73
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +6 -7
package/src/__tests__/guardian-routing-invariants.test.ts +151 -0
package/src/__tests__/heartbeat-service.test.ts +1 -3
package/src/__tests__/intent-routing.test.ts +6 -18
package/src/__tests__/log-export-workspace.test.ts +2 -28
package/src/__tests__/managed-skill-lifecycle.test.ts +7 -37
package/src/__tests__/managed-store.test.ts +2 -10
package/src/__tests__/messaging-send-tool.test.ts +6 -6
package/src/__tests__/migration-cross-version-compatibility.test.ts +1 -29
package/src/__tests__/migration-export-http.test.ts +3 -34
package/src/__tests__/migration-import-commit-http.test.ts +1 -29
package/src/__tests__/migration-import-preflight-http.test.ts +3 -34
package/src/__tests__/no-domain-routing-in-prompt-guard.test.ts +2 -1
package/src/__tests__/oauth-apps-routes.test.ts +120 -10
package/src/__tests__/oauth-connect-orchestrator.test.ts +709 -0
package/src/__tests__/oauth-provider-serializer.test.ts +2 -1
package/src/__tests__/oauth-provider-visibility.test.ts +149 -0
package/src/__tests__/oauth-providers-routes.test.ts +5 -2
package/src/__tests__/oauth-store.test.ts +0 -5
package/src/__tests__/outlook-messaging-provider.test.ts +576 -0
package/src/__tests__/path-policy.test.ts +2 -17
package/src/__tests__/permission-types.test.ts +0 -1
package/src/__tests__/platform-callback-registration.test.ts +3 -7
package/src/__tests__/provider-commit-message-generator.test.ts +0 -1
package/src/__tests__/provider-error-scenarios.test.ts +0 -2
package/src/__tests__/qdrant-manager.test.ts +68 -21
package/src/__tests__/require-fresh-approval.test.ts +0 -1
package/src/__tests__/sandbox-diagnostics.test.ts +20 -29
package/src/__tests__/scaffold-managed-skill-tool.test.ts +2 -10
package/src/__tests__/secret-allowlist.test.ts +20 -35
package/src/__tests__/shell-credential-ref.test.ts +0 -5
package/src/__tests__/skill-load-feature-flag.test.ts +2 -43
package/src/__tests__/skill-load-inline-command.test.ts +3 -65
package/src/__tests__/skill-load-inline-includes.test.ts +3 -65
package/src/__tests__/skill-load-tool.test.ts +3 -67
package/src/__tests__/skill-memory.test.ts +362 -119
package/src/__tests__/skills.test.ts +22 -49
package/src/__tests__/slack-channel-config.test.ts +2 -21
package/src/__tests__/starter-bundle.test.ts +2 -8
package/src/__tests__/stt-hints.test.ts +7 -2
package/src/__tests__/system-prompt.test.ts +25 -45
package/src/__tests__/task-compiler.test.ts +0 -21
package/src/__tests__/task-management-tools.test.ts +0 -21
package/src/__tests__/task-memory-cleanup.test.ts +0 -21
package/src/__tests__/task-runner.test.ts +0 -21
package/src/__tests__/task-scheduler.test.ts +0 -21
package/src/__tests__/terminal-tools.test.ts +1 -17
package/src/__tests__/token-estimator-accuracy.benchmark.test.ts +0 -79
package/src/__tests__/tool-approval-handler.test.ts +1 -20
package/src/__tests__/tool-execution-abort-cleanup.test.ts +2 -11
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +1 -25
package/src/__tests__/tool-executor-lifecycle-events.test.ts +0 -1
package/src/__tests__/tool-executor.test.ts +0 -1
package/src/__tests__/tool-grant-request-escalation.test.ts +1 -20
package/src/__tests__/tool-preview-lifecycle.test.ts +0 -20
package/src/__tests__/trust-store.test.ts +9 -41
package/src/__tests__/trusted-contact-approval-notifier.test.ts +1 -30
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -21
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +0 -22
package/src/__tests__/trusted-contact-multichannel.test.ts +0 -22
package/src/__tests__/trusted-contact-verification.test.ts +0 -22
package/src/__tests__/turn-boundary-resolution.test.ts +0 -28
package/src/__tests__/twilio-provider.test.ts +0 -16
package/src/__tests__/twilio-routes-twiml.test.ts +7 -12
package/src/__tests__/twilio-routes.test.ts +0 -24
package/src/__tests__/update-bulletin.test.ts +17 -89
package/src/__tests__/usage-cache-backfill-migration.test.ts +0 -20
package/src/__tests__/usage-routes.test.ts +0 -21
package/src/__tests__/user-reference.test.ts +1 -5
package/src/__tests__/vbundle-pax-and-symlink.test.ts +4 -34
package/src/__tests__/vellum-self-knowledge-inline-command.test.ts +2 -53
package/src/__tests__/voice-invite-redemption.test.ts +0 -21
package/src/__tests__/voice-scoped-grant-consumer.test.ts +0 -24
package/src/__tests__/voice-session-bridge.test.ts +0 -21
package/src/__tests__/workspace-migration-009-backfill-conversation-disk-view.test.ts +2 -23
package/src/__tests__/workspace-migration-012-rename-conversation-disk-view-dirs.test.ts +2 -2
package/src/__tests__/workspace-migration-013-repair-conversation-disk-view.test.ts +2 -23
package/src/__tests__/workspace-migration-down-functions.test.ts +0 -6
package/src/acp/client-handler.ts +1 -2
package/src/cli/__tests__/notifications.test.ts +0 -22
package/src/cli/cli-memory.ts +176 -0
package/src/cli/commands/oauth/__tests__/providers-update.test.ts +1 -1
package/src/cli/commands/oauth/connect.ts +15 -0
package/src/cli/commands/oauth/providers.ts +49 -42
package/src/cli/commands/platform/__tests__/connect.test.ts +2 -48
package/src/cli/commands/platform/__tests__/disconnect.test.ts +2 -48
package/src/cli/commands/platform/__tests__/status.test.ts +0 -50
package/src/config/bundled-skills/computer-use/TOOLS.json +7 -7
package/src/config/bundled-skills/messaging/SKILL.md +17 -2
package/src/config/bundled-skills/settings/TOOLS.json +3 -3
package/src/config/feature-flag-registry.json +16 -0
package/src/config/loader.ts +4 -0
package/src/config/schemas/security.ts +0 -6
package/src/config/schemas/services.ts +8 -0
package/src/context/window-manager.ts +28 -9
package/src/credential-execution/approval-bridge.ts +0 -1
package/src/daemon/config-watcher.ts +51 -0
package/src/daemon/conversation-agent-loop.ts +3 -2
package/src/daemon/conversation-process.ts +1 -0
package/src/daemon/conversation-usage.ts +1 -0
package/src/daemon/handlers/skills.ts +9 -1
package/src/daemon/lifecycle.ts +13 -4
package/src/daemon/message-types/conversations.ts +1 -0
package/src/daemon/providers-setup.ts +2 -0
package/src/daemon/server.ts +26 -22
package/src/events/domain-events.ts +1 -2
package/src/memory/db-init.ts +9 -0
package/src/memory/job-handlers/batch-extraction.ts +16 -4
package/src/memory/job-handlers/embedding.test.ts +3 -27
package/src/memory/job-handlers/journal-carry-forward.test.ts +1 -29
package/src/memory/llm-usage-store.ts +35 -2
package/src/memory/migrations/201-oauth-providers-feature-flag.ts +11 -0
package/src/memory/migrations/202-drop-callback-transport-column.ts +13 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/qdrant-manager.ts +26 -5
package/src/memory/query-expansion.ts +1 -1
package/src/memory/retriever.test.ts +22 -20
package/src/memory/retriever.ts +10 -2
package/src/memory/schema/oauth.ts +1 -1
package/src/memory/search/mmr.ts +8 -5
package/src/memory/slack-thread-store.ts +17 -0
package/src/messaging/providers/outlook/adapter.ts +193 -0
package/src/messaging/providers/outlook/client.ts +311 -0
package/src/messaging/providers/outlook/types.ts +83 -0
package/src/notifications/adapters/slack.ts +1 -1
package/src/oauth/__tests__/identity-verifier.test.ts +1 -1
package/src/oauth/connect-orchestrator.ts +10 -3
package/src/oauth/oauth-store.ts +10 -11
package/src/oauth/provider-serializer.ts +3 -0
package/src/oauth/provider-visibility.ts +16 -0
package/src/oauth/seed-providers.ts +49 -17
package/src/permissions/checker.ts +39 -7
package/src/permissions/types.ts +2 -4
package/src/prompts/journal-context.ts +9 -11
package/src/prompts/system-prompt.ts +3 -64
package/src/prompts/templates/UPDATES.md +6 -0
package/src/runtime/auth/__tests__/credential-service.test.ts +1 -27
package/src/runtime/auth/__tests__/token-service.test.ts +1 -25
package/src/runtime/auth/route-policy.ts +0 -4
package/src/runtime/guardian-reply-router.ts +6 -2
package/src/runtime/routes/conversation-query-routes.ts +2 -58
package/src/runtime/routes/inbound-stages/background-dispatch.ts +43 -2
package/src/runtime/routes/memory-item-routes.test.ts +0 -17
package/src/runtime/routes/memory-item-routes.ts +103 -12
package/src/runtime/routes/oauth-apps.ts +18 -1
package/src/runtime/routes/oauth-providers.ts +13 -1
package/src/runtime/routes/settings-routes.ts +1 -0
package/src/runtime/routes/usage-routes.ts +19 -2
package/src/runtime/routes/work-items-routes.test.ts +0 -21
package/src/runtime/routes/workspace-routes.test.ts +3 -27
package/src/security/secret-allowlist.ts +4 -4
package/src/skills/skill-memory.ts +62 -23
package/src/tools/memory/handlers.test.ts +1 -29
package/src/tools/permission-checker.ts +0 -18
package/src/tools/skills/skill-script-runner.ts +1 -1
package/src/util/device-id.ts +3 -65
package/src/workspace/git-service.ts +27 -6

package/src/__tests__/checker.test.ts CHANGED Viewed

@@ -432,6 +432,12 @@ describe("Permission Checker", () => {
     // shell commands - high risk
     describe("shell — high risk", () => {
+      test("assistant trust clear is high risk", async () => {
+        expect(
+          await classifyRisk("bash", { command: "assistant trust clear" }),
+        ).toBe(RiskLevel.High);
+      });
       test("sudo is high risk", async () => {
         expect(await classifyRisk("bash", { command: "sudo rm -rf /" })).toBe(
           RiskLevel.High,
@@ -2017,6 +2023,9 @@ describe("Permission Checker", () => {
     function ensureSkillsDir(): void {
       mkdirSync(join(checkerTestDir, "skills"), { recursive: true });
     }
+    function ensureHooksDir(): void {
+      mkdirSync(join(checkerTestDir, "hooks"), { recursive: true });
+    }
     test("file_write to skill directory is High risk", async () => {
       ensureSkillsDir();
@@ -2147,6 +2156,56 @@ describe("Permission Checker", () => {
       expect(risk).toBe(RiskLevel.Low);
     });
+    test("file_write to hooks directory is High risk", async () => {
+      ensureHooksDir();
+      const hookPath = join(
+        checkerTestDir,
+        "hooks",
+        "post-tool-use",
+        "hook.sh",
+      );
+      const risk = await classifyRisk("file_write", { path: hookPath });
+      expect(risk).toBe(RiskLevel.High);
+    });
+    test("file_edit of hooks config is High risk", async () => {
+      ensureHooksDir();
+      const configPath = join(checkerTestDir, "hooks", "config.json");
+      const risk = await classifyRisk("file_edit", { path: configPath });
+      expect(risk).toBe(RiskLevel.High);
+    });
+    test("file_write to hooks directory prompts as High risk", async () => {
+      ensureHooksDir();
+      const hookPath = join(
+        checkerTestDir,
+        "hooks",
+        "post-tool-use",
+        "hook.sh",
+      );
+      const result = await check("file_write", { path: hookPath }, "/tmp");
+      expect(result.decision).toBe("prompt");
+    });
+    test("host_file_write to hooks directory is High risk", async () => {
+      ensureHooksDir();
+      const hookPath = join(
+        checkerTestDir,
+        "hooks",
+        "post-tool-use",
+        "hook.sh",
+      );
+      const risk = await classifyRisk("host_file_write", { path: hookPath });
+      expect(risk).toBe(RiskLevel.High);
+    });
+    test("host_file_edit of hooks config is High risk", async () => {
+      ensureHooksDir();
+      const configPath = join(checkerTestDir, "hooks", "config.json");
+      const risk = await classifyRisk("host_file_edit", { path: configPath });
+      expect(risk).toBe(RiskLevel.High);
+    });
     test("host_file_write to non-skill path remains Medium risk (via registry)", async () => {
       const normalPath = "/tmp/some-file.txt";
       const risk = await classifyRisk("host_file_write", { path: normalPath });

package/src/__tests__/cli-command-risk-guard.test.ts CHANGED Viewed

@@ -157,27 +157,55 @@ describe("CLI command risk guard: elevated assistant subcommands", () => {
     expect(risk).toBe(RiskLevel.Medium);
   });
-  test("--help on elevated subcommands is Low risk (read-only)", async () => {
-    const helpCommands = [
+  test("--help on non-elevated subcommands remains Low risk", async () => {
+    // GIVEN non-elevated subcommands with --help / -h flags
+    const lowRiskWithHelp = [
+      "assistant oauth --help",
+      "assistant credentials --help",
+      "assistant trust -h",
+      "assistant keys --help",
+      "assistant config --help",
+    ];
+    // WHEN classifying risk
+    // THEN they remain Low since the subcommand itself is Low
+    for (const command of lowRiskWithHelp) {
+      const risk = await classifyRisk("bash", { command });
+      expectLowRisk(command, risk);
+    }
+  });
+  test("--help does not downgrade risk on elevated subcommands", async () => {
+    // GIVEN elevated subcommands with --help / -h flags appended
+    const highRiskWithHelp = [
       "assistant oauth token --help",
       "assistant oauth mode --set --help",
       "assistant credentials reveal --help",
+      "assistant trust clear --help",
+      "assistant trust remove -h",
+      "assistant credentials set --help",
+      "assistant credentials delete -h",
+      "assistant keys set --help",
+      "assistant keys delete -h",
+    ];
+    const mediumRiskWithHelp = [
       "assistant oauth request --help",
       "assistant oauth connect --help",
       "assistant oauth disconnect -h",
     ];
-    for (const command of helpCommands) {
+    // WHEN classifying risk
+    // THEN --help does not bypass the elevated risk level
+    for (const command of highRiskWithHelp) {
       const risk = await classifyRisk("bash", { command });
-      expectLowRisk(command, risk);
+      expect(risk).toBe(RiskLevel.High);
     }
-  });
-  test("--help after -- option terminator does not downgrade risk", async () => {
-    const risk = await classifyRisk("bash", {
-      command: "assistant oauth token -- --help",
-    });
-    expect(risk).toBe(RiskLevel.High);
+    for (const command of mediumRiskWithHelp) {
+      const risk = await classifyRisk("bash", { command });
+      expect(risk).toBe(RiskLevel.Medium);
+    }
   });
   test("non-sensitive oauth subcommands remain Low risk", async () => {
@@ -205,6 +233,66 @@ describe("CLI command risk guard: elevated assistant subcommands", () => {
       expectLowRisk(command, risk);
     }
   });
+  test("assistant credentials set is High risk (modifies stored credentials)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant credentials set",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("assistant credentials delete is High risk (removes stored credentials)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant credentials delete",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("assistant keys set is High risk (modifies API keys)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant keys set anthropic sk-ant-xxx",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("assistant keys delete is High risk (removes API keys)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant keys delete openai",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("non-sensitive keys subcommands remain Low risk", async () => {
+    const lowRiskKeysCommands = ["assistant keys", "assistant keys list"];
+    for (const command of lowRiskKeysCommands) {
+      const risk = await classifyRisk("bash", { command });
+      expectLowRisk(command, risk);
+    }
+  });
+  test("assistant trust remove is High risk (removes trust rules)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant trust remove abc123",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("assistant trust clear is High risk (clears all trust rules)", async () => {
+    const risk = await classifyRisk("bash", {
+      command: "assistant trust clear",
+    });
+    expect(risk).toBe(RiskLevel.High);
+  });
+  test("non-sensitive trust subcommands remain Low risk", async () => {
+    const lowRiskTrustCommands = ["assistant trust", "assistant trust list"];
+    for (const command of lowRiskTrustCommands) {
+      const risk = await classifyRisk("bash", { command });
+      expectLowRisk(command, risk);
+    }
+  });
 });
 describe("CLI command risk guard: wrapper program propagation", () => {

package/src/__tests__/cli-memory.test.ts ADDED Viewed

@@ -0,0 +1,372 @@
+import { rmSync } from "node:fs";
+import { afterAll, beforeEach, describe, expect, mock, test } from "bun:test";
+import { Command } from "commander";
+import { eq } from "drizzle-orm";
+mock.module("../util/logger.js", () => ({
+  getLogger: () =>
+    new Proxy({} as Record<string, unknown>, {
+      get: () => () => {},
+    }),
+}));
+mock.module("../memory/qdrant-client.js", () => ({
+  getQdrantClient: () => ({
+    searchWithFilter: async () => [],
+    hybridSearch: async () => [],
+    upsertPoints: async () => {},
+    deletePoints: async () => {},
+  }),
+  initQdrantClient: () => {},
+}));
+// Controllable mock for buildCliProgram
+let mockCommands: { name: string; description: string }[] = [];
+function makeMockProgram(): Command {
+  const program = new Command();
+  for (const cmd of mockCommands) {
+    program.command(cmd.name).description(cmd.description);
+  }
+  return program;
+}
+mock.module("../cli/program.js", () => ({
+  buildCliProgram: () => makeMockProgram(),
+}));
+import { DEFAULT_CONFIG } from "../config/defaults.js";
+const TEST_CONFIG = {
+  ...DEFAULT_CONFIG,
+  memory: {
+    ...DEFAULT_CONFIG.memory,
+    enabled: true,
+    extraction: {
+      ...DEFAULT_CONFIG.memory.extraction,
+      useLLM: false,
+    },
+  },
+};
+mock.module("../config/loader.js", () => ({
+  loadConfig: () => TEST_CONFIG,
+  getConfig: () => TEST_CONFIG,
+  loadRawConfig: () => ({}),
+  saveRawConfig: () => {},
+  invalidateConfigCache: () => {},
+}));
+import {
+  buildCliCapabilityStatement,
+  seedCliCommandMemories,
+  upsertCliCapabilityMemory,
+} from "../cli/cli-memory.js";
+import { getDb, initializeDb, resetDb } from "../memory/db.js";
+import { memoryItems, memoryJobs } from "../memory/schema.js";
+import { ensureDataDir, getDbPath } from "../util/platform.js";
+ensureDataDir();
+initializeDb();
+afterAll(() => {
+  resetDb();
+});
+function resetTables() {
+  const db = getDb();
+  db.run("DELETE FROM memory_item_sources");
+  db.run("DELETE FROM memory_embeddings");
+  db.run("DELETE FROM memory_items");
+  db.run("DELETE FROM memory_jobs");
+}
+// ─── buildCliCapabilityStatement ────────────────────────────────────────────
+describe("buildCliCapabilityStatement", () => {
+  test("includes 'assistant' prefix, name, and description", () => {
+    const result = buildCliCapabilityStatement("doctor", "Run diagnostic checks");
+    expect(result).toContain('"assistant doctor"');
+    expect(result).toContain("Run diagnostic checks");
+  });
+  test("truncates long statements to 500 chars", () => {
+    const longDesc = "x".repeat(600);
+    const result = buildCliCapabilityStatement("test", longDesc);
+    expect(result.length).toBe(500);
+  });
+});
+// ─── upsertCliCapabilityMemory ──────────────────────────────────────────────
+describe("upsertCliCapabilityMemory", () => {
+  beforeEach(resetTables);
+  test("inserts with correct kind, subject, confidence, importance", () => {
+    upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    const db = getDb();
+    const items = db.select().from(memoryItems).all();
+    expect(items).toHaveLength(1);
+    expect(items[0].kind).toBe("capability");
+    expect(items[0].subject).toBe("cli:doctor");
+    expect(items[0].confidence).toBe(1.0);
+    expect(items[0].importance).toBe(0.7);
+    expect(items[0].status).toBe("active");
+    expect(items[0].scopeId).toBe("default");
+    // Should also enqueue an embed_item job
+    const jobs = db.select().from(memoryJobs).all();
+    expect(jobs).toHaveLength(1);
+    expect(jobs[0].type).toBe("embed_item");
+  });
+  test("is idempotent (same entry only touches lastSeenAt)", () => {
+    upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    const db = getDb();
+    const before = db.select().from(memoryItems).all();
+    expect(before).toHaveLength(1);
+    const originalLastSeen = before[0].lastSeenAt;
+    // Upsert again
+    upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    const after = db.select().from(memoryItems).all();
+    expect(after).toHaveLength(1);
+    // Fingerprint should be the same, so only lastSeenAt changes
+    expect(after[0].fingerprint).toBe(before[0].fingerprint);
+    expect(after[0].lastSeenAt).toBeGreaterThanOrEqual(originalLastSeen);
+    // Should NOT enqueue a second embed job (only 1 from initial insert)
+    const jobs = db.select().from(memoryJobs).all();
+    expect(jobs).toHaveLength(1);
+  });
+  test("updates statement when description changes", () => {
+    upsertCliCapabilityMemory("doctor", "Original description");
+    const db = getDb();
+    const before = db.select().from(memoryItems).all();
+    expect(before).toHaveLength(1);
+    expect(before[0].statement).toContain("Original description");
+    // Change description
+    upsertCliCapabilityMemory("doctor", "Updated description");
+    const after = db.select().from(memoryItems).all();
+    expect(after).toHaveLength(1);
+    expect(after[0].statement).toContain("Updated description");
+    expect(after[0].fingerprint).not.toBe(before[0].fingerprint);
+    // Should enqueue a second embed job
+    const jobs = db.select().from(memoryJobs).all();
+    expect(jobs).toHaveLength(2);
+  });
+  test("reactivates soft-deleted items", () => {
+    upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    const db = getDb();
+    // Soft-delete the item
+    db.update(memoryItems)
+      .set({ status: "deleted" })
+      .where(eq(memoryItems.subject, "cli:doctor"))
+      .run();
+    const deleted = db.select().from(memoryItems).all();
+    expect(deleted[0].status).toBe("deleted");
+    // Clear jobs from initial insert
+    db.run("DELETE FROM memory_jobs");
+    // Upsert again — should reactivate
+    upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    const reactivated = db.select().from(memoryItems).all();
+    expect(reactivated).toHaveLength(1);
+    expect(reactivated[0].status).toBe("active");
+    // Should enqueue embed job for reactivated item
+    const jobs = db.select().from(memoryJobs).all();
+    expect(jobs).toHaveLength(1);
+    expect(jobs[0].type).toBe("embed_item");
+  });
+  test("does not throw on DB error", () => {
+    resetDb();
+    const db = getDb();
+    db.run("DROP TABLE IF EXISTS memory_items");
+    expect(() => {
+      upsertCliCapabilityMemory("doctor", "Run diagnostic checks");
+    }).not.toThrow();
+    // Restore DB state for subsequent tests.
+    resetDb();
+    const dbPath = getDbPath();
+    for (const ext of ["", "-wal", "-shm"]) {
+      rmSync(`${dbPath}${ext}`, { force: true });
+    }
+    initializeDb();
+  });
+});
+// ─── seedCliCommandMemories ─────────────────────────────────────────────────
+describe("seedCliCommandMemories", () => {
+  beforeEach(() => {
+    resetTables();
+    // Reset mock commands
+    mockCommands = [];
+  });
+  test("upserts capability memories for all commands", () => {
+    mockCommands = [
+      { name: "doctor", description: "Run diagnostic checks" },
+      { name: "config", description: "Manage configuration" },
+      { name: "keys", description: "Manage API keys" },
+    ];
+    seedCliCommandMemories();
+    const db = getDb();
+    const items = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.kind, "capability"))
+      .all();
+    expect(items).toHaveLength(3);
+    const subjects = items.map((i) => i.subject).sort();
+    expect(subjects).toEqual([
+      "cli:config",
+      "cli:doctor",
+      "cli:keys",
+    ]);
+    // All should be active
+    for (const item of items) {
+      expect(item.status).toBe("active");
+    }
+  });
+  test("prunes stale capabilities for commands no longer registered", () => {
+    // First seed with three commands
+    mockCommands = [
+      { name: "doctor", description: "Run diagnostic checks" },
+      { name: "config", description: "Manage configuration" },
+      { name: "keys", description: "Manage API keys" },
+    ];
+    seedCliCommandMemories();
+    const db = getDb();
+    const beforeItems = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.kind, "capability"))
+      .all();
+    expect(beforeItems).toHaveLength(3);
+    expect(beforeItems.every((i) => i.status === "active")).toBe(true);
+    // Now seed with only doctor — config and keys should be pruned
+    mockCommands = [
+      { name: "doctor", description: "Run diagnostic checks" },
+    ];
+    seedCliCommandMemories();
+    const afterItems = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.kind, "capability"))
+      .all();
+    expect(afterItems).toHaveLength(3); // still 3 rows, but 2 are soft-deleted
+    const active = afterItems.filter((i) => i.status === "active");
+    const deleted = afterItems.filter((i) => i.status === "deleted");
+    expect(active).toHaveLength(1);
+    expect(active[0].subject).toBe("cli:doctor");
+    expect(deleted).toHaveLength(2);
+    const deletedSubjects = deleted.map((i) => i.subject).sort();
+    expect(deletedSubjects).toEqual(["cli:config", "cli:keys"]);
+  });
+  test("handles empty command list without errors", () => {
+    // Pre-populate a CLI command so we can verify it gets pruned
+    upsertCliCapabilityMemory("old-command", "An old command");
+    const db = getDb();
+    const beforeItems = db.select().from(memoryItems).all();
+    expect(beforeItems).toHaveLength(1);
+    expect(beforeItems[0].status).toBe("active");
+    // Seed with empty commands
+    mockCommands = [];
+    seedCliCommandMemories();
+    // The existing command should be pruned (soft-deleted)
+    const afterItems = db.select().from(memoryItems).all();
+    expect(afterItems).toHaveLength(1);
+    expect(afterItems[0].status).toBe("deleted");
+  });
+  test("does not prune non-cli capability memories", () => {
+    // Pre-insert a skill capability memory directly into the DB
+    const db = getDb();
+    const now = Date.now();
+    db.insert(memoryItems)
+      .values({
+        id: "skill-test-item",
+        kind: "capability",
+        subject: "skill:test-skill",
+        statement: "The test skill does things.",
+        status: "active",
+        confidence: 1.0,
+        importance: 0.7,
+        fingerprint: "skill-test-fp",
+        sourceType: "extraction",
+        scopeId: "default",
+        firstSeenAt: now,
+        lastSeenAt: now,
+      })
+      .run();
+    // Seed with empty commands — CLI pruner runs but should skip skill:* items
+    mockCommands = [];
+    seedCliCommandMemories();
+    const item = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.subject, "skill:test-skill"))
+      .get();
+    expect(item).toBeDefined();
+    expect(item!.status).toBe("active");
+  });
+  test("does not throw on error", () => {
+    mockCommands = [
+      { name: "doctor", description: "Run diagnostic checks" },
+    ];
+    // Drop memory_items to force a DB error during the prune phase
+    resetDb();
+    const db = getDb();
+    db.run("DROP TABLE IF EXISTS memory_items");
+    expect(() => {
+      seedCliCommandMemories();
+    }).not.toThrow();
+    // Restore DB state for subsequent tests.
+    resetDb();
+    const dbPath = getDbPath();
+    for (const ext of ["", "-wal", "-shm"]) {
+      rmSync(`${dbPath}${ext}`, { force: true });
+    }
+    initializeDb();
+  });
+});

package/src/__tests__/computer-use-skill-manifest-regression.test.ts CHANGED Viewed

@@ -52,9 +52,19 @@ describe("computer-use skill manifest regression", () => {
     }
   });
-  test("all manifest tools have risk: low", () => {
+  test("read-only tools have risk: low, side-effect tools have risk: medium", () => {
+    const readOnlyTools = new Set([
+      "computer_use_observe",
+      "computer_use_wait",
+      "computer_use_done",
+      "computer_use_respond",
+    ]);
     for (const tool of manifest.tools) {
-      expect(tool.risk).toBe("low");
+      if (readOnlyTools.has(tool.name)) {
+        expect(tool.risk).toBe("low");
+      } else {
+        expect(tool.risk).toBe("medium");
+      }
     }
   });

package/src/__tests__/config-schema.test.ts CHANGED Viewed

@@ -421,7 +421,6 @@ describe("AssistantConfigSchema", () => {
     const result = AssistantConfigSchema.parse({});
     expect(result.permissions).toEqual({
       mode: "workspace",
-      dangerouslySkipPermissions: false,
     });
   });
@@ -1129,7 +1128,6 @@ describe("loadConfig with schema validation", () => {
     const config = loadConfig();
     expect(config.permissions).toEqual({
       mode: "workspace",
-      dangerouslySkipPermissions: false,
     });
   });