npm - @vellumai/assistant - Versions diffs - 0.6.0 → 0.6.1 - Mend

@vellumai/assistant 0.6.0 → 0.6.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (285)

package/AGENTS.md +4 -0
package/ARCHITECTURE.md +68 -15
package/Dockerfile +2 -2
package/bun.lock +6 -2
package/docker-entrypoint.sh +32 -1
package/docs/architecture/integrations.md +1 -1
package/docs/architecture/memory.md +21 -24
package/openapi.yaml +538 -3
package/package.json +5 -1
package/src/__tests__/anthropic-provider.test.ts +160 -95
package/src/__tests__/app-dir-path-guard.test.ts +1 -0
package/src/__tests__/app-executors.test.ts +47 -1
package/src/__tests__/app-source-watcher.test.ts +159 -0
package/src/__tests__/checker.test.ts +38 -6
package/src/__tests__/config-schema.test.ts +5 -0
package/src/__tests__/conversation-agent-loop-overflow.test.ts +4 -6
package/src/__tests__/conversation-agent-loop.test.ts +4 -51
package/src/__tests__/conversation-history-web-search.test.ts +1 -1
package/src/__tests__/conversation-runtime-assembly.test.ts +653 -832
package/src/__tests__/conversation-runtime-workspace.test.ts +1 -93
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +17 -4
package/src/__tests__/conversation-wipe.test.ts +2 -6
package/src/__tests__/conversation-workspace-cache-state.test.ts +6 -12
package/src/__tests__/conversation-workspace-injection.test.ts +25 -26
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/copy-composer-tc-templates.test.ts +335 -0
package/src/__tests__/date-context.test.ts +76 -210
package/src/__tests__/db-schedule-syntax-migration.test.ts +16 -1
package/src/__tests__/file-list-tool.test.ts +219 -0
package/src/__tests__/first-greeting.test.ts +1 -1
package/src/__tests__/heartbeat-service.test.ts +180 -3
package/src/__tests__/identity-routes.test.ts +328 -0
package/src/__tests__/injection-block.test.ts +24 -0
package/src/__tests__/install-skill-routing.test.ts +7 -6
package/src/__tests__/jobs-store-qdrant-breaker.test.ts +15 -14
package/src/__tests__/list-messages-tool-merge.test.ts +300 -0
package/src/__tests__/llm-context-normalization.test.ts +18 -18
package/src/__tests__/llm-context-route-provider.test.ts +101 -0
package/src/__tests__/llm-request-log-turn-query.test.ts +162 -0
package/src/__tests__/log-export-workspace.test.ts +72 -105
package/src/__tests__/mcp-abort-signal.test.ts +5 -0
package/src/__tests__/mcp-client-auth.test.ts +5 -0
package/src/__tests__/memory-recall-log-store.test.ts +132 -0
package/src/__tests__/migration-export-streaming.test.ts +304 -0
package/src/__tests__/migration-import-commit-http.test.ts +11 -10
package/src/__tests__/mock-fetch.ts +87 -0
package/src/__tests__/notification-decision-recipient-context.test.ts +282 -0
package/src/__tests__/onboarding-template-contract.test.ts +62 -14
package/src/__tests__/parser.test.ts +32 -0
package/src/__tests__/permission-checker-host-gate.test.ts +452 -0
package/src/__tests__/permission-controls-v2-flag.test.ts +55 -0
package/src/__tests__/permission-mode-sse.test.ts +418 -0
package/src/__tests__/permission-mode-store.test.ts +277 -0
package/src/__tests__/permission-mode.test.ts +101 -0
package/src/__tests__/platform-bash-auto-approve.test.ts +359 -0
package/src/__tests__/profiler-routes.test.ts +502 -0
package/src/__tests__/profiler-run-store.test.ts +441 -0
package/src/__tests__/proxy-approval-callback.test.ts +4 -75
package/src/__tests__/registry.test.ts +1 -1
package/src/__tests__/sandbox-host-parity.test.ts +5 -4
package/src/__tests__/scheduler-reuse-conversation.test.ts +368 -0
package/src/__tests__/scrub-corrupted-image-attachments.test.ts +278 -0
package/src/__tests__/search-skills-unified.test.ts +4 -3
package/src/__tests__/send-endpoint-busy.test.ts +42 -3
package/src/__tests__/set-permission-mode.test.ts +274 -0
package/src/__tests__/skill-load-feature-flag.test.ts +12 -0
package/src/__tests__/skill-memory.test.ts +2 -783
package/src/__tests__/strip-memory-injections.test.ts +187 -0
package/src/__tests__/subagent-detail.test.ts +84 -0
package/src/__tests__/subagent-disposal.test.ts +308 -0
package/src/__tests__/subagent-manager-notify.test.ts +19 -10
package/src/__tests__/subagent-notify-parent.test.ts +390 -0
package/src/__tests__/subagent-role-registry.test.ts +108 -0
package/src/__tests__/subagent-tool-filtering.test.ts +71 -0
package/src/__tests__/subagent-tools.test.ts +464 -4
package/src/__tests__/system-prompt-ask-mode.test.ts +139 -0
package/src/__tests__/task-memory-cleanup.test.ts +12 -12
package/src/__tests__/terminal-tools.test.ts +17 -27
package/src/__tests__/test-preload.ts +4 -0
package/src/__tests__/tool-executor.test.ts +4 -26
package/src/__tests__/tool-side-effects-slack-dm.test.ts +1 -0
package/src/__tests__/top-level-renderer.test.ts +10 -13
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +116 -2
package/src/__tests__/workspace-migration-028-recover-conversations-from-disk-view.test.ts +387 -0
package/src/agent/loop.ts +6 -0
package/src/approvals/guardian-request-resolvers.ts +24 -0
package/src/avatar/traits-png-sync.ts +3 -3
package/src/cli/__tests__/run-assistant-command.ts +29 -0
package/src/cli/commands/__tests__/email-download.test.ts +245 -0
package/src/cli/commands/__tests__/email-list.test.ts +192 -0
package/src/cli/commands/__tests__/email-register.test.ts +186 -0
package/src/cli/commands/__tests__/email-send.test.ts +291 -0
package/src/cli/commands/__tests__/email-status.test.ts +181 -0
package/src/cli/commands/__tests__/email-unregister.test.ts +139 -0
package/src/cli/commands/__tests__/routes.test.ts +562 -0
package/src/cli/commands/conversations.ts +1 -8
package/src/cli/commands/email.ts +584 -835
package/src/cli/commands/memory.ts +1 -34
package/src/cli/commands/notifications.ts +7 -2
package/src/cli/commands/oauth/connect.ts +14 -5
package/src/cli/commands/routes.ts +396 -0
package/src/cli/commands/skills.ts +130 -20
package/src/cli/program.ts +2 -0
package/src/cli.ts +1 -120
package/src/config/bundled-skills/app-builder/SKILL.md +4 -1
package/src/config/bundled-skills/gmail/SKILL.md +2 -2
package/src/config/bundled-skills/messaging/SKILL.md +7 -0
package/src/config/bundled-skills/schedule/SKILL.md +22 -2
package/src/config/bundled-skills/schedule/TOOLS.json +8 -0
package/src/config/bundled-skills/settings/tools/avatar-get.ts +3 -13
package/src/config/bundled-skills/settings/tools/avatar-remove.ts +2 -4
package/src/config/bundled-skills/settings/tools/avatar-update.ts +5 -2
package/src/config/bundled-skills/slack/SKILL.md +2 -0
package/src/config/bundled-skills/subagent/SKILL.md +43 -3
package/src/config/bundled-skills/subagent/TOOLS.json +29 -4
package/src/config/env-registry.ts +63 -0
package/src/config/feature-flag-registry.json +17 -1
package/src/config/schema.ts +8 -0
package/src/config/schemas/filing.ts +51 -0
package/src/config/schemas/heartbeat.ts +15 -12
package/src/config/schemas/memory-lifecycle.ts +12 -0
package/src/config/schemas/security.ts +14 -0
package/src/daemon/app-source-watcher.ts +93 -0
package/src/daemon/config-watcher.ts +79 -1
package/src/daemon/conversation-agent-loop-handlers.ts +20 -0
package/src/daemon/conversation-agent-loop.ts +158 -65
package/src/daemon/conversation-history.ts +4 -19
package/src/daemon/conversation-lifecycle.ts +8 -14
package/src/daemon/conversation-process.ts +13 -7
package/src/daemon/conversation-runtime-assembly.ts +300 -306
package/src/daemon/conversation-tool-setup.ts +44 -14
package/src/daemon/conversation-workspace.ts +1 -2
package/src/daemon/conversation.ts +18 -0
package/src/daemon/date-context.ts +26 -53
package/src/daemon/first-greeting.ts +1 -1
package/src/daemon/handlers/conversations.ts +4 -7
package/src/daemon/handlers/shared.test.ts +143 -0
package/src/daemon/handlers/shared.ts +63 -5
package/src/daemon/handlers/skills.ts +11 -18
package/src/daemon/lifecycle.ts +199 -157
package/src/daemon/message-types/conversations.ts +25 -6
package/src/daemon/message-types/messages.ts +9 -1
package/src/daemon/message-types/schedules.ts +1 -0
package/src/daemon/message-types/settings.ts +6 -0
package/src/daemon/profiler-run-store.ts +557 -0
package/src/daemon/server.ts +89 -9
package/src/daemon/shutdown-handlers.ts +5 -0
package/src/daemon/tool-side-effects.ts +23 -3
package/src/export/transcript-formatter.ts +148 -0
package/src/filing/filing-service.ts +228 -0
package/src/heartbeat/heartbeat-service.ts +96 -7
package/src/mcp/client.ts +6 -0
package/src/mcp/mcp-oauth-provider.ts +149 -27
package/src/memory/admin.ts +33 -32
package/src/memory/app-store.ts +69 -0
package/src/memory/conversation-bootstrap.ts +1 -1
package/src/memory/conversation-crud.ts +136 -107
package/src/memory/conversation-group-migration.ts +1 -1
package/src/memory/conversation-queries.ts +58 -12
package/src/memory/conversation-title-service.ts +1 -0
package/src/memory/db-init.ts +182 -376
package/src/memory/graph/bootstrap.ts +75 -66
package/src/memory/graph/capability-seed.ts +167 -15
package/src/memory/graph/consolidation.ts +38 -4
package/src/memory/graph/conversation-graph-memory.ts +133 -104
package/src/memory/graph/extraction-job.ts +9 -4
package/src/memory/graph/extraction.ts +66 -23
package/src/memory/graph/graph-memory-state-store.ts +37 -0
package/src/memory/graph/graph-search.ts +29 -15
package/src/memory/graph/injection.ts +38 -8
package/src/memory/graph/inspect.ts +12 -3
package/src/memory/graph/retriever.ts +365 -262
package/src/memory/graph/store.test.ts +48 -0
package/src/memory/graph/store.ts +150 -11
package/src/memory/graph/tool-handlers.ts +84 -209
package/src/memory/graph/tools.ts +8 -52
package/src/memory/graph/types.ts +24 -0
package/src/memory/job-handlers/cleanup.ts +44 -1
package/src/memory/jobs-store.ts +70 -60
package/src/memory/jobs-worker.ts +44 -28
package/src/memory/llm-request-log-store.ts +96 -12
package/src/memory/memory-recall-log-store.ts +49 -5
package/src/memory/migrations/203-drop-memory-items-tables.ts +33 -1
package/src/memory/migrations/206-memory-graph-node-edits.ts +19 -0
package/src/memory/migrations/206-scrub-corrupted-image-attachments.ts +131 -0
package/src/memory/migrations/207-conversation-graph-memory-state.ts +20 -0
package/src/memory/migrations/208-conversations-last-message-at.ts +35 -0
package/src/memory/migrations/209-strip-thinking-from-consolidated.ts +85 -0
package/src/memory/migrations/210-schedule-reuse-conversation.ts +13 -0
package/src/memory/migrations/211-memory-recall-logs-query-context.ts +21 -0
package/src/memory/migrations/212-llm-request-logs-created-at-index.ts +19 -0
package/src/memory/migrations/index.ts +8 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/conversations.ts +14 -0
package/src/memory/schema/infrastructure.ts +8 -1
package/src/memory/schema/memory-core.ts +0 -51
package/src/memory/schema/memory-graph.ts +15 -0
package/src/memory/task-memory-cleanup.ts +30 -11
package/src/notifications/copy-composer.ts +86 -0
package/src/notifications/decision-engine.ts +35 -0
package/src/permissions/checker.ts +12 -1
package/src/permissions/permission-mode-store.ts +180 -0
package/src/permissions/permission-mode.ts +31 -0
package/src/permissions/workspace-policy.ts +9 -0
package/src/prompts/system-prompt.ts +59 -7
package/src/prompts/templates/BOOTSTRAP-REFERENCE.md +100 -0
package/src/prompts/templates/BOOTSTRAP.md +70 -165
package/src/prompts/templates/HEARTBEAT.md +3 -1
package/src/prompts/templates/SOUL.md +25 -4
package/src/prompts/templates/UPDATES.md +8 -0
package/src/providers/anthropic/client.ts +107 -219
package/src/runtime/auth/route-policy.ts +23 -0
package/src/runtime/http-server.ts +32 -2
package/src/runtime/http-types.ts +12 -1
package/src/runtime/migrations/vbundle-builder.ts +389 -3
package/src/runtime/migrations/vbundle-importer.ts +8 -6
package/src/runtime/routes/__tests__/user-route-dispatcher.test.ts +378 -0
package/src/runtime/routes/app-management-routes.ts +1 -11
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +26 -0
package/src/runtime/routes/archive-utils.ts +29 -0
package/src/runtime/routes/avatar-routes.ts +2 -9
package/src/runtime/routes/btw-routes.ts +14 -1
package/src/runtime/routes/conversation-analysis-routes.ts +173 -0
package/src/runtime/routes/conversation-management-routes.ts +1 -14
package/src/runtime/routes/conversation-query-routes.ts +49 -3
package/src/runtime/routes/conversation-routes.ts +264 -44
package/src/runtime/routes/heartbeat-routes.ts +4 -10
package/src/runtime/routes/identity-routes.ts +53 -18
package/src/runtime/routes/llm-context-normalization.ts +14 -10
package/src/runtime/routes/log-export-routes.ts +23 -275
package/src/runtime/routes/memory-item-routes.test.ts +168 -233
package/src/runtime/routes/migration-routes.ts +18 -7
package/src/runtime/routes/profiler-routes.ts +350 -0
package/src/runtime/routes/schedule-routes.ts +27 -12
package/src/runtime/routes/settings-routes.ts +95 -8
package/src/runtime/routes/subagents-routes.ts +28 -7
package/src/runtime/routes/user-route-dispatcher.ts +223 -0
package/src/runtime/routes/user-routes.ts +41 -0
package/src/runtime/routes/workspace-routes.ts +0 -1
package/src/schedule/schedule-store.ts +30 -0
package/src/schedule/scheduler.ts +45 -18
package/src/skills/catalog-install.ts +10 -2
package/src/skills/managed-store.ts +2 -2
package/src/skills/skill-memory.ts +1 -293
package/src/subagent/index.ts +13 -3
package/src/subagent/manager.ts +308 -29
package/src/subagent/types.ts +68 -0
package/src/tasks/task-runner.ts +4 -4
package/src/tools/apps/executors.ts +29 -4
package/src/tools/filesystem/list.ts +93 -0
package/src/tools/permission-checker.ts +78 -0
package/src/tools/registry.ts +4 -0
package/src/tools/schedule/create.ts +3 -0
package/src/tools/schedule/list.ts +1 -0
package/src/tools/schedule/update.ts +6 -0
package/src/tools/shared/filesystem/errors.ts +5 -0
package/src/tools/shared/filesystem/file-ops-service.ts +90 -2
package/src/tools/shared/filesystem/types.ts +17 -0
package/src/tools/shared/shell-output.ts +31 -2
package/src/tools/subagent/abort.ts +12 -2
package/src/tools/subagent/message.ts +9 -2
package/src/tools/subagent/notify-parent.ts +79 -0
package/src/tools/subagent/read.ts +29 -8
package/src/tools/subagent/resolve.ts +21 -0
package/src/tools/subagent/spawn.ts +2 -0
package/src/tools/subagent/status.ts +11 -1
package/src/tools/system/avatar-generator.ts +3 -3
package/src/tools/system/register.ts +23 -0
package/src/tools/system/set-permission-mode.ts +103 -0
package/src/tools/terminal/parser.ts +30 -5
package/src/tools/terminal/safe-env.ts +16 -1
package/src/tools/tool-manifest.ts +6 -0
package/src/tools/types.ts +2 -0
package/src/util/logger.ts +1 -1
package/src/util/platform.ts +50 -17
package/src/workspace/migrations/023-move-config-files-to-workspace.ts +2 -2
package/src/workspace/migrations/024-move-runtime-files-to-workspace.ts +2 -2
package/src/workspace/migrations/028-recover-conversations-from-disk-view.ts +270 -0
package/src/workspace/migrations/029-seed-pkb.ts +84 -0
package/src/workspace/migrations/registry.ts +4 -0
package/src/workspace/top-level-renderer.ts +5 -9
package/src/__tests__/cli-memory.test.ts +0 -377
package/src/__tests__/clipboard.test.ts +0 -88
package/src/cli/cli-memory.ts +0 -179
package/src/util/clipboard.ts +0 -34

package/src/__tests__/profiler-run-store.test.ts ADDED

@@ -0,0 +1,441 @@
+/**
+ * Tests for the profiler run store: manifest management, retention sweep,
+ * active-run protection, oldest-first pruning, max-run-count pruning,
+ * active-run-over-budget signaling, and idempotent rescans.
+ */
+import {
+  existsSync,
+  mkdirSync,
+  readFileSync,
+  rmSync,
+  writeFileSync,
+} from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { afterEach, beforeEach, describe, expect, test } from "bun:test";
+import type { ProfilerRunManifest } from "../daemon/profiler-run-store.js";
+import { rescanRuns, runProfilerSweep } from "../daemon/profiler-run-store.js";
+// ── Test scaffolding ────────────────────────────────────────────────────
+let testDir: string;
+let runsDir: string;
+let origEnv: Record<string, string | undefined>;
+/**
+ * Test helper: create a fake profiler run directory at `runsDir/<runId>` and return its path (contents are described inline).
+ */
+function createRun(
+  runId: string,
+  opts?: {
+    sizeBytes?: number;
+    manifest?: Partial<ProfilerRunManifest>;
+  },
+): string {
+  const dir = join(runsDir, runId);
+  mkdirSync(dir, { recursive: true });
+  // Write a single payload file of the requested size (1024 bytes when sizeBytes is omitted)
+  const size = opts?.sizeBytes ?? 1024;
+  writeFileSync(join(dir, "profile.cpuprofile"), Buffer.alloc(size));
+  // Write manifest.json only when the caller passes `manifest`; omitted fields get the defaults below
+  if (opts?.manifest) {
+    const m: ProfilerRunManifest = {
+      runId, // always taken from the argument, never from opts.manifest
+      status: opts.manifest.status ?? "completed",
+      createdAt: opts.manifest.createdAt ?? new Date().toISOString(),
+      updatedAt: opts.manifest.updatedAt ?? new Date().toISOString(),
+      totalBytes: opts.manifest.totalBytes ?? size, // defaults to the payload size; manifest.json itself is not counted
+    };
+    writeFileSync(join(dir, "manifest.json"), JSON.stringify(m, null, 2));
+  }
+  return dir;
+}
+function readManifestFromDisk(runId: string): ProfilerRunManifest | null { // test helper: read runsDir/<runId>/manifest.json directly from disk
+  const manifestPath = join(runsDir, runId, "manifest.json");
+  try {
+    return JSON.parse(readFileSync(manifestPath, "utf-8")); // parsed JSON is returned as-is; its shape is not validated
+  } catch {
+    return null; // any read or parse failure is reported as "no manifest"
+  }
+}
+beforeEach(() => { // per-test setup: fresh temp workspace plus a clean profiler environment
+  testDir = join(
+    tmpdir(),
+    `vellum-profiler-test-${Date.now()}-${Math.random().toString(36).slice(2)}`,
+  );
+  runsDir = join(testDir, "data", "profiler", "runs");
+  mkdirSync(runsDir, { recursive: true });
+  // Snapshot the env vars this suite modifies so afterEach can restore them
+  origEnv = {
+    VELLUM_WORKSPACE_DIR: process.env.VELLUM_WORKSPACE_DIR,
+    VELLUM_PROFILER_RUN_ID: process.env.VELLUM_PROFILER_RUN_ID,
+    VELLUM_PROFILER_MAX_BYTES: process.env.VELLUM_PROFILER_MAX_BYTES,
+    VELLUM_PROFILER_MAX_RUNS: process.env.VELLUM_PROFILER_MAX_RUNS,
+    VELLUM_PROFILER_MIN_FREE_MB: process.env.VELLUM_PROFILER_MIN_FREE_MB,
+  };
+  // Point the workspace dir at the temp directory created above
+  process.env.VELLUM_WORKSPACE_DIR = testDir;
+  // Clear the profiler env vars so every test starts with none of them set
+  delete process.env.VELLUM_PROFILER_RUN_ID;
+  delete process.env.VELLUM_PROFILER_MAX_BYTES;
+  delete process.env.VELLUM_PROFILER_MAX_RUNS;
+  delete process.env.VELLUM_PROFILER_MIN_FREE_MB;
+});
+afterEach(() => {
+  // Restore every env var captured in origEnv by beforeEach
+  for (const [key, value] of Object.entries(origEnv)) {
+    if (value === undefined) {
+      delete process.env[key]; // was unset before the test, so unset it again
+    } else {
+      process.env[key] = value;
+    }
+  }
+  // Remove the per-test temp directory if it still exists
+  if (existsSync(testDir)) {
+    rmSync(testDir, { recursive: true, force: true });
+  }
+});
+// ── Tests ───────────────────────────────────────────────────────────────
+describe("Profiler run store", () => {
+  describe("rescanRuns", () => {
+    test("returns empty array when no runs directory exists", () => {
+      // Remove the runs directory that beforeEach created
+      rmSync(runsDir, { recursive: true, force: true });
+      const manifests = rescanRuns();
+      expect(manifests).toEqual([]);
+    });
+    test("returns empty array when runs directory is empty", () => {
+      const manifests = rescanRuns();
+      expect(manifests).toEqual([]);
+    });
+    test("creates manifests for run directories without existing manifests", () => {
+      createRun("run-001", { sizeBytes: 2048 });
+      createRun("run-002", { sizeBytes: 4096 });
+      const manifests = rescanRuns();
+      expect(manifests).toHaveLength(2);
+      const run1 = manifests.find((m) => m.runId === "run-001");
+      expect(run1).toBeDefined();
+      expect(run1!.status).toBe("completed");
+      // totalBytes includes manifest.json that rescan just wrote, so only a lower bound is asserted
+      expect(run1!.totalBytes).toBeGreaterThanOrEqual(2048);
+      const run2 = manifests.find((m) => m.runId === "run-002");
+      expect(run2).toBeDefined();
+      expect(run2!.status).toBe("completed");
+      expect(run2!.totalBytes).toBeGreaterThanOrEqual(4096);
+    });
+    test("marks the active run correctly", () => {
+      process.env.VELLUM_PROFILER_RUN_ID = "active-run";
+      createRun("active-run", { sizeBytes: 1024 }); // no manifest on disk for either run
+      createRun("old-run", { sizeBytes: 1024 });
+      const manifests = rescanRuns();
+      const active = manifests.find((m) => m.runId === "active-run");
+      const old = manifests.find((m) => m.runId === "old-run");
+      expect(active!.status).toBe("active");
+      expect(old!.status).toBe("completed");
+    });
+    test("transitions previously-active run to completed when no longer active", () => {
+      // Create a run whose on-disk manifest still says "active"
+      createRun("old-active", {
+        sizeBytes: 1024,
+        manifest: { status: "active", createdAt: "2025-01-01T00:00:00Z" },
+      });
+      // No VELLUM_PROFILER_RUN_ID set (beforeEach deletes it), so nothing is active
+      const manifests = rescanRuns();
+      const run = manifests.find((m) => m.runId === "old-active");
+      expect(run!.status).toBe("completed");
+      // Verify the transition was persisted to disk, not just returned
+      const onDisk = readManifestFromDisk("old-active");
+      expect(onDisk!.status).toBe("completed");
+    });
+    test("is idempotent — repeated calls after initial scan produce the same result", () => {
+      createRun("run-a", { sizeBytes: 1024 });
+      process.env.VELLUM_PROFILER_RUN_ID = "run-a";
+      // First call writes the manifest, which changes totalBytes, so it is excluded from the comparison
+      rescanRuns();
+      // Second and third calls should be stable
+      const second = rescanRuns();
+      const third = rescanRuns();
+      expect(second).toHaveLength(1);
+      expect(third).toHaveLength(1);
+      expect(second[0]!.runId).toBe(third[0]!.runId);
+      expect(second[0]!.status).toBe(third[0]!.status);
+      expect(second[0]!.totalBytes).toBe(third[0]!.totalBytes);
+    });
+    test("preserves createdAt from existing manifest", () => {
+      const originalCreatedAt = "2024-06-15T12:00:00Z";
+      createRun("preserved-run", {
+        sizeBytes: 1024,
+        manifest: {
+          status: "completed",
+          createdAt: originalCreatedAt, // explicit value; createRun would otherwise default to the current time
+        },
+      });
+      const manifests = rescanRuns();
+      const run = manifests.find((m) => m.runId === "preserved-run");
+      expect(run!.createdAt).toBe(originalCreatedAt);
+    });
+  });
+  describe("runProfilerSweep", () => {
+    test("no-ops when no runs exist", () => {
+      const result = runProfilerSweep();
+      expect(result.prunedCount).toBe(0);
+      expect(result.freedBytes).toBe(0);
+      expect(result.activeRunOverBudget).toBe(false);
+      expect(result.remainingRuns).toBe(0);
+    });
+    test("does not prune when under all budgets", () => {
+      process.env.VELLUM_PROFILER_MAX_BYTES = "1000000"; // 1 MB
+      process.env.VELLUM_PROFILER_MAX_RUNS = "10";
+      createRun("run-1", { sizeBytes: 1024 });
+      createRun("run-2", { sizeBytes: 1024 });
+      const result = runProfilerSweep();
+      expect(result.prunedCount).toBe(0);
+      expect(result.remainingRuns).toBe(2);
+      // Both directories still exist
+      expect(existsSync(join(runsDir, "run-1"))).toBe(true);
+      expect(existsSync(join(runsDir, "run-2"))).toBe(true);
+    });
+    test("prunes oldest completed runs when byte budget exceeded", () => {
+      // Set a very small byte budget
+      process.env.VELLUM_PROFILER_MAX_BYTES = "3000";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "100";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      // Create runs with explicit timestamps for ordering
+      createRun("oldest", {
+        sizeBytes: 2000,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-01-01T00:00:00Z",
+        },
+      });
+      createRun("middle", {
+        sizeBytes: 2000,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-02-01T00:00:00Z",
+        },
+      });
+      createRun("newest", {
+        sizeBytes: 2000,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-03-01T00:00:00Z",
+        },
+      });
+      const result = runProfilerSweep();
+      // Should prune until total bytes fit within 3000.
+      // Each run is ~2000 payload + manifest overhead. The sweep recomputes
+      // sizes so actual totals include the manifest file. At least 1 run
+      // should be pruned (the oldest).
+      expect(result.prunedCount).toBeGreaterThanOrEqual(1);
+      expect(result.freedBytes).toBeGreaterThan(0);
+      // The oldest should be gone
+      expect(existsSync(join(runsDir, "oldest"))).toBe(false);
+    });
+    test("prunes oldest completed runs when max-run-count exceeded", () => {
+      process.env.VELLUM_PROFILER_MAX_BYTES = "999999999";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "2";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("run-a", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-01-01T00:00:00Z",
+        },
+      });
+      createRun("run-b", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-02-01T00:00:00Z",
+        },
+      });
+      createRun("run-c", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-03-01T00:00:00Z",
+        },
+      });
+      createRun("run-d", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-04-01T00:00:00Z",
+        },
+      });
+      const result = runProfilerSweep();
+      // 4 completed runs, max 2: should prune 2 oldest
+      expect(result.prunedCount).toBe(2);
+      expect(existsSync(join(runsDir, "run-a"))).toBe(false);
+      expect(existsSync(join(runsDir, "run-b"))).toBe(false);
+      expect(existsSync(join(runsDir, "run-c"))).toBe(true);
+      expect(existsSync(join(runsDir, "run-d"))).toBe(true);
+      expect(result.remainingRuns).toBe(2);
+    });
+    test("never deletes the active run", () => {
+      process.env.VELLUM_PROFILER_RUN_ID = "current";
+      process.env.VELLUM_PROFILER_MAX_BYTES = "500";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "1";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("current", { sizeBytes: 2000 }); // no manifest on disk; named by VELLUM_PROFILER_RUN_ID above
+      createRun("old-completed", {
+        sizeBytes: 2000,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-01-01T00:00:00Z",
+        },
+      });
+      const result = runProfilerSweep();
+      // old-completed should be pruned, current should survive
+      expect(existsSync(join(runsDir, "current"))).toBe(true);
+      expect(existsSync(join(runsDir, "old-completed"))).toBe(false);
+      expect(result.prunedCount).toBe(1);
+    });
+    test("signals active-run-over-budget when active run exceeds byte budget", () => {
+      process.env.VELLUM_PROFILER_RUN_ID = "big-active";
+      process.env.VELLUM_PROFILER_MAX_BYTES = "500";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "100";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("big-active", { sizeBytes: 10000 }); // payload alone is 20x the 500-byte budget
+      const result = runProfilerSweep();
+      expect(result.activeRunOverBudget).toBe(true);
+      // Active run must still exist
+      expect(existsSync(join(runsDir, "big-active"))).toBe(true);
+      expect(result.remainingRuns).toBe(1);
+    });
+    test("deletes single oversized completed run to recover space", () => {
+      process.env.VELLUM_PROFILER_MAX_BYTES = "100";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "100";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("huge-completed", {
+        sizeBytes: 50000,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-01-01T00:00:00Z",
+        },
+      });
+      const result = runProfilerSweep();
+      expect(result.prunedCount).toBe(1);
+      expect(result.freedBytes).toBeGreaterThanOrEqual(50000);
+      expect(existsSync(join(runsDir, "huge-completed"))).toBe(false);
+    });
+    test("creates profiler directories on first sweep if missing", () => {
+      // Remove the whole profiler directory, including the runs/ subdirectory from beforeEach
+      rmSync(join(testDir, "data", "profiler"), {
+        recursive: true,
+        force: true,
+      });
+      const result = runProfilerSweep();
+      expect(result.prunedCount).toBe(0);
+      expect(existsSync(runsDir)).toBe(true);
+    });
+    test("sweep is idempotent — repeated calls produce consistent state", () => {
+      process.env.VELLUM_PROFILER_MAX_BYTES = "999999";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "10";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("stable-1", { sizeBytes: 1024 });
+      createRun("stable-2", { sizeBytes: 1024 });
+      const first = runProfilerSweep();
+      const second = runProfilerSweep();
+      expect(first.prunedCount).toBe(0);
+      expect(second.prunedCount).toBe(0);
+      expect(first.remainingRuns).toBe(second.remainingRuns);
+    });
+    test("active run is not counted against max completed runs", () => {
+      process.env.VELLUM_PROFILER_RUN_ID = "live";
+      process.env.VELLUM_PROFILER_MAX_BYTES = "999999";
+      process.env.VELLUM_PROFILER_MAX_RUNS = "2";
+      process.env.VELLUM_PROFILER_MIN_FREE_MB = "0";
+      createRun("live", { sizeBytes: 100 }); // no manifest on disk; named by VELLUM_PROFILER_RUN_ID above
+      createRun("done-1", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-01-01T00:00:00Z",
+        },
+      });
+      createRun("done-2", {
+        sizeBytes: 100,
+        manifest: {
+          status: "completed",
+          createdAt: "2025-02-01T00:00:00Z",
+        },
+      });
+      const result = runProfilerSweep();
+      // 2 completed runs = max, so nothing should be pruned
+      expect(result.prunedCount).toBe(0);
+      // Active + 2 completed = 3 remaining
+      expect(result.remainingRuns).toBe(3);
+      expect(existsSync(join(runsDir, "live"))).toBe(true);
+      expect(existsSync(join(runsDir, "done-1"))).toBe(true);
+      expect(existsSync(join(runsDir, "done-2"))).toBe(true);
+    });
+  });
+});

package/src/__tests__/proxy-approval-callback.test.ts CHANGED

@@ -189,7 +189,7 @@ describe("createProxyApprovalCallback", () => {
     expect(prompterSendToClient).not.toHaveBeenCalled();
   });
-  test("high-risk with plain allow rule (no allowHighRisk) falls through to prompt", async () => {
+  test("ask_missing_credential with allow rule auto-allows (medium risk)", async () => {
     findHighestPriorityRuleMock.mockReturnValue({
       id: "rule-hr-1",
       tool: "network_request",
@@ -198,53 +198,17 @@ describe("createProxyApprovalCallback", () => {
       decision: "allow" as const,
       priority: 100,
       createdAt: Date.now(),
-      // No allowHighRisk — should NOT auto-allow for high-risk decisions
     });
     const ctx = makeContext();
     const prompterSendToClient = mock(() => {});
     const prompter = new PermissionPrompter(prompterSendToClient);
-    const originalPrompt = prompter.prompt.bind(prompter);
-    prompter.prompt = async (...args) => {
-      const p = originalPrompt(...args);
-      await new Promise((r) => setTimeout(r, 10));
-      const call = (prompterSendToClient.mock.calls as unknown[][])[0];
-      const msg = call[0] as { requestId: string };
-      prompter.resolveConfirmation(msg.requestId, "allow");
-      return p;
-    };
     const callback = createProxyApprovalCallback(prompter, ctx);
-    // ask_missing_credential is high risk
     const result = await callback(makeAskMissingCredentialRequest());
     expect(result).toBe(true);
-    // Prompter SHOULD have been called — plain allow rule doesn't auto-allow high-risk
-    expect(prompterSendToClient).toHaveBeenCalled();
-  });
-  test("high-risk with allowHighRisk allow rule auto-allows without prompting", async () => {
-    findHighestPriorityRuleMock.mockReturnValue({
-      id: "rule-hr-2",
-      tool: "network_request",
-      pattern: "network_request:https://api.fal.ai:443/*",
-      scope: "/tmp/test-project",
-      decision: "allow" as const,
-      priority: 100,
-      createdAt: Date.now(),
-      allowHighRisk: true,
-    });
-    const ctx = makeContext();
-    const prompterSendToClient = mock(() => {});
-    const prompter = new PermissionPrompter(prompterSendToClient);
-    const callback = createProxyApprovalCallback(prompter, ctx);
-    const result = await callback(makeAskMissingCredentialRequest());
-    expect(result).toBe(true);
-    // Prompter should NOT have been called — allowHighRisk rule auto-allows
+    // Plain allow rule auto-allows medium-risk requests
     expect(prompterSendToClient).not.toHaveBeenCalled();
   });
@@ -436,7 +400,7 @@ describe("createProxyApprovalCallback", () => {
     await callback(makeAskUnauthenticatedRequest());
   });
-  test("uses high risk level for ask_missing_credential decisions", async () => {
+  test("uses medium risk level for ask_missing_credential decisions", async () => {
     const ctx = makeContext();
     const prompterSendToClient = mock(() => {});
     const prompter = new PermissionPrompter(prompterSendToClient);
@@ -447,8 +411,7 @@ describe("createProxyApprovalCallback", () => {
       await new Promise((r) => setTimeout(r, 10));
       const call = (prompterSendToClient.mock.calls as unknown[][])[0];
       const msg = call[0] as { requestId: string; riskLevel: string };
-      // Missing credential prompts are high risk — the target wants auth
-      expect(msg.riskLevel).toBe("high");
+      expect(msg.riskLevel).toBe("medium");
       prompter.resolveConfirmation(msg.requestId, "allow");
       return p;
     };
@@ -523,40 +486,6 @@ describe("createProxyApprovalCallback", () => {
   // in contrast to the proxied bash activation path which CANNOT (tested
   // in tool-executor.test.ts).
-  test("always_allow_high_risk persists rule with allowHighRisk flag", async () => {
-    const ctx = makeContext();
-    const prompterSendToClient = mock(() => {});
-    const prompter = new PermissionPrompter(prompterSendToClient);
-    const originalPrompt = prompter.prompt.bind(prompter);
-    prompter.prompt = async (...args) => {
-      const p = originalPrompt(...args);
-      await new Promise((r) => setTimeout(r, 10));
-      const call = (prompterSendToClient.mock.calls as unknown[][])[0];
-      const msg = call[0] as { requestId: string };
-      prompter.resolveConfirmation(
-        msg.requestId,
-        "always_allow_high_risk",
-        "network_request:https://api.fal.ai:443/*",
-        "/tmp/test-project",
-      );
-      return p;
-    };
-    const callback = createProxyApprovalCallback(prompter, ctx);
-    const result = await callback(makeAskMissingCredentialRequest());
-    expect(result).toBe(true);
-    expect(addRuleMock).toHaveBeenCalledWith(
-      "network_request",
-      "network_request:https://api.fal.ai:443/*",
-      "/tmp/test-project",
-      "allow",
-      100,
-      { allowHighRisk: true },
-    );
-  });
   test("one-time allow does NOT persist any rule", async () => {
     const ctx = makeContext();
     const prompterSendToClient = mock(() => {});

package/src/__tests__/registry.test.ts CHANGED Viewed

@@ -109,7 +109,7 @@ describe("tool registry dynamic-tools tools", () => {
 describe("tool manifest", () => {
   test("eager module tool names list contains expected count", () => {
-    expect(eagerModuleToolNames.length).toBe(9);
+    expect(eagerModuleToolNames.length).toBe(11);
   });
   test("explicit tools list includes memory and credential tools", () => {

package/src/__tests__/sandbox-host-parity.test.ts CHANGED Viewed

@@ -705,10 +705,11 @@ describe("Terminal output format: formatShellOutput shared by sandbox and host",
     const longOutput = "x".repeat(MAX_OUTPUT_LENGTH + 100);
     const result = formatShellOutput(longOutput, "", 0, false, 120);
-    expect(result.content.length).toBe(
-      MAX_OUTPUT_LENGTH + 1 + '<output_truncated limit="50K" />'.length,
-    );
-    expect(result.content).toContain("<output_truncated");
+    expect(result.content).toContain('limit="20K"');
+    expect(result.content).toContain('file="');
+    // The <output_truncated tag starts right after MAX_OUTPUT_LENGTH chars + 1 newline
+    const tagStart = result.content.indexOf("<output_truncated");
+    expect(tagStart).toBe(MAX_OUTPUT_LENGTH + 1);
   });
   test("timed-out command appends timeout tag and sets isError", () => {