npm - @vellumai/assistant - Versions diffs - 0.7.3 → 0.8.0 - Mend

@vellumai/assistant 0.7.3 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (169)

package/ARCHITECTURE.md +29 -28
package/Dockerfile +1 -0
package/__tests__/permissions/gateway-threshold-reader.test.ts +236 -9
package/bun.lock +3 -0
package/knip.json +1 -0
package/node_modules/@vellumai/ipc-server-utils/bun.lock +24 -0
package/node_modules/@vellumai/ipc-server-utils/package.json +18 -0
package/node_modules/@vellumai/ipc-server-utils/src/index.ts +6 -0
package/node_modules/@vellumai/ipc-server-utils/src/socket-watchdog.test.ts +430 -0
package/node_modules/@vellumai/ipc-server-utils/src/socket-watchdog.ts +221 -0
package/node_modules/@vellumai/ipc-server-utils/tsconfig.json +20 -0
package/openapi.yaml +22 -4
package/package.json +3 -1
package/src/__tests__/annotate-risk-options.test.ts +291 -0
package/src/__tests__/approval-cascade.test.ts +8 -16
package/src/__tests__/approval-routes-http.test.ts +6 -0
package/src/__tests__/auto-analysis-end-to-end.test.ts +12 -25
package/src/__tests__/call-constants.test.ts +10 -1
package/src/__tests__/call-controller.test.ts +127 -0
package/src/__tests__/cli-memory-v2-reembed-skills.test.ts +58 -28
package/src/__tests__/config-loader-platform-defaults.test.ts +284 -1
package/src/__tests__/context-search-memory-source.test.ts +3 -26
package/src/__tests__/context-search-pkb-source.test.ts +12 -6
package/src/__tests__/conversation-abort-tool-results.test.ts +1 -6
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +1 -1
package/src/__tests__/conversation-agent-loop.test.ts +3 -3
package/src/__tests__/conversation-confirmation-signals.test.ts +5 -13
package/src/__tests__/conversation-init.benchmark.test.ts +1 -1
package/src/__tests__/conversation-process-callsite.test.ts +1 -6
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -6
package/src/__tests__/conversation-runtime-assembly.test.ts +15 -6
package/src/__tests__/conversation-slash-unknown.test.ts +1 -6
package/src/__tests__/conversation-surfaces-action-delivery.test.ts +170 -9
package/src/__tests__/conversation-surfaces-data-persist.test.ts +73 -1
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +59 -0
package/src/__tests__/conversation-workspace-injection.test.ts +1 -7
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -7
package/src/__tests__/filing-service.test.ts +2 -19
package/src/__tests__/handlers-skills-memory-v2-reseed.test.ts +10 -26
package/src/__tests__/injector-chain.test.ts +24 -16
package/src/__tests__/injector-pkb-v2-silenced.test.ts +10 -7
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +154 -67
package/src/__tests__/notification-decision-fallback.test.ts +91 -0
package/src/__tests__/notification-decision-strategy.test.ts +22 -0
package/src/__tests__/oauth-cli.test.ts +121 -0
package/src/__tests__/relay-server.test.ts +46 -2
package/src/__tests__/secret-prompt-log-hygiene.test.ts +7 -5
package/src/__tests__/secret-prompter-channel-fallback.test.ts +7 -5
package/src/__tests__/secret-response-routing.test.ts +7 -5
package/src/__tests__/server-history-render.test.ts +82 -0
package/src/__tests__/skill-include-graph.test.ts +31 -0
package/src/__tests__/skill-load-tool.test.ts +44 -16
package/src/__tests__/skills.test.ts +39 -0
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +0 -42
package/src/__tests__/tool-executor.test.ts +155 -0
package/src/__tests__/voice-session-bridge.test.ts +3 -0
package/src/__tests__/workspace-migration-069-seed-onboarding-threads.test.ts +120 -0
package/src/__tests__/workspace-migration-071-remove-safe-storage-release-note.test.ts +206 -0
package/src/__tests__/workspace-migration-safe-storage-limits-release.test.ts +15 -27
package/src/agent/loop.ts +11 -0
package/src/approvals/guardian-decision-primitive.ts +0 -13
package/src/approvals/guardian-request-resolvers.ts +4 -32
package/src/calls/call-constants.ts +5 -8
package/src/calls/call-controller.ts +130 -67
package/src/calls/relay-server.ts +7 -1
package/src/calls/voice-session-bridge.ts +1 -1
package/src/cli/commands/memory-v2.ts +7 -7
package/src/cli/commands/oauth/__tests__/connect.test.ts +0 -254
package/src/cli/commands/oauth/connect.ts +10 -52
package/src/config/bundled-skills/app-builder/SKILL.md +1 -3
package/src/config/feature-flag-registry.json +1 -17
package/src/config/loader.ts +72 -19
package/src/config/schemas/memory-v2.ts +1 -1
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +32 -0
package/src/daemon/conversation-agent-loop-handlers.ts +32 -0
package/src/daemon/conversation-agent-loop.ts +13 -10
package/src/daemon/conversation-lifecycle.ts +22 -8
package/src/daemon/conversation-surfaces.ts +16 -14
package/src/daemon/conversation-tool-setup.ts +9 -5
package/src/daemon/conversation.ts +1 -1
package/src/daemon/handlers/shared.ts +26 -0
package/src/daemon/host-bash-proxy.ts +1 -1
package/src/daemon/host-browser-proxy.ts +1 -1
package/src/daemon/host-cu-proxy.ts +1 -1
package/src/daemon/host-file-proxy.ts +1 -1
package/src/daemon/host-transfer-proxy.ts +2 -2
package/src/daemon/lifecycle.ts +88 -73
package/src/daemon/memory-v2-startup.ts +55 -14
package/src/daemon/message-types/messages.ts +19 -1
package/src/documents/document-store.ts +35 -1
package/src/filing/filing-service.ts +2 -3
package/src/heartbeat/heartbeat-service.ts +1 -1
package/src/ipc/assistant-server.ts +93 -36
package/src/ipc/skill-server.ts +99 -42
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +10 -57
package/src/memory/context-search/sources/memory-v2.ts +1 -17
package/src/memory/context-search/sources/memory.ts +2 -2
package/src/memory/context-search/sources/pkb.ts +2 -3
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +104 -61
package/src/memory/graph/__tests__/handle-remember-v2.test.ts +11 -26
package/src/memory/graph/conversation-graph-memory.ts +32 -9
package/src/memory/graph/graph-search.test.ts +6 -5
package/src/memory/graph/graph-search.ts +3 -4
package/src/memory/graph/retriever.test.ts +12 -7
package/src/memory/graph/retriever.ts +4 -5
package/src/memory/graph/tool-handlers.ts +3 -4
package/src/memory/graph/tools.ts +4 -4
package/src/memory/indexer.ts +1 -2
package/src/memory/jobs/__tests__/embed-concept-page.test.ts +116 -0
package/src/memory/jobs/embed-concept-page.ts +223 -87
package/src/memory/jobs-worker.ts +8 -4
package/src/memory/pkb/pkb-search.test.ts +6 -5
package/src/memory/pkb/pkb-search.ts +4 -5
package/src/memory/qdrant-client.ts +3 -0
package/src/memory/search/semantic.ts +4 -5
package/src/memory/v2/__tests__/activation.test.ts +35 -5
package/src/memory/v2/__tests__/consolidation-job.test.ts +21 -32
package/src/memory/v2/__tests__/injection.test.ts +140 -23
package/src/memory/v2/__tests__/qdrant.test.ts +310 -9
package/src/memory/v2/__tests__/sim.test.ts +118 -7
package/src/memory/v2/__tests__/static-context.test.ts +1 -13
package/src/memory/v2/__tests__/sweep-job.test.ts +19 -33
package/src/memory/v2/consolidation-job.ts +7 -8
package/src/memory/v2/injection.ts +32 -12
package/src/memory/v2/page-store.ts +39 -0
package/src/memory/v2/prompts/consolidation.ts +5 -0
package/src/memory/v2/qdrant.ts +209 -48
package/src/memory/v2/sim.ts +67 -26
package/src/memory/v2/static-context.ts +4 -8
package/src/memory/v2/sweep-job.ts +5 -6
package/src/memory/v2/types.ts +7 -0
package/src/notifications/copy-composer.ts +46 -12
package/src/notifications/decision-engine.ts +46 -0
package/src/permissions/gateway-threshold-reader.ts +116 -8
package/src/permissions/prompter.ts +86 -96
package/src/permissions/secret-prompter.ts +31 -31
package/src/plugins/defaults/injectors.ts +1 -2
package/src/proactive-artifact/job.test.ts +51 -4
package/src/proactive-artifact/job.ts +16 -2
package/src/proactive-artifact/message-copy.ts +18 -1
package/src/prompts/templates/SOUL.md +13 -28
package/src/runtime/auth/route-policy.ts +1 -0
package/src/runtime/channel-approvals.ts +3 -2
package/src/runtime/guardian-reply-router.ts +0 -10
package/src/runtime/pending-interactions.ts +19 -15
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +147 -0
package/src/runtime/routes/approval-routes.ts +7 -3
package/src/runtime/routes/consolidation-routes.ts +8 -9
package/src/runtime/routes/conversation-query-routes.ts +44 -1
package/src/runtime/routes/debug-bash-routes.ts +2 -0
package/src/runtime/routes/filing-routes.ts +2 -3
package/src/runtime/routes/inbound-stages/guardian-reply-intercept.ts +0 -3
package/src/runtime/routes/memory-item-routes.test.ts +3 -9
package/src/runtime/routes/memory-item-routes.ts +5 -6
package/src/runtime/routes/memory-v2-routes.ts +103 -17
package/src/skills/include-graph.ts +35 -13
package/src/tools/document/document-tool.ts +20 -0
package/src/tools/executor.ts +18 -2
package/src/tools/memory/register.test.ts +7 -5
package/src/tools/permission-checker.ts +15 -0
package/src/tools/skills/load.ts +24 -20
package/src/tools/tool-name-aliases.ts +19 -0
package/src/tools/types.ts +19 -1
package/src/workspace/migrations/067-release-notes-safe-storage-limits.ts +4 -62
package/src/workspace/migrations/069-seed-onboarding-threads.ts +28 -0
package/src/workspace/migrations/070-memory-v2-summary-schema-rebuild.ts +31 -0
package/src/workspace/migrations/071-remove-safe-storage-release-note.ts +111 -0
package/src/workspace/migrations/registry.ts +6 -0

package/src/__tests__/relay-server.test.ts CHANGED Viewed

@@ -362,7 +362,9 @@ function getLatestAssistantText(conversationId: string): string | null {
     if (Array.isArray(parsed)) {
       return parsed
         .filter(
-          (block): block is {
+          (
+            block,
+          ): block is {
             type: string;
             text?: string;
             surfaceType?: string;
@@ -2332,7 +2334,7 @@ describe("relay-server", () => {
       expect(relay.getConnectionState()).toBe("awaiting_name");
-      // Fallback prompt should NOT include assistant name but should include guardian label
+      // Fallback prompt should use the existing guardian-label wording.
       const textMessages = ws.sentMessages
         .map((raw) => JSON.parse(raw) as { type: string; token?: string })
         .filter((m) => m.type === "text");
@@ -2348,6 +2350,48 @@ describe("relay-server", () => {
     }
   });
+  test("inbound voice: unknown caller name capture does not speak a UUID assistant name", async () => {
+    const prevName = mockAssistantName;
+    mockAssistantName = "11111111-2222-4333-8444-555555555555";
+    const db = getDb();
+    db.run("DELETE FROM contact_channels");
+    db.run("DELETE FROM contacts");
+    try {
+      ensureConversation("conv-invite-uuid-name");
+      const session = createCallSession({
+        conversationId: "conv-invite-uuid-name",
+        provider: "twilio",
+        fromNumber: "+12125550157",
+        toNumber: "+12125550111",
+      });
+      const { ws, relay } = createMockWs(session.id);
+      await relay.handleMessage(
+        JSON.stringify({
+          type: "setup",
+          callSid: "CA_invite_uuid_name",
+          from: "+12125550157",
+          to: "+12125550111",
+        }),
+      );
+      expect(relay.getConnectionState()).toBe("awaiting_name");
+      const promptText = ws.sentMessages
+        .map((raw) => JSON.parse(raw) as { type: string; token?: string })
+        .filter((m) => m.type === "text")
+        .map((m) => m.token ?? "")
+        .join("");
+      expect(promptText).toContain("Hi, this is my human's assistant.");
+      expect(promptText).not.toContain("11111111-2222-4333-8444-555555555555");
+      relay.destroy();
+    } finally {
+      mockAssistantName = prevName;
+    }
+  });
   // ── Friend-initiated in-call guardian approval flow ────────────────────
   test("name capture flow: caller provides name and enters guardian decision wait", async () => {

package/src/__tests__/secret-prompt-log-hygiene.test.ts CHANGED Viewed

@@ -39,15 +39,17 @@ mock.module("../runtime/assistant-event-hub.js", () => ({
 }));
 // Stub pendingInteractions — SecretPrompter registers/resolves there now
+// Use a real Map so SecretPrompter can store and retrieve promptResolve/promptReject callbacks.
+const _piStore = new Map<string, object>();
 mock.module("../runtime/pending-interactions.js", () => ({
-  register: () => {},
-  resolve: () => undefined,
-  get: () => undefined,
-  getAll: () => [],
+  register: (id: string, entry: object) => _piStore.set(id, entry),
+  resolve: (id: string) => { const e = _piStore.get(id); _piStore.delete(id); return e; },
+  get: (id: string) => _piStore.get(id),
+  getAll: () => [..._piStore.values()],
   getByConversation: () => [],
   getByKind: () => [],
   removeByConversation: () => {},
-  clear: () => {},
+  clear: () => _piStore.clear(),
 }));
 // Use a tiny timeout so the setTimeout branch fires quickly in tests

package/src/__tests__/secret-prompter-channel-fallback.test.ts CHANGED Viewed

@@ -38,15 +38,17 @@ mock.module("../runtime/assistant-event-hub.js", () => ({
   broadcastMessage: (msg: ServerMessage) => broadcastMessages.push(msg),
 }));
+// Use a real Map so SecretPrompter can store and retrieve promptResolve/promptReject callbacks.
+const _piStore = new Map<string, object>();
 mock.module("../runtime/pending-interactions.js", () => ({
-  register: () => {},
-  resolve: () => undefined,
-  get: () => undefined,
-  getAll: () => [],
+  register: (id: string, entry: object) => _piStore.set(id, entry),
+  resolve: (id: string) => { const e = _piStore.get(id); _piStore.delete(id); return e; },
+  get: (id: string) => _piStore.get(id),
+  getAll: () => [..._piStore.values()],
   getByConversation: () => [],
   getByKind: () => [],
   removeByConversation: () => {},
-  clear: () => {},
+  clear: () => _piStore.clear(),
 }));
 const { SecretPrompter } = await import("../permissions/secret-prompter.js");

package/src/__tests__/secret-response-routing.test.ts CHANGED Viewed

@@ -11,15 +11,17 @@ mock.module("../runtime/assistant-event-hub.js", () => ({
   broadcastMessage: (msg: ServerMessage) => broadcastedMessages.push(msg),
 }));
+// Use a real Map so SecretPrompter can store and retrieve promptResolve/promptReject callbacks.
+const _piStore = new Map<string, object>();
 mock.module("../runtime/pending-interactions.js", () => ({
-  register: () => {},
-  resolve: () => undefined,
-  get: () => undefined,
-  getAll: () => [],
+  register: (id: string, entry: object) => _piStore.set(id, entry),
+  resolve: (id: string) => { const e = _piStore.get(id); _piStore.delete(id); return e; },
+  get: (id: string) => _piStore.get(id),
+  getAll: () => [..._piStore.values()],
   getByConversation: () => [],
   getByKind: () => [],
   removeByConversation: () => {},
-  clear: () => {},
+  clear: () => _piStore.clear(),
 }));
 const { SecretPrompter } = await import("../permissions/secret-prompter.js");

package/src/__tests__/server-history-render.test.ts CHANGED Viewed

@@ -154,6 +154,88 @@ describe("renderHistoryContent", () => {
     ]);
   });
+  // ── Persisted risk-option ladders (Phase B of conflation track) ─────────────
+  test("hydrates persisted _risk*Options annotations onto tool calls", () => {
+    // Mirrors what `annotatePersistedAssistantMessage` writes to the DB so the
+    // rule editor's chip ladder survives chat-history reload. Without these,
+    // hydrated chips fall back to the synthesized `*` allowlist (see web's
+    // `synthesizeFallbackOption` in RuleEditorModal.tsx).
+    const scopeOptions = [
+      { pattern: "exact", label: "exact: rm -rf /tmp" },
+      { pattern: "by-program", label: "All rm" },
+    ];
+    const allowlistOptions = [
+      { label: "exact", description: "exact match", pattern: "rm -rf /tmp" },
+      { label: "All rm", description: "All rm commands", pattern: "rm *" },
+    ];
+    const directoryScopeOptions = [
+      { scope: "/Users/me/code", label: "in code/" },
+      { scope: "everywhere", label: "Everywhere" },
+    ];
+    const output = renderHistoryContent([
+      {
+        type: "tool_use",
+        id: "tu_1",
+        name: "bash",
+        input: { command: "rm -rf /tmp" },
+        _riskLevel: "high",
+        _matchedTrustRuleId: "rule_42",
+        _riskScopeOptions: scopeOptions,
+        _riskAllowlistOptions: allowlistOptions,
+        _riskDirectoryScopeOptions: directoryScopeOptions,
+      },
+    ]);
+    const [entry] = output.toolCalls;
+    expect(entry.riskLevel).toBe("high");
+    expect(entry.matchedTrustRuleId).toBe("rule_42");
+    expect(entry.riskScopeOptions).toEqual(scopeOptions);
+    expect(entry.riskAllowlistOptions).toEqual(allowlistOptions);
+    expect(entry.riskDirectoryScopeOptions).toEqual(directoryScopeOptions);
+  });
+  test("ignores non-array _risk*Options annotations", () => {
+    // Defensive: a malformed persisted block should not throw or coerce.
+    const output = renderHistoryContent([
+      {
+        type: "tool_use",
+        id: "tu_1",
+        name: "bash",
+        input: { command: "ls" },
+        _riskLevel: "low",
+        _riskScopeOptions: "not an array",
+        _riskAllowlistOptions: { not: "an array" },
+        _riskDirectoryScopeOptions: 42,
+      },
+    ]);
+    const [entry] = output.toolCalls;
+    expect(entry.riskLevel).toBe("low");
+    expect(entry.riskScopeOptions).toBeUndefined();
+    expect(entry.riskAllowlistOptions).toBeUndefined();
+    expect(entry.riskDirectoryScopeOptions).toBeUndefined();
+  });
+  test("omits absent _risk*Options annotations", () => {
+    const output = renderHistoryContent([
+      {
+        type: "tool_use",
+        id: "tu_1",
+        name: "bash",
+        input: { command: "ls" },
+        _riskLevel: "low",
+      },
+    ]);
+    const [entry] = output.toolCalls;
+    expect(entry.riskLevel).toBe("low");
+    expect(entry.riskScopeOptions).toBeUndefined();
+    expect(entry.riskAllowlistOptions).toBeUndefined();
+    expect(entry.riskDirectoryScopeOptions).toBeUndefined();
+  });
   test("handles mixed text and tool blocks", () => {
     const output = renderHistoryContent([
       { type: "text", text: "Let me look that up." },

package/src/__tests__/skill-include-graph.test.ts CHANGED Viewed

@@ -6,6 +6,7 @@ import {
   getImmediateChildren,
   indexCatalogById,
   traverseIncludes,
+  validateIncludeCycles,
   validateIncludes,
 } from "../skills/include-graph.js";
@@ -299,6 +300,36 @@ describe("validateIncludes — cycle detection", () => {
   });
 });
+describe("validateIncludeCycles", () => {
+  test("skips missing children while still detecting available cycles", () => {
+    const catalog = [
+      makeSkill("root", ["missing", "a"]),
+      makeSkill("a", ["b"]),
+      makeSkill("b", ["a"]),
+    ];
+    const index = indexCatalogById(catalog);
+    const result = validateIncludeCycles("root", index);
+    expect(result.ok).toBe(false);
+    if (!result.ok && result.error === "cycle") {
+      expect(result.cyclePath).toEqual(["a", "b", "a"]);
+    }
+  });
+  test("returns success when the only invalid edges are missing children", () => {
+    const catalog = [makeSkill("root", ["missing"])];
+    const index = indexCatalogById(catalog);
+    const result = validateIncludeCycles("root", index);
+    expect(result.ok).toBe(true);
+    if (result.ok) {
+      expect(result.visited).toEqual(["root"]);
+    }
+  });
+});
 describe("collectAllMissing", () => {
   test("returns empty set when skill has no includes", () => {
     const catalog = [makeSkill("root")];

package/src/__tests__/skill-load-tool.test.ts CHANGED Viewed

@@ -266,17 +266,19 @@ describe("skill_load tool", () => {
     expect(markers.length).toBe(1);
   });
-  test("returns error when skill has missing include", async () => {
+  test("continues when skill has missing include", async () => {
     writeSkillWithIncludes("parent", "Parent", "Has missing child", "Body", [
       "missing-child",
     ]);
     writeFileSync(join(TEST_DIR, "skills", "SKILLS.md"), "- parent\n");
     const result = await executeSkillLoad({ skill: "parent" });
-    expect(result.isError).toBe(true);
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Skill: Parent");
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
     expect(result.content).toContain("missing-child");
-    expect(result.content).toContain("not found");
-    expect(result.content).not.toContain("<loaded_skill");
+    expect(result.content).toContain('<loaded_skill id="parent"');
+    expect(result.content).not.toContain('<loaded_skill id="missing-child"');
   });
   test("returns error when skill has circular include", async () => {
@@ -317,7 +319,7 @@ describe("skill_load tool", () => {
     expect(result.content).toContain("<loaded_skill");
   });
-  test("failed include validation (missing) emits no loaded_skill marker", async () => {
+  test("missing include emits only the parent loaded_skill marker", async () => {
     const skillDir = join(TEST_DIR, "skills", "marker-missing");
     mkdirSync(skillDir, { recursive: true });
     writeFileSync(
@@ -327,9 +329,13 @@ describe("skill_load tool", () => {
     writeFileSync(join(TEST_DIR, "skills", "SKILLS.md"), "- marker-missing\n");
     const result = await executeSkillLoad({ skill: "marker-missing" });
-    expect(result.isError).toBe(true);
-    expect(result.content).not.toContain("<loaded_skill");
-    expect(result.content).not.toMatch(/<loaded_skill\s/);
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
+    expect(result.content).toContain("nonexistent");
+    const markers = result.content.match(/<loaded_skill/g) || [];
+    expect(markers.length).toBe(1);
+    expect(result.content).toContain('<loaded_skill id="marker-missing"');
+    expect(result.content).not.toContain('<loaded_skill id="nonexistent"');
   });
   test("failed include validation (cycle) emits no loaded_skill marker", async () => {
@@ -365,6 +371,28 @@ describe("skill_load tool", () => {
     expect(result.content).toContain("Skill: No Includes");
   });
+  test("bundled app-builder loads when frontend-design is unavailable", async () => {
+    const result = await executeSkillLoad({ skill: "app-builder" });
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Skill: App Builder");
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
+    expect(result.content).toContain("frontend-design");
+    expect(result.content).toContain('<loaded_skill id="app-builder"');
+    expect(result.content).not.toContain('<loaded_skill id="frontend-design"');
+  });
+  test("bundled phone-calls loads when setup includes are unavailable", async () => {
+    const result = await executeSkillLoad({ skill: "phone-calls" });
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Skill: Phone Calls");
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
+    expect(result.content).toContain("twilio-setup");
+    expect(result.content).toContain('<loaded_skill id="phone-calls"');
+    expect(result.content).not.toContain('<loaded_skill id="twilio-setup"');
+  });
   test("skill_load output includes immediate child metadata", async () => {
     writeSkill("child-skill", "Child Skill", "A child skill", "Child body");
     const parentDir = join(TEST_DIR, "skills", "parent-with-children");
@@ -883,7 +911,7 @@ describe("skill_load tool", () => {
     expect(mockAutoInstall).toHaveBeenCalledWith("trans-c");
   });
-  test("returns error when auto-install of missing include fails", async () => {
+  test("continues when auto-install of missing include fails", async () => {
     writeSkillWithIncludes(
       "fail-parent",
       "Fail Parent",
@@ -902,10 +930,12 @@ describe("skill_load tool", () => {
     });
     const result = await executeSkillLoad({ skill: "fail-parent" });
-    expect(result.isError).toBe(true);
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Skill: Fail Parent");
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
     expect(result.content).toContain("dep-x");
-    expect(result.content).toContain("not found");
-    expect(result.content).not.toContain("<loaded_skill");
+    expect(result.content).toContain('<loaded_skill id="fail-parent"');
+    expect(result.content).not.toContain('<loaded_skill id="dep-x"');
   });
   test("stops after MAX_INSTALL_ROUNDS", async () => {
@@ -941,10 +971,8 @@ describe("skill_load tool", () => {
     });
     const result = await executeSkillLoad({ skill: "loop-root" });
-    // Should terminate with an error (the final dep is still missing)
-    expect(result.isError).toBe(true);
-    expect(result.content).toContain("not found");
-    // Should have terminated — installCount should be bounded by MAX_INSTALL_ROUNDS (5)
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain("Suggested Included Skills (not loaded):");
     expect(installCount).toBeLessThanOrEqual(5);
   });
 });

package/src/__tests__/skills.test.ts CHANGED Viewed

@@ -1,6 +1,7 @@
 import {
   existsSync,
   mkdirSync,
+  readdirSync,
   readFileSync,
   rmSync,
   symlinkSync,
@@ -678,3 +679,41 @@ describe("bundled computer-use skill", () => {
     ]);
   });
 });
+describe("skill source ownership", () => {
+  const BUNDLED_SKILLS_DIR = join(
+    import.meta.dir,
+    "..",
+    "config",
+    "bundled-skills",
+  );
+  const FIRST_PARTY_SKILLS_DIR = join(
+    import.meta.dir,
+    "..",
+    "..",
+    "..",
+    "skills",
+  );
+  function collectSourceSkillIds(rootDir: string): string[] {
+    return readdirSync(rootDir, { withFileTypes: true })
+      .filter(
+        (entry) =>
+          entry.isDirectory() &&
+          existsSync(join(rootDir, entry.name, "SKILL.md")),
+      )
+      .map((entry) => entry.name)
+      .sort((a, b) => a.localeCompare(b));
+  }
+  test("bundled skills are not duplicated in the first-party source catalog", () => {
+    const firstPartyIds = new Set(
+      collectSourceSkillIds(FIRST_PARTY_SKILLS_DIR),
+    );
+    const duplicates = collectSourceSkillIds(BUNDLED_SKILLS_DIR).filter((id) =>
+      firstPartyIds.has(id),
+    );
+    expect(duplicates).toEqual([]);
+  });
+});

package/src/__tests__/tool-execution-pipeline.benchmark.test.ts CHANGED Viewed

@@ -30,16 +30,6 @@ mock.module("../util/logger.js", () => ({
     }),
 }));
-// Allow toggling between no-rule and matched-rule paths
-let mockRuleResponse: import("../permissions/types.js").TrustRule | null = null;
-mock.module("../permissions/trust-store.js", () => ({
-  addRule: () => {},
-  findHighestPriorityRule: () => mockRuleResponse,
-  onRulesChanged: () => {},
-  clearCache: () => {},
-}));
 mock.module("../config/loader.js", () => ({
   getConfig: () => ({
     ui: {},
@@ -302,38 +292,6 @@ describe("Tool execution pipeline benchmark", () => {
     expect(results[0].decision).toBe("allow");
   });
-  test("check: matched allow-rule path for medium-risk tool", async () => {
-    // Exercise the code path where findHighestPriorityRule returns a matching
-    // allow rule, rather than always falling through to the no-rule default.
-    mockRuleResponse = {
-      id: "bench:allow-file_write",
-      tool: "file_write",
-      pattern: "**",
-      scope: "/tmp",
-      decision: "allow",
-      priority: 90,
-      createdAt: Date.now(),
-    };
-    try {
-      const { timings, results } = await benchmarkAsync(
-        () => check("file_write", { path: "/tmp/out.txt" }, "/tmp"),
-        ITERATIONS,
-      );
-      const p50 = percentile(timings, 50);
-      const p95 = percentile(timings, 95);
-      expect(p50).toBeLessThan(10);
-      expect(p95).toBeLessThan(20);
-      // Medium-risk with a matching allow rule should auto-allow
-      expect(results[0].decision).toBe("allow");
-      expect(results[0].matchedRule?.id).toBe("bench:allow-file_write");
-    } finally {
-      mockRuleResponse = null;
-    }
-  });
   test("check: permission cost is stable across different input paths", async () => {
     // Verify that the permission check cost doesn't vary with input path length/complexity.
     // Actual tool-execution-time independence is tested in the ToolExecutor section below.

package/src/__tests__/tool-executor.test.ts CHANGED Viewed

@@ -73,6 +73,11 @@ let cachedAssessmentOverride:
       riskLevel: string;
       reason: string;
       scopeOptions: Array<{ pattern: string; label: string }>;
+      allowlistOptions?: Array<{
+        label: string;
+        description: string;
+        pattern: string;
+      }>;
       directoryScopeOptions?: Array<{ scope: string; label: string }>;
       matchType: string;
     }
@@ -202,6 +207,32 @@ describe("ToolExecutor allowedToolNames gating", () => {
     expect(result.content).toBe("ok");
   });
+  test("canonicalizes app-builder create_app alias before active-tool gating", async () => {
+    const executor = new ToolExecutor(makePrompter());
+    const allowed = new Set(["app_create"]);
+    const result = await executor.execute(
+      "create_app",
+      { name: "Calculator" },
+      makeContext({ allowedToolNames: allowed }),
+    );
+    expect(result.isError).toBe(false);
+    expect(result.content).toBe("ok");
+  });
+  test("preserves exact active create_app tool before applying compatibility aliases", async () => {
+    const executor = new ToolExecutor(makePrompter());
+    const allowed = new Set(["create_app", "app_create"]);
+    const result = await executor.execute(
+      "create_app",
+      { name: "Custom App" },
+      makeContext({ allowedToolNames: allowed }),
+    );
+    expect(result.isError).toBe(false);
+    expect(lastCheckArgs?.toolName).toBe("create_app");
+  });
   test("blocks execution when tool is NOT in the allowed set", async () => {
     const executor = new ToolExecutor(makePrompter());
     const allowed = new Set(["file_read", "bash"]);
@@ -1123,4 +1154,128 @@ describe("ToolExecutionResult includes risk metadata from classifier assessment"
       { scope: "/tmp", label: "Anywhere in tmp/" },
     ]);
   });
+  test("auto-approved tool result includes riskAllowlistOptions when classifier emits them (Minimatch-glob shape for save path)", async () => {
+    cachedAssessmentOverride = {
+      riskLevel: "medium",
+      reason: "Reads workspace files",
+      // Display ladder (regex shape — not for save).
+      scopeOptions: [
+        { pattern: "^echo\\b.*hello$", label: "echo hello" },
+        { pattern: "^echo\\b", label: "echo *" },
+      ],
+      // Save ladder (Minimatch-glob shape — what gateway matches against).
+      allowlistOptions: [
+        {
+          label: "echo hello",
+          description: "This exact command",
+          pattern: "echo hello",
+        },
+        {
+          label: "echo *",
+          description: "Any echo command",
+          pattern: "action:echo",
+        },
+      ],
+      matchType: "registry",
+    };
+    const executor = new ToolExecutor(makePrompter());
+    const result = await executor.execute(
+      "file_read",
+      { path: "README.md" },
+      makeContext({ requireFreshApproval: true }),
+    );
+    expect(result.isError).toBe(false);
+    // Both shapes flow through independently — same labels, different patterns.
+    expect(result.riskScopeOptions).toEqual([
+      { pattern: "^echo\\b.*hello$", label: "echo hello" },
+      { pattern: "^echo\\b", label: "echo *" },
+    ]);
+    expect(result.riskAllowlistOptions).toEqual([
+      {
+        label: "echo hello",
+        description: "This exact command",
+        pattern: "echo hello",
+      },
+      {
+        label: "echo *",
+        description: "Any echo command",
+        pattern: "action:echo",
+      },
+    ]);
+  });
+  test("riskAllowlistOptions is undefined when classifier did not produce allowlist (e.g. web-risk classifier)", async () => {
+    cachedAssessmentOverride = {
+      riskLevel: "low",
+      reason: "GET request to public URL",
+      scopeOptions: [{ pattern: "https://example.com/.*", label: "example.com" }],
+      // allowlistOptions intentionally omitted — some classifiers don't emit them.
+      matchType: "registry",
+    };
+    const executor = new ToolExecutor(makePrompter());
+    const result = await executor.execute(
+      "file_read",
+      { path: "README.md" },
+      makeContext({ requireFreshApproval: true }),
+    );
+    expect(result.isError).toBe(false);
+    // Display ladder still flows; save ladder is absent so the client must
+    // fall back to a synthesized option (or omit save).
+    expect(result.riskScopeOptions).toEqual([
+      { pattern: "https://example.com/.*", label: "example.com" },
+    ]);
+    expect(result.riskAllowlistOptions).toBeUndefined();
+  });
+  test("riskAllowlistOptions is undefined when no classifier ran (MCP tools)", async () => {
+    // cachedAssessmentOverride is undefined — no classifier ran.
+    const executor = new ToolExecutor(makePrompter());
+    const result = await executor.execute(
+      "file_read",
+      { path: "README.md" },
+      makeContext(),
+    );
+    expect(result.isError).toBe(false);
+    expect(result.riskScopeOptions).toBeUndefined();
+    expect(result.riskAllowlistOptions).toBeUndefined();
+  });
+  test("denied tool result still carries riskAllowlistOptions for the rule editor save path", async () => {
+    checkResultOverride = { decision: "deny", reason: "Blocked by deny rule" };
+    cachedAssessmentOverride = {
+      riskLevel: "high",
+      reason: "Recursive force delete",
+      scopeOptions: [{ pattern: "^rm\\s+-rf", label: "rm -rf *" }],
+      allowlistOptions: [
+        {
+          label: "rm -rf *",
+          description: "Any rm -rf command",
+          pattern: "action:rm",
+        },
+      ],
+      matchType: "registry",
+    };
+    const executor = new ToolExecutor(makePrompter());
+    const result = await executor.execute(
+      "file_read",
+      { path: "anything" },
+      makeContext({ requireFreshApproval: true }),
+    );
+    expect(result.isError).toBe(true);
+    expect(result.riskAllowlistOptions).toEqual([
+      {
+        label: "rm -rf *",
+        description: "Any rm -rf command",
+        pattern: "action:rm",
+      },
+    ]);
+  });
 });

package/src/__tests__/voice-session-bridge.test.ts CHANGED Viewed

@@ -652,6 +652,9 @@ describe("voice-session-bridge", () => {
     expect(prompt).toContain(
       "If your assistant name is not known, skip the name and just identify yourself as the guardian's assistant.",
     );
+    expect(prompt).toContain(
+      "Never use a UUID-shaped internal assistant ID as your spoken name.",
+    );
     expect(prompt).toContain(
       'Do NOT say "I\'m calling" or "I\'m calling on behalf of".',
     );