npm - @vellumai/assistant - Versions diffs - 0.5.9 → 0.5.11 - Mend

@vellumai/assistant 0.5.9 → 0.5.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (278)

package/AGENTS.md +9 -1
package/ARCHITECTURE.md +48 -48
package/Dockerfile +2 -0
package/README.md +1 -1
package/docs/architecture/integrations.md +6 -13
package/docs/architecture/memory.md +7 -12
package/docs/architecture/security.md +5 -5
package/docs/credential-execution-service.md +9 -9
package/docs/skills.md +1 -1
package/node_modules/@vellumai/credential-storage/src/index.ts +2 -2
package/node_modules/@vellumai/credential-storage/src/static-credentials.ts +1 -1
package/openapi.yaml +7130 -0
package/package.json +2 -1
package/scripts/generate-openapi.ts +562 -0
package/src/__tests__/acp-session.test.ts +239 -44
package/src/__tests__/assistant-feature-flag-guard.test.ts +8 -8
package/src/__tests__/assistant-feature-flag-guardrails.test.ts +5 -86
package/src/__tests__/assistant-feature-flags-integration.test.ts +7 -14
package/src/__tests__/browser-skill-endstate.test.ts +1 -1
package/src/__tests__/btw-routes.test.ts +8 -0
package/src/__tests__/bundled-skill-retrieval-guard.test.ts +10 -10
package/src/__tests__/channel-approvals.test.ts +7 -7
package/src/__tests__/channel-readiness-service.test.ts +41 -0
package/src/__tests__/config-schema.test.ts +10 -2
package/src/__tests__/context-memory-e2e.test.ts +2 -6
package/src/__tests__/conversation-skill-tools.test.ts +1 -3
package/src/__tests__/conversation-title-service.test.ts +2 -15
package/src/__tests__/credential-execution-feature-gates.test.ts +4 -8
package/src/__tests__/credential-execution-managed-contract.test.ts +8 -8
package/src/__tests__/credential-security-e2e.test.ts +4 -4
package/src/__tests__/credential-security-invariants.test.ts +3 -3
package/src/__tests__/credentials-cli.test.ts +3 -3
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +1 -1
package/src/__tests__/gateway-only-guard.test.ts +3 -0
package/src/__tests__/heartbeat-service.test.ts +35 -0
package/src/__tests__/host-shell-tool.test.ts +1 -1
package/src/__tests__/inline-skill-load-permissions.test.ts +3 -3
package/src/__tests__/llm-request-log-turn-query.test.ts +64 -0
package/src/__tests__/log-export-workspace.test.ts +1 -1
package/src/__tests__/mcp-client-auth.test.ts +1 -1
package/src/__tests__/memory-lifecycle-e2e.test.ts +2 -2
package/src/__tests__/memory-recall-log-store.test.ts +182 -0
package/src/__tests__/memory-recall-quality.test.ts +6 -8
package/src/__tests__/memory-regressions.test.ts +53 -42
package/src/__tests__/memory-retrieval.benchmark.test.ts +5 -9
package/src/__tests__/messaging-skill-split.test.ts +2 -17
package/src/__tests__/oauth-cli.test.ts +98 -551
package/src/__tests__/platform-callback-registration.test.ts +119 -0
package/src/__tests__/secret-ingress-channel.test.ts +261 -0
package/src/__tests__/secret-ingress-cli.test.ts +201 -0
package/src/__tests__/secret-ingress-http.test.ts +312 -0
package/src/__tests__/secret-ingress.test.ts +283 -0
package/src/__tests__/secret-onetime-send.test.ts +4 -4
package/src/__tests__/skill-feature-flags-integration.test.ts +4 -4
package/src/__tests__/skill-feature-flags.test.ts +11 -19
package/src/__tests__/skill-load-feature-flag.test.ts +1 -1
package/src/__tests__/skill-load-inline-command.test.ts +3 -3
package/src/__tests__/skill-load-inline-includes.test.ts +2 -2
package/src/__tests__/skill-memory.test.ts +2 -4
package/src/__tests__/skill-projection-feature-flag.test.ts +2 -4
package/src/__tests__/skill-projection.benchmark.test.ts +1 -3
package/src/__tests__/skills.test.ts +16 -2
package/src/__tests__/slack-channel-config.test.ts +1 -1
package/src/__tests__/slack-skill.test.ts +5 -69
package/src/__tests__/vellum-self-knowledge-inline-command.test.ts +1 -1
package/src/__tests__/workspace-migration-015-migrate-credentials-to-keychain.test.ts +5 -238
package/src/__tests__/workspace-migration-016-migrate-credentials-from-keychain.test.ts +5 -206
package/src/__tests__/workspace-migration-018-rekey-compound-credential-keys.test.ts +181 -0
package/src/__tests__/workspace-migrations-runner.test.ts +15 -7
package/src/acp/client-handler.ts +113 -31
package/src/acp/session-manager.ts +29 -27
package/src/approvals/guardian-request-resolvers.ts +1 -1
package/src/cli/AGENTS.md +73 -0
package/src/cli/commands/autonomy.ts +3 -5
package/src/cli/commands/credential-execution.ts +1 -2
package/src/cli/commands/credentials.ts +4 -4
package/src/cli/commands/memory.ts +2 -3
package/src/cli/commands/oauth/__tests__/connect.test.ts +785 -0
package/src/cli/commands/oauth/__tests__/disconnect.test.ts +760 -0
package/src/cli/commands/oauth/__tests__/mode.test.ts +672 -0
package/src/cli/commands/oauth/__tests__/ping.test.ts +690 -0
package/src/cli/commands/oauth/__tests__/status.test.ts +579 -0
package/src/cli/commands/oauth/__tests__/token.test.ts +467 -0
package/src/cli/commands/oauth/apps.ts +29 -11
package/src/cli/commands/oauth/connect.ts +373 -0
package/src/cli/commands/oauth/connections.ts +14 -493
package/src/cli/commands/oauth/disconnect.ts +333 -0
package/src/cli/commands/oauth/index.ts +62 -10
package/src/cli/commands/oauth/mode.ts +263 -0
package/src/cli/commands/oauth/ping.ts +222 -0
package/src/cli/commands/oauth/providers.ts +30 -3
package/src/cli/commands/oauth/request.ts +576 -0
package/src/cli/commands/oauth/shared.ts +132 -0
package/src/cli/commands/oauth/status.ts +202 -0
package/src/cli/commands/oauth/token.ts +159 -0
package/src/cli/commands/platform.ts +20 -14
package/src/cli.ts +82 -17
package/src/config/assistant-feature-flags.ts +74 -11
package/src/config/bundled-skills/_shared/CLI_RETRIEVAL_PATTERN.md +1 -1
package/src/config/bundled-skills/app-builder/tools/app-create.ts +1 -1
package/src/config/bundled-skills/messaging/SKILL.md +13 -36
package/src/config/bundled-skills/messaging/TOOLS.json +9 -9
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +1 -1
package/src/config/bundled-skills/notifications/SKILL.md +1 -1
package/src/config/bundled-skills/schedule/SKILL.md +2 -2
package/src/config/bundled-skills/settings/SKILL.md +5 -3
package/src/config/bundled-skills/settings/TOOLS.json +17 -0
package/src/config/bundled-skills/settings/tools/avatar-get.ts +50 -0
package/src/config/bundled-skills/settings/tools/avatar-remove.ts +7 -0
package/src/config/bundled-skills/settings/tools/avatar-update.ts +6 -1
package/src/config/bundled-skills/settings/tools/identity-avatar.ts +55 -0
package/src/config/bundled-skills/skills-catalog/SKILL.md +3 -3
package/src/config/bundled-skills/slack/SKILL.md +58 -44
package/src/config/bundled-tool-registry.ts +2 -19
package/src/config/env.ts +5 -1
package/src/config/feature-flag-registry.json +57 -41
package/src/config/loader.ts +4 -0
package/src/config/schemas/platform.ts +0 -8
package/src/config/schemas/security.ts +9 -1
package/src/config/schemas/services.ts +1 -1
package/src/config/skill-state.ts +1 -3
package/src/config/skills.ts +2 -4
package/src/credential-execution/feature-gates.ts +9 -16
package/src/credential-execution/process-manager.ts +12 -0
package/src/daemon/config-watcher.ts +4 -0
package/src/daemon/conversation-agent-loop-handlers.ts +10 -0
package/src/daemon/conversation-agent-loop.ts +49 -2
package/src/daemon/conversation-memory.ts +0 -1
package/src/daemon/handlers/config-slack-channel.ts +43 -1
package/src/daemon/handlers/conversations.ts +41 -33
package/src/daemon/lifecycle.ts +28 -5
package/src/daemon/message-types/acp.ts +0 -15
package/src/daemon/message-types/memory.ts +0 -1
package/src/daemon/message-types/messages.ts +9 -1
package/src/daemon/message-types/schedules.ts +9 -0
package/src/daemon/server.ts +19 -7
package/src/email/feature-gate.ts +3 -3
package/src/heartbeat/heartbeat-service.ts +48 -0
package/src/inbound/platform-callback-registration.ts +61 -7
package/src/mcp/mcp-oauth-provider.ts +3 -3
package/src/memory/app-store.ts +3 -3
package/src/memory/conversation-crud.ts +124 -0
package/src/memory/conversation-title-service.ts +7 -17
package/src/memory/db-init.ts +8 -0
package/src/memory/embedding-local.ts +47 -2
package/src/memory/indexer.ts +13 -10
package/src/memory/items-extractor.ts +12 -4
package/src/memory/job-utils.ts +5 -0
package/src/memory/jobs-store.ts +10 -2
package/src/memory/journal-memory.ts +6 -2
package/src/memory/llm-request-log-store.ts +88 -21
package/src/memory/memory-recall-log-store.ts +128 -0
package/src/memory/migrations/194-memory-recall-logs.ts +50 -0
package/src/memory/migrations/195-oauth-providers-ping-config.ts +23 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/migrations/validate-migration-state.ts +14 -1
package/src/memory/retriever.test.ts +4 -5
package/src/memory/schema/infrastructure.ts +31 -0
package/src/memory/schema/oauth.ts +3 -0
package/src/messaging/providers/telegram-bot/adapter.ts +1 -1
package/src/oauth/connect-orchestrator.ts +54 -0
package/src/oauth/manual-token-connection.ts +5 -5
package/src/oauth/oauth-store.ts +26 -5
package/src/oauth/seed-providers.ts +10 -1
package/src/permissions/checker.ts +2 -2
package/src/permissions/trust-client.ts +2 -2
package/src/platform/client.ts +2 -2
package/src/prompts/journal-context.ts +6 -1
package/src/providers/anthropic/client.ts +143 -1
package/src/runtime/auth/__tests__/middleware.test.ts +19 -0
package/src/runtime/auth/route-policy.ts +0 -1
package/src/runtime/btw-sidechain.ts +7 -1
package/src/runtime/channel-approvals.ts +2 -2
package/src/runtime/channel-readiness-service.ts +30 -7
package/src/runtime/http-router.ts +31 -0
package/src/runtime/http-server.ts +21 -4
package/src/runtime/http-types.ts +2 -0
package/src/runtime/pending-interactions.ts +21 -3
package/src/runtime/routes/acp-routes.ts +46 -28
package/src/runtime/routes/app-management-routes.ts +123 -0
package/src/runtime/routes/app-routes.ts +31 -0
package/src/runtime/routes/approval-routes.ts +108 -3
package/src/runtime/routes/attachment-routes.ts +45 -0
package/src/runtime/routes/avatar-routes.ts +16 -0
package/src/runtime/routes/brain-graph-routes.ts +18 -0
package/src/runtime/routes/btw-routes.ts +20 -0
package/src/runtime/routes/call-routes.ts +81 -0
package/src/runtime/routes/channel-readiness-routes.ts +48 -7
package/src/runtime/routes/channel-routes.ts +18 -0
package/src/runtime/routes/channel-verification-routes.ts +49 -1
package/src/runtime/routes/contact-routes.ts +77 -0
package/src/runtime/routes/conversation-attention-routes.ts +37 -0
package/src/runtime/routes/conversation-management-routes.ts +94 -0
package/src/runtime/routes/conversation-query-routes.ts +78 -0
package/src/runtime/routes/conversation-routes.ts +115 -38
package/src/runtime/routes/conversation-starter-routes.ts +29 -0
package/src/runtime/routes/debug-routes.ts +23 -0
package/src/runtime/routes/diagnostics-routes.ts +30 -0
package/src/runtime/routes/documents-routes.ts +42 -0
package/src/runtime/routes/events-routes.ts +10 -0
package/src/runtime/routes/global-search-routes.ts +35 -0
package/src/runtime/routes/guardian-action-routes.ts +47 -2
package/src/runtime/routes/guardian-approval-prompt.ts +77 -2
package/src/runtime/routes/heartbeat-routes.ts +278 -0
package/src/runtime/routes/host-bash-routes.ts +16 -1
package/src/runtime/routes/host-cu-routes.ts +23 -1
package/src/runtime/routes/host-file-routes.ts +18 -1
package/src/runtime/routes/identity-routes.ts +35 -0
package/src/runtime/routes/inbound-message-handler.ts +46 -25
package/src/runtime/routes/inbound-stages/secret-ingress-check.ts +30 -2
package/src/runtime/routes/inbound-stages/transcribe-audio.ts +1 -2
package/src/runtime/routes/integrations/twilio.ts +32 -22
package/src/runtime/routes/invite-routes.ts +83 -0
package/src/runtime/routes/log-export-routes.ts +14 -0
package/src/runtime/routes/memory-item-routes.ts +99 -1
package/src/runtime/routes/migration-rollback-routes.ts +25 -0
package/src/runtime/routes/migration-routes.ts +40 -0
package/src/runtime/routes/notification-routes.ts +20 -0
package/src/runtime/routes/oauth-apps.ts +11 -3
package/src/runtime/routes/pairing-routes.ts +15 -0
package/src/runtime/routes/recording-routes.ts +72 -0
package/src/runtime/routes/schedule-routes.ts +77 -5
package/src/runtime/routes/secret-routes.ts +63 -1
package/src/runtime/routes/settings-routes.ts +91 -1
package/src/runtime/routes/skills-routes.ts +98 -16
package/src/runtime/routes/subagents-routes.ts +38 -3
package/src/runtime/routes/surface-action-routes.ts +66 -24
package/src/runtime/routes/surface-content-routes.ts +20 -0
package/src/runtime/routes/telemetry-routes.ts +12 -0
package/src/runtime/routes/trace-event-routes.ts +25 -0
package/src/runtime/routes/trust-rules-routes.ts +46 -0
package/src/runtime/routes/tts-routes.ts +15 -4
package/src/runtime/routes/upgrade-broadcast-routes.ts +38 -0
package/src/runtime/routes/usage-routes.ts +59 -0
package/src/runtime/routes/watch-routes.ts +28 -0
package/src/runtime/routes/work-items-routes.ts +59 -0
package/src/runtime/routes/workspace-commit-routes.ts +12 -0
package/src/runtime/routes/workspace-routes.ts +102 -0
package/src/schedule/scheduler.ts +7 -1
package/src/security/AGENTS.md +7 -0
package/src/security/credential-backend.ts +1 -1
package/src/security/encrypted-store.ts +3 -3
package/src/security/oauth2.ts +55 -0
package/src/security/secret-ingress.ts +174 -0
package/src/security/secret-patterns.ts +133 -0
package/src/security/secret-scanner.ts +28 -117
package/src/signals/confirm.ts +12 -8
package/src/signals/user-message.ts +18 -3
package/src/skills/skill-memory.ts +1 -2
package/src/tasks/task-runner.ts +7 -1
package/src/tools/credentials/broker.ts +1 -1
package/src/tools/credentials/metadata-store.ts +1 -1
package/src/tools/credentials/vault.ts +2 -3
package/src/tools/memory/definitions.ts +1 -1
package/src/tools/memory/handlers.test.ts +2 -4
package/src/tools/skills/load.ts +1 -1
package/src/tools/terminal/safe-env.ts +7 -0
package/src/tools/tool-manifest.ts +1 -1
package/src/util/log-redact.ts +9 -34
package/src/workspace/migrations/015-migrate-credentials-to-keychain.ts +13 -148
package/src/workspace/migrations/016-migrate-credentials-from-keychain.ts +7 -145
package/src/workspace/migrations/AGENTS.md +11 -0
package/src/workspace/migrations/runner.ts +16 -6
package/src/workspace/migrations/types.ts +7 -0
package/docs/architecture/keychain-broker.md +0 -69
package/src/__tests__/keychain-broker-client.test.ts +0 -800
package/src/cli/commands/oauth/platform.ts +0 -525
package/src/config/bundled-skills/slack/TOOLS.json +0 -272
package/src/config/bundled-skills/slack/tools/shared.ts +0 -34
package/src/config/bundled-skills/slack/tools/slack-add-reaction.ts +0 -27
package/src/config/bundled-skills/slack/tools/slack-channel-details.ts +0 -38
package/src/config/bundled-skills/slack/tools/slack-channel-permissions.ts +0 -146
package/src/config/bundled-skills/slack/tools/slack-configure-channels.ts +0 -105
package/src/config/bundled-skills/slack/tools/slack-delete-message.ts +0 -26
package/src/config/bundled-skills/slack/tools/slack-edit-message.ts +0 -27
package/src/config/bundled-skills/slack/tools/slack-leave-channel.ts +0 -25
package/src/config/bundled-skills/slack/tools/slack-scan-digest.ts +0 -372
package/src/security/keychain-broker-client.ts +0 -446

package/src/__tests__/acp-session.test.ts CHANGED Viewed

@@ -1,11 +1,9 @@
 import { beforeEach, describe, expect, mock, test } from "bun:test";
-import {
-  resolvePermission,
-  VellumAcpClientHandler,
-} from "../acp/client-handler.js";
+import { VellumAcpClientHandler } from "../acp/client-handler.js";
 import { AcpSessionManager } from "../acp/session-manager.js";
 import type { ServerMessage } from "../daemon/message-protocol.js";
+import * as pendingInteractions from "../runtime/pending-interactions.js";
 // ---------------------------------------------------------------------------
 // VellumAcpClientHandler tests
@@ -14,18 +12,17 @@ import type { ServerMessage } from "../daemon/message-protocol.js";
 describe("VellumAcpClientHandler", () => {
   let sent: ServerMessage[];
   let sendToVellum: (msg: ServerMessage) => void;
-  let pendingPermissions: Map<string, { resolve: (optionId: string) => void }>;
   let handler: VellumAcpClientHandler;
   beforeEach(() => {
     sent = [];
     sendToVellum = (msg) => sent.push(msg);
-    pendingPermissions = new Map();
     handler = new VellumAcpClientHandler(
       "session-1",
       sendToVellum,
-      pendingPermissions,
+      "conv-parent",
     );
+    pendingInteractions.clear();
   });
   describe("sessionUpdate", () => {
@@ -152,7 +149,7 @@ describe("VellumAcpClientHandler", () => {
   });
   describe("requestPermission", () => {
-    test("sends permission request and resolves when permission is granted", async () => {
+    test("sends confirmation_request and resolves when permission is granted", async () => {
       const resultPromise = handler.requestPermission({
         toolCall: {
           title: "Run command",
@@ -165,52 +162,135 @@ describe("VellumAcpClientHandler", () => {
         ],
       } as any);
-      // Should have sent a permission request
+      // Should have sent a standard confirmation_request with ACP context
       expect(sent).toHaveLength(1);
       const msg = sent[0] as any;
-      expect(msg.type).toBe("acp_permission_request");
-      expect(msg.acpSessionId).toBe("session-1");
-      expect(msg.toolTitle).toBe("Run command");
-      expect(msg.toolKind).toBe("execute");
-      expect(msg.options).toHaveLength(2);
-      // A pending permission should exist
-      expect(pendingPermissions.size).toBe(1);
+      expect(msg.type).toBe("confirmation_request");
+      expect(msg.toolName).toBe("ACP Agent: Run command");
+      expect(msg.riskLevel).toBe("medium"); // ACP defaults to medium
+      expect(msg.persistentDecisionsAllowed).toBe(false);
+      expect(msg.allowlistOptions).toEqual([]);
+      // ACP-specific fields passed through for client rendering
+      expect(msg.acpToolKind).toBe("execute");
+      expect(msg.acpOptions).toEqual([
+        { optionId: "allow", name: "Allow", kind: "allow_once" },
+        { optionId: "deny", name: "Deny", kind: "reject_once" },
+      ]);
       const requestId = msg.requestId;
-      // Resolve the permission
-      resolvePermission(pendingPermissions, requestId, "allow");
+      // Resolve via the pendingInteractions tracker (same as POST /v1/confirm)
+      const interaction = pendingInteractions.resolve(requestId);
+      expect(interaction).toBeDefined();
+      expect(interaction!.kind).toBe("acp_confirmation");
+      interaction!.directResolve!("allow");
       const result = await resultPromise;
       expect(result).toEqual({
         outcome: { outcome: "selected", optionId: "allow" },
       });
-      expect(pendingPermissions.size).toBe(0);
     });
-  });
-});
-// ---------------------------------------------------------------------------
-// resolvePermission standalone tests
-// ---------------------------------------------------------------------------
+    test("maps deny decision to reject_once option", async () => {
+      const resultPromise = handler.requestPermission({
+        toolCall: {
+          title: "Write file",
+          kind: "edit",
+          rawInput: { path: "/tmp/test.txt" },
+        },
+        options: [
+          { optionId: "opt-allow", name: "Allow", kind: "allow_once" },
+          { optionId: "opt-deny", name: "Deny", kind: "reject_once" },
+        ],
+      } as any);
-describe("resolvePermission", () => {
-  test("resolves and removes the pending entry", () => {
-    let resolved = "";
-    const pending = new Map<string, { resolve: (id: string) => void }>();
-    pending.set("req-1", { resolve: (id) => (resolved = id) });
+      const msg = sent[0] as any;
+      expect(msg.riskLevel).toBe("medium"); // ACP defaults to medium
-    resolvePermission(pending, "req-1", "allow");
+      const interaction = pendingInteractions.resolve(msg.requestId);
+      interaction!.directResolve!("deny");
-    expect(resolved).toBe("allow");
-    expect(pending.size).toBe(0);
-  });
+      const result = await resultPromise;
+      expect(result).toEqual({
+        outcome: { outcome: "selected", optionId: "opt-deny" },
+      });
+    });
+    test("defaults riskLevel to medium for all ACP permissions", async () => {
+      handler.requestPermission({
+        toolCall: {
+          title: "Read file",
+          kind: "read",
+        },
+        options: [{ optionId: "allow", name: "Allow", kind: "allow_once" }],
+      } as any);
+      const msg = sent[0] as any;
+      expect(msg.riskLevel).toBe("medium");
+    });
+    test("ACP registration survives sendToVellum overwrite (makeEventSender race)", async () => {
+      // Simulate makeEventSender: when sendToVellum is called with a
+      // confirmation_request, it overwrites the pendingInteractions entry
+      // with a normal "confirmation" (no directResolve). This is what
+      // happens in production because sendToVellum goes through the
+      // conversation's event sender.
+      const overwritingSend = (msg: ServerMessage) => {
+        sent.push(msg);
+        if ((msg as any).type === "confirmation_request") {
+          pendingInteractions.register((msg as any).requestId, {
+            conversation: {} as any, // fake conversation
+            conversationId: "conv-123",
+            kind: "confirmation",
+            confirmationDetails: {
+              toolName: (msg as any).toolName,
+              input: (msg as any).input,
+              riskLevel: (msg as any).riskLevel,
+              allowlistOptions: [],
+              scopeOptions: [],
+            },
+            // NO directResolve — this is the bug scenario
+          });
+        }
+      };
+      // Create handler with the overwriting sender
+      const racyHandler = new VellumAcpClientHandler(
+        "session-racy",
+        overwritingSend,
+        "conv-racy",
+      );
+      const resultPromise = racyHandler.requestPermission({
+        toolCall: {
+          title: "Write file",
+          kind: "edit",
+          rawInput: "test",
+        },
+        options: [
+          { optionId: "yes", name: "Allow", kind: "allow_once" },
+          { optionId: "no", name: "Deny", kind: "reject_once" },
+        ],
+      } as any);
-  test("is a no-op when request ID is not found", () => {
-    const pending = new Map<string, { resolve: (id: string) => void }>();
-    // Should not throw
-    resolvePermission(pending, "nonexistent", "allow");
-    expect(pending.size).toBe(0);
+      const requestId = (sent[sent.length - 1] as any).requestId;
+      // The critical assertion: after requestPermission completes setup,
+      // the pendingInteractions entry must be the ACP one with directResolve,
+      // NOT the overwritten "confirmation" without it.
+      const interaction = pendingInteractions.resolve(requestId);
+      expect(interaction).toBeDefined();
+      expect(interaction!.kind).toBe("acp_confirmation");
+      expect(interaction!.directResolve).toBeDefined();
+      // Resolve it — this would fail silently if the overwrite won
+      interaction!.directResolve!("allow");
+      const result = await resultPromise;
+      expect(result).toEqual({
+        outcome: { outcome: "selected", optionId: "yes" },
+      });
+    });
   });
 });
@@ -270,11 +350,126 @@ describe("AcpSessionManager", () => {
     });
   });
-  describe("resolvePermission", () => {
-    test("logs warning for unknown request ID (no throw)", () => {
-      const manager = new AcpSessionManager(5);
-      // Should not throw — just logs a warning
-      manager.resolvePermission("unknown-req", "allow");
+  describe("session cleanup after prompt", () => {
+    test("completed session is removed from the session map", async () => {
+      let resolvePrompt: (v: { stopReason: string }) => void;
+      const promptPromise = new Promise<{ stopReason: string }>((r) => {
+        resolvePrompt = r;
+      });
+      const manager = new AcpSessionManager(1);
+      const sendToVellum = mock(() => {});
+      // Inject a fake session directly into the manager to avoid needing
+      // a real child process.
+      const fakeProcess = {
+        prompt: () => promptPromise,
+        kill: mock(() => {}),
+        spawn: mock(() => {}),
+        initialize: mock(() => Promise.resolve()),
+        createSession: mock(() => Promise.resolve("proto-session")),
+        cancel: mock(() => Promise.resolve()),
+      };
+      const fakeHandler = new VellumAcpClientHandler(
+        "test-session",
+        sendToVellum,
+        "conv-1",
+      );
+      // Access private sessions map via any cast
+      const sessions = (manager as any).sessions as Map<string, any>;
+      const entry = {
+        process: fakeProcess,
+        state: {
+          id: "test-session",
+          agentId: "agent-1",
+          acpSessionId: "proto-session",
+          status: "running",
+          startedAt: Date.now(),
+        },
+        clientHandler: fakeHandler,
+        sendToVellum,
+        currentPrompt: null as any,
+        parentConversationId: "conv-1",
+        cwd: "/tmp",
+      };
+      sessions.set("test-session", entry);
+      // Fire the prompt in the background via the private method
+      const bgPromise = (manager as any).firePromptInBackground(
+        "test-session",
+        entry,
+        "proto-session",
+        "do something",
+      );
+      entry.currentPrompt = bgPromise;
+      // Session exists before completion
+      expect((manager.getStatus() as any[]).length).toBe(1);
+      // Complete the prompt
+      resolvePrompt!({ stopReason: "end_turn" });
+      await bgPromise;
+      // Session should be cleaned up
+      expect((manager.getStatus() as any[]).length).toBe(0);
+      expect(fakeProcess.kill).toHaveBeenCalled();
+    });
+    test("failed session is removed from the session map", async () => {
+      const manager = new AcpSessionManager(1);
+      const sendToVellum = mock(() => {});
+      let rejectPrompt: (e: Error) => void;
+      const promptPromise = new Promise<{ stopReason: string }>((_r, rej) => {
+        rejectPrompt = rej;
+      });
+      const fakeProcess = {
+        prompt: () => promptPromise,
+        kill: mock(() => {}),
+      };
+      const fakeHandler = new VellumAcpClientHandler(
+        "test-session-2",
+        sendToVellum,
+        "conv-2",
+      );
+      const sessions = (manager as any).sessions as Map<string, any>;
+      const entry = {
+        process: fakeProcess,
+        state: {
+          id: "test-session-2",
+          agentId: "agent-1",
+          acpSessionId: "proto-session-2",
+          status: "running",
+          startedAt: Date.now(),
+        },
+        clientHandler: fakeHandler,
+        sendToVellum,
+        currentPrompt: null as any,
+        parentConversationId: "conv-2",
+        cwd: "/tmp",
+      };
+      sessions.set("test-session-2", entry);
+      const bgPromise = (manager as any).firePromptInBackground(
+        "test-session-2",
+        entry,
+        "proto-session-2",
+        "do something",
+      );
+      entry.currentPrompt = bgPromise;
+      expect((manager.getStatus() as any[]).length).toBe(1);
+      // Fail the prompt
+      rejectPrompt!(new Error("agent crashed"));
+      await bgPromise;
+      // Session should be cleaned up even on failure
+      expect((manager.getStatus() as any[]).length).toBe(0);
+      expect(fakeProcess.kill).toHaveBeenCalled();
     });
   });

package/src/__tests__/assistant-feature-flag-guard.test.ts CHANGED Viewed

@@ -7,11 +7,11 @@ import { describe, expect, test } from "bun:test";
  * Guard tests for assistant feature flags.
  *
  * 1. Key format validation: ensure production code uses the canonical
- *    `feature_flags.<flagId>.enabled` format, not the legacy
- *    `skills.<id>.enabled` format.
+ *    simple kebab-case format (e.g., "browser", "ces-tools"), not the
+ *    legacy `skills.<id>.enabled` format.
  *
  * 2. Declaration coverage: ensure all assistant-scope flag keys in the
- *    unified registry conform to the canonical format.
+ *    unified registry conform to the simple kebab-case format.
  *
  * See AGENTS.md "Assistant Feature Flags" for the full convention.
  */
@@ -53,7 +53,7 @@ function loadRegistry(): Registry {
   return JSON.parse(raw);
 }
-const CANONICAL_KEY_RE = /^feature_flags\.[a-z0-9][a-z0-9._-]*\.enabled$/;
+const CANONICAL_KEY_RE = /^[a-z0-9][a-z0-9-]*$/;
 /**
  * Files allowed to contain the legacy `skills.<id>.enabled` key format.
@@ -126,13 +126,13 @@ describe("assistant feature flag guard", () => {
     if (violations.length > 0) {
       const message = [
         "Found production files using the legacy `skills.<id>.enabled` key format.",
-        "New code must use the canonical format: `feature_flags.<id>.enabled`.",
+        'New code must use the canonical simple kebab-case format (e.g., "browser", "ces-tools").',
         'See AGENTS.md "Assistant Feature Flags" for the convention.',
         "",
         "Violations:",
         ...violations.map((f) => `  - ${f}`),
         "",
-        "To fix: replace `skills.<id>.enabled` with `feature_flags.<id>.enabled`.",
+        "To fix: replace `skills.<id>.enabled` with the simple kebab-case format.",
         "If backward-compat access is genuinely needed, add to LEGACY_KEY_ALLOWLIST in assistant-feature-flag-guard.test.ts.",
       ].join("\n");
@@ -144,7 +144,7 @@ describe("assistant feature flag guard", () => {
   // Test: unified registry key format (assistant-scope only)
   // ---------------------------------------------------------------------------
-  test("all assistant-scope keys in the unified registry use the canonical feature_flags.<id>.enabled format", () => {
+  test("all assistant-scope keys in the unified registry use the canonical simple kebab-case format", () => {
     const registry = loadRegistry();
     const assistantFlags = registry.flags.filter(
       (f) => f.scope === "assistant",
@@ -156,7 +156,7 @@ describe("assistant feature flag guard", () => {
     if (violations.length > 0) {
       const message = [
         "Found assistant-scope keys in the unified registry that do not match the canonical format.",
-        "Expected format: feature_flags.<flagId>.enabled",
+        'Expected format: simple kebab-case (e.g., "browser", "ces-tools")',
         "",
         "Violations:",
         ...violations.map((k) => `  - ${k}`),

package/src/__tests__/assistant-feature-flag-guardrails.test.ts CHANGED Viewed

@@ -1,8 +1,8 @@
 /**
  * Guard tests for assistant feature flag conventions:
  *
- * 1. Key format: all feature flag keys used in production code must follow the
- *    canonical `feature_flags.<flag_id>.enabled` format. Any remaining
+ * 1. Key format: all feature flag keys used in production code must use
+ *    simple kebab-case format (e.g., "browser", "ces-tools"). Any remaining
  *    `skills.<id>.enabled` usage outside of migration/backward-compat code is
  *    flagged — including template literal forms like `skills.${skillId}.enabled`.
  *
@@ -10,11 +10,6 @@
  *    `isAssistantFeatureFlagEnabled('<key>', ...)` in production code must be
  *    declared in the unified registry. This keeps flag usage declarative while
  *    allowing skills to exist without corresponding feature flags.
- *
- * 3. Indirect key coverage: all `feature_flags.<id>.enabled` string literals
- *    anywhere in production code (maps, constants, variables, etc.) must be
- *    declared in the unified registry. This catches indirect key patterns that
- *    Guard 2 would miss, such as flag keys stored in lookup maps or constants.
  */
 import { execSync } from "node:child_process";
@@ -115,8 +110,8 @@ describe("assistant feature flag key format guard", () => {
     if (violations.length > 0) {
       const message = [
         "Found production TypeScript files using legacy `skills.<id>.enabled` key format.",
-        "Use the canonical `feature_flags.<id>.enabled` format instead.",
-        "Call `isAssistantFeatureFlagEnabled(`feature_flags.${skillId}.enabled`, config)` to check skill flags.",
+        "Use simple kebab-case keys instead (e.g., `contacts`, `browser`).",
+        "Call `isAssistantFeatureFlagEnabled(skillId, config)` to check skill flags.",
         "",
         "Violations:",
         ...violations.map((f) => `  - ${f}`),
@@ -149,7 +144,7 @@ describe("assistant feature flag declaration coverage guard", () => {
     // multiline regex so that calls split across lines are still caught:
     //
     //   isAssistantFeatureFlagEnabled(
-    //     'feature_flags.foo.enabled',
+    //     'browser',
     //     config,
     //   )
     //
@@ -202,79 +197,3 @@ describe("assistant feature flag declaration coverage guard", () => {
     }
   });
 });
-// ---------------------------------------------------------------------------
-// Guard 3: Indirect key coverage — flag key literals anywhere in production code
-// ---------------------------------------------------------------------------
-describe("assistant feature flag indirect key coverage guard", () => {
-  test("all feature_flags.<id>.enabled string literals in production code are declared in the unified registry", () => {
-    const repoRoot = getRepoRoot();
-    // Load the unified registry and extract all declared keys (any scope)
-    const registry = loadRegistry();
-    const declaredKeys = new Set(registry.flags.map((f) => f.key));
-    // Search for any string literal matching the canonical key pattern
-    // in production .ts files under assistant/src/ and gateway/src/.
-    // This catches keys in maps, constants, variables, or any other
-    // indirect patterns that Guard 2 would miss.
-    let grepOutput = "";
-    try {
-      grepOutput = execSync(
-        `git grep -nE "feature_flags\\.[a-z0-9_-]+\\.enabled\\b" -- 'assistant/src/**/*.ts' 'gateway/src/**/*.ts'`,
-        { encoding: "utf-8", cwd: repoRoot },
-      ).trim();
-    } catch (err) {
-      // Exit code 1 means no matches — happy path
-      if ((err as { status?: number }).status === 1) {
-        return;
-      }
-      throw err;
-    }
-    const keyPattern = /feature_flags\.[a-z0-9_-]+\.enabled\b/g;
-    const undeclared: string[] = [];
-    for (const line of grepOutput.split("\n")) {
-      if (!line) continue;
-      // Format: "file:line:content"
-      const colonIdx = line.indexOf(":");
-      if (colonIdx === -1) continue;
-      const filePath = line.slice(0, colonIdx);
-      // Skip test files and persisted-data migration files (they reference retired flag keys by design)
-      if (isTestFile(filePath)) continue;
-      if (
-        filePath.includes("/workspace/migrations/") ||
-        filePath.includes("/memory/migrations/")
-      )
-        continue;
-      // Extract all key occurrences from this line
-      const content = line.slice(colonIdx + 1);
-      for (const match of content.matchAll(keyPattern)) {
-        const key = match[0];
-        if (!declaredKeys.has(key)) {
-          undeclared.push(`${filePath}: ${key}`);
-        }
-      }
-    }
-    if (undeclared.length > 0) {
-      const message = [
-        "Found feature_flags.<id>.enabled string literals in production code that are NOT declared in the unified registry.",
-        "This catches indirect flag key usage (maps, constants, variables) that the direct-call guard misses.",
-        `Registry: meta/feature-flags/feature-flag-registry.json`,
-        "",
-        "Undeclared keys:",
-        ...undeclared.map((k) => `  - ${k}`),
-        "",
-        "To fix: add the missing key(s) to the unified registry, or remove the stale reference.",
-      ].join("\n");
-      expect(undeclared, message).toEqual([]);
-    }
-  });
-});

package/src/__tests__/assistant-feature-flags-integration.test.ts CHANGED Viewed

@@ -45,7 +45,7 @@ let currentConfig: Record<string, unknown> = {
 };
 const DECLARED_FLAG_ID = "contacts";
-const DECLARED_FLAG_KEY = `feature_flags.${DECLARED_FLAG_ID}.enabled`;
+const DECLARED_FLAG_KEY = DECLARED_FLAG_ID;
 const DECLARED_SKILL_ID = "contacts";
 // eslint-disable-next-line @typescript-eslint/no-require-imports
@@ -201,7 +201,7 @@ describe("buildSystemPrompt assistant feature flag filtering", () => {
     _setOverridesForTesting({
       [DECLARED_FLAG_KEY]: false,
-      "feature_flags.browser.enabled": true,
+      browser: true,
     });
     currentConfig = {
@@ -286,7 +286,7 @@ describe("buildSystemPrompt assistant feature flag filtering", () => {
     _setOverridesForTesting({
       [DECLARED_FLAG_KEY]: false,
-      "feature_flags.email-channel.enabled": false,
+      "email-channel": false,
     });
     currentConfig = {
@@ -356,7 +356,7 @@ describe("buildSystemPrompt assistant feature flag filtering", () => {
       "browser",
     );
-    _setOverridesForTesting({ "feature_flags.browser.enabled": false });
+    _setOverridesForTesting({ browser: false });
     currentConfig = {
       services: {
@@ -478,21 +478,14 @@ describe("isAssistantFeatureFlagEnabled", () => {
   test("unknown flag defaults to true when no persisted override", () => {
     const config = {} as any;
-    expect(
-      isAssistantFeatureFlagEnabled(
-        "feature_flags.unknown-skill.enabled",
-        config,
-      ),
-    ).toBe(true);
+    expect(isAssistantFeatureFlagEnabled("unknown-skill", config)).toBe(true);
   });
   test("undeclared flag respects persisted override", () => {
-    _setOverridesForTesting({ "feature_flags.browser.enabled": false });
+    _setOverridesForTesting({ browser: false });
     const config = {} as any;
-    expect(
-      isAssistantFeatureFlagEnabled("feature_flags.browser.enabled", config),
-    ).toBe(false);
+    expect(isAssistantFeatureFlagEnabled("browser", config)).toBe(false);
   });
 });

package/src/__tests__/browser-skill-endstate.test.ts CHANGED Viewed

@@ -39,7 +39,7 @@ describe("browser skill migration end-state", () => {
   beforeAll(async () => {
     __resetRegistryForTesting();
     _setOverridesForTesting({
-      "feature_flags.browser.enabled": true,
+      browser: true,
     });
     await initializeTools();
   });

package/src/__tests__/btw-routes.test.ts CHANGED Viewed

@@ -61,6 +61,12 @@ mock.module("../prompts/system-prompt.js", () => ({
   buildSystemPrompt: mockBuildSystemPrompt,
 }));
+mock.module("../prompts/persona-resolver.js", () => ({
+  resolveGuardianPersona: () => null,
+  resolveChannelPersona: () => null,
+  resolveUserPersona: () => null,
+}));
 // ---------------------------------------------------------------------------
 // Imports (after mocks)
 // ---------------------------------------------------------------------------
@@ -304,7 +310,9 @@ describe("POST /v1/btw", () => {
     // System prompt built by buildSystemPrompt({ excludeBootstrap: true })
     expect(systemPrompt).toBe(MOCK_SYSTEM_PROMPT);
     expect(mockBuildSystemPrompt).toHaveBeenCalledWith({
+      channelPersona: null,
       excludeBootstrap: true,
+      userPersona: null,
     });
     // Options: tool_choice must be "none"