npm - @vellumai/assistant - Versions diffs - 0.3.19 → 0.3.21 - Mend

@vellumai/assistant 0.3.19 → 0.3.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (199) hide show

package/ARCHITECTURE.md +151 -15
package/Dockerfile +1 -0
package/README.md +40 -4
package/bun.lock +139 -2
package/docs/architecture/integrations.md +7 -11
package/package.json +2 -1
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +54 -0
package/src/__tests__/approval-primitive.test.ts +540 -0
package/src/__tests__/assistant-feature-flag-guard.test.ts +206 -0
package/src/__tests__/assistant-feature-flag-guardrails.test.ts +198 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +272 -0
package/src/__tests__/call-controller.test.ts +439 -108
package/src/__tests__/channel-invite-transport.test.ts +264 -0
package/src/__tests__/cli.test.ts +42 -1
package/src/__tests__/config-schema.test.ts +11 -127
package/src/__tests__/config-watcher.test.ts +0 -8
package/src/__tests__/daemon-lifecycle.test.ts +1 -0
package/src/__tests__/daemon-server-session-init.test.ts +8 -2
package/src/__tests__/diff.test.ts +22 -0
package/src/__tests__/guardian-action-copy-generator.test.ts +5 -0
package/src/__tests__/guardian-action-grant-mint-consume.test.ts +300 -32
package/src/__tests__/guardian-action-late-reply.test.ts +546 -1
package/src/__tests__/guardian-actions-endpoint.test.ts +774 -0
package/src/__tests__/guardian-control-plane-policy.test.ts +36 -3
package/src/__tests__/guardian-dispatch.test.ts +124 -0
package/src/__tests__/guardian-grant-minting.test.ts +6 -17
package/src/__tests__/inbound-invite-redemption.test.ts +367 -0
package/src/__tests__/invite-redemption-service.test.ts +306 -0
package/src/__tests__/ipc-snapshot.test.ts +57 -0
package/src/__tests__/notification-decision-fallback.test.ts +88 -0
package/src/__tests__/sandbox-diagnostics.test.ts +6 -249
package/src/__tests__/sandbox-host-parity.test.ts +6 -13
package/src/__tests__/scoped-approval-grants.test.ts +6 -6
package/src/__tests__/scoped-grant-security-matrix.test.ts +5 -4
package/src/__tests__/script-proxy-session-manager.test.ts +1 -19
package/src/__tests__/session-load-history-repair.test.ts +169 -2
package/src/__tests__/session-runtime-assembly.test.ts +33 -5
package/src/__tests__/skill-feature-flags-integration.test.ts +171 -0
package/src/__tests__/skill-feature-flags.test.ts +188 -0
package/src/__tests__/skill-load-feature-flag.test.ts +141 -0
package/src/__tests__/skill-mirror-parity.test.ts +1 -0
package/src/__tests__/skill-projection-feature-flag.test.ts +363 -0
package/src/__tests__/system-prompt.test.ts +1 -1
package/src/__tests__/terminal-sandbox.test.ts +142 -9
package/src/__tests__/terminal-tools.test.ts +2 -93
package/src/__tests__/thread-seed-composer.test.ts +18 -0
package/src/__tests__/tool-approval-handler.test.ts +350 -0
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +8 -10
package/src/__tests__/voice-scoped-grant-consumer.test.ts +46 -84
package/src/agent/loop.ts +36 -1
package/src/approvals/approval-primitive.ts +381 -0
package/src/approvals/guardian-decision-primitive.ts +191 -0
package/src/calls/call-controller.ts +252 -209
package/src/calls/call-domain.ts +44 -6
package/src/calls/guardian-dispatch.ts +48 -0
package/src/calls/types.ts +1 -1
package/src/calls/voice-session-bridge.ts +46 -30
package/src/cli/core-commands.ts +0 -4
package/src/cli/mcp.ts +58 -0
package/src/cli.ts +76 -34
package/src/config/__tests__/feature-flag-registry-guard.test.ts +179 -0
package/src/config/assistant-feature-flags.ts +162 -0
package/src/config/bundled-skills/api-mapping/icon.svg +18 -0
package/src/config/bundled-skills/messaging/TOOLS.json +30 -0
package/src/config/bundled-skills/messaging/tools/slack-delete-message.ts +24 -0
package/src/config/bundled-skills/notifications/SKILL.md +1 -1
package/src/config/bundled-skills/reminder/SKILL.md +49 -2
package/src/config/bundled-skills/time-based-actions/SKILL.md +49 -2
package/src/config/bundled-skills/voice-setup/SKILL.md +122 -0
package/src/config/core-schema.ts +1 -1
package/src/config/env-registry.ts +10 -0
package/src/config/feature-flag-registry.json +61 -0
package/src/config/loader.ts +22 -1
package/src/config/mcp-schema.ts +46 -0
package/src/config/sandbox-schema.ts +0 -39
package/src/config/schema.ts +18 -2
package/src/config/skill-state.ts +34 -0
package/src/config/skills-schema.ts +0 -1
package/src/config/skills.ts +9 -0
package/src/config/system-prompt.ts +110 -46
package/src/config/templates/SOUL.md +1 -1
package/src/config/types.ts +19 -1
package/src/config/vellum-skills/catalog.json +1 -1
package/src/config/vellum-skills/guardian-verify-setup/SKILL.md +1 -0
package/src/config/vellum-skills/sms-setup/SKILL.md +1 -1
package/src/config/vellum-skills/telegram-setup/SKILL.md +6 -5
package/src/config/vellum-skills/trusted-contacts/SKILL.md +105 -3
package/src/config/vellum-skills/twilio-setup/SKILL.md +1 -1
package/src/daemon/config-watcher.ts +0 -1
package/src/daemon/daemon-control.ts +1 -1
package/src/daemon/guardian-invite-intent.ts +124 -0
package/src/daemon/handlers/avatar.ts +68 -0
package/src/daemon/handlers/browser.ts +2 -2
package/src/daemon/handlers/guardian-actions.ts +120 -0
package/src/daemon/handlers/index.ts +4 -0
package/src/daemon/handlers/sessions.ts +19 -0
package/src/daemon/handlers/shared.ts +3 -1
package/src/daemon/install-cli-launchers.ts +58 -13
package/src/daemon/ipc-contract/guardian-actions.ts +53 -0
package/src/daemon/ipc-contract/sessions.ts +8 -2
package/src/daemon/ipc-contract/settings.ts +25 -2
package/src/daemon/ipc-contract-inventory.json +10 -0
package/src/daemon/ipc-contract.ts +4 -0
package/src/daemon/lifecycle.ts +14 -2
package/src/daemon/main.ts +1 -0
package/src/daemon/providers-setup.ts +26 -1
package/src/daemon/server.ts +1 -0
package/src/daemon/session-lifecycle.ts +52 -7
package/src/daemon/session-memory.ts +45 -0
package/src/daemon/session-process.ts +258 -432
package/src/daemon/session-runtime-assembly.ts +12 -0
package/src/daemon/session-skill-tools.ts +14 -1
package/src/daemon/session-tool-setup.ts +5 -0
package/src/daemon/session.ts +11 -0
package/src/daemon/shutdown-handlers.ts +11 -0
package/src/daemon/tool-side-effects.ts +35 -9
package/src/index.ts +2 -2
package/src/mcp/client.ts +152 -0
package/src/mcp/manager.ts +139 -0
package/src/memory/conversation-display-order-migration.ts +44 -0
package/src/memory/conversation-queries.ts +2 -0
package/src/memory/conversation-store.ts +91 -0
package/src/memory/db-init.ts +5 -1
package/src/memory/embedding-local.ts +13 -8
package/src/memory/guardian-action-store.ts +125 -2
package/src/memory/ingress-invite-store.ts +95 -1
package/src/memory/migrations/035-guardian-action-supersession.ts +23 -0
package/src/memory/migrations/index.ts +2 -1
package/src/memory/schema.ts +5 -1
package/src/memory/scoped-approval-grants.ts +14 -5
package/src/messaging/providers/slack/client.ts +12 -0
package/src/messaging/providers/slack/types.ts +5 -0
package/src/notifications/decision-engine.ts +49 -12
package/src/notifications/emit-signal.ts +7 -0
package/src/notifications/signal.ts +7 -0
package/src/notifications/thread-seed-composer.ts +2 -1
package/src/runtime/channel-approval-types.ts +16 -6
package/src/runtime/channel-approvals.ts +19 -15
package/src/runtime/channel-invite-transport.ts +85 -0
package/src/runtime/channel-invite-transports/telegram.ts +105 -0
package/src/runtime/guardian-action-grant-minter.ts +92 -35
package/src/runtime/guardian-action-message-composer.ts +30 -0
package/src/runtime/guardian-decision-types.ts +91 -0
package/src/runtime/http-server.ts +23 -1
package/src/runtime/ingress-service.ts +22 -0
package/src/runtime/invite-redemption-service.ts +181 -0
package/src/runtime/invite-redemption-templates.ts +39 -0
package/src/runtime/routes/call-routes.ts +2 -1
package/src/runtime/routes/guardian-action-routes.ts +206 -0
package/src/runtime/routes/guardian-approval-interception.ts +66 -190
package/src/runtime/routes/identity-routes.ts +73 -0
package/src/runtime/routes/inbound-message-handler.ts +486 -394
package/src/runtime/routes/pairing-routes.ts +4 -0
package/src/security/encrypted-store.ts +31 -17
package/src/security/keychain.ts +176 -2
package/src/security/secure-keys.ts +97 -0
package/src/security/tool-approval-digest.ts +1 -1
package/src/tools/browser/browser-execution.ts +2 -2
package/src/tools/browser/browser-manager.ts +46 -32
package/src/tools/browser/browser-screencast.ts +2 -2
package/src/tools/calls/call-start.ts +1 -1
package/src/tools/executor.ts +22 -17
package/src/tools/mcp/mcp-tool-factory.ts +100 -0
package/src/tools/network/script-proxy/session-manager.ts +1 -5
package/src/tools/registry.ts +64 -1
package/src/tools/skills/load.ts +22 -8
package/src/tools/system/avatar-generator.ts +119 -0
package/src/tools/system/navigate-settings.ts +65 -0
package/src/tools/system/open-system-settings.ts +75 -0
package/src/tools/system/voice-config.ts +121 -32
package/src/tools/terminal/backends/native.ts +40 -19
package/src/tools/terminal/backends/types.ts +3 -3
package/src/tools/terminal/parser.ts +1 -1
package/src/tools/terminal/sandbox-diagnostics.ts +6 -87
package/src/tools/terminal/sandbox.ts +1 -12
package/src/tools/terminal/shell.ts +3 -31
package/src/tools/tool-approval-handler.ts +141 -3
package/src/tools/tool-manifest.ts +6 -0
package/src/tools/types.ts +10 -2
package/src/util/diff.ts +36 -13
package/Dockerfile.sandbox +0 -5
package/src/__tests__/doordash-client.test.ts +0 -187
package/src/__tests__/doordash-session.test.ts +0 -154
package/src/__tests__/signup-e2e.test.ts +0 -354
package/src/__tests__/terminal-sandbox-docker.test.ts +0 -1065
package/src/__tests__/terminal-sandbox.integration.test.ts +0 -180
package/src/cli/doordash.ts +0 -1057
package/src/config/bundled-skills/doordash/SKILL.md +0 -163
package/src/config/templates/LOOKS.md +0 -25
package/src/doordash/cart-queries.ts +0 -787
package/src/doordash/client.ts +0 -1016
package/src/doordash/order-queries.ts +0 -85
package/src/doordash/queries.ts +0 -13
package/src/doordash/query-extractor.ts +0 -94
package/src/doordash/search-queries.ts +0 -203
package/src/doordash/session.ts +0 -84
package/src/doordash/store-queries.ts +0 -246
package/src/doordash/types.ts +0 -367
package/src/tools/terminal/backends/docker.ts +0 -379

package/src/__tests__/assistant-feature-flag-guard.test.ts ADDED Viewed

@@ -0,0 +1,206 @@
+import { execFileSync } from 'node:child_process';
+import { readFileSync } from 'node:fs';
+import { join } from 'node:path';
+import { describe, expect, test } from 'bun:test';
+/**
+ * Guard tests for assistant feature flags.
+ *
+ * 1. Key format validation: ensure production code uses the canonical
+ *    `feature_flags.<flagId>.enabled` format, not the legacy
+ *    `skills.<id>.enabled` format.
+ *
+ * 2. Declaration coverage: ensure all assistant-scope flag keys in the
+ *    unified registry conform to the canonical format.
+ *
+ * See AGENTS.md "Assistant Feature Flags" for the full convention.
+ */
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Returns the parent of the current working directory. The suite is run from
+ * the assistant/ package, so that parent is the repository root.
+ */
+function getRepoRoot(): string {
+  const packageDir = process.cwd();
+  return join(packageDir, '..');
+}
+/** Path of the canonical feature-flag registry JSON under meta/feature-flags/. */
+function getRegistryPath(): string {
+  const registrySegments = ['meta', 'feature-flags', 'feature-flag-registry.json'];
+  return join(getRepoRoot(), ...registrySegments);
+}
+/** One flag entry as read from the unified registry JSON. */
+interface RegistryFlag {
+  id: string;
+  /** Owning scope; the tests in this file only inspect entries whose scope is 'assistant'. */
+  scope: string;
+  /** Full config key; assistant-scope keys are checked against CANONICAL_KEY_RE. */
+  key: string;
+  label: string;
+  description: string;
+  defaultEnabled: boolean;
+}
+/** Top-level shape of the registry file returned by loadRegistry(). */
+interface Registry {
+  version: number;
+  flags: RegistryFlag[];
+}
+/**
+ * Reads the canonical registry file and parses it as JSON. The parsed value
+ * is returned as-is; field shapes are verified by the tests, not here.
+ */
+function loadRegistry(): Registry {
+  return JSON.parse(readFileSync(getRegistryPath(), 'utf-8'));
+}
+/**
+ * Canonical key shape: `feature_flags.<flagId>.enabled`, where <flagId> starts
+ * with a lowercase letter or digit and continues with lowercase letters,
+ * digits, dots, underscores, or hyphens.
+ */
+const CANONICAL_KEY_RE = /^feature_flags\.[a-z0-9][a-z0-9._-]*\.enabled$/;
+/**
+ * Files allowed to contain the legacy `skills.<id>.enabled` key format.
+ * Keep this list minimal — only files that genuinely need to reference
+ * the legacy format for backward compatibility.
+ * Entries are repo-relative paths, compared verbatim against `git grep -l` output.
+ */
+const LEGACY_KEY_ALLOWLIST = new Set([
+  // macOS client: fallback reads from legacy config section
+  'clients/macos/vellum-assistant/Features/Settings/SettingsAccountTab.swift',
+]);
+/**
+ * Reports whether a path counts as test code: it contains a `/__tests__/` or
+ * `/Tests/` segment, or it ends with a recognised test/spec suffix.
+ */
+function isTestFile(filePath: string): boolean {
+  const testDirSegments = ['/__tests__/', '/Tests/'];
+  if (testDirSegments.some((segment) => filePath.includes(segment))) {
+    return true;
+  }
+  const testSuffixes = ['.test.ts', '.test.js', '.spec.ts', '.spec.js', 'Tests.swift'];
+  return testSuffixes.some((suffix) => filePath.endsWith(suffix));
+}
+// ---------------------------------------------------------------------------
+// Test: key format validation
+// ---------------------------------------------------------------------------
+describe('assistant feature flag guard', () => {
+  test('no production files use legacy skills.<id>.enabled key format outside allowlist', () => {
+    // Regex for a quoted legacy key — single-, double-, or backtick-quoted —
+    // such as 'skills.browser.enabled'.
+    const legacyKeyPattern = `['"\`]skills\\.[a-z][a-z0-9._-]*\\.enabled['"\`]`;
+    const grepArgs = ['grep', '-lE', legacyKeyPattern, '--', '*.ts', '*.tsx', '*.js', '*.jsx', '*.swift'];
+    let matchedPaths = '';
+    try {
+      // execFileSync bypasses the shell, so the backticks in the pattern reach
+      // git verbatim instead of being read as command substitution by /bin/sh.
+      matchedPaths = execFileSync('git', grepArgs, { encoding: 'utf-8', cwd: getRepoRoot() }).trim();
+    } catch (err) {
+      // git grep exits with status 1 when nothing matched — nothing to check.
+      if ((err as { status?: number }).status === 1) {
+        return;
+      }
+      throw err;
+    }
+    // Keep only production files that are not explicitly allowlisted.
+    const offenders = matchedPaths
+      .split('\n')
+      .filter((path) => path.length > 0)
+      .filter((path) => !isTestFile(path) && !LEGACY_KEY_ALLOWLIST.has(path));
+    if (offenders.length === 0) {
+      return;
+    }
+    const message = [
+      'Found production files using the legacy `skills.<id>.enabled` key format.',
+      'New code must use the canonical format: `feature_flags.<id>.enabled`.',
+      'See AGENTS.md "Assistant Feature Flags" for the convention.',
+      '',
+      'Violations:',
+      ...offenders.map((path) => `  - ${path}`),
+      '',
+      'To fix: replace `skills.<id>.enabled` with `feature_flags.<id>.enabled`.',
+      'If backward-compat access is genuinely needed, add to LEGACY_KEY_ALLOWLIST in assistant-feature-flag-guard.test.ts.',
+    ].join('\n');
+    expect(offenders, message).toEqual([]);
+  });
+  // ---------------------------------------------------------------------------
+  // Test: unified registry key format (assistant-scope only)
+  // ---------------------------------------------------------------------------
+  test('all assistant-scope keys in the unified registry use the canonical feature_flags.<id>.enabled format', () => {
+    // Collect every assistant-scope key that fails the canonical pattern.
+    const malformedKeys: string[] = [];
+    for (const flag of loadRegistry().flags) {
+      if (flag.scope === 'assistant' && !CANONICAL_KEY_RE.test(flag.key)) {
+        malformedKeys.push(flag.key);
+      }
+    }
+    if (malformedKeys.length === 0) {
+      return;
+    }
+    const message = [
+      'Found assistant-scope keys in the unified registry that do not match the canonical format.',
+      'Expected format: feature_flags.<flagId>.enabled',
+      '',
+      'Violations:',
+      ...malformedKeys.map((key) => `  - ${key}`),
+    ].join('\n');
+    expect(malformedKeys, message).toEqual([]);
+  });
+  // ---------------------------------------------------------------------------
+  // Test: bundled registry copy stays in sync with canonical meta/ copy
+  // ---------------------------------------------------------------------------
+  test('bundled assistant/src/config/feature-flag-registry.json matches canonical meta/ copy', () => {
+    // Both copies are compared structurally after parsing, so formatting
+    // differences between the two files do not matter.
+    const readJson = (path: string): unknown => JSON.parse(readFileSync(path, 'utf-8'));
+    const canonical = readJson(getRegistryPath());
+    const bundled = readJson(join(process.cwd(), 'src', 'config', 'feature-flag-registry.json'));
+    expect(bundled).toEqual(canonical);
+  });
+  // ---------------------------------------------------------------------------
+  // Test: registry entries have required fields
+  // ---------------------------------------------------------------------------
+  test('all assistant-scope entries in the unified registry have required fields', () => {
+    // String fields that must be present and non-empty, in reporting order.
+    const requiredStringFields = ['description', 'label', 'id'] as const;
+    const problems: string[] = [];
+    for (const flag of loadRegistry().flags) {
+      if (flag.scope !== 'assistant') continue;
+      if (typeof flag.defaultEnabled !== 'boolean') {
+        problems.push(`${flag.key}: missing or non-boolean 'defaultEnabled'`);
+      }
+      for (const field of requiredStringFields) {
+        const value = flag[field];
+        if (typeof value !== 'string' || value.length === 0) {
+          problems.push(`${flag.key}: missing or empty '${field}'`);
+        }
+      }
+    }
+    if (problems.length === 0) {
+      return;
+    }
+    const message = [
+      'Found entries in the unified registry with missing or invalid required fields.',
+      '',
+      'Violations:',
+      ...problems.map((problem) => `  - ${problem}`),
+    ].join('\n');
+    expect(problems, message).toEqual([]);
+  });
+});

package/src/__tests__/assistant-feature-flag-guardrails.test.ts ADDED Viewed

@@ -0,0 +1,198 @@
+/**
+ * Guard tests for assistant feature flag conventions:
+ *
+ * 1. Key format: all feature flag keys used in production code must follow the
+ *    canonical `feature_flags.<flag_id>.enabled` format. Any remaining
+ *    `skills.<id>.enabled` usage outside of migration/backward-compat code is
+ *    flagged — including template literal forms like `skills.${skillId}.enabled`.
+ *
+ * 2. Declaration coverage: all literal keys passed to
+ *    `isAssistantFeatureFlagEnabled('<key>', ...)` in production code must be
+ *    declared in the unified registry. This keeps flag usage declarative while
+ *    allowing skills to exist without corresponding feature flags.
+ */
+import { execFileSync, execSync } from 'node:child_process';
+import { readFileSync } from 'node:fs';
+import { join } from 'node:path';
+import { describe, expect, test } from 'bun:test';
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Returns the directory one level above the current working directory, i.e.
+ * the repo root when the suite runs from the assistant/ package directory.
+ */
+function getRepoRoot(): string {
+  const packageDir = process.cwd();
+  return join(packageDir, '..');
+}
+/** One flag entry as read from the unified registry JSON. */
+interface RegistryFlag {
+  id: string;
+  /** Owning scope; the declaration-coverage guard only considers scope 'assistant'. */
+  scope: string;
+  /** Full flag key, compared against literal keys found in production call sites. */
+  key: string;
+  label: string;
+  description: string;
+  defaultEnabled: boolean;
+}
+/** Top-level shape of the registry file returned by loadRegistry(). */
+interface Registry {
+  version: number;
+  flags: RegistryFlag[];
+}
+/** Reads and parses meta/feature-flags/feature-flag-registry.json under the repo root. */
+function loadRegistry(): Registry {
+  const raw = readFileSync(
+    join(getRepoRoot(), 'meta', 'feature-flags', 'feature-flag-registry.json'),
+    'utf-8',
+  );
+  return JSON.parse(raw);
+}
+/**
+ * Production files allowed to contain `skills.<id>.enabled` string literals
+ * because they are part of the backward-compat / migration layer. Test files
+ * do not need an entry here: the guard skips them separately via isTestFile().
+ * Entries are repo-relative paths, compared verbatim against `git grep -l` output.
+ */
+const LEGACY_KEY_ALLOWLIST = new Set([
+  // Legacy wrapper (deprecated, kept for migration)
+  'assistant/src/config/skill-state.ts',
+  // Type definitions documenting the legacy format
+  'assistant/src/config/types.ts',
+  // macOS client: fallback reads from legacy config section
+  'clients/macos/vellum-assistant/Features/Settings/SettingsAccountTab.swift',
+]);
+/**
+ * Reports whether a path counts as test code: it contains a `/__tests__/`
+ * segment or ends with a `.test`/`.spec` TypeScript or JavaScript suffix.
+ */
+function isTestFile(filePath: string): boolean {
+  if (filePath.includes('/__tests__/')) {
+    return true;
+  }
+  const testSuffixes = ['.test.ts', '.test.js', '.spec.ts', '.spec.js'];
+  return testSuffixes.some((suffix) => filePath.endsWith(suffix));
+}
+// ---------------------------------------------------------------------------
+// Guard 1: Key format — no stale `skills.<id>.enabled` in production code
+// ---------------------------------------------------------------------------
+describe('assistant feature flag key format guard', () => {
+  test('no production TypeScript files use skills.<id>.enabled outside allowlist', () => {
+    const repoRoot = getRepoRoot();
+    // Search .ts files under assistant/src/ and gateway/src/ for either a
+    // literal legacy key (e.g. `skills.foo.enabled`) or the start of a
+    // template-literal form (e.g. `skills.${skillId}.enabled`). Test files
+    // and allowlisted paths are filtered out afterwards.
+    //
+    // In the ERE below, `\$` and `\{` are a literal dollar sign and brace.
+    const legacyKeyPattern = 'skills\\.[a-z0-9_-]+\\.enabled|skills\\.\\$\\{';
+    let grepOutput = '';
+    try {
+      // Use execFileSync, not execSync: when this pattern is passed through
+      // /bin/sh inside double quotes, the shell rewrites `\$` to a bare `$`.
+      // git grep then sees `skills\.$\{`, where `$` is an end-of-line anchor,
+      // so the template-literal alternative can never match and the guard
+      // silently misses `skills.${...}` usages.
+      grepOutput = execFileSync(
+        'git',
+        ['grep', '-lE', legacyKeyPattern, '--', 'assistant/src/**/*.ts', 'gateway/src/**/*.ts'],
+        { encoding: 'utf-8', cwd: repoRoot },
+      ).trim();
+    } catch (err) {
+      // Exit code 1 means no matches — happy path
+      if ((err as { status?: number }).status === 1) {
+        return;
+      }
+      throw err;
+    }
+    const files = grepOutput.split('\n').filter((f) => f.length > 0);
+    const violations = files.filter((f) => {
+      if (isTestFile(f)) return false;
+      if (LEGACY_KEY_ALLOWLIST.has(f)) return false;
+      return true;
+    });
+    if (violations.length > 0) {
+      const message = [
+        'Found production TypeScript files using legacy `skills.<id>.enabled` key format.',
+        'Use the canonical `feature_flags.<id>.enabled` format instead.',
+        'Call `isAssistantFeatureFlagEnabled(`feature_flags.${skillId}.enabled`, config)` to check skill flags.',
+        '',
+        'Violations:',
+        ...violations.map((f) => `  - ${f}`),
+        '',
+        'If this is a legitimate backward-compat path, add it to LEGACY_KEY_ALLOWLIST in',
+        'assistant-feature-flag-guardrails.test.ts.',
+      ].join('\n');
+      expect(violations, message).toEqual([]);
+    }
+  });
+});
+// ---------------------------------------------------------------------------
+// Guard 2: Declaration coverage for literal key usage
+// ---------------------------------------------------------------------------
+describe('assistant feature flag declaration coverage guard', () => {
+  test('all literal flag keys in isAssistantFeatureFlagEnabled calls are declared in the unified registry', () => {
+    const repoRoot = getRepoRoot();
+    // Assistant-scope keys declared in the unified registry.
+    const declaredKeys = new Set<string>();
+    for (const flag of loadRegistry().flags) {
+      if (flag.scope === 'assistant') {
+        declaredKeys.add(flag.key);
+      }
+    }
+    // List non-test production files that mention the resolver at all.
+    let grepOutput = '';
+    try {
+      grepOutput = execSync(
+        `git grep -l "isAssistantFeatureFlagEnabled" -- 'assistant/src/**/*.ts' ':!assistant/src/__tests__/**'`,
+        { encoding: 'utf-8', cwd: repoRoot },
+      ).trim();
+    } catch (err) {
+      // Status 1 just means "no matches"; anything else is a real failure.
+      if ((err as { status?: number }).status !== 1) throw err;
+    }
+    // Run the regex over whole file contents rather than per line, so a call
+    // whose quoted key sits on the line after the opening paren still matches:
+    //
+    //   isAssistantFeatureFlagEnabled(
+    //     'feature_flags.foo.enabled',
+    //     config,
+    //   )
+    //
+    const callPattern = /isAssistantFeatureFlagEnabled\(\s*['"]([^'"]+)['"]/g;
+    const usedKeys = new Set<string>();
+    for (const relPath of grepOutput.split('\n')) {
+      if (!relPath) continue;
+      const source = readFileSync(join(repoRoot, relPath), 'utf-8');
+      for (const [, key] of source.matchAll(callPattern)) {
+        usedKeys.add(key);
+      }
+    }
+    // Every key used at a call site must be declared in the registry.
+    const undeclared = [...usedKeys].filter((key) => !declaredKeys.has(key));
+    if (undeclared.length === 0) {
+      return;
+    }
+    const message = [
+      'Found feature flag keys used in production code that are NOT declared in the unified registry.',
+      `Registry: meta/feature-flags/feature-flag-registry.json`,
+      '',
+      'Undeclared keys:',
+      ...undeclared.map((key) => `  - ${key}`),
+      '',
+      'To fix: add the missing key(s) to the unified registry with scope "assistant".',
+    ].join('\n');
+    expect(undeclared, message).toEqual([]);
+  });
+});

package/src/__tests__/assistant-feature-flags-integration.test.ts ADDED Viewed

@@ -0,0 +1,272 @@
+/**
+ * Integration tests for assistant feature flag enforcement at system prompt,
+ * skill_load, and session-skill-tools projection layers.
+ *
+ * Covers:
+ *   - Flag OFF blocks all exposure paths
+ *   - Missing persisted value falls back to code default
+ *   - New assistantFeatureFlagValues is the sole override mechanism
+ *   - Undeclared keys default to enabled
+ */
+import { existsSync, mkdirSync, readFileSync, rmSync, writeFileSync } from 'node:fs';
+import { tmpdir } from 'node:os';
+import { join } from 'node:path';
+import { afterEach, beforeEach, describe, expect, mock, test } from 'bun:test';
+// ---------------------------------------------------------------------------
+// Test-scoped temp directory and config state
+// ---------------------------------------------------------------------------
+/** Unique per-run temp directory; the mocked platform path helpers all resolve inside it. */
+const TEST_DIR = join(tmpdir(), `vellum-asst-flags-test-${crypto.randomUUID()}`);
+/** Mutable config handed out by the mocked getConfig(); reset in beforeEach. */
+let currentConfig: Record<string, unknown> = {
+  sandbox: { enabled: false, backend: 'native' },
+};
+// Flag key and matching skill id used as the "declared flag" fixture.
+// NOTE(review): the tests assume the registry declares this flag with defaultEnabled: true — confirm.
+const DECLARED_FLAG_KEY = 'feature_flags.hatch-new-assistant.enabled';
+const DECLARED_SKILL_ID = 'hatch-new-assistant';
+// Redirect every platform path helper into TEST_DIR and stub out the
+// migration / socket helpers so nothing touches real user directories.
+mock.module('../util/platform.js', () => ({
+  getRootDir: () => TEST_DIR,
+  getDataDir: () => TEST_DIR,
+  getWorkspaceDir: () => TEST_DIR,
+  getWorkspaceConfigPath: () => join(TEST_DIR, 'config.json'),
+  getWorkspaceSkillsDir: () => join(TEST_DIR, 'skills'),
+  getWorkspaceHooksDir: () => join(TEST_DIR, 'hooks'),
+  getWorkspacePromptPath: (file: string) => join(TEST_DIR, file),
+  ensureDataDir: () => {},
+  getSocketPath: () => join(TEST_DIR, 'vellum.sock'),
+  getPidPath: () => join(TEST_DIR, 'vellum.pid'),
+  getDbPath: () => join(TEST_DIR, 'data', 'assistant.db'),
+  getLogPath: () => join(TEST_DIR, 'logs', 'vellum.log'),
+  getHistoryPath: () => join(TEST_DIR, 'history'),
+  getHooksDir: () => join(TEST_DIR, 'hooks'),
+  getIpcBlobDir: () => join(TEST_DIR, 'ipc-blobs'),
+  getSandboxRootDir: () => join(TEST_DIR, 'sandbox'),
+  getSandboxWorkingDir: () => TEST_DIR,
+  getInterfacesDir: () => join(TEST_DIR, 'interfaces'),
+  isMacOS: () => false,
+  isLinux: () => false,
+  isWindows: () => false,
+  getPlatformName: () => 'linux',
+  getClipboardCommand: () => null,
+  removeSocketFile: () => {},
+  migratePath: () => {},
+  migrateToWorkspaceLayout: () => {},
+  migrateToDataLayout: () => {},
+}));
+// Silent logger: the Proxy answers any property access with a no-op function.
+mock.module('../util/logger.js', () => ({
+  getLogger: () => new Proxy({} as Record<string, unknown>, {
+    get: () => () => {},
+  }),
+  isDebug: () => false,
+  truncateForLog: (v: string) => v,
+}));
+// getConfig() returns whatever the current test assigned to currentConfig.
+mock.module('../config/loader.js', () => ({
+  getConfig: () => currentConfig,
+}));
+mock.module('../config/user-reference.js', () => ({
+  resolveUserReference: () => 'TestUser',
+}));
+// Parental controls disabled, with no restrictions or blocked categories.
+mock.module('../security/parental-control-store.js', () => ({
+  getParentalControlSettings: () => ({ enabled: false, contentRestrictions: [], blockedToolCategories: [] }),
+}));
+mock.module('../tools/credentials/metadata-store.js', () => ({
+  listCredentialMetadata: () => [],
+}));
+// Modules under test are loaded with dynamic import after the mock.module
+// calls above — presumably so the mocks are registered before these modules
+// resolve their dependencies (confirm against bun's mock.module semantics).
+const { buildSystemPrompt } = await import('../config/system-prompt.js');
+const { isAssistantFeatureFlagEnabled } = await import('../config/assistant-feature-flags.js');
+const { isSkillFeatureEnabled } = await import('../config/skill-state.js');
+// ---------------------------------------------------------------------------
+// Setup / Teardown
+// ---------------------------------------------------------------------------
+// Each test starts with an existing temp directory and the baseline config.
+beforeEach(() => {
+  mkdirSync(TEST_DIR, { recursive: true });
+  currentConfig = { sandbox: { enabled: false, backend: 'native' } };
+});
+// Remove the temp directory (if it is still there) once the test finishes.
+afterEach(() => {
+  if (!existsSync(TEST_DIR)) {
+    return;
+  }
+  rmSync(TEST_DIR, { recursive: true, force: true });
+});
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Writes a minimal skill under TEST_DIR/skills: a `<id>/SKILL.md` with
+ * name/description front matter, plus a `- <id>` line appended to the shared
+ * SKILLS.md index (created on first use).
+ */
+function createSkillOnDisk(id: string, name: string, description: string): void {
+  const skillsRoot = join(TEST_DIR, 'skills');
+  const skillDir = join(skillsRoot, id);
+  mkdirSync(skillDir, { recursive: true });
+  const skillDoc = `---\nname: "${name}"\ndescription: "${description}"\n---\n\nInstructions for ${id}.\n`;
+  writeFileSync(join(skillDir, 'SKILL.md'), skillDoc);
+  const indexPath = join(skillsRoot, 'SKILLS.md');
+  let indexContents = '';
+  if (existsSync(indexPath)) {
+    indexContents = readFileSync(indexPath, 'utf-8');
+  }
+  writeFileSync(indexPath, indexContents + `- ${id}\n`);
+}
+// ---------------------------------------------------------------------------
+// System prompt — assistant feature flag filtering
+// ---------------------------------------------------------------------------
+describe('buildSystemPrompt assistant feature flag filtering', () => {
+  /** Builds a fresh baseline config, adding flag overrides only when given. */
+  const configWith = (flagValues?: Record<string, boolean>): Record<string, unknown> => {
+    const config: Record<string, unknown> = { sandbox: { enabled: false, backend: 'native' } };
+    if (flagValues !== undefined) {
+      config.assistantFeatureFlagValues = flagValues;
+    }
+    return config;
+  };
+  const seedDeclaredSkill = (): void =>
+    createSkillOnDisk(DECLARED_SKILL_ID, 'Hatch New Assistant', 'Toggle hatch new assistant behavior');
+  const seedTwitterSkill = (): void => createSkillOnDisk('twitter', 'Twitter', 'Post to X/Twitter');
+  const seedBrowserSkill = (): void => createSkillOnDisk('browser', 'Browser', 'Web browsing automation');
+
+  test('flag OFF skill does not appear in <available_skills> section', () => {
+    seedDeclaredSkill();
+    seedTwitterSkill();
+    currentConfig = configWith({ [DECLARED_FLAG_KEY]: false });
+    const prompt = buildSystemPrompt();
+    expect(prompt).toContain('id="twitter"');
+    expect(prompt).not.toContain(`id="${DECLARED_SKILL_ID}"`);
+  });
+  test('all skills visible when no flag overrides set', () => {
+    seedDeclaredSkill();
+    seedTwitterSkill();
+    currentConfig = configWith();
+    const prompt = buildSystemPrompt();
+    expect(prompt).toContain(`id="${DECLARED_SKILL_ID}"`);
+    expect(prompt).toContain('id="twitter"');
+  });
+  test('flagged-off skills hidden when all flags are OFF', () => {
+    seedDeclaredSkill();
+    seedTwitterSkill();
+    currentConfig = configWith({
+      [DECLARED_FLAG_KEY]: false,
+      'feature_flags.twitter.enabled': false,
+    });
+    const prompt = buildSystemPrompt();
+    expect(prompt).not.toContain(`id="${DECLARED_SKILL_ID}"`);
+    expect(prompt).not.toContain('id="twitter"');
+  });
+  test('assistantFeatureFlagValues overrides control visibility', () => {
+    seedDeclaredSkill();
+    currentConfig = configWith({ [DECLARED_FLAG_KEY]: true });
+    const prompt = buildSystemPrompt();
+    expect(prompt).toContain(`id="${DECLARED_SKILL_ID}"`);
+  });
+  test('persisted overrides for undeclared flags are respected', () => {
+    seedBrowserSkill();
+    currentConfig = configWith({ 'feature_flags.browser.enabled': false });
+    const prompt = buildSystemPrompt();
+    // 'browser' has no entry in the defaults registry, but an explicit user
+    // override disabling it must still be honored.
+    expect(prompt).not.toContain('id="browser"');
+  });
+  test('undeclared flags with no persisted override default to enabled', () => {
+    seedBrowserSkill();
+    currentConfig = configWith();
+    const prompt = buildSystemPrompt();
+    expect(prompt).toContain('id="browser"');
+  });
+});
+// ---------------------------------------------------------------------------
+// Resolver unit tests (within integration context)
+// ---------------------------------------------------------------------------
+describe('isAssistantFeatureFlagEnabled', () => {
+  // Partial configs are cast with `as any`: each case supplies only the
+  // assistantFeatureFlagValues field (or nothing at all).
+  test('reads from assistantFeatureFlagValues', () => {
+    const overrides = { [DECLARED_FLAG_KEY]: true };
+    const enabled = isAssistantFeatureFlagEnabled(DECLARED_FLAG_KEY, { assistantFeatureFlagValues: overrides } as any);
+    expect(enabled).toBe(true);
+  });
+  test('explicit false override in assistantFeatureFlagValues', () => {
+    const overrides = { [DECLARED_FLAG_KEY]: false };
+    const enabled = isAssistantFeatureFlagEnabled(DECLARED_FLAG_KEY, { assistantFeatureFlagValues: overrides } as any);
+    expect(enabled).toBe(false);
+  });
+  test('missing persisted value falls back to defaults registry defaultEnabled', () => {
+    // Empty config: the result must come from the defaults registry, which
+    // is expected to declare hatch-new-assistant with defaultEnabled: true.
+    const enabled = isAssistantFeatureFlagEnabled(DECLARED_FLAG_KEY, {} as any);
+    expect(enabled).toBe(true);
+  });
+  test('unknown flag defaults to true when no persisted override', () => {
+    const enabled = isAssistantFeatureFlagEnabled('feature_flags.unknown-skill.enabled', {} as any);
+    expect(enabled).toBe(true);
+  });
+  test('undeclared flag respects persisted canonical override', () => {
+    const overrides = { 'feature_flags.browser.enabled': false };
+    const enabled = isAssistantFeatureFlagEnabled('feature_flags.browser.enabled', {
+      assistantFeatureFlagValues: overrides,
+    } as any);
+    expect(enabled).toBe(false);
+  });
+});
+describe('legacy isSkillFeatureEnabled backward compat', () => {
+  test('delegates to the canonical resolver', () => {
+    // An override stored under the canonical flag key must be visible
+    // through the legacy skill-id entry point.
+    const overrides = { [DECLARED_FLAG_KEY]: false };
+    const enabled = isSkillFeatureEnabled(DECLARED_SKILL_ID, { assistantFeatureFlagValues: overrides } as any);
+    expect(enabled).toBe(false);
+  });
+  test('enabled when no override set', () => {
+    const enabled = isSkillFeatureEnabled(DECLARED_SKILL_ID, {} as any);
+    expect(enabled).toBe(true);
+  });
+});