npm - vellum - Versions diffs - 0.2.12 → 0.2.14 - Mend

vellum 0.2.12 → 0.2.14

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (209) hide show

package/README.md +32 -0
package/bun.lock +2 -2
package/docs/skills.md +4 -4
package/package.json +2 -2
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +213 -3
package/src/__tests__/app-git-history.test.ts +176 -0
package/src/__tests__/app-git-service.test.ts +169 -0
package/src/__tests__/assistant-events-sse-hardening.test.ts +315 -0
package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +8 -8
package/src/__tests__/browser-skill-endstate.test.ts +6 -6
package/src/__tests__/call-bridge.test.ts +105 -13
package/src/__tests__/call-domain.test.ts +163 -0
package/src/__tests__/call-orchestrator.test.ts +171 -0
package/src/__tests__/call-routes-http.test.ts +246 -6
package/src/__tests__/channel-approval-routes.test.ts +438 -0
package/src/__tests__/channel-approval.test.ts +266 -0
package/src/__tests__/channel-approvals.test.ts +393 -0
package/src/__tests__/channel-delivery-store.test.ts +447 -0
package/src/__tests__/checker.test.ts +607 -1048
package/src/__tests__/cli.test.ts +1 -56
package/src/__tests__/config-schema.test.ts +402 -5
package/src/__tests__/conflict-intent-tokenization.test.ts +141 -0
package/src/__tests__/conflict-policy.test.ts +121 -0
package/src/__tests__/conflict-store.test.ts +2 -0
package/src/__tests__/contacts-tools.test.ts +3 -3
package/src/__tests__/contradiction-checker.test.ts +99 -1
package/src/__tests__/credential-security-invariants.test.ts +22 -6
package/src/__tests__/credential-vault-unit.test.ts +780 -0
package/src/__tests__/elevenlabs-client.test.ts +271 -0
package/src/__tests__/ephemeral-permissions.test.ts +73 -23
package/src/__tests__/filesystem-tools.test.ts +579 -0
package/src/__tests__/gateway-only-enforcement.test.ts +114 -4
package/src/__tests__/handlers-add-trust-rule-metadata.test.ts +202 -0
package/src/__tests__/handlers-cu-observation-blob.test.ts +2 -1
package/src/__tests__/handlers-ipc-blob-probe.test.ts +2 -1
package/src/__tests__/handlers-slack-config.test.ts +2 -1
package/src/__tests__/handlers-telegram-config.test.ts +855 -0
package/src/__tests__/handlers-twitter-config.test.ts +141 -1
package/src/__tests__/hooks-runner.test.ts +6 -2
package/src/__tests__/host-file-edit-tool.test.ts +124 -0
package/src/__tests__/host-file-read-tool.test.ts +62 -0
package/src/__tests__/host-file-write-tool.test.ts +59 -0
package/src/__tests__/host-shell-tool.test.ts +251 -0
package/src/__tests__/ingress-reconcile.test.ts +581 -0
package/src/__tests__/ipc-snapshot.test.ts +100 -41
package/src/__tests__/ipc-validate.test.ts +50 -0
package/src/__tests__/key-migration.test.ts +23 -0
package/src/__tests__/memory-regressions.test.ts +99 -0
package/src/__tests__/memory-retrieval.benchmark.test.ts +1 -1
package/src/__tests__/oauth-callback-registry.test.ts +11 -4
package/src/__tests__/playbook-execution.test.ts +502 -0
package/src/__tests__/playbook-tools.test.ts +4 -6
package/src/__tests__/public-ingress-urls.test.ts +34 -0
package/src/__tests__/qdrant-manager.test.ts +267 -0
package/src/__tests__/recurrence-engine-rruleset.test.ts +97 -0
package/src/__tests__/recurrence-engine.test.ts +9 -0
package/src/__tests__/recurrence-types.test.ts +8 -0
package/src/__tests__/registry.test.ts +1 -1
package/src/__tests__/runtime-runs.test.ts +1 -25
package/src/__tests__/schedule-store.test.ts +16 -14
package/src/__tests__/schedule-tools.test.ts +83 -0
package/src/__tests__/scheduler-recurrence.test.ts +111 -10
package/src/__tests__/secret-allowlist.test.ts +18 -17
package/src/__tests__/secret-ingress-handler.test.ts +11 -0
package/src/__tests__/secret-scanner.test.ts +43 -0
package/src/__tests__/session-conflict-gate.test.ts +442 -6
package/src/__tests__/session-init.benchmark.test.ts +3 -0
package/src/__tests__/session-process-bridge.test.ts +242 -0
package/src/__tests__/session-skill-tools.test.ts +1 -1
package/src/__tests__/shell-identity.test.ts +256 -0
package/src/__tests__/skill-projection.benchmark.test.ts +11 -1
package/src/__tests__/subagent-tools.test.ts +637 -54
package/src/__tests__/task-management-tools.test.ts +936 -0
package/src/__tests__/task-runner.test.ts +2 -2
package/src/__tests__/terminal-tools.test.ts +840 -0
package/src/__tests__/tool-executor-shell-integration.test.ts +301 -0
package/src/__tests__/tool-executor.test.ts +85 -151
package/src/__tests__/tool-permission-simulate-handler.test.ts +336 -0
package/src/__tests__/trust-store.test.ts +28 -453
package/src/__tests__/twilio-provider.test.ts +153 -3
package/src/__tests__/twilio-routes-elevenlabs.test.ts +375 -0
package/src/__tests__/twilio-routes-twiml.test.ts +127 -0
package/src/__tests__/twilio-routes.test.ts +17 -262
package/src/__tests__/twitter-auth-handler.test.ts +2 -1
package/src/__tests__/twitter-cli-error-shaping.test.ts +208 -0
package/src/__tests__/twitter-cli-routing.test.ts +252 -0
package/src/__tests__/twitter-oauth-client.test.ts +209 -0
package/src/__tests__/workspace-policy.test.ts +213 -0
package/src/calls/call-bridge.ts +92 -19
package/src/calls/call-domain.ts +157 -5
package/src/calls/call-orchestrator.ts +96 -8
package/src/calls/call-store.ts +6 -0
package/src/calls/elevenlabs-client.ts +97 -0
package/src/calls/elevenlabs-config.ts +31 -0
package/src/calls/twilio-provider.ts +91 -0
package/src/calls/twilio-routes.ts +50 -6
package/src/calls/types.ts +3 -1
package/src/calls/voice-quality.ts +114 -0
package/src/cli/twitter.ts +200 -21
package/src/cli.ts +1 -20
package/src/config/bundled-skills/contacts/tools/contact-merge.ts +52 -4
package/src/config/bundled-skills/contacts/tools/contact-search.ts +55 -4
package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +61 -4
package/src/config/bundled-skills/messaging/SKILL.md +17 -2
package/src/config/bundled-skills/messaging/tools/messaging-reply.ts +4 -1
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +5 -1
package/src/config/bundled-skills/messaging/tools/shared.ts +5 -0
package/src/config/bundled-skills/phone-calls/SKILL.md +207 -19
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +95 -6
package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +51 -6
package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +73 -6
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +110 -6
package/src/config/bundled-skills/public-ingress/SKILL.md +22 -5
package/src/config/bundled-skills/twitter/SKILL.md +103 -17
package/src/config/defaults.ts +26 -2
package/src/config/schema.ts +178 -9
package/src/config/types.ts +3 -0
package/src/config/vellum-skills/telegram-setup/SKILL.md +56 -61
package/src/daemon/assistant-attachments.ts +4 -2
package/src/daemon/handlers/apps.ts +69 -0
package/src/daemon/handlers/config.ts +543 -24
package/src/daemon/handlers/index.ts +1 -0
package/src/daemon/handlers/sessions.ts +22 -6
package/src/daemon/handlers/shared.ts +2 -1
package/src/daemon/handlers/skills.ts +5 -20
package/src/daemon/ipc-contract-inventory.json +28 -0
package/src/daemon/ipc-contract.ts +168 -10
package/src/daemon/ipc-validate.ts +17 -0
package/src/daemon/lifecycle.ts +2 -0
package/src/daemon/server.ts +78 -72
package/src/daemon/session-attachments.ts +1 -1
package/src/daemon/session-conflict-gate.ts +62 -6
package/src/daemon/session-notifiers.ts +1 -1
package/src/daemon/session-process.ts +62 -3
package/src/daemon/session-tool-setup.ts +1 -2
package/src/daemon/tls-certs.ts +189 -0
package/src/daemon/video-thumbnail.ts +5 -3
package/src/hooks/manager.ts +5 -9
package/src/memory/app-git-service.ts +295 -0
package/src/memory/app-store.ts +21 -0
package/src/memory/conflict-intent.ts +47 -4
package/src/memory/conflict-policy.ts +73 -0
package/src/memory/conflict-store.ts +9 -1
package/src/memory/contradiction-checker.ts +28 -0
package/src/memory/conversation-key-store.ts +15 -0
package/src/memory/db.ts +81 -0
package/src/memory/embedding-local.ts +3 -13
package/src/memory/external-conversation-store.ts +234 -0
package/src/memory/job-handlers/conflict.ts +22 -2
package/src/memory/jobs-worker.ts +67 -28
package/src/memory/runs-store.ts +54 -7
package/src/memory/schema.ts +20 -0
package/src/messaging/provider.ts +9 -0
package/src/messaging/providers/telegram-bot/adapter.ts +162 -0
package/src/messaging/providers/telegram-bot/client.ts +104 -0
package/src/messaging/providers/telegram-bot/types.ts +15 -0
package/src/messaging/registry.ts +1 -0
package/src/permissions/checker.ts +48 -44
package/src/permissions/defaults.ts +11 -0
package/src/permissions/prompter.ts +0 -4
package/src/permissions/shell-identity.ts +227 -0
package/src/permissions/trust-store.ts +76 -53
package/src/permissions/types.ts +0 -19
package/src/permissions/workspace-policy.ts +114 -0
package/src/providers/retry.ts +12 -37
package/src/runtime/assistant-event-hub.ts +41 -4
package/src/runtime/channel-approval-parser.ts +60 -0
package/src/runtime/channel-approval-types.ts +71 -0
package/src/runtime/channel-approvals.ts +145 -0
package/src/runtime/gateway-client.ts +16 -0
package/src/runtime/http-server.ts +29 -9
package/src/runtime/routes/call-routes.ts +52 -2
package/src/runtime/routes/channel-routes.ts +296 -16
package/src/runtime/routes/conversation-routes.ts +12 -5
package/src/runtime/routes/events-routes.ts +97 -28
package/src/runtime/routes/run-routes.ts +2 -7
package/src/runtime/run-orchestrator.ts +0 -3
package/src/schedule/recurrence-engine.ts +26 -2
package/src/schedule/recurrence-types.ts +1 -1
package/src/schedule/schedule-store.ts +12 -3
package/src/security/secret-scanner.ts +7 -0
package/src/tasks/ephemeral-permissions.ts +0 -2
package/src/tasks/task-scheduler.ts +2 -1
package/src/tools/calls/call-start.ts +8 -0
package/src/tools/execution-target.ts +21 -0
package/src/tools/execution-timeout.ts +49 -0
package/src/tools/executor.ts +6 -135
package/src/tools/network/web-search.ts +9 -32
package/src/tools/policy-context.ts +29 -0
package/src/tools/schedule/update.ts +8 -1
package/src/tools/terminal/parser.ts +16 -18
package/src/tools/types.ts +4 -11
package/src/twitter/oauth-client.ts +102 -0
package/src/twitter/router.ts +101 -0
package/src/util/debounce.ts +88 -0
package/src/util/network-info.ts +47 -0
package/src/util/platform.ts +29 -4
package/src/util/promise-guard.ts +37 -0
package/src/util/retry.ts +98 -0
package/src/util/truncate.ts +1 -1
package/src/workspace/git-service.ts +129 -112
package/src/tools/contacts/contact-merge.ts +0 -55
package/src/tools/contacts/contact-search.ts +0 -58
package/src/tools/contacts/contact-upsert.ts +0 -64
package/src/tools/playbooks/index.ts +0 -4
package/src/tools/playbooks/playbook-create.ts +0 -96
package/src/tools/playbooks/playbook-delete.ts +0 -52
package/src/tools/playbooks/playbook-list.ts +0 -74
package/src/tools/playbooks/playbook-update.ts +0 -111

package/src/permissions/checker.ts CHANGED Viewed

@@ -5,10 +5,21 @@ import { resolveSkillSelector } from '../config/skills.js';
 import { computeSkillVersionHash } from '../skills/version-hash.js';
 import { getTool } from '../tools/registry.js';
 import { getConfig } from '../config/loader.js';
+import { getLogger } from '../util/logger.js';
 import { dirname, resolve } from 'node:path';
 import { homedir } from 'node:os';
 import { looksLikeHostPortShorthand, looksLikePathOnlyInput } from '../tools/network/url-safety.js';
 import { normalizeFilePath, isSkillSourcePath } from '../skills/path-classifier.js';
+import { isWorkspaceScopedInvocation } from './workspace-policy.js';
+import { buildShellCommandCandidates, buildShellAllowlistOptions, type ParsedCommand } from './shell-identity.js';
+// Ensures the legacy mode deprecation warning fires at most once per process (check() sets this when it logs the warning for permissions mode "legacy").
+let _legacyDeprecationWarned = false;
+/**
+ * Clears the one-time legacy-mode deprecation flag so that the next check()
+ * running in "legacy" permissions mode logs the warning again.
+ *
+ * @internal — exposed only for tests to reset the one-time warning flag.
+ */
+export function _resetLegacyDeprecationWarning(): void {
+  _legacyDeprecationWarned = false;
+}
 // Low-risk shell programs that are read-only / informational
 const LOW_RISK_PROGRAMS = new Set([
@@ -143,9 +154,9 @@ function escapeMinimatchLiteral(value: string): string {
   return value.replace(/([\\*?[\]{}()!+@|])/g, '\\$1');
 }
-function buildCommandCandidates(toolName: string, input: Record<string, unknown>, workingDir: string): string[] {
+async function buildCommandCandidates(toolName: string, input: Record<string, unknown>, workingDir: string, preParsed?: ParsedCommand): Promise<string[]> {
   if (toolName === 'bash' || toolName === 'host_bash') {
-    return [getStringField(input, 'command')];
+    return buildShellCommandCandidates(getStringField(input, 'command'), preParsed);
   }
   if (toolName === 'skill_load') {
@@ -233,7 +244,7 @@ function buildCommandCandidates(toolName: string, input: Record<string, unknown>
   return [...new Set(candidates)];
 }
-export async function classifyRisk(toolName: string, input: Record<string, unknown>, workingDir?: string): Promise<RiskLevel> {
+export async function classifyRisk(toolName: string, input: Record<string, unknown>, workingDir?: string, preParsed?: ParsedCommand): Promise<RiskLevel> {
   if (toolName === 'file_read') return RiskLevel.Low;
   if (toolName === 'file_write' || toolName === 'file_edit') {
     const filePath = getStringField(input, 'path', 'file_path');
@@ -273,7 +284,7 @@ export async function classifyRisk(toolName: string, input: Record<string, unkno
     const command = (input.command as string) ?? '';
     if (!command.trim()) return RiskLevel.Low;
-    const parsed = await parse(command);
+    const parsed = preParsed ?? await parse(command);
     // Dangerous patterns → High
     if (parsed.dangerousPatterns.length > 0) return RiskLevel.High;
@@ -341,10 +352,19 @@ export async function check(
   workingDir: string,
   policyContext?: PolicyContext,
 ): Promise<PermissionCheckResult> {
-  const risk = await classifyRisk(toolName, input, workingDir);
+  // For shell tools, parse once and share the result to avoid duplicate tree-sitter work.
+  let shellParsed: ParsedCommand | undefined;
+  if (toolName === 'bash' || toolName === 'host_bash') {
+    const command = ((input.command as string) ?? '').trim();
+    if (command) {
+      shellParsed = await parse(command);
+    }
+  }
+  const risk = await classifyRisk(toolName, input, workingDir, shellParsed);
   // Build command string candidates for rule matching
-  const commandCandidates = buildCommandCandidates(toolName, input, workingDir);
+  const commandCandidates = await buildCommandCandidates(toolName, input, workingDir, shellParsed);
   // Find the highest-priority matching rule across all candidates
   const matchedRule = findHighestPriorityRule(toolName, commandCandidates, workingDir, policyContext);
@@ -399,10 +419,28 @@ export async function check(
   // agent new capabilities, so in strict mode users must approve each
   // skill load via an exact-version or wildcard trust rule.
   const permissionsMode = getConfig().permissions.mode;
+  if (permissionsMode === 'legacy' && !_legacyDeprecationWarned) {
+    _legacyDeprecationWarned = true;
+    getLogger('checker').warn('Permissions mode "legacy" is deprecated and will be removed in a future release. Switch to "workspace" (default) or "strict".');
+  }
   if (permissionsMode === 'strict' && !matchedRule) {
     return { decision: 'prompt', reason: `Strict mode: no matching rule, requires approval` };
   }
+  // Workspace mode: auto-allow workspace-scoped operations that don't have
+  // an explicit rule. Non-workspace operations fall through to risk-based policy.
+  if (permissionsMode === 'workspace' && !matchedRule) {
+    // When sandbox is disabled, bash runs on the host — don't auto-allow
+    const sandboxEnabled = getConfig().sandbox.enabled;
+    if (toolName === 'bash' && !sandboxEnabled) {
+      // Fall through to risk-based policy below
+    } else if (isWorkspaceScopedInvocation(toolName, input, workingDir)) {
+      return { decision: 'allow', reason: 'Workspace mode: workspace-scoped operation auto-allowed' };
+    }
+  }
   // Auto-allow low-risk bundled skill tools even without explicit trust rules.
   // These are first-party tools with a vetted risk declaration — applying the
   // same policy as the per-tool default allow rules for browser tools, but
@@ -448,38 +486,10 @@ function friendlyHostname(url: URL): string {
   return url.hostname.replace(/^www\./, '');
 }
-export function generateAllowlistOptions(toolName: string, input: Record<string, unknown>): AllowlistOption[] {
+export async function generateAllowlistOptions(toolName: string, input: Record<string, unknown>): Promise<AllowlistOption[]> {
   if (toolName === 'bash' || toolName === 'host_bash') {
     const command = ((input.command as string) ?? '').trim();
-    const parts = command.split(/\s+/);
-    const program = parts[0] ?? command;
-    const options: AllowlistOption[] = [];
-    // Exact match
-    options.push({ label: command, description: 'This exact command', pattern: command });
-    if (parts.length >= 2) {
-      // Subcommand wildcard: "npm install *"
-      const sub = parts.slice(0, -1).join(' ');
-      options.push({
-        label: `${sub} *`,
-        description: `Any "${sub}" command`,
-        pattern: `${sub} *`,
-      });
-    }
-    if (parts.length >= 1) {
-      // Program wildcard: "npm *"
-      options.push({ label: `${program} *`, description: `Any ${program} command`, pattern: `${program} *` });
-    }
-    // Deduplicate
-    const seen = new Set<string>();
-    return options.filter((o) => {
-      if (seen.has(o.pattern)) return false;
-      seen.add(o.pattern);
-      return true;
-    });
+    return buildShellAllowlistOptions(command);
   }
   if (
@@ -604,7 +614,7 @@ export function generateAllowlistOptions(toolName: string, input: Record<string,
   return [{ label: '*', description: 'Everything', pattern: '*' }];
 }
-export function generateScopeOptions(workingDir: string, toolName?: string): ScopeOption[] {
+export function generateScopeOptions(workingDir: string, _toolName?: string): ScopeOption[] {
   const home = homedir();
   const options: ScopeOption[] = [];
@@ -626,11 +636,5 @@ export function generateScopeOptions(workingDir: string, toolName?: string): Sco
   // Everywhere
   options.push({ label: 'everywhere', scope: 'everywhere' });
-  if (!toolName?.startsWith('host_')) {
-    return options;
-  }
-  const everywhere = options.find((option) => option.scope === 'everywhere');
-  const scoped = options.filter((option) => option.scope !== 'everywhere');
-  return everywhere ? [everywhere, ...scoped] : options;
+  return options;
 }

package/src/permissions/defaults.ts CHANGED Viewed

@@ -225,6 +225,16 @@ export function getDefaultRuleTemplates(): DefaultRuleTemplate[] {
     priority: 100,
   };
+  // memory_search is a read-only tool — always allow without prompting.
+  const memorySearchRule: DefaultRuleTemplate = {
+    id: 'default:allow-memory_search-global',
+    tool: 'memory_search',
+    pattern: 'memory_search:*',
+    scope: 'everywhere',
+    decision: 'allow',
+    priority: 100,
+  };
   return [
     ...hostFileRules,
     hostShellRule,
@@ -239,5 +249,6 @@ export function getDefaultRuleTemplates(): DefaultRuleTemplate[] {
     ...browserToolRules,
     ...uiSurfaceRules,
     viewImageRule,
+    memorySearchRule,
   ];
 }

package/src/permissions/prompter.ts CHANGED Viewed

@@ -37,7 +37,6 @@ export class PermissionPrompter {
     sandboxed?: boolean,
     sessionId?: string,
     executionTarget?: ExecutionTarget,
-    principal?: { kind?: string; id?: string; version?: string },
     persistentDecisionsAllowed?: boolean,
   ): Promise<{ decision: UserDecision; selectedPattern?: string; selectedScope?: string }> {
     const requestId = uuid();
@@ -64,9 +63,6 @@ export class PermissionPrompter {
         sandboxed,
         sessionId,
         executionTarget,
-        principalKind: principal?.kind,
-        principalId: principal?.id,
-        principalVersion: principal?.version,
         persistentDecisionsAllowed: persistentDecisionsAllowed ?? true,
       });
     });

package/src/permissions/shell-identity.ts ADDED Viewed

@@ -0,0 +1,227 @@
+import { parse, type ParsedCommand, type CommandSegment, type DangerousPattern } from '../tools/terminal/parser.js';
+import type { AllowlistOption } from './types.js';
+export type { ParsedCommand };
+export interface ShellActionKey {
+  /** Action key string: "action:" followed by space-joined command tokens, e.g. "action:gh", "action:gh pr", "action:gh pr view" */
+  key: string;
+  /** How many tokens deep this key goes (1 = program name only) */
+  depth: number;
+}
+export interface ShellIdentityAnalysis {
+  /** The parsed segments from the shell parser, passed through unchanged */
+  segments: CommandSegment[];
+  /** The non-empty `operator` values of the segments, in segment order (e.g. ['&&', '|']) */
+  operators: string[];
+  /** Whether the command contains opaque constructs (eval, heredocs, etc.), as reported by the parser */
+  hasOpaqueConstructs: boolean;
+  /** Dangerous patterns detected by the parser */
+  dangerousPatterns: DangerousPattern[];
+}
+export interface ActionKeyResult {
+  /** The derived action keys from narrowest to broadest; empty when the command is not a simple action */
+  keys: ShellActionKey[];
+  /** Whether this command has a "simple action" shape (optional setup prefix + exactly one action) */
+  isSimpleAction: boolean;
+  /** The primary action segment (the non-setup-prefix action command); only set when isSimpleAction is true */
+  primarySegment?: CommandSegment;
+}
+/**
+ * Programs that are considered setup prefixes (not the main action).
+ * Leading segments whose program is in this set are skipped when
+ * deriveShellActionKeys looks for the primary action segment.
+ */
+const SETUP_PREFIX_PROGRAMS = new Set(['cd', 'pushd', 'export', 'unset', 'set']);
+const MAX_ACTION_KEY_DEPTH = 3;
+/**
+ * Analyze a shell command using the tree-sitter parser to extract
+ * identity information for permission decisions.
+ *
+ * @param command - Shell command text; only parsed when `preParsed` is not supplied.
+ * @param preParsed - Optional already-parsed result for `command`. When given it is
+ *   used as-is and `parse()` is not called, so callers can share one parse.
+ * @returns The parser's segments, opaque-construct flag and dangerous patterns,
+ *   plus the list of non-empty segment operators in segment order.
+ */
+export async function analyzeShellCommand(command: string, preParsed?: ParsedCommand): Promise<ShellIdentityAnalysis> {
+  const parsed = preParsed ?? await parse(command);
+  const operators: string[] = [];
+  for (const seg of parsed.segments) {
+    if (seg.operator) {
+      operators.push(seg.operator);
+    }
+  }
+  return {
+    segments: parsed.segments,
+    operators,
+    hasOpaqueConstructs: parsed.hasOpaqueConstructs,
+    dangerousPatterns: parsed.dangerousPatterns,
+  };
+}
+/**
+ * Derive canonical action keys from a shell command analysis.
+ *
+ * Action keys identify the "family" of a command for allowlist purposes.
+ * For example, `cd repo && gh pr view 5525 --json title` derives:
+ *   - action:gh pr view
+ *   - action:gh pr
+ *   - action:gh
+ *
+ * Only "simple action" commands (optional setup prefix + one action) get
+ * action keys. Pipelines and complex chains are marked non-simple.
+ *
+ * Only `analysis.segments` is read here; the other analysis fields are not
+ * consulted when deriving keys.
+ *
+ * @param analysis - Result of analyzeShellCommand for the command.
+ * @returns `{ keys: [], isSimpleAction: false }` for empty or non-simple
+ *   commands; otherwise the keys (narrowest first), `isSimpleAction: true`
+ *   and the single action segment as `primarySegment`.
+ */
+export function deriveShellActionKeys(analysis: ShellIdentityAnalysis): ActionKeyResult {
+  const { segments } = analysis;
+  if (segments.length === 0) {
+    return { keys: [], isSimpleAction: false };
+  }
+  // For multi-segment commands, only allow simple-action classification if
+  // ALL inter-segment operators are explicitly &&. Any other operator (|, ||,
+  // ;, &, empty/missing) means the separator is unknown or unsafe.
+  // This safely handles cases where the parser doesn't capture certain
+  // separators (;, newline, &) and leaves them as empty operators.
+  if (segments.length > 1) {
+    for (const seg of segments) {
+      const op = seg.operator;
+      // Non-empty operator that isn't && → definitely complex
+      if (op && op !== '&&') {
+        return { keys: [], isSimpleAction: false };
+      }
+    }
+    // Also check: if there are multiple segments but no operators at all
+    // between them (e.g. newline-separated), that's suspicious.
+    // The first segment always has operator '' (no preceding operator).
+    // If any non-first segment also has operator '', the separator was
+    // not captured — treat as complex for safety.
+    for (let i = 1; i < segments.length; i++) {
+      if (!segments[i].operator) {
+        return { keys: [], isSimpleAction: false };
+      }
+    }
+  }
+  // Separate setup-prefix segments from action segments (only LEADING setup-prefix segments are skipped; once an action is seen, every later segment counts as an action)
+  const actionSegments: CommandSegment[] = [];
+  let foundNonPrefix = false;
+  for (const seg of segments) {
+    if (!foundNonPrefix && SETUP_PREFIX_PROGRAMS.has(seg.program)) {
+      continue;
+    }
+    foundNonPrefix = true;
+    actionSegments.push(seg);
+  }
+  // Simple action: exactly one non-prefix action segment (zero — e.g. only setup commands — or several are both non-simple)
+  if (actionSegments.length !== 1) {
+    return { keys: [], isSimpleAction: false };
+  }
+  const primarySegment = actionSegments[0];
+  const tokens: string[] = [primarySegment.program];
+  // Add stable subcommand tokens (up to MAX_ACTION_KEY_DEPTH total, program included); skipped: flags, path-like args ('/' or leading '.'), all-digit args, and args containing '$' or quotes
+  for (const arg of primarySegment.args) {
+    if (tokens.length >= MAX_ACTION_KEY_DEPTH) break;
+    if (arg.startsWith('-')) continue;
+    if (arg.includes('/') || arg.startsWith('.')) continue;
+    if (/^\d+$/.test(arg)) continue;
+    if (arg.includes('$') || arg.includes('"') || arg.includes("'")) continue;
+    tokens.push(arg);
+  }
+  // Build action keys from narrowest to broadest (full token list first, program-only key last)
+  const keys: ShellActionKey[] = [];
+  for (let depth = tokens.length; depth >= 1; depth--) {
+    keys.push({
+      key: `action:${tokens.slice(0, depth).join(' ')}`,
+      depth,
+    });
+  }
+  return { keys, isSimpleAction: true, primarySegment };
+}
+/**
+ * Build an ordered list of command candidates for trust-rule matching.
+ *
+ * Candidate ordering:
+ *   1. Raw command (backward compatibility — existing rules match as before)
+ *   2. Canonical primary command (if simple action) — the full primary segment text
+ *   3. Action keys from narrowest to broadest (if simple action)
+ *
+ * Complex commands (pipelines, multi-action chains) only return the raw candidate.
+ *
+ * @param command - Shell command text; it is trimmed before use. A command that
+ *   is empty after trimming yields a single empty-string candidate.
+ * @param preParsed - Optional parse result forwarded to analyzeShellCommand so
+ *   the command is not parsed a second time.
+ * @returns The candidates in the order above, with duplicates removed.
+ */
+export async function buildShellCommandCandidates(command: string, preParsed?: ParsedCommand): Promise<string[]> {
+  const trimmed = command.trim();
+  if (!trimmed) return [trimmed];
+  const analysis = await analyzeShellCommand(trimmed, preParsed);
+  const actionResult = deriveShellActionKeys(analysis);
+  const candidates: string[] = [trimmed];
+  if (actionResult.isSimpleAction && actionResult.primarySegment) {
+    // Add canonical primary command text (the actual segment, not the full command with setup prefixes)
+    const canonical = actionResult.primarySegment.command;
+    if (canonical !== trimmed) {
+      candidates.push(canonical);
+    }
+    // Add action keys ("action:…" strings, narrowest first)
+    for (const actionKey of actionResult.keys) {
+      candidates.push(actionKey.key);
+    }
+  }
+  // Deduplicate while preserving order
+  return [...new Set(candidates)];
+}
+/**
+ * Build allowlist options for shell commands using parser-derived identity.
+ *
+ * For simple actions (optional setup prefix + one action), options are:
+ *   1. The exact original command text (trimmed, including any setup prefix)
+ *   2. Deepest action key (e.g. "action:gh pr view")
+ *   3. Broader action keys (e.g. "action:gh pr", "action:gh")
+ *
+ * For complex commands (pipelines, multi-action chains), only the exact
+ * command is offered (no broad options).
+ *
+ * Action-key options use the key itself (e.g. "action:gh pr") as `pattern`,
+ * while the label shown is the key's tokens followed by " *".
+ *
+ * @param command - Shell command text; it is trimmed before use.
+ * @returns The options in the order above, deduplicated by pattern. An empty
+ *   array is returned when the command is empty after trimming.
+ */
+export async function buildShellAllowlistOptions(command: string): Promise<AllowlistOption[]> {
+  const trimmed = command.trim();
+  if (!trimmed) return [];
+  const analysis = await analyzeShellCommand(trimmed);
+  const actionResult = deriveShellActionKeys(analysis);
+  if (!actionResult.isSimpleAction || !actionResult.primarySegment) {
+    // Complex command — exact only
+    return [{ label: trimmed, description: 'This exact compound command', pattern: trimmed }];
+  }
+  const options: AllowlistOption[] = [];
+  // Full original command text — "this exact command" means exactly what the user approved
+  options.push({ label: trimmed, description: 'This exact command', pattern: trimmed });
+  // Action keys from narrowest to broadest
+  for (const actionKey of actionResult.keys) {
+    const keyTokens = actionKey.key.replace(/^action:/, '');
+    options.push({
+      label: `${keyTokens} *`,
+      description: `Any "${keyTokens}" command`,
+      pattern: actionKey.key,
+    });
+  }
+  // Deduplicate by pattern (first occurrence wins, order preserved)
+  const seen = new Set<string>();
+  return options.filter((o) => {
+    if (seen.has(o.pattern)) return false;
+    seen.add(o.pattern);
+    return true;
+  });
+}

package/src/permissions/trust-store.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 import { readFileSync, writeFileSync, existsSync, mkdirSync, renameSync, chmodSync } from 'node:fs';
 import { join, dirname } from 'node:path';
 import { v4 as uuid } from 'uuid';
-import { minimatch } from 'minimatch';
+import { Minimatch } from 'minimatch';
 import { getRootDir } from '../util/platform.js';
 import { getLogger } from '../util/logger.js';
 import { getDefaultRuleTemplates } from './defaults.js';
@@ -21,6 +21,50 @@ interface TrustFile {
 let cachedRules: TrustRule[] | null = null;
 let cachedStarterBundleAccepted: boolean | null = null;
+/**
+ * Cache of pre-compiled Minimatch objects keyed by pattern string.
+ * Rebuilt whenever cachedRules changes. Avoids re-parsing glob patterns
+ * on every tool-call permission check.
+ *
+ * getCompiledPattern also adds entries lazily for patterns that are not
+ * in the cache yet.
+ */
+const compiledPatterns = new Map<string, Minimatch>();
+/**
+ * Get or compile a Minimatch object for the given pattern. Returns null if the pattern is invalid.
+ *
+ * On a cache miss the pattern is compiled and stored in compiledPatterns.
+ * A non-string pattern, or a pattern whose Minimatch construction throws,
+ * is logged as a warning and yields null; nothing is cached in that case.
+ *
+ * @param pattern - Glob pattern string, e.g. a trust rule's `pattern`.
+ * @returns The cached or newly compiled matcher, or null when it cannot be compiled.
+ */
+function getCompiledPattern(pattern: string): Minimatch | null {
+  let compiled = compiledPatterns.get(pattern);
+  if (!compiled) {
+    if (typeof pattern !== 'string') {
+      log.warn({ pattern }, 'Cannot compile non-string pattern');
+      return null;
+    }
+    try {
+      compiled = new Minimatch(pattern);
+      compiledPatterns.set(pattern, compiled);
+    } catch (err) {
+      log.warn({ pattern, err }, 'Failed to compile pattern');
+      return null;
+    }
+  }
+  return compiled;
+}
+/**
+ * Rebuild the compiled pattern cache from the current rule set.
+ *
+ * Clears compiledPatterns, then compiles each distinct rule pattern once.
+ * Rules with a non-string pattern, or a pattern whose Minimatch construction
+ * throws, are logged as warnings and left out of the cache; the rules array
+ * itself is not modified.
+ *
+ * @param rules - The rule set whose patterns should populate the cache.
+ */
+function rebuildPatternCache(rules: TrustRule[]): void {
+  compiledPatterns.clear();
+  for (const rule of rules) {
+    if (typeof rule.pattern !== 'string') {
+      log.warn({ ruleId: rule.id, pattern: rule.pattern }, 'Skipping rule with non-string pattern during cache rebuild');
+      continue;
+    }
+    if (!compiledPatterns.has(rule.pattern)) {
+      try {
+        compiledPatterns.set(rule.pattern, new Minimatch(rule.pattern));
+      } catch (err) {
+        log.warn({ ruleId: rule.id, pattern: rule.pattern, err }, 'Skipping rule with invalid pattern during cache rebuild');
+      }
+    }
+  }
+}
 function getTrustPath(): string {
   return join(getRootDir(), 'protected', 'trust.json');
 }
@@ -201,6 +245,22 @@ function loadFromDisk(): TrustRule[] {
         log.info({ ruleCount: rules.length }, 'Migrated v2 trust rules to v3 (principal fields)');
       } else if (data.version === TRUST_FILE_VERSION) {
         rules = rawRules;
+        // Strip legacy principal-scoped fields from persisted v3 rules.
+        // Before the principal concept was removed, rules could carry
+        // principalKind/principalId/principalVersion which acted as scope
+        // constraints. Now that matching ignores those fields, leaving them
+        // on loaded rules would silently widen their scope to global
+        // wildcards. Stripping them and re-saving prevents scope escalation.
+        for (const rule of rules) {
+          const r = rule as unknown as Record<string, unknown>;
+          if ('principalKind' in r || 'principalId' in r || 'principalVersion' in r) {
+            delete r.principalKind;
+            delete r.principalId;
+            delete r.principalVersion;
+            needsSave = true;
+          }
+        }
       } else if (data.version !== 1) {
         log.warn({ version: data.version }, 'Unknown trust file version, applying defaults in-memory only');
         // Apply default deny rules in-memory so the assistant is still
@@ -262,6 +322,7 @@ function saveToDisk(rules: TrustRule[]): void {
 /**
  * Return the cached trust rules, loading them on first use.
  *
  * When `cachedRules` is `null`, the rules are obtained from `loadFromDisk()`
  * and the compiled pattern cache is rebuilt from them. While `cachedRules`
  * is non-null it is returned as-is, without loading again.
  *
  * @returns The cached rule array (the same array instance that is cached).
  */
 function getRules(): TrustRule[] {
   if (cachedRules === null) {
     cachedRules = loadFromDisk();
+    rebuildPatternCache(cachedRules); // keep compiled matchers in step with the freshly loaded rules
   }
   return cachedRules;
 }
@@ -274,9 +335,6 @@ export function addRule(
   priority: number = 100,
   options?: {
     allowHighRisk?: boolean;
-    principalKind?: string;
-    principalId?: string;
-    principalVersion?: string;
     executionTarget?: string;
   },
 ): TrustRule {
@@ -296,21 +354,13 @@ export function addRule(
   if (options?.allowHighRisk != null) {
     rule.allowHighRisk = options.allowHighRisk;
   }
-  if (options?.principalKind != null) {
-    rule.principalKind = options.principalKind;
-  }
-  if (options?.principalId != null) {
-    rule.principalId = options.principalId;
-  }
-  if (options?.principalVersion != null) {
-    rule.principalVersion = options.principalVersion;
-  }
   if (options?.executionTarget != null) {
     rule.executionTarget = options.executionTarget;
   }
   rules.push(rule);
   rules.sort(ruleOrder);
   cachedRules = rules;
+  rebuildPatternCache(rules);
   saveToDisk(rules);
   log.info({ rule }, 'Added trust rule');
   return rule;
@@ -337,6 +387,7 @@ export function updateRule(
   rules[index] = rule;
   rules.sort(ruleOrder);
   cachedRules = rules;
+  rebuildPatternCache(rules);
   saveToDisk(rules);
   log.info({ rule }, 'Updated trust rule');
   return rule;
@@ -353,6 +404,7 @@ export function removeRule(id: string): boolean {
   if (index === -1) return false;
   rules.splice(index, 1);
   cachedRules = rules;
+  rebuildPatternCache(rules);
   saveToDisk(rules);
   log.info({ id }, 'Removed trust rule');
   return true;
@@ -372,47 +424,14 @@ function findRuleByDecision(tool: string, command: string, scope: string, decisi
   for (const rule of rules) {
     if (rule.tool !== tool) continue;
     if (rule.decision !== decision) continue;
-    if (!minimatch(command, rule.pattern)) continue;
+    const compiled = getCompiledPattern(rule.pattern);
+    if (!compiled || !compiled.match(command)) continue;
     if (!matchesScope(rule.scope, scope)) continue;
     return rule;
   }
   return null;
 }
-/**
- * Check whether a rule's principal constraints match the given policy context.
- *
- * A missing field on the rule acts as a wildcard — it matches any value
- * (or absence) in the context. When a rule specifies a principal field,
- * the context must provide a matching value for the rule to apply.
- */
-function matchesPrincipal(rule: TrustRule, ctx?: PolicyContext): boolean {
-  // If the rule has no principal constraints it matches everything (wildcard).
-  if (rule.principalKind == null && rule.principalId == null && rule.principalVersion == null) {
-    return true;
-  }
-  const principal = ctx?.principal;
-  // Rule specifies a principalKind — context must supply one that matches.
-  if (rule.principalKind != null) {
-    if (principal?.kind !== rule.principalKind) return false;
-  }
-  // Rule specifies a principalId — context must supply one that matches.
-  if (rule.principalId != null) {
-    if (principal?.id !== rule.principalId) return false;
-  }
-  // Rule specifies a principalVersion — context must supply one that matches.
-  // If the rule omits principalVersion, any version (or none) is accepted.
-  if (rule.principalVersion != null) {
-    if (principal?.version !== rule.principalVersion) return false;
-  }
-  return true;
-}
 /**
  * Check whether a rule's executionTarget constraint matches the context.
  *
@@ -428,9 +447,9 @@ function matchesExecutionTarget(rule: TrustRule, ctx?: PolicyContext): boolean {
  * Find the highest-priority rule that matches any of the command candidates.
  * Rules are pre-sorted by priority descending, so the first match wins.
  *
- * When a `PolicyContext` is provided, rules that specify principal or
- * executionTarget constraints are filtered accordingly. Rules without
- * those constraints act as wildcards and match any context.
+ * When a `PolicyContext` is provided, rules that specify executionTarget
+ * constraints are filtered accordingly. Rules without those constraints
+ * act as wildcards and match any context.
  */
 export function findHighestPriorityRule(tool: string, commands: string[], scope: string, ctx?: PolicyContext): TrustRule | null {
   // Check ephemeral (task-scoped) rules first — they take precedence over
@@ -449,10 +468,11 @@ export function findHighestPriorityRule(tool: string, commands: string[], scope:
   for (const rule of allRules) {
     if (rule.tool !== tool) continue;
     if (!matchesScope(rule.scope, scope)) continue;
-    if (!matchesPrincipal(rule, ctx)) continue;
     if (!matchesExecutionTarget(rule, ctx)) continue;
+    const compiled = getCompiledPattern(rule.pattern);
+    if (!compiled) continue;
     for (const command of commands) {
-      if (minimatch(command, rule.pattern)) {
+      if (compiled.match(command)) {
         return rule;
       }
     }
@@ -480,6 +500,7 @@ export function clearAllRules(): void {
   backfillDefaults(rules);
   rules.sort(ruleOrder);
   cachedRules = rules;
+  rebuildPatternCache(rules);
   saveToDisk(rules);
   log.info('Cleared all user trust rules (default rules preserved)');
 }
@@ -487,6 +508,7 @@ export function clearAllRules(): void {
 /**
  * Reset this module's in-memory caches: the cached rule list, the cached
  * starter-bundle acceptance flag, and the compiled pattern cache.
  */
 export function clearCache(): void {
   cachedRules = null; // a null cache makes the next getRules() call load from disk again
   cachedStarterBundleAccepted = null;
+  compiledPatterns.clear(); // drop compiled matchers together with the rules they were built from
 }
 // ─── Starter approval bundle ────────────────────────────────────────────────
@@ -577,6 +599,7 @@ export function acceptStarterBundle(): AcceptStarterBundleResult {
   cachedStarterBundleAccepted = true;
   rules.sort(ruleOrder);
   cachedRules = rules;
+  rebuildPatternCache(rules);
   saveToDisk(rules);
   log.info({ rulesAdded: added }, 'Starter approval bundle accepted');