npm - @gotgenes/pi-permission-system - Versions diffs - 8.3.2 → 9.0.1 - Mend

@gotgenes/pi-permission-system 8.3.2 → 9.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25) hide show

package/CHANGELOG.md +35 -0
package/package.json +1 -1
package/src/handlers/gates/bash-command.ts +55 -0
package/src/handlers/gates/bash-external-directory.ts +2 -1
package/src/handlers/gates/bash-path-extractor.ts +9 -618
package/src/handlers/gates/bash-path.ts +13 -7
package/src/handlers/gates/bash-program.ts +727 -0
package/src/handlers/gates/candidate-check.ts +32 -0
package/src/handlers/lifecycle.ts +9 -0
package/src/handlers/permission-gate-handler.ts +21 -8
package/src/index.ts +30 -11
package/src/permission-events.ts +3 -2
package/src/service.ts +17 -4
package/src/subagent-context.ts +28 -9
package/test/composition-root.test.ts +398 -0
package/test/handlers/gates/bash-command.test.ts +167 -0
package/test/handlers/gates/bash-program.test.ts +107 -0
package/test/handlers/gates/candidate-check.test.ts +52 -0
package/test/handlers/lifecycle.test.ts +15 -2
package/test/handlers/tool-call.test.ts +73 -0
package/test/helpers/make-fake-pi.ts +95 -0
package/test/permission-events.test.ts +32 -2
package/test/permission-system.test.ts +16 -34
package/test/service.test.ts +25 -6
package/test/subagent-context.test.ts +40 -0

package/src/handlers/gates/bash-path-extractor.ts CHANGED Viewed

@@ -1,636 +1,27 @@
-import { createRequire } from "node:module";
-import { basename, resolve } from "node:path";
-import {
-  classifyTokenAsPathCandidate,
-  classifyTokenAsRuleCandidate,
-} from "#src/handlers/gates/bash-token-classification";
-import {
-  isPathWithinDirectory,
-  isSafeSystemPath,
-  normalizePathForComparison,
-} from "#src/path-utils";
-// ── tree-sitter-bash lazy parser ───────────────────────────────────────────
-/**
- * Minimal subset of web-tree-sitter's SyntaxNode used by the AST walker.
- * Defined locally so callers do not need to import web-tree-sitter types.
- */
-interface TSNode {
-  readonly type: string;
-  readonly text: string;
-  readonly childCount: number;
-  child(index: number): TSNode | null;
-}
-/**
- * Minimal subset of web-tree-sitter's Parser used by this module.
- */
-interface TSParser {
-  parse(input: string): { rootNode: TSNode; delete(): void } | null;
-  delete(): void;
-}
-let parserPromise: Promise<TSParser> | null = null;
-async function initParser(): Promise<TSParser> {
-  // Use named imports — web-tree-sitter exports Parser as a named class.
-  const { Parser, Language } = await import("web-tree-sitter");
-  const req = createRequire(import.meta.url);
-  const treeSitterWasm = req.resolve("web-tree-sitter/web-tree-sitter.wasm");
-  await Parser.init({ locateFile: () => treeSitterWasm });
-  const parser = new Parser();
-  const bashWasm = req.resolve("tree-sitter-bash/tree-sitter-bash.wasm");
-  const bash = await Language.load(bashWasm);
-  parser.setLanguage(bash);
-  return parser;
-}
-function getParser(): Promise<TSParser> {
-  parserPromise ??= initParser();
-  return parserPromise;
-}
-// ── AST walker ─────────────────────────────────────────────────────────────
-/**
- * Node types whose subtrees must never be descended into for
- * path extraction — their text content is not a command argument.
- */
-const SKIP_SUBTREE_TYPES = new Set(["heredoc_body", "heredoc_end", "comment"]);
+import { BashProgram } from "./bash-program";
 /**
- * Resolve the "shell value" of an argument node — the string the shell
- * would pass to the command after quote removal.
+ * Extract paths from a bash command string that resolve outside CWD.
  *
- * - `word`          → `.text` (already unquoted)
- * - `raw_string`    → strip surrounding single quotes
- * - `string`        → strip surrounding double quotes, concatenate children text
- * - `concatenation` → concatenate resolved children
- * - other           → `.text` as fallback
- */
-function resolveNodeText(node: TSNode): string {
-  switch (node.type) {
-    case "word":
-      return node.text;
-    case "raw_string": {
-      // Strip surrounding single quotes: 'content' → content
-      const t = node.text;
-      if (t.length >= 2 && t.startsWith("'") && t.endsWith("'")) {
-        return t.slice(1, -1);
-      }
-      return t;
-    }
-    case "string": {
-      // Double-quoted string: concatenate the resolved text of inner children,
-      // skipping the quote-delimiter nodes (literal `"`).
-      let result = "";
-      for (let i = 0; i < node.childCount; i++) {
-        const child = node.child(i);
-        if (!child) continue;
-        // Skip the literal `"` delimiters
-        if (child.type === '"') continue;
-        result += resolveNodeText(child);
-      }
-      return result;
-    }
-    case "string_content":
-    case "simple_expansion":
-    case "expansion":
-      return node.text;
-    case "concatenation": {
-      let result = "";
-      for (let i = 0; i < node.childCount; i++) {
-        const child = node.child(i);
-        if (!child) continue;
-        result += resolveNodeText(child);
-      }
-      return result;
-    }
-    default:
-      return node.text;
-  }
-}
-// ── Pattern-first command config ───────────────────────────────────────────
-interface PatternCommandConfig {
-  /** Flags that consume the next argument as a non-path value (pattern, separator, etc.) */
-  readonly argConsumingFlags: ReadonlySet<string>;
-  /** Flags that consume the next argument as a file path */
-  readonly fileConsumingFlags: ReadonlySet<string>;
-  /**
-   * Number of leading positional arguments that are patterns/scripts, not paths.
-   * Default: 1 (covers sed, awk, grep, rg).
-   * sd uses 2 (FIND and REPLACE_WITH are both non-path positionals).
-   */
-  readonly patternPositionals?: number;
-}
-/**
- * Commands whose first N positional arguments are inline patterns/scripts,
- * not filesystem paths. The map stores per-command flag configuration so
- * the walker can correctly identify which arguments are consumed by flags
- * vs. which are positional.
- */
-const PATTERN_FIRST_COMMANDS: ReadonlyMap<string, PatternCommandConfig> =
-  new Map([
-    [
-      "sed",
-      {
-        argConsumingFlags: new Set(["-e", "-i"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "awk",
-      {
-        argConsumingFlags: new Set(["-e", "-F", "-v"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "gawk",
-      {
-        argConsumingFlags: new Set(["-e", "-F", "-v"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "nawk",
-      {
-        argConsumingFlags: new Set(["-e", "-F", "-v"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "grep",
-      {
-        argConsumingFlags: new Set(["-e", "-A", "-B", "-C", "-m"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "egrep",
-      {
-        argConsumingFlags: new Set(["-e", "-A", "-B", "-C", "-m"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "fgrep",
-      {
-        argConsumingFlags: new Set(["-e", "-A", "-B", "-C", "-m"]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "rg",
-      {
-        argConsumingFlags: new Set([
-          "-e",
-          "-A",
-          "-B",
-          "-C",
-          "-m",
-          "-g",
-          "-t",
-          "-T",
-          "-j",
-          "-M",
-          "-r",
-          "-E",
-        ]),
-        fileConsumingFlags: new Set(["-f"]),
-      },
-    ],
-    [
-      "sd",
-      {
-        argConsumingFlags: new Set(["-n", "-f"]),
-        fileConsumingFlags: new Set([]),
-        patternPositionals: 2,
-      },
-    ],
-  ]);
-/** Node types that represent argument values in the AST. */
-const ARG_NODE_TYPES = new Set([
-  "word",
-  "concatenation",
-  "string",
-  "raw_string",
-]);
-/**
- * Extract the command name from a `command` node.
- * Returns the basename (e.g. `/usr/bin/sed` → `sed`), or undefined
- * if the command name cannot be determined (e.g. variable expansion).
- */
-function extractCommandName(node: TSNode): string | undefined {
-  for (let i = 0; i < node.childCount; i++) {
-    const child = node.child(i);
-    if (!child) continue;
-    if (child.type === "command_name") {
-      const text = resolveNodeText(child);
-      return text ? basename(text) : undefined;
-    }
-  }
-  return undefined;
-}
-/**
- * Describes what the walker should do when it encounters a flag word inside
- * a pattern-first command.  Using a discriminated union lets the `switch` in
- * `collectPatternCommandTokens` narrow `nextArgAction` without a non-null
- * assertion (which would trigger the Biome/ESLint assertion conflict).
- */
-type PatternCommandFlagDirective =
-  | { kind: "end-of-flags" }
-  | { kind: "regular-flag" }
-  | {
-      kind: "consume-arg";
-      nextArgAction: "skip" | "extract";
-      setsExplicitScript: boolean;
-    };
-/**
- * Classify a flag word from a pattern-first command into a directive that
- * tells the walker how to handle the flag and its following argument.
- */
-function classifyPatternCommandFlag(
-  text: string,
-  config: PatternCommandConfig,
-): PatternCommandFlagDirective {
-  if (text === "--") return { kind: "end-of-flags" };
-  if (config.argConsumingFlags.has(text)) {
-    return {
-      kind: "consume-arg",
-      nextArgAction: "skip",
-      setsExplicitScript: text === "-e" || text === "-f",
-    };
-  }
-  if (config.fileConsumingFlags.has(text)) {
-    return {
-      kind: "consume-arg",
-      nextArgAction: "extract",
-      setsExplicitScript: true,
-    };
-  }
-  return { kind: "regular-flag" };
-}
-/**
- * Collect path-candidate tokens from a command known to have
- * pattern/script arguments in leading positional slots.
- *
- * Uses position-based skipping: the first N positional arguments
- * (where N = patternPositionals, default 1) are assumed to be
- * inline patterns/scripts and are skipped. Remaining positional
- * arguments are collected as path candidates.
- *
- * Flags listed in `argConsumingFlags` consume the next argument
- * (skipped). Flags in `fileConsumingFlags` consume the next
- * argument as a file path (collected). The flags `-e` and `-f`
- * additionally signal that an explicit script was provided via
- * flag, so no inline positional script is expected.
- */
-function collectPatternCommandTokens(
-  node: TSNode,
-  config: PatternCommandConfig,
-): string[] {
-  const patternPositionals = config.patternPositionals ?? 1;
-  let hasExplicitScript = false;
-  let positionalsSeen = 0;
-  let nextArgAction: "skip" | "extract" | null = null;
-  let pastEndOfFlags = false;
-  const tokens: string[] = [];
-  for (let i = 0; i < node.childCount; i++) {
-    const child = node.child(i);
-    if (!child) continue;
-    // Skip command_name and variable_assignment nodes.
-    if (child.type === "command_name" || child.type === "variable_assignment")
-      continue;
-    // Only process argument-like nodes; recurse into others
-    // (e.g. command_substitution) for nested commands.
-    if (!ARG_NODE_TYPES.has(child.type)) {
-      tokens.push(...collectPathCandidateTokens(child));
-      continue;
-    }
-    const text = resolveNodeText(child);
-    // Handle consumed argument from previous flag.
-    if (nextArgAction === "skip") {
-      nextArgAction = null;
-      continue;
-    }
-    if (nextArgAction === "extract") {
-      tokens.push(text);
-      nextArgAction = null;
-      continue;
-    }
-    // Flag detection (only before "--" end-of-flags marker).
-    if (
-      !pastEndOfFlags &&
-      child.type === "word" &&
-      text.startsWith("-") &&
-      text.length > 1
-    ) {
-      const directive = classifyPatternCommandFlag(text, config);
-      switch (directive.kind) {
-        case "end-of-flags":
-          pastEndOfFlags = true;
-          break;
-        case "consume-arg":
-          nextArgAction = directive.nextArgAction;
-          if (directive.setsExplicitScript) hasExplicitScript = true;
-          break;
-        case "regular-flag":
-          break;
-      }
-      continue;
-    }
-    // Positional argument.
-    if (!hasExplicitScript && positionalsSeen < patternPositionals) {
-      positionalsSeen++;
-      continue; // Skip: this is an inline pattern/script.
-    }
-    // File argument — collect as path candidate.
-    tokens.push(text);
-  }
-  return tokens;
-}
-/**
- * Collect all argument tokens from a generic (non-pattern-first) command node,
- * skipping the command name and variable assignments.
- */
-function collectGenericCommandTokens(node: TSNode): string[] {
-  const tokens: string[] = [];
-  let seenCommandName = false;
-  for (let i = 0; i < node.childCount; i++) {
-    const child = node.child(i);
-    if (!child) continue;
-    if (child.type === "command_name") {
-      seenCommandName = true;
-      continue;
-    }
-    // Skip variable_assignment nodes (FOO=/bar)
-    if (child.type === "variable_assignment") continue;
-    // If there was no explicit command_name node, the first word-like
-    // child is the command name itself — skip it.
-    if (!seenCommandName && ARG_NODE_TYPES.has(child.type)) {
-      seenCommandName = true;
-      continue;
-    }
-    // Argument nodes: resolve their text and collect.
-    if (ARG_NODE_TYPES.has(child.type)) {
-      tokens.push(resolveNodeText(child));
-      continue;
-    }
-    // Recurse into other children (e.g. command_substitution nested in args)
-    tokens.push(...collectPathCandidateTokens(child));
-  }
-  return tokens;
-}
-/**
- * Collect redirect-destination tokens from a `file_redirect` node.
- */
-function collectRedirectTokens(node: TSNode): string[] {
-  const tokens: string[] = [];
-  for (let i = 0; i < node.childCount; i++) {
-    const child = node.child(i);
-    if (!child) continue;
-    if (ARG_NODE_TYPES.has(child.type)) {
-      tokens.push(resolveNodeText(child));
-    }
-  }
-  return tokens;
-}
-/**
- * Select the collection strategy for a `command` node: pattern-first
- * commands use `collectPatternCommandTokens`; all others use
- * `collectGenericCommandTokens`.
- */
-function collectCommandTokens(node: TSNode): string[] {
-  const commandName = extractCommandName(node);
-  const config = commandName
-    ? PATTERN_FIRST_COMMANDS.get(commandName)
-    : undefined;
-  return config
-    ? collectPatternCommandTokens(node, config)
-    : collectGenericCommandTokens(node);
-}
-/**
- * Recursively visit the AST and collect resolved text of nodes that
- * represent command arguments or redirect destinations.
- *
- * Skips `heredoc_body`, `heredoc_end`, and `comment` subtrees entirely.
- *
- * For commands in `PATTERN_FIRST_COMMANDS`, uses position-based
- * argument skipping to avoid collecting inline patterns/scripts
- * as path candidates. For all other commands, collects all
- * arguments generically.
- */
-function collectPathCandidateTokens(node: TSNode): string[] {
-  if (SKIP_SUBTREE_TYPES.has(node.type)) return [];
-  if (node.type === "command") return collectCommandTokens(node);
-  if (node.type === "file_redirect") return collectRedirectTokens(node);
-  const tokens: string[] = [];
-  for (let i = 0; i < node.childCount; i++) {
-    const child = node.child(i);
-    if (child) tokens.push(...collectPathCandidateTokens(child));
-  }
-  return tokens;
-}
-// Token classification is delegated to bash-token-classification.ts,
-// which exports classifyTokenAsPathCandidate and classifyTokenAsRuleCandidate
-// with a shared rejectNonPathToken predicate eliminating the prior clone.
-// ── Leading cd detection ───────────────────────────────────────────────────
-/**
- * Walk down from the root to find the first `command` node in the program.
- *
- * Only descends into `program` and `list` nodes — subshells, pipelines, and
- * other compound statements are ignored because a `cd` inside them does not
- * affect the outer shell's working directory.
- */
-function findFirstCommand(node: TSNode): TSNode | null {
-  if (node.type === "command") return node;
-  if (node.type === "program" || node.type === "list") {
-    const firstChild = node.child(0);
-    if (firstChild) return findFirstCommand(firstChild);
-  }
-  return null;
-}
-/**
- * Extract the target directory of a leading `cd` command from the parsed AST.
- *
- * When a bash command begins with `cd <dir> && …`, the shell resolves
- * subsequent relative paths against `<dir>`, not the original working
- * directory.  The external-directory guard must do the same, otherwise a
- * path that the shell keeps inside the working directory can appear to
- * escape it and trigger a spurious permission prompt.
- *
- * Returns `undefined` when the first command is not `cd`, or when the
- * target cannot be meaningfully resolved (`cd -`, bare `cd`, or `cd ~…`).
- */
-function extractLeadingCdTarget(rootNode: TSNode): string | undefined {
-  const firstCmd = findFirstCommand(rootNode);
-  if (!firstCmd) return undefined;
-  const cmdName = extractCommandName(firstCmd);
-  if (cmdName !== "cd") return undefined;
-  for (let i = 0; i < firstCmd.childCount; i++) {
-    const child = firstCmd.child(i);
-    if (!child) continue;
-    if (child.type === "command_name" || child.type === "variable_assignment")
-      continue;
-    if (!ARG_NODE_TYPES.has(child.type)) continue;
-    const text = resolveNodeText(child);
-    // Skip `--` (end-of-flags marker)
-    if (text === "--") continue;
-    // `cd -` jumps to $OLDPWD; `cd ~…` is home-relative — neither can be
-    // resolved against the working directory.
-    if (text === "-" || text.startsWith("~")) return undefined;
-    return text;
-  }
-  return undefined;
-}
-/**
- * Compute the effective base directory for resolving relative path candidates.
- *
- * When the leading `cd` target stays within the working directory, subsequent
- * relative paths should be resolved against it.  An escaping target is itself
- * an external access (reported via its own candidate token) and must never
- * silence checks on subsequent paths, so the function falls back to `cwd`.
- */
-function computeEffectiveResolveBase(
-  cdTarget: string | undefined,
-  cwd: string,
-): string {
-  if (cdTarget === undefined) return cwd;
-  const resolved = resolve(cwd, cdTarget);
-  const normalizedCwd = resolve(cwd);
-  return isPathWithinDirectory(resolved, normalizedCwd) ? resolved : cwd;
-}
-// ── Public extractors ──────────────────────────────────────────────────────
-/**
- * Extracts paths from a bash command string that resolve outside CWD.
- * Uses tree-sitter-bash to parse the command into a full AST, then walks
- * command argument and redirect-destination nodes.  Heredoc bodies, comments,
- * and other non-argument content are skipped, eliminating false positives.
- *
- * When the command begins with `cd <dir> && …`, relative candidate paths are
- * resolved against `<dir>` (if it stays within CWD) rather than CWD itself,
- * mirroring how the shell would resolve them.
+ * Thin facade over {@link BashProgram.externalPaths}; parses the command and
+ * returns the cd-aware external paths. See `BashProgram` for the parsing and
+ * resolution semantics.
  */
 export async function extractExternalPathsFromBashCommand(
   command: string,
   cwd: string,
 ): Promise<string[]> {
-  const parser = await getParser();
-  const tree = parser.parse(command);
-  if (!tree) return [];
-  let cdTarget: string | undefined;
-  let tokens: string[] = [];
-  try {
-    cdTarget = extractLeadingCdTarget(tree.rootNode);
-    tokens = collectPathCandidateTokens(tree.rootNode);
-  } finally {
-    tree.delete();
-  }
-  const resolveBase = computeEffectiveResolveBase(cdTarget, cwd);
-  const normalizedCwd = normalizePathForComparison(cwd, cwd);
-  const seen = new Set<string>();
-  const externalPaths: string[] = [];
-  for (const token of tokens) {
-    const candidate = classifyTokenAsPathCandidate(token);
-    if (!candidate) continue;
-    const normalized = normalizePathForComparison(candidate, resolveBase);
-    if (!normalized) continue;
-    if (
-      normalizedCwd !== "" &&
-      !isSafeSystemPath(normalized) &&
-      !isPathWithinDirectory(normalized, normalizedCwd) &&
-      !seen.has(normalized)
-    ) {
-      seen.add(normalized);
-      externalPaths.push(normalized);
-    }
-  }
-  return externalPaths;
+  return (await BashProgram.parse(command)).externalPaths(cwd);
 }
 /**
- * Extract tokens from a bash command that may be file paths, using a broader
+ * Extract tokens from a bash command that may be file paths, using the broader
  * filter suitable for cross-cutting `path` permission rules.
  *
- * Unlike `extractExternalPathsFromBashCommand`, this function:
- * - Accepts relative paths (`.env`, `src/foo.ts`, `./build`)
- * - Does NOT filter by CWD — returns raw tokens for rule evaluation
- * - Returns deduplicated tokens
+ * Thin facade over {@link BashProgram.pathTokens}.
  */
 export async function extractTokensForPathRules(
   command: string,
 ): Promise<string[]> {
-  const parser = await getParser();
-  const tree = parser.parse(command);
-  if (!tree) return [];
-  let tokens: string[] = [];
-  try {
-    tokens = collectPathCandidateTokens(tree.rootNode);
-  } finally {
-    tree.delete();
-  }
-  const seen = new Set<string>();
-  const result: string[] = [];
-  for (const token of tokens) {
-    const candidate = classifyTokenAsRuleCandidate(token);
-    if (!candidate) continue;
-    if (!seen.has(candidate)) {
-      seen.add(candidate);
-      result.push(candidate);
-    }
-  }
-  return result;
+  return (await BashProgram.parse(command)).pathTokens();
 }

package/src/handlers/gates/bash-path.ts CHANGED Viewed

@@ -4,6 +4,7 @@ import { SessionApproval } from "#src/session-approval";
 import { deriveApprovalPattern } from "#src/session-rules";
 import type { PermissionCheckResult } from "#src/types";
 import { extractTokensForPathRules } from "./bash-path-extractor";
+import { pickMostRestrictive } from "./candidate-check";
 import type { GateResult } from "./descriptor";
 import { formatPathAskPrompt } from "./path";
 import type { ToolCallContext } from "./types";
@@ -45,8 +46,9 @@ export async function describeBashPathGate(
   // Check each token against path rules with session rules appended.
   const sessionRules = getSessionRuleset();
-  let worstCheck: PermissionCheckResult | null = null;
-  let worstToken: string | null = null;
+  // Tokens whose resolved state needs a check (deny/ask), paired with the
+  // token that produced them so the descriptor can derive its pattern.
+  const uncovered: Array<{ token: string; check: PermissionCheckResult }> = [];
   let allSessionCovered = true;
   for (const token of tokens) {
@@ -70,13 +72,11 @@ export async function describeBashPathGate(
     }
     if (check.state === "deny") {
-      worstCheck = check;
-      worstToken = token;
+      uncovered.push({ token, check });
       break; // Short-circuit on deny.
     }
-    if (check.state === "ask" && worstCheck?.state !== "ask") {
-      worstCheck = check;
-      worstToken = token;
+    if (check.state === "ask") {
+      uncovered.push({ token, check });
     }
   }
@@ -99,6 +99,12 @@ export async function describeBashPathGate(
     };
   }
+  // Pick the most restrictive (deny > ask > allow, first-wins) uncovered token.
+  const worstCheck = pickMostRestrictive(uncovered.map(({ check }) => check));
+  const worstToken = worstCheck
+    ? (uncovered.find(({ check }) => check === worstCheck)?.token ?? null)
+    : null;
   // All tokens evaluate to allow — no restriction.
   if (!worstCheck || !worstToken) return null;