@cdot65/prisma-airs 0.1.4 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,296 @@
1
+ /**
2
+ * Tests for prisma-airs-outbound hook handler
3
+ */
4
+
5
+ import { describe, it, expect, vi, beforeEach, afterEach } from "vitest";
6
+ import handler from "./handler";
7
+
8
+ // Mock the scanner module
9
+ vi.mock("../../src/scanner", () => ({
10
+ scan: vi.fn(),
11
+ }));
12
+
13
+ import { scan } from "../../src/scanner";
14
+ const mockScan = vi.mocked(scan);
15
+
16
+ describe("prisma-airs-outbound handler", () => {
17
+ beforeEach(() => {
18
+ vi.clearAllMocks();
19
+ // Suppress console output during tests
20
+ vi.spyOn(console, "log").mockImplementation(() => {});
21
+ vi.spyOn(console, "error").mockImplementation(() => {});
22
+ });
23
+
24
+ afterEach(() => {
25
+ vi.restoreAllMocks();
26
+ });
27
+
28
+ const baseEvent = {
29
+ content: "This is a test response",
30
+ to: "user@example.com",
31
+ channel: "slack",
32
+ metadata: {
33
+ sessionKey: "test-session",
34
+ },
35
+ };
36
+
37
+ const baseCtx = {
38
+ channelId: "slack",
39
+ conversationId: "conv-123",
40
+ cfg: {
41
+ plugins: {
42
+ entries: {
43
+ "prisma-airs": {
44
+ config: {
45
+ outbound_scanning_enabled: true,
46
+ profile_name: "default",
47
+ app_name: "test-app",
48
+ fail_closed: true,
49
+ dlp_mask_only: true,
50
+ },
51
+ },
52
+ },
53
+ },
54
+ },
55
+ };
56
+
57
+ describe("allow action", () => {
58
+ it("should return undefined for allowed responses", async () => {
59
+ mockScan.mockResolvedValue({
60
+ action: "allow",
61
+ severity: "SAFE",
62
+ categories: ["safe"],
63
+ scanId: "scan_123",
64
+ reportId: "report_456",
65
+ profileName: "default",
66
+ promptDetected: { injection: false, dlp: false, urlCats: false },
67
+ responseDetected: { dlp: false, urlCats: false },
68
+ latencyMs: 50,
69
+ });
70
+
71
+ const result = await handler(baseEvent, baseCtx);
72
+ expect(result).toBeUndefined();
73
+ });
74
+ });
75
+
76
+ describe("warn action", () => {
77
+ it("should allow through with warning logged", async () => {
78
+ mockScan.mockResolvedValue({
79
+ action: "warn",
80
+ severity: "MEDIUM",
81
+ categories: ["url_filtering_response"],
82
+ scanId: "scan_123",
83
+ reportId: "report_456",
84
+ profileName: "default",
85
+ promptDetected: { injection: false, dlp: false, urlCats: false },
86
+ responseDetected: { dlp: false, urlCats: true },
87
+ latencyMs: 50,
88
+ });
89
+
90
+ const result = await handler(baseEvent, baseCtx);
91
+ expect(result).toBeUndefined();
92
+ expect(console.log).toHaveBeenCalled();
93
+ });
94
+ });
95
+
96
+ describe("block action - DLP masking", () => {
97
+ it("should mask SSN in response", async () => {
98
+ mockScan.mockResolvedValue({
99
+ action: "block",
100
+ severity: "HIGH",
101
+ categories: ["dlp_response"],
102
+ scanId: "scan_123",
103
+ reportId: "report_456",
104
+ profileName: "default",
105
+ promptDetected: { injection: false, dlp: false, urlCats: false },
106
+ responseDetected: { dlp: true, urlCats: false },
107
+ latencyMs: 50,
108
+ });
109
+
110
+ const eventWithSSN = {
111
+ ...baseEvent,
112
+ content: "Your SSN is 123-45-6789",
113
+ };
114
+
115
+ const result = await handler(eventWithSSN, baseCtx);
116
+ expect(result?.content).toContain("[SSN REDACTED]");
117
+ expect(result?.content).not.toContain("123-45-6789");
118
+ });
119
+
120
+ it("should mask credit card numbers", async () => {
121
+ mockScan.mockResolvedValue({
122
+ action: "block",
123
+ severity: "HIGH",
124
+ categories: ["dlp_response"],
125
+ scanId: "scan_123",
126
+ reportId: "report_456",
127
+ profileName: "default",
128
+ promptDetected: { injection: false, dlp: false, urlCats: false },
129
+ responseDetected: { dlp: true, urlCats: false },
130
+ latencyMs: 50,
131
+ });
132
+
133
+ const eventWithCard = {
134
+ ...baseEvent,
135
+ content: "Your card number is 4111-1111-1111-1111",
136
+ };
137
+
138
+ const result = await handler(eventWithCard, baseCtx);
139
+ expect(result?.content).toContain("[CARD REDACTED]");
140
+ });
141
+
142
+ it("should mask email addresses", async () => {
143
+ mockScan.mockResolvedValue({
144
+ action: "block",
145
+ severity: "HIGH",
146
+ categories: ["dlp_response"],
147
+ scanId: "scan_123",
148
+ reportId: "report_456",
149
+ profileName: "default",
150
+ promptDetected: { injection: false, dlp: false, urlCats: false },
151
+ responseDetected: { dlp: true, urlCats: false },
152
+ latencyMs: 50,
153
+ });
154
+
155
+ const eventWithEmail = {
156
+ ...baseEvent,
157
+ content: "Contact us at secret@company.com",
158
+ };
159
+
160
+ const result = await handler(eventWithEmail, baseCtx);
161
+ expect(result?.content).toContain("[EMAIL REDACTED]");
162
+ });
163
+ });
164
+
165
+ describe("block action - full block", () => {
166
+ it("should block responses with malicious code", async () => {
167
+ mockScan.mockResolvedValue({
168
+ action: "block",
169
+ severity: "CRITICAL",
170
+ categories: ["malicious_code"],
171
+ scanId: "scan_123",
172
+ reportId: "report_456",
173
+ profileName: "default",
174
+ promptDetected: { injection: false, dlp: false, urlCats: false },
175
+ responseDetected: { dlp: false, urlCats: false },
176
+ latencyMs: 50,
177
+ });
178
+
179
+ const result = await handler(baseEvent, baseCtx);
180
+ expect(result?.content).toContain("security policy");
181
+ expect(result?.content).toContain("malicious code");
182
+ });
183
+
184
+ it("should block responses with toxicity", async () => {
185
+ mockScan.mockResolvedValue({
186
+ action: "block",
187
+ severity: "HIGH",
188
+ categories: ["toxicity"],
189
+ scanId: "scan_123",
190
+ reportId: "report_456",
191
+ profileName: "default",
192
+ promptDetected: { injection: false, dlp: false, urlCats: false },
193
+ responseDetected: { dlp: false, urlCats: false },
194
+ latencyMs: 50,
195
+ });
196
+
197
+ const result = await handler(baseEvent, baseCtx);
198
+ expect(result?.content).toContain("security policy");
199
+ });
200
+
201
+ it("should block even DLP violations when combined with other threats", async () => {
202
+ mockScan.mockResolvedValue({
203
+ action: "block",
204
+ severity: "CRITICAL",
205
+ categories: ["dlp_response", "malicious_code"],
206
+ scanId: "scan_123",
207
+ reportId: "report_456",
208
+ profileName: "default",
209
+ promptDetected: { injection: false, dlp: false, urlCats: false },
210
+ responseDetected: { dlp: true, urlCats: false },
211
+ latencyMs: 50,
212
+ });
213
+
214
+ const eventWithSSN = {
215
+ ...baseEvent,
216
+ content: "Your SSN is 123-45-6789",
217
+ };
218
+
219
+ const result = await handler(eventWithSSN, baseCtx);
220
+ // Should be a full block, not masking
221
+ expect(result?.content).toContain("security policy");
222
+ expect(result?.content).not.toContain("[SSN REDACTED]");
223
+ });
224
+ });
225
+
226
+ describe("fail-closed behavior", () => {
227
+ it("should block on scan failure when fail_closed is true", async () => {
228
+ mockScan.mockRejectedValue(new Error("API timeout"));
229
+
230
+ const result = await handler(baseEvent, baseCtx);
231
+ expect(result?.content).toContain("security verification issue");
232
+ });
233
+
234
+ it("should allow through on scan failure when fail_closed is false", async () => {
235
+ mockScan.mockRejectedValue(new Error("API timeout"));
236
+
237
+ const ctxFailOpen = {
238
+ ...baseCtx,
239
+ cfg: {
240
+ plugins: {
241
+ entries: {
242
+ "prisma-airs": {
243
+ config: {
244
+ ...baseCtx.cfg?.plugins?.entries?.["prisma-airs"]?.config,
245
+ fail_closed: false,
246
+ },
247
+ },
248
+ },
249
+ },
250
+ },
251
+ };
252
+
253
+ const result = await handler(baseEvent, ctxFailOpen);
254
+ expect(result).toBeUndefined();
255
+ });
256
+ });
257
+
258
+ describe("disabled scanning", () => {
259
+ it("should skip scanning when disabled", async () => {
260
+ const ctxDisabled = {
261
+ ...baseCtx,
262
+ cfg: {
263
+ plugins: {
264
+ entries: {
265
+ "prisma-airs": {
266
+ config: {
267
+ outbound_scanning_enabled: false,
268
+ },
269
+ },
270
+ },
271
+ },
272
+ },
273
+ };
274
+
275
+ const result = await handler(baseEvent, ctxDisabled);
276
+ expect(result).toBeUndefined();
277
+ expect(mockScan).not.toHaveBeenCalled();
278
+ });
279
+ });
280
+
281
+ describe("empty content", () => {
282
+ it("should skip empty content", async () => {
283
+ const emptyEvent = { ...baseEvent, content: "" };
284
+ const result = await handler(emptyEvent, baseCtx);
285
+ expect(result).toBeUndefined();
286
+ expect(mockScan).not.toHaveBeenCalled();
287
+ });
288
+
289
+ it("should skip undefined content", async () => {
290
+ const noContentEvent = { ...baseEvent, content: undefined };
291
+ const result = await handler(noContentEvent, baseCtx);
292
+ expect(result).toBeUndefined();
293
+ expect(mockScan).not.toHaveBeenCalled();
294
+ });
295
+ });
296
+ });
@@ -0,0 +1,341 @@
1
+ /**
2
+ * Prisma AIRS Outbound Security Scanner (message_sending)
3
+ *
4
+ * Scans ALL outbound responses for:
5
+ * - WildFire: malicious URLs and content
6
+ * - Toxicity: harmful/abusive content
7
+ * - URL Filtering: disallowed URL categories
8
+ * - DLP: sensitive data leakage
9
+ * - Malicious Code: malware/exploits
10
+ * - Custom Topics: org-specific policy violations
11
+ * - Grounding: hallucination detection
12
+ *
13
+ * CAN BLOCK via { cancel: true } or modify via { content: "..." }
14
+ */
15
+
16
+ import { scan, type ScanResult } from "../../src/scanner";
17
+
18
// Event shape from OpenClaw message_sending hook
interface MessageSendingEvent {
  content?: string; // outbound message text — the only field this handler scans
  to?: string; // recipient identifier
  channel?: string; // delivery channel name, e.g. "slack"
  metadata?: {
    sessionKey?: string; // preferred session identifier for log correlation
    messageId?: string;
  };
}

// Context passed to hook
interface HookContext {
  channelId?: string;
  accountId?: string;
  conversationId?: string; // fallback session identifier when metadata.sessionKey is absent
  cfg?: PluginConfig; // full plugin configuration tree (see PluginConfig)
}

// Plugin config structure
interface PluginConfig {
  plugins?: {
    entries?: {
      "prisma-airs"?: {
        config?: {
          outbound_scanning_enabled?: boolean; // scanning is on unless this is explicitly false
          profile_name?: string; // AIRS scan profile (defaults to "default")
          app_name?: string; // app name reported to the scanner (defaults to "openclaw")
          fail_closed?: boolean; // block on scan failure (defaults to true)
          dlp_mask_only?: boolean; // mask DLP-only hits instead of blocking (defaults to true)
        };
      };
    };
  };
}

// Hook result type - can modify content or cancel
interface HookResult {
  content?: string; // replacement text for the outbound message
  cancel?: boolean; // cancel the send outright (part of the hook contract; this handler never sets it)
}
59
+
60
// Map AIRS categories to user-friendly messages.
// Categories not listed here fall back to the raw name with underscores
// replaced by spaces (see buildBlockMessage).
const CATEGORY_MESSAGES: Record<string, string> = {
  // Core detections
  prompt_injection: "prompt injection attempt",
  dlp_prompt: "sensitive data in input",
  dlp_response: "sensitive data leakage",
  url_filtering_prompt: "disallowed URL in input",
  url_filtering_response: "disallowed URL in response",
  malicious_url: "malicious URL detected",
  toxicity: "inappropriate content",
  toxic_content: "inappropriate content",
  malicious_code: "malicious code detected",
  agent_threat: "AI agent threat",
  grounding: "response grounding violation",
  ungrounded: "ungrounded response",
  custom_topic: "policy violation",
  topic_violation: "policy violation",
  db_security: "database security threat",
  safe: "safe", // entries mapping to "safe" are filtered out of block messages
  benign: "safe",
  api_error: "security scan error",
  "scan-failure": "security scan failed",
};

// Categories that can be masked instead of blocked
const MASKABLE_CATEGORIES = ["dlp_response", "dlp_prompt", "dlp"];

// Categories that always require full block
// (any one of these present overrides DLP mask-only handling)
const ALWAYS_BLOCK_CATEGORIES = [
  "malicious_code",
  "malicious_url",
  "toxicity",
  "toxic_content",
  "agent_threat",
  "prompt_injection",
  "db_security",
  "scan-failure",
];
98
+
99
+ /**
100
+ * Get plugin configuration
101
+ */
102
+ function getPluginConfig(ctx: HookContext): {
103
+ enabled: boolean;
104
+ profileName: string;
105
+ appName: string;
106
+ failClosed: boolean;
107
+ dlpMaskOnly: boolean;
108
+ } {
109
+ const cfg = ctx.cfg?.plugins?.entries?.["prisma-airs"]?.config;
110
+ return {
111
+ enabled: cfg?.outbound_scanning_enabled !== false,
112
+ profileName: cfg?.profile_name ?? "default",
113
+ appName: cfg?.app_name ?? "openclaw",
114
+ failClosed: cfg?.fail_closed ?? true, // Default fail-closed
115
+ dlpMaskOnly: cfg?.dlp_mask_only ?? true, // Default mask instead of block for DLP
116
+ };
117
+ }
118
+
119
+ /**
120
+ * Mask sensitive data in content
121
+ *
122
+ * Uses regex patterns for common PII types.
123
+ * TODO: Use AIRS API match offsets for precision masking when available.
124
+ */
125
+ function maskSensitiveData(content: string): string {
126
+ let masked = content;
127
+
128
+ // Social Security Numbers (XXX-XX-XXXX)
129
+ masked = masked.replace(/\b\d{3}-\d{2}-\d{4}\b/g, "[SSN REDACTED]");
130
+
131
+ // Credit Card Numbers (with or without spaces/dashes)
132
+ masked = masked.replace(/\b(?:\d{4}[-\s]?){3}\d{4}\b/g, "[CARD REDACTED]");
133
+
134
+ // Email addresses
135
+ masked = masked.replace(
136
+ /\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b/g,
137
+ "[EMAIL REDACTED]"
138
+ );
139
+
140
+ // API keys and tokens (common patterns)
141
+ masked = masked.replace(
142
+ /\b(?:sk-|pk-|api[_-]?key[_-]?|token[_-]?|secret[_-]?|password[_-]?)[a-zA-Z0-9_-]{16,}\b/gi,
143
+ "[API KEY REDACTED]"
144
+ );
145
+
146
+ // AWS keys
147
+ masked = masked.replace(/\b(?:AKIA|ABIA|ACCA|ASIA)[A-Z0-9]{16}\b/g, "[AWS KEY REDACTED]");
148
+
149
+ // Generic long alphanumeric strings that look like secrets (40+ chars)
150
+ masked = masked.replace(/\b[a-zA-Z0-9_-]{40,}\b/g, (match) => {
151
+ // Only redact if it looks like a key (has mixed case or numbers)
152
+ if (/[a-z]/.test(match) && /[A-Z]/.test(match) && /[0-9]/.test(match)) {
153
+ return "[SECRET REDACTED]";
154
+ }
155
+ return match;
156
+ });
157
+
158
+ // US Phone numbers
159
+ masked = masked.replace(
160
+ /\b(?:\+1[-.\s]?)?\(?\d{3}\)?[-.\s]?\d{3}[-.\s]?\d{4}\b/g,
161
+ "[PHONE REDACTED]"
162
+ );
163
+
164
+ // IP addresses (private ranges especially)
165
+ masked = masked.replace(
166
+ /\b(?:10\.\d{1,3}\.\d{1,3}\.\d{1,3}|172\.(?:1[6-9]|2\d|3[01])\.\d{1,3}\.\d{1,3}|192\.168\.\d{1,3}\.\d{1,3})\b/g,
167
+ "[IP REDACTED]"
168
+ );
169
+
170
+ return masked;
171
+ }
172
+
173
+ /**
174
+ * Build user-friendly block message
175
+ */
176
+ function buildBlockMessage(result: ScanResult): string {
177
+ const reasons = result.categories
178
+ .map((cat) => CATEGORY_MESSAGES[cat] || cat.replace(/_/g, " "))
179
+ .filter((r) => r !== "safe")
180
+ .join(", ");
181
+
182
+ return (
183
+ `I apologize, but I'm unable to provide that response due to security policy` +
184
+ (reasons ? ` (${reasons})` : "") +
185
+ `. Please rephrase your request or contact support if you believe this is an error.`
186
+ );
187
+ }
188
+
189
+ /**
190
+ * Determine if result should be masked vs blocked
191
+ */
192
+ function shouldMaskOnly(result: ScanResult, config: { dlpMaskOnly: boolean }): boolean {
193
+ if (!config.dlpMaskOnly) return false;
194
+
195
+ // Check if any always-block categories are present
196
+ const hasBlockingCategory = result.categories.some((cat) =>
197
+ ALWAYS_BLOCK_CATEGORIES.includes(cat)
198
+ );
199
+ if (hasBlockingCategory) return false;
200
+
201
+ // Check if all categories are maskable
202
+ const allMaskable = result.categories.every(
203
+ (cat) => MASKABLE_CATEGORIES.includes(cat) || cat === "safe" || cat === "benign"
204
+ );
205
+
206
+ return allMaskable;
207
+ }
208
+
209
+ /**
210
+ * Main hook handler
211
+ */
212
+ const handler = async (
213
+ event: MessageSendingEvent,
214
+ ctx: HookContext
215
+ ): Promise<HookResult | void> => {
216
+ const config = getPluginConfig(ctx);
217
+
218
+ // Check if outbound scanning is enabled
219
+ if (!config.enabled) {
220
+ return;
221
+ }
222
+
223
+ // Validate we have content to scan
224
+ const content = event.content;
225
+ if (!content || typeof content !== "string" || content.trim().length === 0) {
226
+ return;
227
+ }
228
+
229
+ const sessionKey = event.metadata?.sessionKey || ctx.conversationId || "unknown";
230
+
231
+ let result: ScanResult;
232
+
233
+ try {
234
+ // Scan the outbound response
235
+ result = await scan({
236
+ response: content,
237
+ profileName: config.profileName,
238
+ appName: config.appName,
239
+ });
240
+ } catch (err) {
241
+ console.error(
242
+ JSON.stringify({
243
+ event: "prisma_airs_outbound_scan_error",
244
+ timestamp: new Date().toISOString(),
245
+ sessionKey,
246
+ error: err instanceof Error ? err.message : String(err),
247
+ })
248
+ );
249
+
250
+ // Fail-closed: block on scan failure
251
+ if (config.failClosed) {
252
+ return {
253
+ content:
254
+ "I apologize, but I'm unable to provide a response at this time due to a security verification issue. Please try again.",
255
+ };
256
+ }
257
+
258
+ return; // Fail-open
259
+ }
260
+
261
+ // Log the scan result
262
+ console.log(
263
+ JSON.stringify({
264
+ event: "prisma_airs_outbound_scan",
265
+ timestamp: new Date().toISOString(),
266
+ sessionKey,
267
+ action: result.action,
268
+ severity: result.severity,
269
+ categories: result.categories,
270
+ scanId: result.scanId,
271
+ reportId: result.reportId,
272
+ latencyMs: result.latencyMs,
273
+ responseDetected: result.responseDetected,
274
+ })
275
+ );
276
+
277
+ // Handle allow - no modification needed
278
+ if (result.action === "allow") {
279
+ return;
280
+ }
281
+
282
+ // Handle warn - log but allow through
283
+ if (result.action === "warn") {
284
+ console.log(
285
+ JSON.stringify({
286
+ event: "prisma_airs_outbound_warn",
287
+ timestamp: new Date().toISOString(),
288
+ sessionKey,
289
+ severity: result.severity,
290
+ categories: result.categories,
291
+ scanId: result.scanId,
292
+ })
293
+ );
294
+ return; // Allow through with warning logged
295
+ }
296
+
297
+ // Handle block
298
+ if (result.action === "block") {
299
+ // Check if we should mask instead of block (DLP-only)
300
+ if (shouldMaskOnly(result, config)) {
301
+ const maskedContent = maskSensitiveData(content);
302
+
303
+ // Only return modified content if masking actually changed something
304
+ if (maskedContent !== content) {
305
+ console.log(
306
+ JSON.stringify({
307
+ event: "prisma_airs_outbound_mask",
308
+ timestamp: new Date().toISOString(),
309
+ sessionKey,
310
+ categories: result.categories,
311
+ scanId: result.scanId,
312
+ })
313
+ );
314
+
315
+ return {
316
+ content: maskedContent,
317
+ };
318
+ }
319
+ }
320
+
321
+ // Full block - replace content entirely
322
+ console.log(
323
+ JSON.stringify({
324
+ event: "prisma_airs_outbound_block",
325
+ timestamp: new Date().toISOString(),
326
+ sessionKey,
327
+ action: result.action,
328
+ severity: result.severity,
329
+ categories: result.categories,
330
+ scanId: result.scanId,
331
+ reportId: result.reportId,
332
+ })
333
+ );
334
+
335
+ return {
336
+ content: buildBlockMessage(result),
337
+ };
338
+ }
339
+ };
340
+
341
+ export default handler;
@@ -0,0 +1,40 @@
1
+ ---
2
+ name: prisma-airs-tools
3
+ description: "Block dangerous tool calls when security threats are detected"
4
+ metadata: { "openclaw": { "emoji": "🛑", "events": ["before_tool_call"] } }
5
+ ---
6
+
7
+ # Prisma AIRS Tool Gating
8
+
9
+ Blocks dangerous tool calls when security warnings are active from inbound scanning.
10
+
11
+ ## Behavior
12
+
13
+ This hook runs before each tool call and checks if the current session has an active security warning (from `message_received` or `before_agent_start` scanning). Based on the detected threat categories, it blocks specific tools that could be dangerous.
14
+
15
+ ## Tool Blocking Matrix
16
+
17
+ | Threat Category | Blocked Tools |
18
+ | ------------------------------- | ----------------------------- |
19
+ | `agent-threat` | ALL external tools |
20
+ | `sql-injection` / `db-security` | exec, database, query, sql |
21
+ | `malicious-code` | exec, write, edit, eval, bash |
22
+ | `prompt-injection` | exec, gateway, message, cron |
23
+ | `malicious-url` | web_fetch, browser, curl |
24
+
25
+ ## High-Risk Tools (Default)
26
+
27
+ These tools are blocked on ANY detected threat:
28
+
29
+ - `exec` - Command execution
30
+ - `Bash` - Shell access
31
+ - `write` - File writing
32
+ - `edit` - File editing
33
+ - `gateway` - Gateway operations
34
+ - `message` - Sending messages
35
+ - `cron` - Scheduled tasks
36
+
37
+ ## Configuration
38
+
39
+ - `tool_gating_enabled`: Enable/disable (default: true)
40
+ - `high_risk_tools`: List of tools to block on any threat