npm - watchmyagents - Versions diffs - 0.3.0 → 0.6.0 - Mend

watchmyagents 0.3.0 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

package/README.md +59 -9
package/SECURITY.md +9 -3
package/package.json +10 -4
package/scripts/anonymize.js +121 -0
package/scripts/fetch-anthropic.js +10 -0
package/scripts/inspect.js +14 -4
package/scripts/shield.js +164 -16
package/scripts/upload-fortress.js +222 -0
package/src/anonymizer.js +206 -0
package/src/fortress/url.js +59 -0
package/src/logger.js +11 -2
package/src/shield/policy.js +50 -7
package/src/shield/sources/fortress.js +203 -0

package/scripts/upload-fortress.js ADDED Viewed

@@ -0,0 +1,222 @@
+#!/usr/bin/env node
+// wma-upload-fortress — anonymize local Watch NDJSON and POST signals to
+// the Fortress ingest-signals Edge Function.
+//
+// Composable with the rest of the SDK:
+//   wma-fetch  →  ./watchmyagents-logs/<agent_id>/<date>.ndjson   (local capture)
+//   wma-anonymize  →  signals payload (Modèle C: no raw content)
+//   wma-upload-fortress  →  POST signals to https://<project>.supabase.co/functions/v1/ingest-signals
+//
+// Usage:
+//   wma-upload-fortress --agent-id agent_xxx \
+//                       [--log-dir ./watchmyagents-logs] \
+//                       [--fortress-url https://<project>.supabase.co/functions/v1/ingest-signals] \
+//                       [--api-key wma_...] \
+//                       [--salt <hex>] \
+//                       [--display-name "My agent"] \
+//                       [--dry-run]
+//
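+// Env vars (recommended over CLI flags, which end up in shell history):
+//   WMA_API_KEY            — the wma_xxx key from the Fortress dashboard
+//   WMA_FORTRESS_BASE_URL  — base URL of the Fortress functions, e.g.
+//                            https://<project>.supabase.co/functions/v1
+//   WMA_FORTRESS_URL       — legacy: full URL to the ingest-signals endpoint
+//   WMA_SIGNALS_SALT       — per-customer hex salt for IoC hashing
+//                            (must be stable across runs)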
+import { request as httpsRequest } from 'node:https';
+import { URL } from 'node:url';
+import { readdir, stat } from 'node:fs/promises';
+import { basename, join, resolve } from 'node:path';
+import { createReadStream } from 'node:fs';
+import { createInterface } from 'node:readline';
+import { SignalsAggregator } from '../src/anonymizer.js';
+import { resolveFortressBase, fortressEndpoint } from '../src/fortress/url.js';
+/**
+ * Minimal `--flag [value]` command-line parser.
+ *
+ * A token starting with `--` becomes a key (without the dashes). If the next
+ * token exists and does not itself start with `--`, it is consumed as the
+ * key's string value; otherwise the key is set to `true`. Tokens that are not
+ * flags and were not consumed as a value are ignored.
+ *
+ * @param {string[]} argv - arguments after the script name
+ * @returns {Object<string, string|true>} parsed flags
+ */
+function parseArgs(argv) {
+  const parsed = {};
+  let idx = 0;
+  while (idx < argv.length) {
+    const token = argv[idx];
+    idx += 1;
+    if (!token.startsWith('--')) continue;
+    const key = token.slice(2);
+    const candidate = argv[idx];
+    const hasValue = candidate != null && !candidate.startsWith('--');
+    if (hasValue) {
+      parsed[key] = candidate;
+      idx += 1; // the value token has been consumed
+    } else {
+      parsed[key] = true;
+    }
+  }
+  return parsed;
+}
+// Write `msg` (plus a newline) to stderr, then exit the process with `code`.
+function die(msg, code = 1) {
+  process.stderr.write(`${msg}\n`);
+  process.exit(code);
+}
+// Write a tool-prefixed progress line to stdout.
+function info(msg) {
+  const line = `[wma-upload-fortress] ${msg}\n`;
+  process.stdout.write(line);
+}
+// Write a tool-prefixed warning line to stderr.
+function warn(msg) {
+  const line = `[wma-upload-fortress] ⚠️  ${msg}\n`;
+  process.stderr.write(line);
+}
+/**
+ * Recursively collect the `.ndjson` files under `p`.
+ *
+ * Anything whose path *below `p`* contains `raw-` is skipped. The check is
+ * deliberately scoped to the part of the path under the scan root: testing the
+ * full absolute path would silently drop every file whenever an ancestor
+ * directory (e.g. the user's log dir) happens to contain `raw-` in its name.
+ * When `p` itself is a file, its own file name is checked.
+ *
+ * Directory entries are visited in sorted order so the result is deterministic
+ * across platforms (readdir order is unspecified) and date-named files are
+ * returned chronologically.
+ *
+ * @param {string} p - file or directory to scan
+ * @returns {Promise<string[]>} matching file paths; empty if `p` does not exist
+ */
+async function collectFiles(p) {
+  const walk = async (abs, rel) => {
+    const s = await stat(abs).catch(() => null);
+    if (!s) return [];
+    if (s.isFile()) {
+      const scoped = rel === '' ? basename(abs) : rel;
+      return abs.endsWith('.ndjson') && !scoped.includes('raw-') ? [abs] : [];
+    }
+    // Sockets, FIFOs, devices: nothing to read, and readdir() would throw.
+    if (!s.isDirectory()) return [];
+    const out = [];
+    for (const name of (await readdir(abs)).sort()) {
+      out.push(...(await walk(join(abs, name), join(rel, name))));
+    }
+    return out;
+  };
+  return walk(p, '');
+}
+/**
+ * POST a JSON body over HTTPS and resolve with the response.
+ *
+ * @param {string} url - absolute https:// URL; any other protocol is refused
+ * @param {object} headers - extra request headers (content-type and
+ *   content-length are always set by this function)
+ * @param {string} body - already-serialized JSON text
+ * @param {number} [timeoutMs=30000] - socket inactivity timeout; without one a
+ *   stalled endpoint would hang the CLI indefinitely
+ * @returns {Promise<{status: number, body: any}>} `body` is the parsed JSON
+ *   when the response parses to a non-null value, otherwise the raw text.
+ *   HTTP error statuses resolve normally. The promise rejects on an invalid
+ *   or non-https URL, on network errors, and on timeout.
+ */
+function postJson(url, headers, body, timeoutMs = 30000) {
+  return new Promise((resolveReq, rejectReq) => {
+    // An invalid URL throws here; inside the executor that becomes a rejection.
+    const u = new URL(url);
+    if (u.protocol !== 'https:') {
+      return rejectReq(new Error(`refusing non-https fortress URL: ${url}`));
+    }
+    const data = Buffer.from(body);
+    const req = httpsRequest(
+      {
+        method: 'POST',
+        hostname: u.hostname,
+        port: u.port || 443,
+        path: u.pathname + u.search,
+        headers: {
+          ...headers,
+          'content-type': 'application/json',
+          'content-length': data.length,
+        },
+        rejectUnauthorized: true,
+      },
+      (res) => {
+        const chunks = [];
+        res.on('data', (c) => chunks.push(c));
+        // A connection dropped mid-response must reject, not leave us pending.
+        res.on('error', rejectReq);
+        res.on('end', () => {
+          const raw = Buffer.concat(chunks).toString('utf8');
+          let parsed = null;
+          try { parsed = JSON.parse(raw); } catch { /* keep raw */ }
+          resolveReq({ status: res.statusCode || 0, body: parsed ?? raw });
+        });
+      }
+    );
+    // The timeout callback only signals inactivity; the request has to be
+    // destroyed explicitly, which surfaces the error through 'error' below.
+    req.setTimeout(timeoutMs, () => {
+      req.destroy(new Error(`fortress request timed out after ${timeoutMs} ms`));
+    });
+    req.on('error', rejectReq);
+    req.write(data);
+    req.end();
+  });
+}
+// Read a value-taking CLI flag: returns its string value, or undefined when the
+// flag is absent. parseArgs() stores `true` for a flag given without a value;
+// that is rejected here so it cannot slip past the validation in main() and
+// surface later as an opaque TypeError.
+function stringFlag(args, name) {
+  const value = args[name];
+  if (value === true) die(`error: --${name} requires a value`);
+  return value;
+}
+/**
+ * CLI entry point: validate the arguments, aggregate the agent's local NDJSON
+ * logs into a single anonymized signals payload, then either print it
+ * (--dry-run) or POST it to the Fortress ingest-signals endpoint.
+ * Exits the process with a non-zero code on any validation or upload failure.
+ */
+async function main() {
+  const args = parseArgs(process.argv.slice(2));
+  const agentId = stringFlag(args, 'agent-id');
+  const logDir = resolve(stringFlag(args, 'log-dir') || './watchmyagents-logs');
+  const apiKeyFlag = stringFlag(args, 'api-key');
+  const saltFlag = stringFlag(args, 'salt');
+  const apiKey = apiKeyFlag || process.env.WMA_API_KEY;
+  const salt = saltFlag || process.env.WMA_SIGNALS_SALT;
+  const displayName = stringFlag(args, 'display-name') || agentId;
+  const dryRun = !!args['dry-run'];
+  // Resolve Fortress base URL. Accepts:
+  //   --fortress-base-url <base>            (preferred CLI)
+  //   --fortress-url <full ingest-signals>  (legacy CLI)
+  //   WMA_FORTRESS_BASE_URL env             (preferred env)
+  //   WMA_FORTRESS_URL env                  (legacy env, points at ingest-signals)
+  const fortressBase = resolveFortressBase({
+    explicitBase: stringFlag(args, 'fortress-base-url'),
+    explicitUrl: stringFlag(args, 'fortress-url'),
+  });
+  const fortressUrl = fortressBase ? fortressEndpoint(fortressBase, 'ingest-signals') : null;
+  // Validation
+  if (!agentId) die('error: --agent-id required (Anthropic agent_id, e.g. agent_01XaN...)');
+  // Strict alphanumeric to prevent path traversal in collectFiles below
+  // (--agent-id ends up as a filesystem path segment).
+  if (!/^agent_[a-zA-Z0-9]+$/.test(agentId)) {
+    die(`error: --agent-id has invalid format (expected "agent_" + alphanumeric, got "${agentId}")`);
+  }
+  if (!dryRun && !fortressUrl) {
+    // Reached both when nothing is configured and when the legacy URL could
+    // not be parsed, so the message names every accepted source.
+    die('error: Fortress URL missing or unparseable. Set --fortress-base-url / WMA_FORTRESS_BASE_URL\n' +
+        '       (or legacy --fortress-url / WMA_FORTRESS_URL: full URL to /functions/v1/ingest-signals).\n' +
+        '       Use --dry-run to print the payload without uploading.');
+  }
+  if (!dryRun && !apiKey) {
+    die('error: --api-key or WMA_API_KEY required.\n' +
+        '       Get one from your Fortress dashboard → Settings → API Keys.');
+  }
+  if (!dryRun && apiKey && !/^wma_[a-f0-9]{32}$/i.test(apiKey)) {
+    warn(`API key format looks unusual (expected "wma_<32hex>", got "${apiKey.slice(0, 8)}…").`);
+  }
+  if (!salt) {
+    die('error: --salt or WMA_SIGNALS_SALT required (per-customer hex secret for hashing IoCs).\n' +
+        '       Generate once with:  node -e "console.log(require(\'crypto\').randomBytes(16).toString(\'hex\'))"\n' +
+        '       Store stably in .env.local.');
+  }
+  if (salt.length < 16) die('error: salt too short (need ≥16 hex chars)');
+  // Warn about CLI-passed secrets
+  if (apiKeyFlag) {
+    warn('--api-key on the command line is visible in shell history and process list.\n' +
+         '                Prefer: export WMA_API_KEY=...');
+  }
+  if (saltFlag) {
+    warn('--salt on the command line is visible in shell history.\n' +
+         '                Prefer: export WMA_SIGNALS_SALT=...');
+  }
+  // Discover the agent's NDJSON files
+  const agentDir = join(logDir, agentId);
+  const files = await collectFiles(agentDir);
+  if (files.length === 0) {
+    die(`error: no .ndjson files found under ${agentDir}. Run wma-fetch first?`);
+  }
+  info(`scanning ${files.length} ndjson file(s) under ${agentDir}`);
+  // Aggregate into a single signals payload
+  const agg = new SignalsAggregator({ salt });
+  for (const f of files) {
+    const stream = createReadStream(f, { encoding: 'utf8' });
+    const rl = createInterface({ input: stream, crlfDelay: Infinity });
+    for await (const line of rl) {
+      if (!line.trim()) continue;
+      // Malformed lines are skipped rather than aborting the whole upload.
+      let e; try { e = JSON.parse(line); } catch { continue; }
+      agg.add(e);
+    }
+  }
+  const signals = agg.finalize();
+  if (!signals.window_start || !signals.window_end) {
+    die('error: no entries had timestamps — nothing to upload');
+  }
+  const body = {
+    anthropic_agent_id: agentId,
+    display_name: displayName,
+    window_start: signals.window_start,
+    window_end: signals.window_end,
+    payload: signals.payload,
+  };
+  const bodyJson = JSON.stringify(body);
+  // Report the encoded size: string length counts UTF-16 units, not bytes.
+  info(`payload built: ${signals._meta.entries_processed} entries → ${Buffer.byteLength(bodyJson)} bytes`);
+  info(`window: ${signals.window_start} → ${signals.window_end}`);
+  info(`ioc_hashes: ${signals.payload.ioc_hashes.length}, tool_counts: ${Object.keys(signals.payload.tool_counts).length}`);
+  if (dryRun) {
+    info('--dry-run: payload that WOULD be POSTed:');
+    process.stdout.write(JSON.stringify(body, null, 2) + '\n');
+    return;
+  }
+  // POST it
+  info(`POST ${fortressUrl}`);
+  const { status, body: respBody } = await postJson(
+    fortressUrl,
+    { authorization: `Bearer ${apiKey}` },
+    bodyJson
+  );
+  if (status >= 200 && status < 300) {
+    info(`✅ HTTP ${status}`);
+    if (typeof respBody === 'object' && respBody.signal_id) {
+      info(`signal_id: ${respBody.signal_id}`);
+      info(`agent_id:  ${respBody.agent_id}`);
+      if (respBody.registered_new_agent) info('🆕 agent was auto-registered on this upload');
+    } else {
+      info(`response: ${typeof respBody === 'string' ? respBody.slice(0, 300) : JSON.stringify(respBody).slice(0, 300)}`);
+    }
+  } else {
+    const msg = typeof respBody === 'object' ? JSON.stringify(respBody) : String(respBody).slice(0, 500);
+    die(`error: upload failed (HTTP ${status}): ${msg}`);
+  }
+}
+// Any uncaught failure (I/O error, network error, bug) ends the run non-zero.
+main().catch((e) => { process.stderr.write(`error: ${e.stack || e.message}\n`); process.exit(1); });

package/src/anonymizer.js ADDED Viewed

@@ -0,0 +1,206 @@
+// ─────────────────────────────────────────────────────────────────────────
+// Anonymizer — strip raw payloads, produce signals safe for Fortress
+// ─────────────────────────────────────────────────────────────────────────
+// Reads a Watch NDJSON file (the full local log) and produces an
+// anonymized signals payload — the shape Fortress's `signals` table
+// expects. The output contains ONLY:
+//
+//   - counts (action_type, tool_name)
+//   - latencies (p50, p95) per tool
+//   - error rates per tool
+//   - salted SHA-256 hashes of IoCs (URLs, commands, queries)
+//   - top action_type sequences (Markov pairs)
+//   - stop_reason type counts (NOT the message text)
+//   - tokens_total
+//
+// What it NEVER outputs:
+//   - input.content (prompts)
+//   - output.content (agent text)
+//   - raw URLs / commands / queries
+//   - error messages
+//   - session_id (never emitted; only compared in memory to delimit sequences)
+//   - agent_id (not read or emitted by this module)
+//   - PII of any kind
+//
+// This is the single bottleneck between Watch (local) and Fortress (cloud).
+// Every byte that crosses to the cloud passes through this module.
+import { createHash, randomBytes } from 'node:crypto';
+import { createReadStream } from 'node:fs';
+import { createInterface } from 'node:readline';
+// ── Configuration ────────────────────────────────────────────────────────
+// Input fields that can hold raw, customer-identifying values. Only a salted
+// hash of each is ever produced; the value itself is never emitted.
+const HASHABLE_INPUT_FIELDS = [
+  'url',
+  'query',
+  'command',
+  'path',
+  'file_path',
+];
+// action_type values treated as tool invocations: only these feed the
+// per-tool statistics and IoC hashing.
+const TOOL_ACTIONS = new Set([
+  'tool_use',
+  'mcp_tool_use',
+  'custom_tool_use',
+]);
+// ── Hash helpers ─────────────────────────────────────────────────────────
+/**
+ * Salted, truncated SHA-256 of an IoC value.
+ *
+ * With a per-customer salt the same URL hashes differently for customer A and
+ * customer B. With one global salt, identical IoCs hash identically across
+ * customers (the antivirus model for L4 cross-customer intel).
+ *
+ * @param {*} value - strings are hashed as-is, anything else via JSON.stringify
+ * @param {string} salt - fed to the hash before the value
+ * @returns {string|null} "sha256:" followed by the first 32 hex characters of
+ *   the digest, or null when `value` is null or undefined
+ */
+export function hashWithSalt(value, salt) {
+  if (value == null) {
+    return null;
+  }
+  const text = typeof value === 'string' ? value : JSON.stringify(value);
+  const hasher = createHash('sha256');
+  hasher.update(salt);
+  hasher.update(text);
+  const hex = hasher.digest('hex');
+  return 'sha256:' + hex.slice(0, 32);
+}
+/**
+ * Create a fresh customer salt for callers that have none yet.
+ * @returns {string} 16 random bytes encoded as 32 hex characters
+ */
+export function generateSalt() {
+  const bytes = randomBytes(16);
+  return bytes.toString('hex');
+}
+// ── Single-entry extractor ───────────────────────────────────────────────
+// Returns the salted hashes of every non-empty string found in the entry's
+// hashable input fields, in HASHABLE_INPUT_FIELDS order. Entries whose
+// `input` is missing or not an object yield an empty list.
+function extractIocs(entry, salt) {
+  const input = entry.input;
+  if (!input || typeof input !== 'object') return [];
+  return HASHABLE_INPUT_FIELDS
+    .map((field) => input[field])
+    .filter((raw) => typeof raw === 'string' && raw.length > 0)
+    .map((raw) => hashWithSalt(raw, salt));
+}
+// ── Aggregator: walks the NDJSON stream and builds the signals payload ──
+/**
+ * Accumulates Watch log entries one at a time (`add`) and produces the
+ * anonymized signals payload (`finalize`). Only counts, latency percentiles,
+ * error rates, salted IoC hashes, action-type sequences, stop-reason types and
+ * a token total are kept.
+ */
+export class SignalsAggregator {
+  /**
+   * @param {{salt: string}} options - salt used for every IoC hash
+   * @throws {Error} when no salt is given
+   */
+  constructor({ salt } = {}) {
+    if (!salt) throw new Error('SignalsAggregator requires a salt');
+    this.salt = salt;
+    // Null-prototype dictionaries: keys come from log data, so names such as
+    // "constructor" or "__proto__" must behave like ordinary keys.
+    this.counts = Object.create(null);          // action_type → count
+    this.toolCounts = Object.create(null);      // tool_name → count
+    this.toolErrors = Object.create(null);      // tool_name → error count
+    this.toolLatencies = Object.create(null);   // tool_name → number[]
+    this.iocHashes = new Set();                 // unique IoC hashes
+    this.sequences = Object.create(null);       // "A → B" → count
+    this.stopReasons = Object.create(null);     // stop_reason.type → count
+    this.tokensTotal = 0;
+    this.windowStart = null;
+    this.windowEnd = null;
+    this.entryCount = 0;
+    this._prevActionType = null;
+    this._prevSessionId = null;
+  }
+  /**
+   * Fold one parsed log entry into the running aggregates.
+   * @param {object} entry - one parsed NDJSON record; anything that is not a
+   *   plain record (null, primitives, arrays) is ignored
+   */
+  add(entry) {
+    // A log line may parse to valid JSON that is not a record (e.g. `42` or
+    // `"x"`); counting those would inflate entries_processed and `unknown`.
+    if (!entry || typeof entry !== 'object' || Array.isArray(entry)) return;
+    this.entryCount++;
+    // Track window bounds (timestamps are compared as-is, so they must sort
+    // correctly in their stored form).
+    const ts = entry.timestamp || '';
+    if (ts) {
+      if (!this.windowStart || ts < this.windowStart) this.windowStart = ts;
+      if (!this.windowEnd || ts > this.windowEnd) this.windowEnd = ts;
+    }
+    // Counts
+    const at = entry.action_type || 'unknown';
+    this.counts[at] = (this.counts[at] || 0) + 1;
+    // Sequence tracking (only within the same session, never across a
+    // session_end). NOTE(review): the previous id is stored as `null` when
+    // missing, so an entry without session_id never matches and never forms a
+    // pair — confirm that is the intended handling of session-less entries.
+    if (this._prevActionType && entry.session_id === this._prevSessionId
+        && at !== 'session_end' && this._prevActionType !== 'session_end') {
+      const seqKey = `${this._prevActionType} → ${at}`;
+      this.sequences[seqKey] = (this.sequences[seqKey] || 0) + 1;
+    }
+    this._prevActionType = at;
+    this._prevSessionId = entry.session_id || null;
+    // Tools
+    if (entry.tool_name && TOOL_ACTIONS.has(at)) {
+      this.toolCounts[entry.tool_name] = (this.toolCounts[entry.tool_name] || 0) + 1;
+      if (entry.status === 'error') {
+        this.toolErrors[entry.tool_name] = (this.toolErrors[entry.tool_name] || 0) + 1;
+      }
+      // Finite numbers only: NaN/Infinity would break the numeric sort used
+      // for percentiles and serialize as null.
+      if (Number.isFinite(entry.duration_ms)) {
+        if (!this.toolLatencies[entry.tool_name]) this.toolLatencies[entry.tool_name] = [];
+        this.toolLatencies[entry.tool_name].push(entry.duration_ms);
+      }
+      // Extract & hash IoCs from this tool's input
+      for (const h of extractIocs(entry, this.salt)) this.iocHashes.add(h);
+    }
+    // Tokens (finite only, so one bad record cannot turn the total into
+    // Infinity/NaN)
+    if (Number.isFinite(entry.tokens_used)) this.tokensTotal += entry.tokens_used;
+    // Stop reasons (state_transition entries carry these)
+    const stopType = entry.output?.stop_reason?.type;
+    if (typeof stopType === 'string') {
+      this.stopReasons[stopType] = (this.stopReasons[stopType] || 0) + 1;
+    }
+  }
+  /**
+   * Compute p50/p95/max for an array of durations using the nearest-rank
+   * method: the p-th percentile is the value at 1-based rank ceil(p/100 · n).
+   * @param {number[]} arr - durations (not mutated)
+   * @returns {{p50: number, p95: number, max: number, n: number}|null} null
+   *   for an empty array
+   */
+  _percentiles(arr) {
+    if (arr.length === 0) return null;
+    const sorted = [...arr].sort((a, b) => a - b);
+    const n = sorted.length;
+    // p * n is multiplied out first so exact ranks (e.g. 95 * 20 / 100 = 19)
+    // are not pushed up a rank by floating-point error in p / 100.
+    const at = (p) => sorted[Math.max(0, Math.ceil((p * n) / 100) - 1)];
+    return { p50: at(50), p95: at(95), max: sorted[n - 1], n };
+  }
+  /**
+   * Build the signals object from everything added so far.
+   * @returns {{window_start: ?string, window_end: ?string, payload: object,
+   *   _meta: {entries_processed: number}}} window bounds are null when no
+   *   entry carried a timestamp
+   */
+  finalize() {
+    // Latencies aggregated
+    const latencies_p50_ms = {};
+    const latencies_p95_ms = {};
+    const error_rate_by_tool = {};
+    for (const [tool, durations] of Object.entries(this.toolLatencies)) {
+      const p = this._percentiles(durations);
+      if (p) {
+        latencies_p50_ms[tool] = p.p50;
+        latencies_p95_ms[tool] = p.p95;
+      }
+    }
+    for (const tool of Object.keys(this.toolCounts)) {
+      const errs = this.toolErrors[tool] || 0;
+      // Rounded to 4 decimals; unary + turns the toFixed string back into a number.
+      error_rate_by_tool[tool] = +(errs / this.toolCounts[tool]).toFixed(4);
+    }
+    // Top-10 sequences
+    const sequencesTop = Object.entries(this.sequences)
+      .sort((a, b) => b[1] - a[1])
+      .slice(0, 10)
+      .map(([pattern, count]) => ({ pattern, count }));
+    return {
+      window_start: this.windowStart,
+      window_end: this.windowEnd,
+      payload: {
+        counts: this.counts,
+        tool_counts: this.toolCounts,
+        latencies_p50_ms,
+        latencies_p95_ms,
+        error_rate_by_tool,
+        ioc_hashes: [...this.iocHashes],
+        sequences_top10: sequencesTop,
+        stop_reasons: this.stopReasons,
+        tokens_total: this.tokensTotal,
+      },
+      _meta: {
+        entries_processed: this.entryCount,
+      },
+    };
+  }
+}
+// ── Streaming convenience: anonymize one NDJSON file ────────────────────
+/**
+ * Stream a single NDJSON file through a SignalsAggregator.
+ * Blank lines and lines that are not valid JSON are skipped.
+ *
+ * @param {string} filePath - path of the NDJSON file to read
+ * @param {{salt: string}} options - salt for IoC hashing
+ * @returns {Promise<object>} the aggregator's finalize() result
+ * @throws {Error} when no salt is given
+ */
+export async function anonymizeFile(filePath, { salt } = {}) {
+  if (!salt) throw new Error('anonymizeFile requires a salt');
+  const aggregator = new SignalsAggregator({ salt });
+  const lines = createInterface({
+    input: createReadStream(filePath, { encoding: 'utf8' }),
+    crlfDelay: Infinity,
+  });
+  for await (const rawLine of lines) {
+    if (rawLine.trim() === '') continue;
+    let record;
+    try {
+      record = JSON.parse(rawLine);
+    } catch {
+      continue; // malformed line: skip it, keep going
+    }
+    aggregator.add(record);
+  }
+  return aggregator.finalize();
+}

package/src/fortress/url.js ADDED Viewed

@@ -0,0 +1,59 @@
+// ─────────────────────────────────────────────────────────────────────────
+// Fortress URL resolution — shared across upload-fortress, shield, etc.
+// ─────────────────────────────────────────────────────────────────────────
+// The user sets ONE of:
+//
+//   WMA_FORTRESS_BASE_URL=https://<project>.supabase.co/functions/v1
+//      → preferred. Each tool appends its endpoint (/ingest-signals,
+//        /get-policies, /ingest-decisions).
+//
+//   WMA_FORTRESS_URL=https://<project>.supabase.co/functions/v1/ingest-signals
+//      → legacy (v0.5.0 era). The base URL is derived by stripping the
+//        last path segment, so other endpoints can be constructed.
+//
+// Either way, callers receive a `base` they append `/<endpoint>` to.
+/**
+ * Resolve the Fortress base URL from env / args.
+ *
+ * Precedence: explicit base (CLI) → WMA_FORTRESS_BASE_URL → legacy full
+ * endpoint URL (CLI `explicitUrl`, then WMA_FORTRESS_URL). A legacy URL is
+ * turned into a base by dropping its last path segment; its query string and
+ * fragment are dropped too, because callers append `/<endpoint>` to the result
+ * and a leftover `?…` or `#…` would end up in the middle of that URL.
+ *
+ * @param {object} opts - { explicitUrl, explicitBase, env }
+ * @returns {string|null} base URL like https://x.supabase.co/functions/v1
+ *                       (no trailing slash), or null if not configured or if
+ *                       the legacy URL cannot be parsed.
+ */
+export function resolveFortressBase({ explicitUrl, explicitBase, env = process.env } = {}) {
+  // 1. Explicit base URL from CLI
+  if (explicitBase) return stripTrailingSlash(explicitBase);
+  // 2. Env: WMA_FORTRESS_BASE_URL (preferred)
+  if (env.WMA_FORTRESS_BASE_URL) return stripTrailingSlash(env.WMA_FORTRESS_BASE_URL);
+  // 3. Legacy: WMA_FORTRESS_URL (full path to ingest-signals)
+  const legacy = explicitUrl || env.WMA_FORTRESS_URL;
+  if (!legacy) return null;
+  try {
+    const u = new URL(legacy);
+    // Strip last path segment to get the base
+    const parts = u.pathname.split('/').filter(Boolean);
+    if (parts.length > 0) parts.pop();
+    u.pathname = '/' + parts.join('/');
+    // Endpoint-specific query/fragment must not leak into the shared base.
+    u.search = '';
+    u.hash = '';
+    return stripTrailingSlash(u.toString());
+  } catch {
+    // Unparseable legacy URL: report "not configured" rather than throwing.
+    return null;
+  }
+}
+// Remove one trailing "/" so callers can always append "/<endpoint>".
+function stripTrailingSlash(s) {
+  return s.endsWith('/') ? s.slice(0, -1) : s;
+}
+/**
+ * Join a Fortress base URL and an endpoint name with a single "/".
+ * @param {string} base - e.g. https://x.supabase.co/functions/v1
+ * @param {string} endpoint - e.g. "ingest-signals", "get-policies"
+ * @returns {string} the full endpoint URL
+ * @throws {Error} when `base` is empty or missing
+ */
+export function fortressEndpoint(base, endpoint) {
+  if (base) {
+    return `${base}/${endpoint}`;
+  }
+  throw new Error('Fortress base URL not configured');
+}

package/src/logger.js CHANGED Viewed

@@ -12,11 +12,17 @@ const EXPORT_FIELDS = [
 ];
 export class Logger {
-  constructor({ logDir, agentId, sessionId, silent }) {
+  // `silent`     : don't print log errors to stderr (default: true — quiet operation)
+  // `bestEffort` : SWALLOW write failures (default: false — fail loud).
+  //                Audit-grade default: refuse to silently lose events. Disk
+  //                full / EACCES / EINVAL must propagate so callers know.
+  //                Opt into bestEffort=true only for non-critical paths.
+  constructor({ logDir, agentId, sessionId, silent, bestEffort } = {}) {
     this.logDir = logDir;
     this.agentId = agentId;
     this.sessionId = sessionId || randomUUID();
     this.silent = silent !== false;
+    this.bestEffort = bestEffort === true;
     this.sequence = 0;
     this.currentDay = null;
     this.currentPath = null;
@@ -63,7 +69,10 @@ export class Logger {
       await appendFile(path, JSON.stringify(full) + '\n', { encoding: 'utf8', mode: 0o600 });
       this.count++;
     } catch (err) {
-      if (!this.silent) process.stderr.write(`[wma] log error: ${err.message}\n`);
+      if (!this.silent) process.stderr.write(`[wma] log write error: ${err.message}\n`);
+      // Audit-grade default: fail loud so callers know events are being lost.
+      // Disk full, EACCES, EINVAL etc. should NOT be silently swallowed.
+      if (!this.bestEffort) throw err;
     }
     return full;
   }

package/src/shield/policy.js CHANGED Viewed

@@ -42,12 +42,46 @@ export async function loadPolicies(path) {
   return data;
 }
+// ReDoS protection: regexes are loaded from a user-provided JSON policy file,
+// so a malicious or buggy pattern (e.g. `(a+)+$`) could pin the CPU on a long
+// input. We mitigate two ways:
+//   1) Cap the maximum input length passed to any regex test to MAX_REGEX_INPUT
+//      bytes. Above that we truncate before testing. Real agent values
+//      (URLs, commands, queries) are well under this in practice.
+//   2) Reject obviously dangerous patterns at compile time (heuristic).
+//
+// A future v0.5 may add a proper safe-regex-2 dependency for thorough analysis.
+const MAX_REGEX_INPUT = 8192;
+// Heuristic deny-list applied to the *source text* of a policy regex.
+const SUSPICIOUS_REGEX_PATTERNS = [
+  /(\([^)]*[+*][^)]*\))[+*]/,   // (x+)+ or (x*)* — classic catastrophic backtracking
+  /(\.\*){3,}/,                  // multiple .* in a row
+];
+/**
+ * Validate and compile one regex taken from a policy file.
+ *
+ * @param {string} src - regex source text from the policy
+ * @param {string} where - location label used in error messages
+ *   (e.g. "url.regex")
+ * @returns {RegExp} the compiled regex
+ * @throws {Error} when `src` is not a string, is longer than 2000 characters,
+ *   matches a suspicious pattern, or is not valid regex syntax. Every message
+ *   starts with `policy <where>:` so the offending rule can be located.
+ */
+function validateRegexString(src, where) {
+  if (typeof src !== 'string') {
+    throw new Error(`policy ${where}: regex must be a string`);
+  }
+  if (src.length > 2000) {
+    throw new Error(`policy ${where}: regex too long (>2000 chars)`);
+  }
+  for (const sus of SUSPICIOUS_REGEX_PATTERNS) {
+    if (sus.test(src)) {
+      throw new Error(`policy ${where}: regex looks vulnerable to catastrophic backtracking ("${src.slice(0, 60)}…"). Refusing to load.`);
+    }
+  }
+  try {
+    return new RegExp(src);
+  } catch (err) {
+    // A bare SyntaxError would not say which policy field is broken.
+    throw new Error(`policy ${where}: invalid regex ("${src.slice(0, 60)}…"): ${err.message}`, { cause: err });
+  }
+}
 function compileMatchRegexes(match) {
-  for (const condition of Object.values(match)) {
+  for (const [field, condition] of Object.entries(match)) {
     if (condition && typeof condition === 'object') {
-      if (condition.regex) condition._regex = new RegExp(condition.regex);
-      if (condition.not_regex) condition._not_regex = new RegExp(condition.not_regex);
-      if (condition.regex_any) condition._regex_any = condition.regex_any.map(r => new RegExp(r));
+      if (condition.regex) condition._regex = validateRegexString(condition.regex, `${field}.regex`);
+      if (condition.not_regex) condition._not_regex = validateRegexString(condition.not_regex, `${field}.not_regex`);
+      if (condition.regex_any) {
+        condition._regex_any = condition.regex_any.map((r, i) =>
+          validateRegexString(r, `${field}.regex_any[${i}]`));
+      }
     }
   }
 }
@@ -56,6 +90,15 @@ function getNested(obj, path) {
   return path.split('.').reduce((o, k) => (o == null ? undefined : o[k]), obj);
 }
+// ReDoS guard for pathologically long values (e.g. an agent that pastes a
+// 5MB string into a tool argument): only the first MAX_REGEX_INPUT characters
+// of a string are tested. Non-string values never match.
+function safeRegexTest(re, value) {
+  if (typeof value === 'string') {
+    const capped = value.length > MAX_REGEX_INPUT ? value.slice(0, MAX_REGEX_INPUT) : value;
+    return re.test(capped);
+  }
+  return false;
+}
 function matchValue(value, condition) {
   // Literal scalar match
   if (condition === null || typeof condition !== 'object') {
@@ -67,13 +110,13 @@ function matchValue(value, condition) {
   if (condition.in !== undefined) return condition.in.includes(value);
   if (condition.not_in !== undefined) return !condition.not_in.includes(value);
   if (condition._regex !== undefined) {
-    return typeof value === 'string' && condition._regex.test(value);
+    return safeRegexTest(condition._regex, value);
   }
   if (condition._not_regex !== undefined) {
-    return typeof value === 'string' && !condition._not_regex.test(value);
+    return typeof value === 'string' && !safeRegexTest(condition._not_regex, value);
   }
   if (condition._regex_any !== undefined) {
-    return typeof value === 'string' && condition._regex_any.some(r => r.test(value));
+    return condition._regex_any.some(r => safeRegexTest(r, value));
   }
   // Unknown condition shape — defensive: fail-closed (no match) so unknown
   // conditions never silently allow events.