npm - @fanboynz/network-scanner - Versions diffs - 2.0.66 → 3.0.0 - Mend

@fanboynz/network-scanner 2.0.66 → 3.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/.github/workflows/npm-publish.yml +134 -10
package/CHANGELOG.md +135 -0
package/CLAUDE.md +18 -7
package/README.md +12 -4
package/lib/adblock-rust.js +23 -18
package/lib/adblock.js +127 -82
package/lib/browserexit.js +210 -200
package/lib/browserhealth.js +84 -60
package/lib/cdp.js +103 -81
package/lib/clear_sitedata.js +61 -159
package/lib/cloudflare.js +579 -409
package/lib/colorize.js +29 -12
package/lib/compare.js +16 -8
package/lib/compress.js +2 -1
package/lib/curl.js +287 -220
package/lib/domain-cache.js +87 -40
package/lib/dry-run.js +137 -194
package/lib/fingerprint.js +20 -18
package/lib/flowproxy.js +391 -188
package/lib/ghost-cursor.js +8 -7
package/lib/grep.js +248 -171
package/lib/ignore_similar.js +70 -124
package/lib/interaction.js +132 -235
package/lib/nettools.js +309 -87
package/lib/openvpn_vpn.js +12 -11
package/lib/output.js +92 -59
package/lib/post-processing.js +216 -162
package/lib/redirect.js +46 -30
package/lib/referrer.js +158 -165
package/lib/searchstring.js +290 -381
package/lib/smart-cache.js +141 -91
package/lib/socks-relay.js +8 -7
package/lib/spawn-async.js +137 -0
package/lib/validate_rules.js +188 -176
package/lib/wireguard_vpn.js +111 -117
package/nwss.js +740 -156
package/package.json +4 -4

package/lib/ghost-cursor.js CHANGED Viewed

@@ -14,7 +14,8 @@
 // INSTALL:
 //   npm install ghost-cursor            (optional dependency)
-const { formatLogMessage } = require('./colorize');
+const { formatLogMessage, messageColors } = require('./colorize');
+const GHOST_CURSOR_TAG = messageColors.processing('[ghost-cursor]');
 let ghostCursorModule = null;
 let ghostCursorAvailable = false;
@@ -61,7 +62,7 @@ function createGhostCursor(page, options = {}) {
     return cursor;
   } catch (err) {
     if (forceDebug) {
-      console.log(formatLogMessage('debug', `[ghost-cursor] Failed to create cursor: ${err.message}`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Failed to create cursor: ${err.message}`));
     }
     return null;
   }
@@ -103,13 +104,13 @@ async function ghostMove(cursor, toX, toY, options = {}) {
     await cursor.moveTo({ x: toX, y: toY }, moveOpts);
     if (forceDebug) {
-      console.log(formatLogMessage('debug', `[ghost-cursor] Moved to (${Math.round(toX)}, ${Math.round(toY)})`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Moved to (${Math.round(toX)}, ${Math.round(toY)})`));
     }
     return true;
   } catch (err) {
     if (forceDebug) {
-      console.log(formatLogMessage('debug', `[ghost-cursor] Move failed: ${err.message}`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Move failed: ${err.message}`));
     }
     return false;
   }
@@ -162,13 +163,13 @@ async function ghostClick(cursor, target, options = {}) {
     if (forceDebug) {
       const label = typeof target === 'string' ? target : `(${Math.round(target.x)}, ${Math.round(target.y)})`;
-      console.log(formatLogMessage('debug', `[ghost-cursor] Clicked ${label}`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Clicked ${label}`));
     }
     return true;
   } catch (err) {
     if (forceDebug) {
-      console.log(formatLogMessage('debug', `[ghost-cursor] Click failed: ${err.message}`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Click failed: ${err.message}`));
     }
     return false;
   }
@@ -193,7 +194,7 @@ async function ghostRandomMove(cursor, options = {}) {
     return true;
   } catch (err) {
     if (options.forceDebug) {
-      console.log(formatLogMessage('debug', `[ghost-cursor] Random move failed: ${err.message}`));
+      console.log(formatLogMessage('debug', `${GHOST_CURSOR_TAG} Random move failed: ${err.message}`));
     }
     return false;
   }

package/lib/grep.js CHANGED Viewed

@@ -2,33 +2,85 @@
 // Alternative to searchstring.js using grep for pattern matching
 const fs = require('fs');
+// spawnSync only used for validateGrepAvailability (runs once at
+// startup). Production grep + curl paths go through runProcess (async).
 const { spawnSync } = require('child_process');
-const { colorize, colors, messageColors, tags, formatLogMessage } = require('./colorize');
+const { runProcess } = require('./spawn-async');
+const { messageColors, formatLogMessage } = require('./colorize');
+const GREP_TAG = messageColors.processing('[grep]');
 // === Constants ===
 const GREP_DEFAULTS = {
   TIMEOUT_SECONDS: 30,
   MAX_REDIRECTS: 5,
-  MAX_SIZE_BYTES: 10 * 1024 * 1024, // 10MB
-  VALIDATION_TIMEOUT: 5000, // 5 seconds
-  SPAWN_TIMEOUT_MULTIPLIER: 1000, // Convert seconds to milliseconds
-  GREP_TIMEOUT: 10000, // 10 seconds for grep operations
-  MAX_BUFFER_SIZE: 1024 * 1024, // 1MB max buffer
+  // 50MB to match lib/curl.js and lib/searchstring.js — the three
+  // download paths previously had two different caps (10MB here, 50MB
+  // there) so the same URL could succeed via one path and fail via
+  // another.
+  MAX_SIZE_BYTES: 50 * 1024 * 1024,
+  // Cap grep's stdout collection at the input size — output can in
+  // theory exceed input (overlapping match contexts) but in practice
+  // matching lines from 50MB of content max out around that. Replaces
+  // the old 1MB MAX_BUFFER_SIZE that silently killed grep with ENOBUFS
+  // on pages with many matching lines, making the pattern silently
+  // report "not found" despite thousands of matches.
+  MAX_GREP_OUTPUT_BYTES: 50 * 1024 * 1024,
+  VALIDATION_TIMEOUT: 5000,
+  GREP_TIMEOUT: 10000,
   DEFAULT_MAX_MATCHES: 1000,
   GREP_SUCCESS_STATUS: 0,
-  GREP_NOT_FOUND_STATUS: 1,
   CURL_SUCCESS_STATUS: 0,
   VERSION_LINE_INDEX: 0
 };
 /**
- * Searches content using grep with the provided patterns
+ * Run a single grep pattern against `content`, returning the result
+ * asynchronously. Uses spawn (NOT spawnSync) — same rationale as
+ * downloadAndGrep — and handles stdout buffering ourselves so we can
+ * accept output up to MAX_GREP_OUTPUT_BYTES instead of being capped
+ * at spawnSync's `maxBuffer` (which silently killed grep with ENOBUFS
+ * on pages with many matching lines).
+ *
+ * @param {string} content - Stdin content for grep
+ * @param {string} pattern - The pattern to search for
+ * @param {string[]} baseArgs - Pre-computed grep flags (-i, -F, etc.)
+ * @returns {Promise<{status: number|null, stdout: string, truncated: boolean, signal: string|null, error?: string}>}
+ */
+async function grepOne(content, pattern, baseArgs) {
+  // Shared async-spawn helper handles stdout cap, kill timer, error/close
+  // wiring, and stdin EPIPE swallowing. We just adapt the return shape
+  // to what grepContent expects (string stdout, status alias for code).
+  const result = await runProcess('grep', [...baseArgs, pattern], {
+    timeout: GREP_DEFAULTS.GREP_TIMEOUT,
+    maxStdout: GREP_DEFAULTS.MAX_GREP_OUTPUT_BYTES,
+    input: content,
+    collectStderr: false  // grep's stderr isn't used by callers
+  });
+  return {
+    status: result.error ? -1 : result.code,
+    stdout: result.stdout.toString('utf8'),
+    truncated: result.truncated,
+    signal: result.signal,
+    error: result.error
+  };
+}
+/**
+ * Searches content using grep with the provided patterns.
+ *
+ * Async — runs one spawn per pattern (sequential, not concurrent, to
+ * avoid spiking memory with N copies of `content` on grep's stdin
+ * simultaneously). The previous spawnSync-per-pattern implementation
+ * blocked the event loop for the duration of every grep call; the
+ * outer downloadAndGrep's switch to async spawn was undone by this
+ * sync inner step.
+ *
  * @param {string} content - The content to search
  * @param {Array<string>} searchPatterns - Array of grep patterns to search for
- * @param {object} options - Grep options
- * @returns {Promise<object>} Object with found boolean, matchedPattern, and allMatches array
+ * @param {object} options - Grep options (ignoreCase, wholeWord, regex, maxMatches)
+ * @returns {Promise<{found: boolean, matchedPattern: string|null, allMatches: Array<{pattern: string, matches: string[]}>}>}
  */
-function grepContent(content, searchPatterns, options = {}) {
+async function grepContent(content, searchPatterns, options = {}) {
   const {
     ignoreCase = true,
     wholeWord = false,
@@ -36,60 +88,53 @@ function grepContent(content, searchPatterns, options = {}) {
     maxMatches = GREP_DEFAULTS.DEFAULT_MAX_MATCHES
   } = options;
-  if (!content || searchPatterns.length === 0) {
+  // Pre-filter empty/whitespace patterns at the top instead of doing
+  // `if (!pattern || ...) continue` inside the loop. `typeof === 'string'`
+  // guard rejects non-string entries (numbers, booleans, etc.) so we
+  // don't trip TypeError on `p.trim()` for misconfigured input.
+  const validPatterns = Array.isArray(searchPatterns)
+    ? searchPatterns.filter(p => typeof p === 'string' && p.trim().length > 0)
+    : [];
+  if (!content || validPatterns.length === 0) {
     return { found: false, matchedPattern: null, allMatches: [] };
   }
-  try {
-    const allMatches = [];
-    let firstMatch = null;
-    // Build common args once outside the loop
-    const baseArgs = ['--text', '--color=never'];
-    if (ignoreCase) baseArgs.push('-i');
-    if (wholeWord) baseArgs.push('-w');
-    if (!regex) baseArgs.push('-F');
-    for (const pattern of searchPatterns) {
-      if (!pattern || pattern.trim().length === 0) continue;
-      const grepArgs = [...baseArgs, pattern];
-      try {
-        const result = spawnSync('grep', grepArgs, {
-          encoding: 'utf8',
-          input: content,
-          timeout: GREP_DEFAULTS.GREP_TIMEOUT,
-          maxBuffer: GREP_DEFAULTS.MAX_BUFFER_SIZE
-        });
-        // grep returns 0 if found, 1 if not found, 2+ for errors
-        if (result.status === GREP_DEFAULTS.GREP_SUCCESS_STATUS && result.stdout) {
-          allMatches.push({
-            pattern: pattern,
-            matches: result.stdout.split('\n').filter(line => line.trim().length > 0).slice(0, maxMatches)
-          });
-          if (!firstMatch) {
-            firstMatch = pattern;
-          }
-        }
-      } catch (grepErr) {
-        // Continue with next pattern if this one fails
-        console.warn(formatLogMessage('warn', `[grep] Pattern "${pattern}" failed: ${grepErr.message}`));
-      }
+  const baseArgs = ['--text', '--color=never'];
+  if (ignoreCase) baseArgs.push('-i');
+  if (wholeWord) baseArgs.push('-w');
+  if (!regex) baseArgs.push('-F');
+  const allMatches = [];
+  let firstMatch = null;
+  for (const pattern of validPatterns) {
+    const result = await grepOne(content, pattern, baseArgs);
+    if (result.error) {
+      console.warn(formatLogMessage('warn', `${GREP_TAG} Pattern "${pattern}" failed: ${result.error}`));
+      continue;
+    }
+    // Surface truncation so admins can see when grep output hit the
+    // 50MB cap — previously this was silent (the SIGTERM-on-truncation
+    // path looks the same as a normal exit to the caller).
+    if (result.truncated) {
+      console.warn(formatLogMessage('warn', `${GREP_TAG} Pattern "${pattern}" output truncated at ${GREP_DEFAULTS.MAX_GREP_OUTPUT_BYTES} bytes; results may be incomplete`));
+    }
+    // grep exit codes: 0 = found, 1 = not found, 2+ = error.
+    // Also accept truncated output — we collected enough to slice to
+    // maxMatches even though more existed beyond the cap.
+    if (result.status === GREP_DEFAULTS.GREP_SUCCESS_STATUS && result.stdout) {
+      const lines = result.stdout.split('\n').filter(line => line.trim().length > 0).slice(0, maxMatches);
+      allMatches.push({ pattern, matches: lines });
+      if (!firstMatch) firstMatch = pattern;
     }
-    return {
-      found: allMatches.length > 0,
-      matchedPattern: firstMatch,
-      allMatches: allMatches
-    };
-  } catch (error) {
-    throw new Error(`Grep search failed: ${error.message}`);
   }
+  return {
+    found: allMatches.length > 0,
+    matchedPattern: firstMatch,
+    allMatches
+  };
 }
 /**
@@ -102,74 +147,84 @@ function grepContent(content, searchPatterns, options = {}) {
  * @returns {Promise<object>} Object with found boolean, matchedPattern, and content
  */
 async function downloadAndGrep(url, searchPatterns, userAgent = '', grepOptions = {}, timeout = GREP_DEFAULTS.TIMEOUT_SECONDS) {
-  try {
-    const curlArgs = [
-      '-s', // Silent mode
-      '-L', // Follow redirects
-      '--max-time', timeout.toString(),
-      '--max-redirs', GREP_DEFAULTS.MAX_REDIRECTS.toString(),
-      '--fail-with-body', // Return body even on HTTP errors
-      '--compressed', // Accept compressed responses
-    ];
-    if (userAgent) {
-      curlArgs.push('-H', `User-Agent: ${userAgent}`);
-    }
+  const curlArgs = [
+    '-s',
+    '-L',
+    '--max-time', timeout.toString(),
+    '--max-redirs', GREP_DEFAULTS.MAX_REDIRECTS.toString(),
+    '--fail-with-body',
+    '--compressed'
+  ];
+  if (userAgent) curlArgs.push('-H', `User-Agent: ${userAgent}`);
+  curlArgs.push(
+    '-H', 'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
+    '-H', 'Accept-Language: en-US,en;q=0.5',
+    '-H', 'Accept-Encoding: gzip, deflate',
+    '-H', 'Connection: keep-alive',
+    '-H', 'Upgrade-Insecure-Requests: 1'
+  );
+  curlArgs.push(url);
-    // Add common headers to appear more browser-like
-    curlArgs.push(
-      '-H', 'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
-      '-H', 'Accept-Language: en-US,en;q=0.5',
-      '-H', 'Accept-Encoding: gzip, deflate',
-      '-H', 'Connection: keep-alive',
-      '-H', 'Upgrade-Insecure-Requests: 1'
-    );
+  const result = await runProcess('curl', curlArgs, {
+    timeout: timeout * 1000,
+    maxStdout: GREP_DEFAULTS.MAX_SIZE_BYTES
+  });
-    curlArgs.push(url);
+  if (result.error) throw new Error(`Download and grep failed for ${url}: ${result.error}`);
+  if (result.truncated) throw new Error(`Output exceeded ${GREP_DEFAULTS.MAX_SIZE_BYTES} bytes for ${url}`);
+  if (result.signal) throw new Error(`Curl killed by signal ${result.signal} for ${url}`);
+  if (result.code !== GREP_DEFAULTS.CURL_SUCCESS_STATUS) {
+    throw new Error(`Curl exited with status ${result.code}: ${result.stderr.toString('utf8')}`);
+  }
-    // Download content with curl
-    const curlResult = spawnSync('curl', curlArgs, {
-      encoding: 'utf8',
-      timeout: timeout * GREP_DEFAULTS.SPAWN_TIMEOUT_MULTIPLIER,
-      maxBuffer: GREP_DEFAULTS.MAX_SIZE_BYTES
-    });
-    if (curlResult.error) {
-      throw curlResult.error;
-    }
-    if (curlResult.status !== GREP_DEFAULTS.CURL_SUCCESS_STATUS) {
-      throw new Error(`Curl exited with status ${curlResult.status}: ${curlResult.stderr}`);
-    }
-    const content = curlResult.stdout;
-    // Search content with grep
+  const content = result.stdout.toString('utf8');
+  try {
     const grepResult = await grepContent(content, searchPatterns, grepOptions);
     return {
       found: grepResult.found,
       matchedPattern: grepResult.matchedPattern,
       allMatches: grepResult.allMatches,
-      content: content,
+      content,
       contentLength: content.length
     };
-  } catch (error) {
-    throw new Error(`Download and grep failed for ${url}: ${error.message}`);
+  } catch (grepErr) {
+    throw new Error(`Download and grep failed for ${url}: ${grepErr.message}`);
   }
 }
 /**
- * Creates a grep-based URL handler for downloading and searching content
- * @param {object} config - Configuration object containing all necessary parameters
- * @returns {Function} URL handler function for grep-based content analysis
+ * Creates a grep-based URL handler for downloading and searching content.
+ *
+ * @param {object} config
+ * @param {string[]} config.searchStrings - OR-logic patterns (any match)
+ * @param {string[]} config.searchStringsAnd - AND-logic patterns (all must match)
+ * @param {boolean} config.hasSearchString - True if searchStrings is non-empty
+ * @param {boolean} config.hasSearchStringAnd - True if searchStringsAnd is non-empty;
+ *   when true, AND-logic is applied to the combined grep result
+ * @param {RegExp[]} config.regexes - URL regex patterns for the first-pass filter
+ * @param {Function} config.addMatchedDomain - Sink for matched domains
+ * @param {Function} config.isDomainAlreadyDetected - Skip-if-true predicate
+ * @param {Function} [config.onContentFetched] - Optional cache hook
+ * @param {string} config.currentUrl - The page URL being scanned
+ * @param {boolean} config.perSiteSubDomains - Track at subdomain granularity
+ * @param {string[]} config.ignoreDomains - Domain ignore list
+ * @param {Function} config.matchesIgnoreDomain - Ignore-list matcher
+ * @param {Function} config.getRootDomain - URL → registrable root domain
+ * @param {object} config.siteConfig - Per-site config (verbose, firstParty, thirdParty)
+ * @param {boolean} config.dumpUrls - Write matched URLs to file
+ * @param {string} config.matchedUrlsLogFile - Path for dumpUrls output
+ * @param {boolean} config.forceDebug
+ * @param {string} config.userAgent - Curl user agent
+ * @param {string|null} config.resourceType - Resource type for adblock-rules mode
+ * @param {object} [config.grepOptions] - Passed through to grepContent
+ *   (ignoreCase, wholeWord, regex, maxMatches)
+ * @returns {Function} URL handler: async (requestUrl) => void
  */
 function createGrepHandler(config) {
   const {
     searchStrings,
+    searchStringsAnd,
     regexes,
-    matchedDomains,
     addMatchedDomain,
     isDomainAlreadyDetected,
     onContentFetched,
@@ -185,122 +240,143 @@ function createGrepHandler(config) {
     userAgent,
     resourceType,
     hasSearchString,
+    hasSearchStringAnd,
     grepOptions = {}
   } = config;
+  // Hoisted: currentUrl doesn't change for this handler's lifetime.
+  // Previously parsed on every single request.
+  let currentRootDomain = '';
+  let currentUrlHostname = '';
+  try { currentRootDomain = getRootDomain(currentUrl); } catch (_) {}
+  try { currentUrlHostname = new URL(currentUrl).hostname; } catch (_) {}
   return async function grepHandler(requestUrl) {
-    const respDomain = perSiteSubDomains ? (new URL(requestUrl)).hostname : getRootDomain(requestUrl);
-    const fullSubdomain = (new URL(requestUrl)).hostname; // Always get full subdomain for cache tracking
-    // Skip if already detected to avoid duplicates
+    // Regex check FIRST — cheap filter that skips ~99% of requests.
+    // Previously this ran AFTER URL parses and a domain-cache lookup,
+    // paying for parses on requests we then immediately drop.
+    const matchesRegex = regexes.some(re => re.test(requestUrl));
+    if (!matchesRegex) return;
+    // Parse requestUrl ONCE and reuse. Was parsed 4 times previously
+    // (two hostname parses + two for currentUrlHostname/requestHostname).
+    let requestHostname;
+    try { requestHostname = new URL(requestUrl).hostname; } catch (_) { return; }
+    const fullSubdomain = requestHostname;
+    const respDomain = perSiteSubDomains ? requestHostname : getRootDomain(requestUrl);
     if (isDomainAlreadyDetected(fullSubdomain)) {
       if (forceDebug) {
-        console.log(formatLogMessage('debug', `[grep] Skipping already detected subdomain: ${fullSubdomain}`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} Skipping already detected subdomain: ${fullSubdomain}`));
       }
       return;
     }
-    // Only process URLs that match our regex patterns
-    const matchesRegex = regexes.some(re => re.test(requestUrl));
-    if (!matchesRegex) return;
-    // Check if this is a first-party request (same domain as the URL being scanned)
-    const currentUrlHostname = new URL(currentUrl).hostname;
-    const requestHostname = new URL(requestUrl).hostname;
     const isFirstParty = currentUrlHostname === requestHostname;
-    // Apply first-party/third-party filtering
     if (isFirstParty && siteConfig.firstParty === false) {
       if (forceDebug) {
-        console.log(formatLogMessage('debug', `[grep] Skipping first-party request (firstParty=false): ${requestUrl}`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} Skipping first-party request (firstParty=false): ${requestUrl}`));
       }
       return;
     }
     if (!isFirstParty && siteConfig.thirdParty === false) {
       if (forceDebug) {
-        console.log(formatLogMessage('debug', `[grep] Skipping third-party request (thirdParty=false): ${requestUrl}`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} Skipping third-party request (thirdParty=false): ${requestUrl}`));
       }
       return;
     }
     try {
       if (forceDebug) {
-        console.log(formatLogMessage('debug', `[grep] Downloading and searching content from: ${requestUrl}`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} Downloading and searching content from: ${requestUrl}`));
       }
-      // If NO searchstring is defined, match immediately (like browser behavior)
-      if (!hasSearchString) {
-        if (!respDomain || matchesIgnoreDomain(respDomain, ignoreDomains)) {
-          return;
-        }
+      // No searchstring at all → match immediately on regex alone.
+      if (!hasSearchString && !hasSearchStringAnd) {
+        if (!respDomain || matchesIgnoreDomain(respDomain, ignoreDomains)) return;
         addMatchedDomain(respDomain, resourceType, fullSubdomain);
-        const simplifiedUrl = getRootDomain(currentUrl);
+        const partyType = isFirstParty ? 'first-party' : 'third-party';
         if (siteConfig.verbose === 1) {
-          const partyType = isFirstParty ? 'first-party' : 'third-party';
-          console.log(formatLogMessage('match', `[${simplifiedUrl}] ${requestUrl} (${partyType}, grep) matched regex`));
+          console.log(formatLogMessage('match', `[${currentRootDomain}] ${requestUrl} (${partyType}, grep) matched regex`));
         }
-        if (dumpUrls) {
+        if (dumpUrls && matchedUrlsLogFile) {
           const timestamp = new Date().toISOString();
-          const partyType = isFirstParty ? 'first-party' : 'third-party';
           try {
-            fs.appendFileSync(matchedUrlsLogFile,
-              `${timestamp} [match][${simplifiedUrl}] ${requestUrl} (${partyType}, grep)\n`);
+            fs.appendFileSync(matchedUrlsLogFile,
+              `${timestamp} [match][${currentRootDomain}] ${requestUrl} (${partyType}, grep)\n`);
           } catch (logErr) {
             console.warn(formatLogMessage('warn', `Failed to write to matched URLs log: ${logErr.message}`));
           }
         }
         return;
       }
-      // If searchstring IS defined, download and grep content
-      const result = await downloadAndGrep(requestUrl, searchStrings, userAgent, grepOptions, GREP_DEFAULTS.TIMEOUT_SECONDS);
-      // Cache the fetched content if callback provided
+      // Combine OR + AND patterns into one grep pass. The AND-logic
+      // check below uses per-pattern attribution from
+      // grepContent.allMatches. Previously createGrepHandler only
+      // destructured `searchStrings` and ignored `searchStringsAnd`
+      // entirely — users configuring AND-only patterns with grep mode
+      // got silent zero matches.
+      const allPatterns = [
+        ...(searchStrings || []),
+        ...(searchStringsAnd || [])
+      ];
+      const result = await downloadAndGrep(requestUrl, allPatterns, userAgent, grepOptions, GREP_DEFAULTS.TIMEOUT_SECONDS);
       if (onContentFetched && result.content) {
         try {
           onContentFetched(requestUrl, result.content);
         } catch (cacheErr) {
-          if (forceDebug) console.log(formatLogMessage('debug', `[grep] Content caching failed: ${cacheErr.message}`));
+          if (forceDebug) console.log(formatLogMessage('debug', `${GREP_TAG} Content caching failed: ${cacheErr.message}`));
         }
       }
-      if (result.found) {
-        if (!respDomain || matchesIgnoreDomain(respDomain, ignoreDomains)) {
-          return;
+      // Apply OR vs AND logic. AND requires every searchStringsAnd
+      // pattern to appear in grepResult.allMatches; OR just needs
+      // anything found.
+      let matched = false;
+      let matchDescription = null;
+      if (hasSearchStringAnd && searchStringsAnd && searchStringsAnd.length > 0) {
+        const foundPatterns = new Set(result.allMatches.map(m => m.pattern));
+        if (searchStringsAnd.every(p => foundPatterns.has(p))) {
+          matched = true;
+          matchDescription = `patterns: ${searchStringsAnd.length}/${searchStringsAnd.length} (AND)`;
         }
+      } else if (result.found) {
+        matched = true;
+        matchDescription = `pattern: "${result.matchedPattern}"`;
+      }
+      if (matched) {
+        if (!respDomain || matchesIgnoreDomain(respDomain, ignoreDomains)) return;
         addMatchedDomain(respDomain, resourceType, fullSubdomain);
-        const simplifiedUrl = getRootDomain(currentUrl);
+        const partyType = isFirstParty ? 'first-party' : 'third-party';
+        const matchCount = result.allMatches.reduce((sum, m) => sum + m.matches.length, 0);
         if (siteConfig.verbose === 1) {
-          const partyType = isFirstParty ? 'first-party' : 'third-party';
-          const matchCount = result.allMatches.reduce((sum, match) => sum + match.matches.length, 0);
-          console.log(formatLogMessage('match', `[${simplifiedUrl}] ${requestUrl} (${partyType}, grep) contains pattern: "${result.matchedPattern}" (${matchCount} matches)`));
+          console.log(formatLogMessage('match', `[${currentRootDomain}] ${requestUrl} (${partyType}, grep) contains ${matchDescription} (${matchCount} matches)`));
         }
-        if (dumpUrls) {
+        if (dumpUrls && matchedUrlsLogFile) {
           const timestamp = new Date().toISOString();
-          const partyType = isFirstParty ? 'first-party' : 'third-party';
-          const matchCount = result.allMatches.reduce((sum, match) => sum + match.matches.length, 0);
           try {
-            fs.appendFileSync(matchedUrlsLogFile,
-              `${timestamp} [match][${simplifiedUrl}] ${requestUrl} (${partyType}, grep, pattern: "${result.matchedPattern}", matches: ${matchCount})\n`);
+            fs.appendFileSync(matchedUrlsLogFile,
+              `${timestamp} [match][${currentRootDomain}] ${requestUrl} (${partyType}, grep, ${matchDescription}, matches: ${matchCount})\n`);
           } catch (logErr) {
             console.warn(formatLogMessage('warn', `Failed to write to matched URLs log: ${logErr.message}`));
           }
         }
       } else if (forceDebug) {
         const partyType = isFirstParty ? 'first-party' : 'third-party';
-        console.log(formatLogMessage('debug', `[grep] ${requestUrl} (${partyType}) matched regex but no patterns found`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} ${requestUrl} (${partyType}) matched regex but no patterns found`));
       }
     } catch (err) {
       if (forceDebug) {
-        console.log(formatLogMessage('debug', `[grep] Failed to download/grep content for ${requestUrl}: ${err.message}`));
+        console.log(formatLogMessage('debug', `${GREP_TAG} Failed to download/grep content for ${requestUrl}: ${err.message}`));
       }
     }
   };
@@ -340,9 +416,10 @@ function validateGrepAvailability() {
   }
 }
+// Public surface. downloadAndGrep is module-internal (only called by
+// createGrepHandler) — was exported but no external caller imported it.
 module.exports = {
   grepContent,
-  downloadAndGrep,
   createGrepHandler,
   validateGrepAvailability
 };