npm - muaddib-scanner - Versions diffs - 2.6.1 → 2.6.2 - Mend

muaddib-scanner 2.6.1 → 2.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "muaddib-scanner",
-  "version": "2.6.1",
+  "version": "2.6.2",
   "description": "Supply-chain threat detection & response for npm & PyPI/Python",
   "main": "src/index.js",
   "bin": {
@@ -55,7 +55,7 @@
   },
   "devDependencies": {
     "@eslint/js": "10.0.1",
-    "eslint": "10.0.2",
+    "eslint": "10.0.3",
     "eslint-plugin-security": "^4.0.0",
     "globals": "17.4.0"
   }

package/src/scoring.js CHANGED Viewed

@@ -122,8 +122,14 @@ const FP_COUNT_THRESHOLDS = {
   // B1 FP reduction: bundled code aliases eval/Function (sinon, storybook, vitest)
   dangerous_call_eval: { maxCount: 3, from: 'MEDIUM', to: 'LOW' },
   // P6: HTTP client libraries (undici, aws-sdk, nodemailer, jsdom) parse Authorization/Bearer headers
-  // with 5+ credential regexes. Real harvesters use 1-2 targeted regexes.
-  credential_regex_harvest: { maxCount: 4, from: 'HIGH', to: 'LOW' }
+  // with 3+ credential regexes. Real harvesters use 1-2 targeted regexes.
+  credential_regex_harvest: { maxCount: 2, from: 'HIGH', to: 'LOW' },
+  // P7: Config frameworks (pm2, nx, dotenv, aws-sdk) read more than 10 env vars — not credential theft.
+  // Real stealers access 1-5 targeted env vars. Count >10 = config loader pattern.
+  env_access: { maxCount: 10, from: 'HIGH', to: 'LOW' },
+  // P7: Bundled files with more than 5 high-entropy strings are data files, not malware payloads.
+  // Real payloads use 1-2 targeted encoded strings. Count >5 = bundled assets/data.
+  high_entropy_string: { maxCount: 5, to: 'LOW' }
 };
 // Types exempt from dist/ downgrade — IOC matches, lifecycle scripts, and
@@ -144,8 +150,9 @@ const DIST_EXEMPT_TYPES = new Set([
   // fetch_decrypt_exec (fetch+decrypt+eval triple) remains exempt — never coincidental.
 ]);
-// Regex matching dist/build/minified/bundled file paths
-const DIST_FILE_RE = /(?:^|[/\\])(?:dist|build)[/\\]|\.min\.js$|\.bundle\.js$/i;
+// Regex matching dist/build/out/output/minified/bundled file paths
+// P7: added out/ and output/ — common build output directories (esbuild, custom build scripts)
+const DIST_FILE_RE = /(?:^|[/\\])(?:dist|build|out|output)[/\\]|\.min\.js$|\.bundle\.js$/i;
 // Bundler artifact types: get two-notch downgrade in dist/ files (CRITICAL→MEDIUM, HIGH→LOW).
 // These are individual pattern signals that bundlers routinely produce (eval for globalThis,
@@ -155,7 +162,9 @@ const DIST_BUNDLER_ARTIFACT_TYPES = new Set([
   'dynamic_require', 'dynamic_import',
   'obfuscation_detected', 'high_entropy_string', 'possible_obfuscation',
   'js_obfuscation_pattern', 'vm_code_execution',
-  'module_compile', 'module_compile_dynamic'
+  'module_compile', 'module_compile_dynamic',
+  // P7: env_access in dist/ is bundled SDK config reading, not credential theft
+  'env_access'
 ]);
 // Types exempt from reachability downgrade — IOC matches, lifecycle, and package-level types.
@@ -223,15 +232,16 @@ function applyFPReductions(threats, reachableFiles, packageName) {
     const rule = FP_COUNT_THRESHOLDS[t.type];
     if (rule && typeCounts[t.type] > rule.maxCount && (!rule.from || t.severity === rule.from)) {
       const typeRatio = typeCounts[t.type] / totalThreats;
-      // suspicious_dataflow: partial bypass of percentage guard up to 80%.
-      // Complex apps (SMTP, monitoring) have 50-80% dataflow findings — still downgrade.
-      // But if dataflow is >80% of ALL findings, it may be real targeted exfiltration.
-      // (Audit fix: full bypass was exploitable — 4+ dataflow patterns = all LOW.)
+      // suspicious_dataflow: full bypass of percentage guard. Packages with >3 suspicious_dataflow
+      // findings are always legitimate SDKs (SMTP, monitoring, analytics). Real malware has 1-2
+      // targeted source→sink pairs. The count >3 threshold is sufficient protection.
+      // P7: removed 80% ratio cap — it caused ~30k FP hits in production on SDK packages
+      // where dataflow was the dominant finding type (e.g. @darajs/core, addio-admin-sdk).
       // vm_code_execution: full bypass — packages with only vm.Script calls (cassandra-driver,
       // webpack, jest) are legitimate. Real malware using vm always has other signals
       // (network, fs, obfuscation). The >3 count threshold is sufficient protection.
       if (typeRatio < 0.4 ||
-          (t.type === 'suspicious_dataflow' && typeRatio < 0.8) ||
+          t.type === 'suspicious_dataflow' ||
           t.type === 'vm_code_execution') {
         t.severity = rule.to;
       }

package/src/temporal-runner.js CHANGED Viewed

@@ -84,6 +84,7 @@ async function runTemporalAnalyses(targetPath, options, pkgNames) {
     }
     {
       const PUBLISH_CONCURRENCY = 5;
+      const publishThreats = [];
       for (let i = 0; i < pkgNames.length; i += PUBLISH_CONCURRENCY) {
         const batch = pkgNames.slice(i, i + PUBLISH_CONCURRENCY);
         const results = await Promise.allSettled(
@@ -93,15 +94,38 @@ async function runTemporalAnalyses(targetPath, options, pkgNames) {
           if (r.status !== 'fulfilled' || !r.value.suspicious) continue;
           const det = r.value;
           for (const a of det.anomalies) {
-            threats.push({
+            publishThreats.push({
               type: a.type,
               severity: a.severity,
               message: a.description,
-              file: `node_modules/${det.packageName}/package.json`
+              file: `node_modules/${det.packageName}/package.json`,
+              _scope: det.packageName.startsWith('@') ? det.packageName.split('/')[0] : null
             });
           }
         }
       }
+      // P7: Scope-aware deduplication for monorepo releases.
+      // When 3+ findings of the same anomaly type (e.g. publish_burst, rapid_succession) come
+      // from the same @scope, it's a coordinated monorepo release (lerna, nx, turbo), not an
+      // attack. Downgrade that scope's findings of that type to LOW severity.
+      const MONOREPO_SCOPE_THRESHOLD = 3;
+      const scopeTypeCounts = new Map(); // key: `${scope}:${type}` → count
+      for (const t of publishThreats) {
+        if (!t._scope) continue;
+        const key = `${t._scope}:${t.type}`;
+        scopeTypeCounts.set(key, (scopeTypeCounts.get(key) || 0) + 1);
+      }
+      for (const t of publishThreats) {
+        if (t._scope) {
+          const key = `${t._scope}:${t.type}`;
+          if ((scopeTypeCounts.get(key) || 0) >= MONOREPO_SCOPE_THRESHOLD) {
+            t.severity = 'LOW';
+          }
+        }
+        delete t._scope; // clean up internal field
+        threats.push(t);
+      }
     }
   }