muaddib-scanner 2.10.33 → 2.10.34

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
  "name": "muaddib-scanner",
- "version": "2.10.33",
+ "version": "2.10.34",
  "description": "Supply-chain threat detection & response for npm & PyPI/Python",
  "main": "src/index.js",
  "bin": {
@@ -223,6 +223,28 @@ function formatDiscord(results) {
  });
  }

+ // Add LLM Detective field if LLM analysis was performed
+ if (results.llm && results.llm.verdict) {
+ const verdictEmoji = results.llm.verdict === 'malicious' ? '\u274C'
+ : results.llm.verdict === 'benign' ? '\u2705' : '\u2753';
+ const modeTag = results.llm.mode === 'shadow' ? ' [shadow]' : '';
+ let llmValue = `${verdictEmoji} **${results.llm.verdict}** (${Math.round(results.llm.confidence * 100)}% confidence)${modeTag}`;
+ if (results.llm.attack_type) {
+ llmValue += `\nType: ${results.llm.attack_type}`;
+ }
+ if (results.llm.iocs_found && results.llm.iocs_found.length > 0) {
+ llmValue += `\nIOCs: ${results.llm.iocs_found.join(', ')}`;
+ }
+ if (results.llm.reasoning) {
+ llmValue += `\n${results.llm.reasoning}`;
+ }
+ fields.push({
+ name: 'LLM Analysis',
+ value: llmValue.slice(0, 1024),
+ inline: false
+ });
+ }
+
  const titlePrefix = emoji ? `${emoji} ` : '';
  const prioritySuffix = priority && priority.level ? ` [${priority.level}]` : '';
  const ts = results.timestamp ? new Date(results.timestamp) : new Date();
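For reference, the new block consumes the `llm` object that `buildAlertData` attaches to the webhook payload (see the hunk further down) and renders it as one Discord embed field. A minimal sketch with the payload shape taken from the code and made-up values:

```js
// Hypothetical input — shape per buildAlertData's webhookData.llm, values illustrative.
const results = {
  llm: {
    verdict: 'malicious',
    confidence: 0.92,
    reasoning: 'postinstall exfiltrates process.env to an external domain',
    attack_type: 'credential_exfil',
    iocs_found: ['evil.example.com'],
    mode: 'shadow'
  }
};
// The block above would push roughly this field (truncated to 1024 chars):
// {
//   name: 'LLM Analysis',
//   value: '\u274C **malicious** (92% confidence) [shadow]\n' +
//          'Type: credential_exfil\nIOCs: evil.example.com\n' +
//          'postinstall exfiltrates process.env to an external domain',
//   inline: false
// }
```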
package/src/ml/llm-detective.js ADDED
@@ -0,0 +1,538 @@
+ 'use strict';
+
+ /**
+ * LLM Detective — Claude Haiku-based package analysis for FP reduction.
+ *
+ * Reads ALL source code from a suspect package and asks Haiku to determine
+ * if it's real malware or a false positive. Operates in two modes:
+ * - shadow (default): log verdict, don't affect webhook flow
+ * - active: suppress webhook for high-confidence benign, enrich for malicious
+ *
+ * No external dependency — uses native fetch() against the Anthropic Messages API.
+ *
+ * Security: NEVER sends sandboxResult (contains honey tokens).
+ */
+
+ const fs = require('fs');
+ const path = require('path');
+ const { findFiles } = require('../utils.js');
+
+ // ── Constants ──
+
+ const API_URL = 'https://api.anthropic.com/v1/messages';
+ const MODEL_ID = 'claude-haiku-4-5-20251001';
+ const MAX_CONTEXT_BYTES = 100 * 1024; // 100KB cap for source code in prompt
+ const LLM_TIMEOUT_MS = 60000; // 60s timeout per API call
+ const LLM_CONCURRENCY_MAX = 2; // max simultaneous API calls
+ const LLM_DAILY_LIMIT_DEFAULT = 100;
+ const MAX_SINGLE_FILE_BYTES = 512 * 1024; // skip individual files > 512KB
+
+ // Extensions to collect from packages
+ const SOURCE_EXTENSIONS = ['.js', '.mjs', '.cjs', '.ts', '.json', '.py'];
+
+ // ── Semaphore (pattern: src/shared/http-limiter.js) ──
+
+ const _semaphore = { active: 0, queue: [] };
+
+ function acquireLlmSlot() {
+ if (_semaphore.active < LLM_CONCURRENCY_MAX) {
+ _semaphore.active++;
+ return Promise.resolve();
+ }
+ return new Promise(resolve => {
+ _semaphore.queue.push(resolve);
+ });
+ }
+
+ function releaseLlmSlot() {
+ if (_semaphore.queue.length > 0) {
+ const next = _semaphore.queue.shift();
+ next();
+ } else {
+ _semaphore.active--;
+ }
+ }
+
+ // ── Daily quota counter (in-memory, resets at midnight UTC) ──
+
+ const _dailyCounter = { count: 0, resetDate: null };
+
+ function getTodayUTC() {
+ return new Date().toISOString().slice(0, 10);
+ }
+
+ function isDailyQuotaAvailable() {
+ const today = getTodayUTC();
+ if (_dailyCounter.resetDate !== today) {
+ _dailyCounter.count = 0;
+ _dailyCounter.resetDate = today;
+ }
+ return _dailyCounter.count < getDailyLimit();
+ }
+
+ function incrementDailyCounter() {
+ const today = getTodayUTC();
+ if (_dailyCounter.resetDate !== today) {
+ _dailyCounter.count = 0;
+ _dailyCounter.resetDate = today;
+ }
+ _dailyCounter.count++;
+ }
+
+ function getDailyLimit() {
+ return Math.max(1, parseInt(process.env.MUADDIB_LLM_DAILY_LIMIT, 10) || LLM_DAILY_LIMIT_DEFAULT);
+ }
+
+ function getDailyCount() {
+ return _dailyCounter.count;
+ }
+
+ function resetDailyCounter() {
+ _dailyCounter.count = 0;
+ _dailyCounter.resetDate = null;
+ }
+
+ // ── Feature flags ──
+
+ function isLlmEnabled() {
+ if (!process.env.ANTHROPIC_API_KEY) return false;
+ const env = process.env.MUADDIB_LLM_ENABLED;
+ if (env !== undefined && env.toLowerCase() === 'false') return false;
+ return true;
+ }
+
+ function getLlmMode() {
+ const env = process.env.MUADDIB_LLM_MODE;
+ if (env && env.toLowerCase() === 'active') return 'active';
+ return 'shadow';
+ }
+
+ // ── Stats ──
+
+ const _stats = { analyzed: 0, malicious: 0, benign: 0, uncertain: 0, errors: 0, skipped: 0 };
+
+ function getStats() {
+ return { ..._stats };
+ }
+
+ function resetStats() {
+ _stats.analyzed = 0;
+ _stats.malicious = 0;
+ _stats.benign = 0;
+ _stats.uncertain = 0;
+ _stats.errors = 0;
+ _stats.skipped = 0;
+ }
+
+ // ── Source context collection ──
+
+ /**
+ * Collect source files from an extracted package directory.
+ * Respects MAX_CONTEXT_BYTES cap. If over, falls back to priority files.
+ *
+ * @param {string} extractedDir - path to extracted package
+ * @param {Object} scanResult - scan result with threats[].file for priority
+ * @returns {{ files: Array<{path: string, content: string}>, truncated: boolean, totalBytes: number }}
+ */
+ function collectSourceContext(extractedDir, scanResult) {
+ const allFiles = findFiles(extractedDir, {
+ extensions: SOURCE_EXTENSIONS,
+ maxFiles: 200
+ });
+
+ const fileEntries = [];
+ let totalBytes = 0;
+ let truncated = false;
+
+ // Try to include all files
+ for (const filePath of allFiles) {
+ try {
+ const stat = fs.statSync(filePath);
+ if (stat.size > MAX_SINGLE_FILE_BYTES) continue;
+ if (totalBytes + stat.size > MAX_CONTEXT_BYTES) {
+ truncated = true;
+ break;
+ }
+ const content = fs.readFileSync(filePath, 'utf8');
+ const relPath = path.relative(extractedDir, filePath).replace(/\\/g, '/');
+ totalBytes += Buffer.byteLength(content, 'utf8');
+ fileEntries.push({ path: relPath, content });
+ } catch {
+ // Skip unreadable files
+ }
+ }
+
+ // If truncated, restart with priority files only
+ if (truncated) {
+ fileEntries.length = 0;
+ totalBytes = 0;
+ truncated = true;
+
+ const flaggedFiles = new Set(
+ ((scanResult && scanResult.threats) || [])
+ .map(t => t.file)
+ .filter(Boolean)
+ );
+
+ // Priority order: package.json, flagged files, entry point, README
+ const priorityRelPaths = new Set();
+ priorityRelPaths.add('package.json');
+ for (const f of flaggedFiles) priorityRelPaths.add(f);
+
+ // Read package.json to find entry point
+ try {
+ const pkgJsonPath = path.join(extractedDir, 'package.json');
+ const pkgJson = JSON.parse(fs.readFileSync(pkgJsonPath, 'utf8'));
+ if (pkgJson.main) priorityRelPaths.add(pkgJson.main);
+ if (pkgJson.bin) {
+ const bins = typeof pkgJson.bin === 'string' ? [pkgJson.bin] : Object.values(pkgJson.bin || {});
+ for (const b of bins) if (b) priorityRelPaths.add(b);
+ }
+ } catch {}
+
+ priorityRelPaths.add('README.md');
+ priorityRelPaths.add('readme.md');
+
+ for (const relPath of priorityRelPaths) {
+ const absPath = path.join(extractedDir, relPath);
+ try {
+ if (!fs.existsSync(absPath)) continue;
+ const stat = fs.statSync(absPath);
+ if (stat.size > MAX_SINGLE_FILE_BYTES) continue;
+ if (totalBytes + stat.size > MAX_CONTEXT_BYTES) continue;
+ const content = fs.readFileSync(absPath, 'utf8');
+ totalBytes += Buffer.byteLength(content, 'utf8');
+ fileEntries.push({ path: relPath.replace(/\\/g, '/'), content });
+ } catch {}
+ }
+ }
+
+ return { files: fileEntries, truncated, totalBytes };
+ }
+
+ // ── Prompt construction ──
+
+ const SYSTEM_PROMPT = `You are a senior supply-chain security analyst. You receive the COMPLETE source code of a suspect npm/PyPI package and the results of a static threat scanner.
+
+ Your job: determine if this package is MALICIOUS or LEGITIMATE.
+
+ METHODICAL ANALYSIS:
+ 1. Read ALL the code, not just flagged files
+ 2. Look for exfiltration patterns: process.env -> HTTP/DNS/WebSocket to an external domain
+ 3. Look for persistence patterns: writes to ~/.bashrc, ~/.npmrc, crontab, systemd
+ 4. Look for obfuscation patterns: eval(atob(...)), Buffer.from(...,'base64'), String.fromCharCode chains
+ 5. Look for reverse shell patterns: child_process.exec + /bin/sh + net.Socket
+ 6. Check coherence: does the README match the code? Are declared dependencies actually used?
+ 7. Check lifecycle scripts: what does postinstall/preinstall actually do?
+
+ LEGITIMATE PATTERNS (DO NOT FLAG):
+ - CLI tools using child_process for documented commands
+ - Bundlers/transpilers doing dynamic require/import
+ - Web frameworks accessing process.env for configuration
+ - Build tools downloading native binaries from their own CDN/GitHub releases
+ - Packages with >1000 weekly downloads AND an active GitHub repo with stars
+
+ MALICIOUS PATTERNS:
+ - Code executed at postinstall unrelated to the described functionality
+ - Exfiltration of process.env, ~/.npmrc, ~/.ssh, ~/.aws to an external domain
+ - Obfuscation with no reason (a 10-line package doesn't need minification)
+ - Suspicious domains in code (raw IPs, recent domains, ngrok, serveo, etc.)
+ - Empty or copied README (typosquatting signal)
+ - Package created recently (<7 days) with 0 downloads and dangerous code
+
+ RESPOND IN STRICT JSON ONLY (nothing else):
+ {
+ "verdict": "malicious" | "benign" | "uncertain",
+ "confidence": 0.0-1.0,
+ "reasoning": "Detailed explanation of your analysis",
+ "iocs_found": ["domain.com", "1.2.3.4"],
+ "attack_type": "credential_exfil" | "reverse_shell" | "crypto_miner" | "backdoor" | "typosquat" | "protestware" | null,
+ "recommendation": "block" | "monitor" | "safe"
+ }`;
+
+ /**
+ * Build the messages array for the Anthropic API call.
+ *
+ * @param {string} name - package name
+ * @param {string} version - package version
+ * @param {string} ecosystem - 'npm' or 'pypi'
+ * @param {{ files: Array, truncated: boolean, totalBytes: number }} sourceContext
+ * @param {Array} threats - scan findings
+ * @param {Object} npmRegistryMeta - registry metadata (optional)
+ * @returns {{ system: string, messages: Array }}
+ */
+ function buildPrompt(name, version, ecosystem, sourceContext, threats, npmRegistryMeta) {
+ let userContent = `## Package: ${name}@${version} (${ecosystem})\n\n`;
+
+ // Registry metadata
+ if (npmRegistryMeta) {
+ userContent += `## Registry Metadata\n`;
+ if (npmRegistryMeta.age_days !== undefined) userContent += `- Age: ${npmRegistryMeta.age_days} days\n`;
+ if (npmRegistryMeta.weekly_downloads !== undefined) userContent += `- Weekly downloads: ${npmRegistryMeta.weekly_downloads}\n`;
+ if (npmRegistryMeta.version_count !== undefined) userContent += `- Version count: ${npmRegistryMeta.version_count}\n`;
+ if (npmRegistryMeta.author_package_count !== undefined) userContent += `- Author package count: ${npmRegistryMeta.author_package_count}\n`;
+ if (npmRegistryMeta.has_repository !== undefined) userContent += `- Has repository: ${npmRegistryMeta.has_repository}\n`;
+ userContent += '\n';
+ }
+
+ // Static scanner findings
+ if (threats && threats.length > 0) {
+ userContent += `## Static Scanner Findings (${threats.length} total)\n`;
+ for (const t of threats.slice(0, 30)) {
+ const loc = t.file ? ` in ${t.file}${t.line ? ':' + t.line : ''}` : '';
+ userContent += `- [${t.severity}] ${t.type}${loc}: ${t.message || ''}\n`;
+ }
+ if (threats.length > 30) {
+ userContent += `... and ${threats.length - 30} more findings\n`;
+ }
+ userContent += '\n';
+ }
+
+ // Source code
+ userContent += `## Source Code (${sourceContext.files.length} files, ${sourceContext.totalBytes} bytes${sourceContext.truncated ? ', TRUNCATED — only priority files shown' : ''})\n\n`;
+ for (const file of sourceContext.files) {
+ userContent += `### ${file.path}\n\`\`\`\n${file.content}\n\`\`\`\n\n`;
+ }
+
+ return {
+ system: SYSTEM_PROMPT,
+ messages: [{ role: 'user', content: userContent }]
+ };
+ }
+
+ // ── Anthropic API call ──
+
+ /**
+ * Call the Anthropic Messages API with retry on 429/5xx.
+ *
+ * @param {string} system - system prompt
+ * @param {Array} messages - conversation messages
+ * @returns {Promise<string>} response text content
+ */
+ async function callAnthropicAPI(system, messages) {
+ const apiKey = process.env.ANTHROPIC_API_KEY;
+ if (!apiKey) throw new Error('ANTHROPIC_API_KEY not set');
+
+ const body = JSON.stringify({
+ model: MODEL_ID,
+ max_tokens: 1024,
+ system,
+ messages
+ });
+
+ const maxAttempts = 2;
+ for (let attempt = 0; attempt < maxAttempts; attempt++) {
+ const controller = new AbortController();
+ const timeout = setTimeout(() => controller.abort(), LLM_TIMEOUT_MS);
+
+ try {
+ const response = await fetch(API_URL, {
+ method: 'POST',
+ headers: {
+ 'Content-Type': 'application/json',
+ 'x-api-key': apiKey,
+ 'anthropic-version': '2023-06-01'
+ },
+ body,
+ signal: controller.signal
+ });
+
+ clearTimeout(timeout);
+
+ if (response.ok) {
+ const data = await response.json();
+ if (data.content && data.content[0] && data.content[0].text) {
+ return data.content[0].text;
+ }
+ throw new Error('Unexpected response format');
+ }
+
+ // Retry on 429 or 5xx
+ if ((response.status === 429 || response.status >= 500) && attempt < maxAttempts - 1) {
+ const delay = 2000 * (attempt + 1);
+ console.log(`[LLM] API ${response.status}, retrying in ${delay}ms...`);
+ await new Promise(r => setTimeout(r, delay));
+ continue;
+ }
+
+ const errorText = await response.text().catch(() => '');
+ throw new Error(`API ${response.status}: ${errorText.slice(0, 200)}`);
+ } catch (err) {
+ clearTimeout(timeout);
+ if (err.name === 'AbortError') {
+ throw new Error(`API timeout (${LLM_TIMEOUT_MS}ms)`);
+ }
+ if (attempt < maxAttempts - 1 && err.message && /ECONNRESET|ETIMEDOUT|ENOTFOUND/.test(err.message)) {
+ await new Promise(r => setTimeout(r, 2000));
+ continue;
+ }
+ throw err;
+ }
+ }
+ }
+
+ // ── Response parsing ──
+
+ /**
+ * Parse LLM response text into structured verdict object.
+ * Handles raw JSON and markdown-fenced JSON.
+ *
+ * @param {string} text - raw response text
+ * @returns {{ verdict: string, confidence: number, reasoning: string, iocs_found: string[], attack_type: string|null, recommendation: string }}
+ */
+ function parseResponse(text) {
+ const fallback = {
+ verdict: 'uncertain',
+ confidence: 0,
+ reasoning: 'Failed to parse LLM response',
+ iocs_found: [],
+ attack_type: null,
+ recommendation: 'monitor'
+ };
+
+ if (!text || typeof text !== 'string') return fallback;
+
+ let parsed;
+ try {
+ parsed = JSON.parse(text.trim());
+ } catch {
+ // Try extracting JSON from markdown fence
+ const fenceMatch = text.match(/```(?:json)?\s*([\s\S]*?)```/);
+ if (fenceMatch) {
+ try {
+ parsed = JSON.parse(fenceMatch[1].trim());
+ } catch {
+ return fallback;
+ }
+ } else {
+ // Try finding first { ... } block
+ const start = text.indexOf('{');
+ const end = text.lastIndexOf('}');
+ if (start !== -1 && end > start) {
+ try {
+ parsed = JSON.parse(text.substring(start, end + 1));
+ } catch {
+ return fallback;
+ }
+ } else {
+ return fallback;
+ }
+ }
+ }
+
+ // Validate and normalize
+ const validVerdicts = ['malicious', 'benign', 'uncertain'];
+ const verdict = validVerdicts.includes(parsed.verdict) ? parsed.verdict : 'uncertain';
+
+ let confidence = parseFloat(parsed.confidence);
+ if (isNaN(confidence)) confidence = 0;
+ confidence = Math.max(0, Math.min(1, confidence));
+
+ const validRecommendations = ['block', 'monitor', 'safe'];
+ const recommendation = validRecommendations.includes(parsed.recommendation) ? parsed.recommendation : 'monitor';
+
+ return {
+ verdict,
+ confidence: Math.round(confidence * 1000) / 1000,
+ reasoning: typeof parsed.reasoning === 'string' ? parsed.reasoning : '',
+ iocs_found: Array.isArray(parsed.iocs_found) ? parsed.iocs_found.filter(x => typeof x === 'string').slice(0, 20) : [],
+ attack_type: typeof parsed.attack_type === 'string' ? parsed.attack_type : null,
+ recommendation
+ };
+ }
+
+ // ── Main entry point ──
+
+ /**
+ * Investigate a suspect package with Claude Haiku.
+ *
+ * @param {string} extractedDir - path to extracted package source
+ * @param {Object} scanResult - static scan result with threats[] and summary
+ * @param {Object} options - { name, version, ecosystem, registryMeta, npmRegistryMeta, tier }
+ * @returns {Promise<Object|null>} verdict object or null on skip/error
+ */
+ async function investigatePackage(extractedDir, scanResult, options = {}) {
+ const { name, version, ecosystem, npmRegistryMeta, tier } = options;
+
+ // Guard rails
+ if (!isLlmEnabled()) {
+ _stats.skipped++;
+ return null;
+ }
+
+ if (!isDailyQuotaAvailable()) {
+ _stats.skipped++;
+ console.log(`[LLM] Daily quota exhausted (${_dailyCounter.count}/${getDailyLimit()}) — skipping ${name}@${version}`);
+ return null;
+ }
+
+ await acquireLlmSlot();
+ try {
+ incrementDailyCounter();
+
+ // Collect source files
+ const sourceContext = collectSourceContext(extractedDir, scanResult);
+ if (sourceContext.files.length === 0) {
+ _stats.skipped++;
+ console.log(`[LLM] No source files found in ${name}@${version} — skipping`);
+ return null;
+ }
+
+ // Build prompt
+ const threats = (scanResult && scanResult.threats) || [];
+ const { system, messages } = buildPrompt(
+ name || 'unknown', version || '0.0.0', ecosystem || 'npm',
+ sourceContext, threats, npmRegistryMeta
+ );
+
+ // Call API
+ const responseText = await callAnthropicAPI(system, messages);
+
+ // Parse response
+ const result = parseResponse(responseText);
+ result.mode = getLlmMode();
+
+ // Update stats
+ _stats.analyzed++;
+ if (result.verdict === 'malicious') _stats.malicious++;
+ else if (result.verdict === 'benign') _stats.benign++;
+ else _stats.uncertain++;
+
+ return result;
+ } catch (err) {
+ _stats.errors++;
+ console.error(`[LLM] Investigation error for ${name}@${version}: ${err.message}`);
+ return null;
+ } finally {
+ releaseLlmSlot();
+ }
+ }
+
+ // ── Reset for testing ──
+
+ function resetLlmLimiter() {
+ _semaphore.active = 0;
+ _semaphore.queue.length = 0;
+ }
+
+ module.exports = {
+ investigatePackage,
+ isLlmEnabled,
+ getLlmMode,
+ getDailyLimit,
+ getDailyCount,
+ isDailyQuotaAvailable,
+ incrementDailyCounter,
+ getStats,
+ resetStats,
+ resetDailyCounter,
+ resetLlmLimiter,
+ // Exported for testing
+ collectSourceContext,
+ buildPrompt,
+ parseResponse,
+ // Constants for testing
+ MAX_CONTEXT_BYTES,
+ LLM_CONCURRENCY_MAX,
+ LLM_DAILY_LIMIT_DEFAULT
+ };
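Taken together, the module exposes a small surface: guard rails (feature flag, daily quota, semaphore), context collection, one API call, and a normalized verdict. A usage sketch (the require path assumes the file lands at src/ml/llm-detective.js as the later hunks suggest; the sample scan result and directory are made up; Node 18+ is assumed for the global fetch()):

```js
'use strict';

// Sketch only — not part of the package. The env flags are the ones the module reads.
process.env.ANTHROPIC_API_KEY = 'sk-ant-...';   // required, else isLlmEnabled() is false
process.env.MUADDIB_LLM_MODE = 'shadow';        // 'active' allows webhook suppression
process.env.MUADDIB_LLM_DAILY_LIMIT = '50';     // defaults to 100

const detective = require('./src/ml/llm-detective.js');

(async () => {
  // Hypothetical static-scan result for an already-extracted tarball.
  const scanResult = {
    threats: [{ severity: 'high', type: 'exfil', file: 'index.js', line: 3, message: 'env read + HTTP POST' }],
    summary: { riskScore: 40 }
  };
  const verdict = await detective.investigatePackage('/tmp/pkg-extract', scanResult, {
    name: 'some-package', version: '1.0.0', ecosystem: 'npm'
  });
  // null on skip/error; otherwise { verdict, confidence, reasoning, iocs_found,
  // attack_type, recommendation, mode }
  console.log(verdict);
})();
```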
@@ -250,6 +250,19 @@ function isCanaryEnabled() {
  return true;
  }

+ function isLlmDetectiveEnabled() {
+ if (!process.env.ANTHROPIC_API_KEY) return false;
+ const env = process.env.MUADDIB_LLM_ENABLED;
+ if (env !== undefined && env.toLowerCase() === 'false') return false;
+ return true;
+ }
+
+ function getLlmDetectiveMode() {
+ const env = process.env.MUADDIB_LLM_MODE;
+ if (env && env.toLowerCase() === 'active') return 'active';
+ return 'shadow';
+ }
+
  /** @deprecated See comment above verboseMode. */
  function isVerboseMode() {
  if (verboseMode) return true;
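These helpers mirror isLlmEnabled()/getLlmMode() in the new module: enabled iff ANTHROPIC_API_KEY is set and MUADDIB_LLM_ENABLED is not 'false'; mode defaults to shadow. A test-style sketch of the flag semantics (the require path and key value are illustrative):

```js
const { isLlmDetectiveEnabled, getLlmDetectiveMode } = require('./classify.js'); // path illustrative

delete process.env.ANTHROPIC_API_KEY;
delete process.env.MUADDIB_LLM_ENABLED;
console.assert(isLlmDetectiveEnabled() === false);   // no key → disabled

process.env.ANTHROPIC_API_KEY = 'sk-ant-test';       // illustrative value
console.assert(isLlmDetectiveEnabled() === true);
console.assert(getLlmDetectiveMode() === 'shadow');  // default mode

process.env.MUADDIB_LLM_MODE = 'ACTIVE';             // comparison is case-insensitive
console.assert(getLlmDetectiveMode() === 'active');

process.env.MUADDIB_LLM_ENABLED = 'false';           // explicit kill switch wins
console.assert(isLlmDetectiveEnabled() === false);
```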
@@ -348,6 +361,8 @@ module.exports = {
  formatFindings,
  isSandboxEnabled,
  isCanaryEnabled,
+ isLlmDetectiveEnabled,
+ getLlmDetectiveMode,
  isVerboseMode,
  setVerboseMode,
  quickTyposquatCheck,
@@ -3,7 +3,7 @@ const fs = require('fs');
  const path = require('path');
  const os = require('os');
  const { isDockerAvailable, SANDBOX_CONCURRENCY_MAX } = require('../sandbox/index.js');
- const { setVerboseMode, isSandboxEnabled, isCanaryEnabled } = require('./classify.js');
+ const { setVerboseMode, isSandboxEnabled, isCanaryEnabled, isLlmDetectiveEnabled, getLlmDetectiveMode } = require('./classify.js');
  const { loadState, saveState, loadDailyStats, saveDailyStats, purgeTarballCache, getParisHour } = require('./state.js');
  const { isTemporalEnabled, isTemporalAstEnabled, isTemporalPublishEnabled, isTemporalMaintainerEnabled } = require('./temporal.js');
  const { pendingGrouped, flushScopeGroup, sendDailyReport, DAILY_REPORT_HOUR } = require('./webhook.js');
@@ -119,6 +119,16 @@ async function startMonitor(options, stats, dailyAlerts, recentlyScanned, downlo
  console.log('[MONITOR] Canary tokens disabled (MUADDIB_MONITOR_CANARY=false)');
  }

+ // LLM Detective status
+ if (isLlmDetectiveEnabled()) {
+ const llmMode = getLlmDetectiveMode();
+ const llmLimit = parseInt(process.env.MUADDIB_LLM_DAILY_LIMIT, 10) || 100;
+ console.log(`[MONITOR] LLM Detective enabled — mode: ${llmMode}, daily limit: ${llmLimit}, model: claude-haiku-4-5`);
+ } else {
+ const reason = !process.env.ANTHROPIC_API_KEY ? 'no ANTHROPIC_API_KEY' : 'MUADDIB_LLM_ENABLED=false';
+ console.log(`[MONITOR] LLM Detective disabled (${reason})`);
+ }
+
  // Temporal analysis status
  if (isTemporalEnabled()) {
  console.log('[MONITOR] Temporal lifecycle analysis enabled — detecting sudden lifecycle script changes');
@@ -676,11 +676,44 @@ async function scanPackage(name, version, ecosystem, tarballUrl, registryMeta, s
  } else if (ecosystem === 'npm' && hasHighConfidenceThreat(result)) {
  console.log(`[MONITOR] REPUTATION BYPASS: ${name} has high-confidence threat — using raw score`);
  }
- await trySendWebhook(name, version, ecosystem, adjustedResult, sandboxResult, mlResult);
+ // LLM Detective: AI-powered analysis for T1a/T1b suspects
+ let llmResult = null;
+ if ((tier === '1a' || tier === '1b') && (adjustedResult.summary.riskScore || 0) >= 25) {
+ try {
+ const { investigatePackage, isLlmEnabled, getLlmMode } = require('../ml/llm-detective.js');
+ if (isLlmEnabled()) {
+ llmResult = await investigatePackage(extractedDir, result, {
+ name, version, ecosystem,
+ registryMeta: meta,
+ npmRegistryMeta,
+ tier
+ });
+ if (llmResult) {
+ const llmMode = getLlmMode();
+ console.log(`[LLM] ${name}@${version}: verdict=${llmResult.verdict} confidence=${llmResult.confidence} mode=${llmMode}`);
+ stats.llmAnalyzed = (stats.llmAnalyzed || 0) + 1;
+
+ if (llmMode === 'active' && llmResult.verdict === 'benign' && llmResult.confidence > 0.85) {
+ console.log(`[LLM] SUPPRESS: ${name}@${version} cleared (benign, confidence=${llmResult.confidence})`);
+ stats.llmSuppressed = (stats.llmSuppressed || 0) + 1;
+ stats.scanned++;
+ stats.totalTimeMs += Date.now() - startTime;
+ updateScanStats('llm_benign');
+ recordTrainingSample(result, { name, version, ecosystem, label: 'llm_benign', tier, registryMeta: meta, unpackedSize: meta.unpackedSize, npmRegistryMeta, fileCountTotal, hasTests });
+ return { sandboxResult, llmResult, tier, staticScore: result.summary.riskScore || 0 };
+ }
+ }
+ }
+ } catch (err) {
+ console.error(`[LLM] Error for ${name}@${version}: ${err.message}`);
+ }
+ }
+
+ await trySendWebhook(name, version, ecosystem, adjustedResult, sandboxResult, mlResult, llmResult);
  const staticScore = result.summary.riskScore || 0;
  const hasHCThreats = hasHighConfidenceThreat(result);
  const isDormant = sandboxResult && sandboxResult.score === 0 && (result.summary.riskScore || 0) >= 20;
- return { sandboxResult, staticClean: false, tier, staticScore, hasHCThreats, isDormant };
+ return { sandboxResult, llmResult, staticClean: false, tier, staticScore, hasHCThreats, isDormant };
  }
  }
  } catch (err) {
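The suppression rule above is deliberately narrow: only an active-mode, high-confidence benign verdict short-circuits the webhook; shadow mode never changes control flow, and errors fall through to the normal path. Restated as a standalone predicate (a sketch; the 0.85 threshold comes straight from the hunk):

```js
// True only when an LLM verdict may suppress an alert (per the hunk above).
function llmMaySuppress(llmResult, mode) {
  return mode === 'active'
    && !!llmResult
    && llmResult.verdict === 'benign'
    && llmResult.confidence > 0.85;
}

console.log(llmMaySuppress({ verdict: 'benign', confidence: 0.9 }, 'shadow')); // false
console.log(llmMaySuppress({ verdict: 'benign', confidence: 0.9 }, 'active')); // true
console.log(llmMaySuppress({ verdict: 'benign', confidence: 0.7 }, 'active')); // false
```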
@@ -680,6 +680,8 @@ function loadDailyStats(stats, dailyAlerts) {
  }
  stats.totalTimeMs = data.totalTimeMs || 0;
  stats.mlFiltered = data.mlFiltered || 0;
+ stats.llmAnalyzed = data.llmAnalyzed || 0;
+ stats.llmSuppressed = data.llmSuppressed || 0;
  if (Array.isArray(data.dailyAlerts)) {
  dailyAlerts.length = 0;
  dailyAlerts.push(...data.dailyAlerts);
@@ -704,6 +706,8 @@ function saveDailyStats(stats, dailyAlerts) {
  errorsByType: { ...stats.errorsByType },
  totalTimeMs: stats.totalTimeMs,
  mlFiltered: stats.mlFiltered,
+ llmAnalyzed: stats.llmAnalyzed || 0,
+ llmSuppressed: stats.llmSuppressed || 0,
  dailyAlerts: dailyAlerts.slice()
  };
  atomicWriteFileSync(DAILY_STATS_FILE, JSON.stringify(data, null, 2));
@@ -355,7 +355,7 @@ function computeAlertPriority(result, sandboxResult) {
  return { level: 'P3', reason: 'default' };
  }

- function buildAlertData(name, version, ecosystem, result, sandboxResult) {
+ function buildAlertData(name, version, ecosystem, result, sandboxResult, llmResult) {
  const priority = computeAlertPriority(result, sandboxResult);
  const webhookData = {
  target: `${ecosystem}/${name}@${version}`,
@@ -375,10 +375,20 @@ function buildAlertData(name, version, ecosystem, result, sandboxResult) {
  severity: sandboxResult.severity
  };
  }
+ if (llmResult && llmResult.verdict) {
+ webhookData.llm = {
+ verdict: llmResult.verdict,
+ confidence: llmResult.confidence,
+ reasoning: (llmResult.reasoning || '').slice(0, 200),
+ attack_type: llmResult.attack_type || null,
+ iocs_found: (llmResult.iocs_found || []).slice(0, 5),
+ mode: llmResult.mode || 'shadow'
+ };
+ }
  return webhookData;
  }

- async function trySendWebhook(name, version, ecosystem, result, sandboxResult, mlResult) {
+ async function trySendWebhook(name, version, ecosystem, result, sandboxResult, mlResult, llmResult) {
  if (!shouldSendWebhook(result, sandboxResult, mlResult)) {
  if (mlResult && mlResult.prediction !== 'clean' && mlResult.probability >= 0.90
  && !hasHighOrCritical(result)) {
@@ -443,13 +453,13 @@ async function trySendWebhook(name, version, ecosystem, result, sandboxResult, m
  // Scope grouping: buffer scoped npm packages for grouped webhook
  const scope = extractScope(name);
  if (scope && ecosystem === 'npm') {
- bufferScopedWebhook(scope, name, version, ecosystem, result, sandboxResult);
+ bufferScopedWebhook(scope, name, version, ecosystem, result, sandboxResult, llmResult);
  return;
  }

  // Non-scoped: send immediately (existing behavior)
  const url = getWebhookUrl();
- const webhookData = buildAlertData(name, version, ecosystem, result, sandboxResult);
+ const webhookData = buildAlertData(name, version, ecosystem, result, sandboxResult, llmResult);
  try {
  await sendWebhook(url, webhookData);
  console.log(`[MONITOR] Webhook sent for ${name}@${version}`);
@@ -473,12 +483,13 @@ function extractScope(name) {
  * Multiple packages from the same scope published within SCOPE_GROUP_WINDOW_MS
  * are grouped into a single webhook (monorepo noise reduction).
  */
- function bufferScopedWebhook(scope, name, version, ecosystem, result, sandboxResult) {
+ function bufferScopedWebhook(scope, name, version, ecosystem, result, sandboxResult, llmResult) {
  const entry = {
  name, version,
  score: (result && result.summary) ? (result.summary.riskScore || 0) : 0,
  threats: result.threats || [],
- sandboxResult
+ sandboxResult,
+ llmResult: llmResult || null
  };

  const existing = pendingGrouped.get(scope);
@@ -521,7 +532,7 @@ async function flushScopeGroup(scope) {
  threats: pkg.threats,
  summary: { riskScore: pkg.score, critical, high, medium, low, total: pkg.threats.length }
  };
- const webhookData = buildAlertData(pkg.name, pkg.version, group.ecosystem, result, pkg.sandboxResult);
+ const webhookData = buildAlertData(pkg.name, pkg.version, group.ecosystem, result, pkg.sandboxResult, pkg.llmResult);
  try {
  await sendWebhook(url, webhookData);
  console.log(`[MONITOR] Webhook sent for ${pkg.name}@${pkg.version} (scope group flush, single)`);
@@ -834,6 +845,23 @@ function buildDailyReportEmbed(stats, dailyAlerts) {
  mlText = 'No model loaded';
  }

+ // --- LLM Detective stats ---
+ let llmText;
+ try {
+ const { isLlmEnabled, getStats: getLlmStats } = require('../ml/llm-detective.js');
+ if (isLlmEnabled()) {
+ const ls = getLlmStats();
+ llmText = `${ls.analyzed} analyzed (${ls.malicious} mal, ${ls.benign} ben, ${ls.uncertain} unc, ${ls.errors} err)`;
+ if ((stats.llmSuppressed || 0) > 0) {
+ llmText += ` | ${stats.llmSuppressed} suppressed`;
+ }
+ } else {
+ llmText = 'Disabled';
+ }
+ } catch {
+ llmText = 'Not loaded';
+ }
+
  // --- System health ---
  const uptimeSec = Math.floor(process.uptime());
  const uptimeH = Math.floor(uptimeSec / 3600);
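With the counters above, the field renders as a compact one-liner, e.g. (numbers illustrative):

```js
// getStats() → { analyzed: 12, malicious: 1, benign: 9, uncertain: 2, errors: 0, ... }
// with stats.llmSuppressed = 3 would render as:
// "12 analyzed (1 mal, 9 ben, 2 unc, 0 err) | 3 suppressed"
```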
@@ -863,6 +891,7 @@ function buildDailyReportEmbed(stats, dailyAlerts) {
  { name: 'Timeouts', value: timeoutText, inline: true },
  { name: 'vs Yesterday', value: trendsText, inline: false },
  { name: 'ML', value: mlText, inline: true },
+ { name: 'LLM Detective', value: llmText, inline: true },
  { name: 'Top Suspects', value: top3Text, inline: false },
  { name: 'System', value: healthText, inline: false }
  ],
@@ -907,6 +936,8 @@ async function sendDailyReport(stats, dailyAlerts, recentlyScanned, downloadsCac
  avgScanTimeMs: stats.scanned > 0 ? Math.round(stats.totalTimeMs / stats.scanned) : 0,
  suspectByTier: { ...stats.suspectByTier },
  mlFiltered: stats.mlFiltered || 0,
+ llmAnalyzed: stats.llmAnalyzed || 0,
+ llmSuppressed: stats.llmSuppressed || 0,
  changesStreamPackages: stats.changesStreamPackages || 0,
  topSuspects: dailyAlerts.slice().sort((a, b) => b.findingsCount - a.findingsCount).slice(0, 10)
  });
@@ -942,6 +973,10 @@ async function sendDailyReport(stats, dailyAlerts, recentlyScanned, downloadsCac
  stats.errorsByType.other = 0;
  stats.totalTimeMs = 0;
  stats.mlFiltered = 0;
+ stats.llmAnalyzed = 0;
+ stats.llmSuppressed = 0;
+ // Reset LLM detective internal stats
+ try { require('../ml/llm-detective.js').resetStats(); } catch {}
  stats.changesStreamPackages = 0;
  stats.rssFallbackCount = 0;
  dailyAlerts.length = 0;