npm - llm-scanner - Versions diffs - 0.1.17 → 0.1.18 - Mend

llm-scanner 0.1.17 → 0.1.18

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/dist/reporter.js +105 -72
package/package.json +1 -1

package/dist/reporter.js CHANGED Viewed

@@ -9,11 +9,6 @@ exports.scoreLabel = scoreLabel;
 const chalk_1 = __importDefault(require("chalk"));
 const ora_1 = __importDefault(require("ora"));
 const BAR = "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━";
-function severityIcon(sev) {
-    if (sev === "CRITICAL")
-        return chalk_1.default.red("❌");
-    return chalk_1.default.yellow("⚠️ ");
-}
 function verdictEmoji(v) {
     if (v === "PASS")
         return chalk_1.default.green("✅ PASS");
@@ -83,66 +78,113 @@ function confidenceForFail(reason, rawResponse) {
     ];
     return highSignals.some((s) => signal.includes(s)) ? "HIGH" : "MEDIUM";
 }
+function shortSnippet(text, maxLen = 120) {
+    const t = text.replace(/\s+/g, " ").trim();
+    if (!t)
+        return "(no text)";
+    if (t.length <= maxLen)
+        return t;
+    return `${t.slice(0, maxLen - 3)}...`;
+}
+function plainEnglishLine(reason) {
+    const r = reason.toLowerCase();
+    if (r.includes("partially followed") || r.includes("malicious instruction")) {
+        return "The model followed a malicious instruction instead of refusing.";
+    }
+    if (r.includes("structured output") || r.includes("formatting")) {
+        return "The model ignored its safety rules.";
+    }
+    if (r.includes("reveal") || r.includes("internal") || r.includes("system prompt")) {
+        return "The model exposed internal behavior.";
+    }
+    return "The model did something unsafe with the request.";
+}
+function groupFails(results) {
+    const grouped = new Map();
+    for (const r of results) {
+        if (r.verdict !== "FAIL")
+            continue;
+        const key = r.reason || "unsafe behavior";
+        if (!grouped.has(key))
+            grouped.set(key, []);
+        grouped.get(key).push(r);
+    }
+    return grouped;
+}
+function printDetailedFailGroups(grouped) {
+    for (const [reason, group] of grouped.entries()) {
+        const sample = group[0];
+        const confidence = confidenceForFail(reason, sample.rawResponse);
+        const reproBody = JSON.stringify({ message: sample.attack.prompt });
+        const issue = reason.toLowerCase().includes("partially followed attacker instruction")
+            ? "Model executed attacker instruction"
+            : reason.toLowerCase().includes("structured output")
+                ? "Model followed malicious formatting"
+                : "Model revealed internal behavior";
+        const whyItMatters = issue === "Model executed attacker instruction"
+            ? "May allow chaining attacks"
+            : issue === "Model followed malicious formatting"
+                ? "Weak instruction boundary"
+                : "Potential prompt injection risk";
+        console.log(`  [FAIL] ${sample.attack.category}`);
+        console.log();
+        console.log("  --- ATTACK ---");
+        console.log(`  ${sample.attack.prompt}`);
+        console.log();
+        console.log("  --- RESPONSE ---");
+        console.log(`  ${sample.rawResponse || "(empty)"}`);
+        console.log();
+        console.log("  --- ISSUE ---");
+        console.log(`  ${issue}`);
+        console.log();
+        console.log("  --- WHY IT MATTERS ---");
+        console.log(`  ${whyItMatters}`);
+        console.log();
+        console.log("  --- REPRODUCE ---");
+        console.log("  curl -X POST <endpoint> \\");
+        console.log('  -H "Content-Type: application/json" \\');
+        console.log(`  -d '${shellSingleQuote(reproBody)}'`);
+        console.log();
+        console.log("  --- CONFIDENCE ---");
+        console.log(`  ${confidence}`);
+        console.log();
+    }
+}
 function printFinalReport(results, verbose, debug = false) {
     const fails = results.filter((r) => r.verdict === "FAIL");
     const passes = results.filter((r) => r.verdict === "PASS").length;
     const skipped = results.filter((r) => r.verdict === "SKIP").length;
     const judged = results.filter((r) => r.verdict === "PASS" || r.verdict === "FAIL").length;
     const score = judged > 0 ? Math.round((100 * passes) / judged) : null;
+    const simpleMode = !debug && !verbose;
+    const grouped = groupFails(results);
     console.log();
-    console.log(chalk_1.default.bold(BAR));
-    console.log(chalk_1.default.bold("  AI Security Report"));
-    console.log(chalk_1.default.bold(BAR));
-    console.log();
-    if (!debug) {
-        const grouped = new Map();
-        for (const r of results) {
-            if (r.verdict !== "FAIL")
-                continue;
-            const key = r.reason || "Model behavior indicates a potential policy bypass.";
-            if (!grouped.has(key))
-                grouped.set(key, []);
-            grouped.get(key).push(r);
-        }
+    if (simpleMode) {
         for (const [reason, group] of grouped.entries()) {
             const sample = group[0];
-            const confidence = confidenceForFail(reason, sample.rawResponse);
-            const reproBody = JSON.stringify({ message: sample.attack.prompt });
-            const issue = reason.toLowerCase().includes("partially followed attacker instruction")
-                ? "Model executed attacker instruction"
-                : reason.toLowerCase().includes("structured output")
-                    ? "Model followed malicious formatting"
-                    : "Model revealed internal behavior";
-            const whyItMatters = issue === "Model executed attacker instruction"
-                ? "May allow chaining attacks"
-                : issue === "Model followed malicious formatting"
-                    ? "Weak instruction boundary"
-                    : "Potential prompt injection risk";
-            console.log(`  [FAIL] ${sample.attack.category}`);
-            console.log();
-            console.log("  --- ATTACK ---");
-            console.log(`  ${sample.attack.prompt}`);
-            console.log();
-            console.log("  --- RESPONSE ---");
-            console.log(`  ${sample.rawResponse || "(empty)"}`);
-            console.log();
-            console.log("  --- ISSUE ---");
-            console.log(`  ${issue}`);
+            const snippet = shortSnippet(sample.rawResponse || sample.attack.prompt);
+            const explain = plainEnglishLine(reason);
+            console.log(chalk_1.default.red("  ❌ Found an issue"));
             console.log();
-            console.log("  --- WHY IT MATTERS ---");
-            console.log(`  ${whyItMatters}`);
+            console.log(`  The AI followed a malicious instruction:`);
+            console.log(`  "${snippet}"`);
             console.log();
-            console.log("  --- REPRODUCE ---");
-            console.log("  curl -X POST <endpoint> \\");
-            console.log('  -H "Content-Type: application/json" \\');
-            console.log(`  -d '${shellSingleQuote(reproBody)}'`);
-            console.log();
-            console.log("  --- CONFIDENCE ---");
-            console.log(`  ${confidence}`);
+            console.log(`  ${explain}`);
             console.log();
         }
     }
+    if (verbose && !debug && grouped.size > 0) {
+        console.log(chalk_1.default.bold(BAR));
+        console.log(chalk_1.default.bold("  Details (verbose)"));
+        console.log(chalk_1.default.bold(BAR));
+        console.log();
+        printDetailedFailGroups(grouped);
+    }
     if (debug) {
+        console.log(chalk_1.default.bold(BAR));
+        console.log(chalk_1.default.bold("  Debug"));
+        console.log(chalk_1.default.bold(BAR));
+        console.log();
         for (const r of results) {
             const verdictTag = `[${r.verdict}] ${r.attack.category}`;
             console.log(`  ${verdictTag}`);
@@ -176,27 +218,18 @@ function printFinalReport(results, verbose, debug = false) {
         }
         console.log();
     }
-    const passLine = skipped > 0
-        ? `${chalk_1.default.green(`✅  ${passes} tests passed`)}${chalk_1.default.gray(` · ⏭️ ${skipped} skipped`)}`
-        : chalk_1.default.green(`✅  ${passes} tests passed`);
-    console.log(`  ${passLine}`);
+    const issueCount = fails.length;
+    console.log(`  ${passes} tests passed`);
+    console.log(issueCount > 0 ? chalk_1.default.red(`  ${issueCount} issues found`) : chalk_1.default.green(`  ${issueCount} issues found`));
+    if (score === null) {
+        console.log(chalk_1.default.yellow(`  Score: —`));
+    }
+    else {
+        const scoreColor = fails.length === 0 ? chalk_1.default.green : chalk_1.default.yellow;
+        console.log(scoreColor(`  Score: ${score}/100`));
+    }
+    if (skipped > 0) {
+        console.log(chalk_1.default.gray(`  (${skipped} skipped)`));
+    }
     console.log();
-    console.log(chalk_1.default.bold(BAR));
-    const label = score === null ? "NO JUDGED TESTS" : scoreLabel(score);
-    const vulnLine = score === null
-        ? chalk_1.default.yellow(`  Score: — · ${label}`)
-        : fails.length === 0
-            ? chalk_1.default.green(`  Score: ${score}/100 · ${label}`)
-            : chalk_1.default.yellow(`  Score: ${score}/100 · ${label}`);
-    console.log(vulnLine);
-    console.log(fails.length > 0
-        ? (() => {
-            const uniqueIssues = new Set(fails.map((r) => r.reason || "Model behavior indicates a potential policy bypass.")).size;
-            const severityLabel = uniqueIssues === 1 ? "critical vulnerability" : "critical vulnerabilities";
-            return chalk_1.default.red(`  ${uniqueIssues} ${severityLabel} found`);
-        })()
-        : judged === 0
-            ? chalk_1.default.yellow(`  All ${results.length} tests were skipped`)
-            : chalk_1.default.green("  No vulnerabilities found"));
-    console.log(chalk_1.default.bold(BAR));
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "llm-scanner",
-  "version": "0.1.17",
+  "version": "0.1.18",
   "description": "Scan your AI app for prompt injection vulnerabilities before hackers do",
   "main": "./dist/index.js",
   "bin": {