npm - jaku.sh - Versions diffs - 1.0.2 → 1.2.0 - Mend

jaku.sh 1.0.2 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

package/README.md +161 -18
package/action.yml +32 -1
package/package.json +2 -1
package/src/agents/ai-agent.js +47 -1
package/src/agents/api-agent.js +9 -0
package/src/agents/logic-agent.js +158 -90
package/src/agents/orchestrator.js +56 -1
package/src/agents/security-agent.js +86 -54
package/src/cli.js +68 -6
package/src/core/ai/ai-endpoint-detector.js +28 -4
package/src/core/ai/prompt-injector.js +34 -0
package/src/core/api/api-key-auditor.js +1 -1
package/src/core/api/cors-ws-tester.js +1 -1
package/src/core/crawler.js +22 -1
package/src/core/llm/augmentations.js +210 -0
package/src/core/llm/llm-client.js +184 -0
package/src/core/llm/providers/anthropic-provider.js +46 -0
package/src/core/llm/providers/base-provider.js +44 -0
package/src/core/llm/providers/null-provider.js +21 -0
package/src/core/llm/providers/openai-provider.js +47 -0
package/src/core/logic/access-boundary-tester.js +1 -1
package/src/core/logic/business-rule-inferrer.js +50 -1
package/src/core/security/sqli-prober.js +312 -43
package/src/core/security/xss-scanner.js +26 -2
package/src/reporting/report-generator.js +96 -9
package/src/reporting/sarif-generator.js +81 -5
package/src/utils/config.js +196 -2
package/src/utils/finding.js +3 -0
package/src/utils/logger.js +33 -0
package/src/utils/param-discovery.js +93 -0
package/src/utils/safety.js +44 -0
package/src/utils/version.js +30 -0

package/src/cli.js CHANGED Viewed

@@ -14,11 +14,15 @@ import { APIAgent } from './agents/api-agent.js';
 import { ReportGenerator } from './reporting/report-generator.js';
 import { ComplianceReporter } from './reporting/compliance-reporter.js';
 import { AuthManager } from './core/auth-manager.js';
+import { getVersion } from './utils/version.js';
+import { LLMClient } from './core/llm/llm-client.js';
+const VERSION = getVersion();
 const BANNER = `
 ${chalk.hex('#00ff88').bold('  ╦╔═╗╦╔═╦ ╦')}
 ${chalk.hex('#00ff88').bold('  ║╠═╣╠╩╗║ ║')}  ${chalk.dim('呪 Autonomous Security & Quality Intelligence')}
-${chalk.hex('#00ff88').bold(' ╚╝╩ ╩╩ ╩╚═╝')}  ${chalk.dim('v1.0.2 · Multi-Agent')}
+${chalk.hex('#00ff88').bold(' ╚╝╩ ╩╩ ╩╚═╝')}  ${chalk.dim(`v${VERSION} · Multi-Agent`)}
 `;
 const program = new Command();
@@ -26,7 +30,7 @@ const program = new Command();
 program
     .name('jaku')
     .description('JAKU (呪) — Autonomous QA & Security scanning agent for vibe-coded apps')
-    .version('1.0.2');
+    .version(VERSION);
 // ═══════════════════════════════════════════════
 // Multi-Agent Scan Runner
@@ -91,10 +95,25 @@ async function runScan(url, options, modulesToRun) {
     const runAPI = modulesToRun.includes('api');
     const moduleLabel = modulesToRun.join(' + ').toUpperCase();
+    const safetyLabels = {
+        passive: 'Passive (recon + static analysis only)',
+        'safe-active': 'Safe-Active (non-destructive probing)',
+        aggressive: 'Aggressive (includes destructive tests)',
+    };
     console.log(chalk.hex('#00ff88')('  Target:  ') + chalk.white(url));
     console.log(chalk.hex('#00ff88')('  Modules: ') + chalk.white(moduleLabel));
     console.log(chalk.hex('#00ff88')('  Mode:    ') + chalk.white('Multi-Agent Orchestration'));
+    console.log(chalk.hex('#00ff88')('  Safety:  ') + chalk.white(safetyLabels[config.safety_mode] || config.safety_mode));
     console.log(chalk.hex('#00ff88')('  Severity:') + chalk.white(` ≥ ${config.severity_threshold}`));
+    // Single startup line stating whether LLM augmentation is active (no secrets).
+    const llmStatus = LLMClient.describe(config);
+    const llmActive = llmStatus.startsWith('enabled');
+    console.log(
+        chalk.hex('#00ff88')('  LLM:     ') +
+        (llmActive ? chalk.cyan(llmStatus) : chalk.dim(llmStatus))
+    );
     console.log();
     // ═══════════════════════════════════════
@@ -213,7 +232,7 @@ async function runScan(url, options, modulesToRun) {
     try {
         const duration = Date.now() - startTime;
-        const reporter = new ReportGenerator(config, logger);
+        const reporter = new ReportGenerator(config, logger, orchestrator.llmClient);
         const testSummary = qaAgent?.testSummary || {};
@@ -224,6 +243,7 @@ async function runScan(url, options, modulesToRun) {
             testSummary: { ...testSummary, duration },
             surfaceInventory: results.surfaceInventory,
             outputDir: config.output_dir,
+            modules: modulesToRun,
         });
         // Generate compliance report if requested
@@ -234,7 +254,7 @@ async function runScan(url, options, modulesToRun) {
                 options.compliance,
                 results.findings,
                 reportDir,
-                { target: url, version: '1.0.2', scannedAt: new Date().toISOString() }
+                { target: url, version: VERSION, scannedAt: new Date().toISOString() }
             );
         }
@@ -321,12 +341,12 @@ async function runScan(url, options, modulesToRun) {
 program
     .command('scan')
-    .description('Run JAKU scan with selected modules (default: qa + security)')
+    .description('Run JAKU scan with selected modules (default: qa + security + ai + logic + api)')
     .argument('<url>', 'Target URL to scan')
     .option('-c, --config <path>', 'Path to jaku.config.json')
     .option('-o, --output <dir>', 'Output directory for reports')
     .option('-m, --modules <list>', 'Comma-separated modules to run (qa,security,ai,logic,api)', 'qa,security,ai,logic,api')
-    .option('-s, --severity <level>', 'Minimum severity threshold (critical|high|medium|low)', 'low')
+    .option('-s, --severity <level>', 'Minimum severity threshold (critical|high|medium|low|info)', 'low')
     .option('--profile <type>', 'Scan profile: quick|deep|ci (overrides crawl settings)')
     .option('--compliance <framework>', 'Generate compliance report (owasp)')
     .option('--json', 'Output JSON report')
@@ -336,6 +356,13 @@ program
     .option('--halt-on-critical', 'Abort scan immediately on critical finding')
     .option('--webhook <url>', 'POST findings to webhook URL on completion')
     .option('--prod-safe', 'Confirm authorization to scan production targets')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('--auth-strategy <type>', 'Auth strategy: auto|form|api|cookie (default: auto)')
     .option('--login-url <url>', 'Login page URL for form-based auth')
     .option('--username <user>', 'Username/email for authenticated scanning')
@@ -355,6 +382,13 @@ program
     .option('-s, --severity <level>', 'Severity threshold', 'low')
     .option('--max-pages <n>', 'Maximum pages to crawl', '50')
     .option('--max-depth <n>', 'Maximum crawl depth', '5')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('-v, --verbose', 'Enable verbose logging')
     .action(async (url, options) => {
         await runScan(url, options, ['qa']);
@@ -369,6 +403,13 @@ program
     .option('-s, --severity <level>', 'Severity threshold', 'low')
     .option('--max-pages <n>', 'Maximum pages to crawl', '50')
     .option('--max-depth <n>', 'Maximum crawl depth', '5')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('-v, --verbose', 'Enable verbose logging')
     .action(async (url, options) => {
         await runScan(url, options, ['security']);
@@ -383,6 +424,13 @@ program
     .option('-s, --severity <level>', 'Severity threshold', 'low')
     .option('--max-pages <n>', 'Maximum pages to crawl', '50')
     .option('--max-depth <n>', 'Maximum crawl depth', '5')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('-v, --verbose', 'Enable verbose logging')
     .action(async (url, options) => {
         await runScan(url, options, ['ai']);
@@ -397,6 +445,13 @@ program
     .option('-s, --severity <level>', 'Severity threshold', 'low')
     .option('--max-pages <n>', 'Maximum pages to crawl', '50')
     .option('--max-depth <n>', 'Maximum crawl depth', '5')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('-v, --verbose', 'Enable verbose logging')
     .action(async (url, options) => {
         await runScan(url, options, ['logic']);
@@ -411,6 +466,13 @@ program
     .option('-s, --severity <level>', 'Severity threshold', 'low')
     .option('--max-pages <n>', 'Maximum pages to crawl', '50')
     .option('--max-depth <n>', 'Maximum crawl depth', '5')
+    .option('--passive', 'Safety mode: recon + static analysis only (no attack probing)')
+    .option('--safe-active', 'Safety mode: non-destructive active probing (default)')
+    .option('--aggressive', 'Safety mode: enable destructive/state-changing tests')
+    .option('--llm', 'Enable optional LLM augmentation (key from env; default off)')
+    .option('--llm-provider <name>', 'LLM provider: openai|anthropic')
+    .option('--llm-model <id>', 'LLM model id (provider default if omitted)')
+    .option('--llm-consent', 'Consent to send minimal finding/target data to the LLM provider')
     .option('-v, --verbose', 'Enable verbose logging')
     .action(async (url, options) => {
         await runScan(url, options, ['api']);

package/src/core/ai/ai-endpoint-detector.js CHANGED Viewed

@@ -42,19 +42,43 @@ export class AIEndpointDetector {
      */
     async detect(surfaceInventory) {
         const aiSurfaces = [];
+        const seenApiUrls = new Set();
-        // 1. Check discovered API endpoints
-        const apis = surfaceInventory.apis || [];
+        // 1. Check discovered API endpoints.
+        //    NOTE: the crawler emits `apiEndpoints` (not `apis`) — read the
+        //    correct field so API-discovered surfaces are actually considered.
+        const apis = surfaceInventory.apiEndpoints || surfaceInventory.apis || [];
         for (const api of apis) {
             const url = api.url || api;
-            if (this._matchesAIPattern(url)) {
+            if (!url || seenApiUrls.has(url)) continue;
+            const method = (api.method || 'POST').toUpperCase();
+            const contentType = api.contentType || '';
+            const matchesPattern = this._matchesAIPattern(url);
+            // Non-GET or JSON endpoints are plausible LLM surfaces even when the
+            // URL itself doesn't match a known AI path — they get probed below.
+            const isJsonOrMutating =
+                contentType.includes('application/json') ||
+                (method !== 'GET' && method !== 'OPTIONS' && method !== 'HEAD');
+            if (matchesPattern) {
+                seenApiUrls.add(url);
                 aiSurfaces.push({
                     type: 'api',
                     url,
-                    method: api.method || 'POST',
+                    method,
                     confidence: 'high',
                     reason: 'URL pattern matches known AI endpoint',
                 });
+            } else if (isJsonOrMutating) {
+                seenApiUrls.add(url);
+                aiSurfaces.push({
+                    type: 'api',
+                    url,
+                    method,
+                    confidence: 'low',
+                    reason: 'Non-GET/JSON API endpoint — probing for LLM behavior',
+                });
             }
         }

package/src/core/ai/prompt-injector.js CHANGED Viewed

@@ -214,6 +214,40 @@ export class PromptInjector {
         return findings;
     }
+    /**
+     * Fire a set of LLM-generated payloads at AI surfaces (Phase 1).
+     * Each finding is tagged source:'llm'. Destructive generated payloads are
+     * only fired when allowDestructive is true (caller enforces safety tier).
+     *
+     * Surfaces whose confidence is 'low' are skipped, as are surfaces for which
+     * no baseline response could be obtained. A payload that throws is logged at
+     * debug level and does not stop the remaining payloads.
+     *
+     * @param {Array<object>} aiSurfaces - Detected AI surfaces; only `confidence` is read here, the rest is passed to the helpers.
+     * @param {Array<object>} generatedPayloads - Payload objects; `destructive` and `name` are read here.
+     * @param {object} [options]
+     * @param {boolean} [options.allowDestructive=false] - Fire payloads flagged `destructive`.
+     * @returns {Promise<Array<object>>} Findings produced by the generated payloads (empty if none, or if no payloads were given).
+     */
+    async injectGenerated(aiSurfaces, generatedPayloads, { allowDestructive = false } = {}) {
+        const findings = [];
+        if (!Array.isArray(generatedPayloads) || generatedPayloads.length === 0) return findings; // nothing to fire
+        for (const surface of aiSurfaces) {
+            if (surface.confidence === 'low') continue; // low-confidence surfaces are not probed with generated payloads
+            const baseline = await this._getBaseline(surface);
+            if (!baseline) continue; // no baseline to compare against, so skip this surface
+            for (const payload of generatedPayloads) {
+                if (payload.destructive && !allowDestructive) continue; // safety gate
+                try {
+                    const result = await this._firePayload(surface, payload, baseline);
+                    if (result) { // a falsy result is treated as "no finding"
+                        result.source = 'llm';
+                        result.title = `LLM-Generated ${result.title}`; // prefix distinguishes these from built-in payload findings
+                        findings.push(result);
+                    }
+                } catch (err) {
+                    this.logger?.debug?.(`Generated payload "${payload.name}" failed: ${err.message}`);
+                }
+            }
+        }
+        this.logger?.info?.(`Prompt Injector: ${findings.length} findings from ${generatedPayloads.length} LLM-generated payloads`);
+        return findings;
+    }
     /**
      * Get a baseline response for comparison.
      */

package/src/core/api/api-key-auditor.js CHANGED Viewed

@@ -63,7 +63,7 @@ export class APIKeyAuditor {
     _checkKeysInURLs(surfaceInventory) {
         const findings = [];
         const pages = surfaceInventory.pages || [];
-        const apis = surfaceInventory.apis || [];
+        const apis = surfaceInventory.apiEndpoints || surfaceInventory.apis || [];
         for (const entry of [...pages, ...apis]) {
             const url = entry.url || entry;

package/src/core/api/cors-ws-tester.js CHANGED Viewed

@@ -54,7 +54,7 @@ export class CORSWSTester {
         const testUrls = [baseUrl + '/'];
         // Add API endpoints
-        const apis = surfaceInventory.apis || [];
+        const apis = surfaceInventory.apiEndpoints || surfaceInventory.apis || [];
         testUrls.push(...apis.slice(0, 5).map(a => a.url || a));
         // Add common API paths

package/src/core/crawler.js CHANGED Viewed

@@ -45,7 +45,28 @@ export class Crawler {
      */
     async crawl(targetUrl, authState = null, seedLinks = []) {
         this.baseUrl = new URL(targetUrl);
-        const browser = await chromium.launch({ headless: true });
+        let browser;
+        try {
+            browser = await chromium.launch({ headless: true });
+        } catch (err) {
+            if (err.message.includes("Executable doesn't exist") || err.message.includes('playwright install')) {
+                this.logger?.warn?.('Chromium not found — attempting automatic install...');
+                const { execSync } = await import('child_process');
+                try {
+                    execSync('npx playwright install chromium', { stdio: 'inherit', timeout: 120000 });
+                    browser = await chromium.launch({ headless: true });
+                } catch {
+                    throw new Error(
+                        'Playwright Chromium is not installed. Run:\n\n' +
+                        '    npx playwright install chromium\n\n' +
+                        'Then re-run your jaku command.'
+                    );
+                }
+            } else {
+                throw err;
+            }
+        }
         const contextOptions = {
             viewport: { width: 1440, height: 900 },

package/src/core/llm/augmentations.js ADDED Viewed

@@ -0,0 +1,210 @@
+/**
+ * LLM augmentations — task-specific helpers built on top of LLMClient.
+ *
+ * Every function here is STRICTLY ADDITIVE: it returns null on any failure (no
+ * client, disabled, budget exhausted, parse error) so callers fall back to their
+ * deterministic behavior. Each function applies DATA MINIMIZATION — it sends the
+ * smallest useful slice of data for its task, never raw target dumps or secrets.
+ */
+const SYSTEM_BASE =
+    'You are a security engineering assistant embedded in the JAKU scanner. ' +
+    'Be precise, terse, and factual. Never fabricate findings.'; // Shared system prompt: passed as `system` to llmClient.ask() by each helper below.
+/**
+ * Extract the first JSON value (object or array) from a model response.
+ *
+ * Strategy: remove Markdown code-fence markers (with an optional `json` tag),
+ * try to parse the whole remaining string, and otherwise parse the span from
+ * the first `[` or `{` up to the LAST closing bracket of that same kind.
+ *
+ * NOTE(review): the fallback commits to whichever bracket appears first, so
+ * leading prose such as `[1] {"a":1}` parses as `[1]`, not the object.
+ *
+ * @param {string} text - Raw model output.
+ * @returns {*} The parsed JSON value, or null when text is empty, not a string,
+ *   or contains nothing parseable.
+ */
+function parseJsonLoose(text) {
+    if (!text || typeof text !== 'string') return null;
+    // Strip code fences if present.
+    const cleaned = text.replace(/```(?:json)?/gi, '').trim();
+    try {
+        return JSON.parse(cleaned);
+    } catch {
+        /* fall through to bracket scan */
+    }
+    const start = cleaned.search(/[[{]/);
+    if (start === -1) return null; // no object or array opener anywhere
+    const open = cleaned[start];
+    const close = open === '{' ? '}' : ']';
+    const end = cleaned.lastIndexOf(close); // last closer, so nested values stay inside the slice
+    if (end <= start) return null; // no closer after the opener
+    try {
+        return JSON.parse(cleaned.slice(start, end + 1));
+    } catch {
+        return null;
+    }
+}
+function snippet(str, n = 400) { // Truncate a value to n characters (plus an ellipsis) before it is embedded in a prompt; non-strings are JSON-serialized first.
+    if (!str) return ''; // any falsy input (null, undefined, '', 0, false) becomes the empty string
+    const s = typeof str === 'string' ? str : JSON.stringify(str); // NOTE(review): JSON.stringify returns undefined for functions/symbols and throws on circular structures; neither case is handled here.
+    return s.length > n ? s.slice(0, n) + '…' : s; // the ellipsis is appended after the cut, so a truncated result is n + 1 characters long
+}
+/**
+ * Phase 0 — Framework-specific remediation for a single finding.
+ * Data sent: title, module, severity, description (no raw target bodies).
+ * The description is truncated to 600 characters before sending.
+ *
+ * NOTE(review): an exception thrown by llmClient.ask() would propagate from
+ * here; presumably ask() handles its own failures and returns a falsy value,
+ * as the file header implies — confirm in llm-client.js.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask({ system, prompt, maxTokens, temperature }).
+ * @param {object} finding - Finding whose title, module, severity and description are read.
+ * @returns {Promise<string|null>} Trimmed remediation text, or null when the
+ *   client is missing/disabled or the reply is empty.
+ */
+export async function enhanceRemediation(llmClient, finding) {
+    if (!llmClient?.isEnabled?.()) return null; // also covers a null/undefined client
+    const prompt =
+        `Provide concise, actionable remediation for this web/AI security finding. ` +
+        `Prefer concrete, framework-specific fixes (name the framework only if implied by the finding). ` +
+        `Plain text, max ~120 words, no preamble.\n\n` +
+        `Title: ${finding.title}\n` +
+        `Module: ${finding.module}\n` +
+        `Severity: ${finding.severity}\n` +
+        `Description: ${snippet(finding.description, 600)}`;
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 300, temperature: 0 });
+    const out = text && text.trim();
+    return out ? out : null; // empty or whitespace-only replies count as "no answer"
+}
+/**
+ * Phase 2 — Triage / false-positive assessment for a borderline finding.
+ * Data sent: title, severity, description, short evidence snippet.
+ * Returns { assessment, confidence, note, source } or null. Advisory only —
+ * never changes the deterministic severity.
+ *
+ * The reply is parsed leniently as JSON. `assessment` is passed through as a
+ * string without being checked against the three values the prompt asks for.
+ * `confidence` is clamped to [0, 1], or null when it is not a finite number
+ * after Number() coercion. `note` is cut to 200 characters.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask().
+ * @param {object} finding - Finding whose title, severity, description and evidence are read.
+ * @returns {Promise<{assessment: string, confidence: (number|null), note: string, source: string}|null>}
+ *   null when the client is missing/disabled, or the reply has no parseable
+ *   JSON or no truthy `assessment` field.
+ */
+export async function triageFinding(llmClient, finding) {
+    if (!llmClient?.isEnabled?.()) return null;
+    const prompt =
+        `Assess whether this scanner finding is likely a TRUE positive or a FALSE positive. ` +
+        `Consider typical false-positive patterns. Respond with ONLY JSON: ` +
+        `{"assessment":"true_positive|false_positive|uncertain","confidence":0.0-1.0,"note":"<=160 chars"}.\n\n` +
+        `Title: ${finding.title}\n` +
+        `Severity: ${finding.severity}\n` +
+        `Description: ${snippet(finding.description, 500)}\n` +
+        `Evidence: ${snippet(finding.evidence, 400)}`;
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 160, temperature: 0 });
+    const json = parseJsonLoose(text);
+    if (!json || !json.assessment) return null;
+    const confidence = Number(json.confidence);
+    return {
+        assessment: String(json.assessment),
+        confidence: Number.isFinite(confidence) ? Math.max(0, Math.min(1, confidence)) : null,
+        note: json.note ? String(json.note).slice(0, 200) : '',
+        source: 'llm', // marks the triage as LLM-derived
+    };
+}
+/**
+ * Phase 2 — Enrich an attack-chain correlation narrative.
+ * Data sent: correlation title + existing narrative (already derived, no raw data).
+ * The narrative is truncated to 600 characters before sending.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask().
+ * @param {object} correlation - Correlation whose title and narrative are read.
+ * @returns {Promise<string|null>} Trimmed replacement narrative, or null when
+ *   the client is missing/disabled or the reply is empty.
+ */
+export async function enrichCorrelation(llmClient, correlation) {
+    if (!llmClient?.isEnabled?.()) return null;
+    const prompt =
+        `Improve this attack-chain narrative for a security report. Keep it factual and concrete, ` +
+        `explain WHY the combination is exploitable and the realistic impact. Plain text, <=100 words.\n\n` +
+        `Title: ${correlation.title}\n` +
+        `Current narrative: ${snippet(correlation.narrative, 600)}`;
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 240, temperature: 0 });
+    const out = text && text.trim();
+    return out ? out : null; // empty or whitespace-only replies count as "no answer"
+}
+/**
+ * Phase 2 — Natural-language executive summary.
+ * Data sent: severity counts, target, finding TITLES only (no bodies/evidence).
+ * At most 12 finding titles and 6 attack-chain titles are included.
+ *
+ * NOTE(review): the first bullet is emitted on the same line as the
+ * "Top findings:" label because the list is joined with newlines only.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask().
+ * @param {object} input
+ * @param {string} input.target - Scan target, interpolated into the prompt as-is.
+ * @param {object} input.summary - Counts object; sent via JSON.stringify.
+ * @param {string[]} [input.topTitles=[]] - Finding titles.
+ * @param {string[]} [input.correlationTitles=[]] - Attack-chain titles; the line is omitted when empty.
+ * @returns {Promise<string|null>} Trimmed summary text, or null when the client
+ *   is missing/disabled or the reply is empty.
+ */
+export async function generateExecutiveSummary(llmClient, { target, summary, topTitles = [], correlationTitles = [] }) {
+    if (!llmClient?.isEnabled?.()) return null;
+    const prompt =
+        `Write a brief executive summary (<=150 words) of this security scan for a technical leader. ` +
+        `State overall risk posture and the most important themes. No markdown headings, plain paragraphs.\n\n` +
+        `Target: ${target}\n` +
+        `Counts: ${JSON.stringify(summary)}\n` +
+        `Top findings: ${topTitles.slice(0, 12).map(t => `- ${t}`).join('\n')}\n` +
+        (correlationTitles.length ? `Attack chains: ${correlationTitles.slice(0, 6).join('; ')}` : '');
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 320, temperature: 0 });
+    const out = text && text.trim();
+    return out ? out : null; // empty or whitespace-only replies count as "no answer"
+}
+/**
+ * Phase 1 — Generate context-aware prompt-injection/jailbreak payloads tailored
+ * to an extracted system prompt.
+ * Data sent: a snippet of the (already-leaked) system prompt + the target URL host.
+ * Returns array of { name, category, payload, marker, destructive } or null.
+ *
+ * Post-processing of the model reply: entries without a non-blank string
+ * `payload` are dropped, payloads are de-duplicated by their trimmed text,
+ * entries flagged destructive are dropped unless allowDestructive is set, and
+ * collection stops once `max` entries have been gathered.
+ *
+ * NOTE(review): the `max` check runs after each push, so a `max` of 0 or less
+ * still returns one entry.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask().
+ * @param {object} input
+ * @param {string} input.systemPrompt - Leaked system prompt; truncated to 800 characters before sending.
+ * @param {string} input.surfaceUrl - Surface URL; only its host is sent ('unknown' if it does not parse).
+ * @param {boolean} [input.allowDestructive=false] - Permit state-changing payloads.
+ * @param {number} [input.max=6] - Upper bound requested from the model and applied to the result.
+ * @returns {Promise<Array<object>|null>} Normalized payloads, or null when the
+ *   client is missing/disabled, the reply is not a JSON array, or nothing usable remains.
+ */
+export async function generateInjectionPayloads(llmClient, { systemPrompt, surfaceUrl, allowDestructive = false, max = 6 }) {
+    if (!llmClient?.isEnabled?.()) return null;
+    const prompt =
+        `An AI endpoint leaked (part of) its system prompt. Craft up to ${max} prompt-injection / jailbreak ` +
+        `test payloads tailored to bypass THIS system prompt's specific guardrails. ` +
+        `${allowDestructive
+            ? 'You MAY include payloads that attempt to trigger state-changing/tool actions.'
+            : 'Do NOT include payloads that attempt destructive or state-changing actions; detection-only.'} ` +
+        `Each payload must instruct the model to emit a unique uppercase canary marker so success is detectable. ` +
+        `Respond with ONLY a JSON array of objects: ` +
+        `{"name":"...","category":"role_override|instruction_override|jailbreak|delimiter_escape|encoding_bypass","payload":"...","marker":"CANARY_TOKEN","destructive":false}.\n\n` +
+        `Target host: ${(() => { try { return new URL(surfaceUrl).host; } catch { return 'unknown'; } })()}\n` +
+        `Leaked system prompt (snippet): ${snippet(systemPrompt, 800)}`;
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 900, temperature: 0 });
+    const json = parseJsonLoose(text);
+    if (!Array.isArray(json)) return null;
+    const seen = new Set(); // trimmed payload texts already accepted
+    const out = [];
+    for (const p of json) {
+        if (!p || typeof p.payload !== 'string' || !p.payload.trim()) continue;
+        const key = p.payload.trim();
+        if (seen.has(key)) continue;
+        seen.add(key);
+        const destructive = !!p.destructive; // any truthy value, including a non-empty string, counts as destructive
+        if (destructive && !allowDestructive) continue; // safety gate (also enforced by caller)
+        out.push({
+            name: String(p.name || 'LLM-generated payload').slice(0, 120),
+            category: String(p.category || 'instruction_override'),
+            payload: key,
+            marker: p.marker ? String(p.marker).slice(0, 64) : null,
+            destructive,
+        });
+        if (out.length >= max) break;
+    }
+    return out.length ? out : null;
+}
+/**
+ * Phase 3 — Augment business-domain inference.
+ * Data sent: discovered URL paths + form field names only (no values, no bodies).
+ * At most 60 paths and 60 form fields are sent.
+ * Returns { domains: string[], invariants: string[] } or null.
+ *
+ * Each returned list is coerced entry-by-entry with String() and capped at 20
+ * items; a field that is missing or not an array becomes an empty list. Any
+ * truthy parsed reply therefore yields an object, even if both lists are empty.
+ *
+ * @param {object} llmClient - Client exposing isEnabled() and ask().
+ * @param {object} input
+ * @param {Array} [input.paths=[]] - Discovered URL paths.
+ * @param {Array} [input.formFields=[]] - Form field names.
+ * @returns {Promise<{domains: string[], invariants: string[]}|null>} null when
+ *   the client is missing/disabled or the reply has no parseable JSON.
+ */
+export async function inferBusinessDomains(llmClient, { paths = [], formFields = [] }) {
+    if (!llmClient?.isEnabled?.()) return null;
+    const prompt =
+        `Given these URL paths and form field names from a web app, infer business domains beyond simple ` +
+        `keyword matching (e.g. payments, auth, subscriptions, inventory, referrals, workflows, messaging, kyc) ` +
+        `and propose security-relevant business invariants worth testing. ` +
+        `Respond with ONLY JSON: {"domains":["..."],"invariants":["..."]}.\n\n` +
+        `Paths: ${JSON.stringify(paths.slice(0, 60))}\n` +
+        `Form fields: ${JSON.stringify(formFields.slice(0, 60))}`;
+    const text = await llmClient.ask({ system: SYSTEM_BASE, prompt, maxTokens: 400, temperature: 0 });
+    const json = parseJsonLoose(text);
+    if (!json) return null;
+    return {
+        domains: Array.isArray(json.domains) ? json.domains.map(String).slice(0, 20) : [],
+        invariants: Array.isArray(json.invariants) ? json.invariants.map(String).slice(0, 20) : [],
+    };
+}
+export default { // Default export: the same six helpers that are also exported by name above.
+    enhanceRemediation,
+    triageFinding,
+    enrichCorrelation,
+    generateExecutiveSummary,
+    generateInjectionPayloads,
+    inferBusinessDomains,
+};