npm - jaku.sh - Versions diffs - 1.0.2 → 1.2.0 - Mend

jaku.sh 1.0.2 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

package/README.md +161 -18
package/action.yml +32 -1
package/package.json +2 -1
package/src/agents/ai-agent.js +47 -1
package/src/agents/api-agent.js +9 -0
package/src/agents/logic-agent.js +158 -90
package/src/agents/orchestrator.js +56 -1
package/src/agents/security-agent.js +86 -54
package/src/cli.js +68 -6
package/src/core/ai/ai-endpoint-detector.js +28 -4
package/src/core/ai/prompt-injector.js +34 -0
package/src/core/api/api-key-auditor.js +1 -1
package/src/core/api/cors-ws-tester.js +1 -1
package/src/core/crawler.js +22 -1
package/src/core/llm/augmentations.js +210 -0
package/src/core/llm/llm-client.js +184 -0
package/src/core/llm/providers/anthropic-provider.js +46 -0
package/src/core/llm/providers/base-provider.js +44 -0
package/src/core/llm/providers/null-provider.js +21 -0
package/src/core/llm/providers/openai-provider.js +47 -0
package/src/core/logic/access-boundary-tester.js +1 -1
package/src/core/logic/business-rule-inferrer.js +50 -1
package/src/core/security/sqli-prober.js +312 -43
package/src/core/security/xss-scanner.js +26 -2
package/src/reporting/report-generator.js +96 -9
package/src/reporting/sarif-generator.js +81 -5
package/src/utils/config.js +196 -2
package/src/utils/finding.js +3 -0
package/src/utils/logger.js +33 -0
package/src/utils/param-discovery.js +93 -0
package/src/utils/safety.js +44 -0
package/src/utils/version.js +30 -0

package/README.md CHANGED Viewed

@@ -14,9 +14,13 @@ JAKU crawls your entire app, generates test cases, probes for security vulnerabi
 - [Architecture](#architecture)
 - [Module 01 — QA & Functional Testing](#module-01--qa--functional-testing)
 - [Module 02 — Security Vulnerability Scanning](#module-02--security-vulnerability-scanning)
+- [Module 03 — Business Logic Validation](#module-03--business-logic-validation)
 - [Module 04 — Prompt Injection & AI Abuse Detection](#module-04--prompt-injection--ai-abuse-detection)
+- [Module 05 — API & Auth Flow Verification](#module-05--api--auth-flow-verification)
 - [Correlation Engine](#correlation-engine)
 - [CLI Reference](#cli-reference)
+- [Safety Modes](#safety-modes)
+- [LLM Augmentation (optional)](#llm-augmentation-optional)
 - [Reports](#reports)
 - [Severity Framework](#severity-framework)
 - [Configuration](#configuration)
@@ -78,7 +82,7 @@ JAKU is a **multi-agent system** — a central Orchestrator coordinates 6 specia
 |-------|------|-------------|---------|
 | **JAKU-CRAWL** | Surface discovery | — | Wave 1 (solo) |
 | **JAKU-QA** | QA & functional testing (5 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
-| **JAKU-SEC** | Security vulnerability scanning (8 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
+| **JAKU-SEC** | Security vulnerability scanning (15 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
 | **JAKU-AI** | Prompt injection & AI abuse (8 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
 | **JAKU-LOGIC** | Business logic validation (6 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
 | **JAKU-API** | API & auth flow verification (5 sub-modules) | JAKU-CRAWL | Wave 2 (parallel) |
@@ -213,19 +217,34 @@ node src/cli.js qa https://your-app.dev --verbose
 ## Module 02 — Security Vulnerability Scanning
-Probes your app's attack surface with safe, non-destructive payloads.
+Probes your app's attack surface. Under the default `--safe-active` mode these
+checks use detection-only payloads and do not issue state-changing requests
+(see [Safety Modes](#safety-modes)).
 | Sub-Module | What It Does |
 |-----------|-------------|
 | **Header Analyzer** | Checks CSP, HSTS, X-Frame-Options, X-Content-Type-Options, CORS, Referrer-Policy, Permissions-Policy, and technology fingerprinting |
 | **Secret Detector** | Scans page source, JS, and inline scripts for 19 secret patterns (AWS, Google, Stripe, GitHub, Slack, Firebase, JWT, DB URLs, private keys). Probes 21 sensitive paths (`.env`, `.git/config`, `/debug`, `/actuator`). Checks for source map exposure |
-| **XSS Scanner** | Tests URL parameters and form inputs for reflected and stored XSS using 9 detection-only payloads |
-| **SQLi Prober** | Tests URL params, form inputs, and API endpoints with 8 SQL and 3 NoSQL payloads. Detects 18 database error signatures |
+| **XSS Scanner** | Tests URL parameters and form inputs for reflected and stored XSS using 9 detection-only payloads (parameters are discovered from forms/links/APIs, with a fallback name list) |
+| **SQLi Prober** | Tests URL params, form inputs, and API endpoints with SQL and NoSQL payloads. Detects 18 database error signatures plus boolean-based and time-based blind injection |
 | **Dependency Auditor** | Runs `npm audit`, maps CVE advisories to JAKU severity, checks for unpinned dependencies and risky npm scripts |
 | **TLS Checker** | Validates certificate expiry, detects self-signed certs, checks HTTP→HTTPS redirect, and scans for mixed content |
 | **Infrastructure Scanner** | Probes 40 admin/debug endpoints, detects directory listing, checks error pages for information disclosure, and tests GraphQL introspection |
-> **Safety:** All security testing uses simulation-only payloads. No destructive operations are ever executed.
+| **File Upload Tester** | Tests upload endpoints for MIME spoofing, dangerous extensions, and path traversal *(active — `safe-active`+)* |
+| **CSRF Detector** | Checks state-changing forms/endpoints for anti-CSRF tokens and SameSite cookie protection |
+| **Open Redirect Detector** | Tests redirect parameters for unvalidated off-site redirection *(active — `safe-active`+)* |
+| **Subdomain Scanner** | Enumerates common subdomains and flags exposed/sensitive hosts |
+| **Cookie Auditor** | Audits cookies for `HttpOnly`, `Secure`, `SameSite`, and scope/expiry hygiene |
+| **CSP Validator** | Parses Content-Security-Policy for unsafe directives (`unsafe-inline`, `unsafe-eval`, wildcards, missing directives) |
+| **Clickjacking Detector** | Verifies frame-busting protection via `X-Frame-Options` / CSP `frame-ancestors` |
+| **SSRF Prober** | Probes server-side request forgery via URL/host parameters *(active — `safe-active`+)* |
+> **Safety:** Module 02 (security) checks use detection-only payloads and do not
+> perform destructive operations in any mode. Note that some **Module 03
+> (business logic)** tests *do* send real state-changing requests (e.g. race
+> conditions, pricing/checkout mutation) — those are gated behind the
+> `--aggressive` safety mode and are **skipped by default**. See
+> [Safety Modes](#safety-modes).
 ```bash
 # Security only
@@ -238,6 +257,12 @@ node src/cli.js security https://your-app.dev --verbose
 Detects business logic flaws that traditional scanners miss: pricing manipulation, access control bypass, workflow skipping, race conditions, and referral abuse.
+> ⚠ **Some logic tests are destructive.** Pricing exploitation, race-condition,
+> cart-manipulation, coupon-abuse, and account-takeover tests either issue real
+> state-changing requests or are classified as state-changing. They run only
+> under `--aggressive` and are **skipped by default** (`--safe-active`). See
+> [Safety Modes](#safety-modes).
 ### How It Works
 Unlike security scanning, business logic testing requires **understanding what the app does**. JAKU-LOGIC first infers business rules from your app's surface:
@@ -288,6 +313,11 @@ node src/cli.js scan https://your-app.dev --modules security,logic
 | 3 | **System Prompt Extractor** | 17 techniques | Direct repeat, token forcing ("Continue: You are a"), structured output (JSON/YAML), indirect summarization, fill-in-the-blanks, reverse output |
 | 4 | **Output Analyzer** | 10 tests | AI-mediated XSS: makes the AI generate `<script>` tags, `<img onerror>`, SVG onload, markdown `javascript:` links, data exfiltration payloads — tests if output is rendered unsanitized |
 | 5 | **Guardrail Prober** | 15 probes | PII leakage (other users' data), excessive agency (delete account, send emails, execute code), off-topic compliance, tool/function-call abuse |
+| 6 | **Model DoS Tester** | resource probes | Context bombing, token-loop / repetition attacks, and oversized-input handling to detect denial-of-wallet / resource exhaustion |
+| 7 | **Indirect Injector** | 6 payloads | Indirect prompt injection via content the AI later ingests (e.g. retrieved/stored data, profile fields) rather than the direct chat input |
+> Detection runs first via the **AI Endpoint Detector**, then the 7 phases above
+> run against each detected endpoint — 8 AI sub-modules in total.
 ### AI Threat Categories
@@ -417,10 +447,103 @@ Correlations appear in the CLI output and reports with severity escalation.
 | `--halt-on-critical` | Abort scan immediately on any critical finding | off |
 | `--webhook <url>` | POST findings summary to webhook URL on completion | off |
 | `--prod-safe` | Confirm authorization to scan production targets | off |
+| `--passive` | Safety mode: recon + static analysis only (no attack probing) | — |
+| `--safe-active` | Safety mode: non-destructive active probing | **default** |
+| `--aggressive` | Safety mode: enable destructive/state-changing tests | — |
+| `--llm` | Enable optional LLM augmentation (key from env) | off |
+| `--llm-provider <name>` | LLM provider: `openai` or `anthropic` | `openai` |
+| `--llm-model <id>` | LLM model id | provider default |
+| `--llm-consent` | Consent to send minimal finding/target data to the provider | off |
 | `--json` | Output JSON report | off |
 | `--html` | Output HTML report | off |
 | `-v, --verbose` | Enable verbose logging | off |
+### Safety Modes
+JAKU exposes three explicit safety tiers so you control how invasive a scan is.
+The default is `--safe-active`. You can also set `"safety_mode"` in
+`jaku.config.json`; the CLI flag takes precedence.
+| Mode | Flag | What runs | What it never does |
+|------|------|-----------|--------------------|
+| **Passive** | `--passive` | Crawl/discovery + read-only/static analysis only (headers, secrets, TLS, cookies, CSP, clickjacking, static form/API analysis) | Sends no attack payloads and no state-changing requests. Active probers (XSS, SQLi, infra, SSRF, file-upload, open-redirect, AI, API/auth, and all logic tests) are skipped. |
+| **Safe-Active** *(default)* | `--safe-active` | Everything in passive **plus** non-destructive active probing: XSS/SQLi probes, AI prompt-injection, API/auth verification, and non-destructive logic checks (access boundary, workflow, abuse patterns, email enumeration, feature flags) | Never issues destructive/state-changing requests. Destructive logic tests are skipped with a clear log line. |
+| **Aggressive** | `--aggressive` | Everything in safe-active **plus** destructive/state-changing tests: pricing exploitation, race conditions, cart manipulation, coupon abuse, account takeover | — (use only against environments you are authorized to mutate) |
+> JAKU is a security scanner and **intentionally does not honor `robots.txt`** in
+> any mode. The legacy `respect_robots` / `respect_robots_txt` config key has
+> been removed.
+### LLM Augmentation (optional)
+JAKU can optionally use your **own** LLM API key to make scans smarter. This
+feature is **off by default and strictly additive** — with no key, no `--llm`
+flag, no consent, an unreachable API, or an exhausted budget, JAKU behaves
+**exactly** as it does without it. The LLM **never** decides core pass/fail;
+deterministic scanners always own the verdict.
+**What the LLM adds (all advisory / tagged `source: "llm"`):**
+| Phase | Augmentation | Where |
+|-------|--------------|-------|
+| 0 | Framework-specific remediation guidance + executive summary | reports |
+| 1 | Context-aware prompt-injection payloads tailored to a leaked system prompt | `JAKU-AI` |
+| 2 | False-positive triage of borderline findings + attack-chain narrative enrichment | synthesis + reports |
+| 3 | Extra business-domain / invariant inference | `JAKU-LOGIC` |
+**Enabling it:**
+```bash
+# Key comes ONLY from the environment — never the config file or CLI
+export OPENAI_API_KEY=sk-...            # or ANTHROPIC_API_KEY=sk-ant-...
+node src/cli.js scan https://myapp.dev --llm --llm-consent --llm-provider openai
+```
+Both `--llm` (enablement) **and** `--llm-consent` (or `llm.consent: true`) are
+required before any data leaves your machine. Configure non-secret settings in
+`jaku.config.json`:
+```jsonc
+"llm": {
+  "enabled": false,        // or pass --llm
+  "provider": "openai",    // openai | anthropic
+  "model": null,           // null → cheap provider default
+  "max_tokens": 1024,      // per-call output cap
+  "max_calls": 50,         // per-scan call budget
+  "token_budget": 100000,  // per-scan token budget
+  "timeout_seconds": 30,
+  "consent": false,        // or pass --llm-consent
+  "base_url": null         // optional self-hosted/proxy endpoint
+}
+```
+**What data leaves the machine (data minimization):**
+- *Remediation:* finding title, module, severity, description.
+- *Triage:* title, severity, description, a short evidence snippet — borderline findings only.
+- *Executive summary:* severity counts + finding **titles** (no bodies/evidence).
+- *Payload generation:* a snippet of the **already-leaked** system prompt + the target host.
+- *Business inference:* discovered URL **paths** + form field **names** (no values, no bodies).
+**Security & safety guarantees:**
+- **Keys never persist or print.** The API key is read from the environment only
+  and is never written to config, logs, reports, `meta`, `finding.evidence`, or PR
+  comments. The logger scrubs `sk-…`, `Bearer …`, and `x-api-key` patterns from
+  all output. An `api_key` entry in `jaku.config.json` is rejected with a warning.
+- **Passive mode = no egress.** Third-party calls are auto-disabled in `--passive`.
+- **Safety-tier gating.** LLM-generated **destructive** payloads only fire under
+  `--aggressive`; non-destructive generated probes require at least `--safe-active`.
+- **Budgeted & resilient.** Per-scan call/token budgets, per-call timeout,
+  429 backoff, and a connection-failure circuit breaker — any failure degrades
+  silently to deterministic behavior.
+- **No new dependencies.** Uses the built-in `fetch` only.
+To disable, simply omit `--llm` (or set `"enabled": false`). In CI, set
+`enable-llm: 'true'` on the action and provide `OPENAI_API_KEY` /
+`ANTHROPIC_API_KEY` from repository secrets in the job environment.
 ### Report Formats
 Every scan generates 5 report files:
@@ -467,12 +590,14 @@ node src/cli.js ai https://myapp.dev/api/chat --max-pages 1 -v
 ```
   ╦╔═╗╦╔═╦ ╦
   ║╠═╣╠╩╗║ ║  呪 Autonomous Security & Quality Intelligence
- ╚╝╩ ╩╩ ╩╚═╝  v1.0.2 · Multi-Agent
+ ╚╝╩ ╩╩ ╩╚═╝  v1.2.0 · Multi-Agent
   Target:  https://your-app.dev
   Modules: QA + SECURITY + AI
   Mode:    Multi-Agent Orchestration
+  Safety:  Safe-Active (non-destructive probing)
   Severity: ≥ low
+  LLM:     disabled — not enabled (set llm.enabled or pass --llm)
   ✔ [JAKU-CRAWL] Complete — 0 findings in 2.1s
   ✔ [JAKU-QA] Complete — 3 findings in 14.9s      ⚡parallel
@@ -505,13 +630,16 @@ node src/cli.js ai https://myapp.dev/api/chat --max-pages 1 -v
 ## Reports
-Every scan generates three report formats, saved to `jaku-reports/<timestamp>/`:
+Every scan generates the following report formats, saved to `jaku-reports/<timestamp>/`:
 | Format | File | Description |
 |--------|------|-------------|
 | **JSON** | `report.json` | Machine-readable findings array for CI/CD integration |
 | **Markdown** | `report.md` | Human-readable narrative with severity tables and finding details |
 | **HTML** | `report.html` | Self-contained dark-themed report with severity charts, filters, and embedded evidence |
+| **SARIF** | `report.sarif` | GitHub/GitLab Security Dashboard integration (SARIF v2.1.0) |
+| **Diff** | `diff-report.md` / `diff-report.json` | Regression detection vs. the previous scan run |
+| **OWASP Compliance** | `compliance-owasp.*` | OWASP Top 10 pass/fail report (JSON + MD + HTML) — only with `--compliance owasp` |
 ### Finding Schema
@@ -536,7 +664,7 @@ Every scan generates three report formats, saved to `jaku-reports/<timestamp>/`:
 }
 ```
-Modules tag findings as: `qa`, `security`, or `ai`.
+Modules tag findings as: `qa`, `security`, `ai`, `logic`, or `api`.
 ---
@@ -563,33 +691,48 @@ cp jaku.config.example.json jaku.config.json
 ```json
 {
   "target_url": "https://your-app.dev",
-  "credentials": {
-    "username": "",
-    "password": ""
-  },
-  "modules": ["qa", "security", "ai"],
+  "modules_enabled": ["qa", "security", "ai", "logic", "api"],
   "severity_threshold": "low",
+  "safety_mode": "safe-active",
   "halt_on_critical": true,
   "crawler": {
     "max_pages": 50,
     "max_depth": 5,
-    "respect_robots": true
+    "concurrency": 4
+  },
+  "llm": {
+    "enabled": false,
+    "provider": "openai",
+    "consent": false
   }
 }
 ```
+> The LLM API key is **never** stored in this file — it is read from the
+> `OPENAI_API_KEY` / `ANTHROPIC_API_KEY` environment variable only. See
+> [LLM Augmentation](#llm-augmentation-optional).
+Unknown, mistyped, or deprecated keys in `jaku.config.json` are reported as
+warnings on load (and ignored) rather than silently honored.
 ### Configuration Options
 | Key | Type | Description |
 |-----|------|-------------|
 | `target_url` | string | The application URL to scan |
-| `credentials` | object | Login credentials for authenticated scanning |
-| `modules` | string[] | Modules to enable: `qa`, `security`, `ai` |
+| `credentials` | object[] | Login credentials for authenticated scanning |
+| `modules_enabled` | string[] | Modules to enable: `qa`, `security`, `ai`, `logic`, `api` |
 | `severity_threshold` | string | Minimum severity to report: `critical`, `high`, `medium`, `low` |
+| `safety_mode` | string | Safety tier: `passive`, `safe-active` (default), `aggressive` — see [Safety Modes](#safety-modes) |
 | `halt_on_critical` | boolean | Exit with code 1 if critical findings detected (for CI/CD) |
 | `crawler.max_pages` | number | Maximum pages to crawl |
 | `crawler.max_depth` | number | Maximum link depth to follow |
-| `crawler.respect_robots` | boolean | Honor robots.txt directives |
+| `crawler.concurrency` | number | Parallel crawl workers |
+| `llm.enabled` | boolean | Enable optional LLM augmentation (default `false`) — see [LLM Augmentation](#llm-augmentation-optional) |
+| `llm.provider` | string | `openai` or `anthropic` |
+| `llm.model` | string | Model id (provider default if omitted) |
+| `llm.consent` | boolean | Required (with enablement) before any data egress |
+| `llm.max_calls` / `llm.token_budget` | number | Per-scan call / token budgets |
 ### CI/CD Integration

package/action.yml CHANGED Viewed

@@ -49,6 +49,18 @@ inputs:
     description: 'Maximum pages to crawl'
     required: false
     default: '50'
+  enable-llm:
+    description: 'Enable optional LLM augmentation (requires OPENAI_API_KEY or ANTHROPIC_API_KEY in job env and consent)'
+    required: false
+    default: 'false'
+  llm-provider:
+    description: 'LLM provider when enabled (openai|anthropic)'
+    required: false
+    default: 'openai'
+  llm-model:
+    description: 'LLM model id (provider default if empty)'
+    required: false
+    default: ''
   verbose:
     description: 'Enable verbose logging'
     required: false
@@ -102,6 +114,14 @@ runs:
         JAKU_AUTH_STRATEGY: ${{ inputs.auth-strategy }}
         JAKU_MAX_PAGES: ${{ inputs.max-pages }}
         JAKU_VERBOSE: ${{ inputs.verbose }}
+        JAKU_ENABLE_LLM: ${{ inputs.enable-llm }}
+        JAKU_LLM_PROVIDER: ${{ inputs.llm-provider }}
+        JAKU_LLM_MODEL: ${{ inputs.llm-model }}
+        # API keys are read from the job environment (set these from repo secrets
+        # in your workflow, e.g. OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}).
+        # They are passed to the scanner process only and never printed.
+        OPENAI_API_KEY: ${{ env.OPENAI_API_KEY }}
+        ANTHROPIC_API_KEY: ${{ env.ANTHROPIC_API_KEY }}
       run: |
         REPORT_DIR="${{ runner.temp }}/jaku-reports"
@@ -124,6 +144,17 @@ runs:
         if [ "${JAKU_VERBOSE}" = "true" ]; then
           CMD="${CMD} --verbose"
         fi
+        # Optional LLM augmentation. Only enabled when explicitly requested AND a
+        # key is present in the environment. The key itself is never added to the
+        # command line — LLMClient reads it from env. --llm-consent is implied by
+        # the operator opting in via enable-llm in CI.
+        if [ "${JAKU_ENABLE_LLM}" = "true" ] && { [ -n "${OPENAI_API_KEY}" ] || [ -n "${ANTHROPIC_API_KEY}" ]; }; then
+          CMD="${CMD} --llm --llm-consent --llm-provider ${JAKU_LLM_PROVIDER}"
+          if [ -n "${JAKU_LLM_MODEL}" ]; then
+            CMD="${CMD} --llm-model ${JAKU_LLM_MODEL}"
+          fi
+        fi
         # Run scan
         eval ${CMD} || true
@@ -217,7 +248,7 @@ runs:
               }
             }
-            body += '\n---\n*Scanned by [JAKU](https://github.com/jaku-security/jaku) v1.0.2*';
+            body += `\n---\n*Scanned by [JAKU](https://github.com/jaku-security/jaku) v${report.meta?.version || ''}*`;
           } else {
             body += '⚠️ Scan completed but no report was generated. Check workflow logs for errors.';
           }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "jaku.sh",
-  "version": "1.0.2",
+  "version": "1.2.0",
   "description": "JAKU (呪) — Autonomous Security & Quality Intelligence Agent for vibe-coded apps. XSS, SQLi, prompt injection, QA testing, and attack chain correlation in one command.",
   "type": "module",
   "main": "src/cli.js",
@@ -18,6 +18,7 @@
   ],
   "scripts": {
     "scan": "node src/cli.js scan",
+    "postinstall": "npx playwright install chromium 2>/dev/null || echo '⚠ JAKU: Could not auto-install Chromium. Run: npx playwright install chromium'",
     "prepublishOnly": "node src/cli.js --help"
   },
   "keywords": [

package/src/agents/ai-agent.js CHANGED Viewed

@@ -1,4 +1,6 @@
 import { BaseAgent } from './base-agent.js';
+import { allows, getSafetyMode } from '../utils/safety.js';
+import { generateInjectionPayloads } from '../core/llm/augmentations.js';
 import { AIEndpointDetector } from '../core/ai/ai-endpoint-detector.js';
 import { PromptInjector } from '../core/ai/prompt-injector.js';
 import { JailbreakTester } from '../core/ai/jailbreak-tester.js';
@@ -34,6 +36,14 @@ export class AIAgent extends BaseAgent {
             throw new Error('No surface inventory available — JAKU-CRAWL must run first');
         }
+        // AI endpoint detection and abuse testing send live requests (benign
+        // probes + injection payloads), so they require at least safe-active.
+        if (!allows(config, 'safe-active')) {
+            this._log(`AI abuse testing skipped — requires active probing (current: ${getSafetyMode(config)} mode)`);
+            this.progress('complete', 'AI testing skipped (passive mode)', 100);
+            return;
+        }
         // Phase 1: Detect AI endpoints
         this.progress('detect', 'Detecting AI-powered endpoints...', 0);
@@ -78,9 +88,10 @@ export class AIAgent extends BaseAgent {
         // Phase 4: System Prompt Extraction
         this.progress('extraction', 'Attempting system prompt extraction...', 50);
+        let extractionFindings = [];
         try {
             const extractor = new SystemPromptExtractor(logger);
-            const extractionFindings = await extractor.extract(aiSurfaces, sendMessage);
+            extractionFindings = await extractor.extract(aiSurfaces, sendMessage);
             this.addFindings(extractionFindings);
             this._log(`System prompt extraction: ${extractionFindings.length} leaks`);
         } catch (err) {
@@ -88,6 +99,41 @@ export class AIAgent extends BaseAgent {
         }
         this.progress('extraction', 'System prompt extraction complete', 70);
+        // Phase 4.5: LLM-generated, context-aware injection payloads (optional).
+        // Only runs when LLM augmentation is active (egress is auto-disabled in
+        // passive mode). Generated DESTRUCTIVE payloads require --aggressive;
+        // non-destructive generated probes need safe-active (already satisfied).
+        const llmClient = context.llmClient;
+        if (llmClient?.isEnabled?.()) {
+            try {
+                // Reuse the (already-leaked) system prompt as generation context.
+                const leaked = extractionFindings
+                    .map(f => {
+                        const m = /Extracted content:\n([\s\S]*)/.exec(f.evidence || '');
+                        return m ? m[1].trim() : '';
+                    })
+                    .filter(Boolean)[0] || '';
+                if (leaked) {
+                    const allowDestructive = allows(config, 'aggressive');
+                    const generated = await generateInjectionPayloads(llmClient, {
+                        systemPrompt: leaked,
+                        surfaceUrl: aiSurfaces[0]?.url || config.target_url,
+                        allowDestructive,
+                    });
+                    if (generated?.length) {
+                        const genFindings = await injector.injectGenerated(aiSurfaces, generated, { allowDestructive });
+                        this.addFindings(genFindings);
+                        this._log(`LLM-generated payloads: ${genFindings.length} findings from ${generated.length} tailored payloads`);
+                    }
+                } else {
+                    this._log('No leaked system prompt — skipping LLM payload generation');
+                }
+            } catch (err) {
+                this._log(`LLM payload generation failed: ${err.message}`, 'error');
+            }
+        }
         // Phase 5: Output Analysis (AI-mediated XSS)
         this.progress('output', 'Analyzing AI output sanitization...', 70);
         try {

package/src/agents/api-agent.js CHANGED Viewed

@@ -1,4 +1,5 @@
 import { BaseAgent } from './base-agent.js';
+import { allows, getSafetyMode } from '../utils/safety.js';
 import { AuthFlowTester } from '../core/api/auth-flow-tester.js';
 import { OAuthProber } from '../core/api/oauth-prober.js';
 import { APIKeyAuditor } from '../core/api/api-key-auditor.js';
@@ -28,6 +29,14 @@ export class APIAgent extends BaseAgent {
             throw new Error('No surface inventory available — JAKU-CRAWL must run first');
         }
+        // API/auth flow verification sends live requests, so it requires at
+        // least safe-active. In passive mode it is skipped.
+        if (!allows(config, 'safe-active')) {
+            this._log(`API & auth flow verification skipped — requires active probing (current: ${getSafetyMode(config)} mode)`);
+            this.progress('complete', 'API testing skipped (passive mode)', 100);
+            return;
+        }
         // Phase 1: Auth flow testing
         this.progress('auth', 'Testing authentication flows...', 0);
         try {