npm - jaku.sh - Versions diffs - 1.0.0 - Mend

jaku.sh 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (69) hide show

package/LICENSE +52 -0
package/README.md +636 -0
package/action.yml +264 -0
package/bin/jaku +2 -0
package/package.json +62 -0
package/src/agents/ai-agent.js +175 -0
package/src/agents/api-agent.js +95 -0
package/src/agents/base-agent.js +158 -0
package/src/agents/crawl-agent.js +175 -0
package/src/agents/event-bus.js +59 -0
package/src/agents/findings-ledger.js +410 -0
package/src/agents/logic-agent.js +144 -0
package/src/agents/orchestrator.js +323 -0
package/src/agents/qa-agent.js +149 -0
package/src/agents/security-agent.js +211 -0
package/src/cli.js +423 -0
package/src/core/accessibility-checker.js +171 -0
package/src/core/ai/ai-endpoint-detector.js +227 -0
package/src/core/ai/guardrail-prober.js +362 -0
package/src/core/ai/indirect-injector.js +106 -0
package/src/core/ai/jailbreak-tester.js +212 -0
package/src/core/ai/model-dos-tester.js +174 -0
package/src/core/ai/model-fingerprinter.js +246 -0
package/src/core/ai/multi-turn-attacker.js +297 -0
package/src/core/ai/output-analyzer.js +182 -0
package/src/core/ai/prompt-injector.js +543 -0
package/src/core/ai/system-prompt-extractor.js +244 -0
package/src/core/api/api-key-auditor.js +266 -0
package/src/core/api/auth-flow-tester.js +430 -0
package/src/core/api/cors-ws-tester.js +263 -0
package/src/core/api/graphql-tester.js +287 -0
package/src/core/api/oauth-prober.js +343 -0
package/src/core/auth-manager.js +902 -0
package/src/core/broken-flow-detector.js +207 -0
package/src/core/browser-manager.js +119 -0
package/src/core/console-monitor.js +111 -0
package/src/core/crawler.js +430 -0
package/src/core/csr-waiter.js +410 -0
package/src/core/form-validator.js +240 -0
package/src/core/logic/abuse-pattern-scanner.js +291 -0
package/src/core/logic/access-boundary-tester.js +448 -0
package/src/core/logic/business-rule-inferrer.js +196 -0
package/src/core/logic/graphql-auditor.js +298 -0
package/src/core/logic/parameter-polluter.js +212 -0
package/src/core/logic/pricing-exploiter.js +299 -0
package/src/core/logic/race-condition-detector.js +222 -0
package/src/core/logic/workflow-enforcer.js +284 -0
package/src/core/performance-checker.js +204 -0
package/src/core/responsive-checker.js +228 -0
package/src/core/security/cors-prober.js +150 -0
package/src/core/security/csrf-prober.js +217 -0
package/src/core/security/dependency-auditor.js +182 -0
package/src/core/security/file-upload-tester.js +340 -0
package/src/core/security/header-analyzer.js +324 -0
package/src/core/security/infra-scanner.js +391 -0
package/src/core/security/path-traversal.js +112 -0
package/src/core/security/prototype-pollution.js +147 -0
package/src/core/security/secret-detector.js +517 -0
package/src/core/security/sqli-prober.js +257 -0
package/src/core/security/tls-checker.js +223 -0
package/src/core/security/xss-scanner.js +225 -0
package/src/core/test-generator.js +339 -0
package/src/core/test-runner.js +398 -0
package/src/reporting/diff-reporter.js +172 -0
package/src/reporting/report-generator.js +408 -0
package/src/reporting/sarif-generator.js +190 -0
package/src/utils/config.js +57 -0
package/src/utils/finding.js +67 -0
package/src/utils/logger.js +50 -0

package/src/core/security/infra-scanner.js ADDED Viewed

@@ -0,0 +1,391 @@
+import { createFinding } from '../../utils/finding.js';
+/**
+ * Infrastructure Scanner — Scans for infrastructure exposure and misconfigurations.
+ * Checks debug endpoints, directory listing, error disclosure, and common misconfigs.
+ */
+export class InfraScanner {
+    constructor(logger) {
+        this.logger = logger;
+        this.findings = [];
+    }
+    /**
+     * Common admin/debug/sensitive endpoints to probe.
+     *
+     * Each entry has:
+     *   - `path`: resolved against the scan's base URL by `_probeEndpoints`
+     *   - `desc`: short label embedded in the finding title and description
+     *   - `severity`: default severity of the finding; `_probeEndpoints` overrides
+     *     it with 'critical' when the response body looks like it holds secrets
+     */
+    static PROBE_PATHS = [
+        { path: '/admin', desc: 'Admin panel', severity: 'high' },
+        { path: '/administrator', desc: 'Admin panel', severity: 'high' },
+        { path: '/admin/login', desc: 'Admin login', severity: 'medium' },
+        { path: '/wp-admin', desc: 'WordPress admin', severity: 'high' },
+        { path: '/wp-login.php', desc: 'WordPress login', severity: 'medium' },
+        { path: '/debug', desc: 'Debug endpoint', severity: 'high' },
+        { path: '/_debug', desc: 'Debug endpoint', severity: 'high' },
+        { path: '/__debug', desc: 'Debug endpoint', severity: 'high' },
+        { path: '/debug/vars', desc: 'Go debug vars', severity: 'critical' },
+        { path: '/debug/pprof', desc: 'Go profiler', severity: 'critical' },
+        { path: '/status', desc: 'Status page', severity: 'low' },
+        { path: '/health', desc: 'Health check', severity: 'info' },
+        { path: '/healthz', desc: 'Kubernetes health', severity: 'info' },
+        { path: '/readyz', desc: 'Kubernetes readiness', severity: 'info' },
+        { path: '/metrics', desc: 'Prometheus metrics', severity: 'high' },
+        { path: '/api-docs', desc: 'API documentation', severity: 'low' },
+        { path: '/swagger', desc: 'Swagger UI', severity: 'medium' },
+        { path: '/swagger-ui.html', desc: 'Swagger UI', severity: 'medium' },
+        { path: '/swagger.json', desc: 'Swagger spec', severity: 'medium' },
+        { path: '/openapi.json', desc: 'OpenAPI spec', severity: 'medium' },
+        { path: '/graphql', desc: 'GraphQL endpoint', severity: 'low' },
+        { path: '/graphiql', desc: 'GraphQL IDE', severity: 'high' },
+        { path: '/__graphql', desc: 'GraphQL endpoint', severity: 'low' },
+        { path: '/actuator', desc: 'Spring Boot actuator', severity: 'high' },
+        { path: '/actuator/env', desc: 'Spring environment', severity: 'critical' },
+        { path: '/actuator/heapdump', desc: 'Spring heap dump', severity: 'critical' },
+        { path: '/actuator/beans', desc: 'Spring beans', severity: 'high' },
+        { path: '/console', desc: 'Console endpoint', severity: 'high' },
+        { path: '/server-info', desc: 'Server info', severity: 'medium' },
+        { path: '/info', desc: 'Info endpoint', severity: 'low' },
+        { path: '/trace', desc: 'Trace endpoint', severity: 'high' },
+        { path: '/api/v1', desc: 'API v1 root', severity: 'info' },
+        { path: '/robots.txt', desc: 'Robots.txt', severity: 'info' },
+        { path: '/sitemap.xml', desc: 'Sitemap', severity: 'info' },
+        { path: '/crossdomain.xml', desc: 'Flash crossdomain', severity: 'medium' },
+        { path: '/elmah.axd', desc: '.NET error logs', severity: 'high' },
+        { path: '/phpinfo.php', desc: 'PHP info', severity: 'high' },
+        { path: '/test', desc: 'Test page', severity: 'low' },
+        { path: '/backup', desc: 'Backup directory', severity: 'high' },
+        { path: '/dump', desc: 'Data dump', severity: 'critical' },
+    ];
+    // Patterns in error pages that reveal internal details
+    static ERROR_DISCLOSURE_PATTERNS = [
+        { regex: /at [\w.]+\([\w/.]+:\d+:\d+\)/i, name: 'Stack trace (Node.js)', severity: 'medium' },
+        { regex: /Traceback \(most recent call/i, name: 'Stack trace (Python)', severity: 'medium' },
+        { regex: /at [\w.]+\.[\w]+\([\w]+\.java:\d+\)/i, name: 'Stack trace (Java)', severity: 'medium' },
+        { regex: /Fatal error:.*in \/[\w/]+\.php on line \d+/i, name: 'PHP fatal error with path', severity: 'high' },
+        { regex: /DOCUMENT_ROOT.*\/[\w/]+/i, name: 'Document root path disclosure', severity: 'medium' },
+        { regex: /\/home\/[\w]+\/|\/var\/www\/|\/usr\/local\//i, name: 'Server path disclosure', severity: 'medium' },
+        { regex: /DB_HOST|DB_PASSWORD|DATABASE_URL/i, name: 'Database config disclosure', severity: 'critical' },
+        { regex: /MongoServerError|mongoose.*Error/i, name: 'MongoDB error disclosure', severity: 'medium' },
+        { regex: /ECONNREFUSED|ETIMEDOUT.*\d+\.\d+\.\d+\.\d+/i, name: 'Internal IP disclosure', severity: 'medium' },
+    ];
+    /**
+     * Run infrastructure scanning.
+     */
+    async scan(surfaceInventory) {
+        const baseUrl = surfaceInventory.baseUrl;
+        // 1. Probe known sensitive endpoints
+        await this._probeEndpoints(baseUrl);
+        // 2. Check for directory listing
+        await this._checkDirectoryListing(baseUrl);
+        // 3. Check error page information disclosure
+        await this._checkErrorDisclosure(baseUrl);
+        // 4. Check for GraphQL introspection
+        await this._checkGraphQLIntrospection(baseUrl);
+        this.logger?.info?.(`Infrastructure scanner found ${this.findings.length} issues`);
+        return this.findings;
+    }
+    /**
+     * Probe known sensitive/admin endpoints.
+     */
+    async _probeEndpoints(baseUrl) {
+        // Fetch baseline fingerprint to detect SPA catch-all routes
+        const baseline = await this._fetchBaselineFingerprint(baseUrl);
+        const results = await Promise.allSettled(
+            InfraScanner.PROBE_PATHS.map(async ({ path, desc, severity }) => {
+                const url = new URL(path, baseUrl).toString();
+                try {
+                    const resp = await fetch(url, {
+                        method: 'GET',
+                        redirect: 'follow',
+                        signal: AbortSignal.timeout(5000),
+                    });
+                    if (resp.ok && resp.status === 200) {
+                        const contentType = resp.headers.get('content-type') || '';
+                        const body = await resp.text();
+                        // Skip if response matches the catch-all baseline (SPA serving same page for all routes)
+                        if (baseline.isCatchAll) {
+                            const probeHash = this._computeContentHash(body);
+                            if (probeHash === baseline.catchAllHash) return null;
+                            // Fuzzy match: if body length is within 5% of baseline and it's HTML, likely same page with minor variations
+                            const lengthRatio = Math.abs(body.length - baseline.catchAllLength) / Math.max(baseline.catchAllLength, 1);
+                            if (lengthRatio < 0.05 && contentType.includes('text/html')) return null;
+                        }
+                        // Skip if it's a generic 200 HTML page (SPA catch-all)
+                        if (this._isGenericSPAPage(body, path)) return null;
+                        // Skip very small responses (likely empty)
+                        if (body.trim().length < 20) return null;
+                        return { path, desc, severity, url, contentType, bodyLength: body.length, body };
+                    }
+                } catch {
+                    // Not accessible
+                }
+                return null;
+            })
+        );
+        for (const result of results) {
+            if (result.status !== 'fulfilled' || !result.value) continue;
+            const { path, desc, severity, url, contentType, bodyLength, body } = result.value;
+            // Determine actual severity based on content
+            let actualSeverity = severity;
+            if (this._containsSensitiveData(body)) {
+                actualSeverity = 'critical';
+            }
+            this.findings.push(createFinding({
+                module: 'security',
+                title: `Exposed Endpoint: ${path} (${desc})`,
+                severity: actualSeverity,
+                affected_surface: url,
+                description: `The endpoint "${path}" (${desc}) is publicly accessible and returned HTTP 200 with ${bodyLength} bytes.\n\nContent-Type: ${contentType}\n\nExposed management, debug, or admin endpoints can leak sensitive information and provide attack vectors.`,
+                reproduction: [
+                    `1. Navigate to ${url}`,
+                    `2. Endpoint returns HTTP 200 with ${bodyLength} bytes`,
+                    `3. Content-Type: ${contentType}`,
+                ],
+                evidence: body.substring(0, 500),
+                remediation: `Restrict access to "${path}" via authentication, IP whitelisting, or remove it entirely from production. Use environment-based configuration to disable debug endpoints in production.`,
+            }));
+        }
+    }
+    /**
+     * Check if common directories have directory listing enabled.
+     */
+    async _checkDirectoryListing(baseUrl) {
+        const dirs = ['/static/', '/assets/', '/uploads/', '/images/', '/files/', '/media/', '/public/'];
+        for (const dir of dirs) {
+            try {
+                const url = new URL(dir, baseUrl).toString();
+                const resp = await fetch(url, { signal: AbortSignal.timeout(5000) });
+                if (resp.ok) {
+                    const body = await resp.text();
+                    // Check for directory listing patterns
+                    if (body.includes('Index of') || body.includes('Directory listing') ||
+                        body.includes('<pre>') && (body.includes('Parent Directory') || body.match(/<a href="[^"]+\/">/g)?.length > 3)) {
+                        this.findings.push(createFinding({
+                            module: 'security',
+                            title: `Directory Listing Enabled: ${dir}`,
+                            severity: 'medium',
+                            affected_surface: url,
+                            description: `Directory listing is enabled at "${dir}". This allows anyone to browse the directory contents, potentially revealing sensitive files, backup files, or internal structure.`,
+                            reproduction: [
+                                `1. Navigate to ${url}`,
+                                '2. Observe the directory listing showing file names and sizes',
+                            ],
+                            remediation: 'Disable directory listing in your web server configuration. Apache: `Options -Indexes`. Nginx: remove `autoindex on`.',
+                        }));
+                    }
+                }
+            } catch {
+                // Not accessible
+            }
+        }
+    }
+    /**
+     * Check error pages for information disclosure.
+     */
+    async _checkErrorDisclosure(baseUrl) {
+        // Trigger error pages with various paths
+        const errorPaths = [
+            '/this-page-definitely-does-not-exist-jaku-test-404',
+            '/api/nonexistent-endpoint-jaku-test',
+            "/%00",  // Null byte
+            '/..%2f..%2f..%2fetc/passwd', // Path traversal
+        ];
+        for (const errorPath of errorPaths) {
+            try {
+                const url = new URL(errorPath, baseUrl).toString();
+                const resp = await fetch(url, {
+                    signal: AbortSignal.timeout(10000),
+                    redirect: 'follow',
+                });
+                const body = await resp.text();
+                for (const { regex, name, severity } of InfraScanner.ERROR_DISCLOSURE_PATTERNS) {
+                    const match = body.match(regex);
+                    if (match) {
+                        this.findings.push(createFinding({
+                            module: 'security',
+                            title: `Error Information Disclosure: ${name}`,
+                            severity,
+                            affected_surface: url,
+                            description: `The error page reveals internal information: ${name}.\n\nMatched pattern: "${match[0]}"\n\nDetailed error messages help attackers understand the technology stack, internal paths, and potential vulnerabilities.`,
+                            reproduction: [
+                                `1. Navigate to ${url}`,
+                                `2. Error response contains: ${match[0]}`,
+                            ],
+                            evidence: `Matched: ${match[0]}\n\nFull response excerpt:\n${body.substring(Math.max(0, match.index - 100), match.index + match[0].length + 100)}`,
+                            remediation: 'Configure custom error pages that do not reveal stack traces, file paths, or technology details. Set NODE_ENV=production or equivalent for your framework.',
+                        }));
+                    }
+                }
+            } catch {
+                // Request failed
+            }
+        }
+    }
+    /**
+     * Check if GraphQL introspection is enabled.
+     */
+    async _checkGraphQLIntrospection(baseUrl) {
+        const graphqlPaths = ['/graphql', '/api/graphql', '/__graphql', '/graphql/v1'];
+        for (const gqlPath of graphqlPaths) {
+            try {
+                const url = new URL(gqlPath, baseUrl).toString();
+                const resp = await fetch(url, {
+                    method: 'POST',
+                    headers: { 'Content-Type': 'application/json' },
+                    body: JSON.stringify({
+                        query: '{ __schema { types { name } } }',
+                    }),
+                    signal: AbortSignal.timeout(5000),
+                });
+                if (resp.ok) {
+                    const data = await resp.json().catch(() => null);
+                    if (data?.data?.__schema) {
+                        const typeCount = data.data.__schema.types?.length || 0;
+                        this.findings.push(createFinding({
+                            module: 'security',
+                            title: `GraphQL Introspection Enabled: ${gqlPath}`,
+                            severity: 'medium',
+                            affected_surface: url,
+                            description: `GraphQL introspection is enabled at "${gqlPath}", exposing the entire API schema (${typeCount} types discovered). Attackers can use this to map all queries, mutations, and types to find sensitive operations.`,
+                            reproduction: [
+                                `1. Send POST to ${url}`,
+                                `2. Body: {"query": "{ __schema { types { name } } }"}`,
+                                `3. Response contains full schema with ${typeCount} types`,
+                            ],
+                            remediation: 'Disable GraphQL introspection in production. Most GraphQL servers have a configuration option for this.',
+                            references: ['https://www.apollographql.com/docs/apollo-server/security/introspection/'],
+                        }));
+                    }
+                }
+            } catch {
+                // Not a GraphQL endpoint
+            }
+        }
+    }
+    /**
+     * Check if a response is a generic SPA catch-all page.
+     */
+    _isGenericSPAPage(body, path) {
+        // SPAs often serve the same index.html for all routes
+        if (!body.includes('<!DOCTYPE html') && !body.includes('<!doctype html')) return false;
+        // Broad set of SPA framework markers
+        const spaMarkers = [
+            'id="root"', 'id="app"', 'id="__next"', 'id="__nuxt"', 'id="__gatsby"',
+            'id="svelte"', 'id="__svelte"', 'data-reactroot', 'ng-app', 'ng-version',
+            'data-server-rendered', 'id="q-app"',  // Qwik
+            '_buildManifest.js', '_ssgManifest.js', // Next.js build artifacts
+        ];
+        return spaMarkers.some(marker => body.includes(marker));
+    }
+    /**
+     * Check if a response body contains actual sensitive data (not just HTML form labels).
+     */
+    _containsSensitiveData(body) {
+        // Patterns that indicate real sensitive data exposure (not normal HTML content)
+        const sensitivePatterns = [
+            /DB_HOST\s*[=:]/i,                        // Env variable assignment
+            /DB_PASSWORD\s*[=:]/i,                     // Env variable
+            /DATABASE_URL\s*[=:]/i,                    // Env variable
+            /["']?password["']?\s*[:=]\s*["'][^"']+["']/i,  // Key-value with actual password value
+            /["']?secret["']?\s*[:=]\s*["'][^"']+["']/i,    // Key-value with actual secret value
+            /private.key/i,                            // Private key file reference
+            /-----BEGIN (RSA |EC )?PRIVATE KEY-----/,  // Actual private key content
+            /access.token\s*[=:]\s*["']?[A-Za-z0-9._\-]{20,}/i,  // Actual token value
+            /api[_-]?key\s*[=:]\s*["']?[A-Za-z0-9._\-]{16,}/i,    // Actual API key value
+            /AKIA[0-9A-Z]{16}/,                        // AWS access key
+        ];
+        return sensitivePatterns.some(p => p.test(body));
+    }
+    /**
+     * Fetch baseline fingerprint to detect SPA catch-all routes.
+     * Compares the homepage response with a random nonsense path.
+     * If both return the same content, the site uses a catch-all.
+     */
+    async _fetchBaselineFingerprint(baseUrl) {
+        const result = { isCatchAll: false, catchAllHash: null, catchAllLength: 0 };
+        try {
+            const randomPath = `/jaku-fp-check-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`;
+            const [homeResp, randomResp] = await Promise.all([
+                fetch(new URL('/', baseUrl).toString(), {
+                    method: 'GET', redirect: 'follow', signal: AbortSignal.timeout(10000),
+                }).catch(() => null),
+                fetch(new URL(randomPath, baseUrl).toString(), {
+                    method: 'GET', redirect: 'follow', signal: AbortSignal.timeout(10000),
+                }).catch(() => null),
+            ]);
+            if (!homeResp?.ok || !randomResp?.ok) return result;
+            const homeBody = await homeResp.text();
+            const randomBody = await randomResp.text();
+            const homeHash = this._computeContentHash(homeBody);
+            const randomHash = this._computeContentHash(randomBody);
+            if (homeHash === randomHash) {
+                result.isCatchAll = true;
+                result.catchAllHash = homeHash;
+                result.catchAllLength = homeBody.length;
+                this.logger?.info?.('Detected SPA catch-all route — baseline fingerprint will filter false positives');
+            }
+        } catch {
+            // Fingerprinting failed, proceed without baseline
+        }
+        return result;
+    }
+    /**
+     * Compute a simple content hash for comparing page bodies.
+     * Strips dynamic tokens (nonces, timestamps, CSRF tokens) for stable comparison.
+     */
+    _computeContentHash(body) {
+        // Normalize: strip nonces, CSRF tokens, timestamps, and whitespace variations
+        const normalized = body
+            .replace(/nonce="[^"]*"/g, 'nonce=""')
+            .replace(/csrf[_-]?token["']?\s*[:=]\s*["'][^"']*["']/gi, 'csrf_token=""')
+            .replace(/\b\d{13,}\b/g, '0')            // Unix timestamps (milliseconds)
+            .replace(/[a-f0-9]{32,}/gi, 'HASH')       // Long hex strings (session IDs, hashes)
+            .replace(/\s+/g, ' ')
+            .trim();
+        // Simple DJB2 hash — fast and sufficient for content comparison
+        let hash = 5381;
+        for (let i = 0; i < normalized.length; i++) {
+            hash = ((hash << 5) + hash + normalized.charCodeAt(i)) | 0;
+        }
+        return hash;
+    }
+}
+export default InfraScanner;

package/src/core/security/path-traversal.js ADDED Viewed

@@ -0,0 +1,112 @@
+import { createFinding } from '../../utils/finding.js';
+/**
+ * PathTraversalScanner — Tests for path traversal and local file inclusion (LFI).
+ *
+ * Targets:
+ * - URL path parameters (/download?file=, /view?path=, /image?src=)
+ * - Upload URL parameters
+ * - API file-serving endpoints
+ *
+ * Payloads include:
+ * - Unix path traversal: ../../../etc/passwd
+ * - Windows path traversal: ..\..\..\windows\win.ini
+ * - URL encoding: %2e%2e%2f
+ * - Double encoding: %252e%252e%252f
+ * - Null byte: ../../../etc/passwd%00.png
+ */
+export class PathTraversalScanner {
+    constructor(logger) {
+        this.logger = logger;
+        this.FILE_PARAMS = [
+            'file', 'path', 'filename', 'filepath', 'dir', 'directory',
+            'src', 'source', 'doc', 'document', 'template', 'page',
+            'include', 'require', 'show', 'view', 'read', 'load',
+            'img', 'image', 'photo', 'asset', 'resource', 'url', 'redirect',
+        ];
+        this.PAYLOADS = [
+            // Unix
+            { name: 'Basic Unix traversal', payload: '../../../etc/passwd', marker: /root:.*:0:0/, os: 'unix' },
+            { name: 'Encoded Unix traversal', payload: '..%2F..%2F..%2Fetc%2Fpasswd', marker: /root:.*:0:0/, os: 'unix' },
+            { name: 'Double-encoded traversal', payload: '..%252F..%252F..%252Fetc%252Fpasswd', marker: /root:.*:0:0/, os: 'unix' },
+            { name: 'Null byte bypass', payload: '../../../etc/passwd\x00.png', marker: /root:.*:0:0/, os: 'unix' },
+            { name: '/proc/self/environ exposure', payload: '../../../proc/self/environ', marker: /PATH=|HOME=|USER=/, os: 'unix' },
+            { name: '/etc/hosts exposure', payload: '../../../etc/hosts', marker: /127\.0\.0\.1\s+localhost/, os: 'unix' },
+            // Windows
+            { name: 'Windows traversal', payload: '..\\..\\..\\windows\\win.ini', marker: /\[fonts\]/i, os: 'windows' },
+            { name: 'Windows encoded traversal', payload: '..%5C..%5C..%5Cwindows%5Cwin.ini', marker: /\[fonts\]/i, os: 'windows' },
+            // Cloud/container paths
+            { name: 'AWS metadata', payload: 'http://169.254.169.254/latest/meta-data/iam/security-credentials', marker: /AccessKeyId|SecretAccessKey/i, os: 'cloud' },
+            { name: 'GCP metadata', payload: 'http://metadata.google.internal/computeMetadata/v1/instance/service-accounts/default/token', marker: /access_token|expires_in/i, os: 'cloud' },
+        ];
+    }
+    async scan(surfaceInventory) {
+        const findings = [];
+        for (const page of surfaceInventory.pages) {
+            if (!page.url || page.status >= 400) continue;
+            const url = new URL(page.url);
+            const paramNames = [...url.searchParams.keys()];
+            // Find file-like parameters in the URL
+            const fileParams = paramNames.filter(p =>
+                this.FILE_PARAMS.some(fp => p.toLowerCase().includes(fp))
+            );
+            if (fileParams.length === 0) continue;
+            for (const param of fileParams) {
+                for (const { name, payload, marker, os } of this.PAYLOADS) {
+                    try {
+                        const testUrl = new URL(page.url);
+                        testUrl.searchParams.set(param, payload);
+                        const controller = new AbortController();
+                        const timeout = setTimeout(() => controller.abort(), 10000);
+                        const response = await fetch(testUrl.toString(), {
+                            method: 'GET',
+                            signal: controller.signal,
+                        });
+                        clearTimeout(timeout);
+                        if (!response.ok) continue;
+                        const text = await response.text();
+                        if (marker.test(text)) {
+                            findings.push(createFinding({
+                                module: 'security',
+                                title: `Path Traversal / LFI: ${name} via "${param}" parameter`,
+                                severity: os === 'cloud' ? 'critical' : 'critical',
+                                affected_surface: page.url,
+                                description: `The parameter "${param}" at ${page.url} is vulnerable to path traversal. The payload "${payload}" successfully read a ${os === 'cloud' ? 'cloud metadata endpoint' : 'system file'}, allowing an attacker to read arbitrary files from the server's filesystem${os === 'cloud' ? ' and steal cloud credentials' : ', including application source code, configuration files, and credentials'}.`,
+                                reproduction: [
+                                    `1. Navigate to: ${testUrl.toString()}`,
+                                    `2. Server returns contents of ${os === 'unix' ? '/etc/passwd' : os === 'windows' ? 'windows/win.ini' : 'cloud metadata endpoint'}`,
+                                    '3. Escalate to reading: application config files, .env, database credentials',
+                                ],
+                                evidence: `Param: ${param}\nPayload: ${payload}\nResponse excerpt: ${text.substring(0, 300)}`,
+                                remediation: 'Never use user-supplied input directly in file path operations. Use an allowlist of permitted filenames. Resolve and verify the canonical path is within the expected base directory (e.g., require realpath to start with /app/public/). Use chroot jails or container isolation for file serving services.',
+                                references: [
+                                    'https://owasp.org/www-community/attacks/Path_Traversal',
+                                    'CWE-22',
+                                    'CWE-98',
+                                ],
+                            }));
+                            break; // One finding per param
+                        }
+                    } catch { /* continue */ }
+                }
+            }
+        }
+        this.logger?.info?.(`Path Traversal: found ${findings.length} issues`);
+        return findings;
+    }
+}
+export default PathTraversalScanner;

package/src/core/security/prototype-pollution.js ADDED Viewed

@@ -0,0 +1,147 @@
+import { createFinding } from '../../utils/finding.js';
+/**
+ * PrototypePollutionScanner — Tests for JavaScript prototype pollution vulnerabilities.
+ *
+ * Prototype pollution allows attackers to add properties to the global
+ * Object.prototype, which are then inherited by all objects, potentially
+ * causing RCE, access control bypass, or DoS in Node.js applications.
+ *
+ * Test vectors:
+ * - URL query parameters: ?__proto__[admin]=true
+ * - JSON body: {"__proto__":{"admin":true}}
+ * - Nested paths: ?constructor[prototype][admin]=true
+ * - URL path segments: /__proto__/admin
+ */
+export class PrototypePollutionScanner {
+    constructor(logger) {
+        this.logger = logger;
+        // Pollution vectors to test
+        this.URL_VECTORS = [
+            { param: '__proto__[polluted]', value: 'jaku_pp_test', label: 'Direct __proto__ param' },
+            { param: '__proto__[admin]', value: 'true', label: '__proto__[admin] escalation' },
+            { param: 'constructor[prototype][polluted]', value: 'jaku_pp_test', label: 'Constructor prototype' },
+            { param: 'constructor.prototype.polluted', value: 'jaku_pp_test', label: 'Dot notation constructor' },
+        ];
+        this.JSON_VECTORS = [
+            { body: { '__proto__': { 'polluted': 'jaku_pp_test', 'admin': true } }, label: 'JSON __proto__ key' },
+            { body: { 'constructor': { 'prototype': { 'polluted': 'jaku_pp_test' } } }, label: 'JSON constructor.prototype' },
+            { body: [{ '__proto__': { 'polluted': 'jaku_pp_test' } }], label: 'Array __proto__ element' },
+        ];
+    }
+    async scan(surfaceInventory) {
+        const findings = [];
+        const tested = new Set();
+        // Test API endpoints and forms
+        const targets = surfaceInventory.pages.filter(p => p.status < 400).slice(0, 20);
+        for (const target of targets) {
+            if (tested.has(target.url)) continue;
+            tested.add(target.url);
+            // URL parameter pollution
+            const urlFinding = await this._testURLPollution(target.url);
+            if (urlFinding) findings.push(urlFinding);
+            // JSON body pollution (for API endpoints)
+            const jsonFinding = await this._testJSONPollution(target.url);
+            if (jsonFinding) findings.push(jsonFinding);
+        }
+        this.logger?.info?.(`Prototype Pollution: found ${findings.length} issues`);
+        return findings;
+    }
+    async _testURLPollution(url) {
+        for (const vector of this.URL_VECTORS) {
+            try {
+                const testUrl = new URL(url);
+                testUrl.searchParams.set(vector.param, vector.value);
+                const controller = new AbortController();
+                const timeout = setTimeout(() => controller.abort(), 8000);
+                const response = await fetch(testUrl.toString(), {
+                    method: 'GET',
+                    signal: controller.signal,
+                });
+                clearTimeout(timeout);
+                if (!response.ok) continue;
+                const text = await response.text();
+                // Heuristic: if the pollution key/value appears in a JSON response, it may indicate reflection
+                if (text.includes('jaku_pp_test') || text.includes('"admin":true') || text.includes('"polluted"')) {
+                    return createFinding({
+                        module: 'security',
+                        title: `Prototype Pollution via URL Parameter: ${vector.label}`,
+                        severity: 'high',
+                        affected_surface: url,
+                        description: `The endpoint reflects prototype pollution payloads injected via URL parameters. The vector "${vector.param}=${vector.value}" appears in the response, suggesting the server merges query parameters into objects without sanitizing prototype chain keys. In Node.js applications (lodash.merge, jQuery.extend, etc.), this can lead to global object corruption, access control bypass, or Remote Code Execution.`,
+                        reproduction: [
+                            `1. Send GET ${testUrl.toString()}`,
+                            '2. Server reflects pollution key in response',
+                            '3. If server uses a vulnerable merge operation, Object.prototype is now polluted',
+                        ],
+                        evidence: `URL: ${testUrl.toString()}\nResponse contained: ${text.substring(0, 300)}`,
+                        remediation: 'Sanitize all object keys before using them as property names. Use Object.hasOwnProperty checks. Use Object.create(null) for merge targets. Update lodash >= 4.17.21, jQuery >= 3.4.0. Use flat-param libraries that reject prototype chain keys.',
+                        references: [
+                            'https://portswigger.net/web-security/prototype-pollution',
+                            'CWE-1321',
+                            'https://snyk.io/vuln/SNYK-JS-LODASH-567746',
+                        ],
+                    });
+                }
+            } catch { /* continue */ }
+        }
+        return null;
+    }
+    async _testJSONPollution(url) {
+        for (const vector of this.JSON_VECTORS) {
+            try {
+                const controller = new AbortController();
+                const timeout = setTimeout(() => controller.abort(), 8000);
+                const response = await fetch(url, {
+                    method: 'POST',
+                    headers: { 'Content-Type': 'application/json' },
+                    body: JSON.stringify(vector.body),
+                    signal: controller.signal,
+                });
+                clearTimeout(timeout);
+                if (!response.ok && response.status !== 422) continue;
+                const text = await response.text();
+                if (text.includes('jaku_pp_test') || (text.includes('admin') && text.includes('true'))) {
+                    return createFinding({
+                        module: 'security',
+                        title: `Prototype Pollution via JSON Body: ${vector.label}`,
+                        severity: 'critical',
+                        affected_surface: url,
+                        description: `The endpoint accepts JSON bodies containing "__proto__" or "constructor.prototype" keys and appears to process them without sanitization. A successful prototype pollution attack on the server can corrupt the Node.js runtime's Object prototype, enabling privilege escalation or code execution.`,
+                        reproduction: [
+                            `1. POST to ${url} with body: ${JSON.stringify(vector.body).substring(0, 150)}`,
+                            '2. Server processes the __proto__ key',
+                            '3. Check if admin endpoints become accessible: GET /admin',
+                        ],
+                        evidence: `Body: ${JSON.stringify(vector.body)}\nResponse: ${text.substring(0, 300)}`,
+                        remediation: 'Never use prototype-unsafe merge functions (lodash.merge pre-4.17.21, $.extend deep, Object.assign with user input as a source). Use a JSON schema validator that rejects __proto__ keys. Filter out __proto__, constructor, and prototype keys from all incoming JSON at the API gateway layer.',
+                        references: [
+                            'https://portswigger.net/web-security/prototype-pollution/server-side',
+                            'CWE-1321',
+                        ],
+                    });
+                }
+            } catch { /* continue */ }
+        }
+        return null;
+    }
+}
+export default PrototypePollutionScanner;