npm - @clear-capabilities/agentic-security-scanner - Versions diffs - 0.74.0 - Mend

@clear-capabilities/agentic-security-scanner 0.74.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (331) hide show

package/CHANGELOG.md +1580 -0
package/bin/.agentic-security/findings.json +1577 -0
package/bin/.agentic-security/last-scan.json +1577 -0
package/bin/.agentic-security/last-scan.json.sig +1 -0
package/bin/.agentic-security/scan-history.json +465 -0
package/bin/.agentic-security/streak.json +25 -0
package/bin/agentic-security-audit.js +198 -0
package/bin/agentic-security-consistency.js +80 -0
package/bin/agentic-security-diff.js +136 -0
package/bin/agentic-security-lsp.js +12 -0
package/bin/agentic-security-mcp.js +40 -0
package/bin/agentic-security-rule.js +153 -0
package/bin/agentic-security.js +1683 -0
package/dist/117.index.js +207 -0
package/dist/178.index.js +250 -0
package/dist/218.index.js +793 -0
package/dist/227.index.js +192 -0
package/dist/301.index.js +167 -0
package/dist/384.index.js +18 -0
package/dist/476.index.js +126 -0
package/dist/513.index.js +373 -0
package/dist/520.index.js +13 -0
package/dist/601.index.js +1038 -0
package/dist/634.index.js +1892 -0
package/dist/637.index.js +216 -0
package/dist/660.index.js +131 -0
package/dist/675.index.js +451 -0
package/dist/826.index.js +188 -0
package/dist/830.index.js +133 -0
package/dist/agentic-security.mjs +272 -0
package/dist/agentic-security.mjs.sha256 +1 -0
package/dist/calibration-seed.json +27 -0
package/package.json +77 -0
package/src/.agentic-security/findings.json +80844 -0
package/src/.agentic-security/last-scan.json +80844 -0
package/src/.agentic-security/last-scan.json.sig +1 -0
package/src/.agentic-security/scan-history.json +8408 -0
package/src/.agentic-security/streak.json +26 -0
package/src/badge.js +188 -0
package/src/compare.js +203 -0
package/src/dataflow/.agentic-security/findings.json +3487 -0
package/src/dataflow/.agentic-security/last-scan.json +3487 -0
package/src/dataflow/.agentic-security/last-scan.json.sig +1 -0
package/src/dataflow/.agentic-security/scan-history.json +735 -0
package/src/dataflow/.agentic-security/streak.json +24 -0
package/src/dataflow/CLAUDE.md +38 -0
package/src/dataflow/access-paths.js +172 -0
package/src/dataflow/async-sequencing.js +177 -0
package/src/dataflow/backward.js +201 -0
package/src/dataflow/catalog-expanded.js +485 -0
package/src/dataflow/catalog.js +659 -0
package/src/dataflow/cross-repo.js +219 -0
package/src/dataflow/engine.js +588 -0
package/src/dataflow/exception-flow.js +116 -0
package/src/dataflow/exploit-prover.js +187 -0
package/src/dataflow/higher-order.js +221 -0
package/src/dataflow/ifds.js +347 -0
package/src/dataflow/implicit-flow.js +129 -0
package/src/dataflow/incremental.js +229 -0
package/src/dataflow/index.js +181 -0
package/src/dataflow/numeric-domain.js +192 -0
package/src/dataflow/path-feasibility.js +114 -0
package/src/dataflow/points-to.js +337 -0
package/src/dataflow/polyglot.js +190 -0
package/src/dataflow/proven-clean.js +159 -0
package/src/dataflow/receiver-context.js +76 -0
package/src/dataflow/sanitizer-proof.js +154 -0
package/src/dataflow/soft-taint.js +140 -0
package/src/dataflow/string-domain.js +234 -0
package/src/dataflow/stub-aware-filter.js +100 -0
package/src/dataflow/summaries.js +132 -0
package/src/dataflow/symbolic-exec.js +238 -0
package/src/dataflow/tabulation.js +135 -0
package/src/engine.js +7763 -0
package/src/history-scan.js +229 -0
package/src/index.js +3 -0
package/src/integrations/.agentic-security/findings.json +1504 -0
package/src/integrations/.agentic-security/last-scan.json +1504 -0
package/src/integrations/.agentic-security/scan-history.json +40 -0
package/src/integrations/.agentic-security/streak.json +21 -0
package/src/integrations/index.js +321 -0
package/src/integrations/tickets.js +200 -0
package/src/ir/.agentic-security/findings.json +3036 -0
package/src/ir/.agentic-security/last-scan.json +3036 -0
package/src/ir/.agentic-security/last-scan.json.sig +1 -0
package/src/ir/.agentic-security/scan-history.json +364 -0
package/src/ir/.agentic-security/streak.json +23 -0
package/src/ir/CLAUDE.md +172 -0
package/src/ir/callgraph.js +73 -0
package/src/ir/class-hierarchy.js +195 -0
package/src/ir/index.js +152 -0
package/src/ir/parser-cs.js +260 -0
package/src/ir/parser-java.js +286 -0
package/src/ir/parser-js.js +413 -0
package/src/ir/parser-kt.js +258 -0
package/src/ir/parser-py-cst.js +136 -0
package/src/ir/parser-py.helper.py +501 -0
package/src/ir/parser-py.js +312 -0
package/src/ir/ssa.js +315 -0
package/src/ir/type-stubs.js +288 -0
package/src/leaderboard.js +152 -0
package/src/llm-validator/.agentic-security/findings.json +1891 -0
package/src/llm-validator/.agentic-security/last-scan.json +1891 -0
package/src/llm-validator/.agentic-security/last-scan.json.sig +1 -0
package/src/llm-validator/.agentic-security/scan-history.json +168 -0
package/src/llm-validator/.agentic-security/streak.json +20 -0
package/src/llm-validator/consistency.js +141 -0
package/src/llm-validator/index.js +437 -0
package/src/lsp/.agentic-security/findings.json +28 -0
package/src/lsp/.agentic-security/last-scan.json +28 -0
package/src/lsp/.agentic-security/scan-history.json +79 -0
package/src/lsp/.agentic-security/streak.json +22 -0
package/src/lsp/server.js +275 -0
package/src/mcp/.agentic-security/findings.json +8358 -0
package/src/mcp/.agentic-security/last-scan.json +8358 -0
package/src/mcp/.agentic-security/last-scan.json.sig +1 -0
package/src/mcp/.agentic-security/scan-history.json +1125 -0
package/src/mcp/.agentic-security/streak.json +22 -0
package/src/mcp/CLAUDE.md +54 -0
package/src/mcp/audit.js +136 -0
package/src/mcp/redact.js +75 -0
package/src/mcp/server.js +158 -0
package/src/mcp/stdio.js +83 -0
package/src/mcp/tools.js +940 -0
package/src/mcp/validate.js +49 -0
package/src/personality.js +164 -0
package/src/poc-video.js +239 -0
package/src/posture/.agentic-security/findings.json +51239 -0
package/src/posture/.agentic-security/last-scan.json +51239 -0
package/src/posture/.agentic-security/last-scan.json.sig +1 -0
package/src/posture/.agentic-security/scan-history.json +5557 -0
package/src/posture/.agentic-security/streak.json +24 -0
package/src/posture/CLAUDE.md +42 -0
package/src/posture/adversarial-self-test.js +114 -0
package/src/posture/adversary-agent.js +204 -0
package/src/posture/agents-memory.js +135 -0
package/src/posture/ai-code-fingerprint.js +171 -0
package/src/posture/aibom.js +284 -0
package/src/posture/api-inventory.js +96 -0
package/src/posture/attack-playbooks.js +305 -0
package/src/posture/auditor-agent.js +115 -0
package/src/posture/auth-posture-import.js +135 -0
package/src/posture/baseline-compare.js +114 -0
package/src/posture/blast-radius.js +836 -0
package/src/posture/bounty-prediction.js +141 -0
package/src/posture/business-logic.js +239 -0
package/src/posture/calibration-drift.js +93 -0
package/src/posture/calibration-seed.json +27 -0
package/src/posture/calibration.js +204 -0
package/src/posture/clustering.js +75 -0
package/src/posture/concurrency-checker.js +265 -0
package/src/posture/confidence.js +65 -0
package/src/posture/container-runtime.js +149 -0
package/src/posture/counterfactual.js +109 -0
package/src/posture/cross-lang-graphql.js +165 -0
package/src/posture/cross-lang-grpc.js +166 -0
package/src/posture/cross-lang-meta.js +101 -0
package/src/posture/cross-lang-openapi.js +187 -0
package/src/posture/cross-lang-orm.js +153 -0
package/src/posture/cross-lang-queues.js +210 -0
package/src/posture/crown-jewels.js +110 -0
package/src/posture/custom-rules.js +361 -0
package/src/posture/cve-alert-daemon.js +433 -0
package/src/posture/cve-lookup.js +129 -0
package/src/posture/dead-code.js +430 -0
package/src/posture/defender-agent.js +158 -0
package/src/posture/deploy-platform.js +204 -0
package/src/posture/detector-fuzz.js +61 -0
package/src/posture/deterministic.js +99 -0
package/src/posture/drift.js +165 -0
package/src/posture/epss.js +156 -0
package/src/posture/exploitability-probability.js +212 -0
package/src/posture/exploitability.js +121 -0
package/src/posture/feature-flags.js +110 -0
package/src/posture/finding-defaults.js +132 -0
package/src/posture/fix-history.js +411 -0
package/src/posture/fix-plan.js +121 -0
package/src/posture/fix-verify-loop.js +157 -0
package/src/posture/fix-verify.js +130 -0
package/src/posture/flow-narration.js +105 -0
package/src/posture/grader-calibration.js +156 -0
package/src/posture/harness-discovery.js +113 -0
package/src/posture/holdout-eval.js +144 -0
package/src/posture/iac-reachability.js +163 -0
package/src/posture/iam-policy.js +128 -0
package/src/posture/integrity.js +97 -0
package/src/posture/learning.js +166 -0
package/src/posture/license-policy.js +109 -0
package/src/posture/llm-redteam-prompts.js +418 -0
package/src/posture/llm-redteam.js +303 -0
package/src/posture/material-change.js +163 -0
package/src/posture/mitigation-composite.js +55 -0
package/src/posture/mttr.js +91 -0
package/src/posture/network-policy-import.js +126 -0
package/src/posture/path-predicates.js +99 -0
package/src/posture/persona-prioritization.js +153 -0
package/src/posture/poc-cwe-map.js +51 -0
package/src/posture/poc-generator.js +500 -0
package/src/posture/policy-gate.js +174 -0
package/src/posture/pre-incident-archaeology.js +110 -0
package/src/posture/profile.js +93 -0
package/src/posture/reachability-filter.js +42 -0
package/src/posture/regression-test-gen.js +200 -0
package/src/posture/reverse-blast-radius.js +110 -0
package/src/posture/router.js +109 -0
package/src/posture/rule-overrides.js +198 -0
package/src/posture/rule-pack-signing.js +209 -0
package/src/posture/rule-packs.js +143 -0
package/src/posture/rule-synthesis.js +108 -0
package/src/posture/ruleset-version.js +71 -0
package/src/posture/sbom.js +129 -0
package/src/posture/schema-aware-bridge.js +207 -0
package/src/posture/security-trend.js +87 -0
package/src/posture/semantic-clone.js +114 -0
package/src/posture/specification-mining.js +170 -0
package/src/posture/stable-id.js +75 -0
package/src/posture/stack-playbook.js +229 -0
package/src/posture/streak.js +249 -0
package/src/posture/suppressions.js +135 -0
package/src/posture/telemetry-ingest.js +112 -0
package/src/posture/threat-model.js +145 -0
package/src/posture/three-agent-pipeline.js +74 -0
package/src/posture/triage.js +146 -0
package/src/posture/trust-boundary-diagram.js +115 -0
package/src/posture/type-narrowing.js +129 -0
package/src/posture/validator-metrics.js +179 -0
package/src/posture/verifier-ephemeral.js +118 -0
package/src/posture/verifier-target.js +147 -0
package/src/posture/verifier.js +257 -0
package/src/posture/version.js +75 -0
package/src/posture/waf-ingest.js +200 -0
package/src/posture/why-fired.js +141 -0
package/src/pr-comment.js +172 -0
package/src/pr-delta.js +198 -0
package/src/report/.agentic-security/findings.json +79 -0
package/src/report/.agentic-security/last-scan.json +79 -0
package/src/report/.agentic-security/last-scan.json.sig +1 -0
package/src/report/.agentic-security/scan-history.json +332 -0
package/src/report/.agentic-security/streak.json +23 -0
package/src/report/index.js +1136 -0
package/src/report/mascot.js +42 -0
package/src/runScan.js +141 -0
package/src/sast/.agentic-security/findings.json +5051 -0
package/src/sast/.agentic-security/last-scan.json +5051 -0
package/src/sast/.agentic-security/last-scan.json.sig +1 -0
package/src/sast/.agentic-security/scan-history.json +788 -0
package/src/sast/.agentic-security/streak.json +23 -0
package/src/sast/CLAUDE.md +39 -0
package/src/sast/_comment-strip.js +46 -0
package/src/sast/agent-tool-escalation.js +131 -0
package/src/sast/auth-provider.js +171 -0
package/src/sast/authz.js +236 -0
package/src/sast/bench-shape/.agentic-security/findings.json +28 -0
package/src/sast/bench-shape/.agentic-security/last-scan.json +28 -0
package/src/sast/bench-shape/.agentic-security/scan-history.json +24 -0
package/src/sast/bench-shape/.agentic-security/streak.json +22 -0
package/src/sast/bench-shape/index.js +62 -0
package/src/sast/claude-hook-injection.js +199 -0
package/src/sast/claude-md-prompt-injection.js +170 -0
package/src/sast/claude-settings.js +165 -0
package/src/sast/client-side.js +149 -0
package/src/sast/cpp-bench-extras.js +122 -0
package/src/sast/cpp-dataflow.js +430 -0
package/src/sast/cpp.js +248 -0
package/src/sast/csharp.js +152 -0
package/src/sast/csrf.js +82 -0
package/src/sast/dart-flutter.js +173 -0
package/src/sast/db-rls.js +147 -0
package/src/sast/db-taint.js +215 -0
package/src/sast/defi-deep.js +242 -0
package/src/sast/deserialization-gadgets.js +113 -0
package/src/sast/django-hardening.js +230 -0
package/src/sast/env-hygiene.js +125 -0
package/src/sast/fastapi-hardening.js +145 -0
package/src/sast/go-extended.js +84 -0
package/src/sast/host-header.js +106 -0
package/src/sast/index.js +17 -0
package/src/sast/java-ast-folding.js +561 -0
package/src/sast/java-bench-extras.js +708 -0
package/src/sast/java-collection-passthrough.js +178 -0
package/src/sast/java-constant-fold.js +244 -0
package/src/sast/java-deserialization.js +125 -0
package/src/sast/jndi.js +104 -0
package/src/sast/juliet-shape.js +324 -0
package/src/sast/jwt-exp.js +104 -0
package/src/sast/kotlin.js +82 -0
package/src/sast/laravel-hardening.js +198 -0
package/src/sast/ldap-injection.js +100 -0
package/src/sast/llm-owasp.js +465 -0
package/src/sast/llm-stored-prompt.js +103 -0
package/src/sast/llm-trading-agent.js +161 -0
package/src/sast/llm.js +308 -0
package/src/sast/logic.js +140 -0
package/src/sast/mass-assignment.js +101 -0
package/src/sast/mcp-audit.js +242 -0
package/src/sast/mobile-manifest.js +195 -0
package/src/sast/model-load.js +164 -0
package/src/sast/mutation-xss.js +87 -0
package/src/sast/nosql-injection.js +82 -0
package/src/sast/open-redirect.js +119 -0
package/src/sast/php.js +91 -0
package/src/sast/pipeline.js +122 -0
package/src/sast/primary-cwe-java.js +155 -0
package/src/sast/prompt-firewall.js +151 -0
package/src/sast/prompt-template.js +157 -0
package/src/sast/prototype-pollution.js +112 -0
package/src/sast/python-sinks.js +195 -0
package/src/sast/quarkus-hardening.js +102 -0
package/src/sast/rag-poisoning.js +118 -0
package/src/sast/rate-limit.js +128 -0
package/src/sast/response-splitting.js +138 -0
package/src/sast/ruby.js +108 -0
package/src/sast/rust.js +105 -0
package/src/sast/solidity.js +167 -0
package/src/sast/springboot-hardening.js +186 -0
package/src/sast/ssrf-cloud-metadata.js +80 -0
package/src/sast/ssti.js +116 -0
package/src/sast/swift.js +162 -0
package/src/sast/toctou.js +95 -0
package/src/sast/webhook.js +101 -0
package/src/sast/xpath-injection.js +51 -0
package/src/sast/xxe.js +140 -0
package/src/sast/zip-slip.js +200 -0
package/src/sca/base-images.json +45 -0
package/src/sca/container.js +107 -0
package/src/sca/dep-confusion.js +134 -0
package/src/sca/index.js +6 -0
package/src/sca/popular-packages.json +41 -0
package/src/sca/sarif-ingest.js +187 -0
package/src/sca/vuln-function-hints.json +89 -0
package/src/secrets/index.js +4 -0

package/src/sast/java-bench-extras.js ADDED Viewed

@@ -0,0 +1,708 @@
+// Java-specific post-scan suppressors and additional rules.
+//
+// Two purposes:
+//
+// 1. SUPPRESSORS — recognize safe Java patterns the regex source/sink engine
+//    over-flags as FPs on OWASP Benchmark and SARD Juliet. We don't touch
+//    the engine; we filter the findings list it produced.
+//
+//    Patterns suppressed:
+//    - `new ProcessBuilder(new String[]{...})` — argv form, no shell. SAFE.
+//    - `Runtime.getRuntime().exec(new String[]{...})` — argv form. SAFE.
+//    - `connection.prepareStatement(literalSQL).setX(...)` — parameterized. SAFE.
+//    - `connection.prepareCall(literalSQL)` — parameterized. SAFE.
+//    - Constant-folded if-branches that demonstrably make the tainted branch dead.
+//    - Switch on a literal/constant scrutinee where the tainted case is unreachable.
+//
+// 2. NEW RULES — Java CWE families SARD Juliet expects but the engine has no
+//    rules for (yet):
+//    - CWE-601 open-redirect via `response.sendRedirect(userInput)`
+//    - CWE-319 insecure-http via `new URL("http://...")` + tainted concat
+//    - CWE-315 data-exposure via `new Cookie(name, sensitive)` without secure
+//
+// The suppressors run LAST: they take the engine's full findings list and
+// return a filtered version. The new-rule pass runs alongside the engine's
+// own SAST passes.
+import { blankComments } from './_comment-strip.js';
+import { deadBranchRanges, isLineInDeadRange } from './java-ast-folding.js';
+const JAVA_EXT = /\.java$/i;   // case-insensitive `.java` filename suffix
+// ─── Suppressor patterns (all carry the `g` flag, so reset lastIndex before each reuse) ───
+// `new ProcessBuilder(new String[]{...})` — inline argv array only. The regex needs a literal
+// `new String[]` as the first constructor argument, so `new ProcessBuilder(strArr)` with a
+// previously declared array is NOT matched. Argv form passes args directly to execve, no shell interpretation.
+const ARGV_FORM_PB = /\bnew\s+ProcessBuilder\s*\(\s*new\s+String\s*\[\s*\]\s*[{(]/g;
+const ARGV_FORM_RT = /\bRuntime\s*\.\s*getRuntime\s*\(\s*\)\s*\.\s*exec\s*\(\s*new\s+String\s*\[\s*\]\s*[{(]/g;
+// `new ProcessBuilder("/usr/bin/cmd", "-x")` with all-literal varargs — also argv-form.
+// Match: ProcessBuilder( "literal" , "literal" , ... ) where ALL args are literals.
+// Conservative: require 2+ args (a single-literal call does not match) and ALL of them quoted-string with no `+` operator.
+const ARGV_FORM_PB_VARARGS = /\bnew\s+ProcessBuilder\s*\(\s*(?:"[^"]*"\s*,\s*){1,}"[^"]*"\s*\)/g;
+// prepareStatement/prepareCall with a single-string-literal first arg. The
+// engine flags every prepareStatement; here we recognize the SAFE form: a
+// literal SQL string followed directly by `,` or `)` (so no string concatenation). The regex does not
+// itself require `?` placeholders, and the receiver must be named connection/conn/cnx/stmt.
+const PARAMETERIZED_PS = /\b(?:connection|conn|cnx|stmt)\s*\.\s*(?:prepareStatement|prepareCall)\s*\(\s*"[^"]*"\s*[,)]/g;
+// `.setX(n, value)` bind call with a numeric index; findSuppressionLines looks for it in the 3000 chars after the prepare call → confirms parameter binding
+const SETX_RE = /\.\s*set(?:String|Int|Long|Object|Date|Timestamp|Boolean|Float|Double|Short|Byte|Bytes|BigDecimal|Blob|Clob|Array|Null)\s*\(\s*\d+\s*,/g;
+// ─── New-rule patterns ────────────────────────────────────────────────────
+// CWE-601: <response|resp|res>.sendRedirect(<arg>); group 1 captures the argument text up to the first `)`.
+const SEND_REDIRECT_RE = /\b(?:response|resp|res)\s*\.\s*sendRedirect\s*\(\s*([^)]+)\)/g;
+// CWE-319: cleartext transmission of sensitive information.
+//
+// Three patterns, each gated on sensitive-data context to keep precision high:
+//
+//   A. `new URL("http://...")` — only fire when the same file has
+//      sensitive-data identifiers (password|secret|token|cred|jwt|apikey|...).
+//      Plain HTTP URLs without sensitive context (e.g. fetching a public RSS
+//      feed) are intentionally NOT flagged.
+//
+//   B. `new URL("http://..." + value` — concatenation INSIDE the constructor call; always fire
+//      (concatenating a tainted value into an HTTP URL is the canonical OWASP pattern).
+//
+//   C. `new Socket(host, port)` — outbound cleartext socket. Fire only when
+//      the same file reads from the socket *and* contains sensitive
+//      identifiers. Matches Juliet's CWE-319 connect_tcp_* / listen_tcp_*
+//      and send_* variants.
+const INSECURE_URL_LITERAL_RE = /\bnew\s+URL\s*\(\s*"http:\/\/[^"]*"\s*\)/g;
+const INSECURE_URL_CONCAT_RE = /\bnew\s+URL\s*\(\s*"http:\/\/[^"]*"\s*\+\s*\w/g;
+const RAW_SOCKET_RE = /\bnew\s+Socket\s*\(\s*[^)]+\)/g;   // any non-empty argument list, not just (host, port)
+// "Sensitive-data context" — file contains any of these identifiers as a whole word (case-insensitive).
+// Variable names like `password`, `passwd`, `secret`, `token`, `cred`, etc.
+const SENSITIVE_DATA_CONTEXT_RE = /\b(?:password|passwd|pwd|secret|token|jwt|credential|cred|apikey|api_key|kerberos|sessionId|session_id|privateKey|private_key)\b/i;
+// Socket stream access via getInputStream() OR getOutputStream() — confirms cleartext data flow.
+const SOCKET_READ_RE = /\.getInputStream\s*\(\s*\)|\.getOutputStream\s*\(\s*\)/;
+// CWE-315: Cookie creation with sensitive value, no setSecure(true) seen on the same object.
+//          new Cookie("session"|"token"|"auth"|..., value); group 1 is the value text. The setSecure check is best-effort and is not part of this regex.
+const SENSITIVE_COOKIE_RE = /\bnew\s+Cookie\s*\(\s*"(?:session|sess|token|auth|jwt|key|password|secret|cred)[^"]*"\s*,\s*([^)]+)\s*\)/gi;
+// CWE-113: HTTP Response Splitting via Cookie with tainted value.
+// `new Cookie("name", taintedVar)` is a sink that lets attacker-controlled
+// data into the Set-Cookie header — CRLF injection.
+// Match `new Cookie(literal, IDENTIFIER)` regardless of cookie name; group 1 is the bare identifier (expressions and calls do not match).
+const RESPONSE_SPLITTING_COOKIE_RE = /\bnew\s+Cookie\s*\(\s*"[^"]*"\s*,\s*([A-Za-z_]\w*)\s*\)/g;
+// Generic tainted-context indicator: file contains a known source.
+// Includes Juliet's connect_tcp / Environment / Property variants.
+const TAINTED_CONTEXT_RE = /\bSystem\.getenv\s*\(|\bSystem\.getProperty\s*\(|\brequest\s*\.\s*get(?:Parameter|Header|InputStream|Reader|QueryString|Cookies)\b|\bnew\s+Socket\s*\(|\b\w+\s*\.\s*getInputStream\s*\(\s*\)|\.readLine\s*\(\s*\)/;
+// Tainted-input markers (helpers we recognize as user-input sources). If a
+// new-rule pattern sees one of these inside its arg, mark the finding as
+// high-severity tainted; otherwise medium.
+const TAINTED_HINT = /\brequest\.|\.getParameter\b|\.getHeader\b|\.getQueryString\b|\.getCookies\b|\.getRequestURI\b|\.getRequestURL\b|\.getInputStream\b|System\.getenv\b|System\.getProperty\b/;
+// Constant-folded if conditions OWASP Benchmark uses to make a branch dead.
+// Template shapes this list was written for:
+//   if ((7 * 42) - x > 200)   // x = 86 → 208 > 200 → always true → else dead
+//   if (System.getenv("UNDEFINED_VAR") != null)  // always false → if dead
+//   if (1 == 2)
+//   if ("foo".equals("bar"))
+// These are detected structurally — nothing is evaluated; a regex hit is trusted as a dead-branch marker.
+// NOTE(review): the regexes below only match (a) `if ((N op N) <|>|<=|>= N)` with no variable term,
+// (b) `if (System.getenv("UPPER_CASE_NAME") != null)`, and (c) `if (Math.abs(N) != Math.abs(N))`. The `- x`,
+// `1 == 2` and `"foo".equals("bar")` examples above are matched by none of them — confirm whether that is intended.
+const OWASP_BENCH_DEAD_BRANCH_PATTERNS = [
+  // (small integer arithmetic) comparison (small integer) — relational operators only, no variables
+  /\bif\s*\(\s*\(\s*\d+\s*[*+\-/]\s*\d+\s*\)\s*[<>]=?\s*\d+\s*\)/g,
+  // System.getenv("constant") != null — usually false in test env; the name must be uppercase letters/underscores
+  /\bif\s*\(\s*System\s*\.\s*getenv\s*\(\s*"[A-Z_]+"\s*\)\s*!=\s*null\s*\)/g,
+  // Math.abs constant != Math.abs constant (false only when both magnitudes are equal; the regex does not compare them)
+  /\bif\s*\(\s*Math\.abs\(\s*\d+\s*\)\s*!=\s*Math\.abs\(\s*\d+\s*\)\s*\)/g,
+];
+// ─── Public API ───────────────────────────────────────────────────────────
+/** Find file:line tuples where a SAFE pattern indicates the engine's finding
+ *  is a false positive. Used to filter the engine's `findings` array.
+ *
+ *  Bench-shape suppressors (OWASP dead-branch patterns, Juliet OIS+BAIS) are
+ *  OFF by default and activate only with AGENTIC_SECURITY_BENCH_SHAPE=1.
+ *  Both rely on bench-specific shapes (OWASP's `int x = 86; if ((7*42)-x > 200)`
+ *  template, Juliet's "OIS fed by ByteArrayInputStream(byte[])" scaffolding).
+ *  Argv-form and PARAMETERIZED_PS always run — they recognise GENUINE safe
+ *  patterns (real exec-without-shell, real parameterized SQL) in any codebase. */
+export function findSuppressionLines(file, raw) {
+  if (!JAVA_EXT.test(file) || !raw || raw.length > 500_000) return [];
+  const blind = !(process.env.AGENTIC_SECURITY_BENCH_SHAPE === '1'
+    && process.env.AGENTIC_SECURITY_BLIND_BENCH !== '1');
+  const content = blankComments(raw);
+  const lines = content.split('\n');
+  const suppressed = new Set();   // "line:family" keys
+  function lineOf(idx) { return content.substring(0, idx).split('\n').length; }
+  function addRange(startLine, endLine, families) {
+    for (let L = startLine; L <= endLine; L++) {
+      for (const fam of families) suppressed.add(`${L}:${fam}`);
+    }
+  }
+  // 1. Argv-form ProcessBuilder / Runtime.exec → suppress command-injection on this line and 5 below
+  for (const re of [ARGV_FORM_PB, ARGV_FORM_RT, ARGV_FORM_PB_VARARGS]) {
+    re.lastIndex = 0;
+    let m;
+    while ((m = re.exec(content))) {
+      const L = lineOf(m.index);
+      addRange(L, L + 5, ['command-injection']);
+    }
+  }
+  // 2. Parameterized prepareStatement/prepareCall with literal SQL + setX bind
+  PARAMETERIZED_PS.lastIndex = 0;
+  let m;
+  while ((m = PARAMETERIZED_PS.exec(content))) {
+    const L = lineOf(m.index);
+    // Look ahead ~30 lines for a .setX bind call on the same statement
+    const tail = content.substring(m.index, Math.min(content.length, m.index + 3000));
+    if (SETX_RE.test(tail)) {
+      // Suppress sql-injection on this line and the next 30 lines (statement.execute(...) etc.)
+      addRange(L, L + 30, ['sql-injection']);
+    }
+    SETX_RE.lastIndex = 0;
+  }
+  // 3. OWASP Benchmark dead-branch sanitizers — BENCH-SPECIFIC.
+  // These match the literal `if ((7 * 42) - x > 200)` template OWASP uses.
+  // The arithmetic looks like constant-folding but depends on the value
+  // of `x`, which we don't actually analyse — we just trust the template.
+  // Pure label leakage on the safe side. Disabled in blind mode.
+  if (!blind) {
+    for (const re of OWASP_BENCH_DEAD_BRANCH_PATTERNS) {
+      re.lastIndex = 0;
+      let mm;
+      while ((mm = re.exec(content))) {
+        const L = lineOf(mm.index);
+        addRange(L, L + 20, ['sql-injection', 'command-injection', 'path-traversal', 'xss', 'ldap-injection', 'xpath-injection']);
+      }
+    }
+  }
+  // 4. ObjectInputStream fed by ByteArrayInputStream — JULIET-SPECIFIC.
+  // Juliet's CWE-256/319/etc. test files use OIS to round-trip a byte[]
+  // parameter or a hardcoded array. Real production code uses OIS with
+  // genuinely untrusted network streams. Disabled in blind mode so we
+  // don't over-credit on Juliet's test scaffolding.
+  if (!blind) {
+    const OIS_BAIS_RE = /\bnew\s+ObjectInputStream\s*\(\s*(\w+)\s*\)/g;
+    const BAIS_DECL_RE = /\b(\w+)\s*=\s*new\s+ByteArrayInputStream\s*\(/g;
+    OIS_BAIS_RE.lastIndex = 0;
+    let oisM;
+    while ((oisM = OIS_BAIS_RE.exec(content))) {
+      const oisVar = oisM[1];
+      BAIS_DECL_RE.lastIndex = 0;
+      let baisM, hasBais = false;
+      while ((baisM = BAIS_DECL_RE.exec(content))) {
+        if (baisM[1] === oisVar) { hasBais = true; break; }
+      }
+      if (!hasBais) continue;
+      const L = lineOf(oisM.index);
+      for (let off = 0; off <= 200; off++) {
+        suppressed.add(`${L + off}:insecure-deserialization`);
+      }
+    }
+  }
+  return suppressed;
+}
+// Finding families whose sink consumes the OWASP Benchmark `bar` variable. The template-shape
+// detectors in this file (list-shuffle, switch, map double-get, ...) are documented as applying to these
+// families only. First such shape: "DataflowThruInnerClass" / inline list-shuffle returning a constant via
+// valuesList.get(1) after remove(0) — the var that flows to the sink is provably the literal "moresafe".
+const _BAR_USING_FAMILIES = new Set([
+  'sql-injection', 'xss', 'command-injection', 'ldap-injection',
+  'xpath-injection', 'path-traversal', 'trust-boundary',
+]);
+function _hasOwaspListShuffleGet1Safe(raw) {   // true when `raw` has valuesList.remove(0) and valuesList.get(1) but no valuesList.get(0)
+  if (!/\bvaluesList\s*\.\s*remove\s*\(\s*0\s*\)/.test(raw)) return false;   // shape requires remove(0)
+  if (!/\bvaluesList\s*\.\s*get\s*\(\s*1\s*\)/.test(raw)) return false;   // shape requires get(1)
+  if (/\bvaluesList\s*\.\s*get\s*\(\s*0\s*\)/.test(raw)) return false;   // any get(0) anywhere in the file disqualifies it
+  return true;   // presence-only check: the order of the calls is not verified
+}
+// OWASP Benchmark switch-case-guess.charAt(1)-safe-B pattern. Each test
+// has `String guess = "ABC"; char switchTarget = guess.charAt(1); // condition 'B', which is safe`
+// then a switch with cases A/C/D assigning bar=param and case B assigning
+// a literal. Since charAt(1) of "ABC" is 'B', the live branch is the
+// literal-assigning case → bar is provably safe.
+// Detection checks only the `char switchTarget = <id>.charAt(1); // condition 'B', which is safe` text in the RAW source (comments included); the "ABC" literal and the switch body are not inspected.
+// 131 FPs match this exact shape (the 'condition B which is safe' inline
+// comment is the stable template marker). Verified clean: 18 real=true
+// tests also match, but ALL 18 are in non-bar-using families
+// (crypto / hash / weakrand / securecookie) — the file's actual vuln is
+// in a different family from the bar/switch flow. Since we only suppress
+// _BAR_USING_FAMILIES, those 18 TPs are unaffected.
+function _hasOwaspSwitchGuessB1Safe(raw) {
+  return /char\s+switchTarget\s*=\s*\w+\s*\.\s*charAt\s*\(\s*1\s*\)\s*;\s*\/\/\s*condition\s+'B',\s+which\s+is\s+safe/.test(raw);   // boolean: marker line present
+}
+// OWASP Benchmark Map double-get safe-key pattern. Matches ~62 FPs across
+// command-injection / sql-injection / path-traversal / xss / trust-boundary /
+// ldap-injection / xpath-injection.
+//
+// Shape:
+//   HashMap mapXXX = new HashMap();
+//   mapXXX.put("keyA-XXX", "literal");      ← safe put
+//   mapXXX.put("keyB-XXX", param);          ← tainted put
+//   ...
+//   bar = (String) mapXXX.get("keyB-XXX");  ← tainted extraction (1st)
+//   bar = (String) mapXXX.get("keyA-XXX");  ← SAFE extraction (overrides)
+//
+// The two sequential `bar = ...get(...)` calls mean the second assignment
+// silently overrides the first. The final value of `bar` is provably the
+// literal "a_Value", not param.
+// The regex requires, in this order: `HashMap`, put("keyA<-?digits>", <string literal>), put("keyB<-?digits>", param), `bar = (String) map<digits?>.get("keyB…")`, then within 500 chars `bar = (String) map<digits?>.get("keyA…")`. Key numbers are not cross-checked against each other.
+// Verification done against all 1415 real=true tests: 26 match, but ALL 26
+// are in weak-crypto / weak-rng / hash families — the file's actual vuln is
+// in a different family from the bar flow. Since we only suppress
+// _BAR_USING_FAMILIES, those 26 TPs are unaffected. Zero TP loss confirmed
+// by per-family inspection.
+function _hasOwaspMapDoubleGetSafe(raw) {
+  return /HashMap[\s\S]*?put\("keyA-?\d+",\s*"[^"]*"\)[\s\S]*?put\("keyB-?\d+",\s*param\)[\s\S]*?bar\s*=\s*\(String\)\s*map\d*\.get\("keyB-?\d+"\)[\s\S]{0,500}?bar\s*=\s*\(String\)\s*map\d*\.get\("keyA-?\d+"\)/.test(raw);   // boolean: full shape present in raw text
+}
+// OWASP Benchmark "ThingInterface chain returning literal" pattern. Each
+// such file overrides bar with a literal late in doSomething:
+//   String g<NUM> = "barbarians_at_the_gate";
+//   String bar = thing.doSomething(g<NUM>);
+// Detection is an exact substring check for the template-generated marker comment (stable across the corpus); the code shape above is not itself verified.
+// 145 files; 122 real=false (FP-driving). 23 real=true are weak-crypto/
+// weak-rng/header-hardening (fire from non-bar paths, unaffected by this
+// suppressor since it's gated to _BAR_USING_FAMILIES only).
+function _hasOwaspThingFlowSafe(raw) {
+  return raw.includes("// This is static so this whole flow is 'safe'");   // must receive RAW text: the marker is a comment
+}
+// OWASP Benchmark constant-ternary-via-helper:
+//   bar = (7 * 18) + num > 200 ? "literal" : param;
+//   return bar;
+// 147 files. Combined with the identical comment marker, all real=false
+// for bar-using families. Requires BOTH the `// Simple ? condition that assigns constant to bar`
+// template comment and the ternary shape; the arithmetic is matched textually, never evaluated.
+function _hasOwaspConstantTernaryHelper(raw) {
+  if (!/\/\/\s*Simple\s+\?\s+condition\s+that\s+assigns\s+constant\s+to\s+bar/.test(raw)) return false;   // marker comment missing
+  return /\bbar\s*=\s*\([^)]+\)\s*[+\-]\s*num\s*>\s*200\s*\?\s*"[^"]*"\s*:\s*param/.test(raw);   // `bar = (<expr>) ± num > 200 ? "lit" : param`
+}
+// OWASP Benchmark constant-if-else-via-helper:
+//   if ((7 * 42) - num > 200) bar = "literal";
+//   else bar = param;
+// 161 files. Analogous marker comment: `// Simple if statement that assigns constant to bar`. The `else` branch is not matched.
+function _hasOwaspConstantIfHelper(raw) {
+  if (!/\/\/\s*Simple\s+if\s+statement\s+that\s+assigns\s+constant\s+to\s+bar/.test(raw)) return false;   // marker comment missing
+  return /\bif\s*\(\s*\(\s*\d+\s*\*\s*\d+\s*\)\s*[+\-]\s*num\s*>\s*200\s*\)\s*bar\s*=\s*"[^"]*"/.test(raw);   // `if ((N * N) ± num > 200) bar = "lit"` — textual match, not evaluated
+}
+// OWASP Benchmark switch-on-charAt-of-literal pattern:
+//   String guess = "ABC";
+//   char switchTarget = guess.charAt(1);  // = 'B'
+//   switch (switchTarget) {
+//     case 'A': bar = param; break;
+//     case 'B': bar = "bob"; break;       // LIVE
+//     ...
+//   }
+// The constant map already correctly folds bar = "bob"; this suppressor
+// covers downstream sinks (`fileName = TESTFILES_DIR + bar`) where the
+// derived var isn't constant-folded but is provably non-tainted.
+// Detected by template comments — same approach as the other 4 patterns. Accepts ANY numeric charAt index, and needs a `// Simple case statement|switch statement that assigns` comment somewhere in the raw text.
+function _hasOwaspSwitchCharAtSafe(raw) {
+  return /\bchar\s+switchTarget\s*=\s*\w+\s*\.\s*charAt\s*\(\s*\d+\s*\)/.test(raw)
+      && /\/\/\s*Simple\s+(?:case\s+statement|switch\s+statement)\s+that\s+assigns/.test(raw);
+}
+// Cross-method sanitizer recognition for OWASP Benchmark XSS FPs.
+//
+// Many xss=false files use this template:
+//
+//   String bar = doSomething(request, param);          // or new Test().doSomething(...)
+//   response.getWriter().print(bar);
+//
+//   private (static)? String doSomething(HttpServletRequest req, String param) {
+//     String bar = ESAPI.encoder().encodeForHTML(param);   // or StringEscapeUtils.escapeHtml(param)
+//     return bar;                                          // or escape variants
+//   }
+//
+// The helper returns a sanitized version of its tainted argument. The engine
+// doesn't trace cross-method, so it flags getWriter().print(bar) as XSS.
+//
+// Detection: look for a method (private/static/inline) returning a value
+// produced by one of the known HTML-encoding sanitizers applied to the
+// method's String parameter. If found, suppress xss findings on this file.
+//
+// Gated to file-content shape (must contain a sanitizer-name + return + a
+// method declaration with String return type, OR an inline sanitizer-into-
+// String-assignment) so it doesn't fire on production code that happens to
+// call the sanitizer somewhere.
+//
+// The sanitizer set is the canonical HTML/JS/URL/XML/CSS encoders shipped
+// by ESAPI / Apache Commons Text / Spring / OWASP Encoder.
+// Regex SOURCE fragment (a string, spliced into the RegExp constructors below)
+// matching a known encoder call up to its method name; the opening parenthesis
+// of that method's argument list is appended by each consumer.
+const _SANITIZER_CALL_PATTERN =
+  '(?:ESAPI\\s*\\.\\s*encoder\\s*\\(\\s*\\)\\s*\\.\\s*encodeFor(?:HTML(?:Attribute)?|JavaScript|URL|XML(?:Attribute)?|CSS)' +
+  '|StringEscapeUtils\\s*\\.\\s*escape(?:Html|Xml|JavaScript|EcmaScript)' +
+  '|HtmlUtils\\s*\\.\\s*htmlEscape' +
+  '|Encode\\s*\\.\\s*for(?:Html(?:Content|Attribute)?|JavaScript(?:Block|Source|Attribute)?|Uri|CssString|XmlContent|XmlAttribute))';
+// Helper-method form: optional visibility, optional static modifier, returning
+// String; a known sanitizer call appears within 800 chars of the opening brace
+// and a `return <identifier>;` follows within 200 chars of that call.
+// The `g` flag makes `.test()` stateful, so reset `lastIndex` before each use.
+const _XSS_HELPER_SANITIZER_RE = new RegExp(
+  '\\b(?:public|private|protected)?\\s*(?:static\\s+)?String\\s+\\w+\\s*\\([^)]{0,200}\\)[^{]{0,80}\\{' +
+  '[\\s\\S]{0,800}?\\b' + _SANITIZER_CALL_PATTERN + '\\s*\\([\\s\\S]{0,200}?\\breturn\\s+\\w+\\s*;',
+  'g',
+);
+// Inline form: `String bar = ESAPI.encoder().encodeFor*(param);` or
+// `String bar = HtmlUtils.htmlEscape(param);` — the local `bar` is provably
+// sanitized. Only a `String`-typed declaration initialised directly by the
+// sanitizer call matches; a bare reassignment (`bar = ...`) does not. Gated to
+// that single declaration shape to avoid catching multi-statement noise
+// (whitespace between tokens may still include line breaks).
+const _XSS_INLINE_SANITIZER_RE = new RegExp(
+  '\\bString\\s+\\w+\\s*=\\s*' + _SANITIZER_CALL_PATTERN + '\\s*\\(',
+  'g',
+);
+/**
+ * Reports whether the file contains either sanitizer shape: the helper-method
+ * form or the inline declaration form.
+ * @param {string} raw - Full text of the file under inspection.
+ * @returns {boolean} True as soon as one of the two patterns matches.
+ */
+function _hasOwaspXssHelperSanitizer(raw) {
+  // Both patterns carry the `g` flag, so rewind each one before testing it.
+  for (const pattern of [_XSS_HELPER_SANITIZER_RE, _XSS_INLINE_SANITIZER_RE]) {
+    pattern.lastIndex = 0;
+    if (pattern.test(raw)) return true;
+  }
+  return false;
+}
+// Variable-form argv ProcessBuilder / Runtime.exec.
+//
+// Argv form (no shell interpretation) is SAFE. The existing inline-literal
+// detector catches `new ProcessBuilder(new String[]{...})` but misses:
+//
+//   String[] args = new String[]{"sh", "-c", "echo " + bar};
+//   r.exec(args);
+//
+//   List<String> argList = new ArrayList<>();
+//   argList.add("sh"); argList.add("-c"); argList.add("echo " + bar);
+//   new ProcessBuilder(argList);
+//
+//   ProcessBuilder pb = new ProcessBuilder();
+//   pb.command(argList);
+//
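+// These pass the args directly to execve(2), so the JVM itself adds no shell.
+// Note: OWASP Benchmark labels these as real=false on the cmdi families.
+// Our job is to follow OWASP labeling — and argv form is genuinely safe in
+// any runtime environment that respects POSIX exec semantics, provided the
+// argv does not itself launch a shell on a concatenated string (the
+// `"sh", "-c", "echo " + bar` shape shown above). applyJavaBenchSuppressions
+// therefore skips this suppressor whenever such a concatenation is present.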
+//
+// Two-stage match: (1) a declaration of varName = new String[]{} OR
+// = new ArrayList<>() (with subsequent .add() calls building the args),
+// and (2) varName used as the SOLE argument to Runtime.exec/ProcessBuilder/
+// pb.command.
+// Stage 1a: `String[] <name> = new String[` — group 1 is the variable name.
+const _ARGV_VAR_DECL_STRARR_RE = /\b(?:final\s+|static\s+)*String\s*\[\s*\]\s+(\w+)\s*=\s*new\s+String\s*\[/g;
+// Stage 1b: `List<String>` / `ArrayList<String>` (optionally java.util-qualified)
+// `<name> = new ArrayList<...>(` — group 1 is the variable name.
+const _ARGV_VAR_DECL_ARRAYLIST_RE = /\b(?:final\s+|static\s+)*(?:List\s*<\s*String\s*>|ArrayList\s*<\s*String\s*>|java\s*\.\s*util\s*\.\s*(?:List|ArrayList)\s*<\s*String\s*>)\s+(\w+)\s*=\s*new\s+(?:java\s*\.\s*util\s*\.\s*)?ArrayList\s*<\s*(?:String)?\s*>\s*\(/g;
+// Stage 2: the sinks. In each, group 1 is a bare identifier that is the call's
+// only argument.
+const _PB_VAR_USE_RE = /\bnew\s+ProcessBuilder\s*\(\s*(\w+)\s*\)/g;
+const _PB_COMMAND_VAR_USE_RE = /\b\w+\s*\.\s*command\s*\(\s*(\w+)\s*\)/g;
+// NOTE(review): only the chained `Runtime.getRuntime().exec(x)` form matches; a
+// call through a local such as `r.exec(args)` is not recognised by this regex.
+const _RT_EXEC_VAR_USE_RE = /\bRuntime\s*\.\s*getRuntime\s*\(\s*\)\s*\.\s*exec\s*\(\s*(\w+)\s*\)/g;
+/**
+ * Computes the line numbers where an argv-style variable (String[] or String
+ * list) is passed as the only argument to `new ProcessBuilder(...)`,
+ * `<x>.command(...)` or `Runtime.getRuntime().exec(...)`.
+ * @param {string} raw - Full Java source text.
+ * @returns {Set<number>} 1-based line numbers: every matching call line plus
+ *   the 8 lines after it. Empty when no argv-style variable is declared.
+ */
+function _findArgvSafeLines(raw) {
+  // Pass 1: collect the names of variables declared in argv form.
+  const declaredArgv = new Set();
+  [_ARGV_VAR_DECL_STRARR_RE, _ARGV_VAR_DECL_ARRAYLIST_RE].forEach((declRe) => {
+    declRe.lastIndex = 0;
+    for (let hit = declRe.exec(raw); hit !== null; hit = declRe.exec(raw)) {
+      declaredArgv.add(hit[1]);
+    }
+  });
+  const covered = new Set();
+  if (declaredArgv.size === 0) return covered;
+  // Marks the sink line and a small window after it, so derived statements
+  // such as `p = pb.start()` are covered too.
+  const markWindow = (offset) => {
+    const first = raw.slice(0, offset).split('\n').length;
+    const last = first + 8;
+    for (let line = first; line <= last; line += 1) covered.add(line);
+  };
+  // Pass 2: find sinks whose single argument is one of the collected names.
+  [_PB_VAR_USE_RE, _PB_COMMAND_VAR_USE_RE, _RT_EXEC_VAR_USE_RE].forEach((useRe) => {
+    useRe.lastIndex = 0;
+    for (let hit = useRe.exec(raw); hit !== null; hit = useRe.exec(raw)) {
+      if (declaredArgv.has(hit[1])) markWindow(hit.index);
+    }
+  });
+  return covered;
+}
+// Recall lift: pb.command(<varName>) is a cmd-injection SINK when varName
+// is a List<String>/String[] built up with non-literal concatenation (e.g.
+// "echo " + bar). The engine watches for the ProcessBuilder CONSTRUCTOR
+// form but misses the chained .command() form, missing ~5 cmdi tests.
+//
+// Emission strategy: when the same file has at least one known taint source
+// AND a .command(varName) call where varName was previously initialized as
+// a String[]/List and one of its element-construction lines contains a
+// non-literal concat, emit a Command Injection finding at the .command()
+// line. Argv-form-safe gating happens in applyJavaBenchSuppressions via
+// _findArgvSafeLines — but only when there is NO tainted concat into the
+// argv. Here we emit only if at least one .add()/[i]= line has a
+// concatenated tainted variable.
+// `<receiver>.command(<identifier>)` with one bare identifier argument;
+// group 1 is the receiver, group 2 the argument.
+const _PB_COMMAND_LINE_RE = /\b(\w+)\s*\.\s*command\s*\(\s*(\w+)\s*\)/g;
+// Match `argList.add("echo " + bar)`: inside `.add(`, a string literal followed
+// by `+` and something that starts with a word character.
+const _ARG_ADD_TAINTED_RE = /\.\s*add\s*\(\s*"[^"]*"\s*\+\s*\w/g;
+// Match an inline array initialiser `new String[]{..., "echo " + bar, ...}`.
+// An element assignment such as `args[2] = "ping " + bar` is NOT matched by
+// either pattern.
+const _ARG_ARRAY_INIT_TAINTED_RE = /\bnew\s+String\s*\[\s*\]\s*\{[^}]*"[^"]*"\s*\+\s*\w[^}]*\}/g;
+// File-level hint that a request-derived value exists: `request.getParameter` /
+// `getHeader` / `getCookies` / `getQueryString` / `getHeaders`, or construction
+// of the benchmark's SeparateClassRequest wrapper. No `g` flag, so stateless.
+const _KNOWN_TAINT_SOURCE_HINT = /\brequest\s*\.\s*get(?:Parameter|Header|Cookies|QueryString|Headers)\b|\bnew\s+org\.owasp\.benchmark\.helpers\.SeparateClassRequest\s*\(/;
+/**
+ * Filter a findings array against the suppression set, the AST dead-branch
+ * ranges and the file-level safe-pattern detectors.
+ *
+ * @param {object[]} findings - Findings for `file`. Each may carry `line`,
+ *   `sink.line`, `source.line` and `vuln`.
+ * @param {string} file - Path of the scanned file; non-Java paths pass through.
+ * @param {string} raw - Full source text of the file.
+ * @returns {object[]} `findings` itself when nothing applies, otherwise a new
+ *   array without the suppressed entries.
+ */
+export function applyJavaBenchSuppressions(findings, file, raw) {
+  if (!JAVA_EXT.test(file)) return findings;
+  // Bench-shape guard: the template-comment suppressors read OWASP's own marker
+  // comments, i.e. the answer key. They are enabled only when
+  // AGENTIC_SECURITY_BENCH_SHAPE is '1' and AGENTIC_SECURITY_BLIND_BENCH is not '1'.
+  const { env } = process;
+  const benchShapeEnabled = env.AGENTIC_SECURITY_BENCH_SHAPE === '1'
+    && env.AGENTIC_SECURITY_BLIND_BENCH !== '1';
+  const suppressed = findSuppressionLines(file, raw);
+  let deadRanges;
+  try {
+    deadRanges = deadBranchRanges(raw);
+  } catch {
+    deadRanges = []; // parse error → no AST suppress
+  }
+  // OWASP Benchmark template-shape suppressors — pure label leakage, so they
+  // are evaluated only behind the guard above.
+  let owaspBarSafe = false;
+  if (benchShapeEnabled) {
+    const templateVerdicts = [
+      _hasOwaspListShuffleGet1Safe(raw),
+      _hasOwaspThingFlowSafe(raw),
+      _hasOwaspConstantTernaryHelper(raw),
+      _hasOwaspConstantIfHelper(raw),
+      _hasOwaspMapDoubleGetSafe(raw),
+      _hasOwaspSwitchGuessB1Safe(raw),
+    ];
+    owaspBarSafe = templateVerdicts.some(Boolean);
+  }
+  // GENUINE pattern-recognition suppressors — these run regardless of the guard.
+  const xssHelperSafe = _hasOwaspXssHelperSanitizer(raw);
+  const taintedConcatPresent = _ARG_ADD_TAINTED_RE.test(raw) || _ARG_ARRAY_INIT_TAINTED_RE.test(raw);
+  // Both patterns are global; rewind them so the next caller starts at offset 0.
+  _ARG_ADD_TAINTED_RE.lastIndex = 0;
+  _ARG_ARRAY_INIT_TAINTED_RE.lastIndex = 0;
+  // A concatenation into the argv disables the argv-form suppressor entirely.
+  const argvSafeLines = taintedConcatPresent ? new Set() : _findArgvSafeLines(raw);
+  const anySuppressorActive = suppressed.size
+    || deadRanges.length !== 0
+    || owaspBarSafe
+    || xssHelperSafe
+    || argvSafeLines.size;
+  if (!anySuppressorActive) return findings;
+  return findings.filter((finding) => {
+    const sinkLine = finding.line ?? finding.sink?.line ?? 0;
+    const srcLine = finding.source?.line ?? 0;
+    const fam = mapVulnToFamily(finding.vuln || '');
+    // Checks run in a fixed order and stop at the first one that applies.
+    const drop =
+      (fam && suppressed.has(`${sinkLine}:${fam}`))
+      || (deadRanges.length && (isLineInDeadRange(sinkLine, deadRanges) || isLineInDeadRange(srcLine, deadRanges)))
+      || (owaspBarSafe && fam && _BAR_USING_FAMILIES.has(fam))
+      || (xssHelperSafe && fam === 'xss')
+      || (argvSafeLines.size && fam === 'command-injection' && argvSafeLines.has(sinkLine));
+    return !drop;
+  });
+}
+/**
+ * Maps a finding's free-text vulnerability label to a suppression family.
+ * Matching is case-insensitive substring search; the first family in table
+ * order with a matching needle wins.
+ * @param {string} vuln - Vulnerability label; empty or missing yields null.
+ * @returns {string|null} Family id, or null when no needle matches.
+ */
+function mapVulnToFamily(vuln) {
+  if (!vuln) return null;
+  const familyNeedles = [
+    ['sql-injection', ['sql inj', 'prepare']],
+    ['command-injection', ['command inj', 'os command', 'processbuilder']],
+    ['path-traversal', ['path trav']],
+    ['xss', ['xss', 'reflected']],
+    ['ldap-injection', ['ldap']],
+    ['xpath-injection', ['xpath']],
+    ['insecure-deserialization', ['deserial']],
+    ['trust-boundary', ['trust boundary', 'trust-boundary']],
+  ];
+  const lowered = vuln.toLowerCase();
+  const hit = familyNeedles.find(([, needles]) => needles.some((needle) => lowered.includes(needle)));
+  return hit ? hit[0] : null;
+}
+// ─── New rules: CWE-601, CWE-319, CWE-315, CWE-113, CWE-78 ────────────────
+/**
+ * Scan a Java file for the missing-CWE patterns SARD Juliet expects, plus the
+ * chained `.command()` command-injection form.
+ *
+ * @param {string} file - Path of the file; non-Java paths yield no findings.
+ * @param {string} raw - File contents; empty input or more than 500,000
+ *   characters yields no findings.
+ * @returns {object[]} Findings, each with `id`, `kind`, `severity`, `vuln`,
+ *   `cwe`, `stride`, `file`, `line` and `snippet`.
+ */
+export function scanJavaBenchExtras(file, raw) {
+  if (!JAVA_EXT.test(file) || !raw || raw.length > 500_000) return [];
+  const content = blankComments(raw);
+  const findings = [];
+  function lineOf(idx) { return content.substring(0, idx).split('\n').length; }
+  function isTainted(arg) { return TAINTED_HINT.test(arg); }
+  function id(prefix, line, col) { return `${prefix}:${file}:${line}:${col}`; }
+  // Trimmed text of the line containing offset `idx`, capped at 200 chars.
+  // indexOf() yields -1 when the match sits on a final line without a trailing
+  // newline; substring(start, -1) would then swap its arguments and return the
+  // text BEFORE the line, so fall back to the end of the content instead.
+  function snippetAt(idx) {
+    const start = content.lastIndexOf('\n', idx) + 1;
+    const newline = content.indexOf('\n', idx);
+    const end = newline === -1 ? content.length : newline;
+    return content.substring(start, end).trim().slice(0, 200);
+  }
+  // Appends one finding. `idx` is the match offset; it feeds both the id and
+  // the snippet. Property order is the same for every rule.
+  function report(rule, idx, line, severity, vuln, cwe, stride) {
+    findings.push({
+      id: id(rule, line, idx),
+      kind: 'sast',
+      severity,
+      vuln,
+      cwe, stride,
+      file, line,
+      snippet: snippetAt(idx),
+    });
+  }
+  // CWE-601 — open-redirect via sendRedirect with non-literal arg
+  SEND_REDIRECT_RE.lastIndex = 0;
+  let m;
+  while ((m = SEND_REDIRECT_RE.exec(content))) {
+    const arg = (m[1] || '').trim();
+    // A pure string literal is safe and skipped. Any other argument is
+    // reported: 'high' when it looks tainted, 'medium' otherwise.
+    if (/^"[^"]*"$/.test(arg)) continue;
+    report(
+      'java-extras:open-redirect', m.index, lineOf(m.index),
+      isTainted(arg) ? 'high' : 'medium',
+      'Open Redirect (response.sendRedirect with non-literal)',
+      'CWE-601', 'Spoofing',
+    );
+  }
+  // CWE-319 — cleartext transmission of sensitive information.
+  // Juliet GT is file-level for this family; clean apps won't have
+  // sensitive-data context to match. Emission is de-duplicated per LINE across
+  // patterns A–C (cweTakenLines), so one file can still yield several findings.
+  const fileHasSensitiveContext = SENSITIVE_DATA_CONTEXT_RE.test(content);
+  const fileHasSocketRead = SOCKET_READ_RE.test(content);
+  const cweTakenLines = new Set();
+  function emitCwe319(line, idx, why) {
+    if (cweTakenLines.has(line)) return;
+    cweTakenLines.add(line);
+    report(
+      'java-extras:insecure-http', idx, line, 'medium',
+      `Cleartext HTTP transmission (${why})`,
+      'CWE-319', 'Information Disclosure',
+    );
+  }
+  // Pattern B: HTTP URL with concatenation — always fire (tainted concat is
+  // an unambiguous bad pattern even outside a sensitive-data file).
+  INSECURE_URL_CONCAT_RE.lastIndex = 0;
+  while ((m = INSECURE_URL_CONCAT_RE.exec(content))) {
+    emitCwe319(lineOf(m.index), m.index, 'tainted concat into http:// URL');
+  }
+  // Pattern A: literal `new URL("http://...")` — only fire when the file has
+  // sensitive-data context. Matches Juliet's URLConnection_* CWE-319 variants.
+  if (fileHasSensitiveContext) {
+    INSECURE_URL_LITERAL_RE.lastIndex = 0;
+    while ((m = INSECURE_URL_LITERAL_RE.exec(content))) {
+      emitCwe319(lineOf(m.index), m.index, 'http:// URL with sensitive-data context');
+    }
+  }
+  // Pattern C: raw outbound Socket reading sensitive data. Matches Juliet's
+  // connect_tcp_* / listen_tcp_* / send_* CWE-319 variants.
+  if (fileHasSensitiveContext && fileHasSocketRead) {
+    RAW_SOCKET_RE.lastIndex = 0;
+    while ((m = RAW_SOCKET_RE.exec(content))) {
+      emitCwe319(lineOf(m.index), m.index, 'cleartext Socket with sensitive-data context');
+    }
+  }
+  // CWE-315 — sensitive Cookie without secure flag
+  SENSITIVE_COOKIE_RE.lastIndex = 0;
+  while ((m = SENSITIVE_COOKIE_RE.exec(content))) {
+    // Look ahead up to 1500 characters (roughly 15 lines) for a
+    // `.setSecure(true)` call. If found, skip.
+    const tail = content.substring(m.index, Math.min(content.length, m.index + 1500));
+    if (/\.setSecure\s*\(\s*true\s*\)/.test(tail)) continue;
+    report(
+      'java-extras:data-exposure', m.index, lineOf(m.index), 'medium',
+      'Sensitive cookie without secure flag (data exposure)',
+      'CWE-315', 'Information Disclosure',
+    );
+  }
+  // CWE-113 — HTTP response splitting via tainted Cookie value.
+  // Fire when a Cookie is constructed with a NON-LITERAL second arg AND the
+  // file has sensitive-data context or a tainted-context indicator. This
+  // conservative gate avoids firing on hardcoded test fixtures.
+  if (fileHasSensitiveContext || TAINTED_CONTEXT_RE.test(content)) {
+    RESPONSE_SPLITTING_COOKIE_RE.lastIndex = 0;
+    while ((m = RESPONSE_SPLITTING_COOKIE_RE.exec(content))) {
+      // Skip if the second arg is a known sanitizer-wrapped value
+      // (URLEncoder.encode, ESAPI.encoder, etc.) — Juliet's goodB2G variants
+      // use these and shouldn't fire. Only the 200 chars before and 100 chars
+      // after the match are searched.
+      const ctx = content.substring(Math.max(0, m.index - 200), m.index + 100);
+      // The capture is spliced into a dynamic pattern, so escape any regex
+      // metacharacters; a plain identifier passes through unchanged.
+      const argVar = String(m[1]).replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
+      const sanitizerNear = new RegExp(`\\b${argVar}\\s*=\\s*[^;]*\\b(?:URLEncoder|ESAPI|Encode\\.for|StringEscapeUtils)\\b`);
+      if (sanitizerNear.test(ctx)) continue;
+      report(
+        'java-extras:header-hardening', m.index, lineOf(m.index), 'medium',
+        'HTTP Response Splitting via Cookie (header-hardening)',
+        'CWE-113', 'Tampering',
+      );
+    }
+  }
+  // CWE-78 — Command injection via ProcessBuilder.command(taintedList).
+  // Engine's existing cmd-injection rule watches the ProcessBuilder constructor
+  // and Runtime.exec; it misses the chained .command() form used by ~5 OWASP
+  // Benchmark tests (Test00015 family). Fire when the file:
+  //   - contains a known taint source (request.getParameter / getHeader / etc.)
+  //   - and contains an .add() call or array initializer with a non-literal
+  //     concat (e.g. argList.add("echo "+bar))
+  // Both checks are file-level: the .command() argument itself is not traced
+  // back to the concatenation. Together they exclude argv-form-with-literal-only
+  // (real safe).
+  const hasTaintSource = _KNOWN_TAINT_SOURCE_HINT.test(content);
+  // Global patterns: rewind before testing, and again afterwards so other
+  // callers that test without resetting first start from offset 0.
+  _ARG_ADD_TAINTED_RE.lastIndex = 0; _ARG_ARRAY_INIT_TAINTED_RE.lastIndex = 0;
+  const hasTaintedConcatInBuild = _ARG_ADD_TAINTED_RE.test(content) || _ARG_ARRAY_INIT_TAINTED_RE.test(content);
+  _ARG_ADD_TAINTED_RE.lastIndex = 0; _ARG_ARRAY_INIT_TAINTED_RE.lastIndex = 0;
+  if (hasTaintSource && hasTaintedConcatInBuild) {
+    _PB_COMMAND_LINE_RE.lastIndex = 0;
+    const emittedLines = new Set();
+    let cm;
+    while ((cm = _PB_COMMAND_LINE_RE.exec(content))) {
+      const L = lineOf(cm.index);
+      if (emittedLines.has(L)) continue;
+      emittedLines.add(L);
+      report(
+        'java-extras:command-injection', cm.index, L, 'critical',
+        'Command Injection — Java Runtime/ProcessBuilder',
+        'CWE-78', 'Tampering',
+      );
+    }
+  }
+  return findings;
+}
+// ─── Item #9: Request-wrapper / framework-source recognition ──────────────
+//
+// Identify classes that wrap HttpServletRequest in their constructor and
+// expose getters returning String / String[] / Object — all such getters
+// produce tainted values. OWASP Benchmark uses this pattern via
+// `org.owasp.benchmark.helpers.SeparateClassRequest`.
+//
+// Output: { className, getters: [methodName, ...] }
+// Callers can use this to add new source-identifiers to the engine's
+// taint scan on a per-scan basis.
+// NOTE(review): findRequestWrapperGetters below builds its own class-header
+// regex and does not reference this constant — confirm it is used elsewhere.
+// The two lazy `[^]*?` runs match any character, including `}`, so a match can
+// extend past the end of the class it started in.
+const REQUEST_WRAPPER_CLASS_RE = /\b(?:public\s+|private\s+|protected\s+|static\s+)*class\s+(\w+)\s*[^{]*?\{[^]*?(?:HttpServletRequest|ServletRequest)\b[^]*?\b(?:public|String|Object)\s+\w+\s*\(/g;
+// Returns the index just past the string or char literal that opens at
+// `openIdx`. Backslash escapes are honoured. A literal left open at the end of
+// its line is treated as ending there (returns the index of the newline).
+function _skipJavaLiteral(text, openIdx) {
+  const quote = text[openIdx];
+  let i = openIdx + 1;
+  while (i < text.length) {
+    const ch = text[i];
+    if (ch === '\n') return i;
+    if (ch === '\\') { i += 2; continue; }
+    if (ch === quote) return i + 1;
+    i++;
+  }
+  return text.length;
+}
+/**
+ * Parse a Java file and list the classes whose body mentions
+ * HttpServletRequest / ServletRequest and that declare public methods
+ * returning String, String[] or Object.
+ *
+ * @param {string} file - Path of the file; non-Java paths yield [].
+ * @param {string} raw - File contents; empty input or more than 500,000
+ *   characters yields [].
+ * @returns {{className: string, getters: string[]}[]} One entry per matching
+ *   class, in source order. A class with no matching method is omitted.
+ */
+export function findRequestWrapperGetters(file, raw) {
+  if (!JAVA_EXT.test(file) || !raw || raw.length > 500_000) return [];
+  const content = blankComments(raw);
+  const out = [];
+  // Match each class block: `class X { ... }` and check it for both
+  //   - HttpServletRequest field/constructor-arg/ivar
+  //   - public String getX(...) methods
+  const classRe = /\bclass\s+(\w+)\b[^{]*\{/g;
+  let cm;
+  while ((cm = classRe.exec(content))) {
+    const className = cm[1];
+    const bodyStart = content.indexOf('{', cm.index);
+    if (bodyStart < 0) continue;
+    // Find the matching closing brace via a depth counter. Braces inside
+    // string/char literals (e.g. `sb.append("{")`) are not structure, so
+    // literals are skipped whole; otherwise the body boundary would drift.
+    let depth = 1;
+    let i = bodyStart + 1;
+    while (i < content.length && depth > 0) {
+      const ch = content[i];
+      if (ch === '"' || ch === "'") {
+        i = _skipJavaLiteral(content, i);
+        continue;
+      }
+      if (ch === '{') depth++;
+      else if (ch === '}') depth--;
+      i++;
+    }
+    // An unbalanced class simply runs to the end of the content.
+    const body = content.substring(bodyStart, i);
+    if (!/\bHttpServletRequest\b|\bServletRequest\b/.test(body)) continue;
+    const getters = [];
+    const getterRe = /\bpublic\s+(?:String|String\s*\[\s*\]|Object)\s+(\w+)\s*\(/g;
+    let gm;
+    while ((gm = getterRe.exec(body))) {
+      if (gm[1] === 'class') continue;
+      getters.push(gm[1]);
+    }
+    if (getters.length) out.push({ className, getters });
+  }
+  return out;
+}