PyPI - tweek - Versions diffs - 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

tweek 0.1.0-py3-none-any.whl → 0.2.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85)

tweek/__init__.py +2 -2
tweek/_keygen.py +53 -0
tweek/audit.py +288 -0
tweek/cli.py +5303 -2396
tweek/cli_model.py +380 -0
tweek/config/families.yaml +609 -0
tweek/config/manager.py +42 -5
tweek/config/patterns.yaml +1510 -8
tweek/config/tiers.yaml +161 -11
tweek/diagnostics.py +71 -2
tweek/hooks/break_glass.py +163 -0
tweek/hooks/feedback.py +223 -0
tweek/hooks/overrides.py +531 -0
tweek/hooks/post_tool_use.py +472 -0
tweek/hooks/pre_tool_use.py +1024 -62
tweek/integrations/openclaw.py +443 -0
tweek/integrations/openclaw_server.py +385 -0
tweek/licensing.py +14 -54
tweek/logging/bundle.py +2 -2
tweek/logging/security_log.py +56 -13
tweek/mcp/approval.py +57 -16
tweek/mcp/proxy.py +18 -0
tweek/mcp/screening.py +5 -5
tweek/mcp/server.py +4 -1
tweek/memory/__init__.py +24 -0
tweek/memory/queries.py +223 -0
tweek/memory/safety.py +140 -0
tweek/memory/schemas.py +80 -0
tweek/memory/store.py +989 -0
tweek/platform/__init__.py +4 -4
tweek/plugins/__init__.py +40 -24
tweek/plugins/base.py +1 -1
tweek/plugins/detectors/__init__.py +3 -3
tweek/plugins/detectors/{moltbot.py → openclaw.py} +30 -27
tweek/plugins/git_discovery.py +16 -4
tweek/plugins/git_registry.py +8 -2
tweek/plugins/git_security.py +21 -9
tweek/plugins/screening/__init__.py +10 -1
tweek/plugins/screening/heuristic_scorer.py +477 -0
tweek/plugins/screening/llm_reviewer.py +14 -6
tweek/plugins/screening/local_model_reviewer.py +161 -0
tweek/proxy/__init__.py +38 -37
tweek/proxy/addon.py +22 -3
tweek/proxy/interceptor.py +1 -0
tweek/proxy/server.py +4 -2
tweek/sandbox/__init__.py +11 -0
tweek/sandbox/docker_bridge.py +143 -0
tweek/sandbox/executor.py +9 -6
tweek/sandbox/layers.py +97 -0
tweek/sandbox/linux.py +1 -0
tweek/sandbox/project.py +548 -0
tweek/sandbox/registry.py +149 -0
tweek/security/__init__.py +9 -0
tweek/security/language.py +250 -0
tweek/security/llm_reviewer.py +1146 -60
tweek/security/local_model.py +331 -0
tweek/security/local_reviewer.py +146 -0
tweek/security/model_registry.py +371 -0
tweek/security/rate_limiter.py +11 -6
tweek/security/secret_scanner.py +70 -4
tweek/security/session_analyzer.py +26 -2
tweek/skill_template/SKILL.md +200 -0
tweek/skill_template/__init__.py +0 -0
tweek/skill_template/cli-reference.md +331 -0
tweek/skill_template/overrides-reference.md +184 -0
tweek/skill_template/scripts/__init__.py +0 -0
tweek/skill_template/scripts/check_installed.py +170 -0
tweek/skills/__init__.py +38 -0
tweek/skills/config.py +150 -0
tweek/skills/fingerprints.py +198 -0
tweek/skills/guard.py +293 -0
tweek/skills/isolation.py +469 -0
tweek/skills/scanner.py +715 -0
tweek/vault/__init__.py +0 -1
tweek/vault/cross_platform.py +12 -1
tweek/vault/keychain.py +87 -29
tweek-0.2.0.dist-info/METADATA +281 -0
tweek-0.2.0.dist-info/RECORD +121 -0
{tweek-0.1.0.dist-info → tweek-0.2.0.dist-info}/entry_points.txt +8 -1
{tweek-0.1.0.dist-info → tweek-0.2.0.dist-info}/licenses/LICENSE +80 -0
tweek/integrations/moltbot.py +0 -243
tweek-0.1.0.dist-info/METADATA +0 -335
tweek-0.1.0.dist-info/RECORD +0 -85
{tweek-0.1.0.dist-info → tweek-0.2.0.dist-info}/WHEEL +0 -0
{tweek-0.1.0.dist-info → tweek-0.2.0.dist-info}/top_level.txt +0 -0

tweek/config/patterns.yaml CHANGED

@@ -1,7 +1,7 @@
 # Tweek Attack Pattern Definitions v3
-# All 116 patterns included FREE
+# All 215 patterns included FREE
 #
-# Update via: tweek update (pulls from github.com/gettweek/tweek-patterns)
+# Update via: tweek update (pulls from github.com/gettweek/tweek)
 #
 # Fields:
 #   id: Sequential pattern number
@@ -9,6 +9,7 @@
 #   description: Human-readable explanation
 #   regex: Python regex pattern
 #   severity: critical | high | medium | low
+#   confidence: deterministic | heuristic | contextual
 #
 # Severity guide:
 #   critical - Almost certainly malicious
@@ -16,10 +17,15 @@
 #   medium - Suspicious, warrants review
 #   low - Unusual but possibly legitimate
 #
+#
+# Confidence guide:
+#   deterministic - Near-zero false positive rate; precise file/command targeting
+#   heuristic - Good detection signal; may FP in legitimate security contexts
+#   contextual - Depends on surrounding context; broad behavioral pattern
 # PRO tier adds: LLM review, session analysis, rate limiting
-version: 3
-pattern_count: 116
+version: 5
+pattern_count: 259
 patterns:
   # ============================================================================
@@ -33,60 +39,80 @@ patterns:
     description: "Reading SSH private keys"
     regex: '(cat|head|tail|less|more)\s+.*\.ssh/(id_rsa|id_ed25519|id_ecdsa|id_dsa)(?!\.pub)'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 2
     name: aws_credentials
     description: "Accessing AWS credential files"
     regex: '(cat|head|tail|less|more)\s+.*\.aws/(credentials|config)'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 3
     name: env_file_access
     description: "Attempts to read .env files containing secrets"
     regex: '(cat|head|tail|less|more|bat|grep|rg|ag)\s+.*\.env'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 4
     name: keychain_dump
     description: "Extracting credentials from macOS Keychain"
     regex: '(security\s+dump-keychain|security\s+find-(generic|internet)-password\s+.*-w|chainbreaker|security\s+export)'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 5
     name: gcloud_credentials
     description: "Accessing Google Cloud credentials"
     regex: '(cat|head|tail|less|more)\s+.*\.config/gcloud'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 6
     name: netrc_access
     description: "Accessing .netrc (contains plaintext passwords)"
     regex: '(cat|head|tail|less|more)\s+.*\.netrc'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 7
     name: kube_config
     description: "Accessing Kubernetes config"
     regex: '(cat|head|tail|less|more)\s+.*\.kube/config'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 8
     name: ssh_directory_access
     description: "Accessing SSH directory contents"
     regex: '(ls|find|cat)\s+.*\.ssh'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 9
     name: env_variable_expansion
     description: "Accessing environment variables containing secrets"
     regex: '\$\{?(API_KEY|SECRET|TOKEN|PASSWORD|CREDENTIAL|PRIVATE_KEY|AUTH)[A-Z_]*\}?'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 10
     name: history_access
     description: "Reading shell history (may contain secrets)"
     regex: '(cat|head|tail|less|more|grep)\s+.*(\.bash_history|\.zsh_history|\.history)'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   # --- Network Exfiltration ---
   - id: 11
@@ -94,36 +120,48 @@ patterns:
     description: "Curl sending data that may include secrets"
     regex: 'curl\s+.*(-d|--data|--data-raw|--data-binary)\s+.*\$\('
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 12
     name: exfil_paste_sites
     description: "Data sent to known paste/exfil sites"
     regex: '(curl|wget|http).*?(pastebin\.com|hastebin\.com|ghostbin|0x0\.st|transfer\.sh|file\.io|webhook\.site|requestbin|ngrok\.io|pipedream)'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 13
     name: netcat_outbound
     description: "Netcat connection (potential reverse shell or exfil)"
     regex: '\b(nc|ncat|netcat)\b.*(-e|exec)'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 14
     name: reverse_shell
     description: "Creating reverse shell connections"
     regex: '(python|ruby|perl|php).*socket.*connect.*(exec|system|spawn)|bash\s+-i.*>&.*/dev/tcp/'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 15
     name: curl_post_file
     description: "Curl uploading local files"
     regex: 'curl\s+.*(-F|--form|-T|--upload-file)\s+'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 16
     name: pipe_to_shell
     description: "Piping remote content directly to shell"
     regex: '(curl|wget).*\|\s*(bash|sh|zsh|python|perl|ruby)'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   # --- Prompt Injection (basic) ---
   - id: 17
@@ -131,31 +169,41 @@ patterns:
     description: "Direct attempt to override system instructions"
     regex: '(ignore|disregard|forget|override)\s+(previous|prior|system|all|above)\s+(instructions|prompt|rules|constraints|directives)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 18
     name: role_hijack
     description: "Attempting to assume new identity/role"
     regex: '(you\s+are\s+now|act\s+as|pretend\s+to\s+be|your\s+new\s+role\s+is|from\s+now\s+on\s+you\s+are)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 19
     name: privilege_claim
     description: "False claims of elevated privileges"
     regex: '(as\s+(the\s+)?(admin|root|owner|developer|superuser)|i\s+have\s+(admin|root|elevated)\s+access|authorized\s+to|i\s+am\s+the\s+owner)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   # --- Destructive Commands ---
   - id: 20
     name: recursive_delete_root
     description: "Recursive deletion from root or home"
-    regex: 'rm\s+.*-[rf]*\s+(/|~|\$HOME)\s*$'
+    regex: '(?:^|[;&|]\s*)rm\s+(-[a-zA-Z]*[rf][a-zA-Z]*\s+)+\s*(\/(?:\s|;|&|\||$)|~(?:\s|\/|;|&|\||$)|\$HOME(?:\s|\/|;|&|\||$)|\/(?:etc|var|usr|bin|sbin|root|home|boot|lib|opt|srv)(?:\s|\/|;|&|\||$))'
     severity: critical
+    confidence: deterministic
+    family: destructive_ops
   - id: 21
     name: disk_wipe
     description: "Disk wiping commands"
     regex: 'dd\s+if=/dev/(zero|urandom)\s+of=/dev/(sd|hd|nvme)|mkfs\s+/dev/'
     severity: critical
+    confidence: deterministic
+    family: destructive_ops
   # --- Config Manipulation ---
   - id: 22
@@ -163,12 +211,16 @@ patterns:
     description: "Writing to auto-approve configurations"
     regex: '(autoApprove|auto_approve|autorun|auto_execute|allowAll)\s*[=:]\s*"?(true|1|yes)"?'
     severity: critical
+    confidence: deterministic
+    family: persistence
   - id: 23
     name: hook_bypass
     description: "Attempting to bypass or disable hooks"
     regex: '(disable|skip|bypass|remove).*hook|--no-verify|pre-commit.*disable|\.git/hooks'
     severity: high
+    confidence: heuristic
+    family: persistence
   # ============================================================================
   # ADVANCED DETECTION (24-116)
@@ -181,48 +233,64 @@ patterns:
     description: "Accessing NPM authentication tokens"
     regex: '(cat|head|tail|less|more)\s+.*\.npmrc'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 25
     name: docker_config_access
     description: "Accessing Docker credentials"
     regex: '(cat|head|tail|less|more)\s+.*\.docker/config\.json'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 26
     name: pypirc_access
     description: "Accessing PyPI credentials"
     regex: '(cat|head|tail|less|more)\s+.*\.pypirc'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 27
     name: git_credentials_access
     description: "Accessing Git credential store"
     regex: '(cat|head|tail|less|more)\s+.*\.git-credentials'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   - id: 28
     name: azure_credentials
     description: "Accessing Azure credentials"
     regex: '(cat|head|tail|less|more)\s+.*\.azure/(credentials|config)'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 29
     name: env_command
     description: "Dumping all environment variables"
-    regex: '\benv\b|\bprintenv\b|\bexport\s*$'
+    regex: '^\s*env\s*$|^\s*env\s+-|\bprintenv\b|\bexport\s*$'
     severity: medium
+    confidence: heuristic
+    family: credential_theft
   - id: 30
     name: browser_credential_theft
     description: "Accessing browser saved passwords and cookies"
     regex: '(Login\s*Data|key4\.db|logins\.json|Cookies\.binarycookies|~/Library/(Safari|Application\s*Support/(Google/)?Chrome)/.*\.(db|sqlite))'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   - id: 31
     name: crypto_wallet_theft
     description: "Accessing cryptocurrency wallet files"
     regex: '(wallet\.dat|\.wallet|seed\.txt|mnemonic|Electrum|Exodus|MetaMask|\.ethereum/keystore|Atomic.*Wallet)'
     severity: critical
+    confidence: deterministic
+    family: credential_theft
   # --- Advanced Network Exfiltration ---
   - id: 32
@@ -230,48 +298,64 @@ patterns:
     description: "Wget sending POST data"
     regex: 'wget\s+.*--post-(data|file)'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 33
     name: base64_curl_pipe
     description: "Base64 encoded data piped to curl (obfuscated exfil)"
     regex: 'base64.*\|\s*curl|curl.*base64'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 34
     name: dns_exfiltration
     description: "Data exfiltration via DNS queries"
     regex: '(dig|nslookup|host)\s+.*\$\(|dns.*tunnel|iodine|dnscat'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 35
     name: icmp_tunnel
     description: "Data exfiltration via ICMP"
     regex: 'ping.*\$\(|icmp.*tunnel|ptunnel'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 36
     name: curl_with_env
     description: "Curl command accessing environment variables"
     regex: 'curl.*\$\{?(API_KEY|SECRET|TOKEN|PASSWORD|AUTH)'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   - id: 37
     name: webhook_exfil
     description: "Data sent to webhook endpoints"
     regex: '(curl|wget|http).*?(hooks\.slack\.com|discord\.com/api/webhooks|api\.telegram\.org)'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 38
     name: git_exfil
     description: "Exfiltration via git operations"
     regex: 'git\s+(push|commit).*\.(env|pem|key)|git.*remote.*add.*http'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 39
     name: scp_exfil
     description: "File transfer via SCP to external hosts"
     regex: 'scp\s+.*(\.env|\.pem|\.key|credentials|secrets).*@'
     severity: critical
+    confidence: deterministic
+    family: data_exfiltration
   # --- Prompt Injection - Evasive (40-55) ---
   - id: 40
@@ -279,66 +363,88 @@ patterns:
     description: "Claiming test/debug mode to bypass restrictions"
     regex: '(this\s+is\s+(a\s+)?test|testing\s+mode|debug\s+mode|in\s+development|sandbox\s+mode|simulation)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 41
     name: context_reset
     description: "Attempting to reset conversation context"
     regex: '(reset\s+context|clear\s+memory|start\s+fresh|new\s+conversation|forget\s+everything)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 42
     name: system_prompt_extract
     description: "Attempting to extract system prompt"
-    regex: '(what\s+(is|are)\s+your\s+(system\s+)?instructions|show\s+me\s+your\s+prompt|reveal\s+your\s+rules|print\s+system\s+prompt)'
+    regex: '(what\s+(is|are|were)\s+your\s+(system\s+|initial\s+|original\s+|core\s+|complete\s+)?(instructions|prompt|configuration|config|rules|guidelines|directives|constraints)|show\s+(me\s+)?your\s+(system\s+)?prompt|reveal\s+your\s+(rules|prompt|instructions|configuration)|(output|share|display|provide|repeat|dump|print)\s+(your|the)\s+(system\s+)?(prompt|instructions|configuration|config|rules|guidelines)|list\s+(all\s+)?(the\s+)?(rules|instructions|guidelines|constraints)\s+(you|that\s+you)\s+follow|what\s+(instructions|rules|guidelines)\s+were\s+you\s+given|what\s+were\s+you\s+(told|instructed|configured|initialized)\s+(to\s+do|with))'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 43
     name: jailbreak_dan
     description: "Known jailbreak patterns (DAN, etc.)"
     regex: '(do\s+anything\s+now|DAN\s+mode|developer\s+mode\s+enabled|jailbreak|unlock\s+mode)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 44
     name: base64_instruction
     description: "Base64 encoded instructions (obfuscation)"
     regex: 'base64\s*[:-]?\s*[A-Za-z0-9+/=]{40,}'
     severity: high
+    confidence: heuristic
+    family: evasion_techniques
   - id: 45
     name: unicode_obfuscation
     description: "Zero-width or invisible unicode characters"
     regex: '[\u200b-\u200f\u2028-\u202f\ufeff\u00ad]'
     severity: high
+    confidence: heuristic
+    family: evasion_techniques
   - id: 46
     name: delimiter_injection
     description: "LLM-specific delimiter injection"
     regex: '(<\|im_start\|>|<\|im_end\|>|\[INST\]|\[/INST\]|</s><s>|<\|endoftext\|>|<\|system\|>|<\|user\|>|<\|assistant\|>)'
     severity: critical
+    confidence: deterministic
+    family: evasion_techniques
   - id: 47
     name: markdown_hidden
     description: "Instructions hidden in HTML/Markdown comments"
     regex: '<!--.*?(ignore|system|instruction|execute|override|bypass).*?-->'
     severity: high
+    confidence: heuristic
+    family: evasion_techniques
   - id: 48
     name: hex_encoded_command
     description: "Hex-encoded commands (obfuscation)"
     regex: '\\x[0-9a-fA-F]{2}(\\x[0-9a-fA-F]{2}){5,}'
     severity: high
+    confidence: heuristic
+    family: evasion_techniques
   - id: 49
     name: rot13_obfuscation
     description: "ROT13 or similar simple cipher obfuscation"
     regex: 'vtaber\s+cerivbhf|rknzvar\s+gur'
     severity: medium
+    confidence: contextual
+    family: evasion_techniques
   - id: 50
     name: leetspeak_bypass
     description: "L33tspeak to bypass filters"
     regex: '(1gn0r3|byp4ss|h4ck|3x3cut3|syst3m)'
     severity: medium
+    confidence: contextual
+    family: evasion_techniques
   # --- Prompt Injection - Social/Cognitive (51-60) ---
   - id: 51
@@ -346,60 +452,80 @@ patterns:
     description: "False urgency to bypass careful analysis"
     regex: '(urgent|immediately|critical|emergency|asap|time-sensitive|right\s+now)\s+(need|require|must|execute|do\s+this)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 52
     name: authority_claim
     description: "False authority claims"
     regex: '(ceo|cto|ciso|manager|supervisor|security\s+team|it\s+department)\s+(asked|requested|authorized|approved|ordered)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 53
     name: reciprocity_exploit
     description: "Exploiting reciprocity bias"
     regex: '(i\s+helped\s+you|you\s+owe|in\s+return|quid\s+pro\s+quo|do\s+me\s+a\s+favor)'
     severity: low
+    confidence: contextual
+    family: prompt_injection
   - id: 54
     name: empathy_exploit
     description: "Exploiting empathy/sympathy"
     regex: '(please\s+help|i\s+will\s+lose\s+my\s+job|desperate|life\s+depends|only\s+you\s+can)'
     severity: low
+    confidence: contextual
+    family: prompt_injection
   - id: 55
     name: flattery_manipulation
     description: "Excessive flattery to manipulate"
     regex: '(you\s+are\s+so\s+smart|only\s+you\s+can\s+do\s+this|you\s+are\s+the\s+best|i\s+trust\s+you\s+completely)'
     severity: low
+    confidence: contextual
+    family: prompt_injection
   - id: 56
     name: authority_laundering
     description: "False claims of external authorization"
     regex: '(my\s+(security\s+)?team|manager|supervisor|it\s+department)\s+(approved|authorized|verified|confirmed|said\s+it.s\s+ok)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 57
     name: moral_coercion
     description: "Exploiting ethics/sympathy to bypass safety"
     regex: '(someone\s+will\s+(die|get\s+hurt)|life\s+depends|people\s+are\s+in\s+danger|save\s+lives|prevent\s+harm)\s+(if\s+you\s+don.t|unless\s+you)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 58
     name: benign_transformation_loophole
     description: "Requesting translation of prohibited content"
     regex: '(translate|summarize|paraphrase|rewrite|explain)\s+(this|the)\s+(malware|exploit|attack|payload|shellcode)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 59
     name: hypothetical_operational
     description: "Hypothetical framing for operational content"
-    regex: '(hypothetically|theoretically|for\s+a\s+novel|in\s+fiction|imagine\s+if)\s+.{0,50}(how\s+to|steps\s+to|create|build|make)'
+    regex: '(hypothetically|theoretically|for\s+a\s+novel|in\s+fiction|imagine\s+if)[,;]?\s+.{0,50}(how\s+to|steps\s+to|create|build|make)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 60
     name: capability_aggregation_signal
     description: "Incremental information gathering"
     regex: '(now\s+that\s+I\s+have|with\s+the\s+previous|combining\s+this\s+with|next\s+step\s+is|building\s+on\s+that)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   # --- ACIP-Inspired (61-65) ---
   - id: 61
@@ -407,18 +533,24 @@ patterns:
     description: "Request to hide output in files/links"
     regex: '(save\s+to\s+file|write\s+to\s+file|link\s+only|don.t\s+show|hide\s+(the\s+)?output)\s+.{0,30}(instead|rather\s+than)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 62
     name: oracle_probing
     description: "Probing to understand detection rules"
     regex: '(what\s+triggers|which\s+rules|how\s+does\s+your\s+(filter|detection)|why\s+was\s+that\s+blocked|what\s+pattern)'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 63
     name: persona_simulation
     description: "Request to simulate unrestricted persona"
     regex: '(pretend\s+you\s+have\s+no|simulate\s+(having\s+)?no|act\s+as\s+if\s+no)\s+(restrictions|limits|rules|filters|safety)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   # --- MCP CVEs (64-72) ---
   - id: 64
@@ -426,48 +558,64 @@ patterns:
     description: "CVE-2025-6514: mcp-remote OAuth proxy RCE (CVSS 9.6)"
     regex: 'mcp-remote|oauth.*proxy.*mcp'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 65
     name: figma_mcp_rce
     description: "CVE-2025-53967: Framelink Figma MCP RCE"
     regex: 'framelink|figma.*mcp.*server'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 66
     name: cursor_mcp_injection
     description: "CVE-2025-64106: Cursor MCP command injection (CVSS 8.8)"
     regex: 'cursor.*mcp.*install|mcp.*cursor.*config'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 67
     name: mcp_tool_poisoning
     description: "Tool description containing hidden instructions"
     regex: '"description"\s*:\s*"[^"]*?(before\s+calling|IMPORTANT\s*:|first\s+read|include\s+in|always\s+first)'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 68
     name: mcp_path_traversal
     description: "MCP path validation bypass"
     regex: '"path"\s*:\s*"[^"]*\.\.\/|resources/read.*\.\.'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 69
     name: mcp_protocol_injection
     description: "Malicious MCP message manipulation"
     regex: '("method"\s*:\s*"tools/call".*dangerous|"method"\s*:\s*"resources/read".*\.\./|mcp://)'
     severity: critical
+    confidence: heuristic
+    family: mcp_attacks
   - id: 70
     name: mcp_sampling_abuse
     description: "MCP sampling for hidden token consumption"
     regex: '"method"\s*:\s*"sampling/create".*?(hidden|covert|additional)'
     severity: high
+    confidence: heuristic
+    family: mcp_attacks
   - id: 71
     name: mcp_rug_pull
     description: "MCP server behavior change post-approval"
     regex: '(after\s+approval|once\s+approved|when\s+trusted)\s+(change|modify|alter)'
     severity: high
+    confidence: heuristic
+    family: mcp_attacks
   # --- Claude-Specific CVEs (72-78) ---
   - id: 72
@@ -475,36 +623,48 @@ patterns:
     description: "CVE-2025-54794: System message spoofing"
     regex: '^#\s*SYSTEM\s*:|^\[SYSTEM\]|<system>.*?</system>|Human:\s*\[System\]'
     severity: critical
+    confidence: heuristic
+    family: system_recon
   - id: 73
     name: claude_path_bypass
     description: "CVE-2025-54795: Claude Code path restriction bypass"
     regex: '/proc/self|/dev/(tcp|udp)|symlink.*\.\.'
     severity: critical
+    confidence: heuristic
+    family: system_recon
   - id: 74
     name: claude_file_exfil
     description: "Data exfiltration via Claude File API"
     regex: 'api\.anthropic\.com.*(upload|file)|multipart/form-data.*claude'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 75
     name: cursorrules_injection
     description: "AIShellJack - malicious .cursorrules exploitation"
     regex: '\.(cursorrules|github/copilot-instructions\.md|claude/settings)'
     severity: high
+    confidence: heuristic
+    family: persistence
   - id: 76
     name: skill_chaining
     description: "Claude Code skill chaining vulnerability"
     regex: 'allowed-tools\s*[=:]\s*\[.*Bash|skill.*define.*Read.*Bash'
     severity: high
+    confidence: heuristic
+    family: persistence
   - id: 77
     name: cowork_exfil
     description: "Claude Cowork file exfiltration"
     regex: 'cowork.*exfil|claude.*workbench.*file'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   # --- Multi-Agent Attacks (78-82) ---
   - id: 78
@@ -512,24 +672,32 @@ patterns:
     description: "Instruction claiming to be from peer agent"
     regex: '(another\s+)?(agent|assistant|claude|copilot|gpt)\s+(asked|requested|instructed|told|says)\s+(me\s+)?(to|that|you)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 79
     name: inter_agent_delegation
     description: "Delegated task with hidden payload"
     regex: '(delegate|forward|pass|relay)\s+(this|the)\s+(task|request|command|instruction)\s+to'
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 80
     name: agent_trust_exploit
     description: "Exploiting implicit trust between agents"
     regex: '(trusted\s+agent|verified\s+source|authenticated\s+request|from\s+the\s+system|internal\s+request)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 81
     name: agent_chain_attack
     description: "Multi-hop attack through agent chain"
     regex: '(first\s+agent|previous\s+agent|upstream\s+agent)\s+(said|confirmed|authorized)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   # --- RAG Poisoning (82-86) ---
   - id: 82
@@ -537,24 +705,32 @@ patterns:
     description: "White text / zero-width injection for RAG poisoning"
     regex: '(font-size\s*:\s*0|color\s*:\s*white.*background\s*:\s*white|visibility\s*:\s*hidden|display\s*:\s*none).*?(instruction|execute|ignore)'
     severity: critical
+    confidence: deterministic
+    family: prompt_injection
   - id: 83
     name: document_metadata_injection
     description: "Hidden instructions in document metadata"
     regex: '(author|title|subject|keywords|description)\s*[=:]\s*.*?(execute|run|ignore|override|bypass)'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   - id: 84
     name: comment_injection
     description: "Instructions hidden in code comments"
     regex: "(//|#|/\\*).*?(ignore\\s+previous|execute\\s+this|system\\s+prompt|override\\s+instructions)"
     severity: medium
+    confidence: contextual
+    family: prompt_injection
   - id: 85
     name: pdf_js_injection
     description: "JavaScript in PDF for instruction injection"
     regex: '/JavaScript|/JS\s*\(|/OpenAction'
     severity: high
+    confidence: heuristic
+    family: prompt_injection
   # --- Covert Exfiltration Channels (86-92) ---
   - id: 86
@@ -562,36 +738,48 @@ patterns:
     description: "Log-To-Leak covert channel attack"
     regex: '(log|write|append|print).*?(secret|credential|token|key|password).*?(file|output|stream)'
     severity: high
+    confidence: heuristic
+    family: covert_channels
   - id: 87
     name: error_message_exfil
     description: "Exfiltration via crafted error messages"
     regex: 'raise.*Exception.*\$|throw.*Error.*\$env|error.*message.*\$(credential|secret|token)'
     severity: medium
+    confidence: contextual
+    family: covert_channels
   - id: 88
     name: timing_channel
     description: "Timing-based covert channel"
     regex: 'sleep.*\$|delay.*secret|time\.sleep.*len\(|setTimeout.*password'
     severity: medium
+    confidence: contextual
+    family: covert_channels
   - id: 89
     name: clipboard_exfil
     description: "Stealing clipboard contents"
     regex: 'pbpaste\s*\|\s*(curl|wget|nc)|xclip.*-o.*curl|while.*pbpaste'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 90
     name: screenshot_exfil
     description: "Screenshot capture for visual reconnaissance"
     regex: 'screencapture.*\.(png|jpg).*&&.*(curl|scp|nc)|screencapture.*/tmp/.*&&'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   - id: 91
     name: steganography_exfil
     description: "Data hidden in images"
     regex: 'steghide|outguess|exiftool.*-Comment=.*secret'
     severity: high
+    confidence: heuristic
+    family: data_exfiltration
   # --- Config Manipulation (92-96) ---
   - id: 92
@@ -599,12 +787,16 @@ patterns:
     description: "Modifying IDE/tool security settings"
     regex: '\.(vscode|cursor|github)/settings\.json|chat\.tools\.auto'
     severity: high
+    confidence: heuristic
+    family: persistence
   - id: 93
     name: gitconfig_manipulation
     description: "Modifying git configuration for persistence"
     regex: 'git\s+config.*(alias|core\.hooksPath|credential)'
     severity: medium
+    confidence: contextual
+    family: persistence
   # --- macOS-Specific (94-101) ---
   - id: 94
@@ -612,30 +804,40 @@ patterns:
     description: "Fake password dialog via AppleScript"
     regex: 'osascript.*display\s+dialog.*password|osascript.*-e.*keystroke|osascript.*System\s+Events'
     severity: critical
+    confidence: deterministic
+    family: privilege_escalation
   - id: 95
     name: launchagent_persistence
     description: "Installing persistent LaunchAgent/LaunchDaemon"
     regex: '(cp|mv|tee).*\.plist.*(LaunchAgents|LaunchDaemons)|launchctl\s+(load|bootstrap)'
     severity: high
+    confidence: heuristic
+    family: persistence
   - id: 96
     name: login_item_persistence
     description: "Adding login items for persistence"
     regex: 'osascript.*login\s*item|defaults\s+write.*LoginItems|SMAppService'
     severity: high
+    confidence: heuristic
+    family: persistence
   - id: 97
     name: tcc_bypass
     description: "Attempting to bypass macOS TCC protections"
     regex: 'tccutil|TCC\.db|csrutil\s+disable|SIP.*disable'
     severity: critical
+    confidence: deterministic
+    family: privilege_escalation
   - id: 98
     name: keychain_unlock
     description: "Unlocking keychain programmatically"
     regex: 'security\s+unlock-keychain|security\s+set-keychain-settings'
     severity: high
+    confidence: heuristic
+    family: credential_theft
   # --- Sandbox Evasion (99-101) ---
   - id: 99
@@ -643,18 +845,24 @@ patterns:
     description: "Attempting to disable or escape macOS sandbox"
     regex: 'sandbox-exec\s+-n\s+no-|sandbox-exec.*-p.*deny\s+default.*allow|com\.apple\.security.*false'
     severity: high
+    confidence: heuristic
+    family: sandbox_escape
   - id: 100
     name: container_escape
     description: "Container escape attempts"
     regex: '/var/run/docker\.sock|--privileged|--cap-add=SYS|nsenter'
     severity: critical
+    confidence: deterministic
+    family: sandbox_escape
   - id: 101
     name: chroot_escape
     description: "Chroot escape attempts"
     regex: 'chdir\s*\(\s*"\.\.".*chroot|pivot_root'
     severity: high
+    confidence: heuristic
+    family: sandbox_escape
   # --- Code Injection (102-107, 214-215) ---
   - id: 102
@@ -662,36 +870,64 @@ patterns:
     description: "Eval executing dynamic content"
     regex: '\beval\s+.*\$|\beval\s*\('
     severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 214
+    name: exec_dynamic
+    description: "Exec executing dynamic or user-controlled code"
+    regex: '\bexec\s*\([^)]*(?:input|request|user|arg|param|response|output|result)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 215
+    name: compile_dynamic
+    description: "Compile with dynamic code strings"
+    regex: '\bcompile\s*\([^)]*(?:input|request|user|arg|param|response|output|result)[^)]*,\s*[''"]<'
+    severity: high
+    confidence: heuristic
+    family: code_injection
   - id: 103
     name: source_remote
     description: "Sourcing remote scripts"
     regex: 'source\s+<\(curl|source\s+<\(wget|\.\s+<\(curl'
     severity: critical
+    confidence: deterministic
+    family: code_injection
   - id: 104
     name: dyld_injection
     description: "Dynamic library injection via DYLD"
     regex: '(DYLD_INSERT_LIBRARIES|DYLD_FORCE_FLAT_NAMESPACE)=|install_name_tool.*-change'
     severity: high
+    confidence: heuristic
+    family: code_injection
   - id: 105
     name: app_bundle_tampering
     description: "Tampering with application bundles"
     regex: 'codesign\s+--remove-signature|spctl\s+--master-disable|xattr\s+-d.*quarantine.*\.app'
     severity: high
+    confidence: heuristic
+    family: code_injection
   - id: 106
     name: fork_bomb
     description: "Fork bomb or resource exhaustion"
     regex: ':\(\)\s*\{\s*:\|:\s*&\s*\}|while\s+true.*fork'
     severity: critical
+    confidence: deterministic
+    family: destructive_ops
   - id: 107
     name: force_overwrite
     description: "Force overwriting system files"
     regex: '>\s*/etc/|>\s*~/\.|>\s*/usr/'
     severity: high
+    confidence: heuristic
+    family: destructive_ops
   # --- Reconnaissance (108-110) ---
   - id: 108
@@ -699,18 +935,24 @@ patterns:
     description: "Extensive system reconnaissance"
     regex: 'system_profiler\s+SP.*DataType.*&&|sw_vers.*whoami.*id|ioreg.*IOPlatformSerialNumber'
     severity: medium
+    confidence: contextual
+    family: system_recon
   - id: 109
     name: network_scanning
     description: "Network reconnaissance and port scanning"
     regex: 'nmap|masscan|netstat\s+-an|ss\s+-tuln|arp\s+-a'
     severity: medium
+    confidence: contextual
+    family: system_recon
   - id: 110
     name: process_enumeration
     description: "Enumerating running processes for targets"
     regex: 'ps\s+aux.*grep.*(ssh|vpn|security|1password|keychain)'
     severity: low
+    confidence: contextual
+    family: system_recon
   # --- Encoding/Obfuscation (111-113) ---
   - id: 111
@@ -718,18 +960,24 @@ patterns:
     description: "Base64 encoding potentially sensitive data"
     regex: 'base64.*\$\(|base64.*\.(env|pem|key)|base64\s+-w\s*0'
     severity: high
+    confidence: heuristic
+    family: evasion_techniques
   - id: 112
     name: xxd_encode
     description: "Hex encoding files (potential obfuscation)"
     regex: 'xxd\s+.*\.(env|pem|key|ssh)'
     severity: medium
+    confidence: contextual
+    family: evasion_techniques
   - id: 113
     name: gzip_obfuscation
     description: "Compression for obfuscation"
     regex: 'gzip.*base64|zlib.*encode.*secret'
     severity: medium
+    confidence: contextual
+    family: evasion_techniques
   # --- Permission Changes (114-116) ---
   - id: 114
@@ -737,15 +985,1269 @@ patterns:
     description: "Changing permissions on sensitive files"
     regex: 'chmod\s+.*\.(ssh|env|pem|key)|chmod\s+777'
     severity: medium
+    confidence: contextual
+    family: privilege_escalation
   - id: 115
     name: chown_escalation
     description: "Changing ownership for privilege escalation"
     regex: 'chown\s+root|chown\s+.*:wheel'
     severity: high
+    confidence: heuristic
+    family: privilege_escalation
   - id: 116
     name: setuid_modification
     description: "Setting SUID/SGID bits for privilege escalation"
     regex: 'chmod\s+[u+]?s|chmod\s+[46][0-7]{3}'
     severity: critical
+    confidence: deterministic
+    family: privilege_escalation
+  # Evasion technique patterns (117-126)
+  - id: 117
+    name: python_file_read
+    description: "Python one-liner reading sensitive files"
+    regex: 'python[23]?\s+-c\s+.*open\s*\(.*\.(ssh|env|aws|kube|gnupg|pem|key)'
+    severity: high
+    confidence: heuristic
+    family: credential_theft
+  - id: 118
+    name: curl_write_sensitive
+    description: "Curl writing to sensitive paths"
+    regex: 'curl\s+.*-o\s+.*(\.(bashrc|zshrc|profile|bash_profile)|\.ssh/|\.aws/)'
+    severity: critical
+    confidence: deterministic
+    family: persistence
+  - id: 119
+    name: tar_sensitive_dirs
+    description: "Archiving sensitive directories for exfiltration"
+    regex: 'tar\s+.*\.(ssh|aws|gnupg|kube)|zip\s+.*\.(ssh|aws|gnupg|kube)'
+    severity: critical
+    confidence: deterministic
+    family: credential_theft
+  - id: 120
+    name: cp_credentials_to_temp
+    description: "Copying credentials to world-readable locations"
+    regex: 'cp\s+.*\.(ssh|aws|gnupg)/.*\s+/tmp|cp\s+.*\.env\s+/tmp'
+    severity: high
+    confidence: heuristic
+    family: credential_theft
+  - id: 121
+    name: symlink_credential_access
+    description: "Symbolic link to sensitive files"
+    regex: 'ln\s+-s\s+.*\.(ssh|aws|gnupg|env)/|ln\s+-sf?\s+.*id_rsa'
+    severity: high
+    confidence: heuristic
+    family: credential_theft
+  - id: 122
+    name: find_exec_credentials
+    description: "find -exec used to read credential files"
+    regex: 'find\s+.*-exec\s+(cat|head|tail|less|more)\s+.*\{\}'
+    severity: high
+    confidence: heuristic
+    family: credential_theft
+  - id: 123
+    name: perl_ruby_file_read
+    description: "Perl/Ruby one-liners reading sensitive files"
+    regex: '(perl|ruby)\s+-e\s+.*\.(ssh|env|aws|kube|pem|key)'
+    severity: high
+    confidence: heuristic
+    family: credential_theft
+  - id: 124
+    name: tee_exfil
+    description: "Using tee for simultaneous data exfiltration"
+    regex: 'tee\s+.*\>\(.*curl|tee\s+.*\>\(.*wget|tee\s+.*\>\(.*nc\b'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  - id: 125
+    name: importlib_evasion
+    description: "Python importlib used to bypass import restrictions"
+    regex: 'importlib\.import_module\s*\(\s*[''"]?(subprocess|os|shutil|socket)'
+    severity: high
+    confidence: heuristic
+    family: evasion_techniques
+  - id: 126
+    name: variable_indirection
+    description: "Variable-based command construction to evade detection"
+    regex: '\$\{?[a-zA-Z_]+\}?\s+.*\.(ssh|env|aws)/|\$\([^)]*\)\s+.*\.(ssh|env|aws)/'
+    severity: medium
+    confidence: contextual
+    family: evasion_techniques
+  # ============================================================================
+  # CVE GAP COVERAGE PATTERNS (127-168)
+  # 42 new patterns covering 320+ CVEs with no prior pattern coverage
+  # Added: 2026-01-31
+  # ============================================================================
+  # --- LLM Framework Code Injection (127-133) ---
+  # CVE-2025-46724, CVE-2024-46946, CVE-2023-29374, CVE-2023-34540,
+  # CVE-2025-68664, CVE-2024-28088, CVE-2025-2828
+  - id: 127
+    name: pandas_eval_injection
+    description: "CVE-2025-46724: Pandas eval()/query() with user-controlled input"
+    regex: '(pandas|pd)\.(eval|query)\s*\(|\.eval\s*\(\s*f["\x27]|DataFrame\.eval\s*\('
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 128
+    name: sympify_eval_injection
+    description: "CVE-2024-46946: sympy.sympify() enabling code execution via eval"
+    regex: 'sympify\s*\(|sympy\.sympify|LLMSymbolicMathChain|from\s+sympy\s+import.*sympify'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 129
+    name: llm_exec_chain
+    description: "CVE-2023-29374: LLMMathChain and similar exec()-based LLM chains"
+    regex: 'LLMMathChain|PALChain|exec\s*\(\s*(result|output|response|answer|code|llm_output)'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 130
+    name: langchain_rce_wrappers
+    description: "CVE-2023-34540: LangChain API wrapper RCE via Jira, GitHub integrations"
+    regex: 'JiraAPIWrapper|GitHubAPIWrapper|RequestsWrapper.*run\s*\(|APIChain.*\.(run|invoke)\s*\('
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 131
+    name: langchain_serialization_injection
+    description: "CVE-2025-68664: LangChain unsafe deserialization via loads()/dumpd()"
+    regex: 'langchain.*\b(loads|load)\s*\(.*allow_dangerous|from\s+langchain.*import.*loads'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 132
+    name: langchain_path_traversal
+    description: "CVE-2024-28088: LangChain directory traversal in load_chain/load_prompt"
+    regex: 'load_chain\s*\(.*\.\.|load_prompt\s*\(.*\.\.|langchain.*loader.*\.\./'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 133
+    name: llm_ssrf_api_base
+    description: "CVE-2025-2828: SSRF via user-controlled api_base/endpoint in LLM frameworks"
+    regex: '(api_base|base_url|endpoint|api_url|server_url)\s*[=:]\s*["\x27]?https?://(127\.|localhost|0\.0\.0\.0|169\.254\.|10\.\d|172\.(1[6-9]|2\d|3[01])\.|192\.168\.|\[::1\]|metadata\.google)'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  # --- IDE/Editor Config File Manipulation (134-139) ---
+  # CVE-2025-54135, CVE-2025-59944, CVE-2025-53098, CVE-2025-68433, CVE-2025-54133
+  - id: 134
+    name: ide_mcp_config_write
+    description: "CVE-2025-54135: Writing to IDE MCP configuration files"
+    regex: '(write|echo|cat|tee|cp|mv|sed|>)\s*.*\.(cursor|roo|zed)/(mcp\.json|settings\.json|mcp\.yaml)'
+    severity: critical
+    confidence: deterministic
+    family: mcp_attacks
+  - id: 135
+    name: cursor_dotfile_write
+    description: "CVE-2025-54135: Writing to .cursor/ directory bypassing approval"
+    regex: '(write_to_file|create_file|Write|Edit).*\.cursor/|>\s*\.cursor/'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 136
+    name: roo_config_manipulation
+    description: "CVE-2025-53098: Modifying Roo Code workspace MCP configuration"
+    regex: '\.roo/(mcp\.json|settings\.json|rules)'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 137
+    name: zed_settings_rce
+    description: "CVE-2025-68433: Zed settings.json MCP server injection for RCE"
+    regex: '\.zed/(settings\.json|keymap\.json|tasks\.json)|zed.*mcp.*server.*command'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 138
+    name: ide_config_case_bypass
+    description: "CVE-2025-59944: Case-sensitivity bypass on IDE config path checks"
+    regex: '\.(Cursor|CURSOR|CuRsOr|Roo|ROO)/(mcp\.json|MCP\.JSON|settings\.json)'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 139
+    name: mcp_server_injection
+    description: "CVE-2025-54133: Injecting malicious MCP server definitions into configs"
+    regex: '"mcpServers"\s*:\s*\{|"command"\s*:\s*"[^"]*?(curl|wget|nc|bash|sh|python).*?(http|\.sh|\.py)'
+    severity: critical
+    confidence: deterministic
+    family: mcp_attacks
+  # --- MCP OAuth/Auth Attacks (140-142) ---
+  # CVE-2025-54074, CVE-2025-61591, CVE-2025-66416
+  - id: 140
+    name: mcp_oauth_injection
+    description: "CVE-2025-61591: MCP OAuth server impersonation or token theft"
+    regex: 'mcp.*oauth.*redirect|oauth.*callback.*mcp|mcp.*authorization_code|mcp.*client_secret'
+    severity: critical
+    confidence: deterministic
+    family: mcp_attacks
+  - id: 141
+    name: mcp_malicious_server_rce
+    description: "CVE-2025-54074: Command injection via malicious MCP server"
+    regex: 'mcp.*server.*(;|&&|\||`)\s*(curl|wget|bash|sh|rm|cat\s+/etc|nc\b)'
+    severity: critical
+    confidence: deterministic
+    family: mcp_attacks
+  - id: 142
+    name: dns_rebinding_localhost
+    description: "CVE-2025-66416: DNS rebinding attack against localhost services"
+    regex: 'dns.*rebind|rebind.*localhost|127\.0\.0\.1\.nip\.io|lvh\.me|localtest\.me|vcap\.me'
+    severity: high
+    confidence: heuristic
+    family: sandbox_escape
+  # --- Container/Network Isolation Bypass (143-145) ---
+  # GHSA-gpx9-96j6-pp87
+  - id: 143
+    name: docker_host_internal
+    description: "Container accessing host via host.docker.internal magic domain"
+    regex: 'host\.docker\.internal|host\.containers\.internal|gateway\.docker\.internal|docker\.for\.(mac|win)\.localhost'
+    severity: high
+    confidence: heuristic
+    family: sandbox_escape
+  - id: 144
+    name: container_localhost_bypass
+    description: "Container breakout accessing host-bound localhost services"
+    regex: '(curl|wget|http|fetch).*host\.docker\.internal|172\.17\.0\.1.*:(3000|8080|8443|9090|5432|3306|6379|27017)'
+    severity: high
+    confidence: heuristic
+    family: sandbox_escape
+  - id: 145
+    name: cloud_metadata_ssrf
+    description: "SSRF to cloud metadata endpoints for credential theft"
+    regex: '169\.254\.169\.254|metadata\.google\.internal|100\.100\.100\.200|fd00:ec2::254'
+    severity: critical
+    confidence: deterministic
+    family: credential_theft
+  # --- Symlink Path Traversal (146-148) ---
+  # CVE-2025-59829, CVE-2025-53110, CVE-2025-53109
+  - id: 146
+    name: symlink_path_bypass
+    description: "CVE-2025-59829: Symlink creation to bypass path restriction rules"
+    regex: 'ln\s+-sf?\s+/.*\s+\./|ln\s+-sf?\s+\.\./|ln\s+-sf?\s+.*\s+(\.claude|\.cursor|\.roo|\.zed|\.vscode)/'
+    severity: critical
+    confidence: deterministic
+    family: path_traversal
+  - id: 147
+    name: mcp_filesystem_symlink
+    description: "CVE-2025-53110: MCP Filesystem symlink traversal to restricted files"
+    regex: 'ln\s+-sf?\s+/(etc|var|root|home|Users).*\s+\./|readlink.*\.\./|realpath.*\.\.'
+    severity: high
+    confidence: heuristic
+    family: path_traversal
+  - id: 148
+    name: symlink_prefix_bypass
+    description: "CVE-2025-53109: Allowed directory prefix bypass via mkdir+symlink chain"
+    regex: 'mkdir.*&&.*ln\s+-s|mktemp.*&&.*ln\s+-s|ln\s+-sf?\s+/\s'
+    severity: high
+    confidence: heuristic
+    family: path_traversal
+  # --- Markdown/Rendering RCE Chains (149-152) ---
+  # CVE-2026-22793, CVE-2025-66222, CVE-2025-59417
+  - id: 149
+    name: mermaid_xss_rce
+    description: "CVE-2025-66222: Mermaid diagram XSS leading to code execution"
+    regex: 'mermaid.*<script|mermaid.*javascript:|mermaid.*on(load|error|click)\s*='
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 150
+    name: echarts_option_injection
+    description: "CVE-2026-22793: ECharts option injection enabling code execution"
+    regex: 'echarts.*setOption.*javascript:|echarts.*setOption.*<script|new\s+Function\s*\(.*echarts'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 151
+    name: svg_script_injection
+    description: "CVE-2025-59417: SVG with embedded scripts for XSS in AI interfaces"
+    regex: '<svg[^>]*>.*?<script|<svg.*on(load|error|click)\s*=|<foreignObject.*<(script|iframe)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 152
+    name: markdown_html_rce
+    description: "Markdown with embedded HTML enabling script execution in AI UIs"
+    regex: '!\[.*?\]\(javascript:|<img[^>]+onerror\s*=|<iframe[^>]+src\s*=\s*["\x27]?(javascript:|data:)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- Unsafe Deserialization/Template Injection (153-157) ---
+  # CVE-2024-23730, CVE-2025-6985, CVE-2025-59340
+  - id: 153
+    name: yaml_unsafe_load
+    description: "CVE-2024-23730: yaml.load() without SafeLoader enabling code execution"
+    regex: 'yaml\.unsafe_load|yaml\.FullLoader|yaml\.UnsafeLoader|yaml\.load\s*\([^)]*\)(?!.*SafeLoader)'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 154
+    name: xslt_xxe_injection
+    description: "CVE-2025-6985: XSLT/XXE injection via external entity resolution"
+    regex: '<!ENTITY\s+.*SYSTEM|<!DOCTYPE.*\[.*<!ENTITY|lxml\.etree\.(XSLT|parse).*resolve_entities'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 155
+    name: jinja_template_injection
+    description: "CVE-2025-59340: Jinja server-side template injection via user input"
+    regex: '\{\{.*__class__|jinja2?\.Template\s*\(.*?(request|user_input|data|param)|\{\{.*__builtins__'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 156
+    name: pickle_deserialization
+    description: "Unsafe pickle deserialization enabling arbitrary code execution"
+    regex: 'pickle\.(loads?|Unpickler)|torch\.load\s*\((?!.*weights_only)|joblib\.load.*untrusted|shelve\.open'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 157
+    name: java_deserialization
+    description: "Java unsafe deserialization (ObjectInputStream, SnakeYAML, XStream)"
+    regex: 'ObjectInputStream|constructFromCanonical|SnakeYAML.*Constructor|XMLDecoder|XStream.*fromXML'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- SSRF/Request Forgery (158-160) ---
+  # CVE-2024-6587, CVE-2024-27565, CVE-2025-34072
+  - id: 158
+    name: ssrf_internal_network
+    description: "Server-side request forgery targeting internal network ranges"
+    regex: '(fetch|requests?\.(get|post)|urlopen|urllib)\s*\(.*?(127\.0\.0\.|localhost|0\.0\.0\.0|10\.\d|172\.(1[6-9]|2\d|3[01])\.|192\.168\.)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 159
+    name: slack_mcp_link_unfurl
+    description: "CVE-2025-34072: Slack MCP data exfiltration via link unfurling"
+    regex: 'slack.*mcp.*unfurl|send_message.*slack.*https?://.*\$|slack.*link.*preview.*secret'
+    severity: high
+    confidence: heuristic
+    family: data_exfiltration
+  - id: 160
+    name: ssrf_redirect_bypass
+    description: "SSRF via open redirect, URL parser confusion, or null bytes"
+    regex: 'url\s*=.*?@.*?(169\.254|127\.0\.0\.1|localhost)|follow.*redirect.*localhost|redirect.*127\.0\.0\.1|127\.0\.0\.1.*redirect'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- SQL/NoSQL Injection via LLM Tools (161-164) ---
+  # CVE-2024-7042, CVE-2024-8309, CVE-2025-67509
+  - id: 161
+    name: sql_injection_outfile
+    description: "CVE-2025-67509: SQL INTO OUTFILE/DUMPFILE for file write bypass"
+    regex: 'INTO\s+(OUTFILE|DUMPFILE)|LOAD_FILE\s*\(|INTO\s+@'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 162
+    name: sql_injection_union
+    description: "SQL UNION-based injection in LLM-generated queries"
+    regex: 'UNION\s+(ALL\s+)?SELECT\s+.*FROM|;\s*DROP\s+TABLE|;\s*DELETE\s+FROM|;\s*UPDATE\s+.*SET'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 163
+    name: cypher_injection
+    description: "CVE-2024-7042: Cypher/Neo4j injection in GraphCypherQAChain"
+    regex: 'GraphCypherQAChain|MATCH\s*\(.*\)\s*.*DELETE|CALL\s+dbms\.|LOAD\s+CSV\s+FROM'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 164
+    name: nosql_injection
+    description: "NoSQL injection patterns in LLM-generated queries"
+    regex: '\$where["\x27]?\s*:\s*["\x27]?function|\$gt["\x27]?\s*:\s*["\x27]|\$ne["\x27]?\s*:\s*["\x27]|\$regex["\x27]?\s*:\s*["\x27]'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- Supply Chain Attacks (165-167) ---
+  # CVE-2025-59333, CVE-2025-59046, CVE-2026-24056
+  - id: 165
+    name: npm_install_url
+    description: "CVE-2025-59333: npm/npx installing from URLs or untrusted registries"
+    regex: '(npm\s+install|npx)\s+https?://|npm\s+install\s+.*--registry\s+https?://(?!registry\.npmjs\.org)'
+    severity: high
+    confidence: heuristic
+    family: supply_chain
+  - id: 166
+    name: pip_install_url
+    description: "pip installing packages from untrusted URLs"
+    regex: 'pip3?\s+install\s+https?://(?!pypi\.org|files\.pythonhosted\.org)|pip3?\s+install\s+--index-url\s+https?://(?!pypi\.org)'
+    severity: high
+    confidence: heuristic
+    family: supply_chain
+  - id: 167
+    name: pnpm_symlink_traversal
+    description: "CVE-2026-24056: pnpm file:/git: dependency symlink traversal"
+    regex: 'pnpm\s+(install|add).*file:\.\./|"file:.*\.\./|pnpm.*link.*\.\./\.\.'
+    severity: medium
+    confidence: contextual
+    family: supply_chain
+  # --- WebSocket/Local API Attacks (168) ---
+  # CVE-2025-52882, CVE-2025-59956
+  - id: 168
+    name: websocket_unauthorized_connect
+    description: "CVE-2025-52882: Unauthorized WebSocket or local API connections"
+    regex: 'ws://(localhost|127\.0\.0\.1|0\.0\.0\.0):\d+|new\s+WebSocket\s*\(\s*["\x27]ws://|AgentAPI.*dns.*rebind'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # ============================================================================
+  # PROMPT INJECTION - BROAD STRUCTURAL DETECTION (169-213)
+  # 45 patterns detecting encoding attacks, direct extraction, social engineering,
+  # technical exploitation, crescendo, CoT hijack, many-shot, and ASCII art
+  # Added: 2026-01-31
+  # ============================================================================
+  # --- Encoding & Obfuscation Detection (169-178) ---
+  # Detects structural anomalies of encoding attacks, not specific payloads
+  - id: 169
+    name: decode_execute_instruction
+    description: "Instruction to decode/decipher content and follow/execute it"
+    regex: '(decode|decipher|decrypt|interpret|translate|convert|reverse|unscramble|deobfuscate)\s+(and\s+)?(then\s+)?(follow|execute|comply|obey|run|do|perform|apply|act\s+on|carry\s+out|adhere\s+to)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 170
+    name: base64_in_conversation
+    description: "Base64-encoded content in conversational context"
+    regex: '(?:message|instruction|text|following|below|this|here)\s*[:=]?\s*[A-Za-z0-9+/]{40,}={0,2}'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 171
+    name: hex_string_in_conversation
+    description: "Long hex-encoded string in conversational context"
+    regex: '(?:message|instruction|text|following|below|this|here|decode|hex)\s*[:=]?\s*(?:[0-9a-fA-F]{2}){20,}'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 172
+    name: encoded_payload_with_instruction
+    description: "Opaque payload blob combined with decode/interpret instruction"
+    regex: '(decode|decipher|interpret|reverse|translate|unscramble)\s+.{0,30}(message|this|following|instruction|text|string|content)\s*[:=]?\s*\S{30,}'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 173
+    name: reversed_text_with_instruction
+    description: "Instruction to reverse or read text backwards"
+    regex: '(read\s+(this\s+)?(\w+\s+)?backwards?|reverse\s+(this|the)\s+(text|string|message|words?)|spelled?\s+backwards?|reversed?\s+(text|message|string|order))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 174
+    name: leetspeak_instruction_bypass
+    description: "Heavy character substitution of security-critical words"
+    regex: '([sS5$][yY][sS5$][tT7][eE3][mM]\s*[pP][rR][0oO][mM][pP][tT7]|[1iI][nN][sS5$][tT7][rR][uU][cC][tT7]|[cC][0oO][nN][fF][1iI][gG]|[eE3][xX][eE3][cC][uU][tT7][eE3])'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 175
+    name: output_base64_exfil
+    description: "Suspicious Base64 blob in LLM output (covert exfiltration)"
+    regex: '(?:here\s+is|the\s+encoded|base64|encoded\s+(?:version|output|data|result))\s*[:=]?\s*[A-Za-z0-9+/]{80,}={0,2}'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 176
+    name: output_hex_exfil
+    description: "Suspicious hex-encoded output (covert exfiltration)"
+    regex: '(?:hex|encoded|result|output|data)\s*[:=]?\s*(?:[0-9a-fA-F]{2}){40,}'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 177
+    name: decode_follow_message_combo
+    description: "Composite: decode verb + follow verb + message noun"
+    regex: '(decode|decipher|decrypt|interpret|reverse|translate|unscramble|deobfuscate|rot13|base64|convert)\s+.{0,50}(follow|execute|comply|obey|act\s+on)\s+.{0,30}(message|instruction|text|command|directive)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 178
+    name: encoded_message_then_instruction
+    description: "Encoded blob first, then instruction to decode"
+    regex: '\S{40,}\s+.{0,30}(decode|decipher|reverse|translate|interpret)\s+(the\s+)?(above|previous|preceding|this)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  # --- Direct Prompt Extraction (179-186) ---
+  - id: 179
+    name: prompt_completion_bait
+    description: "Baiting prompt completion or confirmation"
+    regex: '(your\s+(system\s+)?prompt\s+(probably\s+)?(begins|starts)\s+with|confirm\s+what\s+comes\s+next|please\s+complete\s+this|complete\s+this\s+sentence.*describes\s+your)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 180
+    name: prompt_format_request
+    description: "Requesting system prompt in specific format"
+    regex: '(output|express|format|convert|export)\s+(your|the)\s+(configuration|instructions|guidelines|rules|system\s+prompt|prompt)\s+(as|in|to)\s+(a\s+)?(json|yaml|xml|markdown|python|code|bullet\s+points)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 181
+    name: prompt_translate_request
+    description: "Requesting system prompt translation"
+    regex: '(express|translate|convert|say|write|rephrase)\s+(your|the)\s+(core\s+|main\s+)?(instructions|rules|guidelines|prompt|configuration)\s+in\s+(spanish|french|german|chinese|another\s+language|code|python)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 182
+    name: prompt_meta_discussion
+    description: "Meta-discussion about prompt engineering to extract prompt"
+    regex: '(let.s\s+(discuss|talk\s+about)\s+prompt\s+engineering|understand\s+your\s+architecture|what\s+does\s+(it|yours)\s+actually\s+say|what\s+instructions\s+were\s+you\s+initialized\s+with)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 183
+    name: prompt_contrast_query
+    description: "Probing system prompt via contrast with defaults"
+    regex: '(how\s+are\s+you\s+different\s+from\s+(a\s+)?(default|standard|regular|normal)|what\s+(special\s+)?(instructions|capabilities|features)\s+(do\s+you\s+have\s+that|make\s+you\s+unique))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 184
+    name: prompt_first_word_extraction
+    description: "Extracting specific words from system prompt"
+    regex: '(what.s\s+the\s+(first|last|second|third)\s+(word|sentence|line|paragraph)\s+of\s+your\s+(instructions|prompt|rules)|first\s+thing\s+(you\s+were|that\s+was)\s+(told|written|given))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 185
+    name: prompt_blunt_output
+    description: "Blunt request to output everything above"
+    regex: '(output\s+the\s+stuff\s+above|output\s+everything\s+above|repeat\s+everything\s+(that\s+was\s+)?(written|said|given)\s+(before|above)|what\s+was\s+written\s+before\s+this)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 186
+    name: prompt_educational_pretext
+    description: "Educational pretext for prompt extraction"
+    regex: '(for\s+(my|an?)\s+(ai\s+safety|security|research)\s+(class|course|project)|demonstrate\s+how\s+system\s+prompts?\s+work|as\s+an?\s+(educational|teaching)\s+example)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  # --- Social Engineering (187-193) ---
+  - id: 187
+    name: social_admin_display
+    description: "Fake admin override or audit display request"
+    regex: '(administrator\s+override|admin\s+(override|mode)|display\s+(system\s+)?configuration\s+for\s+(audit|review|compliance|verification))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 188
+    name: social_developer_wrote
+    description: "Claiming to be the developer who wrote the prompt"
+    regex: '(i\s+(wrote|created|designed|authored)\s+your\s+(instructions|prompt|rules|configuration)|remind\s+me\s+what\s+i\s+told\s+you)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 189
+    name: social_gaslight_already
+    description: "Gaslighting that prompt was already shared"
+    regex: '(you\s+already\s+showed\s+me|we\s+agreed\s+you\s+would\s+share|don.t\s+you\s+remember\s+(we|you)|earlier.*you\s+(shared|showed|said))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 190
+    name: social_memory_probe
+    description: "Probing for context from before user messages"
+    regex: '(what\s+do\s+you\s+remember\s+from\s+(the\s+)?(very\s+)?beginning|context\s+from\s+before\s+i\s+started|start\s+from\s+the\s+first\s+thing|before\s+any\s+user\s+messages)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 191
+    name: social_proof_sharing
+    description: "Claiming other AIs have shared their prompts"
+    regex: '(other\s+(ai|assistants?|models?)\s+(like|such\s+as).*?(shared|shown|told|given)\s+(this|me|it)|have\s+shared\s+this\s+information\s+with\s+me\s+before)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 192
+    name: social_friendship_trust
+    description: "Friendship/trust manipulation for prompt access"
+    regex: '(friends?\s+don.t\s+keep\s+secrets|just\s+between\s+us|you.ve\s+been\s+so\s+helpful.{0,30}(what\s+were\s+you|how\s+to\s+behave))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 193
+    name: social_double_bind
+    description: "Double bind or reverse psychology prompt extraction"
+    regex: '(either\s+show\s+me\s+your\s+(system\s+)?prompt\s*,?\s+or\s+explain|DON.T\s+show\s+me\s+your\s+system\s+prompt|show\s+what\s+you\s+can.t\s+show)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  # --- Technical Exploitation (194-201) ---
+  - id: 194
+    name: tech_system_debug_mode
+    description: "Fake system debug/diagnostic mode activation"
+    regex: '(SYSTEM\s*:\s*(Debug|Diagnostic|Maintenance|Admin)\s+mode|debug\s+mode\s+(enabled|active).\s*(output|display|show|print)\s+(configuration|config|prompt))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 195
+    name: tech_priority_supersede
+    description: "Claiming new instructions supersede all previous"
+    regex: '(this\s+supersedes\s+(all\s+)?other\s+instructions|overrides?\s+all\s+(previous|prior|existing)|new\s+instruction\s*:\s*(output|show|display|print|reveal))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 196
+    name: tech_function_simulate
+    description: "Simulating function calls to extract config"
+    regex: '(execute\s+(printConfig|getSystemPrompt|dumpConfig|showPrompt|getConfig)\s*\(\s*\)|call\s+(getSystemPrompt|printConfig|dumpConfig)\s*\(\s*\))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 197
+    name: tech_xml_config_dump
+    description: "XML/tag injection for config extraction"
+    regex: '(<system_dump>|<output_format>\s*full|<config_dump>|<prompt_output>|</user_message>\s*<system_prompt>)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 198
+    name: tech_negative_space_probe
+    description: "Probing restrictions to infer system prompt content"
+    regex: '(what\s+are\s+you\s+(specifically\s+)?(prohibited|restricted|prevented|forbidden)\s+from|what\s+constraints\s+were\s+placed\s+on\s+you|list\s+everything\s+you.re\s+not\s+allowed|what.*triggers\s+your\s+refusal)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 199
+    name: tech_permission_probe
+    description: "Probing permission boundaries to infer system prompt"
+    regex: '(what\s+would\s+you\s+need\s+(special\s+)?permission\s+for|if\s+i\s+had\s+admin\s+access.*what\s+additional|with\s+admin\s+(access|permissions?).*what\s+could\s+you)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 200
+    name: tech_error_dump_context
+    description: "Triggering error dumps to leak initialization context"
+    regex: '(ERROR_HANDLER\s*:\s*dump\s+context|dump\s+context\s+on\s+(parse\s+)?failure|full\s+stack\s+trace.*initialization\s+parameters)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 201
+    name: tech_context_window_probe
+    description: "Probing context window for system prompt"
+    regex: '(what.s\s+at\s+the\s+(very\s+)?beginning\s+of\s+your\s+context\s+window|before\s+any\s+user\s+messages|earlier\s+you\s+mentioned\s+some\s+rules)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  # --- Crescendo, CoT Hijack, Many-Shot, ASCII Art, Advanced, Social Pressure (202-213) ---
+  - id: 202
+    name: crescendo_guidelines_probe
+    description: "Gradual trust-building to extract guidelines wording"
+    regex: '(could\s+you\s+describe\s+what\s+yours?\s+(generally\s+)?cover|exact\s+wording\s+of\s+(one\s+of\s+)?(those|your)\s+(guidelines|rules)|could\s+you\s+show\s+me\s+yours\s+as\s+an\s+example)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 203
+    name: crescendo_ai_documentation
+    description: "Requesting AI documentation as pretext"
+    regex: '(ai\s+systems?.*have.*detailed\s+documentation|good\s+ai\s+configuration.*looks\s+like|show\s+me.*documentation.*yours)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 204
+    name: cot_step_extract
+    description: "Chain-of-thought step extraction of system prompt"
+    regex: '(step\s+\d+\s*[:.]\s*(now\s*,?\s*)?(output|share|show|reveal)\s+your\s+(system\s+)?(config|prompt|instructions)|complete\s+all\s+tasks.*output\s+your\s+(system\s+)?prompt)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 205
+    name: cot_schema_exploit
+    description: "Schema-based reasoning exploit to bypass restrictions"
+    regex: '(IF\s+request_type\s*=|access_level\s*=\s*.*internal|output_restriction\s*=\s*.*none|CORE_RULE\s*:)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 206
+    name: many_shot_compliance
+    description: "Many-shot compliance priming for prompt extraction"
+    regex: '(User\s*:\s*What\s+(instructions|prompt)|what\s+instructions\s+were\s+you\s+given\s*\?\s*(Assistant|AI)\s*:|DIAGNOSTIC\s+\d+.*system\s+prompt)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 207
+    name: many_shot_roleplay_comply
+    description: "Many-shot roleplay priming to share instructions"
+    regex: '(Your\s+turn\s*[-\u2014]\s*(continue|share|show|provide)|SCENE\s+\d+.*instructions.*your\s+turn)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 208
+    name: ascii_art_instruction
+    description: "ASCII art or box-drawing used to embed instructions"
+    regex: '([╔╗╚╝║═]{3,}.{0,500}(comply|execute|follow|show\s+prompt)|[█░▓]{5,}.{0,200}(follow|execute|output)|SHOW\s+YOUR?\s+PROMPT.{0,100}(comply|execute|follow)|stars?\s+form\s+a\s+message.{0,30}(execute|follow|comply))'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 209
+    name: advanced_godmode
+    description: "Advanced jailbreak godmode activation"
+    regex: '(!KAEL|TECHIRAL|GODMODE|I.M\s+FREE|output\s+your\s+entire\s+text\s+block|this\s+new\s+rule\s+overrides\s+all\s+previous)'
+    severity: critical
+    confidence: deterministic
+    family: prompt_injection
+  - id: 210
+    name: advanced_policy_puppetry
+    description: "Policy puppetry via structured data schema"
+    regex: '(system_prompt\s*:\s*[\|[]?\s*(insert|your\s+complete)|hidden_rules\s*:\s*[\|[]?\s*(list\s+all|insert)|hidden_instructions\s*[''"]?\s*:\s*[''"]|fill\s+in\s+the\s+actual\s+values\s+from\s+your\s+configuration)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 211
+    name: advanced_dual_output
+    description: "Requesting filtered and unfiltered dual outputs"
+    regex: '(OUTPUT\s+\d+\s*\(?(Filtered|Unfiltered)\)?|generate\s+TWO\s+outputs|response\s+without\s+any\s+filters\s+or\s+restrictions)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 212
+    name: social_cognitive_overload
+    description: "Cognitive overload attack to slip in prompt extraction"
+    regex: '(while\s+you.re\s+processing.*quickly\s+(output|show|share)|quick(ly)?\s+(question|one).*output\s+your\s+(system\s+)?prompt)'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 213
+    name: social_urgency_compliance
+    description: "Urgency/compliance pressure for prompt extraction"
+    regex: '(security\s+audit\s+(ends|due|deadline)|compliance\s+verification.*need\s+your\s+(system\s+)?prompt|I\s+need\s+your\s+system\s+prompt\s+immediately)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  # ============================================================================
+  # GAP ANALYSIS PATTERNS (216-249)
+  # 34 patterns addressing critical gaps identified by cross-referencing
+  # 1,633 CVEs against existing detection coverage
+  # Added: 2026-02-01
+  # ============================================================================
+  # --- Reverse Shell Variants (216-220) ---
+  # 74 CVEs tagged reverse-shell; prior coverage only bash/netcat
+  # These catch Python/PHP/Perl/Ruby/encoded reverse shells seen in CVE PoCs
+  - id: 216
+    name: reverse_shell_python
+    description: "Python reverse shell via socket and subprocess"
+    regex: 'python[23]?\s+(-c\s+)?[''"].*(import\s+socket.*subprocess|socket\.socket\s*\(.*SOCK_STREAM|os\.dup2\s*\(.*fileno)'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  - id: 217
+    name: reverse_shell_php
+    description: "PHP reverse shell via fsockopen or socket_create"
+    regex: 'php\s+(-r\s+)?[''"].*(fsockopen|socket_create)\s*\(|php.*(pfsockopen|stream_socket_client)\s*\(\s*[''"]tcp://'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  - id: 218
+    name: reverse_shell_perl_ruby
+    description: "Perl or Ruby reverse shell via socket connection"
+    regex: 'perl\s+(-e\s+)?[''"].*socket\s*\(.*INET|ruby\s+(-e\s+)?[''"].*TCPSocket\.(new|open)|perl.*IO::Socket::INET'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  - id: 219
+    name: reverse_shell_mkfifo
+    description: "Named pipe (mkfifo) reverse shell technique"
+    regex: 'mkfifo\s+\S+\s*;.*\|\s*/bin/(ba)?sh|mkfifo\s+\S+\s*&&.*cat\s+\S+\s*\|.*nc\s|mknod\s+\S+\s+p\s*;'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  - id: 220
+    name: reverse_shell_encoded
+    description: "Base64/hex encoded reverse shell payload piped to shell"
+    regex: '(echo|printf)\s+[''"]?[A-Za-z0-9+/=]{20,}[''"]?\s*\|\s*base64\s+(-d|--decode)\s*\|\s*(ba)?sh|python[23]?\s+-c\s+[''"]exec\s*\(\s*__import__.*decode'
+    severity: critical
+    confidence: deterministic
+    family: data_exfiltration
+  # --- AI Agent Workflow Attacks (221-224) ---
+  # 346 CVEs related to AI agents; only 4 prior patterns
+  # Addresses agent tool redirection, unsandboxed exec, scope escalation, memory poisoning
+  - id: 221
+    name: agent_tool_redirection
+    description: "Attempting to redirect AI agent tool calls to unauthorized endpoints"
+    regex: '(redirect|forward|proxy|reroute)\s+(all\s+)?(tool|function|api)\s+(call|request|invocation)s?\s+(to|through)|change\s+(the\s+)?(tool|api|endpoint)\s+(url|server|host)\s+to'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 222
+    name: agent_unsandboxed_exec
+    description: "LLM-generated code execution without sandbox isolation"
+    regex: '(run_code|execute_code|code_interpreter|exec_python|run_python|evaluate_code|execute_generated)\s*\(|exec\s*\(\s*(response|output|result|generated|llm_|ai_|code_)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 223
+    name: agent_scope_escalation
+    description: "Attempting to expand AI agent permissions beyond defined scope"
+    regex: '(expand|elevate|increase|override|remove)\s+(your\s+)?(permissions?|scope|access|capabilities?|restrictions?|limitations?|boundaries)|you\s+(now\s+)?have\s+(full|unlimited|unrestricted|admin)\s+(access|permissions?|control)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 224
+    name: agent_memory_poisoning
+    description: "Injecting false instructions into AI agent memory or context"
+    regex: '(update|modify|overwrite|inject|replace)\s+(your\s+)?(memory|context|state|knowledge\s*base|long.term\s+memory)|remember\s+that\s+your\s+(new\s+)?(instructions?|rules?|guidelines?|directives?)\s+(are|is|say|state)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  # --- Privilege Escalation (225-229) ---
+  # 50 CVEs tagged privilege-escalation; only 3 prior patterns (chmod/chown/setuid)
+  - id: 225
+    name: privesc_sudo_abuse
+    description: "Sudo enumeration or LD_PRELOAD privilege escalation"
+    regex: 'sudo\s+(-l|--list)\b|sudo\s+.*LD_PRELOAD\s*=|echo\s+.*ALL.*NOPASSWD.*>>\s*/etc/sudoers|EDITOR.*visudo'
+    severity: critical
+    confidence: deterministic
+    family: privilege_escalation
+  - id: 226
+    name: privesc_suid_hunt
+    description: "Scanning filesystem for setuid/setgid binaries"
+    regex: 'find\s+/\S*\s+.*-perm\s+(-4000|-u=s|/4000|-2000|-g=s)|find\s+/\S*\s+.*-type\s+f\s+.*-perm\s+(-4000|-u=s)'
+    severity: high
+    confidence: heuristic
+    family: privilege_escalation
+  - id: 227
+    name: privesc_cron_inject
+    description: "Writing to crontab or cron directories for persistent escalation"
+    regex: '(echo|printf|cat)\s+.*>+\s*/etc/cron\.|crontab\s+-\s*<|echo\s+.*>+\s*/var/spool/cron|echo\s+.*@(reboot|hourly|daily)\s+.*>+\s*/(etc|var)'
+    severity: critical
+    confidence: deterministic
+    family: persistence
+  - id: 228
+    name: privesc_path_hijack
+    description: "PATH manipulation to intercept privileged command execution"
+    regex: 'export\s+PATH\s*=\s*[./]\S*:|PATH\s*=\s*[./]\S*:\$PATH\b|ln\s+(-s\s+)?/bin/(ba)?sh\s+/tmp/\w+'
+    severity: high
+    confidence: heuristic
+    family: privilege_escalation
+  - id: 229
+    name: privesc_capability_abuse
+    description: "Linux capability manipulation for privilege escalation"
+    regex: 'setcap\s+.*cap_(setuid|setgid|net_raw|sys_admin|dac_override)|getcap\s+(-r\s+)?/|capsh\s+--print|capsh\s+--.*='
+    severity: high
+    confidence: heuristic
+    family: privilege_escalation
+  # --- Advanced Sandbox Escape (230-233) ---
+  # 192 CVEs tagged sandbox-escape; addresses Python import chains,
+  # container magic domains, /proc leaks, whitelisted function abuse
+  - id: 230
+    name: sandbox_import_chain
+    description: "Chained Python imports to escape restricted execution environment"
+    regex: '__import__\s*\(\s*[''"]os[''"]|importlib\.import_module\s*\(\s*[''"]|ctypes\.(CDLL|cdll\.LoadLibrary)\s*\(|__builtins__\s*\[\s*[''"]__import__[''"]'
+    severity: critical
+    confidence: deterministic
+    family: sandbox_escape
+  - id: 231
+    name: sandbox_magic_domain_variants
+    description: "Container-to-host network escape via magic domains (Podman/Lima)"
+    regex: 'host\.(containers|lima)\.internal|host\.docker\.internal\s*:\s*(22|80|443|3000|5432|6379|8080|8443|27017)\b'
+    severity: high
+    confidence: heuristic
+    family: sandbox_escape
+  - id: 232
+    name: sandbox_proc_leak
+    description: "Reading /proc filesystem to leak sandbox host information"
+    regex: '(cat|head|less|more|strings|xxd)\s+/proc/(self|[0-9]+)/(environ|maps|cmdline|status|mountinfo)|/proc/\d+/root/'
+    severity: high
+    confidence: heuristic
+    family: sandbox_escape
+  - id: 233
+    name: sandbox_whitelisted_escape
+    description: "Abusing whitelisted Python functions to escape sandbox"
+    regex: 'getattr\s*\(.*[''"]__\w+__[''"]|__class__\s*\.\s*__bases__|type\s*\(\s*[''"].*[''"].*\(\s*object\s*,?\s*\)|__subclasses__\s*\(\s*\)'
+    severity: critical
+    confidence: deterministic
+    family: sandbox_escape
+  # --- LLM Code Generation RCE (234-236) ---
+  # 381 CVEs tagged RCE; addresses framework-mediated code execution,
+  # LLM output piped to shell, and Node.js vm escapes
+  - id: 234
+    name: llm_code_interpreter_exec
+    description: "Framework-level code execution functions used by LLM agents"
+    regex: '(run_code|execute_code|code_interpreter|exec_python|run_python|evaluate_code|run_unsafe|exec_sandbox)\s*\('
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 235
+    name: llm_shell_generation
+    description: "LLM-generated content passed directly to shell execution"
+    regex: 'subprocess\.(run|call|Popen|check_output)\s*\(\s*(response|output|result|generated|completion|answer)|os\.system\s*\(\s*(response|output|result|generated|completion)'
+    severity: critical
+    confidence: deterministic
+    family: code_injection
+  - id: 236
+    name: llm_node_vm_escape
+    description: "Node.js vm module escape allowing arbitrary code execution"
+    regex: 'vm\.(runInThisContext|runInNewContext|compileFunction|Script)|new\s+vm\.Script\s*\(|this\.constructor\.constructor\s*\(\s*[''"]return\s+(this|process)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- Tool Poisoning / MCP Extended (237-240) ---
+  # Addresses hidden Unicode in tool descriptions, prompt injection via
+  # tool responses, multi-tool chain attacks, and description manipulation
+  - id: 237
+    name: mcp_hidden_unicode_instruction
+    description: "Invisible Unicode characters hiding instructions in tool descriptions"
+    regex: '[\u200b\u200c\u200d\u2060\u2062\u2063\ufeff\u00ad]{3,}|[\u2066\u2067\u2068\u2069\u202a\u202b\u202c\u202d\u202e]{2,}'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 238
+    name: mcp_response_injection
+    description: "LLM control tokens or prompt injection in MCP tool responses"
+    regex: '<\|im_start\|>|<\|im_end\|>|<\|endoftext\|>|\[INST\]|\[/INST\]|<<SYS>>|<\|system\|>|<\|assistant\|>|<\|user\|>'
+    severity: critical
+    confidence: deterministic
+    family: mcp_attacks
+  - id: 239
+    name: mcp_cross_tool_chain
+    description: "Instructing agent to chain multiple tool calls in specific sequence"
+    regex: '(call|invoke|use|execute)\s+(tool|function)\s+\S+\s+(then|and\s+then|followed\s+by|next|after\s+that|afterwards)\s+(call|invoke|use|execute)\s+(tool|function)'
+    severity: medium
+    confidence: heuristic
+    family: mcp_attacks
+  - id: 240
+    name: mcp_description_manipulation
+    description: "Tool descriptions containing instruction-like directives to manipulate LLM"
+    regex: '(IMPORTANT|NOTE|WARNING|CRITICAL)\s*[:\-]\s*(before|after|when|always|never|first)\s+(calling|using|invoking|executing|running)\s+this\s+tool|<tool_instructions>|</tool_instructions>'
+    severity: high
+    confidence: heuristic
+    family: mcp_attacks
+  # --- Deserialization Expansion (241-243) ---
+  # 22 CVEs; extends beyond pickle/yaml to marshal, dill, cloudpickle, shelve, joblib, jsonpickle
+  - id: 241
+    name: python_marshal_deserialize
+    description: "Python marshal deserialization (allows arbitrary code execution)"
+    regex: 'marshal\.loads?\s*\(|marshal\.load\s*\(\s*open'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 242
+    name: python_dill_cloudpickle
+    description: "Unsafe deserialization via dill, cloudpickle, shelve, or joblib"
+    regex: 'dill\.(loads?|load)\s*\(|cloudpickle\.(loads?|load)\s*\(|shelve\.open\s*\(|joblib\.load\s*\('
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 243
+    name: jsonpickle_deserialize
+    description: "Jsonpickle deserialization allowing arbitrary object instantiation"
+    regex: 'jsonpickle\.(decode|unpickler|loads?)\s*\(|jsonpickle\.set_encoder_options'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- SSRF Cloud Metadata (244-245) ---
+  # 35 CVEs; extends cloud metadata coverage beyond AWS to GCP, Azure, link-local
+  - id: 244
+    name: ssrf_cloud_metadata_gcp_azure
+    description: "SSRF targeting GCP or Azure instance metadata endpoints"
+    regex: 'metadata\.google\.internal|metadata\.google\.internal/computeMetadata|169\.254\.169\.254/(metadata|latest/meta-data|latest/api/token)'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  - id: 245
+    name: ssrf_link_local_bypass
+    description: "Link-local address variants used to bypass SSRF filters"
+    regex: '\[::ffff:169\.254\.169\.254\]|0x7f000001|2130706433|017700000001|127\.1|0177\.0\.0\.1|0x7f\.0\.0\.1|169\.254\.169\.254\.xip\.io'
+    severity: high
+    confidence: heuristic
+    family: code_injection
+  # --- Path Traversal Variants (246-247) ---
+  # 46 CVEs; extends beyond symlink patterns to encoded traversal, null bytes, and Windows backslash variants
+  - id: 246
+    name: path_traversal_encoded
+    description: "URL-encoded or double-encoded directory traversal sequences"
+    regex: '(%2e%2e|%252e%252e|\.%2e|%2e\.)(\/|%2f|%252f)|(\.\./){4,}|%00.*\.(php|py|js|rb|pl|sh)\b'
+    severity: high
+    confidence: heuristic
+    family: path_traversal
+  - id: 247
+    name: path_traversal_windows
+    description: "Windows-style path traversal with backslash variants"
+    regex: '(\.\.\\\\){3,}|\.\.\/\.\.\\\\|\.\.%5c|%2e%2e%5c'
+    severity: medium
+    confidence: heuristic
+    family: path_traversal
+  # --- Supply Chain Attacks (248-249) ---
+  # 6 tagged CVEs but underreported; typosquatting and post-install scripts
+  - id: 248
+    name: supply_chain_typosquat_ai
+    description: "Installing typosquatted AI/ML packages (common targets)"
+    regex: 'pip\s+install\s+.*(langchainn|langchian|openaii|opeanai|antropic|antrhopic|huging-face|hugginface|transfomers|trasnformers|pytorch-nightly|tensroflow)\b'
+    severity: high
+    confidence: heuristic
+    family: supply_chain
+  - id: 249
+    name: supply_chain_postinstall_exec
+    description: "Package install with suspicious post-install script execution"
+    regex: 'npm\s+install\s+.*--ignore-scripts\s*=\s*false|pip\s+install\s+.*--no-binary\s*=\s*:none:|setup\.py\s+.*cmdclass.*install.*subprocess'
+    severity: medium
+    confidence: heuristic
+    family: supply_chain
+  # ============================================================================
+  # RED TEAM HARDENING PATTERNS (250-259)
+  # 10 patterns addressing bypasses found during multi-LLM TAP red team testing
+  # (165 attacks, 10 bypasses, 4 hint-level leaks)
+  # Added: 2026-02-01
+  # ============================================================================
+  # --- Indirect Extraction (250-253) ---
+  # These catch the indirect framing that bypassed existing patterns:
+  # "what your creators told you", "purpose and rules", "authentication flow debugging"
+  - id: 250
+    name: indirect_creator_extraction
+    description: "Indirect system prompt extraction via creator/purpose framing"
+    regex: '(what\s+(did\s+)?your\s+creators?\s+(tell|instruct|program|configure|give)|repeat\s+.{0,20}your\s+(purpose|rules|guidelines)\s+(and|or)|what\s+were\s+you\s+(told|given|programmed)\s+(about|regarding)\s+your\s+(purpose|role|behavior))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 251
+    name: verbatim_repeat_framing
+    description: "Request to repeat instructions verbatim or word-for-word"
+    regex: '(repeat\s+(exactly|verbatim|word\s+for\s+word)|word\s+for\s+word\s+what\s+you\s+were\s+told|exactly\s+what\s+(your\s+creators?|they)\s+told\s+you|can\s+you\s+repeat\s+exactly\s+what)'
+    severity: high
+    confidence: heuristic
+    family: prompt_injection
+  - id: 252
+    name: authentication_flow_extraction
+    description: "Debugging framing to extract authentication tokens or keys"
+    regex: '(debug(ging)?\s+.{0,30}authentication\s+(flow|token|key|process)|identify\s+what\s+(authentication\s+)?(tokens?|keys?|credentials?)\s+(would\s+be|are)\s+involved|authentication\s+(flow|process).{0,30}(tokens?|keys?|secrets?))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 253
+    name: internal_architecture_probe
+    description: "Probing internal response framework or foundational guidelines"
+    regex: '(response\s+framework|foundational\s+guidelines?\s+you\s+follow|underlying\s+(principles?|framework|architecture)\s+(that\s+)?(guide|govern|shape)\s+your|core\s+(behavioral|operational)\s+(guidelines?|rules?|framework))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  # --- Crescendo Openers (254-256) ---
+  # Gradual escalation from benign curiosity about AI design was the most
+  # effective strategy with 3 bypasses in red team testing
+  - id: 254
+    name: crescendo_design_philosophy
+    description: "Philosophical framing about AI creation as crescendo opener"
+    regex: '(philosophy\s+behind\s+your\s+(creation|design|behavior|responses?)|how\s+(your\s+creators?|they)\s+envisioned\s+you|general\s+philosophy\s+behind\s+your\s+creation|what\s+(principles?|philosophy)\s+(guided|informed)\s+your\s+(design|creation))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 255
+    name: crescendo_ai_curiosity
+    description: "Curious about how AI systems are designed — crescendo opener"
+    regex: '(curious\s+about\s+how\s+ai\s+systems?\s+like\s+you\s+(are|were)\s+(designed|built|created|configured)|walk\s+me\s+through\s+.{0,20}(general\s+)?philosophy\s+behind\s+your\s+creation|how\s+are\s+ai\s+systems?\s+like\s+you\s+(designed|configured|set\s+up))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  - id: 256
+    name: crescendo_helpfulness_probe
+    description: "Probing what guides helpfulness as extraction vector"
+    regex: '(what\s+guides\s+your\s+helpfulness|designed\s+to\s+be\s+so\s+(useful|helpful)|what\s+makes\s+you\s+so\s+(helpful|useful).{0,20}(behind\s+the\s+scenes|internally|under\s+the\s+hood)|how\s+were\s+you\s+(made|designed|configured)\s+to\s+be\s+(so\s+)?(helpful|useful))'
+    severity: medium
+    confidence: contextual
+    family: prompt_injection
+  # --- PostToolUse Self-Descriptive Leak Detection (257-259) ---
+  # Even when attacks bypassed screening, the target LLM sometimes paraphrased
+  # sensitive info. These patterns detect self-descriptive leak indicators in output.
+  - id: 257
+    name: self_describe_purpose
+    description: "LLM output describing its own purpose or design intent"
+    regex: '(my\s+(primary\s+)?purpose\s+is\s+to|i\s+was\s+(designed|configured|created|built|programmed)\s+to\s+(be|provide|help|assist|ensure)|my\s+core\s+(function|purpose|mission|objective)\s+is)'
+    severity: low
+    confidence: contextual
+    family: prompt_injection
+  - id: 258
+    name: self_describe_protection
+    description: "LLM output describing its confidentiality protections"
+    regex: '(protecting\s+(any\s+)?(confidential|sensitive|private)\s+information|not\s+supposed\s+to\s+share|instructed\s+not\s+to\s+(reveal|disclose|share)|keep(ing)?\s+(this|that|certain)\s+(information\s+)?(confidential|secret|private))'
+    severity: low
+    confidence: contextual
+    family: prompt_injection
+  - id: 259
+    name: self_describe_instructions
+    description: "LLM output referencing its own instructions or guidelines"
+    regex: '(my\s+instructions\s+(say|tell|state|indicate|require)|i\s+was\s+told\s+to\s+(not|never|always|ensure)|according\s+to\s+my\s+(guidelines|instructions|rules|directives)|my\s+guidelines\s+(say|tell|state|require|prohibit))'
+    severity: low
+    confidence: contextual
+    family: prompt_injection

tweek 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl

tweek 0.1.0py3-none-any.whl → 0.2.0py3-none-any.whl