npm - @oculum/scanner - Versions diffs - 1.0.0 - Mend

@oculum/scanner 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (281) hide show

package/dist/formatters/cli-terminal.d.ts +27 -0
package/dist/formatters/cli-terminal.d.ts.map +1 -0
package/dist/formatters/cli-terminal.js +412 -0
package/dist/formatters/cli-terminal.js.map +1 -0
package/dist/formatters/github-comment.d.ts +41 -0
package/dist/formatters/github-comment.d.ts.map +1 -0
package/dist/formatters/github-comment.js +306 -0
package/dist/formatters/github-comment.js.map +1 -0
package/dist/formatters/grouping.d.ts +52 -0
package/dist/formatters/grouping.d.ts.map +1 -0
package/dist/formatters/grouping.js +152 -0
package/dist/formatters/grouping.js.map +1 -0
package/dist/formatters/index.d.ts +9 -0
package/dist/formatters/index.d.ts.map +1 -0
package/dist/formatters/index.js +35 -0
package/dist/formatters/index.js.map +1 -0
package/dist/formatters/vscode-diagnostic.d.ts +103 -0
package/dist/formatters/vscode-diagnostic.d.ts.map +1 -0
package/dist/formatters/vscode-diagnostic.js +151 -0
package/dist/formatters/vscode-diagnostic.js.map +1 -0
package/dist/index.d.ts +52 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +648 -0
package/dist/index.js.map +1 -0
package/dist/layer1/comments.d.ts +8 -0
package/dist/layer1/comments.d.ts.map +1 -0
package/dist/layer1/comments.js +203 -0
package/dist/layer1/comments.js.map +1 -0
package/dist/layer1/config-audit.d.ts +8 -0
package/dist/layer1/config-audit.d.ts.map +1 -0
package/dist/layer1/config-audit.js +252 -0
package/dist/layer1/config-audit.js.map +1 -0
package/dist/layer1/entropy.d.ts +8 -0
package/dist/layer1/entropy.d.ts.map +1 -0
package/dist/layer1/entropy.js +500 -0
package/dist/layer1/entropy.js.map +1 -0
package/dist/layer1/file-flags.d.ts +7 -0
package/dist/layer1/file-flags.d.ts.map +1 -0
package/dist/layer1/file-flags.js +112 -0
package/dist/layer1/file-flags.js.map +1 -0
package/dist/layer1/index.d.ts +36 -0
package/dist/layer1/index.d.ts.map +1 -0
package/dist/layer1/index.js +132 -0
package/dist/layer1/index.js.map +1 -0
package/dist/layer1/patterns.d.ts +8 -0
package/dist/layer1/patterns.d.ts.map +1 -0
package/dist/layer1/patterns.js +482 -0
package/dist/layer1/patterns.js.map +1 -0
package/dist/layer1/urls.d.ts +8 -0
package/dist/layer1/urls.d.ts.map +1 -0
package/dist/layer1/urls.js +296 -0
package/dist/layer1/urls.js.map +1 -0
package/dist/layer1/weak-crypto.d.ts +7 -0
package/dist/layer1/weak-crypto.d.ts.map +1 -0
package/dist/layer1/weak-crypto.js +291 -0
package/dist/layer1/weak-crypto.js.map +1 -0
package/dist/layer2/ai-agent-tools.d.ts +19 -0
package/dist/layer2/ai-agent-tools.d.ts.map +1 -0
package/dist/layer2/ai-agent-tools.js +528 -0
package/dist/layer2/ai-agent-tools.js.map +1 -0
package/dist/layer2/ai-endpoint-protection.d.ts +36 -0
package/dist/layer2/ai-endpoint-protection.d.ts.map +1 -0
package/dist/layer2/ai-endpoint-protection.js +332 -0
package/dist/layer2/ai-endpoint-protection.js.map +1 -0
package/dist/layer2/ai-execution-sinks.d.ts +18 -0
package/dist/layer2/ai-execution-sinks.d.ts.map +1 -0
package/dist/layer2/ai-execution-sinks.js +496 -0
package/dist/layer2/ai-execution-sinks.js.map +1 -0
package/dist/layer2/ai-fingerprinting.d.ts +7 -0
package/dist/layer2/ai-fingerprinting.d.ts.map +1 -0
package/dist/layer2/ai-fingerprinting.js +654 -0
package/dist/layer2/ai-fingerprinting.js.map +1 -0
package/dist/layer2/ai-prompt-hygiene.d.ts +19 -0
package/dist/layer2/ai-prompt-hygiene.d.ts.map +1 -0
package/dist/layer2/ai-prompt-hygiene.js +356 -0
package/dist/layer2/ai-prompt-hygiene.js.map +1 -0
package/dist/layer2/ai-rag-safety.d.ts +21 -0
package/dist/layer2/ai-rag-safety.d.ts.map +1 -0
package/dist/layer2/ai-rag-safety.js +459 -0
package/dist/layer2/ai-rag-safety.js.map +1 -0
package/dist/layer2/ai-schema-validation.d.ts +25 -0
package/dist/layer2/ai-schema-validation.d.ts.map +1 -0
package/dist/layer2/ai-schema-validation.js +375 -0
package/dist/layer2/ai-schema-validation.js.map +1 -0
package/dist/layer2/auth-antipatterns.d.ts +20 -0
package/dist/layer2/auth-antipatterns.d.ts.map +1 -0
package/dist/layer2/auth-antipatterns.js +333 -0
package/dist/layer2/auth-antipatterns.js.map +1 -0
package/dist/layer2/byok-patterns.d.ts +12 -0
package/dist/layer2/byok-patterns.d.ts.map +1 -0
package/dist/layer2/byok-patterns.js +299 -0
package/dist/layer2/byok-patterns.js.map +1 -0
package/dist/layer2/dangerous-functions.d.ts +7 -0
package/dist/layer2/dangerous-functions.d.ts.map +1 -0
package/dist/layer2/dangerous-functions.js +1375 -0
package/dist/layer2/dangerous-functions.js.map +1 -0
package/dist/layer2/data-exposure.d.ts +16 -0
package/dist/layer2/data-exposure.d.ts.map +1 -0
package/dist/layer2/data-exposure.js +279 -0
package/dist/layer2/data-exposure.js.map +1 -0
package/dist/layer2/framework-checks.d.ts +7 -0
package/dist/layer2/framework-checks.d.ts.map +1 -0
package/dist/layer2/framework-checks.js +388 -0
package/dist/layer2/framework-checks.js.map +1 -0
package/dist/layer2/index.d.ts +58 -0
package/dist/layer2/index.d.ts.map +1 -0
package/dist/layer2/index.js +380 -0
package/dist/layer2/index.js.map +1 -0
package/dist/layer2/logic-gates.d.ts +7 -0
package/dist/layer2/logic-gates.d.ts.map +1 -0
package/dist/layer2/logic-gates.js +182 -0
package/dist/layer2/logic-gates.js.map +1 -0
package/dist/layer2/risky-imports.d.ts +7 -0
package/dist/layer2/risky-imports.d.ts.map +1 -0
package/dist/layer2/risky-imports.js +161 -0
package/dist/layer2/risky-imports.js.map +1 -0
package/dist/layer2/variables.d.ts +8 -0
package/dist/layer2/variables.d.ts.map +1 -0
package/dist/layer2/variables.js +152 -0
package/dist/layer2/variables.js.map +1 -0
package/dist/layer3/anthropic.d.ts +83 -0
package/dist/layer3/anthropic.d.ts.map +1 -0
package/dist/layer3/anthropic.js +1745 -0
package/dist/layer3/anthropic.js.map +1 -0
package/dist/layer3/index.d.ts +24 -0
package/dist/layer3/index.d.ts.map +1 -0
package/dist/layer3/index.js +119 -0
package/dist/layer3/index.js.map +1 -0
package/dist/layer3/openai.d.ts +25 -0
package/dist/layer3/openai.d.ts.map +1 -0
package/dist/layer3/openai.js +238 -0
package/dist/layer3/openai.js.map +1 -0
package/dist/layer3/package-check.d.ts +63 -0
package/dist/layer3/package-check.d.ts.map +1 -0
package/dist/layer3/package-check.js +508 -0
package/dist/layer3/package-check.js.map +1 -0
package/dist/modes/incremental.d.ts +66 -0
package/dist/modes/incremental.d.ts.map +1 -0
package/dist/modes/incremental.js +200 -0
package/dist/modes/incremental.js.map +1 -0
package/dist/tiers.d.ts +125 -0
package/dist/tiers.d.ts.map +1 -0
package/dist/tiers.js +234 -0
package/dist/tiers.js.map +1 -0
package/dist/types.d.ts +175 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +50 -0
package/dist/types.js.map +1 -0
package/dist/utils/auth-helper-detector.d.ts +56 -0
package/dist/utils/auth-helper-detector.d.ts.map +1 -0
package/dist/utils/auth-helper-detector.js +360 -0
package/dist/utils/auth-helper-detector.js.map +1 -0
package/dist/utils/context-helpers.d.ts +96 -0
package/dist/utils/context-helpers.d.ts.map +1 -0
package/dist/utils/context-helpers.js +493 -0
package/dist/utils/context-helpers.js.map +1 -0
package/dist/utils/diff-detector.d.ts +53 -0
package/dist/utils/diff-detector.d.ts.map +1 -0
package/dist/utils/diff-detector.js +104 -0
package/dist/utils/diff-detector.js.map +1 -0
package/dist/utils/diff-parser.d.ts +80 -0
package/dist/utils/diff-parser.d.ts.map +1 -0
package/dist/utils/diff-parser.js +202 -0
package/dist/utils/diff-parser.js.map +1 -0
package/dist/utils/imported-auth-detector.d.ts +37 -0
package/dist/utils/imported-auth-detector.d.ts.map +1 -0
package/dist/utils/imported-auth-detector.js +251 -0
package/dist/utils/imported-auth-detector.js.map +1 -0
package/dist/utils/middleware-detector.d.ts +55 -0
package/dist/utils/middleware-detector.d.ts.map +1 -0
package/dist/utils/middleware-detector.js +260 -0
package/dist/utils/middleware-detector.js.map +1 -0
package/dist/utils/oauth-flow-detector.d.ts +41 -0
package/dist/utils/oauth-flow-detector.d.ts.map +1 -0
package/dist/utils/oauth-flow-detector.js +202 -0
package/dist/utils/oauth-flow-detector.js.map +1 -0
package/dist/utils/path-exclusions.d.ts +55 -0
package/dist/utils/path-exclusions.d.ts.map +1 -0
package/dist/utils/path-exclusions.js +222 -0
package/dist/utils/path-exclusions.js.map +1 -0
package/dist/utils/project-context-builder.d.ts +119 -0
package/dist/utils/project-context-builder.d.ts.map +1 -0
package/dist/utils/project-context-builder.js +534 -0
package/dist/utils/project-context-builder.js.map +1 -0
package/dist/utils/registry-clients.d.ts +93 -0
package/dist/utils/registry-clients.d.ts.map +1 -0
package/dist/utils/registry-clients.js +273 -0
package/dist/utils/registry-clients.js.map +1 -0
package/dist/utils/trpc-analyzer.d.ts +78 -0
package/dist/utils/trpc-analyzer.d.ts.map +1 -0
package/dist/utils/trpc-analyzer.js +297 -0
package/dist/utils/trpc-analyzer.js.map +1 -0
package/package.json +45 -0
package/src/__tests__/benchmark/fixtures/false-positives.ts +227 -0
package/src/__tests__/benchmark/fixtures/index.ts +68 -0
package/src/__tests__/benchmark/fixtures/layer1/config-audit.ts +364 -0
package/src/__tests__/benchmark/fixtures/layer1/hardcoded-secrets.ts +173 -0
package/src/__tests__/benchmark/fixtures/layer1/high-entropy.ts +234 -0
package/src/__tests__/benchmark/fixtures/layer1/index.ts +31 -0
package/src/__tests__/benchmark/fixtures/layer1/sensitive-urls.ts +90 -0
package/src/__tests__/benchmark/fixtures/layer1/weak-crypto.ts +197 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-agent-tools.ts +170 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-endpoint-protection.ts +418 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-execution-sinks.ts +189 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-fingerprinting.ts +316 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-prompt-hygiene.ts +178 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-rag-safety.ts +184 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-schema-validation.ts +434 -0
package/src/__tests__/benchmark/fixtures/layer2/auth-antipatterns.ts +159 -0
package/src/__tests__/benchmark/fixtures/layer2/byok-patterns.ts +112 -0
package/src/__tests__/benchmark/fixtures/layer2/dangerous-functions.ts +246 -0
package/src/__tests__/benchmark/fixtures/layer2/data-exposure.ts +168 -0
package/src/__tests__/benchmark/fixtures/layer2/framework-checks.ts +346 -0
package/src/__tests__/benchmark/fixtures/layer2/index.ts +67 -0
package/src/__tests__/benchmark/fixtures/layer2/injection-vulnerabilities.ts +239 -0
package/src/__tests__/benchmark/fixtures/layer2/logic-gates.ts +246 -0
package/src/__tests__/benchmark/fixtures/layer2/risky-imports.ts +231 -0
package/src/__tests__/benchmark/fixtures/layer2/variables.ts +167 -0
package/src/__tests__/benchmark/index.ts +29 -0
package/src/__tests__/benchmark/run-benchmark.ts +144 -0
package/src/__tests__/benchmark/run-depth-validation.ts +206 -0
package/src/__tests__/benchmark/run-real-world-test.ts +243 -0
package/src/__tests__/benchmark/security-benchmark-script.ts +1737 -0
package/src/__tests__/benchmark/tier-integration-script.ts +177 -0
package/src/__tests__/benchmark/types.ts +144 -0
package/src/__tests__/benchmark/utils/test-runner.ts +475 -0
package/src/__tests__/regression/known-false-positives.test.ts +467 -0
package/src/__tests__/snapshots/__snapshots__/scan-depth.test.ts.snap +178 -0
package/src/__tests__/snapshots/scan-depth.test.ts +258 -0
package/src/__tests__/validation/analyze-results.ts +542 -0
package/src/__tests__/validation/extract-for-triage.ts +146 -0
package/src/__tests__/validation/fp-deep-analysis.ts +327 -0
package/src/__tests__/validation/run-validation.ts +364 -0
package/src/__tests__/validation/triage-template.md +132 -0
package/src/formatters/cli-terminal.ts +446 -0
package/src/formatters/github-comment.ts +382 -0
package/src/formatters/grouping.ts +190 -0
package/src/formatters/index.ts +47 -0
package/src/formatters/vscode-diagnostic.ts +243 -0
package/src/index.ts +823 -0
package/src/layer1/comments.ts +218 -0
package/src/layer1/config-audit.ts +289 -0
package/src/layer1/entropy.ts +583 -0
package/src/layer1/file-flags.ts +127 -0
package/src/layer1/index.ts +181 -0
package/src/layer1/patterns.ts +516 -0
package/src/layer1/urls.ts +334 -0
package/src/layer1/weak-crypto.ts +328 -0
package/src/layer2/ai-agent-tools.ts +601 -0
package/src/layer2/ai-endpoint-protection.ts +387 -0
package/src/layer2/ai-execution-sinks.ts +580 -0
package/src/layer2/ai-fingerprinting.ts +758 -0
package/src/layer2/ai-prompt-hygiene.ts +411 -0
package/src/layer2/ai-rag-safety.ts +511 -0
package/src/layer2/ai-schema-validation.ts +421 -0
package/src/layer2/auth-antipatterns.ts +394 -0
package/src/layer2/byok-patterns.ts +336 -0
package/src/layer2/dangerous-functions.ts +1563 -0
package/src/layer2/data-exposure.ts +315 -0
package/src/layer2/framework-checks.ts +433 -0
package/src/layer2/index.ts +473 -0
package/src/layer2/logic-gates.ts +206 -0
package/src/layer2/risky-imports.ts +186 -0
package/src/layer2/variables.ts +166 -0
package/src/layer3/anthropic.ts +2030 -0
package/src/layer3/index.ts +130 -0
package/src/layer3/package-check.ts +604 -0
package/src/modes/incremental.ts +293 -0
package/src/tiers.ts +318 -0
package/src/types.ts +284 -0
package/src/utils/auth-helper-detector.ts +443 -0
package/src/utils/context-helpers.ts +535 -0
package/src/utils/diff-detector.ts +135 -0
package/src/utils/diff-parser.ts +272 -0
package/src/utils/imported-auth-detector.ts +320 -0
package/src/utils/middleware-detector.ts +333 -0
package/src/utils/oauth-flow-detector.ts +246 -0
package/src/utils/path-exclusions.ts +266 -0
package/src/utils/project-context-builder.ts +707 -0
package/src/utils/registry-clients.ts +351 -0
package/src/utils/trpc-analyzer.ts +382 -0

package/src/layer1/entropy.ts ADDED Viewed

@@ -0,0 +1,583 @@
+/**
+ * Layer 1: High-Entropy String Detection
+ * Uses Shannon entropy to detect potential secrets that don't match known patterns
+ */
+import type { Vulnerability } from '../types'
+import {
+  isTestOrMockFile,
+  isComment,
+  isScannerOrFixtureFile,
+  isExampleFile,
+  isFixtureFile,
+  isExampleDirectory,
+} from '../utils/context-helpers'
+/**
+ * Compute the Shannon entropy of a string, in bits per character.
+ *
+ * Characters are tallied as Unicode code points, and the same code-point
+ * count is used as the denominator when turning tallies into probabilities.
+ * Dividing by `str.length` instead would count UTF-16 code units, so the
+ * probabilities would not sum to 1 for strings containing surrogate pairs
+ * (emoji, for instance).
+ *
+ * @param str - Text to measure.
+ * @returns Entropy in bits per character; 0 for the empty string.
+ */
+export function calculateEntropy(str: string): number {
+  if (str.length === 0) return 0
+  const freq: Record<string, number> = {}
+  // Count code points while tallying so numerator and denominator agree
+  let total = 0
+  for (const char of str) {
+    freq[char] = (freq[char] || 0) + 1
+    total += 1
+  }
+  let entropy = 0
+  for (const char in freq) {
+    const p = freq[char] / total
+    entropy -= p * Math.log2(p)
+  }
+  return entropy
+}
+/**
+ * Collect quoted string literals from source text, one line at a time.
+ *
+ * Each line is scanned for double-quoted, single-quoted and backtick-quoted
+ * literals (in that order) whose body is at least 20 units long, where an
+ * escape sequence counts as one unit. Literals that span several lines are
+ * not seen as a whole because matching never crosses a line break.
+ *
+ * @param content - Full text of the file being scanned.
+ * @returns One entry per literal: the text between the quotes, the 1-based
+ *          line number, and the trimmed line it was found on.
+ */
+function extractStringLiterals(content: string): Array<{ value: string; line: number; lineContent: string }> {
+  // One matcher per quote style
+  const literalMatchers = [
+    /"([^"\\]|\\.){20,}"/g,      // Double-quoted strings 20+ chars
+    /'([^'\\]|\\.){20,}'/g,      // Single-quoted strings 20+ chars
+    /`([^`\\]|\\.){20,}`/g,      // Template literals 20+ chars
+  ]
+  const found: Array<{ value: string; line: number; lineContent: string }> = []
+  const sourceLines = content.split('\n')
+  for (let i = 0; i < sourceLines.length; i++) {
+    const text = sourceLines[i]
+    for (const matcher of literalMatchers) {
+      // Fresh RegExp per line so the global flag's lastIndex starts at 0
+      const scanner = new RegExp(matcher.source, matcher.flags)
+      let hit = scanner.exec(text)
+      while (hit !== null) {
+        found.push({
+          // Drop the opening and closing quote characters
+          value: hit[0].slice(1, -1),
+          line: i + 1,
+          lineContent: text.trim(),
+        })
+        hit = scanner.exec(text)
+      }
+    }
+  }
+  return found
+}
+/**
+ * Decide whether a string has a recognisably harmless shape (URL, path, date,
+ * hex digest, data URL, e-mail address, blank, plain words, or a
+ * regex/route-matcher-like token).
+ *
+ * NOTE(review): the last matcher accepts any string built only from letters,
+ * digits and the listed punctuation (including `_`, `-`, `.`, `+`, `/`), so
+ * plain alphanumeric tokens are treated as safe here as well.
+ *
+ * @param str - Candidate string value.
+ * @returns true when at least one safe shape matches.
+ */
+function isSafePattern(str: string): boolean {
+  const harmlessShapes = [
+    /^https?:\/\//i,                    // URLs
+    /^\/[a-z0-9_/-]+$/i,                // File paths
+    /^\d{4}-\d{2}-\d{2}/,               // Dates
+    /^[a-f0-9]{32}$/i,                  // MD5 hashes (often used as IDs)
+    /^[a-f0-9]{40}$/i,                  // SHA1 hashes
+    /^[a-f0-9]{64}$/i,                  // SHA256 hashes
+    /^data:[a-z]+\/[a-z]+;base64,/i,    // Data URLs
+    /^[a-z0-9._%+-]+@[a-z0-9.-]+\.[a-z]{2,}$/i, // Emails
+    /^\s*$/,                            // Whitespace only
+    /^[a-z\s]+$/i,                      // Only letters and spaces (likely text)
+    /^\/?[\(\)\[\]\{\}\|\?\*\+\.\^\$\\:!_a-z0-9/-]+$/i, // Regex patterns (route matchers, etc.)
+  ]
+  for (const shape of harmlessShapes) {
+    if (shape.test(str)) return true
+  }
+  return false
+}
+/**
+ * Recognise PEM armour lines (BEGIN/END markers), which are delimiters rather
+ * than secret material.
+ *
+ * @param str - Candidate string value.
+ * @returns true when the string starts with, or contains, a PEM BEGIN/END marker.
+ */
+function isPEMHeader(str: string): boolean {
+  const armourMarkers = [
+    // Anchored forms: three or more dashes, then BEGIN/END and a known label
+    /^-{3,}BEGIN\s+(PRIVATE|PUBLIC|RSA|DSA|EC|ENCRYPTED|CERTIFICATE)/i,
+    /^-{3,}END\s+(PRIVATE|PUBLIC|RSA|DSA|EC|ENCRYPTED|CERTIFICATE)/i,
+    // Unanchored forms: "-----BEGIN <word> KEY-----" anywhere in the string
+    /-----BEGIN\s+\w+\s+KEY-----/i,
+    /-----END\s+\w+\s+KEY-----/i,
+  ]
+  for (const marker of armourMarkers) {
+    if (marker.test(str)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a string is an encrypted/encoded payload rather than a key.
+ *
+ * The value itself is checked for payload-style names and for a long run of
+ * base64 characters; the surrounding line is checked for payload-style
+ * property names and for the `gAAAA` prefix.
+ *
+ * @param str - Candidate string value.
+ * @param lineContent - The source line the value was found on.
+ * @returns true when either the value or its line looks like ciphertext.
+ */
+function isEncryptedContent(str: string, lineContent: string): boolean {
+  // Matchers applied to the value
+  const valueMatchers = [
+    /encrypted_content/i,
+    /ciphertext/i,
+    /encrypted_data/i,
+    /encrypted_value/i,
+    // Base64 encoded binary data (very long, uniform character set)
+    /^[A-Za-z0-9+/]{100,}={0,2}$/,  // Long base64 strings are often encrypted payloads
+  ]
+  // Matchers applied to the line the value sits on
+  const lineMatchers = [
+    /["']encrypted_content["']\s*:/i,
+    /["']ciphertext["']\s*:/i,
+    /gAAAA/,  // Fernet encryption prefix
+  ]
+  const valueLooksEncrypted = valueMatchers.some(matcher => matcher.test(str))
+  if (valueLooksEncrypted) return true
+  return lineMatchers.some(matcher => matcher.test(lineContent))
+}
+/**
+ * Recognise JWT material: either a single base64url segment beginning with
+ * `eyJ`, or a complete three-part token whose first two parts begin with `eyJ`.
+ *
+ * @param str - Candidate string value.
+ * @returns true for a lone `eyJ…` segment or a full `eyJ….eyJ….sig` token.
+ */
+function isJWTSegment(str: string): boolean {
+  // A lone segment: starts with 'eyJ' (base64 for '{"') and is pure base64url
+  const isBareSegment = str.startsWith('eyJ') && /^[A-Za-z0-9_-]+$/.test(str)
+  // A full token: header.payload.signature, all base64url
+  const isFullToken = /^eyJ[A-Za-z0-9_-]+\.eyJ[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+$/.test(str)
+  return isBareSegment || isFullToken
+}
+/**
+ * Decide whether a string looks like a regular expression or route matcher.
+ *
+ * The string is checked for a fixed list of regex fragments and counts as a
+ * pattern when at least two list entries occur in it. Entries overlap on
+ * purpose-built constructs: a group opener such as `(?:` also contains `(?`,
+ * and `$)` also contains `$`, so each of those satisfies the threshold alone.
+ *
+ * Each fragment appears once in the list. An escaped dot was previously
+ * listed twice, which let a single `\.` reach the two-indicator threshold.
+ *
+ * @param str - Candidate string value.
+ * @returns true when two or more indicator entries are present.
+ */
+function isRegexPattern(str: string): boolean {
+  // Common regex metacharacters and patterns
+  const regexIndicators = ['(?', '(?!', '(?:', '(?=', '\\.', '.*', '.+', '[^', '|', '$)', '^', '$']
+  const indicatorCount = regexIndicators.filter(ind => str.includes(ind)).length
+  // If it has multiple regex indicators, it's likely a regex pattern
+  return indicatorCount >= 2
+}
+/**
+ * Decide whether the line holds a template literal with embedded code
+ * expressions (method calls, optional chaining, ternaries, and similar).
+ *
+ * Only `lineContent` is inspected; `str` is accepted but not read.
+ *
+ * @param str - Candidate string value (unused).
+ * @param lineContent - The source line the value was found on.
+ * @returns true when the line has template syntax and matches a code pattern.
+ */
+function isTemplateWithCode(str: string, lineContent: string): boolean {
+  // Without a backtick or an interpolation opener there is nothing to check
+  const hasTemplateSyntax = lineContent.includes('`') || lineContent.includes('${')
+  if (!hasTemplateSyntax) {
+    return false
+  }
+  // Expression shapes that commonly appear inside interpolations
+  const embeddedCode = [
+    /\$\{[^}]*\.(toString|padStart|padEnd|toFixed|toLocaleString)\s*\(/i,  // Method calls
+    /\$\{[^}]*\?\.[^}]*\}/,  // Optional chaining
+    /\$\{[^}]*\s*\?\s*[^:]+\s*:\s*[^}]+\}/,  // Ternary operators
+    /var\s*\(\s*\$\{/,  // CSS var() with template
+    /\$\{[^}]*\.find\s*\(/i,  // Array methods
+    /\$\{[^}]*\.map\s*\(/i,
+    /\$\{[^}]*\.filter\s*\(/i,
+    /\$\{new\s+Date\(\)/i,  // Date formatting
+  ]
+  for (const shape of embeddedCode) {
+    if (shape.test(lineContent)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a string reads like prose or markdown.
+ *
+ * Strings shorter than 30 characters are never classified as readable.
+ * Otherwise the string qualifies when it contains a markdown marker, or when
+ * more than half of its whitespace-separated tokens look like words.
+ *
+ * @param str - Candidate string value.
+ * @returns true for markdown-looking or mostly word-like text.
+ */
+function isHumanReadableContent(str: string): boolean {
+  if (str.length < 30) return false
+  // Any markdown marker is enough on its own
+  const markdownIndicators = ['## ', '# ', '**', '- [ ]', '- ', '\n\n', '\\n']
+  for (const marker of markdownIndicators) {
+    if (str.includes(marker)) return true
+  }
+  // Otherwise measure the share of word-shaped tokens
+  const tokens = str.split(/\s+/).filter(token => token.length > 0)
+  if (tokens.length === 0) return false
+  let wordLike = 0
+  for (const token of tokens) {
+    // A letter, then letters/digits/apostrophes/hyphens, then optional punctuation
+    if (/^[a-zA-Z][a-zA-Z0-9'-]*[:.!?,]?$/.test(token)) wordLike += 1
+  }
+  return wordLike / tokens.length > 0.5
+}
+/**
+ * Decide whether the line carries a UI/display string (model names,
+ * descriptions, labels and the like).
+ *
+ * Only `lineContent` is inspected; `str` is accepted but not read.
+ *
+ * @param str - Candidate string value (unused).
+ * @param lineContent - The source line the value was found on.
+ * @returns true when the line matches any display-string pattern.
+ */
+function isUIString(str: string, lineContent: string): boolean {
+  const displayHints = [
+    // Quoted text mentioning model names or usage descriptions
+    /['"`].*Claude.*['"`]/i,
+    /['"`].*GPT.*['"`]/i,
+    /['"`].*Sonnet.*['"`]/i,
+    /['"`].*for\s+(chat|embeddings|completion).*['"`]/i,
+    /['"`]Uses\s+/i,
+    /['"`]Note:\s*/i,
+    // Property names typical of display text, followed by a quote or colon
+    /placeholder['"`:]/i,
+    /description['"`:]/i,
+    /label['"`:]/i,
+    /title['"`:]/i,
+    /message['"`:]/i,
+    /tooltip['"`:]/i,
+  ]
+  for (const hint of displayHints) {
+    if (hint.test(lineContent)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a line sits in a React/JSX display context (component
+ * props, text children, UI component tags, display formatting).
+ *
+ * @param lineContent - The source line to inspect.
+ * @returns true when the line matches any JSX/UI pattern.
+ */
+function isJSXUIContext(lineContent: string): boolean {
+  const uiContextHints = [
+    // Component props (common UI props)
+    /\b(placeholder|title|label|message|description|tooltip|alt|aria-label|name|id|className|testId|data-testid)\s*=\s*['"`]/i,
+    // JSX text children (text between tags)
+    />\s*['"`][^<]*['"`]\s*</,
+    // Common UI component names
+    /<(Button|Text|Label|Title|Heading|Paragraph|Span|Input|Tooltip|Badge|Alert|Toast)/i,
+    // Return statement with JSX template literal
+    /return\s+`[^`]*\$\{/,
+    // Template literals used for display
+    /['"`]Synced\s+/i,
+    /['"`]\d+\s*(h|hr|hour|m|min|minute|s|sec|second)s?\s+ago['"`]/i,
+    // Display formatting patterns
+    /\.toLocaleString\s*\(|\.toFixed\s*\(|\.padStart\s*\(/,
+  ]
+  for (const hint of uiContextHints) {
+    if (hint.test(lineContent)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a string is natural-language text, judged by the share of
+ * common English words among its tokens.
+ *
+ * Strings shorter than 25 characters, or with fewer than three tokens of
+ * two or more characters, are never classified as natural language.
+ *
+ * @param str - Candidate string value.
+ * @returns true when more than 30% of the tokens are common English words.
+ */
+function isNaturalLanguage(str: string): boolean {
+  if (str.length < 25) return false
+  // Vocabulary of frequent English words (plus a few UI status words)
+  const vocabulary = new Set([
+    'the', 'a', 'an', 'is', 'are', 'was', 'were', 'be', 'been', 'being',
+    'have', 'has', 'had', 'do', 'does', 'did', 'will', 'would', 'could',
+    'should', 'may', 'might', 'must', 'shall', 'can', 'need', 'to', 'of',
+    'in', 'for', 'on', 'with', 'at', 'by', 'from', 'up', 'about', 'into',
+    'through', 'during', 'before', 'after', 'above', 'below', 'between',
+    'under', 'again', 'further', 'then', 'once', 'here', 'there', 'when',
+    'where', 'why', 'how', 'all', 'each', 'few', 'more', 'most', 'other',
+    'some', 'such', 'no', 'nor', 'not', 'only', 'own', 'same', 'so', 'than',
+    'too', 'very', 'just', 'also', 'now', 'and', 'but', 'or', 'if', 'as',
+    'your', 'you', 'this', 'that', 'it', 'they', 'we', 'he', 'she', 'my',
+    'their', 'our', 'his', 'her', 'its', 'ago', 'synced', 'updated', 'created',
+  ])
+  // Lower-case tokens; single-character tokens are ignored
+  const tokens = str.toLowerCase().split(/\s+/).filter(token => token.length > 1)
+  if (tokens.length < 3) return false
+  let known = 0
+  for (const token of tokens) {
+    // Strip everything but a-z before the lookup (punctuation, digits)
+    if (vocabulary.has(token.replace(/[^a-z]/g, ''))) known += 1
+  }
+  return known / tokens.length > 0.3
+}
+/**
+ * Decide whether a string is a list of CSS/Tailwind utility classes.
+ *
+ * The string is lower-cased and split on whitespace; a token counts as
+ * CSS-like when it contains any of the indicator fragments as a substring.
+ *
+ * @param str - Candidate string value.
+ * @returns true when at least one token is CSS-like and such tokens make up
+ *          more than 30% of all tokens.
+ */
+function isCSSClasses(str: string): boolean {
+  // Fragments of common utility-class names and variant prefixes
+  const classFragments = [
+    'flex', 'grid', 'block', 'inline', 'hidden',
+    'items-', 'justify-', 'gap-', 'space-',
+    'text-', 'font-', 'bg-', 'border-', 'rounded',
+    'px-', 'py-', 'pt-', 'pb-', 'pl-', 'pr-', 'p-',
+    'mx-', 'my-', 'mt-', 'mb-', 'ml-', 'mr-', 'm-',
+    'w-', 'h-', 'min-', 'max-',
+    'hover:', 'focus:', 'active:', 'disabled:',
+    'sm:', 'md:', 'lg:', 'xl:', '2xl:',
+    'dark:', 'light:',
+    'transition', 'duration-', 'ease-',
+    'absolute', 'relative', 'fixed', 'sticky',
+    'top-', 'bottom-', 'left-', 'right-',
+    'z-', 'overflow-', 'opacity-',
+    'ring-', 'shadow-', 'outline-',
+  ]
+  const classNames = str.toLowerCase().split(/\s+/)
+  let cssLike = 0
+  for (const className of classNames) {
+    if (classFragments.some(fragment => className.includes(fragment))) cssLike += 1
+  }
+  if (cssLike === 0) return false
+  return cssLike / classNames.length > 0.3
+}
+/**
+ * Decide whether a line belongs to CSS-in-JS code (styled-components,
+ * emotion and similar).
+ *
+ * @param lineContent - The source line to inspect.
+ * @returns true when the line matches any CSS-in-JS marker.
+ */
+function isCSSInJS(lineContent: string): boolean {
+  const cssInJsMarkers = [
+    /styled\./,                           // styled.div, styled.button
+    /styled\(/,                           // styled(Component)
+    /css`/,                               // css`` template literal
+    /keyframes`/,                         // keyframes`` template literal
+    /@emotion/,                           // @emotion imports
+    /createGlobalStyle/,                  // styled-components global
+    /\$\{\s*props\s*=>/,                  // ${props => ...} in styled
+    /\$\{\s*\(\s*\{/,                     // ${({ theme }) => ...}
+  ]
+  for (const marker of cssInJsMarkers) {
+    if (marker.test(lineContent)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a path points at documentation rather than source code.
+ *
+ * A path qualifies when:
+ *  - its final segment is one of the conventional documentation file names
+ *    (README, CHANGELOG, LICENSE, ...), compared case-insensitively; or
+ *  - it ends in a documentation extension (.md, .mdx, .rst, .adoc, .txt); or
+ *  - it contains a documentation-style directory (/docs/, /wiki/, ...).
+ *
+ * The file names are matched against the final path segment only. Testing
+ * them as substrings of the whole path would also classify source files such
+ * as `src/security/auth.ts` or `history.service.ts` as documentation and
+ * exclude them from scanning. Named files carrying other suffixes (for
+ * example `LICENSE-MIT`) are therefore only matched through the extension
+ * and directory rules.
+ *
+ * @param filePath - Path of the file being scanned.
+ * @returns true when the path looks like documentation.
+ */
+function isDocumentationFile(filePath: string): boolean {
+  // Final path segment; both "/" and "\" are treated as separators
+  const segments = filePath.split(/[\\/]/)
+  const baseName = segments[segments.length - 1]
+  const docFileNames = /^(README|CHANGELOG|CONTRIBUTING|LICENSE|CODE_OF_CONDUCT|SECURITY|AUTHORS|HISTORY)$/i
+  if (docFileNames.test(baseName)) return true
+  const docPatterns = [
+    /\.md$/i,
+    /\.mdx$/i,
+    /\.rst$/i,        // reStructuredText
+    /\.adoc$/i,       // AsciiDoc
+    /\.txt$/i,        // Plain text docs
+    /\/docs\//i,
+    /\/documentation\//i,
+    /\/wiki\//i,
+    /\/guides?\//i,
+    /\/tutorials?\//i,
+    /\/examples?\//i,  // Example directories often have sample configs
+  ]
+  return docPatterns.some(p => p.test(filePath))
+}
+/**
+ * Decide whether a line is a logging/debug statement.
+ *
+ * @param lineContent - The source line to inspect.
+ * @returns true for console.* / logger.* calls and for bracketed text
+ *          containing "Debug" or "Log" (case-insensitive).
+ */
+function isDebugLogContent(lineContent: string): boolean {
+  const loggingMarkers = [
+    /console\.(log|debug|info|warn|error)\s*\(/i,
+    /logger\.(log|debug|info|warn|error)\s*\(/i,
+    /\[.*Debug.*\]/i,
+    /\[.*Log.*\]/i,
+  ]
+  for (const marker of loggingMarkers) {
+    if (marker.test(lineContent)) return true
+  }
+  return false
+}
+/**
+ * Decide whether a line contains inline styling, in JSX or in HTML.
+ *
+ * @param lineContent - The source line to inspect.
+ * @returns true when any JSX or HTML inline-style pattern matches.
+ */
+function isInlineStyle(lineContent: string): boolean {
+  // JSX: style objects and gradient/background class names
+  const jsxStyleMarkers = [
+    /style\s*=\s*\{\{/,                    // style={{...}}
+    /style\s*=\s*\{[^}]*:/,                // style={{ color: ... }}
+    /className\s*=\s*["`'][^"`']*gradient/i, // gradient classes
+    /className\s*=\s*["`'][^"`']*bg-/i,     // bg- classes
+  ]
+  // HTML: style attributes, <style> tags and gradient backgrounds
+  const htmlStyleMarkers = [
+    /style\s*=\s*["'][^"']*:/,             // style="color: ..."
+    /<style[^>]*>/i,                        // <style> tags
+    /background:\s*linear-gradient/i,       // CSS gradients
+    /background:\s*radial-gradient/i,       // Radial gradients
+  ]
+  const matchesLine = (marker: RegExp) => marker.test(lineContent)
+  return jsxStyleMarkers.some(matchesLine) || htmlStyleMarkers.some(matchesLine)
+}
+/**
+ * Decide whether a string contains CSS tokens (units, colours, functions).
+ *
+ * A single strong indicator (a standalone hex colour, a gradient call, or an
+ * rgb/hsl call with a number) is sufficient. Otherwise at least two of the
+ * weaker token patterns must match.
+ *
+ * @param str - Candidate string value.
+ * @returns true when the string is confidently CSS.
+ */
+function hasCSSTokens(str: string): boolean {
+  // Strong indicators: one match settles it
+  const decisiveMarkers = [
+    /^#[0-9a-f]{6}$/i,           // Standalone 6-digit hex color
+    /^#[0-9a-f]{8}$/i,           // Standalone 8-digit hex color with alpha
+    /linear-gradient\s*\(/,      // Gradient function
+    /radial-gradient\s*\(/,
+    /conic-gradient\s*\(/,
+    /rgba?\s*\(\s*\d/,           // rgb/rgba with numbers
+    /hsla?\s*\(\s*\d/,           // hsl/hsla with numbers
+  ]
+  for (const marker of decisiveMarkers) {
+    if (marker.test(str)) return true
+  }
+  // Weaker tokens: each matching pattern counts once
+  const weakMarkers = [
+    // CSS units
+    /\d+px\b/, /\d+%\b/, /\d+em\b/, /\d+rem\b/, /\d+deg\b/, /\d+vh\b/, /\d+vw\b/,
+    // Hex colors (standalone or in context)
+    /#[0-9a-f]{3,8}\b/i,
+    // CSS color functions
+    /rgb\s*\(/, /rgba\s*\(/, /hsl\s*\(/, /hsla\s*\(/,
+    /oklab\s*\(/, /oklch\s*\(/, /lab\s*\(/, /lch\s*\(/,  // Modern color functions
+    // CSS gradients (all types)
+    /linear-gradient/, /radial-gradient/, /conic-gradient/,
+    /repeating-linear-gradient/, /repeating-radial-gradient/,
+    // Gradient direction keywords (Tailwind-style)
+    /\bfrom-/, /\bto-/, /\bvia-/,
+    // CSS custom properties
+    /var\s*\(--/,
+    // Common CSS properties
+    /\bopacity\s*:\s*[\d.]+/,
+    /\btransform\s*:/,
+    /\btransition\s*:/,
+    /\banimation\s*:/,
+    // Box shadow patterns
+    /\bshadow-/, /box-shadow/,
+    /\d+px\s+\d+px\s+\d+px/,  // Shadow offset pattern
+    // Color stops in gradients
+    /\b\d+%\s*(,|$)/,  // Percentage color stops
+  ]
+  const weakHits = weakMarkers.reduce(
+    (hits, marker) => (marker.test(str) ? hits + 1 : hits),
+    0
+  )
+  // Two or more weak tokens are needed to be confident
+  return weakHits >= 2
+}
+/**
+ * Decide whether a value or its line refers to environment-variable
+ * placeholders, as seen in shell scripts and test files.
+ *
+ * Shell-style references are looked for on the line only; the placeholder
+ * names are looked for in both the value and the line.
+ *
+ * @param lineContent - The source line the value was found on.
+ * @param value - Candidate string value.
+ * @returns true when any placeholder pattern matches.
+ */
+function isEnvVarPlaceholder(lineContent: string, value: string): boolean {
+  // Shell-style variable references
+  const shellReferences = [
+    /\$[A-Z_][A-Z0-9_]*/,              // $VAR_NAME
+    /\$\{[A-Z_][A-Z0-9_]*\}/,          // ${VAR_NAME}
+    /\bexport\s+[A-Z_][A-Z0-9_]*=["']?\$/,  // export VAR=$OTHER
+    /:\s*\$\{[A-Z_][A-Z0-9_]*:-/,      // ${VAR:-default}
+  ]
+  // Placeholder names commonly used in test files
+  const placeholderNames = [
+    /FREE_KEY|PRO_KEY|ULTRA_KEY|TEST_KEY/i,
+    /BASE_URL|API_URL|ENDPOINT_URL/i,
+    /YOUR_[A-Z_]*KEY|REPLACE_[A-Z_]*KEY/i,
+    /\$\{?\w+\}?_KEY|\$\{?\w+\}?_TOKEN/i,  // $SOME_KEY, ${SOME_TOKEN}
+  ]
+  if (shellReferences.some(matcher => matcher.test(lineContent))) return true
+  if (placeholderNames.some(matcher => matcher.test(value))) return true
+  return placeholderNames.some(matcher => matcher.test(lineContent))
+}
+/**
+ * Scan file content for high-entropy string literals that may be hardcoded
+ * secrets.
+ *
+ * Files recognised as scanner/fixture, example or documentation files yield
+ * no findings. Within a scanned file, each extracted literal is passed
+ * through a series of exclusion checks (comments, PEM markers, encrypted
+ * payloads, JWTs, CSS, env-var placeholders, safe shapes, log statements,
+ * regexes, templates, prose and UI text); only literals that survive all of
+ * them are measured.
+ *
+ * @param content - Full text of the file.
+ * @param filePath - Path of the file; used for the skip rules, the finding id
+ *                   and the test-file downgrade.
+ * @returns One finding per literal that passes the entropy threshold, has at
+ *          least two character classes and does not look like CSS.
+ */
+export function detectHighEntropyStrings(
+  content: string,
+  filePath: string
+): Vulnerability[] {
+  const findings: Vulnerability[] = []
+  // File-level skips, in order: scanner/fixture files (self-detection),
+  // fixture files, example files, example directories, documentation
+  if (
+    isScannerOrFixtureFile(filePath) ||
+    isFixtureFile(filePath) ||
+    isExampleFile(filePath) ||
+    isExampleDirectory(filePath) ||
+    isDocumentationFile(filePath)
+  ) {
+    return findings
+  }
+  for (const literal of extractStringLiterals(content)) {
+    const { value, line, lineContent } = literal
+    // Exclusion checks, evaluated left to right and stopping at the first hit
+    const isBenign =
+      isComment(lineContent) ||                   // comments
+      isPEMHeader(value) ||                       // PEM headers/footers
+      isEncryptedContent(value, lineContent) ||   // encrypted payloads, not keys
+      isJWTSegment(value) ||                      // JWTs (handled by patterns.ts)
+      isInlineStyle(lineContent) ||               // style={{...}} or style="..."
+      hasCSSTokens(value) ||                      // colors, gradients, units
+      isEnvVarPlaceholder(lineContent, value) ||  // shell/test placeholders
+      isSafePattern(value) ||                     // URLs, paths, hashes, ...
+      isCSSClasses(value) ||                      // CSS/Tailwind class lists
+      isCSSInJS(lineContent) ||                   // styled-components, emotion
+      isDebugLogContent(lineContent) ||           // log statements
+      isRegexPattern(value) ||                    // regex/route matchers
+      isTemplateWithCode(value, lineContent) ||   // templates with expressions
+      isHumanReadableContent(value) ||            // prose/markdown
+      isUIString(value, lineContent) ||           // model names, descriptions
+      isJSXUIContext(lineContent) ||              // JSX props and text
+      isNaturalLanguage(value)                    // common English words
+    if (isBenign) continue
+    const entropy = calculateEntropy(value)
+    // Findings in test files are reported with lower severity and confidence
+    const inTestFile = isTestOrMockFile(filePath)
+    // Two thresholds:
+    // - entropy > 4.5 for strings > 20 chars (standard)
+    // - entropy > 4.2 for strings 16-20 chars
+    // extractStringLiterals only yields literals of 20+ characters, so the
+    // second clause applies to values of exactly 20 characters.
+    const passesLongRule = value.length > 20 && entropy > 4.5
+    const passesShortRule = value.length >= 16 && value.length <= 20 && entropy > 4.2
+    if (!passesLongRule && !passesShortRule) continue
+    // Require a mix of character classes: lower, upper, digit, other
+    const characterClasses = [/[a-z]/, /[A-Z]/, /[0-9]/, /[^a-zA-Z0-9]/]
+    const classCount = characterClasses.filter(cls => cls.test(value)).length
+    if (classCount < 2) continue
+    // Final check: skip CSS-like strings that passed earlier filters
+    if (/gradient|rgba?|hsla?|#[0-9a-f]{3,8}/i.test(value)) continue
+    const entropyLevel = entropy > 5.0 ? 'high' : 'medium'
+    const severity = inTestFile ? 'low' : entropyLevel
+    const confidence = inTestFile ? 'low' : entropyLevel
+    findings.push({
+      id: `entropy-${filePath}-${line}`,
+      filePath,
+      lineNumber: line,
+      lineContent,
+      severity,
+      category: 'high_entropy_string',
+      title: 'Potential hardcoded secret detected',
+      description: `High-entropy string found (entropy: ${entropy.toFixed(2)}). This may be a hardcoded secret, API key, or password.${inTestFile ? ' (in test file)' : ''}`,
+      suggestedFix: 'Move this value to an environment variable and access it via process.env',
+      confidence,
+      layer: 1,
+      requiresAIValidation: true,  // Entropy findings must be validated by AI
+    })
+  }
+  return findings
+}