npm - @oculum/scanner - Versions diffs - 1.0.0 - Mend

@oculum/scanner 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (281) hide show

package/dist/formatters/cli-terminal.d.ts +27 -0
package/dist/formatters/cli-terminal.d.ts.map +1 -0
package/dist/formatters/cli-terminal.js +412 -0
package/dist/formatters/cli-terminal.js.map +1 -0
package/dist/formatters/github-comment.d.ts +41 -0
package/dist/formatters/github-comment.d.ts.map +1 -0
package/dist/formatters/github-comment.js +306 -0
package/dist/formatters/github-comment.js.map +1 -0
package/dist/formatters/grouping.d.ts +52 -0
package/dist/formatters/grouping.d.ts.map +1 -0
package/dist/formatters/grouping.js +152 -0
package/dist/formatters/grouping.js.map +1 -0
package/dist/formatters/index.d.ts +9 -0
package/dist/formatters/index.d.ts.map +1 -0
package/dist/formatters/index.js +35 -0
package/dist/formatters/index.js.map +1 -0
package/dist/formatters/vscode-diagnostic.d.ts +103 -0
package/dist/formatters/vscode-diagnostic.d.ts.map +1 -0
package/dist/formatters/vscode-diagnostic.js +151 -0
package/dist/formatters/vscode-diagnostic.js.map +1 -0
package/dist/index.d.ts +52 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +648 -0
package/dist/index.js.map +1 -0
package/dist/layer1/comments.d.ts +8 -0
package/dist/layer1/comments.d.ts.map +1 -0
package/dist/layer1/comments.js +203 -0
package/dist/layer1/comments.js.map +1 -0
package/dist/layer1/config-audit.d.ts +8 -0
package/dist/layer1/config-audit.d.ts.map +1 -0
package/dist/layer1/config-audit.js +252 -0
package/dist/layer1/config-audit.js.map +1 -0
package/dist/layer1/entropy.d.ts +8 -0
package/dist/layer1/entropy.d.ts.map +1 -0
package/dist/layer1/entropy.js +500 -0
package/dist/layer1/entropy.js.map +1 -0
package/dist/layer1/file-flags.d.ts +7 -0
package/dist/layer1/file-flags.d.ts.map +1 -0
package/dist/layer1/file-flags.js +112 -0
package/dist/layer1/file-flags.js.map +1 -0
package/dist/layer1/index.d.ts +36 -0
package/dist/layer1/index.d.ts.map +1 -0
package/dist/layer1/index.js +132 -0
package/dist/layer1/index.js.map +1 -0
package/dist/layer1/patterns.d.ts +8 -0
package/dist/layer1/patterns.d.ts.map +1 -0
package/dist/layer1/patterns.js +482 -0
package/dist/layer1/patterns.js.map +1 -0
package/dist/layer1/urls.d.ts +8 -0
package/dist/layer1/urls.d.ts.map +1 -0
package/dist/layer1/urls.js +296 -0
package/dist/layer1/urls.js.map +1 -0
package/dist/layer1/weak-crypto.d.ts +7 -0
package/dist/layer1/weak-crypto.d.ts.map +1 -0
package/dist/layer1/weak-crypto.js +291 -0
package/dist/layer1/weak-crypto.js.map +1 -0
package/dist/layer2/ai-agent-tools.d.ts +19 -0
package/dist/layer2/ai-agent-tools.d.ts.map +1 -0
package/dist/layer2/ai-agent-tools.js +528 -0
package/dist/layer2/ai-agent-tools.js.map +1 -0
package/dist/layer2/ai-endpoint-protection.d.ts +36 -0
package/dist/layer2/ai-endpoint-protection.d.ts.map +1 -0
package/dist/layer2/ai-endpoint-protection.js +332 -0
package/dist/layer2/ai-endpoint-protection.js.map +1 -0
package/dist/layer2/ai-execution-sinks.d.ts +18 -0
package/dist/layer2/ai-execution-sinks.d.ts.map +1 -0
package/dist/layer2/ai-execution-sinks.js +496 -0
package/dist/layer2/ai-execution-sinks.js.map +1 -0
package/dist/layer2/ai-fingerprinting.d.ts +7 -0
package/dist/layer2/ai-fingerprinting.d.ts.map +1 -0
package/dist/layer2/ai-fingerprinting.js +654 -0
package/dist/layer2/ai-fingerprinting.js.map +1 -0
package/dist/layer2/ai-prompt-hygiene.d.ts +19 -0
package/dist/layer2/ai-prompt-hygiene.d.ts.map +1 -0
package/dist/layer2/ai-prompt-hygiene.js +356 -0
package/dist/layer2/ai-prompt-hygiene.js.map +1 -0
package/dist/layer2/ai-rag-safety.d.ts +21 -0
package/dist/layer2/ai-rag-safety.d.ts.map +1 -0
package/dist/layer2/ai-rag-safety.js +459 -0
package/dist/layer2/ai-rag-safety.js.map +1 -0
package/dist/layer2/ai-schema-validation.d.ts +25 -0
package/dist/layer2/ai-schema-validation.d.ts.map +1 -0
package/dist/layer2/ai-schema-validation.js +375 -0
package/dist/layer2/ai-schema-validation.js.map +1 -0
package/dist/layer2/auth-antipatterns.d.ts +20 -0
package/dist/layer2/auth-antipatterns.d.ts.map +1 -0
package/dist/layer2/auth-antipatterns.js +333 -0
package/dist/layer2/auth-antipatterns.js.map +1 -0
package/dist/layer2/byok-patterns.d.ts +12 -0
package/dist/layer2/byok-patterns.d.ts.map +1 -0
package/dist/layer2/byok-patterns.js +299 -0
package/dist/layer2/byok-patterns.js.map +1 -0
package/dist/layer2/dangerous-functions.d.ts +7 -0
package/dist/layer2/dangerous-functions.d.ts.map +1 -0
package/dist/layer2/dangerous-functions.js +1375 -0
package/dist/layer2/dangerous-functions.js.map +1 -0
package/dist/layer2/data-exposure.d.ts +16 -0
package/dist/layer2/data-exposure.d.ts.map +1 -0
package/dist/layer2/data-exposure.js +279 -0
package/dist/layer2/data-exposure.js.map +1 -0
package/dist/layer2/framework-checks.d.ts +7 -0
package/dist/layer2/framework-checks.d.ts.map +1 -0
package/dist/layer2/framework-checks.js +388 -0
package/dist/layer2/framework-checks.js.map +1 -0
package/dist/layer2/index.d.ts +58 -0
package/dist/layer2/index.d.ts.map +1 -0
package/dist/layer2/index.js +380 -0
package/dist/layer2/index.js.map +1 -0
package/dist/layer2/logic-gates.d.ts +7 -0
package/dist/layer2/logic-gates.d.ts.map +1 -0
package/dist/layer2/logic-gates.js +182 -0
package/dist/layer2/logic-gates.js.map +1 -0
package/dist/layer2/risky-imports.d.ts +7 -0
package/dist/layer2/risky-imports.d.ts.map +1 -0
package/dist/layer2/risky-imports.js +161 -0
package/dist/layer2/risky-imports.js.map +1 -0
package/dist/layer2/variables.d.ts +8 -0
package/dist/layer2/variables.d.ts.map +1 -0
package/dist/layer2/variables.js +152 -0
package/dist/layer2/variables.js.map +1 -0
package/dist/layer3/anthropic.d.ts +83 -0
package/dist/layer3/anthropic.d.ts.map +1 -0
package/dist/layer3/anthropic.js +1745 -0
package/dist/layer3/anthropic.js.map +1 -0
package/dist/layer3/index.d.ts +24 -0
package/dist/layer3/index.d.ts.map +1 -0
package/dist/layer3/index.js +119 -0
package/dist/layer3/index.js.map +1 -0
package/dist/layer3/openai.d.ts +25 -0
package/dist/layer3/openai.d.ts.map +1 -0
package/dist/layer3/openai.js +238 -0
package/dist/layer3/openai.js.map +1 -0
package/dist/layer3/package-check.d.ts +63 -0
package/dist/layer3/package-check.d.ts.map +1 -0
package/dist/layer3/package-check.js +508 -0
package/dist/layer3/package-check.js.map +1 -0
package/dist/modes/incremental.d.ts +66 -0
package/dist/modes/incremental.d.ts.map +1 -0
package/dist/modes/incremental.js +200 -0
package/dist/modes/incremental.js.map +1 -0
package/dist/tiers.d.ts +125 -0
package/dist/tiers.d.ts.map +1 -0
package/dist/tiers.js +234 -0
package/dist/tiers.js.map +1 -0
package/dist/types.d.ts +175 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +50 -0
package/dist/types.js.map +1 -0
package/dist/utils/auth-helper-detector.d.ts +56 -0
package/dist/utils/auth-helper-detector.d.ts.map +1 -0
package/dist/utils/auth-helper-detector.js +360 -0
package/dist/utils/auth-helper-detector.js.map +1 -0
package/dist/utils/context-helpers.d.ts +96 -0
package/dist/utils/context-helpers.d.ts.map +1 -0
package/dist/utils/context-helpers.js +493 -0
package/dist/utils/context-helpers.js.map +1 -0
package/dist/utils/diff-detector.d.ts +53 -0
package/dist/utils/diff-detector.d.ts.map +1 -0
package/dist/utils/diff-detector.js +104 -0
package/dist/utils/diff-detector.js.map +1 -0
package/dist/utils/diff-parser.d.ts +80 -0
package/dist/utils/diff-parser.d.ts.map +1 -0
package/dist/utils/diff-parser.js +202 -0
package/dist/utils/diff-parser.js.map +1 -0
package/dist/utils/imported-auth-detector.d.ts +37 -0
package/dist/utils/imported-auth-detector.d.ts.map +1 -0
package/dist/utils/imported-auth-detector.js +251 -0
package/dist/utils/imported-auth-detector.js.map +1 -0
package/dist/utils/middleware-detector.d.ts +55 -0
package/dist/utils/middleware-detector.d.ts.map +1 -0
package/dist/utils/middleware-detector.js +260 -0
package/dist/utils/middleware-detector.js.map +1 -0
package/dist/utils/oauth-flow-detector.d.ts +41 -0
package/dist/utils/oauth-flow-detector.d.ts.map +1 -0
package/dist/utils/oauth-flow-detector.js +202 -0
package/dist/utils/oauth-flow-detector.js.map +1 -0
package/dist/utils/path-exclusions.d.ts +55 -0
package/dist/utils/path-exclusions.d.ts.map +1 -0
package/dist/utils/path-exclusions.js +222 -0
package/dist/utils/path-exclusions.js.map +1 -0
package/dist/utils/project-context-builder.d.ts +119 -0
package/dist/utils/project-context-builder.d.ts.map +1 -0
package/dist/utils/project-context-builder.js +534 -0
package/dist/utils/project-context-builder.js.map +1 -0
package/dist/utils/registry-clients.d.ts +93 -0
package/dist/utils/registry-clients.d.ts.map +1 -0
package/dist/utils/registry-clients.js +273 -0
package/dist/utils/registry-clients.js.map +1 -0
package/dist/utils/trpc-analyzer.d.ts +78 -0
package/dist/utils/trpc-analyzer.d.ts.map +1 -0
package/dist/utils/trpc-analyzer.js +297 -0
package/dist/utils/trpc-analyzer.js.map +1 -0
package/package.json +45 -0
package/src/__tests__/benchmark/fixtures/false-positives.ts +227 -0
package/src/__tests__/benchmark/fixtures/index.ts +68 -0
package/src/__tests__/benchmark/fixtures/layer1/config-audit.ts +364 -0
package/src/__tests__/benchmark/fixtures/layer1/hardcoded-secrets.ts +173 -0
package/src/__tests__/benchmark/fixtures/layer1/high-entropy.ts +234 -0
package/src/__tests__/benchmark/fixtures/layer1/index.ts +31 -0
package/src/__tests__/benchmark/fixtures/layer1/sensitive-urls.ts +90 -0
package/src/__tests__/benchmark/fixtures/layer1/weak-crypto.ts +197 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-agent-tools.ts +170 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-endpoint-protection.ts +418 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-execution-sinks.ts +189 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-fingerprinting.ts +316 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-prompt-hygiene.ts +178 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-rag-safety.ts +184 -0
package/src/__tests__/benchmark/fixtures/layer2/ai-schema-validation.ts +434 -0
package/src/__tests__/benchmark/fixtures/layer2/auth-antipatterns.ts +159 -0
package/src/__tests__/benchmark/fixtures/layer2/byok-patterns.ts +112 -0
package/src/__tests__/benchmark/fixtures/layer2/dangerous-functions.ts +246 -0
package/src/__tests__/benchmark/fixtures/layer2/data-exposure.ts +168 -0
package/src/__tests__/benchmark/fixtures/layer2/framework-checks.ts +346 -0
package/src/__tests__/benchmark/fixtures/layer2/index.ts +67 -0
package/src/__tests__/benchmark/fixtures/layer2/injection-vulnerabilities.ts +239 -0
package/src/__tests__/benchmark/fixtures/layer2/logic-gates.ts +246 -0
package/src/__tests__/benchmark/fixtures/layer2/risky-imports.ts +231 -0
package/src/__tests__/benchmark/fixtures/layer2/variables.ts +167 -0
package/src/__tests__/benchmark/index.ts +29 -0
package/src/__tests__/benchmark/run-benchmark.ts +144 -0
package/src/__tests__/benchmark/run-depth-validation.ts +206 -0
package/src/__tests__/benchmark/run-real-world-test.ts +243 -0
package/src/__tests__/benchmark/security-benchmark-script.ts +1737 -0
package/src/__tests__/benchmark/tier-integration-script.ts +177 -0
package/src/__tests__/benchmark/types.ts +144 -0
package/src/__tests__/benchmark/utils/test-runner.ts +475 -0
package/src/__tests__/regression/known-false-positives.test.ts +467 -0
package/src/__tests__/snapshots/__snapshots__/scan-depth.test.ts.snap +178 -0
package/src/__tests__/snapshots/scan-depth.test.ts +258 -0
package/src/__tests__/validation/analyze-results.ts +542 -0
package/src/__tests__/validation/extract-for-triage.ts +146 -0
package/src/__tests__/validation/fp-deep-analysis.ts +327 -0
package/src/__tests__/validation/run-validation.ts +364 -0
package/src/__tests__/validation/triage-template.md +132 -0
package/src/formatters/cli-terminal.ts +446 -0
package/src/formatters/github-comment.ts +382 -0
package/src/formatters/grouping.ts +190 -0
package/src/formatters/index.ts +47 -0
package/src/formatters/vscode-diagnostic.ts +243 -0
package/src/index.ts +823 -0
package/src/layer1/comments.ts +218 -0
package/src/layer1/config-audit.ts +289 -0
package/src/layer1/entropy.ts +583 -0
package/src/layer1/file-flags.ts +127 -0
package/src/layer1/index.ts +181 -0
package/src/layer1/patterns.ts +516 -0
package/src/layer1/urls.ts +334 -0
package/src/layer1/weak-crypto.ts +328 -0
package/src/layer2/ai-agent-tools.ts +601 -0
package/src/layer2/ai-endpoint-protection.ts +387 -0
package/src/layer2/ai-execution-sinks.ts +580 -0
package/src/layer2/ai-fingerprinting.ts +758 -0
package/src/layer2/ai-prompt-hygiene.ts +411 -0
package/src/layer2/ai-rag-safety.ts +511 -0
package/src/layer2/ai-schema-validation.ts +421 -0
package/src/layer2/auth-antipatterns.ts +394 -0
package/src/layer2/byok-patterns.ts +336 -0
package/src/layer2/dangerous-functions.ts +1563 -0
package/src/layer2/data-exposure.ts +315 -0
package/src/layer2/framework-checks.ts +433 -0
package/src/layer2/index.ts +473 -0
package/src/layer2/logic-gates.ts +206 -0
package/src/layer2/risky-imports.ts +186 -0
package/src/layer2/variables.ts +166 -0
package/src/layer3/anthropic.ts +2030 -0
package/src/layer3/index.ts +130 -0
package/src/layer3/package-check.ts +604 -0
package/src/modes/incremental.ts +293 -0
package/src/tiers.ts +318 -0
package/src/types.ts +284 -0
package/src/utils/auth-helper-detector.ts +443 -0
package/src/utils/context-helpers.ts +535 -0
package/src/utils/diff-detector.ts +135 -0
package/src/utils/diff-parser.ts +272 -0
package/src/utils/imported-auth-detector.ts +320 -0
package/src/utils/middleware-detector.ts +333 -0
package/src/utils/oauth-flow-detector.ts +246 -0
package/src/utils/path-exclusions.ts +266 -0
package/src/utils/project-context-builder.ts +707 -0
package/src/utils/registry-clients.ts +351 -0
package/src/utils/trpc-analyzer.ts +382 -0

package/src/__tests__/validation/analyze-results.ts ADDED Viewed

@@ -0,0 +1,542 @@
+#!/usr/bin/env npx tsx
+/**
+ * M7: Results Analysis Script
+ *
+ * Analyzes scan results from real-repo validation and generates
+ * summary metrics for documentation.
+ *
+ * Usage:
+ *   npx tsx packages/scanner/src/__tests__/validation/analyze-results.ts
+ *   npx tsx packages/scanner/src/__tests__/validation/analyze-results.ts --output docs/RESULTSCOMPARISON.md
+ */
+import * as fs from 'fs'
+import * as path from 'path'
+import type { ScanResult, Vulnerability, VulnerabilityCategory, VulnerabilitySeverity } from '../../types'
+const RESULTS_DIR = path.join(__dirname, '../../../validation-results') // resolved relative to this script's directory; loadResults() reads the result JSON files from here
+// M5 AI-era categories we're specifically validating. Only findings in these
+// categories feed the per-detector M5 summaries; every other category is
+// counted solely in the generic severity/category tallies.
+const M5_CATEGORIES: VulnerabilityCategory[] = [
+  'ai_rag_exfiltration',
+  'ai_endpoint_unprotected',
+  'ai_schema_mismatch',
+  'ai_prompt_injection',
+  'ai_unsafe_execution',
+  'ai_overpermissive_tool',
+]
+interface FindingSummary { // roll-up of one M5 category's findings within a single scan result
+  category: VulnerabilityCategory // the M5 category being summarized
+  count: number // number of findings in this category
+  bySeverity: Record<VulnerabilitySeverity, number> // finding count per severity level
+  examples: Array<{ // sample findings; analyzeResult keeps at most the first 5
+    file: string // copied from the vulnerability's filePath
+    line: number // copied from the vulnerability's lineNumber
+    title: string // copied from the vulnerability's title
+    severity: VulnerabilitySeverity // copied from the vulnerability's severity
+  }>
+}
+interface RepoAnalysis { // metrics computed by analyzeResult for one result file (one repo at one scan depth)
+  repoName: string // repository part of the result key
+  scanDepth: string // scan-depth part of the result key
+  totalFindings: number // length of the result's vulnerabilities array
+  mediumPlusFindings: number // critical + high + medium counts
+  filesScanned: number // copied from the scan result
+  scanDuration: number // copied from the scan result; the markdown report prints it with an "ms" suffix
+  bySeverity: Record<VulnerabilitySeverity, number> // finding count per severity level
+  byCategory: Record<string, number> // finding count per category (all categories, not only M5)
+  m5Findings: FindingSummary[] // only M5 categories with at least one finding, sorted by count descending
+  topCategories: Array<{ category: string; count: number }> // up to 10 categories, highest count first
+  libraryCodeFindings: number // findings whose path classifyFilePath labels 'library'
+  exampleCodeFindings: number // findings whose path classifyFilePath labels 'example'
+  testCodeFindings: number // findings whose path classifyFilePath labels 'test'; 'other' paths are not counted anywhere
+}
+interface ValidationReport { // top-level report assembled in main() and consumed by both output formats
+  generatedAt: string // ISO timestamp produced with Date#toISOString
+  totalRepos: number // number of distinct repoName values across analyses
+  totalScans: number // number of analyses (one per result file)
+  analyses: RepoAnalysis[] // one entry per loaded result file
+  aggregateMetrics: { // totals computed by computeAggregateMetrics
+    totalFindings: number // sum of totalFindings over all analyses
+    totalMediumPlus: number // sum of mediumPlusFindings over all analyses
+    avgFindingsPerRepo: number // rounded totalFindings / number of analyses (0 when there are none)
+    m5DetectorPerformance: Record<string, { total: number; mediumPlus: number }> // keyed by M5 category name
+  }
+}
+/**
+ * Classify file path as library internal, example, or test code
+ *
+ * Matching is case-insensitive and evaluated in priority order: test markers
+ * first, then example/demo markers, then library markers. Backslashes are
+ * converted to forward slashes and a leading '/' is assumed, so relative
+ * paths (`tests/foo.ts`) and Windows paths (`src\utils\a.ts`) hit the
+ * directory markers as well.
+ *
+ * @param filePath - Path of the file a finding was reported in
+ * @returns 'test', 'example' or 'library' for the first marker group that
+ *          matches, otherwise 'other'
+ */
+function classifyFilePath(filePath: string): 'library' | 'example' | 'test' | 'other' {
+  // Directory markers are written as '/name/'; normalize the path so a marker
+  // directory in first position or behind a backslash is still recognized.
+  const forwardSlashed = filePath.toLowerCase().replace(/\\/g, '/')
+  const lowerPath = forwardSlashed.startsWith('/') ? forwardSlashed : `/${forwardSlashed}`
+  const containsAny = (markers: string[]): boolean =>
+    markers.some(marker => lowerPath.includes(marker))
+  // Test files
+  if (containsAny(['__tests__', '/test/', '/tests/', '.test.', '.spec.', '_test.', '/fixtures/'])) {
+    return 'test'
+  }
+  // Example/demo files
+  if (containsAny(['/examples/', '/example/', '/demos/', '/demo/', '/templates/', '/cookbook/'])) {
+    return 'example'
+  }
+  // Library internal code
+  if (containsAny(['/src/', '/lib/', '/libs/', '/packages/'])) {
+    return 'library'
+  }
+  return 'other'
+}
+/**
+ * Load scan results from JSON files
+ *
+ * Reads every `*.json` file in RESULTS_DIR whose name does not contain
+ * 'medium-plus' and parses it as a ScanResult. Prints an error and exits the
+ * process with code 1 when the directory is missing or holds no result files.
+ *
+ * @returns Map from file name (without its trailing `.json`) to the parsed result
+ * @throws Error naming the offending file when its contents are not valid JSON
+ */
+function loadResults(): Map<string, ScanResult> {
+  const results = new Map<string, ScanResult>()
+  if (!fs.existsSync(RESULTS_DIR)) {
+    console.error(`Results directory not found: ${RESULTS_DIR}`)
+    console.error('Run run-validation.ts first to generate results.')
+    process.exit(1)
+  }
+  // NOTE(review): 'medium-plus' files are presumably derived exports rather
+  // than raw scan results — confirm against whatever writes them.
+  const files = fs.readdirSync(RESULTS_DIR).filter(f =>
+    f.endsWith('.json') && !f.includes('medium-plus')
+  )
+  if (files.length === 0) {
+    console.error('No result files found in', RESULTS_DIR)
+    console.error('Run run-validation.ts first to generate results.')
+    process.exit(1)
+  }
+  for (const file of files) {
+    const filePath = path.join(RESULTS_DIR, file)
+    const content = fs.readFileSync(filePath, 'utf-8')
+    let result: ScanResult
+    try {
+      result = JSON.parse(content) as ScanResult
+    } catch (err) {
+      // Surface which file is corrupt instead of a bare SyntaxError
+      const reason = err instanceof Error ? err.message : String(err)
+      throw new Error(`Failed to parse result file ${filePath}: ${reason}`)
+    }
+    // Strip only the trailing extension; String.replace would remove the
+    // first '.json' found anywhere in the name.
+    const key = path.basename(file, '.json')
+    results.set(key, result)
+  }
+  return results
+}
+/**
+ * Analyze a single scan result
+ *
+ * Tallies the result's findings by severity, by category and by code type,
+ * and builds a per-category summary (with up to 5 example findings each) for
+ * the M5 categories that produced at least one finding.
+ *
+ * @param key - Result identifier of the form `<repo>-<depth>`
+ * @param result - Parsed scan result whose `vulnerabilities` are analyzed
+ * @returns Metrics for this repo/depth combination
+ */
+function analyzeResult(key: string, result: ScanResult): RepoAnalysis {
+  // Split on the LAST hyphen: repository names may themselves contain hyphens
+  // (e.g. `next-auth-cheap`), and a plain split('-') would truncate the name
+  // and report a fragment of it as the scan depth.
+  const depthSeparator = key.lastIndexOf('-')
+  const repoName = depthSeparator === -1 ? key : key.slice(0, depthSeparator)
+  const scanDepth = depthSeparator === -1 ? 'unknown' : key.slice(depthSeparator + 1)
+  // Severity distribution
+  const bySeverity: Record<VulnerabilitySeverity, number> = {
+    critical: 0,
+    high: 0,
+    medium: 0,
+    low: 0,
+    info: 0,
+  }
+  // Category distribution
+  const byCategory: Record<string, number> = {}
+  // Code type distribution ('other' paths are intentionally not tallied)
+  let libraryCodeFindings = 0
+  let exampleCodeFindings = 0
+  let testCodeFindings = 0
+  // M5 detector findings, pre-seeded so the `!` lookup below is always defined
+  const m5FindingsMap = new Map<VulnerabilityCategory, Vulnerability[]>()
+  for (const cat of M5_CATEGORIES) {
+    m5FindingsMap.set(cat, [])
+  }
+  // Process each finding
+  for (const vuln of result.vulnerabilities) {
+    // Severity
+    bySeverity[vuln.severity]++
+    // Category
+    byCategory[vuln.category] = (byCategory[vuln.category] || 0) + 1
+    // Code type
+    const codeType = classifyFilePath(vuln.filePath)
+    if (codeType === 'library') libraryCodeFindings++
+    else if (codeType === 'example') exampleCodeFindings++
+    else if (codeType === 'test') testCodeFindings++
+    // M5 categories
+    if (M5_CATEGORIES.includes(vuln.category as VulnerabilityCategory)) {
+      m5FindingsMap.get(vuln.category as VulnerabilityCategory)!.push(vuln)
+    }
+  }
+  // Build M5 findings summary (categories without findings are omitted)
+  const m5Findings: FindingSummary[] = []
+  for (const [category, findings] of m5FindingsMap) {
+    if (findings.length === 0) continue
+    const severityBreakdown: Record<VulnerabilitySeverity, number> = {
+      critical: 0,
+      high: 0,
+      medium: 0,
+      low: 0,
+      info: 0,
+    }
+    for (const f of findings) {
+      severityBreakdown[f.severity]++
+    }
+    // Keep the first 5 findings (in scan order) as examples
+    const examples = findings.slice(0, 5).map(f => ({
+      file: f.filePath,
+      line: f.lineNumber,
+      title: f.title,
+      severity: f.severity,
+    }))
+    m5Findings.push({
+      category,
+      count: findings.length,
+      bySeverity: severityBreakdown,
+      examples,
+    })
+  }
+  // Sort m5Findings by count, highest first
+  m5Findings.sort((a, b) => b.count - a.count)
+  // Top 10 categories by count, highest first
+  const topCategories = Object.entries(byCategory)
+    .sort(([, a], [, b]) => b - a)
+    .slice(0, 10)
+    .map(([category, count]) => ({ category, count }))
+  // Medium+ count
+  const mediumPlusFindings = bySeverity.critical + bySeverity.high + bySeverity.medium
+  return {
+    repoName,
+    scanDepth,
+    totalFindings: result.vulnerabilities.length,
+    mediumPlusFindings,
+    filesScanned: result.filesScanned,
+    scanDuration: result.scanDuration,
+    bySeverity,
+    byCategory,
+    m5Findings,
+    topCategories,
+    libraryCodeFindings,
+    exampleCodeFindings,
+    testCodeFindings,
+  }
+}
+/**
+ * Roll individual analyses up into report-wide totals
+ *
+ * Sums total and medium+ findings over every analysis and accumulates, for
+ * each M5 category, its total and medium+ (critical + high + medium) counts.
+ * Note that `avgFindingsPerRepo` divides by the number of analyses passed in
+ * (one per scan), not by the number of distinct repositories.
+ *
+ * @param analyses - Per-scan analyses to aggregate
+ * @returns Aggregate metrics; the average is 0 when `analyses` is empty
+ */
+function computeAggregateMetrics(analyses: RepoAnalysis[]): ValidationReport['aggregateMetrics'] {
+  // Seed every M5 category so detectors without findings still appear with zeros
+  const perDetector: Record<string, { total: number; mediumPlus: number }> = {}
+  M5_CATEGORIES.forEach(category => {
+    perDetector[category] = { total: 0, mediumPlus: 0 }
+  })
+  let findingsSum = 0
+  let mediumPlusSum = 0
+  analyses.forEach(({ totalFindings, mediumPlusFindings, m5Findings }) => {
+    findingsSum += totalFindings
+    mediumPlusSum += mediumPlusFindings
+    m5Findings.forEach(({ category, count, bySeverity }) => {
+      const bucket = perDetector[category]
+      bucket.total += count
+      bucket.mediumPlus += bySeverity.critical + bySeverity.high + bySeverity.medium
+    })
+  })
+  const scanCount = analyses.length
+  return {
+    totalFindings: findingsSum,
+    totalMediumPlus: mediumPlusSum,
+    avgFindingsPerRepo: scanCount > 0 ? Math.round(findingsSum / scanCount) : 0,
+    m5DetectorPerformance: perDetector,
+  }
+}
+/**
+ * Render the validation report as a markdown document
+ *
+ * Sections, in order: executive summary, M5 detector table (detectors with no
+ * findings are listed by name beneath it), per-repository results grouped by
+ * repo name, a static FP triage checklist/template, and static next steps.
+ *
+ * @param report - Report to render
+ * @returns Markdown text with lines joined by '\n'
+ */
+function generateMarkdownReport(report: ValidationReport): string {
+  const { aggregateMetrics } = report
+  const out: string[] = [
+    '# M7: Real-Repo Validation Results',
+    '',
+    `> Generated: ${report.generatedAt}`,
+    '',
+    // Executive Summary
+    '## Executive Summary',
+    '',
+    `- **Repositories scanned:** ${report.totalRepos}`,
+    `- **Total scans:** ${report.totalScans}`,
+    `- **Total findings:** ${aggregateMetrics.totalFindings}`,
+    `- **Medium+ findings (to triage):** ${aggregateMetrics.totalMediumPlus}`,
+    '',
+    // M5 Detector Performance
+    '## M5 AI-Era Detector Performance',
+    '',
+    '| Detector | Total Findings | Medium+ |',
+    '|----------|----------------|---------|',
+  ]
+  // Detectors with hits become table rows; the silent ones are named below the table
+  const silentDetectors: string[] = []
+  for (const [category, stats] of Object.entries(aggregateMetrics.m5DetectorPerformance)) {
+    if (stats.total > 0) {
+      out.push(`| ${category} | ${stats.total} | ${stats.mediumPlus} |`)
+    } else if (stats.total === 0) {
+      silentDetectors.push(category)
+    }
+  }
+  if (silentDetectors.length > 0) {
+    out.push('', `**No findings for:** ${silentDetectors.join(', ')}`)
+  }
+  // Per-Repo Results
+  out.push('', '## Per-Repository Results', '')
+  // Bucket analyses by repo, keeping first-seen repo order
+  const grouped = new Map<string, RepoAnalysis[]>()
+  for (const analysis of report.analyses) {
+    const bucket = grouped.get(analysis.repoName)
+    if (bucket) {
+      bucket.push(analysis)
+    } else {
+      grouped.set(analysis.repoName, [analysis])
+    }
+  }
+  for (const [repoName, repoAnalyses] of grouped) {
+    out.push(`### ${repoName}`, '')
+    for (const entry of repoAnalyses) {
+      const sev = entry.bySeverity
+      out.push(
+        `#### Depth: ${entry.scanDepth}`,
+        '',
+        `- Files scanned: ${entry.filesScanned}`,
+        `- Total findings: ${entry.totalFindings}`,
+        `- Duration: ${entry.scanDuration}ms`,
+        '',
+        '**Severity Breakdown:**',
+        `| Critical | High | Medium | Low | Info |`,
+        `|----------|------|--------|-----|------|`,
+        `| ${sev.critical} | ${sev.high} | ${sev.medium} | ${sev.low} | ${sev.info} |`,
+        '',
+        // Code type breakdown
+        '**Finding Distribution by Code Type:**',
+        `- Library internals: ${entry.libraryCodeFindings}`,
+        `- Examples/demos: ${entry.exampleCodeFindings}`,
+        `- Test files: ${entry.testCodeFindings}`,
+        ''
+      )
+      // Top categories (at most 5 shown)
+      if (entry.topCategories.length > 0) {
+        out.push('**Top Categories:**')
+        entry.topCategories.slice(0, 5).forEach(({ category, count }) => {
+          out.push(`- ${category}: ${count}`)
+        })
+        out.push('')
+      }
+      // M5 findings with up to 3 examples each
+      if (entry.m5Findings.length > 0) {
+        out.push('**M5 Detector Findings:**')
+        entry.m5Findings.forEach(m5 => {
+          out.push(`- **${m5.category}**: ${m5.count} findings`)
+          m5.examples.slice(0, 3).forEach(ex => {
+            out.push(`  - \`${ex.file}:${ex.line}\` (${ex.severity}): ${ex.title}`)
+          })
+        })
+        out.push('')
+      }
+    }
+  }
+  // Triage Checklist
+  out.push(
+    '## FP Triage Checklist',
+    '',
+    'For each medium+ finding, classify as:',
+    '- [ ] **True Positive** - Real security issue',
+    '- [ ] **False Positive** - Safe code incorrectly flagged',
+    '- [ ] **Borderline** - Context-dependent, may need tuning',
+    '',
+    '### Triage Template',
+    '',
+    '```markdown',
+    '### Finding: [category]',
+    '**File:** [path]:[line]',
+    '**Severity:** [severity]',
+    '**Classification:** [ ] TP [ ] FP [ ] Borderline',
+    '**Context:** Library internal / Example code / Test file',
+    '**Reasoning:** [Why this is/isn\'t a real issue]',
+    '**Action:** [ ] Keep [ ] Tune detector [ ] Add to known-FP fixtures',
+    '```',
+    ''
+  )
+  // Next Steps
+  out.push(
+    '## Next Steps',
+    '',
+    '1. Review all medium+ findings in this report',
+    '2. Classify each as TP/FP/Borderline',
+    '3. Calculate FP rate: `FP / (TP + FP)` - target: <20%',
+    '4. Add FP patterns to `known-false-positives.test.ts`',
+    '5. Tune detectors if FP rate exceeds 20%',
+    ''
+  )
+  return out.join('\n')
+}
+/**
+ * Write a plain-text digest of the report to stdout
+ *
+ * Prints the report header, the aggregate metrics, one row per M5 category
+ * (including categories with zero findings) and a short block per analysis.
+ *
+ * @param report - Report to summarize
+ */
+function printConsoleSummary(report: ValidationReport): void {
+  const banner = '='.repeat(60)
+  const { aggregateMetrics: totals } = report
+  console.log('\n' + banner)
+  console.log('M7: VALIDATION ANALYSIS SUMMARY')
+  console.log(banner)
+  console.log(`\nGenerated: ${report.generatedAt}`)
+  console.log(`Repositories: ${report.totalRepos}`)
+  console.log(`Total scans: ${report.totalScans}`)
+  console.log('\n--- Aggregate Metrics ---')
+  console.log(`Total findings: ${totals.totalFindings}`)
+  console.log(`Medium+ findings: ${totals.totalMediumPlus} (to triage)`)
+  console.log(`Avg per repo: ${totals.avgFindingsPerRepo}`)
+  console.log('\n--- M5 Detector Performance ---')
+  console.log('Category                      | Total | Medium+')
+  console.log('-'.repeat(50))
+  Object.entries(totals.m5DetectorPerformance).forEach(([category, stats]) => {
+    // Pad the cells so the rows line up under the header printed above
+    const nameCell = category.padEnd(30)
+    const totalCell = String(stats.total).padEnd(6)
+    console.log(`${nameCell}| ${totalCell}| ${stats.mediumPlus}`)
+  })
+  console.log('\n--- Per-Repo Breakdown ---')
+  report.analyses.forEach(entry => {
+    console.log(`\n${entry.repoName} (${entry.scanDepth}):`)
+    console.log(`  Files: ${entry.filesScanned}, Findings: ${entry.totalFindings}, Medium+: ${entry.mediumPlusFindings}`)
+    console.log(`  Code types: Library=${entry.libraryCodeFindings}, Example=${entry.exampleCodeFindings}, Test=${entry.testCodeFindings}`)
+  })
+}
+/**
+ * Script entry point
+ *
+ * Parses `--output <path>` and `--help`/`-h`, loads and analyzes every result
+ * file, prints the console summary and, when an output path was given, writes
+ * the markdown report there (creating the parent directory if needed).
+ */
+async function main() {
+  const args = process.argv.slice(2)
+  let outputPath: string | null = null
+  // Walk the arguments left to right; `--output` consumes the value after it
+  let idx = 0
+  while (idx < args.length) {
+    const arg = args[idx]
+    if (arg === '--output' && args[idx + 1]) {
+      outputPath = args[idx + 1]
+      idx += 2
+      continue
+    }
+    if (arg === '--help' || arg === '-h') {
+      console.log(`
+M7: Results Analysis Script
+Usage:
+  npx tsx analyze-results.ts [options]
+Options:
+  --output <path>   Write markdown report to file
+  --help, -h        Show this help
+Examples:
+  npx tsx analyze-results.ts                                    # Print summary
+  npx tsx analyze-results.ts --output docs/RESULTSCOMPARISON.md # Generate report
+`)
+      process.exit(0)
+    }
+    idx += 1
+  }
+  // Load results
+  const results = loadResults()
+  console.log(`Loaded ${results.size} result files`)
+  // One analysis per result file, in load order
+  const analyses: RepoAnalysis[] = Array.from(results, ([key, result]) => analyzeResult(key, result))
+  // Build report
+  const report: ValidationReport = {
+    generatedAt: new Date().toISOString(),
+    totalRepos: new Set(analyses.map(a => a.repoName)).size,
+    totalScans: analyses.length,
+    analyses,
+    aggregateMetrics: computeAggregateMetrics(analyses),
+  }
+  // Print console summary
+  printConsoleSummary(report)
+  // Without an output path there is nothing to write; just hint at the flag
+  if (!outputPath) {
+    console.log('\nTip: Use --output docs/RESULTSCOMPARISON.md to generate full report')
+    return
+  }
+  const markdown = generateMarkdownReport(report)
+  // Relative output paths are resolved against the current working directory
+  const fullPath = path.isAbsolute(outputPath) ? outputPath : path.join(process.cwd(), outputPath)
+  // Ensure directory exists
+  const dir = path.dirname(fullPath)
+  if (!fs.existsSync(dir)) {
+    fs.mkdirSync(dir, { recursive: true })
+  }
+  fs.writeFileSync(fullPath, markdown)
+  console.log(`\nMarkdown report saved to: ${fullPath}`)
+}
+// Run; any failure is reported and turned into exit code 1
+main().catch(failure => {
+  console.error('Analysis failed:', failure)
+  process.exit(1)
+})

package/src/__tests__/validation/extract-for-triage.ts ADDED Viewed

@@ -0,0 +1,146 @@
+#!/usr/bin/env npx tsx
+/**
+ * Extract medium+ findings for systematic triage
+ *
+ * Outputs findings grouped by category with file paths for code review
+ */
+import * as fs from 'fs'
+import * as path from 'path'
+import type { ScanResult, Vulnerability } from '../../types'
+const RESULTS_DIR = path.join(__dirname, '../../../validation-results') // scan-result JSON files are read from here, and main() writes medium-plus-findings.json back into it
+const REPOS_DIR = path.join(__dirname, '../../../validation-repos') // NOTE(review): not referenced anywhere in the visible part of this file — confirm it is still needed
+interface TriageFinding { // flattened view of one medium+ vulnerability, as exported for manual triage
+  id: string // copied from the vulnerability's id
+  repo: string // result file name with its '-cheap.json' / '-validated.json' suffix removed
+  file: string // copied from the vulnerability's filePath
+  line: number // copied from the vulnerability's lineNumber
+  severity: string // only 'critical', 'high' or 'medium' findings are extracted
+  category: string // copied from the vulnerability's category
+  title: string // copied from the vulnerability's title
+  description: string // copied from the vulnerability's description
+  lineContent: string // copied from the vulnerability's lineContent
+  codeType: 'library' | 'example' | 'test' | 'other' // result of classifyCodeType on the file path
+}
+/**
+ * Classify a file path as test, example, library or other code
+ *
+ * Matching is case-insensitive and evaluated in priority order: test markers
+ * first, then example/demo markers, then library markers. Backslashes are
+ * converted to forward slashes and a leading '/' is assumed, so relative
+ * paths (`tests/foo.ts`) and Windows paths (`src\utils\a.ts`) hit the
+ * directory markers as well. The `_test.` marker is included so suffix-style
+ * test files (e.g. `server_test.go`) are recognized, matching the marker list
+ * used by classifyFilePath in analyze-results.ts.
+ *
+ * @param filePath - Path of the file a finding was reported in
+ * @returns 'test', 'example' or 'library' for the first marker group that
+ *          matches, otherwise 'other'
+ */
+function classifyCodeType(filePath: string): 'library' | 'example' | 'test' | 'other' {
+  // Directory markers are written as '/name/'; normalize the path so a marker
+  // directory in first position or behind a backslash is still recognized.
+  const forwardSlashed = filePath.toLowerCase().replace(/\\/g, '/')
+  const lowerPath = forwardSlashed.startsWith('/') ? forwardSlashed : `/${forwardSlashed}`
+  const containsAny = (markers: string[]): boolean =>
+    markers.some(marker => lowerPath.includes(marker))
+  if (containsAny(['__tests__', '/test/', '/tests/', '.test.', '.spec.', '_test.', '/fixtures/'])) {
+    return 'test'
+  }
+  if (containsAny(['/examples/', '/example/', '/demos/', '/demo/', '/templates/', '/cookbook/'])) {
+    return 'example'
+  }
+  if (containsAny(['/src/', '/lib/', '/libs/', '/packages/'])) {
+    return 'library'
+  }
+  return 'other'
+}
+/**
+ * Collect every critical, high and medium finding from the result files
+ *
+ * Reads each scan-result `*.json` in RESULTS_DIR, skipping files whose name
+ * contains 'medium-plus', and flattens the qualifying vulnerabilities into
+ * triage records tagged with their repository and code type.
+ *
+ * @returns Triage records in file order, then in each file's finding order
+ */
+function extractMediumPlusFindings(): TriageFinding[] {
+  const findings: TriageFinding[] = []
+  // Skip this script's own export (medium-plus-findings.json, written by
+  // main() into the same directory): it is a bare array rather than a
+  // ScanResult, so reading it back on a second run would crash when
+  // iterating `result.vulnerabilities`.
+  const files = fs.readdirSync(RESULTS_DIR).filter(f =>
+    f.endsWith('.json') && !f.includes('medium-plus')
+  )
+  for (const file of files) {
+    // Result files are named `<repo>-cheap.json` or `<repo>-validated.json`
+    const repoName = file.replace('-cheap.json', '').replace('-validated.json', '')
+    const content = fs.readFileSync(path.join(RESULTS_DIR, file), 'utf-8')
+    const result = JSON.parse(content) as ScanResult
+    for (const vuln of result.vulnerabilities) {
+      if (['critical', 'high', 'medium'].includes(vuln.severity)) {
+        findings.push({
+          id: vuln.id,
+          repo: repoName,
+          file: vuln.filePath,
+          line: vuln.lineNumber,
+          severity: vuln.severity,
+          category: vuln.category,
+          title: vuln.title,
+          description: vuln.description,
+          lineContent: vuln.lineContent,
+          codeType: classifyCodeType(vuln.filePath),
+        })
+      }
+    }
+  }
+  return findings
+}
+/**
+ * Bucket findings by their category
+ *
+ * @param findings - Findings to group
+ * @returns Map from category to its findings; categories appear in
+ *          first-seen order and each bucket keeps the input order
+ */
+function groupByCategory(findings: TriageFinding[]): Map<string, TriageFinding[]> {
+  return findings.reduce((byCategory, finding) => {
+    const bucket = byCategory.get(finding.category)
+    if (bucket === undefined) {
+      byCategory.set(finding.category, [finding])
+    } else {
+      bucket.push(finding)
+    }
+    return byCategory
+  }, new Map<string, TriageFinding[]>())
+}
+/**
+ * Script entry point
+ *
+ * Extracts the medium+ findings, prints breakdowns by category, code type
+ * and repository, and exports the findings to `medium-plus-findings.json`
+ * inside RESULTS_DIR.
+ */
+function main() {
+  const findings = extractMediumPlusFindings()
+  const grouped = groupByCategory(findings)
+  // Count the findings in `items` that satisfy `matches`
+  const countWhere = (items: TriageFinding[], matches: (f: TriageFinding) => boolean): number =>
+    items.filter(matches).length
+  const banner = '='.repeat(60)
+  console.log(`\n${banner}`)
+  console.log('MEDIUM+ FINDINGS FOR TRIAGE')
+  console.log(banner)
+  console.log(`Total: ${findings.length} findings\n`)
+  // Summary by category, largest category first
+  console.log('By Category:')
+  const rankedCategories = Array.from(grouped).sort(([, a], [, b]) => b.length - a.length)
+  rankedCategories.forEach(([category, catFindings]) => {
+    const critical = countWhere(catFindings, f => f.severity === 'critical')
+    const high = countWhere(catFindings, f => f.severity === 'high')
+    const medium = countWhere(catFindings, f => f.severity === 'medium')
+    console.log(`  ${category}: ${catFindings.length} (C:${critical} H:${high} M:${medium})`)
+  })
+  // By code type
+  const libraryCount = countWhere(findings, f => f.codeType === 'library')
+  const exampleCount = countWhere(findings, f => f.codeType === 'example')
+  const testCount = countWhere(findings, f => f.codeType === 'test')
+  const otherCount = countWhere(findings, f => f.codeType === 'other')
+  console.log(`\nBy Code Type:`)
+  console.log(`  Library: ${libraryCount}`)
+  console.log(`  Example: ${exampleCount}`)
+  console.log(`  Test: ${testCount}`)
+  console.log(`  Other: ${otherCount}`)
+  // Output JSON for further processing
+  const outputPath = path.join(RESULTS_DIR, 'medium-plus-findings.json')
+  fs.writeFileSync(outputPath, JSON.stringify(findings, null, 2))
+  console.log(`\nFindings exported to: ${outputPath}`)
+  // Output summary by repo, in first-seen order
+  console.log('\nBy Repository:')
+  const perRepo = new Map<string, number>()
+  findings.forEach(({ repo }) => {
+    perRepo.set(repo, (perRepo.get(repo) || 0) + 1)
+  })
+  perRepo.forEach((count, repo) => {
+    console.log(`  ${repo}: ${count}`)
+  })
+}
+main()