zen-ai-pentest 2.2.0__py3-none-any.whl → 2.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
modules/cve_updater.py ADDED
@@ -0,0 +1,303 @@
1
+ """CVE Database Auto-Update Module
2
+
3
+ Fetches and updates CVE data from NVD (National Vulnerability Database)
4
+ - Daily delta updates
5
+ - Caching with ETags
6
+ - Rate limiting compliance (NVD: max 5 requests in 30 seconds)
7
+ """
8
+ import asyncio
9
+ import json
10
+ import os
11
+ from typing import Dict, List, Optional, Set
12
+ from datetime import datetime, timedelta
13
+ from dataclasses import dataclass, asdict
14
+ import aiohttp
15
+ import aiofiles
16
+ import logging
17
+
18
+
19
@dataclass
class CVEEntry:
    """One normalized CVE record parsed from the NVD 2.0 API response.

    Timestamps are kept as the ISO-8601 strings NVD returns; CVSS fields
    fall back to 0.0 / "" / "unknown" when no v3.x metric is present.
    """
    id: str                  # CVE identifier, e.g. "CVE-2024-12345"
    published: str           # first publication timestamp (ISO string)
    last_modified: str       # last modification timestamp (ISO string)
    description: str         # English-language description text
    cvss_score: float        # CVSS v3.x base score (0.0 when unavailable)
    cvss_vector: str         # CVSS vector string, e.g. "CVSS:3.1/AV:N/..."
    severity: str            # lowercase severity bucket, "unknown" if absent
    references: List[str]    # reference URLs
    cpe_matches: List[str]   # CPE match criteria strings
31
+
32
+
33
class NVDClient:
    """Async client for the NVD CVE 2.0 REST API with rate limiting.

    NVD allows at most 5 requests per rolling 30-second window for
    unauthenticated clients, so requests are spaced RATE_LIMIT_DELAY apart.
    Use as an async context manager so the HTTP session is closed.
    """

    BASE_URL = "https://services.nvd.nist.gov/rest/json/cves/2.0"
    RATE_LIMIT_DELAY = 6.0  # 6 seconds between requests (max 5 per 30s)

    def __init__(self, api_key: Optional[str] = None):
        # An API key raises the NVD rate limit; fall back to the env var.
        self.api_key = api_key or os.getenv("NVD_API_KEY")
        self.last_request_time = 0
        self.session: Optional["aiohttp.ClientSession"] = None

    async def __aenter__(self):
        self.session = aiohttp.ClientSession()
        return self

    async def __aexit__(self, *args):
        if self.session:
            await self.session.close()

    async def _rate_limit(self):
        """Sleep just long enough to keep requests RATE_LIMIT_DELAY apart."""
        # get_running_loop() is the supported call inside a coroutine;
        # asyncio.get_event_loop() here is deprecated since Python 3.10.
        loop = asyncio.get_running_loop()
        elapsed = loop.time() - self.last_request_time
        if elapsed < self.RATE_LIMIT_DELAY:
            await asyncio.sleep(self.RATE_LIMIT_DELAY - elapsed)
        self.last_request_time = loop.time()

    async def fetch_cves(
        self,
        start_date: Optional[datetime] = None,
        end_date: Optional[datetime] = None,
        results_per_page: int = 2000
    ) -> "List[CVEEntry]":
        """Fetch one page of CVEs, optionally bounded by lastModified dates.

        NOTE: only the first page is fetched; callers needing more than
        ``results_per_page`` results must add startIndex pagination.

        Raises:
            Exception: if NVD responds with a non-200 status.
        """
        await self._rate_limit()

        # aiohttp/yarl require string query values; an int here raises
        # TypeError at request time.
        params = {"resultsPerPage": str(results_per_page)}

        if start_date:
            params["lastModStartDate"] = start_date.strftime("%Y-%m-%dT%H:%M:%S.000")
        if end_date:
            params["lastModEndDate"] = end_date.strftime("%Y-%m-%dT%H:%M:%S.000")

        # Per the NVD API documentation the key is sent in the ``apiKey``
        # request header, not as a query parameter.
        headers = {"apiKey": self.api_key} if self.api_key else {}

        async with self.session.get(self.BASE_URL, params=params, headers=headers) as resp:
            if resp.status != 200:
                raise Exception(f"NVD API error: {resp.status}")

            data = await resp.json()
            return self._parse_cves(data)

    @staticmethod
    def _primary_cvss(metrics: Dict):
        """Return (base_score, severity, vector) from the preferred CVSS metric.

        Prefers CVSS v3.1 over v3.0; returns (0.0, "unknown", "") when
        neither metric family is present.
        """
        for key in ("cvssMetricV31", "cvssMetricV30"):
            if key in metrics:
                entry = metrics[key][0]
                cvss_data = entry["cvssData"]
                return (
                    cvss_data.get("baseScore", 0.0),
                    entry.get("baseSeverity", "unknown").lower(),
                    cvss_data.get("vectorString", ""),
                )
        return 0.0, "unknown", ""

    def _parse_cves(self, data: Dict) -> "List[CVEEntry]":
        """Parse an NVD API response body into a list of CVEEntry objects."""
        cves = []

        for vuln in data.get("vulnerabilities", []):
            cve_data = vuln.get("cve", {})

            # Extract CVSS score / severity / vector (v3.1 preferred)
            cvss_score, severity, cvss_vector = self._primary_cvss(
                cve_data.get("metrics", {})
            )

            # Extract description (English only)
            description = ""
            for desc in cve_data.get("descriptions", []):
                if desc.get("lang") == "en":
                    description = desc.get("value", "")
                    break

            # Extract reference URLs, skipping entries without one
            references = [
                ref.get("url", "")
                for ref in cve_data.get("references", [])
                if ref.get("url")
            ]

            # Extract CPE match criteria from all configuration nodes
            cpe_matches = []
            for config in cve_data.get("configurations", []):
                for node in config.get("nodes", []):
                    for match in node.get("cpeMatch", []):
                        if match.get("criteria"):
                            cpe_matches.append(match["criteria"])

            cves.append(CVEEntry(
                id=cve_data.get("id", ""),
                published=cve_data.get("published", ""),
                last_modified=cve_data.get("lastModified", ""),
                description=description,
                cvss_score=cvss_score,
                cvss_vector=cvss_vector,
                severity=severity,
                references=references,
                cpe_matches=cpe_matches
            ))

        return cves
147
+
148
+
149
class CVEUpdater:
    """Maintains a local JSON CVE database synced from NVD.

    On-disk layout:
      - ``db_path``: JSON object mapping CVE id -> CVEEntry fields
      - ``<db_path stem>_meta.json``: bookkeeping about the last update
    """

    def __init__(self, db_path: str = "data/cve_database.json"):
        self.db_path = db_path
        # Metadata file lives next to the database file.
        self.metadata_path = db_path.replace(".json", "_meta.json")
        self.db_dir = os.path.dirname(db_path)

        # Ensure the target directory exists before any write
        if self.db_dir:
            os.makedirs(self.db_dir, exist_ok=True)

    async def initialize_db(self):
        """Create an empty database and metadata file on first run."""
        if not os.path.exists(self.db_path):
            await self._save_db({})
            await self._save_metadata({"last_update": None, "total_cves": 0})

    async def update(self, days_back: int = 1) -> Dict:
        """Merge CVEs modified in the last ``days_back`` days into the database.

        Returns:
            The metadata dict written to disk (counts and date range).
        """
        await self.initialize_db()

        # Calculate the lastModified date range.
        # NOTE(review): datetime.utcnow() is deprecated in Python 3.12;
        # datetime.now(timezone.utc) would make these timestamps tz-aware.
        end_date = datetime.utcnow()
        start_date = end_date - timedelta(days=days_back)

        logging.info(f"Fetching CVEs from {start_date} to {end_date}")

        # Fetch from NVD (single page; NVD caps a date range at 120 days)
        async with NVDClient() as client:
            cves = await client.fetch_cves(start_date, end_date)

        # Load existing database
        db = await self._load_db()

        # Merge: count brand-new ids separately from modified ones
        new_count = 0
        updated_count = 0

        for cve in cves:
            if cve.id not in db:
                new_count += 1
            elif db[cve.id]["last_modified"] != cve.last_modified:
                updated_count += 1

            db[cve.id] = asdict(cve)

        # Save updated database
        await self._save_db(db)

        # Update metadata
        metadata = {
            "last_update": datetime.utcnow().isoformat(),
            "total_cves": len(db),
            "last_fetch_new": new_count,
            "last_fetch_updated": updated_count,
            "last_fetch_date_range": f"{start_date.date()} to {end_date.date()}"
        }
        await self._save_metadata(metadata)

        logging.info(f"Update complete: {new_count} new, {updated_count} updated, {len(db)} total")

        return metadata

    async def full_sync(self) -> Dict:
        """Full database sync (120 days back — the NVD date-range limit)."""
        return await self.update(days_back=120)

    async def _load_db(self) -> Dict:
        """Load the CVE database; an absent file reads as empty."""
        if not os.path.exists(self.db_path):
            return {}

        async with aiofiles.open(self.db_path, 'r') as f:
            content = await f.read()
            return json.loads(content)

    async def _save_db(self, db: Dict):
        """Persist the database as pretty-printed JSON."""
        async with aiofiles.open(self.db_path, 'w') as f:
            await f.write(json.dumps(db, indent=2))

    async def _load_metadata(self) -> Dict:
        """Load update metadata; an absent file reads as empty."""
        if not os.path.exists(self.metadata_path):
            return {}

        async with aiofiles.open(self.metadata_path, 'r') as f:
            content = await f.read()
            return json.loads(content)

    async def _save_metadata(self, metadata: Dict):
        """Persist update metadata as pretty-printed JSON."""
        async with aiofiles.open(self.metadata_path, 'w') as f:
            await f.write(json.dumps(metadata, indent=2))

    def get_stats(self) -> Dict:
        """Summarize database state without touching the network.

        Returns {"status": "not_initialized"} before the first sync and
        {"status": "error", "error": ...} for unreadable/corrupt files.
        """
        try:
            if not os.path.exists(self.db_path):
                return {"status": "not_initialized"}

            with open(self.db_path, 'r') as f:
                db = json.load(f)

            # A missing metadata file (e.g. interrupted update) should not
            # make stats fail — treat it as empty instead of raising.
            metadata = {}
            if os.path.exists(self.metadata_path):
                with open(self.metadata_path, 'r') as f:
                    metadata = json.load(f)

            # Count entries by severity bucket
            severity_counts = {}
            for cve in db.values():
                sev = cve.get("severity", "unknown")
                severity_counts[sev] = severity_counts.get(sev, 0) + 1

            return {
                "status": "ready",
                "total_cves": len(db),
                "last_update": metadata.get("last_update"),
                "by_severity": severity_counts,
                "metadata": metadata
            }
        except Exception as e:
            return {"status": "error", "error": str(e)}

    async def lookup_cve(self, cve_id: str) -> Optional[Dict]:
        """Look up a single CVE by id; returns None when not present."""
        db = await self._load_db()
        return db.get(cve_id)

    def get_info(self) -> Dict:
        """Return static module metadata for discovery/registration."""
        return {
            "name": "cve_updater",
            "version": "1.0.0",
            "description": "CVE Database Auto-Update from NVD",
            "source": "NVD (National Vulnerability Database)",
            "update_frequency": "daily",
            "rate_limit": "6 seconds between requests"
        }
288
+
289
+
290
# CLI interface
if __name__ == "__main__":
    import sys

    logging.basicConfig(level=logging.INFO)

    updater = CVEUpdater()

    # "full" argument triggers the 120-day full sync; default is a daily delta.
    wants_full = len(sys.argv) > 1 and sys.argv[1] == "full"
    coro = updater.full_sync() if wants_full else updater.update()
    result = asyncio.run(coro)

    print(json.dumps(result, indent=2))
@@ -0,0 +1,149 @@
1
+ """False Positive Reduction Module
2
+
3
+ Uses ML-based heuristics and rule-based filters to reduce false positives.
4
+ Addresses Issue #14
5
+ """
6
+ from typing import Dict, List, Any, Optional
7
+ from dataclasses import dataclass
8
+ from enum import Enum
9
+ import re
10
+
11
+
12
class ConfidenceLevel(Enum):
    """Confidence buckets used to label security findings."""
    HIGH = "high"        # > 90% confidence
    MEDIUM = "medium"    # 70-90% confidence
    LOW = "low"          # 50-70% confidence
    UNKNOWN = "unknown"  # < 50% confidence
17
+
18
+
19
@dataclass
class Finding:
    """A single security finding emitted by a scanning tool."""
    title: str               # short human-readable summary
    description: str         # detailed narrative of the issue
    severity: str            # severity bucket, e.g. "low"/"medium"/"high"
    cvss_score: float        # CVSS base score
    evidence: List[str]      # supporting artifacts (payloads, responses, ...)
    tool: str                # name of the tool that produced the finding
    confidence: float = 0.5  # scanner confidence in [0, 1]
29
+
30
+
31
class FalsePositiveFilter:
    """Filter false positives from security findings.

    Combines a rule-based pass (known-FP regex patterns, FP keywords, a
    hard confidence floor) with a heuristic "ML" score, then splits a
    list of findings into true positives and false positives.
    """

    name = "false_positive_filter"
    version = "1.0.0"

    # Known false positive patterns
    FALSE_POSITIVE_PATTERNS = [
        r"(?i)self-signed certificate",  # Often intentional in dev
        r"(?i)directory listing.*empty",
        r"(?i)missing.*header.*not applicable",
        r"(?i)information disclosure.*version.*normal",
        r"(?i)cookie.*without.*secure.*localhost",
    ]

    # Keywords that indicate likely false positive.
    # NOTE(review): matching below is plain substring, so "test" also hits
    # "latest"/"protest"; word-boundary matching would be stricter but
    # would change behavior, so it is left as-is.
    FP_KEYWORDS = [
        "test", "localhost", "127.0.0.1", "example.com",
        "documentation", "intentional", "expected behavior"
    ]

    def __init__(self):
        self.rules_applied = 0          # reserved counter for applied rules
        self.ml_model_loaded = False    # no trained model is wired in yet

    def apply_rule_based_filter(self, finding: "Finding") -> tuple:
        """Apply rule-based filtering to a single finding.

        Fix: the original annotated this ``-> Tuple[bool, str]`` but
        ``Tuple`` was never imported, raising NameError at import time.

        Returns:
            (is_false_positive, reason) — reason is "" when not an FP.
        """
        # Check title + description against known FP patterns
        combined_text = f"{finding.title} {finding.description}"

        for pattern in self.FALSE_POSITIVE_PATTERNS:
            if re.search(pattern, combined_text):
                return True, f"Matched FP pattern: {pattern}"

        # Check for FP keywords (case-insensitive substring match)
        for keyword in self.FP_KEYWORDS:
            if keyword.lower() in combined_text.lower():
                return True, f"Contains FP keyword: {keyword}"

        # Anything the scanner itself barely believes is treated as FP
        if finding.confidence < 0.3:
            return True, "Confidence below threshold (0.3)"

        return False, ""

    def apply_ml_filter(self, finding: "Finding") -> float:
        """Heuristic false-positive probability in [0.0, 1.0].

        In production this would call a trained model; for now simple
        evidence/title/severity heuristics serve as a proxy.
        """
        fp_score = 0.0

        # Little or no evidence -> higher FP probability
        if len(finding.evidence) == 0:
            fp_score += 0.3
        elif len(finding.evidence) < 2:
            fp_score += 0.1

        # Short, generic titles -> higher FP probability
        generic_patterns = [r"(?i)vulnerability", r"(?i)issue", r"(?i)problem"]
        for pattern in generic_patterns:
            if re.search(pattern, finding.title) and len(finding.title) < 30:
                fp_score += 0.15

        # Low severity combined with low confidence -> likely FP
        if finding.severity == "low" and finding.confidence < 0.5:
            fp_score += 0.2

        return min(fp_score, 1.0)

    def filter_findings(
        self,
        findings: "List[Finding]",
        fp_threshold: float = 0.7
    ) -> Dict[str, Any]:
        """Split findings into true positives and false positives.

        A finding is classed as FP when either the rule-based filter
        fires or the heuristic score exceeds ``fp_threshold``.

        Returns:
            dict with 'true_positives' (list of Finding),
            'false_positives' (list of dicts with finding/probability/reason),
            and 'reduction_rate' (fraction filtered out, 0 for empty input).
        """
        true_positives = []
        false_positives = []

        for finding in findings:
            # Rule-based filter
            is_fp_rule, reason = self.apply_rule_based_filter(finding)

            # Heuristic ("ML") filter
            fp_probability = self.apply_ml_filter(finding)

            # Either signal is enough to mark the finding as an FP
            if is_fp_rule or fp_probability > fp_threshold:
                false_positives.append({
                    'finding': finding,
                    'fp_probability': fp_probability,
                    'reason': reason if is_fp_rule else f"ML score: {fp_probability:.2f}"
                })
            else:
                true_positives.append(finding)

        return {
            'true_positives': true_positives,
            'false_positives': false_positives,
            'reduction_rate': len(false_positives) / len(findings) if findings else 0
        }

    def get_info(self) -> Dict:
        """Return static module metadata for discovery/registration."""
        return {
            'name': self.name,
            'version': self.version,
            'description': 'ML-based false positive reduction',
            'rules_count': len(self.FALSE_POSITIVE_PATTERNS),
            'threshold': 0.7
        }
+ }