bbot 2.6.0.6840rc0-py3-none-any.whl → 2.7.2.7424rc0-py3-none-any.whl

This diff shows the changes between two package versions as they were publicly released to their registry, and is provided for informational purposes only.
Files changed (122)
  1. bbot/__init__.py +1 -1
  2. bbot/cli.py +22 -8
  3. bbot/core/engine.py +1 -1
  4. bbot/core/event/__init__.py +2 -2
  5. bbot/core/event/base.py +138 -110
  6. bbot/core/flags.py +1 -0
  7. bbot/core/helpers/bloom.py +6 -7
  8. bbot/core/helpers/depsinstaller/installer.py +21 -2
  9. bbot/core/helpers/dns/dns.py +0 -1
  10. bbot/core/helpers/dns/engine.py +0 -2
  11. bbot/core/helpers/files.py +2 -2
  12. bbot/core/helpers/git.py +17 -0
  13. bbot/core/helpers/helper.py +6 -5
  14. bbot/core/helpers/misc.py +8 -23
  15. bbot/core/helpers/ntlm.py +0 -2
  16. bbot/core/helpers/regex.py +1 -1
  17. bbot/core/helpers/regexes.py +25 -8
  18. bbot/core/helpers/web/web.py +2 -1
  19. bbot/core/modules.py +22 -60
  20. bbot/defaults.yml +4 -2
  21. bbot/modules/apkpure.py +1 -1
  22. bbot/modules/baddns.py +1 -1
  23. bbot/modules/baddns_direct.py +1 -1
  24. bbot/modules/baddns_zone.py +1 -1
  25. bbot/modules/badsecrets.py +1 -1
  26. bbot/modules/base.py +123 -38
  27. bbot/modules/bucket_amazon.py +1 -1
  28. bbot/modules/bucket_digitalocean.py +1 -1
  29. bbot/modules/bucket_firebase.py +1 -1
  30. bbot/modules/bucket_google.py +1 -1
  31. bbot/modules/{bucket_azure.py → bucket_microsoft.py} +2 -2
  32. bbot/modules/builtwith.py +4 -2
  33. bbot/modules/dnsbimi.py +1 -4
  34. bbot/modules/dnsbrute.py +6 -1
  35. bbot/modules/dnsdumpster.py +35 -52
  36. bbot/modules/dnstlsrpt.py +0 -6
  37. bbot/modules/docker_pull.py +1 -1
  38. bbot/modules/emailformat.py +17 -1
  39. bbot/modules/ffuf.py +4 -1
  40. bbot/modules/ffuf_shortnames.py +6 -3
  41. bbot/modules/filedownload.py +7 -4
  42. bbot/modules/git_clone.py +47 -22
  43. bbot/modules/gitdumper.py +4 -14
  44. bbot/modules/github_workflows.py +6 -5
  45. bbot/modules/gitlab_com.py +31 -0
  46. bbot/modules/gitlab_onprem.py +84 -0
  47. bbot/modules/gowitness.py +0 -6
  48. bbot/modules/graphql_introspection.py +5 -2
  49. bbot/modules/httpx.py +2 -0
  50. bbot/modules/iis_shortnames.py +0 -7
  51. bbot/modules/internal/cloudcheck.py +65 -72
  52. bbot/modules/internal/unarchive.py +9 -3
  53. bbot/modules/lightfuzz/lightfuzz.py +6 -2
  54. bbot/modules/lightfuzz/submodules/esi.py +42 -0
  55. bbot/modules/medusa.py +4 -7
  56. bbot/modules/nuclei.py +1 -1
  57. bbot/modules/otx.py +9 -2
  58. bbot/modules/output/base.py +3 -11
  59. bbot/modules/paramminer_headers.py +10 -7
  60. bbot/modules/portfilter.py +2 -0
  61. bbot/modules/postman_download.py +1 -1
  62. bbot/modules/retirejs.py +232 -0
  63. bbot/modules/securitytxt.py +0 -3
  64. bbot/modules/sslcert.py +2 -2
  65. bbot/modules/subdomaincenter.py +1 -16
  66. bbot/modules/telerik.py +7 -2
  67. bbot/modules/templates/bucket.py +24 -4
  68. bbot/modules/templates/gitlab.py +98 -0
  69. bbot/modules/trufflehog.py +6 -3
  70. bbot/modules/wafw00f.py +2 -2
  71. bbot/presets/web/lightfuzz-heavy.yml +1 -1
  72. bbot/presets/web/lightfuzz-medium.yml +1 -1
  73. bbot/presets/web/lightfuzz-superheavy.yml +1 -1
  74. bbot/scanner/manager.py +44 -37
  75. bbot/scanner/scanner.py +12 -4
  76. bbot/scripts/benchmark_report.py +433 -0
  77. bbot/test/benchmarks/__init__.py +2 -0
  78. bbot/test/benchmarks/test_bloom_filter_benchmarks.py +105 -0
  79. bbot/test/benchmarks/test_closest_match_benchmarks.py +76 -0
  80. bbot/test/benchmarks/test_event_validation_benchmarks.py +438 -0
  81. bbot/test/benchmarks/test_excavate_benchmarks.py +291 -0
  82. bbot/test/benchmarks/test_ipaddress_benchmarks.py +143 -0
  83. bbot/test/benchmarks/test_weighted_shuffle_benchmarks.py +70 -0
  84. bbot/test/test_step_1/test_bbot_fastapi.py +2 -2
  85. bbot/test/test_step_1/test_events.py +22 -21
  86. bbot/test/test_step_1/test_helpers.py +1 -0
  87. bbot/test/test_step_1/test_manager_scope_accuracy.py +45 -0
  88. bbot/test/test_step_1/test_modules_basic.py +40 -15
  89. bbot/test/test_step_1/test_python_api.py +2 -2
  90. bbot/test/test_step_1/test_regexes.py +21 -4
  91. bbot/test/test_step_1/test_scan.py +7 -8
  92. bbot/test/test_step_1/test_web.py +46 -0
  93. bbot/test/test_step_2/module_tests/base.py +6 -1
  94. bbot/test/test_step_2/module_tests/test_module_bucket_amazon.py +52 -18
  95. bbot/test/test_step_2/module_tests/test_module_bucket_google.py +1 -1
  96. bbot/test/test_step_2/module_tests/{test_module_bucket_azure.py → test_module_bucket_microsoft.py} +7 -5
  97. bbot/test/test_step_2/module_tests/test_module_cloudcheck.py +19 -31
  98. bbot/test/test_step_2/module_tests/test_module_dnsbimi.py +2 -1
  99. bbot/test/test_step_2/module_tests/test_module_dnsdumpster.py +3 -5
  100. bbot/test/test_step_2/module_tests/test_module_emailformat.py +1 -1
  101. bbot/test/test_step_2/module_tests/test_module_emails.py +2 -2
  102. bbot/test/test_step_2/module_tests/test_module_excavate.py +57 -4
  103. bbot/test/test_step_2/module_tests/test_module_github_workflows.py +10 -1
  104. bbot/test/test_step_2/module_tests/test_module_gitlab_com.py +66 -0
  105. bbot/test/test_step_2/module_tests/{test_module_gitlab.py → test_module_gitlab_onprem.py} +4 -69
  106. bbot/test/test_step_2/module_tests/test_module_lightfuzz.py +71 -3
  107. bbot/test/test_step_2/module_tests/test_module_nuclei.py +1 -2
  108. bbot/test/test_step_2/module_tests/test_module_otx.py +3 -0
  109. bbot/test/test_step_2/module_tests/test_module_portfilter.py +2 -0
  110. bbot/test/test_step_2/module_tests/test_module_retirejs.py +161 -0
  111. bbot/test/test_step_2/module_tests/test_module_telerik.py +1 -1
  112. bbot/test/test_step_2/module_tests/test_module_trufflehog.py +10 -1
  113. {bbot-2.6.0.6840rc0.dist-info → bbot-2.7.2.7424rc0.dist-info}/METADATA +10 -7
  114. {bbot-2.6.0.6840rc0.dist-info → bbot-2.7.2.7424rc0.dist-info}/RECORD +117 -106
  115. {bbot-2.6.0.6840rc0.dist-info → bbot-2.7.2.7424rc0.dist-info}/WHEEL +1 -1
  116. {bbot-2.6.0.6840rc0.dist-info → bbot-2.7.2.7424rc0.dist-info/licenses}/LICENSE +98 -58
  117. bbot/modules/censys.py +0 -98
  118. bbot/modules/gitlab.py +0 -141
  119. bbot/modules/zoomeye.py +0 -77
  120. bbot/test/test_step_2/module_tests/test_module_censys.py +0 -83
  121. bbot/test/test_step_2/module_tests/test_module_zoomeye.py +0 -35
  122. {bbot-2.6.0.6840rc0.dist-info → bbot-2.7.2.7424rc0.dist-info}/entry_points.txt +0 -0
bbot/scanner/scanner.py CHANGED
@@ -10,7 +10,7 @@ from datetime import datetime
 from collections import OrderedDict

 from bbot import __version__
-from bbot.core.event import make_event
+from bbot.core.event import make_event, update_event
 from .manager import ScanIngress, ScanEgress
 from bbot.core.helpers.misc import sha1, rand_string
 from bbot.core.helpers.names_generator import random_name
@@ -99,6 +99,7 @@ class Scanner:
     def __init__(
         self,
         *targets,
+        name=None,
         scan_id=None,
         dispatcher=None,
         **kwargs,
@@ -137,6 +138,9 @@

         from .preset import Preset

+        if name is not None:
+            kwargs["scan_name"] = name
+
         base_preset = Preset(*targets, **kwargs)

         if custom_preset is not None:
@@ -226,8 +230,8 @@
         )

         # url file extensions
+        self.url_extension_special = {e.lower() for e in self.config.get("url_extension_special", [])}
         self.url_extension_blacklist = {e.lower() for e in self.config.get("url_extension_blacklist", [])}
-        self.url_extension_httpx_only = {e.lower() for e in self.config.get("url_extension_httpx_only", [])}

         # url querystring behavior
         self.url_querystring_remove = self.config.get("url_querystring_remove", True)
@@ -480,7 +484,7 @@
         for module in self.modules.values():
             module.start()

-    async def setup_modules(self, remove_failed=True):
+    async def setup_modules(self, remove_failed=True, deps_only=False):
         """Asynchronously initializes all loaded modules by invoking their `setup()` methods.

         Args:
@@ -505,7 +509,7 @@
         hard_failed = []
         soft_failed = []

-        async for task in self.helpers.as_completed([m._setup() for m in self.modules.values()]):
+        async for task in self.helpers.as_completed([m._setup(deps_only=deps_only) for m in self.modules.values()]):
             module, status, msg = await task
             if status is True:
                 self.debug(f"Setup succeeded for {module.name} ({msg})")
@@ -991,6 +995,10 @@
         event = make_event(*args, **kwargs)
         return event

+    def update_event(self, event, **kwargs):
+        kwargs["scan"] = self
+        return update_event(event, **kwargs)
+
     @property
     def root_event(self):
         """
bbot/scripts/benchmark_report.py ADDED
@@ -0,0 +1,433 @@
+#!/usr/bin/env python3
+"""
+Branch-based benchmark comparison tool for BBOT performance tests.
+
+This script takes two git branches, runs benchmarks on each, and generates
+a comparison report showing performance differences between them.
+"""
+
+import json
+import argparse
+import subprocess
+import tempfile
+from pathlib import Path
+from typing import Dict, List, Any, Tuple
+
+
+def run_command(cmd: List[str], cwd: Path = None, capture_output: bool = True) -> subprocess.CompletedProcess:
+    """Run a shell command and return the result."""
+    try:
+        result = subprocess.run(cmd, cwd=cwd, capture_output=capture_output, text=True, check=True)
+        return result
+    except subprocess.CalledProcessError as e:
+        print(f"Command failed: {' '.join(cmd)}")
+        print(f"Exit code: {e.returncode}")
+        print(f"Error output: {e.stderr}")
+        raise
+
+
+def get_current_branch() -> str:
+    """Get the current git branch name."""
+    result = run_command(["git", "branch", "--show-current"])
+    return result.stdout.strip()
+
+
+def checkout_branch(branch: str, repo_path: Path = None):
+    """Checkout a git branch."""
+    print(f"Checking out branch: {branch}")
+    run_command(["git", "checkout", branch], cwd=repo_path)
+
+
+def run_benchmarks(output_file: Path, repo_path: Path = None) -> bool:
+    """Run benchmarks and save results to JSON file."""
+    print(f"Running benchmarks, saving to {output_file}")
+
+    # Check if benchmarks directory exists
+    benchmarks_dir = repo_path / "bbot/test/benchmarks" if repo_path else Path("bbot/test/benchmarks")
+    if not benchmarks_dir.exists():
+        print(f"Benchmarks directory not found: {benchmarks_dir}")
+        print("This branch likely doesn't have benchmark tests yet.")
+        return False
+
+    try:
+        cmd = [
+            "poetry",
+            "run",
+            "python",
+            "-m",
+            "pytest",
+            "bbot/test/benchmarks/",
+            "--benchmark-only",
+            f"--benchmark-json={output_file}",
+            "-q",
+        ]
+        run_command(cmd, cwd=repo_path, capture_output=False)
+        return True
+    except subprocess.CalledProcessError:
+        print("Benchmarks failed for current state")
+        return False
+
+
+def load_benchmark_data(filepath: Path) -> Dict[str, Any]:
+    """Load benchmark data from JSON file."""
+    try:
+        with open(filepath, "r") as f:
+            return json.load(f)
+    except FileNotFoundError:
+        print(f"Warning: Benchmark file not found: {filepath}")
+        return {}
+    except json.JSONDecodeError:
+        print(f"Warning: Could not parse JSON from {filepath}")
+        return {}
+
+
+def format_time(seconds: float) -> str:
+    """Format time in human-readable format."""
+    if seconds < 0.000001:  # Less than 1 microsecond
+        return f"{seconds * 1000000000:.0f}ns"  # Show as nanoseconds with no decimal
+    elif seconds < 0.001:  # Less than 1 millisecond
+        return f"{seconds * 1000000:.2f}µs"  # Show as microseconds with 2 decimal places
+    elif seconds < 1:  # Less than 1 second
+        return f"{seconds * 1000:.2f}ms"  # Show as milliseconds with 2 decimal places
+    else:
+        return f"{seconds:.3f}s"  # Show as seconds with 3 decimal places
+
+
+def format_ops(ops: float) -> str:
+    """Format operations per second."""
+    if ops > 1000:
+        return f"{ops / 1000:.1f}K ops/sec"
+    else:
+        return f"{ops:.1f} ops/sec"
+
+
+def calculate_change_percentage(old_value: float, new_value: float) -> Tuple[float, str]:
+    """Calculate percentage change and return emoji indicator."""
+    if old_value == 0:
+        return 0, "🆕"
+
+    change = ((new_value - old_value) / old_value) * 100
+
+    if change > 10:
+        return change, "⚠️"  # Regression (slower)
+    elif change < -10:
+        return change, "🚀"  # Improvement (faster)
+    else:
+        return change, "✅"  # No significant change
+
+
+def generate_benchmark_table(benchmarks: List[Dict[str, Any]], title: str = "Results") -> str:
+    """Generate markdown table for benchmark results."""
+    if not benchmarks:
+        return f"### {title}\nNo benchmark data available.\n"
+
+    table = f"""### {title}
+
+| Test Name | Mean Time | Ops/sec | Min | Max |
+|-----------|-----------|---------|-----|-----|
+"""
+
+    for bench in benchmarks:
+        stats = bench.get("stats", {})
+        name = bench.get("name", "Unknown")
+        # Generic test name cleanup - just remove 'test_' prefix and format nicely
+        test_name = name.replace("test_", "").replace("_", " ").title()
+
+        mean = format_time(stats.get("mean", 0))
+        ops = format_ops(stats.get("ops", 0))
+        min_time = format_time(stats.get("min", 0))
+        max_time = format_time(stats.get("max", 0))
+
+        table += f"| {test_name} | {mean} | {ops} | {min_time} | {max_time} |\n"
+
+    return table + "\n"
+
+
+def generate_comparison_table(current_data: Dict, base_data: Dict, current_branch: str, base_branch: str) -> str:
+    """Generate comparison table between current and base benchmark results."""
+    if not current_data or not base_data:
+        return ""
+
+    current_benchmarks = current_data.get("benchmarks", [])
+    base_benchmarks = base_data.get("benchmarks", [])
+
+    # Create lookup for base benchmarks
+    base_lookup = {bench["name"]: bench for bench in base_benchmarks}
+
+    if not current_benchmarks:
+        return ""
+
+    # Count changes for summary
+    improvements = 0
+    regressions = 0
+    no_change = 0
+
+    table = f"""## 📊 Performance Benchmark Report
+
+> Comparing **`{base_branch}`** (baseline) vs **`{current_branch}`** (current)
+
+<details>
+<summary>📈 <strong>Detailed Results</strong> (All Benchmarks)</summary>
+
+> 📋 **Complete results for all benchmarks** - includes both significant and insignificant changes
+
+| 🧪 Test Name | 📏 Base | 📏 Current | 📈 Change | 🎯 Status |
+|--------------|---------|------------|-----------|-----------|"""
+
+    significant_changes = []
+    performance_summary = []
+
+    for current_bench in current_benchmarks:
+        name = current_bench.get("name", "Unknown")
+        # Generic test name cleanup - just remove 'test_' prefix and format nicely
+        test_name = name.replace("test_", "").replace("_", " ").title()
+
+        current_stats = current_bench.get("stats", {})
+        current_mean = current_stats.get("mean", 0)
+        # For multi-item benchmarks, calculate correct ops/sec
+        if "excavate" in name:
+            current_ops = 100 / current_mean  # 100 segments per test
+        elif "event_validation" in name and "small" in name:
+            current_ops = 100 / current_mean  # 100 targets per test
+        elif "event_validation" in name and "large" in name:
+            current_ops = 1000 / current_mean  # 1000 targets per test
+        elif "make_event" in name and "small" in name:
+            current_ops = 100 / current_mean  # 100 items per test
+        elif "make_event" in name and "large" in name:
+            current_ops = 1000 / current_mean  # 1000 items per test
+        elif "ip" in name:
+            current_ops = 1000 / current_mean  # 1000 IPs per test
+        elif "bloom_filter" in name:
+            if "dns_mutation" in name:
+                current_ops = 2500 / current_mean  # 2500 operations per test
+            else:
+                current_ops = 13000 / current_mean  # 13000 operations per test
+        else:
+            current_ops = 1 / current_mean  # Default: single operation
+
+        base_bench = base_lookup.get(name)
+        if base_bench:
+            base_stats = base_bench.get("stats", {})
+            base_mean = base_stats.get("mean", 0)
+            # For multi-item benchmarks, calculate correct ops/sec
+            if "excavate" in name:
+                base_ops = 100 / base_mean  # 100 segments per test
+            elif "event_validation" in name and "small" in name:
+                base_ops = 100 / base_mean  # 100 targets per test
+            elif "event_validation" in name and "large" in name:
+                base_ops = 1000 / base_mean  # 1000 targets per test
+            elif "make_event" in name and "small" in name:
+                base_ops = 100 / base_mean  # 100 items per test
+            elif "make_event" in name and "large" in name:
+                base_ops = 1000 / base_mean  # 1000 items per test
+            elif "ip" in name:
+                base_ops = 1000 / base_mean  # 1000 IPs per test
+            elif "bloom_filter" in name:
+                if "dns_mutation" in name:
+                    base_ops = 2500 / base_mean  # 2500 operations per test
+                else:
+                    base_ops = 13000 / base_mean  # 13000 operations per test
+            else:
+                base_ops = 1 / base_mean  # Default: single operation
+
+            change_percent, emoji = calculate_change_percentage(base_mean, current_mean)
+
+            # Create visual change indicator
+            if abs(change_percent) > 20:
+                change_bar = "🔴🔴🔴" if change_percent > 0 else "🟢🟢🟢"
+            elif abs(change_percent) > 10:
+                change_bar = "🟡🟡" if change_percent > 0 else "🟢🟢"
+            else:
+                change_bar = "⚪"
+
+            table += f"\n| **{test_name}** | `{format_time(base_mean)}` | `{format_time(current_mean)}` | **{change_percent:+.1f}%** {change_bar} | {emoji} |"
+
+            # Track significant changes
+            if abs(change_percent) > 10:
+                direction = "🐌 slower" if change_percent > 0 else "🚀 faster"
+                significant_changes.append(f"- **{test_name}**: {abs(change_percent):.1f}% {direction}")
+                if change_percent > 0:
+                    regressions += 1
+                else:
+                    improvements += 1
+            else:
+                no_change += 1
+
+            # Add to performance summary
+            ops_change = ((current_ops - base_ops) / base_ops) * 100 if base_ops > 0 else 0
+            performance_summary.append(
+                {
+                    "name": test_name,
+                    "time_change": change_percent,
+                    "ops_change": ops_change,
+                    "current_ops": current_ops,
+                }
+            )
+        else:
+            table += f"\n| **{test_name}** | `-` | `{format_time(current_mean)}` | **New** 🆕 | 🆕 |"
+            significant_changes.append(
+                f"- **{test_name}**: New test 🆕 ({format_time(current_mean)}, {format_ops(current_ops)})"
+            )
+
+    table += "\n\n</details>\n\n"
+
+    # Add performance summary
+    table += "## 🎯 Performance Summary\n\n"
+
+    if improvements > 0 or regressions > 0:
+        table += "```diff\n"
+        if improvements > 0:
+            table += f"+ {improvements} improvement{'s' if improvements != 1 else ''} 🚀\n"
+        if regressions > 0:
+            table += f"! {regressions} regression{'s' if regressions != 1 else ''} ⚠️\n"
+        if no_change > 0:
+            table += f" {no_change} unchanged ✅\n"
+        table += "```\n\n"
+    else:
+        table += "✅ **No significant performance changes detected** (all changes <10%)\n\n"

+    # Add significant changes section
+    if significant_changes:
+        table += "### 🔍 Significant Changes (>10%)\n\n"
+        for change in significant_changes:
+            table += f"{change}\n"
+        table += "\n"
+
+    return table
+
+
+def generate_report(current_data: Dict, base_data: Dict, current_branch: str, base_branch: str) -> str:
+    """Generate complete benchmark comparison report."""
+
+    if not current_data:
+        report = """## 🚀 Performance Benchmark Report
+
+> ⚠️ **No current benchmark data available**
+>
+> This might be because:
+> - Benchmarks failed to run
+> - No benchmark tests found
+> - Dependencies missing
+
+"""
+        return report
+
+    if not base_data:
+        report = f"""## 🚀 Performance Benchmark Report
+
+> ℹ️ **No baseline benchmark data available**
+>
+> Showing current results for **{current_branch}** only.
+
+"""
+        current_benchmarks = current_data.get("benchmarks", [])
+        if current_benchmarks:
+            report += f"""<details>
+<summary>📊 Current Results ({current_branch}) - Click to expand</summary>
+
+{generate_benchmark_table(current_benchmarks, "Results")}
+</details>"""
+    else:
+        # Add comparison
+        comparison = generate_comparison_table(current_data, base_data, current_branch, base_branch)
+        if comparison:
+            report = comparison
+        else:
+            # Fallback if no comparison data
+            report = f"""## 🚀 Performance Benchmark Report
+
+> ℹ️ **No baseline benchmark data available**
+>
+> Showing current results for **{current_branch}** only.
+
+"""
+
+    # Get Python version info
+    machine_info = current_data.get("machine_info", {})
+    python_version = machine_info.get("python_version", "Unknown")
+
+    report += f"\n\n---\n\n🐍 Python Version {python_version}"
+
+    return report
+
+
+def main():
+    parser = argparse.ArgumentParser(description="Compare benchmark performance between git branches")
+    parser.add_argument("--base", required=True, help="Base branch name (e.g., 'main', 'dev')")
+    parser.add_argument("--current", required=True, help="Current branch name (e.g., 'feature-branch', 'HEAD')")
+    parser.add_argument("--output", type=Path, help="Output markdown file (default: stdout)")
+    parser.add_argument("--keep-results", action="store_true", help="Keep intermediate JSON files")
+
+    args = parser.parse_args()
+
+    # Get current working directory
+    repo_path = Path.cwd()
+
+    # Save original branch to restore later
+    try:
+        original_branch = get_current_branch()
+        print(f"Current branch: {original_branch}")
+    except subprocess.CalledProcessError:
+        print("Warning: Could not determine current branch")
+        original_branch = None
+
+    # Create temporary files for benchmark results
+    with tempfile.TemporaryDirectory() as temp_dir:
+        temp_path = Path(temp_dir)
+        base_results_file = temp_path / "base_results.json"
+        current_results_file = temp_path / "current_results.json"
+
+        base_data = {}
+        current_data = {}
+
+        base_data = {}
+        current_data = {}
+
+        try:
+            # Run benchmarks on base branch
+            print(f"\n=== Running benchmarks on base branch: {args.base} ===")
+            checkout_branch(args.base, repo_path)
+            if run_benchmarks(base_results_file, repo_path):
+                base_data = load_benchmark_data(base_results_file)
+
+            # Run benchmarks on current branch
+            print(f"\n=== Running benchmarks on current branch: {args.current} ===")
+            checkout_branch(args.current, repo_path)
+            if run_benchmarks(current_results_file, repo_path):
+                current_data = load_benchmark_data(current_results_file)
+
+            # Generate report
+            print("\n=== Generating comparison report ===")
+            report = generate_report(current_data, base_data, args.current, args.base)
+
+            # Output report
+            if args.output:
+                with open(args.output, "w") as f:
+                    f.write(report)
+                print(f"Report written to {args.output}")
+            else:
+                print("\n" + "=" * 80)
+                print(report)
+
+            # Keep results if requested
+            if args.keep_results:
+                if base_data:
+                    with open("base_benchmark_results.json", "w") as f:
+                        json.dump(base_data, f, indent=2)
+                if current_data:
+                    with open("current_benchmark_results.json", "w") as f:
+                        json.dump(current_data, f, indent=2)
+                print("Benchmark result files saved.")
+
+        finally:
+            # Restore original branch
+            if original_branch:
+                print(f"\nRestoring original branch: {original_branch}")
+                try:
+                    checkout_branch(original_branch, repo_path)
+                except subprocess.CalledProcessError:
+                    print(f"Warning: Could not restore original branch {original_branch}")
+
+
+if __name__ == "__main__":
+    main()
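The script is driven entirely by the argparse flags defined in `main()`, and its ±10% significance threshold lives in `calculate_change_percentage()`. A small sanity-check sketch of those helpers, assuming the script is importable as `bbot.scripts.benchmark_report` (if it isn't packaged that way, run the file directly instead; all values below are made up):

```python
# Typical CLI usage (branch names illustrative):
#   poetry run python bbot/scripts/benchmark_report.py --base dev --current my-feature --output report.md
# Assumption: bbot.scripts is importable as a package; if not, load the file via importlib.
from bbot.scripts.benchmark_report import calculate_change_percentage, format_time

# 0.9ms -> 1.2ms is +33.3%, beyond the +10% threshold, so flagged as a regression
change, emoji = calculate_change_percentage(0.0009, 0.0012)
print(f"{change:+.1f}% {emoji}")  # +33.3% ⚠️

# 2.0ms -> 1.5ms is -25.0%, beyond the -10% threshold, so flagged as an improvement
change, emoji = calculate_change_percentage(0.0020, 0.0015)
print(f"{change:+.1f}% {emoji}")  # -25.0% 🚀

print(format_time(0.0000005))  # 500ns
print(format_time(0.25))       # 250.00ms
```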
bbot/test/benchmarks/__init__.py ADDED
@@ -0,0 +1,2 @@
+# Benchmark tests for BBOT performance monitoring
+# These tests measure performance of critical code paths
bbot/test/benchmarks/test_bloom_filter_benchmarks.py ADDED
@@ -0,0 +1,105 @@
+import pytest
+import string
+import random
+from bbot.scanner import Scanner
+
+
+class TestBloomFilterBenchmarks:
+    """
+    Benchmark tests for Bloom Filter operations.
+
+    These tests measure the performance of bloom filter operations which are
+    critical for DNS brute-forcing efficiency in BBOT.
+    """
+
+    def setup_method(self):
+        """Setup common test data"""
+        self.scan = Scanner()
+
+        # Generate test data of different sizes
+        self.items_small = self._generate_random_strings(1000)  # 1K items
+        self.items_medium = self._generate_random_strings(10000)  # 10K items
+
+    def _generate_random_strings(self, n, length=10):
+        """Generate a list of n random strings."""
+        # Slightly longer strings for testing performance difference
+        length = length + 2  # Make strings 2 chars longer
+        return ["".join(random.choices(string.ascii_letters + string.digits, k=length)) for _ in range(n)]
+
+    @pytest.mark.benchmark(group="bloom_filter_operations")
+    def test_bloom_filter_dns_mutation_tracking_performance(self, benchmark):
+        """Benchmark comprehensive bloom filter operations (add, check, mixed) for DNS brute-forcing"""
+
+        def comprehensive_bloom_operations():
+            bloom_filter = self.scan.helpers.bloom_filter(size=8000000)  # 8M bits
+
+            # Phase 1: Add operations (simulating storing tried DNS mutations)
+            for item in self.items_small:
+                bloom_filter.add(item)
+
+            # Phase 2: Check operations (simulating lookup of existing mutations)
+            found_count = 0
+            for item in self.items_small:
+                if item in bloom_filter:
+                    found_count += 1
+
+            # Phase 3: Mixed operations (realistic DNS brute-force simulation)
+            # Add new items while checking existing ones
+            for i, item in enumerate(self.items_medium[:500]):  # Smaller subset for mixed ops
+                bloom_filter.add(item)
+                # Every few additions, check some existing items
+                if i % 10 == 0:
+                    for check_item in self.items_small[i : i + 5]:
+                        if check_item in bloom_filter:
+                            found_count += 1
+
+            return {
+                "items_added": len(self.items_small) + 500,
+                "items_checked": found_count,
+                "bloom_size": bloom_filter.size,
+            }
+
+        result = benchmark(comprehensive_bloom_operations)
+        assert result["items_added"] > 1000
+        assert result["items_checked"] > 0
+
+    @pytest.mark.benchmark(group="bloom_filter_scalability")
+    def test_bloom_filter_large_scale_dns_brute_force(self, benchmark):
+        """Benchmark bloom filter performance with large-scale DNS brute-force simulation"""
+
+        def large_scale_simulation():
+            bloom_filter = self.scan.helpers.bloom_filter(size=8000000)  # 8M bits
+
+            # Simulate a large DNS brute-force session
+            mutations_tried = 0
+            duplicate_attempts = 0
+
+            # Add all medium dataset (simulating 10K DNS mutations)
+            for item in self.items_medium:
+                bloom_filter.add(item)
+                mutations_tried += 1
+
+            # Simulate checking for duplicates during brute-force
+            for item in self.items_medium[:2000]:  # Check subset for duplicates
+                if item in bloom_filter:
+                    duplicate_attempts += 1
+
+            # Simulate adding more mutations with duplicate checking
+            for item in self.items_small:
+                if item not in bloom_filter:  # Only add if not already tried
+                    bloom_filter.add(item)
+                    mutations_tried += 1
+                else:
+                    duplicate_attempts += 1
+
+            return {
+                "total_mutations_tried": mutations_tried,
+                "duplicates_avoided": duplicate_attempts,
+                "efficiency_ratio": mutations_tried / (mutations_tried + duplicate_attempts)
+                if duplicate_attempts > 0
+                else 1.0,
+            }
+
+        result = benchmark(large_scale_simulation)
+        assert result["total_mutations_tried"] > 10000
+        assert result["efficiency_ratio"] > 0
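Outside the benchmark harness, the same helper can be used directly for duplicate suppression; a minimal sketch of the add/membership pattern these tests exercise (the filter size and hostnames are arbitrary):

```python
from bbot.scanner import Scanner

scan = Scanner()
# Same 8M-bit size the benchmarks use
tried = scan.helpers.bloom_filter(size=8000000)

for mutation in ("dev.example.com", "staging.example.com", "dev.example.com"):
    if mutation in tried:  # bloom lookups can rarely false-positive, never false-negative
        continue  # duplicate, skip it cheaply
    tried.add(mutation)
    print(f"trying {mutation}")
```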
bbot/test/benchmarks/test_closest_match_benchmarks.py ADDED
@@ -0,0 +1,76 @@
+import pytest
+import random
+from bbot.core.helpers.misc import closest_match
+
+
+class TestClosestMatchBenchmarks:
+    """
+    Benchmark tests for closest_match operations.
+
+    This function is critical for BBOT's DNS brute forcing, where it finds the best
+    matching parent event among thousands of choices. Performance here directly impacts
+    scan throughput and DNS mutation efficiency.
+    """
+
+    def setup_method(self):
+        """Setup common test data"""
+        # Set deterministic seed for consistent benchmark results
+        random.seed(42)  # Fixed seed for reproducible results
+
+        # Generate test data for benchmarks
+        self.large_closest_match_choices = self._generate_large_closest_match_choices()
+        self.realistic_closest_match_choices = self._generate_realistic_closest_match_choices()
+
+    def _generate_large_closest_match_choices(self):
+        """Generate large closest match dataset (stress test with many parent events)"""
+        choices = []
+        for i in range(10000):
+            # Generate realistic domain names with more variety
+            tld = random.choice(["com", "net", "org", "io", "co", "dev"])
+            domain = f"subdomain{i}.example{i % 100}.{tld}"
+            choices.append(domain)
+        return choices
+
+    def _generate_realistic_closest_match_choices(self):
+        """Generate realistic closest match parent event choices (like actual BBOT usage)"""
+        choices = []
+
+        # Common TLDs
+        tlds = ["com", "net", "org", "io", "co", "dev", "test", "local"]
+
+        # Generate parent domains with realistic patterns
+        for i in range(5000):
+            # Base domain patterns
+            if i % 10 == 0:
+                # Simple domains
+                domain = f"example{i}.{random.choice(tlds)}"
+            elif i % 5 == 0:
+                # Multi-level domains
+                domain = f"sub{i}.example{i}.{random.choice(tlds)}"
+            else:
+                # Complex domains
+                domain = f"level1{i}.level2{i}.example{i}.{random.choice(tlds)}"
+
+            choices.append(domain)
+
+        return choices
+
+    @pytest.mark.benchmark(group="closest_match")
+    def test_large_closest_match_lookup(self, benchmark):
+        """Benchmark closest_match with large closest match workload (many parent events)"""
+
+        def find_large_closest_match():
+            return closest_match("subdomain5678.example50.com", self.large_closest_match_choices)
+
+        result = benchmark.pedantic(find_large_closest_match, iterations=50, rounds=10)
+        assert result is not None
+
+    @pytest.mark.benchmark(group="closest_match")
+    def test_realistic_closest_match_workload(self, benchmark):
+        """Benchmark closest_match with realistic BBOT closest match parent event choices"""
+
+        def find_realistic_closest_match():
+            return closest_match("subdomain123.example5.com", self.realistic_closest_match_choices)
+
+        result = benchmark.pedantic(find_realistic_closest_match, iterations=50, rounds=10)
+        assert result is not None
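For reference, `closest_match()` takes a query string plus a list of candidate strings and returns the best fuzzy match, which is how these benchmarks call it; a minimal sketch (the domains are illustrative, and the exact similarity backend is an internal detail of the helper):

```python
from bbot.core.helpers.misc import closest_match

choices = ["www.example.com", "dev.example.com", "mail.example.net"]
# A typo'd query still resolves to its nearest candidate
print(closest_match("dev.exmaple.com", choices))  # expected: dev.example.com
```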