PyPI - openhack - Versions diffs - 0.1.0__py3-none-any.whl - Mend

openhack 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113)

openhack/__init__.py +2 -0
openhack/__main__.py +225 -0
openhack/agents/__init__.py +30 -0
openhack/agents/base.py +230 -0
openhack/agents/browser_verifier.py +679 -0
openhack/agents/browser_verifier_swarm.py +256 -0
openhack/agents/checkpoint.py +89 -0
openhack/agents/context_manager.py +356 -0
openhack/agents/coordinator.py +1105 -0
openhack/agents/endpoint_analyst.py +307 -0
openhack/agents/feature_hunter.py +93 -0
openhack/agents/hunter.py +481 -0
openhack/agents/hunter_swarm.py +385 -0
openhack/agents/llm.py +334 -0
openhack/agents/recon.py +19 -0
openhack/agents/sandbox_verifier.py +396 -0
openhack/agents/sandbox_verifier_swarm.py +250 -0
openhack/agents/session.py +286 -0
openhack/agents/validator.py +217 -0
openhack/agents/validator_swarm.py +106 -0
openhack/auth.py +175 -0
openhack/browser/__init__.py +12 -0
openhack/browser/runner.py +385 -0
openhack/categories.py +130 -0
openhack/config.py +201 -0
openhack/deterministic_recon.py +464 -0
openhack/entry_points.py +745 -0
openhack/framework_classifier.py +515 -0
openhack/framework_detection.py +269 -0
openhack/headless_scan.py +179 -0
openhack/prompts/__init__.py +108 -0
openhack/prompts/browser_verifier.py +171 -0
openhack/prompts/coordinator.py +31 -0
openhack/prompts/django/__init__.py +32 -0
openhack/prompts/django/auth_bypass.py +76 -0
openhack/prompts/django/csrf.py +62 -0
openhack/prompts/django/data_exposure.py +67 -0
openhack/prompts/django/idor.py +74 -0
openhack/prompts/django/injection.py +67 -0
openhack/prompts/django/misconfiguration.py +70 -0
openhack/prompts/django/ssrf.py +64 -0
openhack/prompts/endpoint_analyst.py +122 -0
openhack/prompts/express/__init__.py +29 -0
openhack/prompts/express/auth_bypass.py +71 -0
openhack/prompts/express/data_exposure.py +77 -0
openhack/prompts/express/idor.py +69 -0
openhack/prompts/express/injection.py +75 -0
openhack/prompts/express/misconfiguration.py +72 -0
openhack/prompts/express/ssrf.py +63 -0
openhack/prompts/feature_hunter.py +140 -0
openhack/prompts/flask/__init__.py +29 -0
openhack/prompts/flask/auth_bypass.py +86 -0
openhack/prompts/flask/data_exposure.py +78 -0
openhack/prompts/flask/idor.py +83 -0
openhack/prompts/flask/injection.py +77 -0
openhack/prompts/flask/misconfiguration.py +73 -0
openhack/prompts/flask/ssrf.py +65 -0
openhack/prompts/hunter.py +362 -0
openhack/prompts/hunter_continuation_loop.py +12 -0
openhack/prompts/hunter_continuation_no_findings.py +19 -0
openhack/prompts/hunter_continuation_no_progress.py +22 -0
openhack/prompts/hunter_tool_instructions.py +55 -0
openhack/prompts/nextjs/__init__.py +42 -0
openhack/prompts/nextjs/auth_bypass.py +80 -0
openhack/prompts/nextjs/csrf.py +71 -0
openhack/prompts/nextjs/data_exposure.py +88 -0
openhack/prompts/nextjs/idor.py +64 -0
openhack/prompts/nextjs/injection.py +65 -0
openhack/prompts/nextjs/middleware_bypass.py +75 -0
openhack/prompts/nextjs/misconfiguration.py +92 -0
openhack/prompts/nextjs/server_actions.py +97 -0
openhack/prompts/nextjs/ssrf.py +66 -0
openhack/prompts/nextjs/xss.py +69 -0
openhack/prompts/pr_analysis_system.py +80 -0
openhack/prompts/pr_analysis_user.py +11 -0
openhack/prompts/project_context.py +89 -0
openhack/prompts/recon.py +199 -0
openhack/prompts/reporter.py +88 -0
openhack/prompts/researchers.py +434 -0
openhack/prompts/sandbox_verifier.py +128 -0
openhack/prompts/supabase/__init__.py +39 -0
openhack/prompts/supabase/auth_tokens.py +131 -0
openhack/prompts/supabase/edge_functions.py +150 -0
openhack/prompts/supabase/graphql.py +102 -0
openhack/prompts/supabase/postgrest.py +99 -0
openhack/prompts/supabase/realtime.py +93 -0
openhack/prompts/supabase/rls.py +110 -0
openhack/prompts/supabase/rpc_functions.py +127 -0
openhack/prompts/supabase/storage.py +110 -0
openhack/prompts/supabase/tenant_isolation.py +118 -0
openhack/prompts/validator.py +319 -0
openhack/prompts/validator_continuation_incomplete.py +12 -0
openhack/prompts/validator_tool_instructions.py +29 -0
openhack/quality.py +231 -0
openhack/sandbox/__init__.py +12 -0
openhack/sandbox/orchestrator.py +517 -0
openhack/sandbox/runner.py +177 -0
openhack/scan_session.py +245 -0
openhack/setup.py +452 -0
openhack/static_validator.py +612 -0
openhack/tools/__init__.py +1 -0
openhack/tools/ast_tools.py +307 -0
openhack/tools/coverage.py +1078 -0
openhack/tools/filesystem.py +404 -0
openhack/tools/nextjs.py +258 -0
openhack/tools/registry.py +52 -0
openhack/tui.py +3450 -0
openhack/updates.py +170 -0
openhack-0.1.0.dist-info/METADATA +189 -0
openhack-0.1.0.dist-info/RECORD +113 -0
openhack-0.1.0.dist-info/WHEEL +4 -0
openhack-0.1.0.dist-info/entry_points.txt +2 -0
openhack-0.1.0.dist-info/licenses/LICENSE +661 -0

openhack/sandbox/orchestrator.py ADDED

@@ -0,0 +1,517 @@
+"""
+Docker sandbox orchestrator.
+Manages the lifecycle of target applications in isolated Docker containers:
+- Detects docker-compose.yml / Dockerfile in the target repo
+- Builds and starts the application
+- Waits for health check
+- Provides the base URL for exploit execution
+- Tears down containers on completion
+"""
+import asyncio
+import logging
+import shutil
+import time
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Optional
+logger = logging.getLogger(__name__)
+@dataclass
+class SandboxConfig:
+    """Configuration for the sandbox environment.
+    Every field has a default. Fields left at their defaults make
+    SandboxOrchestrator auto-detect the compose file / Dockerfile and pick a
+    free host port.
+    """
+    # How to start the app
+    # NOTE(review): build_command is not referenced by the orchestrator code visible
+    # in this module -- confirm whether anything else consumes it.
+    build_command: Optional[str] = None       # e.g. "docker-compose up --build -d"
+    compose_file: Optional[str] = None        # path to docker-compose.yml relative to target
+    dockerfile: Optional[str] = None          # path to Dockerfile relative to target
+    # Health check
+    # When health_check_url is set it is polled as-is; otherwise the URL is built
+    # from http://localhost:<host port> plus health_check_path.
+    health_check_url: Optional[str] = None    # e.g. "http://localhost:3000/api/health"
+    # Port the app listens on inside the container: used as the container side of
+    # `docker run -p` and to pick which compose port mapping receives the host port.
+    health_check_port: int = 3000
+    health_check_path: str = "/"
+    health_check_timeout: int = 120           # seconds to wait for app to be ready
+    # Environment
+    # Passed to `docker run` as -e flags, or merged into the environment of the
+    # `docker compose up` process.
+    env_vars: dict[str, str] = field(default_factory=dict)
+    # Network isolation
+    # NOTE(review): network_mode is not referenced by the orchestrator code visible
+    # in this module -- confirm whether it is applied elsewhere.
+    network_mode: str = "bridge"              # "bridge" or "none" for full isolation
+    host_port: int = 0                        # 0 = auto-assign
+    # Cleanup
+    # Read by SandboxOrchestrator.__aexit__ to decide whether to call stop().
+    teardown_on_complete: bool = True
+@dataclass
+class SandboxStatus:
+    """Current status of the sandbox.
+    A mutable record that SandboxOrchestrator fills in while starting and
+    resets while stopping.
+    """
+    # True once the health check has passed; reset to False by stop().
+    running: bool = False
+    # "http://localhost:<host_port>" once the containers have been launched.
+    base_url: str = ""
+    # IDs reported by `docker compose ps -q` or printed by `docker run -d`.
+    container_ids: list[str] = field(default_factory=list)
+    # Compose project name; only assigned on the docker-compose start path.
+    project_name: str = ""
+    # time.time() at the moment the sandbox became ready.
+    start_time: float = 0.0
+    # Host port the application is published on.
+    host_port: int = 0
+class SandboxOrchestrator:
+    """Manages Docker sandbox lifecycle for exploit verification."""
+    def __init__(self, target_dir: Path, config: Optional[SandboxConfig] = None):
+        self.target_dir = target_dir.resolve()
+        self.config = config or SandboxConfig()
+        self.status = SandboxStatus()
+        self._project_name = f"openhack-sandbox-{int(time.time())}"
+    async def start(self) -> SandboxStatus:
+        """Start the target application in a Docker sandbox."""
+        logger.info(f"Starting sandbox for {self.target_dir}")
+        # Auto-detect how to start the app
+        compose_file = self._find_compose_file()
+        dockerfile = self._find_dockerfile()
+        if not compose_file and not dockerfile:
+            raise SandboxError(
+                f"No docker-compose.yml or Dockerfile found in {self.target_dir}. "
+                "Cannot start sandbox without containerization config."
+            )
+        # Assign a host port
+        host_port = self.config.host_port or await self._find_free_port()
+        self.status.host_port = host_port
+        try:
+            if compose_file:
+                await self._start_with_compose(compose_file, host_port)
+            else:
+                await self._start_with_dockerfile(dockerfile, host_port)
+        except SandboxError:
+            await self._force_cleanup_network()
+            raise
+        # Wait for health check
+        base_url = f"http://localhost:{host_port}"
+        self.status.base_url = base_url
+        health_url = self.config.health_check_url or f"{base_url}{self.config.health_check_path}"
+        try:
+            await self._wait_for_health(health_url)
+        except SandboxError:
+            self.status.running = True
+            await self.stop()
+            raise
+        self.status.running = True
+        self.status.start_time = time.time()
+        logger.info(f"Sandbox ready at {base_url}")
+        return self.status
+    async def stop(self) -> None:
+        """Tear down the sandbox containers and clean up Docker resources."""
+        if not self.status.running:
+            return
+        logger.info(f"Stopping sandbox {self._project_name}")
+        try:
+            compose_file = self._find_compose_file()
+            if compose_file:
+                cmd = [
+                    "docker", "compose", "-p", self._project_name,
+                    "-f", str(compose_file),
+                ]
+                override = getattr(self, '_override_file', None)
+                if override and override.exists():
+                    cmd.extend(["-f", str(override)])
+                cmd.extend(["down", "-v", "--remove-orphans"])
+                await self._run_command(cmd, timeout=30)
+                # Clean up override file
+                if override and override.exists():
+                    override.unlink()
+            else:
+                for cid in self.status.container_ids:
+                    await self._run_command(
+                        ["docker", "rm", "-f", cid], timeout=15,
+                    )
+        except Exception as e:
+            logger.warning(f"Error during sandbox teardown: {e}")
+            await self._force_cleanup_network()
+        finally:
+            self.status.running = False
+            self.status.container_ids = []
+            logger.info("Sandbox stopped")
+    async def _force_cleanup_network(self) -> None:
+        """Remove the Docker network for this project if it still exists."""
+        network_name = f"{self._project_name}_default"
+        try:
+            await self._run_command(
+                ["docker", "network", "rm", network_name], timeout=10,
+            )
+            logger.info(f"Cleaned up stale network: {network_name}")
+        except Exception:
+            pass
+    async def __aenter__(self):
+        """Start the sandbox on entering ``async with`` and return this orchestrator."""
+        await self.start()
+        return self
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        if self.config.teardown_on_complete:
+            await self.stop()
+    def _find_compose_file(self) -> Optional[Path]:
+        """Find docker-compose file in the target directory."""
+        if self.config.compose_file:
+            path = self.target_dir / self.config.compose_file
+            return path if path.exists() else None
+        for name in ("docker-compose.yml", "docker-compose.yaml", "compose.yml", "compose.yaml"):
+            path = self.target_dir / name
+            if path.exists():
+                return path
+        return None
+    def _find_dockerfile(self) -> Optional[Path]:
+        """Find Dockerfile in the target directory."""
+        if self.config.dockerfile:
+            path = self.target_dir / self.config.dockerfile
+            return path if path.exists() else None
+        path = self.target_dir / "Dockerfile"
+        return path if path.exists() else None
+    async def _find_free_port(self) -> int:
+        """Find a free port on the host."""
+        import socket
+        with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s:
+            s.bind(("", 0))
+            return s.getsockname()[1]
+    async def _start_with_compose(self, compose_file: Path, host_port: int) -> None:
+        """Start the app using docker-compose.
+        Generates an override file that:
+        - Removes hardcoded container_name directives (project name handles naming)
+        - Remaps the app port to an available host port
+        - Remaps any other ports that might conflict
+        """
+        self.status.project_name = self._project_name
+        self._override_file: Optional[Path] = None
+        # Parse compose file to find the app service and generate overrides
+        override = await self._generate_compose_override(compose_file, host_port)
+        env = {**self.config.env_vars, "HOST_PORT": str(host_port)}
+        # Write override file
+        override_path = self.target_dir / f".openhack-sandbox-override-{self._project_name}.yml"
+        override_path.write_text(override)
+        self._override_file = override_path
+        # Build and start with override
+        cmd = [
+            "docker", "compose",
+            "-p", self._project_name,
+            "-f", str(compose_file),
+            "-f", str(override_path),
+            "up", "--build", "-d",
+        ]
+        logger.info(f"Starting with compose (port {host_port}): {' '.join(cmd)}")
+        await self._run_command(cmd, cwd=self.target_dir, env=env, timeout=300)
+        # Get container IDs
+        ps_cmd = [
+            "docker", "compose", "-p", self._project_name,
+            "-f", str(compose_file),
+            "-f", str(override_path),
+            "ps", "-q",
+        ]
+        result = await self._run_command(ps_cmd, cwd=self.target_dir, timeout=10)
+        self.status.container_ids = [
+            cid.strip() for cid in result.stdout.strip().split("\n") if cid.strip()
+        ]
+    async def _generate_compose_override(self, compose_file: Path, host_port: int) -> str:
+        """Generate a docker-compose override that remaps ports and removes container names.
+        Parses the compose file with a simple line-based approach to avoid
+        requiring pyyaml as a dependency.
+        """
+        compose_text = compose_file.read_text()
+        # Extract service names and their port mappings
+        services = self._parse_compose_services(compose_text)
+        override: dict = {"services": {}}
+        for svc_name, svc_info in services.items():
+            svc_override: dict = {}
+            if svc_info.get("container_name"):
+                svc_override["container_name"] = f"{self._project_name}-{svc_name}"
+            ports = svc_info.get("ports", [])
+            if ports:
+                new_ports = []
+                for port_mapping in ports:
+                    if ":" in port_mapping:
+                        parts = port_mapping.strip('"').strip("'").split(":")
+                        container_port = parts[-1]
+                        if container_port == str(self.config.health_check_port):
+                            new_ports.append(f"{host_port}:{container_port}")
+                        else:
+                            free = await self._find_free_port()
+                            new_ports.append(f"{free}:{container_port}")
+                    else:
+                        new_ports.append(port_mapping)
+                svc_override["ports"] = new_ports
+            if svc_override:
+                override["services"][svc_name] = svc_override
+        return self._dict_to_yaml(override, override_lists=True)
+    @staticmethod
+    def _parse_compose_services(text: str) -> dict:
+        """Minimally parse a docker-compose file to extract service info.
+        Returns {service_name: {"container_name": str|None, "ports": [str]}}.
+        """
+        services = {}
+        current_service = None
+        in_services = False
+        in_ports = False
+        services_indent = None
+        service_indent = None
+        prop_indent = None
+        for line in text.splitlines():
+            stripped = line.strip()
+            if not stripped or stripped.startswith("#"):
+                continue
+            indent = len(line) - len(line.lstrip())
+            # Find the top-level "services:" key
+            if stripped == "services:" and indent == 0:
+                in_services = True
+                services_indent = indent
+                continue
+            # Exited services block
+            if in_services and indent == 0 and stripped and not stripped.startswith("-"):
+                in_services = False
+                current_service = None
+                continue
+            if not in_services:
+                continue
+            # Service name: first level of indent under services (typically 2 spaces)
+            if stripped.endswith(":") and ":" not in stripped[:-1]:
+                if service_indent is None or indent <= service_indent:
+                    name = stripped.rstrip(":")
+                    current_service = name
+                    service_indent = indent
+                    services[current_service] = {"container_name": None, "ports": []}
+                    in_ports = False
+                    prop_indent = None
+                    continue
+            if current_service is None:
+                continue
+            # Service properties are one level deeper than service name
+            if prop_indent is None and indent > service_indent:
+                prop_indent = indent
+            # If we're back to service-level indent, it's a new service
+            if indent <= service_indent and stripped.endswith(":") and ":" not in stripped[:-1]:
+                name = stripped.rstrip(":")
+                current_service = name
+                services[current_service] = {"container_name": None, "ports": []}
+                in_ports = False
+                prop_indent = None
+                continue
+            if prop_indent is not None and indent == prop_indent:
+                in_ports = False
+                if stripped.startswith("container_name:"):
+                    val = stripped.split(":", 1)[1].strip().strip('"').strip("'")
+                    services[current_service]["container_name"] = val
+                elif stripped == "ports:":
+                    in_ports = True
+            elif in_ports and stripped.startswith("-"):
+                port = stripped.lstrip("- ").strip('"').strip("'")
+                services[current_service]["ports"].append(port)
+        return services
+    @staticmethod
+    def _dict_to_yaml(d: dict, indent: int = 0, override_lists: bool = False) -> str:
+        """Minimal dict-to-YAML serializer (avoids pyyaml dependency).
+        When override_lists=True, list keys emit `!override` so Docker Compose
+        replaces the base list instead of merging into it.
+        """
+        lines = []
+        prefix = "  " * indent
+        for key, val in d.items():
+            if isinstance(val, dict):
+                lines.append(f"{prefix}{key}:")
+                lines.append(SandboxOrchestrator._dict_to_yaml(val, indent + 1, override_lists))
+            elif isinstance(val, list):
+                tag = " !override" if override_lists else ""
+                lines.append(f"{prefix}{key}:{tag}")
+                for item in val:
+                    if isinstance(item, dict):
+                        items = list(item.items())
+                        first_key, first_val = items[0]
+                        lines.append(f"{prefix}  - {first_key}: {first_val}")
+                        for k, v in items[1:]:
+                            lines.append(f"{prefix}    {k}: {v}")
+                    else:
+                        lines.append(f"{prefix}  - \"{item}\"" if isinstance(item, str) else f"{prefix}  - {item}")
+            else:
+                if isinstance(val, str):
+                    lines.append(f"{prefix}{key}: \"{val}\"")
+                else:
+                    lines.append(f"{prefix}{key}: {val}")
+        return "\n".join(lines)
+    async def _start_with_dockerfile(self, dockerfile: Path, host_port: int) -> None:
+        """Start the app by building a Dockerfile and running the container."""
+        image_name = f"openhack-sandbox:{self._project_name}"
+        # Build
+        build_cmd = [
+            "docker", "build",
+            "-t", image_name,
+            "-f", str(dockerfile),
+            str(self.target_dir),
+        ]
+        logger.info(f"Building image: {image_name}")
+        await self._run_command(build_cmd, timeout=300)
+        # Run
+        app_port = self.config.health_check_port
+        run_cmd = [
+            "docker", "run", "-d",
+            "--name", self._project_name,
+            "-p", f"{host_port}:{app_port}",
+        ]
+        for k, v in self.config.env_vars.items():
+            run_cmd.extend(["-e", f"{k}={v}"])
+        run_cmd.append(image_name)
+        logger.info(f"Running container: {self._project_name}")
+        result = await self._run_command(run_cmd, timeout=30)
+        container_id = result.stdout.strip()
+        self.status.container_ids = [container_id]
+    async def _wait_for_health(self, health_url: str) -> None:
+        """Poll the health check URL until the app is ready."""
+        import aiohttp
+        timeout = self.config.health_check_timeout
+        start = time.time()
+        last_error = None
+        logger.info(f"Waiting for health check: {health_url} (timeout: {timeout}s)")
+        while time.time() - start < timeout:
+            try:
+                async with aiohttp.ClientSession() as session:
+                    async with session.get(health_url, timeout=aiohttp.ClientTimeout(total=5)) as resp:
+                        if resp.status < 500:
+                            elapsed = time.time() - start
+                            logger.info(f"Health check passed (status {resp.status}) in {elapsed:.1f}s")
+                            return
+                        last_error = f"HTTP {resp.status}"
+            except Exception as e:
+                last_error = str(e)
+            await asyncio.sleep(2)
+        # Pull the last few lines of container logs so the error surfaces
+        # *why* the app failed (Prisma schema missing, port conflict, etc.)
+        # instead of just "HTTP 500".
+        tail_logs = ""
+        try:
+            tail_logs = await self.get_logs(tail=40)
+        except Exception:
+            pass
+        log_snippet = (
+            "\n— Recent container logs —\n" + tail_logs.strip()[-2000:]
+            if tail_logs.strip() else ""
+        )
+        raise SandboxError(
+            f"Health check failed after {timeout}s. "
+            f"URL: {health_url}, last error: {last_error}{log_snippet}"
+        )
+    async def get_logs(self, tail: int = 100) -> str:
+        """Get container logs for debugging."""
+        logs = []
+        for cid in self.status.container_ids:
+            try:
+                result = await self._run_command(
+                    ["docker", "logs", "--tail", str(tail), cid], timeout=10,
+                )
+                logs.append(f"=== Container {cid[:12]} ===\n{result.stdout}")
+                if result.stderr:
+                    logs.append(f"STDERR:\n{result.stderr}")
+            except Exception as e:
+                logs.append(f"=== Container {cid[:12]} === ERROR: {e}")
+        return "\n".join(logs)
+    @staticmethod
+    async def _run_command(
+        cmd: list[str],
+        cwd: Optional[Path] = None,
+        env: Optional[dict] = None,
+        timeout: int = 60,
+    ) -> asyncio.subprocess.Process:
+        """Run a shell command asynchronously."""
+        import os
+        full_env = {**os.environ, **(env or {})}
+        proc = await asyncio.create_subprocess_exec(
+            *cmd,
+            stdout=asyncio.subprocess.PIPE,
+            stderr=asyncio.subprocess.PIPE,
+            cwd=cwd,
+            env=full_env,
+        )
+        try:
+            stdout, stderr = await asyncio.wait_for(proc.communicate(), timeout=timeout)
+        except asyncio.TimeoutError:
+            proc.kill()
+            await proc.communicate()
+            raise SandboxError(f"Command timed out after {timeout}s: {' '.join(cmd)}")
+        proc.stdout = stdout.decode() if stdout else ""
+        proc.stderr = stderr.decode() if stderr else ""
+        if proc.returncode != 0:
+            raise SandboxError(
+                f"Command failed (exit {proc.returncode}): {' '.join(cmd)}\n"
+                f"STDERR: {proc.stderr[:2000]}"
+            )
+        return proc
+class SandboxError(Exception):
+    """Raised when sandbox operations fail."""
+    pass

openhack/sandbox/runner.py ADDED

@@ -0,0 +1,177 @@
+"""
+Exploit runner for sandbox verification.
+Executes HTTP requests and scripts against a running sandboxed application.
+Returns full response details so the agent can analyze whether the exploit worked.
+"""
+import asyncio
+import json
+import logging
+import time
+from dataclasses import dataclass, field
+from typing import Any, Optional
+import aiohttp
+logger = logging.getLogger(__name__)
+@dataclass
+class ExploitResult:
+    """Result of an exploit attempt."""
+    success: bool
+    status_code: Optional[int] = None
+    headers: dict[str, str] = field(default_factory=dict)
+    body: str = ""
+    elapsed_ms: float = 0.0
+    error: Optional[str] = None
+    attempt: int = 1
+    def to_dict(self) -> dict:
+        d = {
+            "success": self.success,
+            "status_code": self.status_code,
+            "elapsed_ms": round(self.elapsed_ms, 1),
+            "attempt": self.attempt,
+        }
+        if self.headers:
+            # Only include security-relevant headers
+            relevant = {}
+            for k, v in self.headers.items():
+                kl = k.lower()
+                if kl in (
+                    "content-type", "set-cookie", "location",
+                    "x-powered-by", "server", "access-control-allow-origin",
+                    "www-authenticate", "x-frame-options",
+                    "content-security-policy", "x-content-type-options",
+                ):
+                    relevant[k] = v
+            d["headers"] = relevant
+        if self.body:
+            d["body"] = self.body[:5000]  # Cap body size for context window
+        if self.error:
+            d["error"] = self.error
+        return d
+class ExploitRunner:
+    """Executes exploit requests against a sandboxed application."""
+    def __init__(self, base_url: str, timeout: int = 30):
+        self.base_url = base_url.rstrip("/")
+        self.timeout = aiohttp.ClientTimeout(total=timeout)
+        self._session: Optional[aiohttp.ClientSession] = None
+    async def __aenter__(self):
+        """Open the HTTP session on entering ``async with`` and return this runner."""
+        self._session = aiohttp.ClientSession(timeout=self.timeout)
+        return self
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        if self._session:
+            await self._session.close()
+    async def execute_request(
+        self,
+        method: str,
+        path: str,
+        headers: Optional[dict[str, str]] = None,
+        body: Optional[str] = None,
+        json_body: Optional[dict] = None,
+        follow_redirects: bool = False,
+        attempt: int = 1,
+    ) -> ExploitResult:
+        """Execute a single HTTP request against the sandbox."""
+        url = f"{self.base_url}{path}" if path.startswith("/") else path
+        if not self._session:
+            self._session = aiohttp.ClientSession(timeout=self.timeout)
+        start = time.time()
+        try:
+            kwargs: dict[str, Any] = {
+                "method": method.upper(),
+                "url": url,
+                "headers": headers or {},
+                "allow_redirects": follow_redirects,
+            }
+            if json_body is not None:
+                kwargs["json"] = json_body
+            elif body is not None:
+                kwargs["data"] = body
+            async with self._session.request(**kwargs) as resp:
+                elapsed = (time.time() - start) * 1000
+                resp_body = await resp.text()
+                resp_headers = dict(resp.headers)
+                return ExploitResult(
+                    success=True,
+                    status_code=resp.status,
+                    headers=resp_headers,
+                    body=resp_body,
+                    elapsed_ms=elapsed,
+                    attempt=attempt,
+                )
+        except asyncio.TimeoutError:
+            return ExploitResult(
+                success=False,
+                error=f"Request timed out after {self.timeout.total}s",
+                elapsed_ms=(time.time() - start) * 1000,
+                attempt=attempt,
+            )
+        except aiohttp.ClientError as e:
+            return ExploitResult(
+                success=False,
+                error=f"Connection error: {str(e)}",
+                elapsed_ms=(time.time() - start) * 1000,
+                attempt=attempt,
+            )
+        except Exception as e:
+            return ExploitResult(
+                success=False,
+                error=f"Unexpected error: {str(e)}",
+                elapsed_ms=(time.time() - start) * 1000,
+                attempt=attempt,
+            )
+    async def execute_multi_step(
+        self,
+        steps: list[dict],
+    ) -> list[ExploitResult]:
+        """Execute a sequence of requests (for multi-step exploits).
+        Each step is a dict with: method, path, headers, body/json_body.
+        Later steps can reference earlier responses via {step_N_body} placeholders.
+        """
+        results: list[ExploitResult] = []
+        for i, step in enumerate(steps):
+            # Substitute placeholders from previous results
+            step_str = json.dumps(step)
+            for j, prev in enumerate(results):
+                placeholder = f"{{step_{j}_body}}"
+                if placeholder in step_str:
+                    escaped = json.dumps(prev.body)[1:-1]  # Remove outer quotes
+                    step_str = step_str.replace(placeholder, escaped)
+            step = json.loads(step_str)
+            result = await self.execute_request(
+                method=step.get("method", "GET"),
+                path=step.get("path", "/"),
+                headers=step.get("headers"),
+                body=step.get("body"),
+                json_body=step.get("json_body"),
+                follow_redirects=step.get("follow_redirects", False),
+                attempt=i + 1,
+            )
+            results.append(result)
+            # If a step fails at the connection level, stop the chain
+            if not result.success:
+                break
+        return results