PyPI - openhack - Versions diffs - 0.1.0__py3-none-any.whl - Mend

openhack 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113) hide show

openhack/__init__.py +2 -0
openhack/__main__.py +225 -0
openhack/agents/__init__.py +30 -0
openhack/agents/base.py +230 -0
openhack/agents/browser_verifier.py +679 -0
openhack/agents/browser_verifier_swarm.py +256 -0
openhack/agents/checkpoint.py +89 -0
openhack/agents/context_manager.py +356 -0
openhack/agents/coordinator.py +1105 -0
openhack/agents/endpoint_analyst.py +307 -0
openhack/agents/feature_hunter.py +93 -0
openhack/agents/hunter.py +481 -0
openhack/agents/hunter_swarm.py +385 -0
openhack/agents/llm.py +334 -0
openhack/agents/recon.py +19 -0
openhack/agents/sandbox_verifier.py +396 -0
openhack/agents/sandbox_verifier_swarm.py +250 -0
openhack/agents/session.py +286 -0
openhack/agents/validator.py +217 -0
openhack/agents/validator_swarm.py +106 -0
openhack/auth.py +175 -0
openhack/browser/__init__.py +12 -0
openhack/browser/runner.py +385 -0
openhack/categories.py +130 -0
openhack/config.py +201 -0
openhack/deterministic_recon.py +464 -0
openhack/entry_points.py +745 -0
openhack/framework_classifier.py +515 -0
openhack/framework_detection.py +269 -0
openhack/headless_scan.py +179 -0
openhack/prompts/__init__.py +108 -0
openhack/prompts/browser_verifier.py +171 -0
openhack/prompts/coordinator.py +31 -0
openhack/prompts/django/__init__.py +32 -0
openhack/prompts/django/auth_bypass.py +76 -0
openhack/prompts/django/csrf.py +62 -0
openhack/prompts/django/data_exposure.py +67 -0
openhack/prompts/django/idor.py +74 -0
openhack/prompts/django/injection.py +67 -0
openhack/prompts/django/misconfiguration.py +70 -0
openhack/prompts/django/ssrf.py +64 -0
openhack/prompts/endpoint_analyst.py +122 -0
openhack/prompts/express/__init__.py +29 -0
openhack/prompts/express/auth_bypass.py +71 -0
openhack/prompts/express/data_exposure.py +77 -0
openhack/prompts/express/idor.py +69 -0
openhack/prompts/express/injection.py +75 -0
openhack/prompts/express/misconfiguration.py +72 -0
openhack/prompts/express/ssrf.py +63 -0
openhack/prompts/feature_hunter.py +140 -0
openhack/prompts/flask/__init__.py +29 -0
openhack/prompts/flask/auth_bypass.py +86 -0
openhack/prompts/flask/data_exposure.py +78 -0
openhack/prompts/flask/idor.py +83 -0
openhack/prompts/flask/injection.py +77 -0
openhack/prompts/flask/misconfiguration.py +73 -0
openhack/prompts/flask/ssrf.py +65 -0
openhack/prompts/hunter.py +362 -0
openhack/prompts/hunter_continuation_loop.py +12 -0
openhack/prompts/hunter_continuation_no_findings.py +19 -0
openhack/prompts/hunter_continuation_no_progress.py +22 -0
openhack/prompts/hunter_tool_instructions.py +55 -0
openhack/prompts/nextjs/__init__.py +42 -0
openhack/prompts/nextjs/auth_bypass.py +80 -0
openhack/prompts/nextjs/csrf.py +71 -0
openhack/prompts/nextjs/data_exposure.py +88 -0
openhack/prompts/nextjs/idor.py +64 -0
openhack/prompts/nextjs/injection.py +65 -0
openhack/prompts/nextjs/middleware_bypass.py +75 -0
openhack/prompts/nextjs/misconfiguration.py +92 -0
openhack/prompts/nextjs/server_actions.py +97 -0
openhack/prompts/nextjs/ssrf.py +66 -0
openhack/prompts/nextjs/xss.py +69 -0
openhack/prompts/pr_analysis_system.py +80 -0
openhack/prompts/pr_analysis_user.py +11 -0
openhack/prompts/project_context.py +89 -0
openhack/prompts/recon.py +199 -0
openhack/prompts/reporter.py +88 -0
openhack/prompts/researchers.py +434 -0
openhack/prompts/sandbox_verifier.py +128 -0
openhack/prompts/supabase/__init__.py +39 -0
openhack/prompts/supabase/auth_tokens.py +131 -0
openhack/prompts/supabase/edge_functions.py +150 -0
openhack/prompts/supabase/graphql.py +102 -0
openhack/prompts/supabase/postgrest.py +99 -0
openhack/prompts/supabase/realtime.py +93 -0
openhack/prompts/supabase/rls.py +110 -0
openhack/prompts/supabase/rpc_functions.py +127 -0
openhack/prompts/supabase/storage.py +110 -0
openhack/prompts/supabase/tenant_isolation.py +118 -0
openhack/prompts/validator.py +319 -0
openhack/prompts/validator_continuation_incomplete.py +12 -0
openhack/prompts/validator_tool_instructions.py +29 -0
openhack/quality.py +231 -0
openhack/sandbox/__init__.py +12 -0
openhack/sandbox/orchestrator.py +517 -0
openhack/sandbox/runner.py +177 -0
openhack/scan_session.py +245 -0
openhack/setup.py +452 -0
openhack/static_validator.py +612 -0
openhack/tools/__init__.py +1 -0
openhack/tools/ast_tools.py +307 -0
openhack/tools/coverage.py +1078 -0
openhack/tools/filesystem.py +404 -0
openhack/tools/nextjs.py +258 -0
openhack/tools/registry.py +52 -0
openhack/tui.py +3450 -0
openhack/updates.py +170 -0
openhack-0.1.0.dist-info/METADATA +189 -0
openhack-0.1.0.dist-info/RECORD +113 -0
openhack-0.1.0.dist-info/WHEEL +4 -0
openhack-0.1.0.dist-info/entry_points.txt +2 -0
openhack-0.1.0.dist-info/licenses/LICENSE +661 -0

openhack/categories.py ADDED Viewed

@@ -0,0 +1,130 @@
+"""
+Canonical vulnerability categories.
+Every finding reported by the scanner MUST use one of these exact category
+strings.  This eliminates the cross-scan drift where the LLM invents
+slightly different labels for the same vulnerability class.
+The `normalize_category` function maps freeform LLM output to the closest
+canonical category using keyword matching.
+"""
+from __future__ import annotations
+# Closed vocabulary of finding categories. normalize_category() resolves
+# freeform labels to one of these exact strings whenever it can.
+CATEGORIES: list[str] = [
+    "SQL Injection",
+    "Command Injection",
+    "XSS",
+    "SSRF",
+    "Open Redirect",
+    "Path Traversal",
+    "IDOR",
+    "Authentication Bypass",
+    "Authorization Bypass",
+    "CSRF",
+    "Data Exposure",
+    "Information Disclosure",
+    "Hardcoded Secret",
+    "Security Misconfiguration",
+    "Missing RLS",
+    "RPC Function Abuse",
+    "Storage Misconfiguration",
+    "Mass Assignment",
+    "Business Logic Flaw",
+    "Denial of Service",
+    "RCE",
+]
+# Case-insensitive lookup table: lowercased canonical name -> canonical spelling.
+_CANONICAL_LOWER: dict[str, str] = {c.lower(): c for c in CATEGORIES}
+_KEYWORD_MAP: list[tuple[set[str], str]] = [
+    ({"sqli", "sql injection", "sql inject"}, "SQL Injection"),
+    ({"command injection", "command inject", "child_process", "exec injection", "rce", "remote code"}, "RCE"),
+    ({"xss", "cross-site scripting", "cross site scripting", "dangerouslysetinnerhtml", "innerhtml"}, "XSS"),
+    ({"ssrf", "server-side request", "server side request"}, "SSRF"),
+    ({"open redirect", "redirect", "returnto", "redirectto", "callbackurl"}, "Open Redirect"),
+    ({"path traversal", "directory traversal", "lfi", "local file inclusion"}, "Path Traversal"),
+    ({"idor", "insecure direct object", "broken object level"}, "IDOR"),
+    ({"authentication bypass", "auth bypass", "broken authentication"}, "Authentication Bypass"),
+    ({"authorization bypass", "broken access", "missing authorization", "privilege escalation", "access control"}, "Authorization Bypass"),
+    ({"csrf", "cross-site request forgery", "cross site request forgery"}, "CSRF"),
+    ({"missing rls", "row level security", "rls policy", "cross-tenant", "tenant isolation", "missing delete policy"}, "Missing RLS"),
+    ({"data exposure", "data leak", "pii exposure", "sensitive data", "token exposure",
+      "credential exposure", "plaintext", "write access"}, "Data Exposure"),
+    ({"information disclosure", "info disclosure", "verbose error", "error message", "stack trace"}, "Information Disclosure"),
+    ({"hardcoded secret", "hardcoded credential", "hardcoded key", "hardcoded password", "embedded secret"}, "Hardcoded Secret"),
+    ({"misconfiguration", "security header", "cors", "missing header", "insecure config",
+      "insecure documentation", "auth misconfiguration"}, "Security Misconfiguration"),
+    ({"rpc function", "rpc abuse", "security definer"}, "RPC Function Abuse"),
+    ({"storage misconfiguration", "storage bucket", "storage policy", "public bucket", "insecure storage"}, "Storage Misconfiguration"),
+    ({"mass assignment", "over-posting", "parameter pollution"}, "Mass Assignment"),
+    ({"business logic", "logic flaw", "logic error", "race condition",
+      "broken functionality"}, "Business Logic Flaw"),
+    ({"denial of service", "dos", "redos", "resource exhaustion",
+      "rate limit", "missing rate"}, "Denial of Service"),
+]
+# Default severity per canonical category.  normalize_severity() uses it as a
+# floor: a finding reported below its category's default is raised to it.
+CATEGORY_SEVERITY: dict[str, str] = {
+    "SQL Injection":            "critical",
+    "Command Injection":        "critical",
+    "RCE":                      "critical",
+    "Authentication Bypass":   "critical",
+    "Missing RLS":              "critical",
+    "SSRF":                     "high",
+    "Path Traversal":           "high",
+    "IDOR":                     "high",
+    "Authorization Bypass":     "high",
+    "Hardcoded Secret":         "high",
+    "Data Exposure":            "high",
+    "RPC Function Abuse":       "high",
+    "Storage Misconfiguration": "high",
+    "Open Redirect":            "medium",
+    "XSS":                      "medium",
+    "CSRF":                     "medium",
+    "Mass Assignment":          "medium",
+    "Business Logic Flaw":      "medium",
+    "Denial of Service":        "medium",
+    "Information Disclosure":   "low",
+    "Security Misconfiguration":"medium",
+}
+def normalize_severity(
+    findings: list[dict],
+    *,
+    use_category_default: bool = True,
+) -> list[dict]:
+    SEVERITY_ORDER = {"critical": 0, "high": 1, "medium": 2, "low": 3, "info": 4}
+    SEVERITY_NAMES = {v: k for k, v in SEVERITY_ORDER.items()}
+    out = [dict(f) for f in findings]
+    for i, f in enumerate(out):
+        canonical = normalize_category(f.get("category", ""))
+        current = SEVERITY_ORDER.get((f.get("severity") or "info").lower(), 4)
+        if use_category_default:
+            default_sev = SEVERITY_ORDER.get(
+                CATEGORY_SEVERITY.get(canonical, "medium").lower(), 2
+            )
+            if current > default_sev:
+                out[i]["severity"] = SEVERITY_NAMES[default_sev]
+    return out
+def normalize_category(raw: str) -> str:
+    if not raw:
+        return "Security Misconfiguration"
+    lower = raw.strip().lower()
+    if lower in _CANONICAL_LOWER:
+        return _CANONICAL_LOWER[lower]
+    for keywords, canonical in _KEYWORD_MAP:
+        for kw in keywords:
+            if kw in lower:
+                return canonical
+    return raw.strip().title()

openhack/config.py ADDED Viewed

@@ -0,0 +1,201 @@
+import json
+import os
+from pathlib import Path
+from typing import Optional
+from pydantic_settings import BaseSettings, SettingsConfigDict
+# Per-user configuration directory and the JSON file stored inside it.
+CONFIG_DIR = Path.home() / ".openhack"
+CONFIG_PATH = CONFIG_DIR / "config"
+# Provider name -> name of the Settings field holding its API key
+# (presumably; not referenced elsewhere in this module).
+_PROVIDER_KEY_FIELDS = {
+    "openhack": "openhack_api_key",
+}
+def _dotenv_nonempty_keys(path: Path) -> set[str]:
+    """Return uppercase keys with non-empty values from a dotenv file."""
+    keys: set[str] = set()
+    if not path.exists():
+        return keys
+    try:
+        for raw_line in path.read_text().splitlines():
+            line = raw_line.strip()
+            if not line or line.startswith("#"):
+                continue
+            if line.startswith("export "):
+                line = line[len("export "):].strip()
+            if "=" not in line:
+                continue
+            key, val = line.split("=", 1)
+            key = key.strip()
+            val = val.strip().strip('"').strip("'")
+            if key and val != "":
+                keys.add(key.upper())
+    except OSError:
+        return set()
+    return keys
+def load_user_config() -> dict:
+    """Load persistent config from ~/.openhack/config."""
+    if CONFIG_PATH.exists():
+        try:
+            return json.loads(CONFIG_PATH.read_text())
+        except (json.JSONDecodeError, OSError):
+            return {}
+    return {}
+def save_user_config(data: dict) -> None:
+    """Save persistent config to ~/.openhack/config."""
+    CONFIG_DIR.mkdir(parents=True, exist_ok=True)
+    try:
+        os.chmod(CONFIG_DIR, 0o700)
+    except OSError:
+        pass
+    existing = load_user_config()
+    existing.update(data)
+    CONFIG_PATH.write_text(json.dumps(existing, indent=2) + "\n")
+    # Config now holds long-lived bearer tokens; restrict to owner-only read/write.
+    try:
+        os.chmod(CONFIG_PATH, 0o600)
+    except OSError:
+        pass
+def resolve_provider(name: str) -> str:
+    """Normalize provider name.
+
+    Currently an identity function: *name* is returned unchanged.
+    """
+    return name
+# Default endpoints.  Settings.model_post_init picks the DEV_* pair when
+# openhack_dev is true and the PROD_* pair otherwise, for any URL left blank.
+PROD_APP_URL = "https://app.openhack.com"
+PROD_BASE_URL = "https://api.openhack.com/v1"
+DEV_APP_URL = "http://localhost:9080"
+DEV_BASE_URL = "http://localhost:8787/v1"
+class Settings(BaseSettings):
+    """Minimal settings for the standalone scanner.
+
+    Field values are populated by pydantic-settings, configured here to
+    read a local ``.env`` file as UTF-8 with case-insensitive names.  Blank
+    ``openhack_app_url`` / ``openhack_base_url`` values are filled in by
+    ``model_post_init`` from the dev or prod URL constants.
+    """
+    # Set OPENHACK_DEV=1 to point both URLs at local dev (Next.js app on :9080,
+    # wrangler dev inference on :8787) instead of production.
+    openhack_dev: bool = False
+    # Provider, credentials and endpoints.  Empty URL strings mean "use the
+    # default for the current mode" (resolved in model_post_init).
+    llm_provider: str = "openhack"
+    openhack_api_key: Optional[str] = None
+    openhack_base_url: str = ""
+    openhack_app_url: str = ""
+    openhack_model_id: str = "kimi-k2.5"
+    # Organisation / user identity fields.
+    openhack_org_id: Optional[str] = None
+    openhack_org_slug: Optional[str] = None
+    openhack_org_name: Optional[str] = None
+    openhack_user_email: Optional[str] = None
+    openhack_user_first_name: Optional[str] = None
+    openhack_user_last_name: Optional[str] = None
+    # HTTP client tuning (timeouts presumably in seconds; confirm at use site).
+    openhack_read_timeout: int = 600
+    openhack_connect_timeout: int = 30
+    openhack_max_retries: int = 5
+    # Optional per-agent model ids; None presumably falls back to
+    # openhack_model_id (fallback logic is not in this module).
+    recon_model_id: Optional[str] = None
+    hunter_model_id: Optional[str] = None
+    validator_model_id: Optional[str] = None
+    browser_verifier_model_id: Optional[str] = None
+    # Agent concurrency and context-handling knobs.
+    max_concurrent_hunters: int = 3
+    max_concurrent_validators: int = 5
+    compaction_threshold: float = 0.70
+    tool_result_max_lines: int = 200
+    checkpoint_enabled: bool = True
+    # Scan scoping — exclude paths that are never production web attack surface
+    scan_exclude_patterns: list[str] = [
+        "**/test/**", "**/tests/**", "**/__tests__/**", "**/spec/**",
+        "**/__mocks__/**", "**/fixtures/**", "**/__fixtures__/**",
+        "**/e2e/**", "**/cypress/**", "**/playwright/**",
+        "**/cli/**", "**/CLI/**",
+        "**/docs/**", "**/documentation/**",
+        "**/examples/**", "**/example/**", "**/samples/**", "**/demo/**", "**/demos/**",
+        "**/tutorial/**", "**/tutorials/**", "**/playground/**", "**/sandbox/**",
+        "**/mock/**", "**/mocks/**", "**/stub/**", "**/stubs/**",
+        "**/scripts/**", "**/tools/**", "**/devtools/**",
+        "**/benchmarks/**", "**/benchmark/**",
+        "**/integration-tests/**",
+        "**/*.test.*", "**/*.spec.*", "**/test_*",
+        "**/conftest.py", "**/jest.config.*", "**/vitest.config.*",
+        "**/.storybook/**", "**/stories/**",
+    ]
+    # Feature deep dive
+    feature_hunt_enabled: bool = True
+    max_feature_hunters: int = 7
+    feature_hunter_max_iterations: int = 75
+    max_concurrent_feature_hunters: int = 2
+    feature_hunter_model_id: Optional[str] = None
+    # Sandbox verification
+    sandbox_enabled: bool = False
+    sandbox_max_exploit_attempts: int = 7
+    sandbox_health_check_timeout: int = 120
+    sandbox_health_check_path: str = "/"
+    sandbox_teardown_on_complete: bool = True
+    # Browser verification
+    browser_verification_enabled: bool = False
+    browser_headless: bool = True
+    browser_max_exploit_attempts: int = 7
+    browser_timeout_ms: int = 30000
+    model_config = SettingsConfigDict(
+        env_file=".env",
+        env_file_encoding="utf-8",
+        case_sensitive=False,
+    )
+    def model_post_init(self, __context) -> None:
+        """Fill blank app/base URLs with the dev or prod default."""
+        # An explicitly configured (non-empty) URL always wins over openhack_dev.
+        if not self.openhack_app_url:
+            self.openhack_app_url = DEV_APP_URL if self.openhack_dev else PROD_APP_URL
+        if not self.openhack_base_url:
+            self.openhack_base_url = DEV_BASE_URL if self.openhack_dev else PROD_BASE_URL
+def _build_settings() -> Settings:
+    """Build Settings, overlaying ~/.openhack/config values as env-like overrides."""
+    user_cfg = load_user_config()
+    env_overrides = {}
+    for key, val in user_cfg.items():
+        if val is not None and val != "":
+            env_overrides[key.upper()] = str(val)
+    dotenv_keys = _dotenv_nonempty_keys(Path(".env"))
+    old_env = {}
+    for k, v in env_overrides.items():
+        # Respect explicit non-empty environment variables, but allow persisted
+        # config to fill missing or blank values. Also let .env values win.
+        current = os.environ.get(k)
+        if (current is None or current == "") and k not in dotenv_keys:
+            old_env[k] = current
+            os.environ[k] = v
+    try:
+        s = Settings()
+    finally:
+        for k, prev in old_env.items():
+            if prev is None:
+                os.environ.pop(k, None)
+            else:
+                os.environ[k] = prev
+    return s
+# Module-level settings instance, built once at import time.
+settings = _build_settings()
+def reload_settings() -> None:
+    """Reload settings from ~/.openhack/config and environment.
+
+    Rebinds the module-level ``settings`` name to a fresh instance.  Code
+    that imported the object directly (``from ... import settings``) keeps
+    its reference to the old instance.
+    """
+    global settings
+    settings = _build_settings()