PyPI - devguard - Versions diffs - 0.2.0__py3-none-any.whl - Mend

devguard 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

devguard/INTEGRATION_SUMMARY.md +121 -0
devguard/__init__.py +3 -0
devguard/__main__.py +6 -0
devguard/checkers/__init__.py +41 -0
devguard/checkers/api_usage.py +523 -0
devguard/checkers/aws_cost.py +331 -0
devguard/checkers/aws_iam.py +284 -0
devguard/checkers/base.py +25 -0
devguard/checkers/container.py +137 -0
devguard/checkers/domain.py +189 -0
devguard/checkers/firecrawl.py +117 -0
devguard/checkers/fly.py +225 -0
devguard/checkers/github.py +210 -0
devguard/checkers/npm.py +327 -0
devguard/checkers/npm_security.py +244 -0
devguard/checkers/redteam.py +290 -0
devguard/checkers/secret.py +279 -0
devguard/checkers/swarm.py +376 -0
devguard/checkers/tailscale.py +143 -0
devguard/checkers/tailsnitch.py +303 -0
devguard/checkers/tavily.py +179 -0
devguard/checkers/vercel.py +192 -0
devguard/cli.py +1510 -0
devguard/cli_helpers.py +189 -0
devguard/config.py +249 -0
devguard/core.py +293 -0
devguard/dashboard.py +715 -0
devguard/discovery.py +363 -0
devguard/http_client.py +142 -0
devguard/llm_service.py +481 -0
devguard/mcp_server.py +259 -0
devguard/metrics.py +144 -0
devguard/models.py +208 -0
devguard/reporting.py +1571 -0
devguard/sarif.py +295 -0
devguard/scripts/ANALYSIS_SUMMARY.md +141 -0
devguard/scripts/README.md +221 -0
devguard/scripts/auto_fix_recommendations.py +145 -0
devguard/scripts/generate_npmignore.py +175 -0
devguard/scripts/generate_security_report.py +324 -0
devguard/scripts/prepublish_check.sh +29 -0
devguard/scripts/redteam_npm_packages.py +1262 -0
devguard/scripts/review_all_repos.py +300 -0
devguard/spec.py +617 -0
devguard/sweeps/__init__.py +23 -0
devguard/sweeps/ai_editor_config_audit.py +697 -0
devguard/sweeps/cargo_publish_audit.py +655 -0
devguard/sweeps/dependency_audit.py +419 -0
devguard/sweeps/gitignore_audit.py +336 -0
devguard/sweeps/local_dev.py +260 -0
devguard/sweeps/local_dirty_worktree_secrets.py +521 -0
devguard/sweeps/project_flaudit.py +636 -0
devguard/sweeps/public_github_secrets.py +680 -0
devguard/sweeps/publish_audit.py +478 -0
devguard/sweeps/ssh_key_audit.py +327 -0
devguard/utils.py +174 -0
devguard-0.2.0.dist-info/METADATA +225 -0
devguard-0.2.0.dist-info/RECORD +60 -0
devguard-0.2.0.dist-info/WHEEL +4 -0
devguard-0.2.0.dist-info/entry_points.txt +2 -0

devguard/sweeps/ssh_key_audit.py ADDED Viewed

@@ -0,0 +1,327 @@
+"""SSH key hygiene audit sweep: detect weak, unprotected, or stale SSH keys.
+Scans ~/.ssh/ for private key files and checks:
+- Algorithm type and bit strength (flags DSA, short RSA, optionally ECDSA)
+- Passphrase protection (keys without a passphrase are flagged)
+- File permissions (should be 600 or 400)
+- GitHub registration (cross-references with `gh ssh-key list`)
+"""
+from __future__ import annotations
+import json
+import re
+import shutil
+import stat
+import subprocess
+from datetime import UTC, datetime
+from pathlib import Path
+from typing import Any
+def _utc_now() -> str:
+    return datetime.now(UTC).isoformat().replace("+00:00", "Z")
+# Well-known private key filenames (without path). A file with one of these
+# names is treated as a private key without inspecting its content.
+_WELL_KNOWN_NAMES: set[str] = {"id_rsa", "id_ecdsa", "id_ed25519", "id_dsa"}
+# PEM header that marks a private key file. Only the generic "-----BEGIN"
+# prefix is matched, so this is a hint rather than proof of a private key.
+_PRIVATE_KEY_HEADER: bytes = b"-----BEGIN"
+def _is_private_key_file(path: Path) -> bool:
+    """Heuristic: file looks like an SSH private key."""
+    if not path.is_file():
+        return False
+    # Skip .pub files
+    if path.suffix == ".pub":
+        return False
+    # Well-known names are always candidates
+    if path.name in _WELL_KNOWN_NAMES:
+        return True
+    # Otherwise check for PEM header in first 64 bytes
+    try:
+        head = path.read_bytes()[:64]
+        return _PRIVATE_KEY_HEADER in head
+    except (OSError, PermissionError):
+        return False
+def _parse_keygen_fingerprint(output: str) -> tuple[int, str, str]:
+    """Parse `ssh-keygen -l` output into (bits, fingerprint, key_type).
+    Example lines:
+        256 SHA256:abc...xyz user@host (ED25519)
+        3072 SHA256:def...uvw user@host (RSA)
+    """
+    # Pattern: <bits> <fingerprint> <comment> (<type>)
+    m = re.match(r"(\d+)\s+(SHA256:\S+).*\((\w+)\)", output.strip())
+    if m:
+        return int(m.group(1)), m.group(2), m.group(3).upper()
+    return 0, "", "UNKNOWN"
+def _get_key_info(key_path: Path) -> tuple[int, str, str, list[str]]:
+    """Run ssh-keygen -l to get bits, fingerprint, type. Returns (bits, fingerprint, algo, errors)."""
+    errors: list[str] = []
+    if not shutil.which("ssh-keygen"):
+        return 0, "", "UNKNOWN", ["ssh-keygen not found on PATH"]
+    try:
+        res = subprocess.run(
+            ["ssh-keygen", "-l", "-f", str(key_path)],
+            capture_output=True,
+            text=True,
+            timeout=10,
+        )
+        if res.returncode != 0:
+            errors.append(f"ssh-keygen -l failed: {res.stderr.strip()}")
+            return 0, "", "UNKNOWN", errors
+        bits, fingerprint, algo = _parse_keygen_fingerprint(res.stdout)
+        return bits, fingerprint, algo, errors
+    except subprocess.TimeoutExpired:
+        return 0, "", "UNKNOWN", ["ssh-keygen -l timed out"]
+    except OSError as exc:
+        return 0, "", "UNKNOWN", [f"ssh-keygen -l error: {exc}"]
+def _check_passphrase(key_path: Path) -> tuple[bool | None, list[str]]:
+    """Check whether a private key has a passphrase.
+    Returns (has_passphrase, errors).
+    - True  = passphrase-protected (good)
+    - False = no passphrase (bad)
+    - None  = could not determine
+    """
+    errors: list[str] = []
+    if not shutil.which("ssh-keygen"):
+        return None, ["ssh-keygen not found on PATH"]
+    try:
+        res = subprocess.run(
+            ["ssh-keygen", "-y", "-P", "", "-f", str(key_path)],
+            capture_output=True,
+            text=True,
+            timeout=10,
+        )
+        # Exit 0 + public key on stdout => no passphrase (bad)
+        if res.returncode == 0:
+            return False, errors
+        # Non-zero => passphrase required (good) or other error
+        stderr = res.stderr.strip().lower()
+        if "incorrect passphrase" in stderr or "bad passphrase" in stderr:
+            return True, errors
+        # Some other failure (corrupt key, permission issue, etc.)
+        return None, [f"passphrase check inconclusive: {res.stderr.strip()}"]
+    except subprocess.TimeoutExpired:
+        return None, ["passphrase check timed out"]
+    except OSError as exc:
+        return None, [f"passphrase check error: {exc}"]
+def _check_permissions(key_path: Path) -> tuple[bool, str]:
+    """Check file permissions. Returns (ok, octal_string)."""
+    try:
+        mode = key_path.stat().st_mode
+        file_perms = stat.S_IMODE(mode)
+        octal_str = f"{file_perms:04o}"
+        # Acceptable: 0600 (owner rw) or 0400 (owner r)
+        ok = file_perms in (0o600, 0o400)
+        return ok, octal_str
+    except OSError:
+        return False, "????"
+def _get_github_keys() -> tuple[list[dict[str, str]], list[str]]:
+    """Fetch SSH keys registered on GitHub via `gh ssh-key list`.
+    Returns (keys, errors) where each key is {"fingerprint": ..., "title": ...}.
+    """
+    errors: list[str] = []
+    if not shutil.which("gh"):
+        return [], ["gh CLI not found on PATH; skipping GitHub cross-reference"]
+    try:
+        res = subprocess.run(
+            ["gh", "ssh-key", "list"],
+            capture_output=True,
+            text=True,
+            timeout=15,
+        )
+        if res.returncode != 0:
+            stderr = res.stderr.strip()
+            return [], [f"gh ssh-key list failed: {stderr}"]
+    except subprocess.TimeoutExpired:
+        return [], ["gh ssh-key list timed out"]
+    except OSError as exc:
+        return [], [f"gh ssh-key list error: {exc}"]
+    keys: list[dict[str, str]] = []
+    for line in res.stdout.strip().splitlines():
+        # Format: TITLE\tTYPE\tFINGERPRINT\tADDED
+        # or:     TITLE\tFINGERPRINT\tADDED  (older gh versions)
+        parts = line.split("\t")
+        if len(parts) >= 3:
+            title = parts[0].strip()
+            # Fingerprint is the part that starts with SHA256:
+            fingerprint = ""
+            for p in parts[1:]:
+                p = p.strip()
+                if p.startswith("SHA256:"):
+                    fingerprint = p
+                    break
+            if fingerprint:
+                keys.append({"title": title, "fingerprint": fingerprint})
+    return keys, errors
+def audit_ssh_keys(
+    *,
+    ssh_dir: Path | None = None,
+    check_github: bool = True,
+    min_rsa_bits: int = 3072,
+    flag_ecdsa: bool = False,
+) -> tuple[dict[str, Any], list[str]]:
+    """Audit SSH keys and return (report, errors)."""
+    errors: list[str] = []
+    ssh_path = ssh_dir if ssh_dir is not None else Path("~/.ssh").expanduser()
+    if not ssh_path.is_dir():
+        report: dict[str, Any] = {
+            "generated_at": _utc_now(),
+            "scope": {"ssh_dir": str(ssh_path)},
+            "summary": {"keys_scanned": 0, "issues_total": 0},
+            "keys": [],
+            "github_cross_reference": None,
+            "errors": [f"SSH directory not found: {ssh_path}"],
+        }
+        return report, [f"SSH directory not found: {ssh_path}"]
+    # Discover private key files
+    private_keys: list[Path] = []
+    try:
+        for entry in sorted(ssh_path.iterdir()):
+            if _is_private_key_file(entry):
+                private_keys.append(entry)
+    except PermissionError as exc:
+        errors.append(f"cannot read {ssh_path}: {exc}")
+    # Analyze each key
+    key_results: list[dict[str, Any]] = []
+    local_fingerprints: dict[str, str] = {}  # fingerprint -> key_path
+    for key_path in private_keys:
+        issues: list[str] = []
+        # Algorithm and bit strength
+        bits, fingerprint, algo, key_errors = _get_key_info(key_path)
+        errors.extend(key_errors)
+        if fingerprint:
+            local_fingerprints[fingerprint] = str(key_path)
+        # Weak algorithm checks
+        if algo == "DSA":
+            issues.append("DSA algorithm is deprecated and weak")
+        elif algo == "RSA" and bits > 0 and bits < min_rsa_bits:
+            issues.append(f"RSA key is {bits}-bit (minimum recommended: {min_rsa_bits})")
+        elif algo == "ECDSA" and flag_ecdsa:
+            issues.append("ECDSA uses NIST curves (flagged by policy)")
+        # Passphrase check
+        has_passphrase, pp_errors = _check_passphrase(key_path)
+        errors.extend(pp_errors)
+        if has_passphrase is False:
+            issues.append("no passphrase protection")
+        # Permissions check
+        perms_ok, perms_octal = _check_permissions(key_path)
+        if not perms_ok:
+            issues.append(f"permissions too open: {perms_octal} (should be 0600 or 0400)")
+        key_results.append({
+            "key_path": str(key_path),
+            "algorithm": algo,
+            "bits": bits,
+            "fingerprint": fingerprint,
+            "has_passphrase": has_passphrase,
+            "permissions": perms_octal,
+            "permissions_ok": perms_ok,
+            "issues": issues,
+        })
+    # GitHub cross-reference
+    github_cross_ref: dict[str, Any] | None = None
+    if check_github:
+        gh_keys, gh_errors = _get_github_keys()
+        errors.extend(gh_errors)
+        if gh_keys or not gh_errors:
+            gh_fingerprints = {k["fingerprint"] for k in gh_keys}
+            local_fp_set = set(local_fingerprints.keys())
+            local_not_on_github = [
+                {"fingerprint": fp, "key_path": local_fingerprints[fp]}
+                for fp in sorted(local_fp_set - gh_fingerprints)
+            ]
+            github_not_local = [
+                {"fingerprint": k["fingerprint"], "title": k["title"]}
+                for k in gh_keys
+                if k["fingerprint"] not in local_fp_set
+            ]
+            github_cross_ref = {
+                "github_keys_count": len(gh_keys),
+                "local_not_on_github": local_not_on_github,
+                "github_not_local": github_not_local,
+            }
+            # Add cross-ref issues to relevant keys
+            for entry in local_not_on_github:
+                for kr in key_results:
+                    if kr["fingerprint"] == entry["fingerprint"]:
+                        kr["registered_on_github"] = False
+                        kr["issues"].append("not registered on GitHub (stale?)")
+            # Mark keys that are registered
+            for kr in key_results:
+                if "registered_on_github" not in kr:
+                    if kr["fingerprint"] and kr["fingerprint"] in gh_fingerprints:
+                        kr["registered_on_github"] = True
+                    elif not kr["fingerprint"]:
+                        kr["registered_on_github"] = None
+                    else:
+                        kr["registered_on_github"] = False
+    total_issues = sum(len(k["issues"]) for k in key_results)
+    report = {
+        "generated_at": _utc_now(),
+        "scope": {
+            "ssh_dir": str(ssh_path),
+            "check_github": check_github,
+            "min_rsa_bits": min_rsa_bits,
+            "flag_ecdsa": flag_ecdsa,
+        },
+        "summary": {
+            "keys_scanned": len(key_results),
+            "issues_total": total_issues,
+            "keys_without_passphrase": sum(
+                1 for k in key_results if k["has_passphrase"] is False
+            ),
+            "keys_with_weak_algorithm": sum(
+                1 for k in key_results
+                if any("deprecated" in i or "bit" in i or "NIST" in i for i in k["issues"])
+            ),
+            "keys_with_bad_permissions": sum(
+                1 for k in key_results if not k["permissions_ok"]
+            ),
+        },
+        "keys": key_results,
+        "github_cross_reference": github_cross_ref,
+        "errors": errors,
+    }
+    return report, errors
+def write_report(path: Path, report: dict[str, Any]) -> None:
+    path.parent.mkdir(parents=True, exist_ok=True)
+    path.write_text(json.dumps(report, indent=2) + "\n")

devguard/utils.py ADDED Viewed

@@ -0,0 +1,174 @@
+"""Utility functions for Guardian.
+This module provides utilities for accessing external modules (like ops/agent)
+without fragile path manipulation.
+"""
+import logging
+import sys
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+if TYPE_CHECKING:
+    from devguard.config import Settings
+logger = logging.getLogger(__name__)
+# Cache for resolved paths, keyed by a short name such as "ops_agent".
+# A stored None records that the lookup already ran and found nothing.
+_resolved_paths: dict[str, Path | None] = {}
+def get_ops_agent_path() -> Path | None:
+    """Get the path to ops/agent directory.
+    Returns None if not found. Uses cached result after first resolution.
+    """
+    cache_key = "ops_agent"
+    if cache_key in _resolved_paths:
+        return _resolved_paths[cache_key]
+    # Try to find ops/agent relative to devguard
+    devguard_path = Path(__file__).parent.parent.parent
+    ops_agent_path = devguard_path.parent / "ops" / "agent"
+    if ops_agent_path.exists() and ops_agent_path.is_dir():
+        _resolved_paths[cache_key] = ops_agent_path
+        return ops_agent_path
+    _resolved_paths[cache_key] = None
+    return None
+def get_ops_config_path() -> Path | None:
+    """Get the path to ops/config directory.
+    Returns None if not found. Uses cached result after first resolution.
+    """
+    cache_key = "ops_config"
+    if cache_key in _resolved_paths:
+        return _resolved_paths[cache_key]
+    devguard_path = Path(__file__).parent.parent.parent
+    ops_config_path = devguard_path.parent / "ops" / "config"
+    if ops_config_path.exists() and ops_config_path.is_dir():
+        _resolved_paths[cache_key] = ops_config_path
+        return ops_config_path
+    _resolved_paths[cache_key] = None
+    return None
+def import_smart_email() -> Any:
+    """Import smart_email module from ops/agent.
+    Returns the module if found, None otherwise.
+    Handles path manipulation internally.
+    """
+    ops_agent_path = get_ops_agent_path()
+    if not ops_agent_path:
+        return None
+    try:
+        # Add to path if not already there
+        ops_agent_str = str(ops_agent_path)
+        if ops_agent_str not in sys.path:
+            sys.path.insert(0, ops_agent_str)
+        import smart_email
+        return smart_email
+    except ImportError as e:
+        logger.debug(f"Could not import smart_email: {e}")
+        return None
+def import_llm_service() -> Any:
+    """Import LLMService from ops/agent.
+    Returns the class if found, None otherwise.
+    """
+    ops_agent_path = get_ops_agent_path()
+    if not ops_agent_path:
+        return None
+    try:
+        ops_agent_str = str(ops_agent_path)
+        if ops_agent_str not in sys.path:
+            sys.path.insert(0, ops_agent_str)
+        from llm_service import LLMService
+        return LLMService
+    except ImportError as e:
+        logger.debug(f"Could not import LLMService: {e}")
+        return None
+def get_smart_email_db_path(settings: "Settings") -> Path:
+    """Get the smart_email database path from settings or environment.
+    Args:
+        settings: Settings object with smart_email_db_path attribute
+    Returns:
+        Path to database file
+    """
+    db_path_str = getattr(settings, "smart_email_db_path", None)
+    if db_path_str:
+        return Path(db_path_str)
+    import os
+    db_path_str = os.getenv("SMART_EMAIL_DB", "/data/smart_email.db")
+    return Path(db_path_str)
+def get_budget_config_path() -> Path | None:
+    """Get the path to ops/config/budget.yaml.
+    Returns None if not found.
+    """
+    ops_config_path = get_ops_config_path()
+    if not ops_config_path:
+        return None
+    budget_path = ops_config_path / "budget.yaml"
+    if budget_path.exists():
+        return budget_path
+    return None
+def load_budget_config() -> dict[str, Any]:
+    """Load budget configuration from ops/config/budget.yaml.
+    Returns empty dict if file not found or error loading.
+    """
+    budget_path = get_budget_config_path()
+    if not budget_path:
+        return {}
+    try:
+        import yaml
+        with open(budget_path) as f:
+            config = yaml.safe_load(f)
+            return config.get("aws", {})
+    except Exception as e:
+        logger.debug(f"Failed to load budget config from {budget_path}: {e}")
+        return {}
+def get_iam_posture_path() -> Path | None:
+    """Get the path to ops/security/iam-posture.yaml.
+    Returns None if not found.
+    """
+    devguard_path = Path(__file__).parent.parent.parent
+    iam_path = devguard_path.parent / "ops" / "security" / "iam-posture.yaml"
+    if iam_path.exists():
+        return iam_path
+    return None