PyPI - devguard - Versions diffs - 0.2.0__py3-none-any.whl - Mend

devguard 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

devguard/INTEGRATION_SUMMARY.md +121 -0
devguard/__init__.py +3 -0
devguard/__main__.py +6 -0
devguard/checkers/__init__.py +41 -0
devguard/checkers/api_usage.py +523 -0
devguard/checkers/aws_cost.py +331 -0
devguard/checkers/aws_iam.py +284 -0
devguard/checkers/base.py +25 -0
devguard/checkers/container.py +137 -0
devguard/checkers/domain.py +189 -0
devguard/checkers/firecrawl.py +117 -0
devguard/checkers/fly.py +225 -0
devguard/checkers/github.py +210 -0
devguard/checkers/npm.py +327 -0
devguard/checkers/npm_security.py +244 -0
devguard/checkers/redteam.py +290 -0
devguard/checkers/secret.py +279 -0
devguard/checkers/swarm.py +376 -0
devguard/checkers/tailscale.py +143 -0
devguard/checkers/tailsnitch.py +303 -0
devguard/checkers/tavily.py +179 -0
devguard/checkers/vercel.py +192 -0
devguard/cli.py +1510 -0
devguard/cli_helpers.py +189 -0
devguard/config.py +249 -0
devguard/core.py +293 -0
devguard/dashboard.py +715 -0
devguard/discovery.py +363 -0
devguard/http_client.py +142 -0
devguard/llm_service.py +481 -0
devguard/mcp_server.py +259 -0
devguard/metrics.py +144 -0
devguard/models.py +208 -0
devguard/reporting.py +1571 -0
devguard/sarif.py +295 -0
devguard/scripts/ANALYSIS_SUMMARY.md +141 -0
devguard/scripts/README.md +221 -0
devguard/scripts/auto_fix_recommendations.py +145 -0
devguard/scripts/generate_npmignore.py +175 -0
devguard/scripts/generate_security_report.py +324 -0
devguard/scripts/prepublish_check.sh +29 -0
devguard/scripts/redteam_npm_packages.py +1262 -0
devguard/scripts/review_all_repos.py +300 -0
devguard/spec.py +617 -0
devguard/sweeps/__init__.py +23 -0
devguard/sweeps/ai_editor_config_audit.py +697 -0
devguard/sweeps/cargo_publish_audit.py +655 -0
devguard/sweeps/dependency_audit.py +419 -0
devguard/sweeps/gitignore_audit.py +336 -0
devguard/sweeps/local_dev.py +260 -0
devguard/sweeps/local_dirty_worktree_secrets.py +521 -0
devguard/sweeps/project_flaudit.py +636 -0
devguard/sweeps/public_github_secrets.py +680 -0
devguard/sweeps/publish_audit.py +478 -0
devguard/sweeps/ssh_key_audit.py +327 -0
devguard/utils.py +174 -0
devguard-0.2.0.dist-info/METADATA +225 -0
devguard-0.2.0.dist-info/RECORD +60 -0
devguard-0.2.0.dist-info/WHEEL +4 -0
devguard-0.2.0.dist-info/entry_points.txt +2 -0

devguard/cli_helpers.py ADDED Viewed

@@ -0,0 +1,189 @@
+"""Shared helper functions for CLI commands."""
+import asyncio
+import logging
+import httpx
+from rich.console import Console
+from devguard.config import Settings
+console = Console()  # Shared Rich console; show_auth_status prints its status lines through it.
+logger = logging.getLogger(__name__)  # Module-level logger named after this module.
+async def test_github_token(token: str) -> tuple[bool, str]:
+    """Test a GitHub token.
+    Returns:
+        Tuple of (success, message)
+    """
+    try:
+        from github import Auth, Github
+        auth = Auth.Token(token)
+        github = Github(auth=auth)
+        user = github.get_user()
+        return True, f"Authenticated as {user.login}"
+    except Exception as e:
+        return False, f"Token invalid - {str(e)}"
+async def test_vercel_token(token: str) -> tuple[bool, str]:
+    """Test a Vercel token.
+    Returns:
+        Tuple of (success, message)
+    """
+    try:
+        async with httpx.AsyncClient() as client:
+            response = await client.get(
+                "https://api.vercel.com/v2/user",
+                headers={"Authorization": f"Bearer {token}"},
+                timeout=10.0,
+            )
+            if response.status_code == 200:
+                data = response.json()
+                name = data.get("user", {}).get("name", "Unknown")
+                return True, f"Authenticated as {name}"
+            else:
+                return False, f"Token invalid (HTTP {response.status_code})"
+    except Exception as e:
+        return False, f"Error - {str(e)}"
+async def test_fly_token(token: str) -> tuple[bool, str]:
+    """Test a Fly.io token.
+    Returns:
+        Tuple of (success, message)
+    """
+    try:
+        async with httpx.AsyncClient() as client:
+            response = await client.get(
+                "https://api.machines.dev/v1/apps",
+                headers={"Authorization": f"Bearer {token}"},
+                timeout=10.0,
+            )
+            if response.status_code == 200:
+                return True, "Token is valid"
+            else:
+                return False, f"Token invalid (HTTP {response.status_code})"
+    except Exception as e:
+        return False, f"Error - {str(e)}"
+async def test_snyk_token(token: str) -> tuple[bool, str]:
+    """Test a Snyk token.
+    Returns:
+        Tuple of (success, message)
+    """
+    try:
+        async with httpx.AsyncClient() as client:
+            response = await client.get(
+                "https://api.snyk.io/v1/user/me",
+                headers={"Authorization": f"token {token}"},
+                timeout=10.0,
+            )
+            if response.status_code == 200:
+                data = response.json()
+                email = data.get("email", "Unknown")
+                return True, f"Authenticated as {email}"
+            else:
+                return False, f"Token invalid (HTTP {response.status_code})"
+    except Exception as e:
+        return False, f"Error - {str(e)}"
+async def test_service_token(service: str, token: str) -> tuple[bool, str]:
+    """Test a token for a given service.
+    Args:
+        service: Service name (gh, github, vercel, fly, snyk)
+        token: Token to test
+    Returns:
+        Tuple of (success, message)
+    """
+    service = service.lower()
+    if service in ("gh", "github"):
+        return await test_github_token(token)
+    elif service == "vercel":
+        return await test_vercel_token(token)
+    elif service == "fly":
+        return await test_fly_token(token)
+    elif service == "snyk":
+        return await test_snyk_token(token)
+    else:
+        return False, f"Unknown service: {service}"
+def show_auth_status(settings: Settings) -> None:
+    """Show authentication status for all configured services.
+    Args:
+        settings: Guardian settings
+    """
+    console.print("[bold blue]Guardian Authentication Status[/bold blue]\n")
+    # GitHub
+    if settings.github_token:
+        token_str = (
+            settings.github_token.get_secret_value()
+            if hasattr(settings.github_token, "get_secret_value")
+            else str(settings.github_token)
+        )
+        success, message = asyncio.run(test_github_token(token_str))
+        if success:
+            console.print(f"[bold green]✓[/bold green] GitHub: {message}")
+        else:
+            console.print(f"[bold red]✗[/bold red] GitHub: {message}")
+    else:
+        console.print("[yellow]○[/yellow] GitHub: Not configured")
+    # Vercel
+    if settings.vercel_token:
+        token_str = (
+            settings.vercel_token.get_secret_value()
+            if hasattr(settings.vercel_token, "get_secret_value")
+            else str(settings.vercel_token)
+        )
+        success, message = asyncio.run(test_vercel_token(token_str))
+        if success:
+            console.print(f"[bold green]✓[/bold green] Vercel: {message}")
+        else:
+            console.print(f"[bold red]✗[/bold red] Vercel: {message}")
+    else:
+        console.print("[yellow]○[/yellow] Vercel: Not configured")
+    # Fly.io
+    if settings.fly_api_token:
+        token_str = (
+            settings.fly_api_token.get_secret_value()
+            if hasattr(settings.fly_api_token, "get_secret_value")
+            else str(settings.fly_api_token)
+        )
+        success, message = asyncio.run(test_fly_token(token_str))
+        if success:
+            console.print(f"[bold green]✓[/bold green] Fly.io: {message}")
+        else:
+            console.print(f"[bold red]✗[/bold red] Fly.io: {message}")
+    else:
+        console.print("[yellow]○[/yellow] Fly.io: Not configured")
+    # Snyk
+    if settings.snyk_token:
+        token_str = (
+            settings.snyk_token.get_secret_value()
+            if hasattr(settings.snyk_token, "get_secret_value")
+            else str(settings.snyk_token)
+        )
+        success, message = asyncio.run(test_snyk_token(token_str))
+        if success:
+            console.print(f"[bold green]✓[/bold green] Snyk: {message}")
+        else:
+            console.print(f"[bold red]✗[/bold red] Snyk: {message}")
+    else:
+        console.print("[yellow]○[/yellow] Snyk: Not configured")

devguard/config.py ADDED Viewed

@@ -0,0 +1,249 @@
+"""Configuration management for devguard."""
+from typing import Annotated
+from pydantic import Field, SecretStr, field_validator
+from pydantic_settings import BaseSettings, NoDecode, SettingsConfigDict
+class Settings(BaseSettings):
+    """Application settings loaded from environment variables."""
+    model_config = SettingsConfigDict(
+        env_file=(".env", "../.env"),  # Load local first, then root fallback
+        env_file_encoding="utf-8",
+        case_sensitive=False,
+        extra="ignore",
+    )
+    # GitHub Configuration
+    github_token: SecretStr | None = Field(None, description="GitHub personal access token")
+    github_org: str | None = Field(None, description="GitHub organization name (optional)")
+    # Vercel Configuration
+    vercel_token: SecretStr | None = Field(None, description="Vercel API token")
+    vercel_team_id: str | None = Field(None, description="Vercel team ID (optional)")
+    # Fly.io Configuration
+    fly_api_token: SecretStr | None = Field(None, description="Fly.io API token")
+    # npm/Snyk Configuration
+    snyk_token: SecretStr | None = Field(None, description="Snyk API token (optional)")
+    # Monitoring Configuration
+    check_interval_seconds: int = Field(3600, description="Interval between checks in seconds")
+    alert_webhook_url: SecretStr | None = Field(None, description="Webhook URL for alerts")
+    alert_email: str | None = Field(None, description="Email address for alerts")
+    environment: str = Field("development", description="Environment mode (development/production)")
+    # Rate Limiting Configuration
+    rate_limit_per_minute: int = Field(60, description="Maximum API calls per minute per service")
+    rate_limit_per_hour: int = Field(1000, description="Maximum API calls per hour per service")
+    # Red Team Security Testing
+    redteam_enabled: bool = Field(
+        True, description="Enable red team security testing for deployments"
+    )
+    # Deep npm Package Security Analysis
+    npm_security_enabled: bool = Field(
+        False,
+        description="Enable deep security analysis of npm packages (secrets, obfuscation, etc.)",
+    )
+    # Dashboard Configuration
+    dashboard_enabled: bool = Field(False, description="Enable web dashboard")
+    dashboard_host: str = Field("0.0.0.0", description="Dashboard host to bind to")
+    dashboard_port: int = Field(8080, description="Dashboard port")
+    metrics_enabled: bool = Field(True, description="Enable Prometheus metrics")
+    metrics_port: int = Field(9090, description="Prometheus metrics port")
+    dashboard_api_key: SecretStr | None = Field(
+        None, description="API key for dashboard access (generate with openssl rand -hex 32)"
+    )
+    allowed_origins: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Comma-separated list of allowed CORS origins",
+    )
+    # Additional Service API Keys
+    firecrawl_api_key: SecretStr | None = Field(None, description="Firecrawl API key")
+    tavily_api_key: SecretStr | None = Field(None, description="Tavily API key")
+    anthropic_api_key: SecretStr | None = Field(None, description="Anthropic API key")
+    openrouter_api_key: SecretStr | None = Field(None, description="OpenRouter API key")
+    openai_api_key: SecretStr | None = Field(None, description="OpenAI API key")
+    perplexity_api_key: SecretStr | None = Field(None, description="Perplexity API key")
+    groq_api_key: SecretStr | None = Field(None, description="Groq API key")
+    # SMTP Configuration (for email alerts)
+    smtp_host: str | None = Field(None, description="SMTP server hostname")
+    smtp_port: int = Field(587, description="SMTP server port")
+    smtp_user: str | None = Field(None, description="SMTP username")
+    smtp_password: SecretStr | None = Field(None, description="SMTP password")
+    smtp_from: str | None = Field(None, description="From email address")
+    smtp_use_tls: bool = Field(True, description="Use TLS for SMTP connection")
+    email_only_on_issues: bool = Field(
+        True, description="Only send emails when there are issues (skip 'all clear' reports)"
+    )
+    email_thread_id_file: str | None = Field(
+        None,
+        description="Path to file storing last email thread ID (default: .devguard-email-thread)",
+    )
+    email_history_file: str | None = Field(
+        None,
+        description="Path to JSON file storing email history for agent introspection (default: .devguard-email-history.json)",
+    )
+    email_llm_enabled: bool = Field(
+        True,
+        description="Enable LLM-powered email judgements (subject lines, send decisions, summaries). Defaults to True. Set to False to disable.",
+    )
+    use_smart_email: bool = Field(
+        True,
+        description="Use smart_email system (SNS) instead of direct SMTP. Provides batching, deduplication, and threading. Falls back to SMTP if smart_email unavailable.",
+    )
+    smart_email_db_path: str | None = Field(
+        None,
+        description="Path to smart_email SQLite database (default: /data/smart_email.db or SMART_EMAIL_DB env var)",
+    )
+    # Package Monitoring - use NoDecode to prevent JSON parsing,
+    # validator handles comma-separated strings
+    npm_packages_to_monitor: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="List of npm packages to monitor",
+    )
+    # Repository Monitoring
+    github_repos_to_monitor: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="List of GitHub repos to monitor (owner/repo format)",
+    )
+    # Deployment Monitoring
+    fly_apps_to_monitor: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="List of Fly.io apps to monitor",
+    )
+    vercel_projects_to_monitor: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="List of Vercel projects to monitor",
+    )
+    # Secret Scanning
+    secret_scan_enabled: bool = Field(True, description="Enable secret scanning of git repos")
+    secret_scan_paths: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Paths to git repos to scan for secrets (default: _infra subprojects)",
+    )
+    # Container Security
+    container_check_enabled: bool = Field(
+        True, description="Enable Container/Dockerfile security checks"
+    )
+    # AWS IAM Security
+    aws_iam_check_enabled: bool = Field(
+        False, description="Enable AWS IAM security checks for satellite nodes"
+    )
+    # AWS Cost Monitoring
+    aws_cost_check_enabled: bool = Field(
+        False, description="Enable AWS cost monitoring and budget alerts"
+    )
+    aws_monthly_cost_ceiling: float = Field(
+        100.0,
+        description="AWS monthly cost ceiling in USD (alerts when exceeded)",
+    )
+    aws_allowed_instances: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Allowed EC2 instance names (comma-separated). Unlisted running instances trigger alerts.",
+    )
+    # Tailscale Network Health
+    tailscale_check_enabled: bool = Field(
+        False, description="Enable Tailscale mesh network health checks"
+    )
+    tailscale_expected_nodes: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Expected Tailscale node hostnames (comma-separated)",
+    )
+    # Tailsnitch ACL Security Audit
+    tailsnitch_check_enabled: bool = Field(
+        False, description="Enable Tailsnitch security audit for Tailscale ACLs"
+    )
+    tailsnitch_binary_path: str | None = Field(
+        None, description="Custom path to tailsnitch binary (auto-detected if not set)"
+    )
+    tailsnitch_tailnet: str | None = Field(
+        None, description="Specific tailnet to audit (default: from API key)"
+    )
+    # Tailscale authentication (for Tailsnitch)
+    # Note: Tailsnitch supports both API key and OAuth
+    # API key: TSKEY or TS_API_KEY
+    # OAuth: TS_OAUTH_CLIENT_ID + TS_OAUTH_CLIENT_SECRET
+    # These are read from environment, not stored in Settings for security
+    # Domain/SSL Monitoring
+    domain_check_enabled: bool = Field(
+        False, description="Enable domain and SSL certificate monitoring"
+    )
+    domains_to_monitor: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Domains to monitor for SSL/health (comma-separated, e.g. 'example.com,app.example.com')",
+    )
+    # Docker Swarm Health
+    swarm_check_enabled: bool = Field(
+        False, description="Enable Docker Swarm cluster health checks"
+    )
+    swarm_expected_nodes: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Expected swarm node hostnames (comma-separated)",
+    )
+    swarm_critical_services: Annotated[list[str], NoDecode] = Field(
+        default_factory=list,
+        description="Critical swarm service names (comma-separated)",
+    )
+    # API Usage/Credits Monitoring
+    api_usage_check_enabled: bool = Field(
+        False, description="Enable API usage/credits monitoring for LLM providers"
+    )
+    @field_validator(
+        "npm_packages_to_monitor",
+        "github_repos_to_monitor",
+        "fly_apps_to_monitor",
+        "vercel_projects_to_monitor",
+        "allowed_origins",
+        "secret_scan_paths",
+        "domains_to_monitor",
+        "swarm_expected_nodes",
+        "swarm_critical_services",
+        "tailscale_expected_nodes",
+        "aws_allowed_instances",
+        mode="before",
+    )
+    @classmethod
+    def parse_comma_separated_string(cls, v: str | list[str] | None) -> list[str]:
+        """Parse comma-separated strings into lists."""
+        if v is None:
+            return []
+        if isinstance(v, str):
+            return [item.strip() for item in v.split(",") if item.strip()]
+        if isinstance(v, list):
+            return v
+        return []
+def get_settings(env_file: str | None = None) -> Settings:
+    """Get application settings.
+    Args:
+        env_file: Optional path to an env file to load (e.g. "../.env" when
+            running Guardian from inside an infra repo). When not provided,
+            the Settings `model_config.env_file` default is used.
+    """
+    if env_file:
+        return Settings(_env_file=env_file)  # type: ignore[call-arg]
+    return Settings()  # type: ignore[call-arg]