PyPI - lucidscan - Versions diffs - 0.5.12__py3-none-any.whl - Mend

lucidscan 0.5.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (91) hide show

lucidscan/__init__.py +12 -0
lucidscan/bootstrap/__init__.py +26 -0
lucidscan/bootstrap/paths.py +160 -0
lucidscan/bootstrap/platform.py +111 -0
lucidscan/bootstrap/validation.py +76 -0
lucidscan/bootstrap/versions.py +119 -0
lucidscan/cli/__init__.py +50 -0
lucidscan/cli/__main__.py +8 -0
lucidscan/cli/arguments.py +405 -0
lucidscan/cli/commands/__init__.py +64 -0
lucidscan/cli/commands/autoconfigure.py +294 -0
lucidscan/cli/commands/help.py +69 -0
lucidscan/cli/commands/init.py +656 -0
lucidscan/cli/commands/list_scanners.py +59 -0
lucidscan/cli/commands/scan.py +307 -0
lucidscan/cli/commands/serve.py +142 -0
lucidscan/cli/commands/status.py +84 -0
lucidscan/cli/commands/validate.py +105 -0
lucidscan/cli/config_bridge.py +152 -0
lucidscan/cli/exit_codes.py +17 -0
lucidscan/cli/runner.py +284 -0
lucidscan/config/__init__.py +29 -0
lucidscan/config/ignore.py +178 -0
lucidscan/config/loader.py +431 -0
lucidscan/config/models.py +316 -0
lucidscan/config/validation.py +645 -0
lucidscan/core/__init__.py +3 -0
lucidscan/core/domain_runner.py +463 -0
lucidscan/core/git.py +174 -0
lucidscan/core/logging.py +34 -0
lucidscan/core/models.py +207 -0
lucidscan/core/streaming.py +340 -0
lucidscan/core/subprocess_runner.py +164 -0
lucidscan/detection/__init__.py +21 -0
lucidscan/detection/detector.py +154 -0
lucidscan/detection/frameworks.py +270 -0
lucidscan/detection/languages.py +328 -0
lucidscan/detection/tools.py +229 -0
lucidscan/generation/__init__.py +15 -0
lucidscan/generation/config_generator.py +275 -0
lucidscan/generation/package_installer.py +330 -0
lucidscan/mcp/__init__.py +20 -0
lucidscan/mcp/formatter.py +510 -0
lucidscan/mcp/server.py +297 -0
lucidscan/mcp/tools.py +1049 -0
lucidscan/mcp/watcher.py +237 -0
lucidscan/pipeline/__init__.py +17 -0
lucidscan/pipeline/executor.py +187 -0
lucidscan/pipeline/parallel.py +181 -0
lucidscan/plugins/__init__.py +40 -0
lucidscan/plugins/coverage/__init__.py +28 -0
lucidscan/plugins/coverage/base.py +160 -0
lucidscan/plugins/coverage/coverage_py.py +454 -0
lucidscan/plugins/coverage/istanbul.py +411 -0
lucidscan/plugins/discovery.py +107 -0
lucidscan/plugins/enrichers/__init__.py +61 -0
lucidscan/plugins/enrichers/base.py +63 -0
lucidscan/plugins/linters/__init__.py +26 -0
lucidscan/plugins/linters/base.py +125 -0
lucidscan/plugins/linters/biome.py +448 -0
lucidscan/plugins/linters/checkstyle.py +393 -0
lucidscan/plugins/linters/eslint.py +368 -0
lucidscan/plugins/linters/ruff.py +498 -0
lucidscan/plugins/reporters/__init__.py +45 -0
lucidscan/plugins/reporters/base.py +30 -0
lucidscan/plugins/reporters/json_reporter.py +79 -0
lucidscan/plugins/reporters/sarif_reporter.py +303 -0
lucidscan/plugins/reporters/summary_reporter.py +61 -0
lucidscan/plugins/reporters/table_reporter.py +81 -0
lucidscan/plugins/scanners/__init__.py +57 -0
lucidscan/plugins/scanners/base.py +60 -0
lucidscan/plugins/scanners/checkov.py +484 -0
lucidscan/plugins/scanners/opengrep.py +464 -0
lucidscan/plugins/scanners/trivy.py +492 -0
lucidscan/plugins/test_runners/__init__.py +27 -0
lucidscan/plugins/test_runners/base.py +111 -0
lucidscan/plugins/test_runners/jest.py +381 -0
lucidscan/plugins/test_runners/karma.py +481 -0
lucidscan/plugins/test_runners/playwright.py +434 -0
lucidscan/plugins/test_runners/pytest.py +598 -0
lucidscan/plugins/type_checkers/__init__.py +27 -0
lucidscan/plugins/type_checkers/base.py +106 -0
lucidscan/plugins/type_checkers/mypy.py +355 -0
lucidscan/plugins/type_checkers/pyright.py +313 -0
lucidscan/plugins/type_checkers/typescript.py +280 -0
lucidscan-0.5.12.dist-info/METADATA +242 -0
lucidscan-0.5.12.dist-info/RECORD +91 -0
lucidscan-0.5.12.dist-info/WHEEL +5 -0
lucidscan-0.5.12.dist-info/entry_points.txt +34 -0
lucidscan-0.5.12.dist-info/licenses/LICENSE +201 -0
lucidscan-0.5.12.dist-info/top_level.txt +1 -0

lucidscan/plugins/scanners/opengrep.py ADDED Viewed

@@ -0,0 +1,464 @@
+"""OpenGrep scanner plugin for SAST (Static Application Security Testing)."""
+from __future__ import annotations
+import hashlib
+import json
+import os
+import subprocess
+from pathlib import Path
+from typing import Any, Dict, List, Optional
+from urllib.request import urlopen
+from lucidscan.plugins.scanners.base import ScannerPlugin
+from lucidscan.core.models import ScanContext, ScanDomain, Severity, UnifiedIssue
+from lucidscan.bootstrap.paths import LucidscanPaths
+from lucidscan.bootstrap.platform import get_platform_info
+from lucidscan.bootstrap.versions import get_tool_version
+from lucidscan.core.logging import get_logger
+from lucidscan.core.subprocess_runner import run_with_streaming
+LOGGER = get_logger(__name__)
+# Default version from pyproject.toml [tool.lucidscan.tools]
+DEFAULT_VERSION = get_tool_version("opengrep")
+# OpenGrep severity mapping to unified severity
+# OpenGrep/Semgrep uses: ERROR, WARNING, INFO
+OPENGREP_SEVERITY_MAP: Dict[str, Severity] = {
+    "ERROR": Severity.HIGH,
+    "WARNING": Severity.MEDIUM,
+    "INFO": Severity.LOW,
+    # Additional mappings for rule metadata
+    "CRITICAL": Severity.CRITICAL,
+    "HIGH": Severity.HIGH,
+    "MEDIUM": Severity.MEDIUM,
+    "LOW": Severity.LOW,
+}
+class OpenGrepScanner(ScannerPlugin):
+    """Scanner plugin for OpenGrep (SAST).
+    Handles:
+    - Static application security testing via `opengrep scan`
+    Binary management:
+    - Downloads from https://github.com/opengrep/opengrep/releases/
+    - Caches at {project}/.lucidscan/bin/opengrep/{version}/opengrep
+    """
+    def __init__(
+        self,
+        version: str = DEFAULT_VERSION,
+        project_root: Optional[Path] = None,
+    ) -> None:
+        self._version = version
+        if project_root:
+            self._paths = LucidscanPaths.for_project(project_root)
+        else:
+            self._paths = LucidscanPaths.default()
+    @property
+    def name(self) -> str:
+        return "opengrep"
+    @property
+    def domains(self) -> List[ScanDomain]:
+        return [ScanDomain.SAST]
+    def get_version(self) -> str:
+        return self._version
+    def ensure_binary(self) -> Path:
+        """Ensure the OpenGrep binary is available, downloading if needed."""
+        binary_dir = self._paths.plugin_bin_dir(self.name, self._version)
+        binary_name = self._get_binary_name()
+        binary_path = binary_dir / binary_name
+        if binary_path.exists():
+            LOGGER.debug(f"OpenGrep binary found at {binary_path}")
+            return binary_path
+        LOGGER.info(f"Downloading OpenGrep v{self._version}...")
+        self._download_binary(binary_dir)
+        if not binary_path.exists():
+            raise RuntimeError(f"Failed to download OpenGrep binary to {binary_path}")
+        return binary_path
+    def _get_binary_name(self) -> str:
+        """Get the binary name for the current platform."""
+        platform_info = get_platform_info()
+        if platform_info.os == "windows":
+            return "opengrep.exe"
+        return "opengrep"
+    def _download_binary(self, dest_dir: Path) -> None:
+        """Download OpenGrep binary for current platform."""
+        platform_info = get_platform_info()
+        # Map platform to OpenGrep release naming
+        # OpenGrep uses: opengrep_manylinux_x86, opengrep_osx_arm64, etc.
+        if platform_info.os == "linux":
+            os_name = "manylinux"
+            arch_name = "x86" if platform_info.arch == "amd64" else "aarch64"
+            filename = f"opengrep_{os_name}_{arch_name}"
+        elif platform_info.os == "darwin":
+            os_name = "osx"
+            arch_name = "x86" if platform_info.arch == "amd64" else "arm64"
+            filename = f"opengrep_{os_name}_{arch_name}"
+        elif platform_info.os == "windows":
+            filename = "opengrep_windows_x86.exe"
+        else:
+            raise RuntimeError(
+                f"Unsupported platform: {platform_info.os}-{platform_info.arch}"
+            )
+        # Construct download URL
+        url = f"https://github.com/opengrep/opengrep/releases/download/v{self._version}/{filename}"
+        LOGGER.debug(f"Downloading from {url}")
+        # Create destination directory
+        dest_dir.mkdir(parents=True, exist_ok=True)
+        # Determine destination path
+        binary_name = self._get_binary_name()
+        binary_path = dest_dir / binary_name
+        # Validate URL scheme and domain for security
+        if not url.startswith("https://github.com/"):
+            raise ValueError(f"Invalid download URL: {url}")
+        # Download binary directly (not an archive)
+        try:
+            with urlopen(url) as response:  # nosec B310 nosemgrep
+                binary_path.write_bytes(response.read())
+            # Make binary executable (not needed on Windows)
+            if platform_info.os != "windows":
+                binary_path.chmod(0o755)
+            LOGGER.info(f"OpenGrep v{self._version} installed to {binary_path}")
+        except Exception as e:
+            # Clean up partial download
+            if binary_path.exists():
+                binary_path.unlink()
+            raise RuntimeError(f"Failed to download OpenGrep: {e}") from e
+    def scan(self, context: ScanContext) -> List[UnifiedIssue]:
+        """Execute OpenGrep scan and return normalized issues.
+        Args:
+            context: Scan context containing target paths and configuration.
+        Returns:
+            List of unified issues found during the scan.
+        """
+        if ScanDomain.SAST not in context.enabled_domains:
+            return []
+        binary = self.ensure_binary()
+        return self._run_sast_scan(binary, context)
+    def _run_sast_scan(
+        self, binary: Path, context: ScanContext
+    ) -> List[UnifiedIssue]:
+        """Run OpenGrep SAST scan.
+        Args:
+            binary: Path to the OpenGrep binary.
+            context: Scan context with project root and configuration.
+        Returns:
+            List of unified issues from the SAST scan.
+        """
+        # Get SAST-specific config options
+        sast_config = context.get_scanner_options("sast")
+        # Get ruleset configuration
+        ruleset_list = sast_config.get("ruleset", ["auto"])
+        if isinstance(ruleset_list, list) and ruleset_list:
+            ruleset = ruleset_list[0]  # Use first ruleset
+        else:
+            ruleset = "auto"
+        cmd = [
+            str(binary),
+            "scan",
+            "--json",
+            "--quiet",
+        ]
+        # Add timeout if specified
+        timeout = sast_config.get("timeout")
+        if timeout:
+            cmd.extend(["--timeout", str(timeout)])
+        # Add ruleset if specified (auto uses default rules)
+        if ruleset and ruleset != "auto":
+            cmd.extend(["--config", ruleset])
+        else:
+            # Use default rules - OpenGrep auto-detects without explicit config
+            cmd.extend(["--config", "auto"])
+        # Apply ignore patterns from .lucidscanignore and config
+        exclude_patterns = context.get_exclude_patterns()
+        for pattern in exclude_patterns:
+            cmd.extend(["--exclude", pattern])
+        # Add target path
+        cmd.append(str(context.project_root))
+        LOGGER.debug(f"Running: {' '.join(cmd)}")
+        # Set environment variables for the scan
+        env = self._get_scan_env()
+        old_env: Dict[str, Optional[str]] = {}
+        for key, value in env.items():
+            if key not in os.environ or os.environ[key] != value:
+                old_env[key] = os.environ.get(key)
+                os.environ[key] = value
+        try:
+            result = run_with_streaming(
+                cmd=cmd,
+                cwd=context.project_root,
+                tool_name="opengrep",
+                stream_handler=context.stream_handler,
+                timeout=180,
+            )
+            # OpenGrep returns non-zero exit code when findings exist
+            # This is expected behavior, not an error
+            if result.returncode not in (0, 1) and result.stderr:
+                LOGGER.warning(f"OpenGrep stderr: {result.stderr}")
+            if not result.stdout.strip():
+                LOGGER.debug("OpenGrep returned empty output")
+                return []
+            return self._parse_opengrep_json(result.stdout, context.project_root)
+        except subprocess.TimeoutExpired:
+            LOGGER.warning("OpenGrep scan timed out after 180 seconds")
+            return []
+        except Exception as e:
+            LOGGER.error(f"OpenGrep scan failed: {e}")
+            return []
+        finally:
+            # Restore original environment
+            for key, value in old_env.items():  # type: ignore[assignment]
+                if value is None:
+                    os.environ.pop(key, None)
+                else:
+                    os.environ[key] = value
+    def _get_scan_env(self) -> Dict[str, str]:
+        """Get environment variables for the scan process."""
+        env = os.environ.copy()
+        # Disable telemetry/metrics
+        env["SEMGREP_SEND_METRICS"] = "off"
+        env["OPENGREP_SEND_METRICS"] = "off"
+        return env
+    def _parse_opengrep_json(
+        self,
+        json_output: str,
+        project_root: Path,
+    ) -> List[UnifiedIssue]:
+        """Parse OpenGrep JSON output and convert to UnifiedIssue list.
+        Args:
+            json_output: Raw JSON string from OpenGrep.
+            project_root: Project root path for relative path resolution.
+        Returns:
+            List of unified issues parsed from the JSON.
+        """
+        try:
+            data = json.loads(json_output)
+        except json.JSONDecodeError as e:
+            LOGGER.error(f"Failed to parse OpenGrep JSON: {e}")
+            return []
+        issues: List[UnifiedIssue] = []
+        # OpenGrep output structure: {"results": [...], "errors": [...]}
+        results = data.get("results", [])
+        for result in results:
+            issue = self._result_to_unified_issue(result, project_root)
+            if issue:
+                issues.append(issue)
+        # Log any errors from the scan
+        errors = data.get("errors", [])
+        for error in errors:
+            LOGGER.warning(f"OpenGrep error: {error}")
+        LOGGER.debug(f"Parsed {len(issues)} issues from OpenGrep output")
+        return issues
+    def _result_to_unified_issue(
+        self,
+        result: Dict[str, Any],
+        project_root: Path,
+    ) -> Optional[UnifiedIssue]:
+        """Convert a single OpenGrep result to a UnifiedIssue.
+        Args:
+            result: Result dict from OpenGrep JSON.
+            project_root: Project root path for relative path resolution.
+        Returns:
+            UnifiedIssue or None if conversion fails.
+        """
+        try:
+            # Extract basic fields
+            rule_id = result.get("check_id", "unknown")
+            path = result.get("path", "unknown")
+            message = result.get("extra", {}).get("message", "No message")
+            # Extract location information
+            start = result.get("start", {})
+            end = result.get("end", {})
+            line_start = start.get("line", 1)
+            line_end = end.get("line", line_start)
+            col_start = start.get("col", 1)
+            col_end = end.get("col", col_start)
+            # Extract severity from extra metadata
+            extra = result.get("extra", {})
+            severity_str = extra.get("severity", "WARNING").upper()
+            # Also check metadata for severity
+            metadata = extra.get("metadata", {})
+            if "severity" in metadata:
+                severity_str = metadata["severity"].upper()
+            severity = OPENGREP_SEVERITY_MAP.get(severity_str, Severity.MEDIUM)
+            # Extract code snippet (the matched lines)
+            lines = extra.get("lines", "")
+            code_snippet = lines if isinstance(lines, str) else str(lines)
+            # Generate deterministic issue ID
+            issue_id = self._generate_issue_id(rule_id, path, line_start, col_start)
+            # Build file path (relative or absolute)
+            file_path = Path(path)
+            if not file_path.is_absolute():
+                file_path = project_root / path
+            # Build title from rule ID
+            title = self._format_title(rule_id, message)
+            # Build description
+            description = message
+            if "metavars" in extra:
+                # Add context about matched variables
+                metavars = extra["metavars"]
+                if metavars:
+                    description += f"\n\nMatched values: {json.dumps(metavars, indent=2)}"
+            # Build recommendation
+            recommendation = metadata.get("fix", None)
+            if not recommendation and "fix" in extra:
+                recommendation = extra["fix"]
+            # Build scanner metadata with raw OpenGrep data
+            scanner_metadata: Dict[str, Any] = {
+                "rule_id": rule_id,
+                "line_start": line_start,
+                "line_end": line_end,
+                "col_start": col_start,
+                "col_end": col_end,
+                "severity_raw": severity_str,
+                "fingerprint": result.get("extra", {}).get("fingerprint"),
+                "engine_kind": extra.get("engine_kind"),
+                "validation_state": extra.get("validation_state"),
+            }
+            # Add metadata fields if present
+            if metadata:
+                scanner_metadata["metadata"] = {
+                    "cwe": metadata.get("cwe", []),
+                    "owasp": metadata.get("owasp", []),
+                    "references": metadata.get("references", []),
+                    "category": metadata.get("category"),
+                    "technology": metadata.get("technology", []),
+                    "confidence": metadata.get("confidence"),
+                }
+            # Get documentation URL from metadata references
+            references = metadata.get("references", []) if metadata else []
+            documentation_url = references[0] if references else None
+            return UnifiedIssue(
+                id=issue_id,
+                domain=ScanDomain.SAST,
+                source_tool="opengrep",
+                severity=severity,
+                rule_id=rule_id,
+                title=title,
+                description=description,
+                documentation_url=documentation_url,
+                file_path=file_path,
+                line_start=line_start,
+                line_end=line_end,
+                column_start=start.get("col") if start else None,
+                column_end=end.get("col") if end else None,
+                code_snippet=code_snippet,
+                recommendation=recommendation,
+                fixable=bool(extra.get("fix")),
+                suggested_fix=extra.get("fix"),
+                metadata=scanner_metadata,
+            )
+        except Exception as e:
+            LOGGER.warning(f"Failed to convert OpenGrep result to UnifiedIssue: {e}")
+            return None
+    def _format_title(self, rule_id: str, message: str) -> str:
+        """Format a human-readable title from rule ID and message.
+        Args:
+            rule_id: OpenGrep rule identifier.
+            message: Rule message.
+        Returns:
+            Formatted title string.
+        """
+        # Shorten message if too long
+        max_message_len = 80
+        if len(message) > max_message_len:
+            message = message[:max_message_len - 3] + "..."
+        # Use rule ID as prefix for clarity
+        return f"{rule_id}: {message}"
+    def _generate_issue_id(
+        self,
+        rule_id: str,
+        path: str,
+        line: int,
+        col: int,
+    ) -> str:
+        """Generate a deterministic issue ID for deduplication.
+        Args:
+            rule_id: OpenGrep rule identifier.
+            path: File path.
+            line: Line number.
+            col: Column number.
+        Returns:
+            A stable hash-based ID string.
+        """
+        components = f"opengrep:{rule_id}:{path}:{line}:{col}"
+        hash_digest = hashlib.sha256(components.encode()).hexdigest()[:16]
+        return f"opengrep-{hash_digest}"