PyPI - prompture - Versions diffs - 0.0.50__py3-none-any.whl → 0.0.51.dev1__py3-none-any.whl - Mend

prompture 0.0.50__py3-none-any.whl → 0.0.51.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

prompture/__init__.py +62 -0
prompture/_version.py +2 -2
prompture/agent.py +61 -2
prompture/agent_types.py +98 -0
prompture/analysis/__init__.py +19 -0
prompture/analysis/analyzer.py +142 -0
prompture/analysis/ast_visitors.py +302 -0
prompture/analysis/risk_scoring.py +219 -0
prompture/history.py +299 -0
prompture/sandbox/__init__.py +31 -0
prompture/sandbox/exceptions.py +54 -0
prompture/sandbox/resource_limits.py +128 -0
prompture/sandbox/restrictions.py +292 -0
prompture/sandbox/sandbox.py +406 -0
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/METADATA +1 -1
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/RECORD +20 -10
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/WHEEL +0 -0
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/entry_points.txt +0 -0
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/licenses/LICENSE +0 -0
{prompture-0.0.50.dist-info → prompture-0.0.51.dev1.dist-info}/top_level.txt +0 -0

prompture/analysis/ast_visitors.py ADDED Viewed

@@ -0,0 +1,302 @@
+"""AST visitors for extracting code features.
+Provides an AST node visitor that extracts security-relevant features
+from Python source code.
+"""
+from __future__ import annotations
+import ast
+from dataclasses import dataclass, field
+@dataclass
+class CodeFeatures:
+    """Features extracted from Python code via AST analysis.
+    A plain result container; FeatureExtractor fills it in while walking a
+    parsed module.  The call-oriented lists hold ``(call_name, args)`` tuples,
+    where ``call_name`` is the dotted name of the callee and ``args`` is a list
+    of strings describing the positional arguments.
+    Attributes:
+        imports: Set of top-level module names imported (import x, from x import y).
+        file_operations: List of (call_name, args) tuples for file access.
+        network_calls: List of (call_name, args) tuples for network-related calls.
+        system_calls: List of (call_name, args) tuples for system/subprocess calls.
+        exec_eval_usage: List of (call_name, args) tuples for exec/eval/compile calls.
+        dangerous_builtins: Set of dangerous builtin names referenced.
+        attribute_accesses: Set of attribute access patterns (e.g., "os.system").
+        function_calls: Set of all function call names.
+        has_global_statements: Whether the code uses global statements.
+        has_nonlocal_statements: Whether the code uses nonlocal statements.
+        class_definitions: Set of class names defined.
+        async_operations: Whether the code contains async/await.
+    """
+    imports: set[str] = field(default_factory=set)
+    file_operations: list[tuple[str, list[str]]] = field(default_factory=list)
+    network_calls: list[tuple[str, list[str]]] = field(default_factory=list)
+    system_calls: list[tuple[str, list[str]]] = field(default_factory=list)
+    exec_eval_usage: list[tuple[str, list[str]]] = field(default_factory=list)
+    dangerous_builtins: set[str] = field(default_factory=set)
+    attribute_accesses: set[str] = field(default_factory=set)
+    function_calls: set[str] = field(default_factory=set)
+    has_global_statements: bool = False
+    has_nonlocal_statements: bool = False
+    class_definitions: set[str] = field(default_factory=set)
+    async_operations: bool = False
+# Builtin names treated as dangerous.  FeatureExtractor.visit_Name records any
+# reference to one of these names (called or not) in
+# CodeFeatures.dangerous_builtins.
+DANGEROUS_BUILTINS = frozenset(
+    {
+        "eval",
+        "exec",
+        "compile",
+        "__import__",
+        "open",
+        "input",
+        "breakpoint",
+        "memoryview",
+        "vars",
+        "dir",
+        "globals",
+        "locals",
+        "getattr",
+        "setattr",
+        "delattr",
+        "hasattr",
+    }
+)
+# Method names treated as file operations.  A call is classified as a file
+# operation when it is a bare ``open(...)`` or when its dotted name ends in
+# ``.<name>`` for one of these names (e.g. ``fh.write``).
+FILE_OPERATIONS = frozenset(
+    {
+        "open",
+        "read",
+        "write",
+        "close",
+        "seek",
+        "tell",
+        "readline",
+        "readlines",
+        "writelines",
+        "flush",
+        "truncate",
+    }
+)
+# Top-level names treated as network modules.  A dotted call whose first
+# component is in this set (e.g. ``requests.get``) is recorded as a network
+# call; undotted calls are never matched against it.
+NETWORK_MODULES = frozenset(
+    {
+        "socket",
+        "urllib",
+        "http",
+        "requests",
+        "httpx",
+        "aiohttp",
+        "ftplib",
+        "smtplib",
+        "poplib",
+        "imaplib",
+        "telnetlib",
+        "ssl",
+        "websocket",
+        "websockets",
+    }
+)
+# Dotted call names treated as system/process calls; every entry has the
+# form "<module>.<function>".
+# NOTE(review): "os.spawn" and "os.exec" are not functions in the os module;
+# presumably placeholders for the spawn*/exec* families listed after them --
+# confirm whether they are still needed.
+SYSTEM_CALL_PATTERNS = frozenset(
+    {
+        "os.system",
+        "os.popen",
+        "os.spawn",
+        "os.spawnl",
+        "os.spawnle",
+        "os.spawnlp",
+        "os.spawnlpe",
+        "os.spawnv",
+        "os.spawnve",
+        "os.spawnvp",
+        "os.spawnvpe",
+        "os.exec",
+        "os.execl",
+        "os.execle",
+        "os.execlp",
+        "os.execlpe",
+        "os.execv",
+        "os.execve",
+        "os.execvp",
+        "os.execvpe",
+        "os.fork",
+        "os.forkpty",
+        "os.kill",
+        "os.killpg",
+        "subprocess.run",
+        "subprocess.call",
+        "subprocess.check_call",
+        "subprocess.check_output",
+        "subprocess.Popen",
+        "subprocess.getoutput",
+        "subprocess.getstatusoutput",
+        "pty.spawn",
+        "pty.fork",
+    }
+)
+class FeatureExtractor(ast.NodeVisitor):
+    """AST visitor that extracts security-relevant features from Python code.
+    Usage::
+        extractor = FeatureExtractor()
+        extractor.visit(ast.parse(source_code))
+        features = extractor.features
+    """
+    def __init__(self) -> None:
+        self.features = CodeFeatures()
+        self._current_module_context: list[str] = []
+    def visit_Import(self, node: ast.Import) -> None:
+        """Handle import statements."""
+        for alias in node.names:
+            self.features.imports.add(alias.name.split(".")[0])
+        self.generic_visit(node)
+    def visit_ImportFrom(self, node: ast.ImportFrom) -> None:
+        """Handle from ... import statements."""
+        if node.module:
+            self.features.imports.add(node.module.split(".")[0])
+        self.generic_visit(node)
+    def visit_Call(self, node: ast.Call) -> None:
+        """Handle function calls."""
+        call_name = self._get_call_name(node)
+        if call_name:
+            self.features.function_calls.add(call_name)
+            self._classify_call(call_name, node)
+        self.generic_visit(node)
+    def visit_Attribute(self, node: ast.Attribute) -> None:
+        """Handle attribute access."""
+        attr_chain = self._get_attribute_chain(node)
+        if attr_chain:
+            self.features.attribute_accesses.add(attr_chain)
+        self.generic_visit(node)
+    def visit_Name(self, node: ast.Name) -> None:
+        """Handle name references (potential builtin usage)."""
+        if node.id in DANGEROUS_BUILTINS:
+            self.features.dangerous_builtins.add(node.id)
+        self.generic_visit(node)
+    def visit_Global(self, node: ast.Global) -> None:
+        """Handle global statements."""
+        self.features.has_global_statements = True
+        self.generic_visit(node)
+    def visit_Nonlocal(self, node: ast.Nonlocal) -> None:
+        """Handle nonlocal statements."""
+        self.features.has_nonlocal_statements = True
+        self.generic_visit(node)
+    def visit_ClassDef(self, node: ast.ClassDef) -> None:
+        """Handle class definitions."""
+        self.features.class_definitions.add(node.name)
+        self.generic_visit(node)
+    def visit_AsyncFunctionDef(self, node: ast.AsyncFunctionDef) -> None:
+        """Handle async function definitions."""
+        self.features.async_operations = True
+        self.generic_visit(node)
+    def visit_Await(self, node: ast.Await) -> None:
+        """Handle await expressions."""
+        self.features.async_operations = True
+        self.generic_visit(node)
+    def visit_AsyncFor(self, node: ast.AsyncFor) -> None:
+        """Handle async for loops."""
+        self.features.async_operations = True
+        self.generic_visit(node)
+    def visit_AsyncWith(self, node: ast.AsyncWith) -> None:
+        """Handle async with statements."""
+        self.features.async_operations = True
+        self.generic_visit(node)
+    def _get_call_name(self, node: ast.Call) -> str | None:
+        """Extract the full call name from a Call node."""
+        if isinstance(node.func, ast.Name):
+            return node.func.id
+        elif isinstance(node.func, ast.Attribute):
+            return self._get_attribute_chain(node.func)
+        return None
+    def _get_attribute_chain(self, node: ast.Attribute) -> str | None:
+        """Build the full attribute chain (e.g., 'os.path.join')."""
+        parts: list[str] = [node.attr]
+        current = node.value
+        while isinstance(current, ast.Attribute):
+            parts.append(current.attr)
+            current = current.value
+        if isinstance(current, ast.Name):
+            parts.append(current.id)
+            return ".".join(reversed(parts))
+        return None
+    def _get_call_args_as_strings(self, node: ast.Call) -> list[str]:
+        """Extract string representations of call arguments."""
+        args: list[str] = []
+        for arg in node.args:
+            if isinstance(arg, ast.Constant) and isinstance(arg.value, str):
+                args.append(arg.value)
+            else:
+                args.append(ast.dump(arg))
+        return args
+    def _classify_call(self, call_name: str, node: ast.Call) -> None:
+        """Classify a function call into categories."""
+        args = self._get_call_args_as_strings(node)
+        # Check for exec/eval
+        if call_name in ("exec", "eval", "compile"):
+            self.features.exec_eval_usage.append((call_name, args))
+        # Check for file operations
+        if (
+            call_name == "open"
+            or call_name.endswith(".open")
+            or any(call_name.endswith(f".{op}") for op in FILE_OPERATIONS)
+        ):
+            self.features.file_operations.append((call_name, args))
+        # Check for system calls
+        if call_name in SYSTEM_CALL_PATTERNS or any(
+            call_name.startswith(pattern.rsplit(".", 1)[0])
+            for pattern in SYSTEM_CALL_PATTERNS
+            if call_name.endswith(pattern.rsplit(".", 1)[-1])
+        ):
+            self.features.system_calls.append((call_name, args))
+        # Check for network calls
+        module_prefix = call_name.split(".")[0] if "." in call_name else ""
+        if module_prefix in NETWORK_MODULES:
+            self.features.network_calls.append((call_name, args))
+def extract_features(source: str) -> CodeFeatures:
+    """Extract security-relevant features from Python source code.
+    Args:
+        source: Python source code as a string.
+    Returns:
+        CodeFeatures dataclass with extracted features.
+    Raises:
+        SyntaxError: If the source code is not valid Python.
+    """
+    tree = ast.parse(source)
+    extractor = FeatureExtractor()
+    extractor.visit(tree)
+    return extractor.features

prompture/analysis/risk_scoring.py ADDED Viewed

@@ -0,0 +1,219 @@
+"""Risk scoring for Python code analysis.
+Calculates risk levels based on detected code features.
+"""
+from __future__ import annotations
+import enum
+from dataclasses import dataclass, field
+from .ast_visitors import CodeFeatures
+# Always-blocked imports that represent severe security risks.
+# calculate_risk adds 100 points when any of these is imported (reaching the
+# score cap on its own) and reports the matches as blocked imports.
+CRITICAL_IMPORTS = frozenset(
+    {
+        "ctypes",
+        "multiprocessing",
+        "threading",
+        "_thread",
+        "gc",
+        "sys",
+        "builtins",
+        "importlib",
+        "pkgutil",
+        "code",
+        "codeop",
+        "rlcompleter",
+        "pdb",
+        "bdb",
+        "trace",
+        "traceback",
+        "linecache",
+        "inspect",
+        "dis",
+        "pickletools",
+        "formatter",
+        "msilib",
+        "winreg",
+        "_winapi",
+        "posix",
+        "posixpath",
+        "nt",
+        "ntpath",
+        "_posixsubprocess",
+    }
+)
+# High-risk imports.  calculate_risk adds 40 points when any of these is
+# imported and lists the matches among the reasons; they are not added to
+# the blocked imports.
+HIGH_RISK_IMPORTS = frozenset(
+    {
+        "os",
+        "subprocess",
+        "shutil",
+        "pathlib",
+        "pickle",
+        "shelve",
+        "marshal",
+        "socket",
+        "ssl",
+        "asyncio",
+        "signal",
+        "pty",
+        "tty",
+        "termios",
+        "resource",
+        "syslog",
+        "tempfile",
+        "glob",
+        "fnmatch",
+    }
+)
+# Medium-risk imports.  calculate_risk adds 15 points when any of these is
+# imported and reports the matches as a warning rather than a reason.
+MEDIUM_RISK_IMPORTS = frozenset(
+    {
+        "urllib",
+        "http",
+        "email",
+        "mailbox",
+        "mimetypes",
+        "base64",
+        "binascii",
+        "quopri",
+        "uu",
+        "html",
+        "xml",
+        "configparser",
+        "logging",
+        "warnings",
+        "contextlib",
+        "abc",
+        "atexit",
+        "weakref",
+        "copy",
+        "pprint",
+        "reprlib",
+    }
+)
+class RiskLevel(str, enum.Enum):
+    """Risk level classification for code analysis.
+    Members are also ``str`` instances, so each compares equal to its
+    lowercase value (e.g. ``RiskLevel.HIGH == "high"``).  calculate_risk
+    assigns a level from the capped score: >= 70 critical, >= 40 high,
+    >= 15 medium, otherwise low.
+    """
+    LOW = "low"
+    MEDIUM = "medium"
+    HIGH = "high"
+    CRITICAL = "critical"
+@dataclass
+class RiskAssessment:
+    """Detailed risk assessment for analyzed code.
+    Attributes:
+        level: Overall risk level.
+        score: Numeric risk score (0-100); calculate_risk caps it at 100.
+        reasons: List of reasons contributing to the risk.
+        blocked_imports: Imports that would be blocked; calculate_risk fills
+            this with the critical imports it finds.
+        warnings: Non-blocking warnings about the code.
+    """
+    level: RiskLevel
+    score: int
+    reasons: list[str] = field(default_factory=list)
+    blocked_imports: set[str] = field(default_factory=set)
+    warnings: list[str] = field(default_factory=list)
+def calculate_risk(features: CodeFeatures) -> RiskAssessment:
+    """Calculate risk score and level from extracted code features.
+    Args:
+        features: CodeFeatures from AST analysis.
+    Returns:
+        RiskAssessment with level, score, reasons, and warnings.
+    """
+    score = 0
+    reasons: list[str] = []
+    warnings: list[str] = []
+    blocked_imports: set[str] = set()
+    # Check critical imports (instant critical)
+    critical_found = features.imports & CRITICAL_IMPORTS
+    if critical_found:
+        score += 100
+        blocked_imports.update(critical_found)
+        reasons.append(f"Critical imports detected: {', '.join(sorted(critical_found))}")
+    # Check high-risk imports
+    high_risk_found = features.imports & HIGH_RISK_IMPORTS
+    if high_risk_found:
+        score += 40
+        reasons.append(f"High-risk imports: {', '.join(sorted(high_risk_found))}")
+    # Check medium-risk imports
+    medium_risk_found = features.imports & MEDIUM_RISK_IMPORTS
+    if medium_risk_found:
+        score += 15
+        warnings.append(f"Medium-risk imports: {', '.join(sorted(medium_risk_found))}")
+    # Check exec/eval usage (critical)
+    if features.exec_eval_usage:
+        score += 80
+        calls = [call[0] for call in features.exec_eval_usage]
+        reasons.append(f"Dynamic code execution: {', '.join(calls)}")
+    # Check system calls (critical)
+    if features.system_calls:
+        score += 80
+        calls = [call[0] for call in features.system_calls]
+        reasons.append(f"System calls detected: {', '.join(calls)}")
+    # Check network calls (high)
+    if features.network_calls:
+        score += 35
+        calls = [call[0] for call in features.network_calls]
+        reasons.append(f"Network operations: {', '.join(calls)}")
+    # Check file operations (medium-high depending on context)
+    if features.file_operations:
+        score += 25
+        calls = [call[0] for call in features.file_operations]
+        warnings.append(f"File operations: {', '.join(calls)}")
+    # Check dangerous builtins
+    if features.dangerous_builtins:
+        score += 20
+        warnings.append(f"Dangerous builtins: {', '.join(sorted(features.dangerous_builtins))}")
+    # Check for global/nonlocal (can be used to escape sandbox)
+    if features.has_global_statements:
+        score += 10
+        warnings.append("Uses global statements")
+    if features.has_nonlocal_statements:
+        score += 5
+        warnings.append("Uses nonlocal statements")
+    # Cap score at 100
+    score = min(score, 100)
+    # Determine level
+    if score >= 70:
+        level = RiskLevel.CRITICAL
+    elif score >= 40:
+        level = RiskLevel.HIGH
+    elif score >= 15:
+        level = RiskLevel.MEDIUM
+    else:
+        level = RiskLevel.LOW
+    return RiskAssessment(
+        level=level,
+        score=score,
+        reasons=reasons,
+        blocked_imports=blocked_imports,
+        warnings=warnings,
+    )

prompture 0.0.50__py3-none-any.whl → 0.0.51.dev1__py3-none-any.whl

prompture 0.0.50__py3-none-any.whl → 0.0.51.dev1__py3-none-any.whl