iam-policy-validator 1.10.2__py3-none-any.whl → 1.11.0__py3-none-any.whl

This diff compares the contents of publicly available package versions as they appear in their public registry and is provided for informational purposes only.
Files changed (27)
  1. iam_policy_validator-1.11.0.dist-info/METADATA +782 -0
  2. {iam_policy_validator-1.10.2.dist-info → iam_policy_validator-1.11.0.dist-info}/RECORD +26 -22
  3. iam_validator/__version__.py +1 -1
  4. iam_validator/checks/action_condition_enforcement.py +27 -14
  5. iam_validator/checks/sensitive_action.py +123 -11
  6. iam_validator/checks/utils/policy_level_checks.py +47 -10
  7. iam_validator/checks/wildcard_resource.py +29 -7
  8. iam_validator/commands/__init__.py +6 -0
  9. iam_validator/commands/completion.py +420 -0
  10. iam_validator/commands/query.py +485 -0
  11. iam_validator/commands/validate.py +21 -26
  12. iam_validator/core/config/category_suggestions.py +77 -0
  13. iam_validator/core/config/condition_requirements.py +105 -54
  14. iam_validator/core/config/defaults.py +110 -6
  15. iam_validator/core/config/wildcards.py +3 -0
  16. iam_validator/core/diff_parser.py +321 -0
  17. iam_validator/core/formatters/enhanced.py +34 -27
  18. iam_validator/core/models.py +2 -0
  19. iam_validator/core/pr_commenter.py +179 -51
  20. iam_validator/core/report.py +19 -17
  21. iam_validator/integrations/github_integration.py +250 -1
  22. iam_validator/sdk/__init__.py +33 -0
  23. iam_validator/sdk/query_utils.py +454 -0
  24. iam_policy_validator-1.10.2.dist-info/METADATA +0 -549
  25. {iam_policy_validator-1.10.2.dist-info → iam_policy_validator-1.11.0.dist-info}/WHEEL +0 -0
  26. {iam_policy_validator-1.10.2.dist-info → iam_policy_validator-1.11.0.dist-info}/entry_points.txt +0 -0
  27. {iam_policy_validator-1.10.2.dist-info → iam_policy_validator-1.11.0.dist-info}/licenses/LICENSE +0 -0
iam_validator/core/diff_parser.py (new file)
@@ -0,0 +1,321 @@
+ """Diff Parser Module.
+
+ This module parses GitHub PR diff information to extract changed line numbers.
+ It supports GitHub's unified diff format and provides utilities for determining
+ which lines and statements were modified in a PR.
+ """
+
+ import logging
+ import re
+ from dataclasses import dataclass
+ from typing import Any
+
+ logger = logging.getLogger(__name__)
+
+
+ @dataclass
+ class ParsedDiff:
+     """Parsed GitHub PR diff information for a single file.
+
+     Attributes:
+         file_path: Relative path to the file from repository root
+         changed_lines: Set of all line numbers that were added or modified (new side)
+         added_lines: Set of line numbers that were added (new side)
+         deleted_lines: Set of line numbers that were deleted (old side)
+         status: File status (added, modified, removed, renamed)
+     """
+
+     file_path: str
+     changed_lines: set[int]
+     added_lines: set[int]
+     deleted_lines: set[int]
+     status: str
+
+
+ @dataclass
+ class StatementLocation:
+     """Location information for a statement in a policy file.
+
+     Attributes:
+         statement_index: Zero-based index of the statement
+         start_line: First line number of the statement (1-indexed)
+         end_line: Last line number of the statement (1-indexed)
+         has_changes: True if any line in this range was modified
+     """
+
+     statement_index: int
+     start_line: int
+     end_line: int
+     has_changes: bool
+
+
+ class DiffParser:
+     """Parser for GitHub PR diff information."""
+
+     @staticmethod
+     def parse_pr_files(pr_files: list[dict[str, Any]]) -> dict[str, ParsedDiff]:
+         """Parse GitHub PR files response to extract changed line information.
+
+         Args:
+             pr_files: List of file dicts from GitHub API's get_pr_files() call.
+                 Each dict contains: filename, status, patch, additions, deletions
+
+         Returns:
+             Dict mapping file paths to ParsedDiff objects
+
+         Example:
+             >>> pr_files = [{
+             ...     "filename": "policies/policy.json",
+             ...     "status": "modified",
+             ...     "patch": "@@ -5,3 +5,4 @@\\n context\\n-old\\n+new\\n+added"
+             ... }]
+             >>> result = DiffParser.parse_pr_files(pr_files)
+             >>> result["policies/policy.json"].changed_lines
+             {6, 7}
+         """
+         parsed: dict[str, ParsedDiff] = {}
+
+         for file_info in pr_files:
+             if not isinstance(file_info, dict):
+                 continue
+
+             filename = file_info.get("filename")
+             if not filename or not isinstance(filename, str):
+                 continue
+
+             status = file_info.get("status", "modified")
+             patch = file_info.get("patch")
+
+             # Files without patches (e.g., binary files, very large files)
+             if not patch or not isinstance(patch, str):
+                 logger.debug(f"No patch available for {filename}, skipping diff parsing")
+                 # Still track the file with empty change sets
+                 parsed[filename] = ParsedDiff(
+                     file_path=filename,
+                     changed_lines=set(),
+                     added_lines=set(),
+                     deleted_lines=set(),
+                     status=status,
+                 )
+                 continue
+
+             try:
+                 diff = DiffParser.parse_unified_diff(patch)
+                 parsed[filename] = ParsedDiff(
+                     file_path=filename,
+                     changed_lines=diff["changed_lines"],
+                     added_lines=diff["added_lines"],
+                     deleted_lines=diff["deleted_lines"],
+                     status=status,
+                 )
+                 logger.debug(
+                     f"Parsed diff for {filename}: {len(diff['changed_lines'])} changed lines"
+                 )
+             except Exception as e:  # pylint: disable=broad-exception-caught
+                 logger.warning(f"Failed to parse diff for {filename}: {e}")
+                 # Track file with empty change sets on parse error
+                 parsed[filename] = ParsedDiff(
+                     file_path=filename,
+                     changed_lines=set(),
+                     added_lines=set(),
+                     deleted_lines=set(),
+                     status=status,
+                 )
+
+         return parsed
+
+     @staticmethod
+     def parse_unified_diff(patch: str) -> dict[str, set[int]]:
+         """Parse a unified diff patch to extract changed line numbers.
+
+         Unified diff format uses @@ headers to indicate line ranges:
+             @@ -old_start,old_count +new_start,new_count @@
+
+         Lines starting with:
+         - '-' are deletions (old side line numbers)
+         - '+' are additions (new side line numbers)
+         - ' ' are context (both sides)
+
+         Args:
+             patch: Unified diff string from GitHub API
+
+         Returns:
+             Dict with keys:
+             - changed_lines: All added/modified lines (new side)
+             - added_lines: Only added lines (new side)
+             - deleted_lines: Only deleted lines (old side)
+
+         Example:
+             >>> patch = '''@@ -5,3 +5,4 @@
+             ...  context line
+             ... -deleted line
+             ... +added line
+             ... +another added line
+             ...  context line'''
+             >>> result = DiffParser.parse_unified_diff(patch)
+             >>> result['added_lines']
+             {6, 7}
+         """
+         changed_lines: set[int] = set()
+         added_lines: set[int] = set()
+         deleted_lines: set[int] = set()
+
+         # Pattern to match @@ -old_start,old_count +new_start,new_count @@ headers
+         # Handles variations: @@ -5,3 +5,4 @@, @@ -5 +5,2 @@, etc.
+         hunk_header_pattern = re.compile(r"^@@\s+-(\d+)(?:,(\d+))?\s+\+(\d+)(?:,(\d+))?\s+@@")
+
+         lines = patch.split("\n")
+         current_new_line = 0
+         current_old_line = 0
+
+         for line in lines:
+             # Check for hunk header
+             match = hunk_header_pattern.match(line)
+             if match:
+                 old_start = int(match.group(1))
+                 new_start = int(match.group(3))
+                 current_old_line = old_start
+                 current_new_line = new_start
+                 continue
+
+             # Process diff lines
+             if not line:
+                 continue
+
+             first_char = line[0]
+
+             if first_char == "+":
+                 # Addition (new side only)
+                 added_lines.add(current_new_line)
+                 changed_lines.add(current_new_line)
+                 current_new_line += 1
+             elif first_char == "-":
+                 # Deletion (old side only)
+                 deleted_lines.add(current_old_line)
+                 current_old_line += 1
+             elif first_char == " ":
+                 # Context line (both sides)
+                 current_new_line += 1
+                 current_old_line += 1
+             # Ignore lines that don't start with +, -, or space (e.g., \ No newline)
+
+         return {
+             "changed_lines": changed_lines,
+             "added_lines": added_lines,
+             "deleted_lines": deleted_lines,
+         }
+
+     @staticmethod
+     def get_modified_statements(
+         line_mapping: dict[int, int],
+         changed_lines: set[int],
+         policy_file: str,
+     ) -> dict[int, StatementLocation]:
+         """Determine which statements were modified based on changed lines.
+
+         A statement is considered modified if ANY line within its range appears
+         in the changed_lines set.
+
+         Args:
+             line_mapping: Dict mapping statement index to statement start line
+                 (from PRCommenter._get_line_mapping())
+             changed_lines: Set of line numbers that were changed in the PR
+             policy_file: Path to the policy file (to determine statement end lines)
+
+         Returns:
+             Dict mapping statement indices to StatementLocation objects.
+             Only includes statements that were modified.
+
+         Example:
+             >>> line_mapping = {0: 3, 1: 10, 2: 20}  # Statement starts
+             >>> changed_lines = {5, 6}  # Lines changed in statement 0
+             >>> result = get_modified_statements(line_mapping, changed_lines, "policy.json")
+             >>> result[0].has_changes
+             True
+             >>> 1 in result  # Statement 1 not modified
+             False
+         """
+         if not line_mapping or not changed_lines:
+             return {}
+
+         # Determine end line for each statement
+         statement_ranges: dict[int, tuple[int, int]] = {}
+         sorted_indices = sorted(line_mapping.keys())
+
+         for i, stmt_idx in enumerate(sorted_indices):
+             start_line = line_mapping[stmt_idx]
+
+             # End line is either:
+             # 1. One line before next statement starts, OR
+             # 2. EOF for the last statement
+             if i < len(sorted_indices) - 1:
+                 next_start = line_mapping[sorted_indices[i + 1]]
+                 end_line = next_start - 1
+             else:
+                 # For last statement, try to read file to get actual end
+                 end_line = DiffParser.get_statement_end_line(policy_file, start_line)
+
+             statement_ranges[stmt_idx] = (start_line, end_line)
+
+         # Check which statements have changes
+         modified_statements: dict[int, StatementLocation] = {}
+
+         for stmt_idx, (start_line, end_line) in statement_ranges.items():
+             # Check if any line in this statement's range was changed
+             statement_lines = set(range(start_line, end_line + 1))
+             has_changes = bool(statement_lines & changed_lines)
+
+             if has_changes:
+                 modified_statements[stmt_idx] = StatementLocation(
+                     statement_index=stmt_idx,
+                     start_line=start_line,
+                     end_line=end_line,
+                     has_changes=True,
+                 )
+                 logger.debug(f"Statement {stmt_idx} (lines {start_line}-{end_line}) was modified")
+
+         return modified_statements
+
+     @staticmethod
+     def get_statement_end_line(policy_file: str, start_line: int) -> int:
+         """Find the end line of a statement block starting at start_line.
+
+         Tracks brace depth to find where the statement object closes.
+
+         Args:
+             policy_file: Path to policy file
+             start_line: Line number where statement starts (1-indexed)
+
+         Returns:
+             Line number where statement ends (1-indexed)
+         """
+         try:
+             with open(policy_file, encoding="utf-8") as f:
+                 lines = f.readlines()
+
+             # Start counting from the statement's opening brace
+             brace_depth = 0
+             in_statement = False
+
+             for line_num in range(start_line - 1, len(lines)):  # Convert to 0-indexed
+                 line = lines[line_num]
+
+                 # Track braces
+                 for char in line:
+                     if char == "{":
+                         brace_depth += 1
+                         in_statement = True
+                     elif char == "}":
+                         brace_depth -= 1
+
+                 # Found the closing brace for this statement
+                 if in_statement and brace_depth == 0:
+                     return line_num + 1  # Convert back to 1-indexed
+
+             # If we couldn't find the end, return a reasonable default
+             # (start_line + 20 or end of file)
+             return min(start_line + 20, len(lines))
+
+         except Exception as e:  # pylint: disable=broad-exception-caught
+             logger.debug(f"Could not determine statement end line: {e}")
+             return start_line + 10  # Reasonable default
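
For orientation, a minimal usage sketch of the new parser (the patch string below is invented for illustration; the import path follows the module location above):

    from iam_validator.core.diff_parser import DiffParser

    patch = (
        "@@ -5,3 +5,4 @@\n"
        " context line\n"
        "-deleted line\n"
        "+added line\n"
        "+another added line\n"
        " context line"
    )

    result = DiffParser.parse_unified_diff(patch)
    print(result["added_lines"])    # {6, 7}  (new-side line numbers)
    print(result["deleted_lines"])  # {6}     (old-side line number)
    print(result["changed_lines"])  # {6, 7}
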
iam_validator/core/formatters/enhanced.py
@@ -61,7 +61,6 @@ class EnhancedFormatter(OutputFormatter):
          )

          # Header with title
-         console.print()
          title = Text(
              f"IAM Policy Validation Report (v{__version__})",
              style="bold cyan",
@@ -75,7 +74,6 @@ class EnhancedFormatter(OutputFormatter):
                  width=constants.CONSOLE_PANEL_WIDTH,
              )
          )
-         console.print()

          # Executive Summary with progress bars (optional)
          if show_summary:
@@ -83,12 +81,15 @@ class EnhancedFormatter(OutputFormatter):

          # Severity breakdown if there are issues (optional)
          if show_severity_breakdown and report.total_issues > 0:
-             console.print()
              self._print_severity_breakdown(console, report)

-         console.print()
-         console.print(Rule(title="[bold]Detailed Results", style=constants.CONSOLE_HEADER_COLOR))
-         console.print()
+         console.print(
+             Rule(
+                 title="[bold]Detailed Results",
+                 style=constants.CONSOLE_HEADER_COLOR,
+             ),
+             width=constants.CONSOLE_PANEL_WIDTH,
+         )

          # Detailed results using tree structure
          for idx, result in enumerate(report.results, 1):
@@ -99,7 +100,7 @@ class EnhancedFormatter(OutputFormatter):
          self._print_final_status(console, report)

          # Get the formatted output
-         output = string_buffer.getvalue()
+         output = string_buffer.getvalue().rstrip("\n")
          string_buffer.close()

          return output
@@ -305,13 +306,10 @@ class EnhancedFormatter(OutputFormatter):
          if not result.issues:
              console.print(header)
              console.print(" [dim italic]No issues detected[/dim italic]")
-             console.print()
              return

          console.print(header)
          console.print(f" [dim]{len(result.issues)} issue(s) found[/dim]")
-         console.print()
-
          # Create tree structure for issues
          tree = Tree(f"[bold]Issues ({len(result.issues)})[/bold]", guide_style="bright_black")

@@ -372,10 +370,14 @@ class EnhancedFormatter(OutputFormatter):
      def _add_issue_to_tree(self, branch: Tree, issue, color: str) -> None:
          """Add an issue to a tree branch."""
          # Build location string (use 1-indexed statement numbers for user-facing output)
-         statement_num = issue.statement_index + 1
-         location = f"Statement {statement_num}"
-         if issue.statement_sid:
-             location = f"{issue.statement_sid} (#{statement_num})"
+         # Handle policy-level issues (statement_index = -1)
+         if issue.statement_index == -1:
+             location = "Policy-level"
+         else:
+             statement_num = issue.statement_index + 1
+             location = f"Statement {statement_num}"
+             if issue.statement_sid:
+                 location = f"{issue.statement_sid} (#{statement_num})"
          if issue.line_number is not None:
              location += f" @L{issue.line_number}"

@@ -399,19 +401,24 @@ class EnhancedFormatter(OutputFormatter):
              details.append(f"Condition: {issue.condition_key}")
          msg_node.add(Text(" • ".join(details), style="dim cyan"))

-         # Suggestion
-         if issue.suggestion:
-             suggestion_text = Text()
-             suggestion_text.append("💡 ", style="yellow")
-             suggestion_text.append(issue.suggestion, style="italic yellow")
-             msg_node.add(suggestion_text)
+         # Suggestion and Example - combine into single node to reduce spacing
+         if issue.suggestion or issue.example:
+             combined_text = Text()
+
+             # Add suggestion
+             if issue.suggestion:
+                 combined_text.append("💡 ", style="yellow")
+                 combined_text.append(issue.suggestion, style="italic yellow")
+
+             # Add example on same node (reduces vertical spacing)
+             if issue.example:
+                 if issue.suggestion:
+                     combined_text.append("\n", style="yellow")  # Single newline separator
+                 combined_text.append("Example:", style="bold cyan")
+                 combined_text.append("\n")
+                 combined_text.append(issue.example, style="dim")

-         # Example (if present, show with indentation)
-         if issue.example:
-             msg_node.add(Text("Example:", style="bold cyan"))
-             # Show example code with syntax highlighting
-             example_text = Text(issue.example, style="dim")
-             msg_node.add(example_text)
+             msg_node.add(combined_text)

      def _print_final_status(self, console: Console, report: ValidationReport) -> None:
          """Print final status panel."""
@@ -461,7 +468,7 @@ class EnhancedFormatter(OutputFormatter):
          # Combine status and message
          final_text = Text()
          final_text.append(status)
-         final_text.append("\n\n")
+         final_text.append("\n")  # Reduced from \n\n to single newline
          final_text.append(message)

          console.print(
iam_validator/core/models.py
@@ -233,6 +233,8 @@ class ValidationIssue(BaseModel):
          if include_identifier:
              parts.append(f"{constants.REVIEW_IDENTIFIER}\n")
              parts.append(f"{constants.BOT_IDENTIFIER}\n")
+             # Add issue type identifier to allow multiple issues at same line
+             parts.append(f"<!-- issue-type: {self.issue_type} -->\n")

          # Build statement context for better navigation
          statement_context = f"Statement[{self.statement_index}]"
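
The "<!-- issue-type: ... -->" marker added above is what lets the PR commenter distinguish several findings that land on the same line. A rough, hypothetical illustration of the idea (the helper below is not part of the package, and the type names are example values borrowed from the check modules listed earlier):

    def is_duplicate_comment(existing_bodies: list[str], issue_type: str) -> bool:
        """Return True if a posted comment already carries this issue-type marker."""
        marker = f"<!-- issue-type: {issue_type} -->"
        return any(marker in body for body in existing_bodies)

    bodies = ["... <!-- issue-type: wildcard_resource --> Statement[0] uses Resource: * ..."]
    print(is_duplicate_comment(bodies, "wildcard_resource"))  # True  -> skip re-posting
    print(is_duplicate_comment(bodies, "sensitive_action"))   # False -> a second comment on the same line is allowed
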