PyPI - thailint - Versions diffs - 0.8.0__py3-none-any.whl → 0.10.0__py3-none-any.whl - Mend

thailint 0.8.0py3-none-any.whl → 0.10.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (46) hide show

src/cli.py +242 -0
src/config.py +2 -3
src/core/base.py +4 -0
src/core/rule_discovery.py +143 -84
src/core/violation_builder.py +75 -15
src/linter_config/loader.py +43 -11
src/linters/collection_pipeline/__init__.py +90 -0
src/linters/collection_pipeline/config.py +63 -0
src/linters/collection_pipeline/continue_analyzer.py +100 -0
src/linters/collection_pipeline/detector.py +130 -0
src/linters/collection_pipeline/linter.py +437 -0
src/linters/collection_pipeline/suggestion_builder.py +63 -0
src/linters/dry/block_filter.py +6 -8
src/linters/dry/block_grouper.py +4 -0
src/linters/dry/cache_query.py +4 -0
src/linters/dry/python_analyzer.py +34 -18
src/linters/dry/token_hasher.py +5 -1
src/linters/dry/typescript_analyzer.py +61 -31
src/linters/dry/violation_builder.py +4 -0
src/linters/dry/violation_filter.py +4 -0
src/linters/file_header/bash_parser.py +4 -0
src/linters/file_header/linter.py +7 -11
src/linters/file_placement/directory_matcher.py +4 -0
src/linters/file_placement/linter.py +28 -8
src/linters/file_placement/pattern_matcher.py +4 -0
src/linters/file_placement/pattern_validator.py +4 -0
src/linters/magic_numbers/context_analyzer.py +4 -0
src/linters/magic_numbers/typescript_analyzer.py +4 -0
src/linters/nesting/python_analyzer.py +4 -0
src/linters/nesting/typescript_function_extractor.py +4 -0
src/linters/print_statements/typescript_analyzer.py +4 -0
src/linters/srp/class_analyzer.py +4 -0
src/linters/srp/heuristics.py +4 -3
src/linters/srp/linter.py +2 -3
src/linters/srp/python_analyzer.py +55 -20
src/linters/srp/typescript_metrics_calculator.py +83 -47
src/linters/srp/violation_builder.py +4 -0
src/linters/stateless_class/__init__.py +25 -0
src/linters/stateless_class/config.py +58 -0
src/linters/stateless_class/linter.py +355 -0
src/linters/stateless_class/python_analyzer.py +299 -0
{thailint-0.8.0.dist-info → thailint-0.10.0.dist-info}/METADATA +226 -3
{thailint-0.8.0.dist-info → thailint-0.10.0.dist-info}/RECORD +46 -36
{thailint-0.8.0.dist-info → thailint-0.10.0.dist-info}/WHEEL +0 -0
{thailint-0.8.0.dist-info → thailint-0.10.0.dist-info}/entry_points.txt +0 -0
{thailint-0.8.0.dist-info → thailint-0.10.0.dist-info}/licenses/LICENSE +0 -0

src/linters/collection_pipeline/linter.py ADDED Viewed

@@ -0,0 +1,437 @@
+"""
+Purpose: CollectionPipelineRule implementation for detecting loop filtering anti-patterns
+Scope: Main rule class implementing BaseLintRule interface for collection-pipeline detection
+Overview: Implements the BaseLintRule interface to detect for loops with embedded
+    filtering logic that could be refactored to collection pipelines. Detects patterns
+    like 'for x in iter: if not cond: continue; action(x)' which can be refactored to
+    use generator expressions or filter(). Based on Martin Fowler's refactoring pattern.
+    Integrates with thai-lint CLI and supports text, JSON, and SARIF output formats.
+    Supports comprehensive 5-level ignore system including project-level patterns,
+    linter-specific ignore patterns, file-level directives, line-level directives,
+    and block-level directives via IgnoreDirectiveParser.
+Dependencies: BaseLintRule, BaseLintContext, Violation, PipelinePatternDetector,
+    CollectionPipelineConfig, IgnoreDirectiveParser
+Exports: CollectionPipelineRule class
+Interfaces: CollectionPipelineRule.check(context) -> list[Violation], rule metadata properties
+Implementation: Uses PipelinePatternDetector for AST analysis, composition pattern with
+    config loading and comprehensive ignore checking via IgnoreDirectiveParser
+"""
+from pathlib import Path
+from src.core.base import BaseLintContext, BaseLintRule
+from src.core.types import Severity, Violation
+from src.linter_config.ignore import IgnoreDirectiveParser
+from .config import CollectionPipelineConfig
+from .detector import PatternMatch, PipelinePatternDetector
+class CollectionPipelineRule(BaseLintRule):  # thailint: ignore[srp,dry]
+    """Detects for loops with embedded filtering that could use collection pipelines."""
+    def __init__(self) -> None:
+        """Initialize the rule with ignore parser."""
+        self._ignore_parser = IgnoreDirectiveParser()
+    @property
+    def rule_id(self) -> str:
+        """Unique identifier for this rule."""
+        return "collection-pipeline.embedded-filter"
+    @property
+    def rule_name(self) -> str:
+        """Human-readable name for this rule."""
+        return "Embedded Loop Filtering"
+    @property
+    def description(self) -> str:
+        """Description of what this rule checks."""
+        return (
+            "For loops with embedded if/continue filtering patterns should be "
+            "refactored to use collection pipelines (generator expressions, filter())"
+        )
+    def check(self, context: BaseLintContext) -> list[Violation]:
+        """Check for collection pipeline anti-patterns.
+        Args:
+            context: Lint context with file information
+        Returns:
+            List of violations found
+        """
+        if not self._should_analyze(context):
+            return []
+        config = self._load_config(context)
+        if not config.enabled:
+            return []
+        if self._is_file_ignored(context, config):
+            return []
+        if self._has_file_level_ignore(context):
+            return []
+        return self._analyze_python(context, config)
+    def _should_analyze(self, context: BaseLintContext) -> bool:
+        """Check if context should be analyzed.
+        Args:
+            context: Lint context
+        Returns:
+            True if should analyze
+        """
+        return context.language == "python" and context.file_content is not None
+    def _get_config_dict(self, context: BaseLintContext) -> dict | None:
+        """Get configuration dictionary from context.
+        Args:
+            context: Lint context
+        Returns:
+            Config dict or None
+        """
+        if hasattr(context, "config") and context.config is not None:
+            return context.config
+        if hasattr(context, "metadata") and context.metadata is not None:
+            return context.metadata
+        return None
+    def _load_config(self, context: BaseLintContext) -> CollectionPipelineConfig:
+        """Load configuration from context.
+        Args:
+            context: Lint context
+        Returns:
+            CollectionPipelineConfig instance
+        """
+        config_dict = self._get_config_dict(context)
+        if config_dict is None or not isinstance(config_dict, dict):
+            return CollectionPipelineConfig()
+        # Check for collection_pipeline or collection-pipeline specific config
+        linter_config = config_dict.get(
+            "collection_pipeline", config_dict.get("collection-pipeline", config_dict)
+        )
+        return CollectionPipelineConfig.from_dict(linter_config)
+    def _is_file_ignored(self, context: BaseLintContext, config: CollectionPipelineConfig) -> bool:
+        """Check if file matches ignore patterns.
+        Args:
+            context: Lint context
+            config: Configuration
+        Returns:
+            True if file should be ignored
+        """
+        if not config.ignore:
+            return False
+        if not context.file_path:
+            return False
+        file_path = Path(context.file_path)
+        for pattern in config.ignore:
+            if self._matches_pattern(file_path, pattern):
+                return True
+        return False
+    def _matches_pattern(self, file_path: Path, pattern: str) -> bool:
+        """Check if file path matches a glob pattern.
+        Args:
+            file_path: Path to check
+            pattern: Glob pattern
+        Returns:
+            True if path matches pattern
+        """
+        if file_path.match(pattern):
+            return True
+        if pattern in str(file_path):
+            return True
+        return False
+    def _has_file_level_ignore(self, context: BaseLintContext) -> bool:
+        """Check if file has file-level ignore directive.
+        Args:
+            context: Lint context
+        Returns:
+            True if file should be ignored at file level
+        """
+        if not context.file_content:
+            return False
+        # Check first 10 lines for ignore-file directive
+        lines = context.file_content.splitlines()[:10]
+        for line in lines:
+            if self._is_file_ignore_directive(line):
+                return True
+        return False
+    def _is_file_ignore_directive(self, line: str) -> bool:
+        """Check if line is a file-level ignore directive.
+        Args:
+            line: Line to check
+        Returns:
+            True if line has file-level ignore for this rule
+        """
+        line_lower = line.lower()
+        if "thailint: ignore-file" not in line_lower:
+            return False
+        # Check for general ignore-file (no rule specified)
+        if "ignore-file[" not in line_lower:
+            return True
+        # Check for rule-specific ignore
+        return self._matches_rule_ignore(line_lower, "ignore-file")
+    def _matches_rule_ignore(self, line: str, directive: str) -> bool:
+        """Check if line matches rule-specific ignore.
+        Args:
+            line: Line to check (lowercase)
+            directive: Directive name (ignore-file or ignore)
+        Returns:
+            True if ignore applies to this rule
+        """
+        import re
+        pattern = rf"{directive}\[([^\]]+)\]"
+        match = re.search(pattern, line)
+        if not match:
+            return False
+        rules = [r.strip().lower() for r in match.group(1).split(",")]
+        return any(self._rule_matches(r) for r in rules)
+    def _rule_matches(self, rule_pattern: str) -> bool:
+        """Check if rule pattern matches this rule.
+        Args:
+            rule_pattern: Rule pattern to check
+        Returns:
+            True if pattern matches this rule
+        """
+        rule_id_lower = self.rule_id.lower()
+        pattern_lower = rule_pattern.lower()
+        # Exact match
+        if rule_id_lower == pattern_lower:
+            return True
+        # Prefix match: collection-pipeline matches collection-pipeline.embedded-filter
+        if rule_id_lower.startswith(pattern_lower + "."):
+            return True
+        # Wildcard match: collection-pipeline.* matches collection-pipeline.embedded-filter
+        if pattern_lower.endswith("*"):
+            prefix = pattern_lower[:-1]
+            return rule_id_lower.startswith(prefix)
+        return False
+    def _analyze_python(
+        self, context: BaseLintContext, config: CollectionPipelineConfig
+    ) -> list[Violation]:
+        """Analyze Python code for collection pipeline patterns.
+        Args:
+            context: Lint context with Python file information
+            config: Collection pipeline configuration
+        Returns:
+            List of violations found
+        """
+        detector = PipelinePatternDetector(context.file_content or "")
+        matches = detector.detect_patterns()
+        return self._filter_matches_to_violations(matches, config, context)
+    def _filter_matches_to_violations(
+        self,
+        matches: list[PatternMatch],
+        config: CollectionPipelineConfig,
+        context: BaseLintContext,
+    ) -> list[Violation]:
+        """Filter matches by threshold and ignore rules.
+        Args:
+            matches: Detected pattern matches
+            config: Configuration with thresholds
+            context: Lint context
+        Returns:
+            List of violations after filtering
+        """
+        violations: list[Violation] = []
+        for match in matches:
+            violation = self._process_match(match, config, context)
+            if violation:
+                violations.append(violation)
+        return violations
+    def _process_match(
+        self,
+        match: PatternMatch,
+        config: CollectionPipelineConfig,
+        context: BaseLintContext,
+    ) -> Violation | None:
+        """Process a single match into a violation if applicable.
+        Args:
+            match: Pattern match to process
+            config: Configuration with thresholds
+            context: Lint context
+        Returns:
+            Violation if match should be reported, None otherwise
+        """
+        if len(match.conditions) < config.min_continues:
+            return None
+        violation = self._create_violation(match, context)
+        if self._should_ignore_violation(violation, match.line_number, context):
+            return None
+        return violation
+    def _should_ignore_violation(
+        self, violation: Violation, line_num: int, context: BaseLintContext
+    ) -> bool:
+        """Check if violation should be ignored.
+        Args:
+            violation: Violation to check
+            line_num: Line number of the violation
+            context: Lint context
+        Returns:
+            True if violation should be ignored
+        """
+        if not context.file_content:
+            return False
+        # Check using IgnoreDirectiveParser for comprehensive ignore checking
+        if self._ignore_parser.should_ignore_violation(violation, context.file_content):
+            return True
+        # Also check inline ignore on loop line
+        return self._has_inline_ignore(line_num, context)
+    def _has_inline_ignore(self, line_num: int, context: BaseLintContext) -> bool:
+        """Check for inline ignore directive on loop line.
+        Args:
+            line_num: Line number to check
+            context: Lint context
+        Returns:
+            True if line has ignore directive
+        """
+        line = self._get_line_text(line_num, context)
+        if not line:
+            return False
+        return self._is_ignore_directive(line.lower())
+    def _get_line_text(self, line_num: int, context: BaseLintContext) -> str | None:
+        """Get text of a specific line.
+        Args:
+            line_num: Line number (1-indexed)
+            context: Lint context
+        Returns:
+            Line text or None if invalid
+        """
+        if not context.file_content:
+            return None
+        lines = context.file_content.splitlines()
+        if line_num <= 0 or line_num > len(lines):
+            return None
+        return lines[line_num - 1]
+    def _is_ignore_directive(self, line: str) -> bool:
+        """Check if line contains ignore directive for this rule.
+        Args:
+            line: Line text (lowercase)
+        Returns:
+            True if line has applicable ignore directive
+        """
+        if "thailint:" not in line or "ignore" not in line:
+            return False
+        # General ignore (no rule specified)
+        if "ignore[" not in line:
+            return True
+        # Rule-specific ignore
+        return self._matches_rule_ignore(line, "ignore")
+    def _create_violation(self, match: PatternMatch, context: BaseLintContext) -> Violation:
+        """Create a Violation from a PatternMatch.
+        Args:
+            match: Detected pattern match
+            context: Lint context
+        Returns:
+            Violation object for the detected pattern
+        """
+        message = self._build_message(match)
+        file_path = str(context.file_path) if context.file_path else "unknown"
+        return Violation(
+            rule_id=self.rule_id,
+            file_path=file_path,
+            line=match.line_number,
+            column=0,
+            message=message,
+            severity=Severity.ERROR,
+            suggestion=match.suggestion,
+        )
+    def _build_message(self, match: PatternMatch) -> str:
+        """Build violation message.
+        Args:
+            match: Detected pattern match
+        Returns:
+            Human-readable message describing the violation
+        """
+        num_conditions = len(match.conditions)
+        if num_conditions == 1:
+            return (
+                f"For loop over '{match.iterable}' has embedded filtering. "
+                f"Consider using a generator expression."
+            )
+        return (
+            f"For loop over '{match.iterable}' has {num_conditions} filter conditions. "
+            f"Consider combining into a collection pipeline."
+        )

src/linters/collection_pipeline/suggestion_builder.py ADDED Viewed

@@ -0,0 +1,63 @@
+"""
+Purpose: Build refactoring suggestions for collection pipeline patterns
+Scope: Generate code suggestions for converting embedded filtering to collection pipelines
+Overview: Provides helper functions for generating refactoring suggestions when embedded
+    filtering patterns are detected. Handles condition inversion (converting continue guard
+    conditions to filter conditions), target name extraction, and suggestion string generation.
+    Separates suggestion logic from pattern detection logic for better maintainability.
+Dependencies: ast module for Python AST processing
+Exports: build_suggestion, invert_condition, get_target_name
+Interfaces: Functions for suggestion generation and condition transformation
+Implementation: AST-based condition inversion and string formatting for suggestions
+"""
+import ast
+def get_target_name(target: ast.expr) -> str:
+    """Get the loop variable name from AST target.
+    Args:
+        target: AST expression for loop target
+    Returns:
+        String representation of the loop variable
+    """
+    if isinstance(target, ast.Name):
+        return target.id
+    return ast.unparse(target)
+def invert_condition(condition: ast.expr) -> str:
+    """Invert a condition (for if not x: continue -> if x).
+    Args:
+        condition: AST expression for the condition
+    Returns:
+        String representation of the inverted condition
+    """
+    if isinstance(condition, ast.UnaryOp) and isinstance(condition.op, ast.Not):
+        return ast.unparse(condition.operand)
+    return f"not ({ast.unparse(condition)})"
+def build_suggestion(loop_var: str, iterable: str, conditions: list[str]) -> str:
+    """Generate refactoring suggestion code snippet.
+    Args:
+        loop_var: Name of the loop variable
+        iterable: Source representation of the iterable
+        conditions: List of filter conditions (already inverted)
+    Returns:
+        Code suggestion for refactoring to generator expression
+    """
+    combined = " and ".join(conditions)
+    return f"for {loop_var} in ({loop_var} for {loop_var} in {iterable} if {combined}):"

src/linters/dry/block_filter.py CHANGED Viewed

@@ -165,6 +165,10 @@ class ImportGroupFilter(BaseBlockFilter):
     Import organization often creates similar patterns that aren't meaningful duplication.
     """
+    def __init__(self) -> None:
+        """Initialize the import group filter."""
+        pass  # Stateless filter for import blocks
     def should_filter(self, block: CodeBlock, file_content: str) -> bool:
         """Check if block is only import statements.
@@ -235,14 +239,8 @@ class BlockFilterRegistry:
         Returns:
             True if block should be filtered out
         """
-        for filter_instance in self._filters:
-            if filter_instance.name not in self._enabled_filters:
-                continue
-            if filter_instance.should_filter(block, file_content):
-                return True
-        return False
+        enabled_filters = (f for f in self._filters if f.name in self._enabled_filters)
+        return any(f.should_filter(block, file_content) for f in enabled_filters)
     def get_enabled_filters(self) -> list[str]:
         """Get list of enabled filter names.

src/linters/dry/block_grouper.py CHANGED Viewed

@@ -26,6 +26,10 @@ from .cache import CodeBlock
 class BlockGrouper:
     """Groups blocks and violations by file path."""
+    def __init__(self) -> None:
+        """Initialize the block grouper."""
+        pass  # Stateless grouper for code blocks
     def group_blocks_by_file(self, blocks: list[CodeBlock]) -> dict[Path, list[CodeBlock]]:
         """Group blocks by file path.

src/linters/dry/cache_query.py CHANGED Viewed

@@ -22,6 +22,10 @@ import sqlite3
 class CacheQueryService:
     """Handles cache database queries."""
+    def __init__(self) -> None:
+        """Initialize the cache query service."""
+        pass  # Stateless query service for database operations
     def get_duplicate_hashes(self, db: sqlite3.Connection) -> list[int]:
         """Get all hash values that appear 2+ times.

src/linters/dry/python_analyzer.py CHANGED Viewed

@@ -217,25 +217,43 @@ class PythonDuplicateAnalyzer(BaseTokenAnalyzer):  # thailint: ignore[srp.violat
         lines_with_numbers = []
         in_multiline_import = False
-        for line_num, line in enumerate(content.split("\n"), start=1):
-            if line_num in docstring_lines:
-                continue
-            line = self._hasher._normalize_line(line)  # pylint: disable=protected-access
-            if not line:
-                continue
-            # Update multi-line import state and check if line should be skipped
-            in_multiline_import, should_skip = self._hasher._should_skip_import_line(  # pylint: disable=protected-access
+        non_docstring_lines = (
+            (line_num, line)
+            for line_num, line in enumerate(content.split("\n"), start=1)
+            if line_num not in docstring_lines
+        )
+        for line_num, line in non_docstring_lines:
+            in_multiline_import, normalized = self._normalize_and_filter_line(
                 line, in_multiline_import
             )
-            if should_skip:
-                continue
-            lines_with_numbers.append((line_num, line))
+            if normalized is not None:
+                lines_with_numbers.append((line_num, normalized))
         return lines_with_numbers
+    def _normalize_and_filter_line(
+        self, line: str, in_multiline_import: bool
+    ) -> tuple[bool, str | None]:
+        """Normalize line and check if it should be included.
+        Args:
+            line: Raw source line
+            in_multiline_import: Current multi-line import state
+        Returns:
+            Tuple of (new_import_state, normalized_line or None if should skip)
+        """
+        normalized = self._hasher._normalize_line(line)  # pylint: disable=protected-access
+        if not normalized:
+            return in_multiline_import, None
+        new_state, should_skip = self._hasher._should_skip_import_line(  # pylint: disable=protected-access
+            normalized, in_multiline_import
+        )
+        if should_skip:
+            return new_state, None
+        return new_state, normalized
     def _rolling_hash_with_tracking(
         self, lines_with_numbers: list[tuple[int, str]], window_size: int
     ) -> list[tuple[int, int, int, str]]:
@@ -640,10 +658,8 @@ class PythonDuplicateAnalyzer(BaseTokenAnalyzer):  # thailint: ignore[srp.violat
         def is_within_class_body(tree: ast.Module, lookback_start: int) -> bool:
             """Check if flagged range falls within a class body."""
-            for stmt in tree.body:
-                if not isinstance(stmt, ast.ClassDef):
-                    continue
+            class_defs = (s for s in tree.body if isinstance(s, ast.ClassDef))
+            for stmt in class_defs:
                 # Adjust line numbers: stmt.lineno is relative to context
                 # We need to convert back to original file line numbers
                 class_start_in_context = stmt.lineno

src/linters/dry/token_hasher.py CHANGED Viewed

@@ -20,9 +20,13 @@ Implementation: Token-based normalization with rolling window algorithm, languag
 """
-class TokenHasher:
+class TokenHasher:  # thailint: ignore[srp] - Methods support single responsibility of code tokenization
     """Tokenize code and create rolling hashes for duplicate detection."""
+    def __init__(self) -> None:
+        """Initialize the token hasher."""
+        pass  # Stateless hasher for code tokenization
     def tokenize(self, code: str) -> list[str]:
         """Tokenize code by stripping comments and normalizing whitespace.

thailint 0.8.0__py3-none-any.whl → 0.10.0__py3-none-any.whl

thailint 0.8.0py3-none-any.whl → 0.10.0py3-none-any.whl