crackerjack-0.31.4-py3-none-any.whl → crackerjack-0.31.7-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Note: this release has been flagged as potentially problematic.

crackerjack/__main__.py CHANGED
@@ -171,6 +171,7 @@ def main(
     coverage_status: bool = CLI_OPTIONS["coverage_status"],
     coverage_goal: float | None = CLI_OPTIONS["coverage_goal"],
     no_coverage_ratchet: bool = CLI_OPTIONS["no_coverage_ratchet"],
+    boost_coverage: bool = CLI_OPTIONS["boost_coverage"],
 ) -> None:
     options = create_options(
         commit,
@@ -207,6 +208,7 @@ def main(
         coverage_status,
         coverage_goal,
         no_coverage_ratchet,
+        boost_coverage,
     )
 
     if ai_debug:
@@ -26,6 +26,7 @@ class IssueType(Enum):
     PERFORMANCE = "performance"
     DOCUMENTATION = "documentation"
     TEST_ORGANIZATION = "test_organization"
+    COVERAGE_IMPROVEMENT = "coverage_improvement"
 
 
 @dataclass
@@ -23,6 +23,7 @@ class TestCreationAgent(SubAgent):
         IssueType.TEST_FAILURE,
         IssueType.DEPENDENCY,
         IssueType.TEST_ORGANIZATION,
+        IssueType.COVERAGE_IMPROVEMENT,
     }
 
     async def can_handle(self, issue: Issue) -> float:
@@ -31,6 +32,10 @@ class TestCreationAgent(SubAgent):
 
         message_lower = issue.message.lower()
 
+        # Handle coverage improvement requests with perfect confidence
+        if issue.type == IssueType.COVERAGE_IMPROVEMENT:
+            return 1.0
+
         # Handle test organization issues with high confidence
         if issue.type == IssueType.TEST_ORGANIZATION:
            return self._check_test_organization_confidence(message_lower)
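
For context, can_handle returns a confidence score in [0.0, 1.0] that a coordinator can use to route each issue to the best-suited agent. The coordinator internals are not shown in this diff, so the following is a hypothetical sketch of that routing pattern; only can_handle's contract comes from the code above:

# Hypothetical sketch of confidence-based routing; names are illustrative.
async def route_issue(agents: list["SubAgent"], issue: "Issue") -> "SubAgent | None":
    scored = [(await agent.can_handle(issue), agent) for agent in agents]
    confidence, best = max(scored, key=lambda pair: pair[0])
    # A COVERAGE_IMPROVEMENT issue now scores 1.0 for TestCreationAgent,
    # so it always wins this ranking.
    return best if confidence > 0.0 else None
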
@@ -48,6 +48,7 @@ class Options(BaseModel):
     keep_releases: int = 10
     track_progress: bool = False
     orchestrated: bool = False
+    boost_coverage: bool = True
     coverage: bool = False
     orchestration_strategy: str = "adaptive"
     orchestration_progress: str = "granular"
@@ -324,6 +325,11 @@ CLI_OPTIONS = {
         "--no-coverage-ratchet",
         help="Disable coverage ratchet system temporarily (for experiments).",
     ),
+    "boost_coverage": typer.Option(
+        True,
+        "--boost-coverage/--no-boost-coverage",
+        help="Automatically improve test coverage after successful workflow execution (default: True).",
+    ),
 }
 
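The "--boost-coverage/--no-boost-coverage" string is typer's standard syntax for a paired boolean flag: the first form sets the parameter to True, the second to False, and the declared default (True) applies when neither is passed. A minimal standalone sketch of the same pattern (the demo command and its echo output are illustrative only):

import typer

app = typer.Typer()

@app.command()
def demo(
    boost_coverage: bool = typer.Option(
        True,
        "--boost-coverage/--no-boost-coverage",
        help="Toggle automatic coverage improvement.",
    ),
) -> None:
    typer.echo(f"boost_coverage={boost_coverage}")

if __name__ == "__main__":
    app()  # `demo --no-boost-coverage` prints boost_coverage=False
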
@@ -362,6 +368,7 @@ def create_options(
     coverage_status: bool,
     coverage_goal: float | None,
     no_coverage_ratchet: bool,
+    boost_coverage: bool,
 ) -> Options:
     return Options(
         commit=commit,
@@ -398,4 +405,5 @@ def create_options(
         coverage_status=coverage_status,
         coverage_goal=coverage_goal,
         no_coverage_ratchet=no_coverage_ratchet,
+        boost_coverage=boost_coverage,
     )
@@ -501,12 +501,36 @@ class PhaseCoordinator:
         self.console.print(
             f"[red]❌[/red] {hook_type.title()} hooks failed: {summary['failed']} failed, {summary['errors']} errors",
         )
+
+        # Collect detailed hook failure information for AI agent processing
+        detailed_error_msg = self._build_detailed_hook_error_message(results, summary)
+
         self.session.fail_task(
             f"{hook_type}_hooks",
-            f"{summary['failed']} failed, {summary['errors']} errors",
+            detailed_error_msg,
         )
         return False
 
+    def _build_detailed_hook_error_message(
+        self, results: list[t.Any], summary: dict[str, t.Any]
+    ) -> str:
+        """Build detailed error message with specific hook failure information."""
+        error_parts = [f"{summary['failed']} failed, {summary['errors']} errors"]
+
+        # Extract specific hook failures
+        failed_hooks = []
+        for result in results:
+            if hasattr(result, "failed") and result.failed:
+                hook_name = getattr(result, "hook_id", "") or getattr(
+                    result, "name", "unknown"
+                )
+                failed_hooks.append(hook_name.lower())
+
+        if failed_hooks:
+            error_parts.append(f"Failed hooks: {', '.join(failed_hooks)}")
+
+        return " | ".join(error_parts)
+
     def _should_retry_fast_hooks(self, results: list[t.Any]) -> bool:
         formatting_hooks = {
             "ruff-format",
@@ -259,7 +259,7 @@ class WorkflowPipeline:
 
         success = self.phases.run_comprehensive_hooks_only(options)
         if not success:
-            self.session.fail_task("workflow", "Comprehensive hooks failed")
+            self.session.fail_task("comprehensive_hooks", "Comprehensive hooks failed")
             self._update_mcp_status("comprehensive", "failed")
             # In AI agent mode, continue to collect more failures
             # In non-AI mode, this will be handled by caller
@@ -345,7 +345,25 @@ class WorkflowPipeline:
         """Run AI agent fixing phase to analyze and fix collected failures."""
         self._update_mcp_status("ai_fixing", "running")
         self.logger.info("Starting AI agent fixing phase")
+        self._log_debug_phase_start()
 
+        try:
+            agent_coordinator = self._setup_agent_coordinator()
+            issues = await self._collect_issues_from_failures()
+
+            if not issues:
+                return self._handle_no_issues_found()
+
+            self.logger.info(f"AI agents will attempt to fix {len(issues)} issues")
+            fix_result = await agent_coordinator.handle_issues(issues)
+
+            return await self._process_fix_results(options, fix_result)
+
+        except Exception as e:
+            return self._handle_fixing_phase_error(e)
+
+    def _log_debug_phase_start(self) -> None:
+        """Log debug information for phase start."""
         if self._should_debug():
             self.debugger.log_workflow_phase(
                 "ai_agent_fixing",
@@ -353,77 +371,150 @@ class WorkflowPipeline:
                 details={"ai_agent": True},
             )
 
-        try:
-            # Create AI agent context
-            agent_context = AgentContext(
-                project_path=self.pkg_path,
-                session_id=getattr(self.session, "session_id", None),
-            )
+    def _setup_agent_coordinator(self) -> AgentCoordinator:
+        """Set up agent coordinator with proper context."""
+        from crackerjack.agents.coordinator import AgentCoordinator
 
-            # Initialize agent coordinator
-            agent_coordinator = AgentCoordinator(agent_context)
-            agent_coordinator.initialize_agents()
+        agent_context = AgentContext(
+            project_path=self.pkg_path,
+            session_id=getattr(self.session, "session_id", None),
+        )
 
-            # Collect issues from failures
-            issues = await self._collect_issues_from_failures()
+        agent_coordinator = AgentCoordinator(agent_context)
+        agent_coordinator.initialize_agents()
+        return agent_coordinator
 
-            if not issues:
-                self.logger.info("No issues collected for AI agent fixing")
-                self._update_mcp_status("ai_fixing", "completed")
-                return True
+    def _handle_no_issues_found(self) -> bool:
+        """Handle case when no issues are collected."""
+        self.logger.info("No issues collected for AI agent fixing")
+        self._update_mcp_status("ai_fixing", "completed")
+        return True
 
-            self.logger.info(f"AI agents will attempt to fix {len(issues)} issues")
+    async def _process_fix_results(
+        self, options: OptionsProtocol, fix_result: t.Any
+    ) -> bool:
+        """Process fix results and verify success."""
+        verification_success = await self._verify_fixes_applied(options, fix_result)
+        success = fix_result.success and verification_success
 
-            # Let agents handle the issues
-            fix_result = await agent_coordinator.handle_issues(issues)
+        if success:
+            self._handle_successful_fixes(fix_result)
+        else:
+            self._handle_failed_fixes(fix_result, verification_success)
 
-            success = fix_result.success
-            if success:
-                self.logger.info("AI agents successfully fixed all issues")
-                self._update_mcp_status("ai_fixing", "completed")
+        self._log_debug_phase_completion(success, fix_result)
+        return success
 
-                # Log fix counts for debugging
-                if self._should_debug():
-                    total_fixes = len(fix_result.fixes_applied)
-                    # Estimate test vs hook fixes based on original issue types
-                    test_fixes = len(
-                        [f for f in fix_result.fixes_applied if "test" in f.lower()],
-                    )
-                    hook_fixes = total_fixes - test_fixes
-                    self.debugger.log_test_fixes(test_fixes)
-                    self.debugger.log_hook_fixes(hook_fixes)
-            else:
-                self.logger.warning(
-                    f"AI agents could not fix all issues: {fix_result.remaining_issues}",
-                )
-                self._update_mcp_status("ai_fixing", "failed")
+    def _handle_successful_fixes(self, fix_result: t.Any) -> None:
+        """Handle successful fix results."""
+        self.logger.info(
+            "AI agents successfully fixed all issues and verification passed"
+        )
+        self._update_mcp_status("ai_fixing", "completed")
+        self._log_fix_counts_if_debugging(fix_result)
 
-            if self._should_debug():
-                self.debugger.log_workflow_phase(
-                    "ai_agent_fixing",
-                    "completed" if success else "failed",
-                    details={
-                        "confidence": fix_result.confidence,
-                        "fixes_applied": len(fix_result.fixes_applied),
-                        "remaining_issues": len(fix_result.remaining_issues),
-                    },
-                )
+    def _handle_failed_fixes(
+        self, fix_result: t.Any, verification_success: bool
+    ) -> None:
+        """Handle failed fix results."""
+        if not verification_success:
+            self.logger.warning(
+                "AI agent fixes did not pass verification - issues still exist"
+            )
+        else:
+            self.logger.warning(
+                f"AI agents could not fix all issues: {fix_result.remaining_issues}",
+            )
+        self._update_mcp_status("ai_fixing", "failed")
 
-            return success
+    def _log_fix_counts_if_debugging(self, fix_result: t.Any) -> None:
+        """Log fix counts for debugging if debug mode is enabled."""
+        if not self._should_debug():
+            return
 
-        except Exception as e:
-            self.logger.exception(f"AI agent fixing phase failed: {e}")
-            self.session.fail_task("ai_fixing", f"AI agent fixing failed: {e}")
-            self._update_mcp_status("ai_fixing", "failed")
+        total_fixes = len(fix_result.fixes_applied)
+        test_fixes = len(
+            [f for f in fix_result.fixes_applied if "test" in f.lower()],
+        )
+        hook_fixes = total_fixes - test_fixes
+        self.debugger.log_test_fixes(test_fixes)
+        self.debugger.log_hook_fixes(hook_fixes)
 
-            if self._should_debug():
-                self.debugger.log_workflow_phase(
-                    "ai_agent_fixing",
-                    "failed",
-                    details={"error": str(e)},
+    def _log_debug_phase_completion(self, success: bool, fix_result: t.Any) -> None:
+        """Log debug information for phase completion."""
+        if self._should_debug():
+            self.debugger.log_workflow_phase(
+                "ai_agent_fixing",
+                "completed" if success else "failed",
+                details={
+                    "confidence": fix_result.confidence,
+                    "fixes_applied": len(fix_result.fixes_applied),
+                    "remaining_issues": len(fix_result.remaining_issues),
+                },
+            )
+
+    def _handle_fixing_phase_error(self, error: Exception) -> bool:
+        """Handle errors during the fixing phase."""
+        self.logger.exception(f"AI agent fixing phase failed: {error}")
+        self.session.fail_task("ai_fixing", f"AI agent fixing failed: {error}")
+        self._update_mcp_status("ai_fixing", "failed")
+
+        if self._should_debug():
+            self.debugger.log_workflow_phase(
+                "ai_agent_fixing",
+                "failed",
+                details={"error": str(error)},
+            )
+
+        return False
+
+    async def _verify_fixes_applied(
+        self, options: OptionsProtocol, fix_result: t.Any
+    ) -> bool:
+        """Verify that AI agent fixes actually resolved the issues by re-running checks."""
+        if not fix_result.fixes_applied:
+            return True  # No fixes were applied, nothing to verify
+
+        self.logger.info("Verifying AI agent fixes by re-running quality checks")
+
+        # Re-run the phases that previously failed to verify fixes
+        verification_success = True
+
+        # Check if we need to re-run tests
+        if any("test" in fix.lower() for fix in fix_result.fixes_applied):
+            self.logger.info("Re-running tests to verify test fixes")
+            test_success = self.phases.run_testing_phase(options)
+            if not test_success:
+                self.logger.warning(
+                    "Test verification failed - test fixes did not work"
+                )
+                verification_success = False
+
+        # Check if we need to re-run comprehensive hooks
+        hook_fixes = [
+            f
+            for f in fix_result.fixes_applied
+            if "hook" not in f.lower()
+            or "complexity" in f.lower()
+            or "type" in f.lower()
+        ]
+        if hook_fixes:
+            self.logger.info("Re-running comprehensive hooks to verify hook fixes")
+            hook_success = self.phases.run_comprehensive_hooks_only(options)
+            if not hook_success:
+                self.logger.warning(
+                    "Hook verification failed - hook fixes did not work"
                 )
+                verification_success = False
 
-            return False
+        if verification_success:
+            self.logger.info("All AI agent fixes verified successfully")
+        else:
+            self.logger.error(
+                "Verification failed - some fixes did not resolve the issues"
+            )
+
+        return verification_success
 
     async def _collect_issues_from_failures(self) -> list[Issue]:
         """Collect issues from test and comprehensive hook failures."""
@@ -469,29 +560,124 @@ class WorkflowPipeline:
         issues: list[Issue] = []
         hook_count = 0
 
-        if self.session.session_tracker:
-            for task_id, task_data in self.session.session_tracker.tasks.items():
-                if task_data.status == "failed" and task_id in (
-                    "fast_hooks",
-                    "comprehensive_hooks",
-                ):
-                    hook_count += 1
-                    issue_type = (
-                        IssueType.FORMATTING
-                        if "fast" in task_id
-                        else IssueType.TYPE_ERROR
+        if not self.session.session_tracker:
+            return issues, hook_count
+
+        for task_id, task_data in self.session.session_tracker.tasks.items():
+            if self._is_failed_hook_task(task_data, task_id):
+                hook_count += 1
+                hook_issues = self._process_hook_failure(task_id, task_data)
+                issues.extend(hook_issues)
+
+        return issues, hook_count
+
+    def _is_failed_hook_task(self, task_data: t.Any, task_id: str) -> bool:
+        """Check if a task is a failed hook task."""
+        return task_data.status == "failed" and task_id in (
+            "fast_hooks",
+            "comprehensive_hooks",
+        )
+
+    def _process_hook_failure(self, task_id: str, task_data: t.Any) -> list[Issue]:
+        """Process a single hook failure and return corresponding issues."""
+        error_msg = getattr(task_data, "error_message", "Unknown error")
+        specific_issues = self._parse_hook_error_details(task_id, error_msg)
+
+        if specific_issues:
+            return specific_issues
+
+        return [self._create_generic_hook_issue(task_id, error_msg)]
+
+    def _create_generic_hook_issue(self, task_id: str, error_msg: str) -> Issue:
+        """Create a generic issue for unspecific hook failures."""
+        issue_type = IssueType.FORMATTING if "fast" in task_id else IssueType.TYPE_ERROR
+        return Issue(
+            id=f"hook_failure_{task_id}",
+            type=issue_type,
+            severity=Priority.MEDIUM,
+            message=error_msg,
+            stage=task_id.replace("_hooks", ""),
+        )
+
+    def _parse_hook_error_details(self, task_id: str, error_msg: str) -> list[Issue]:
+        """Parse specific hook failure details to create targeted issues."""
+        issues: list[Issue] = []
+
+        # For comprehensive hooks, parse specific tool failures
+        if task_id == "comprehensive_hooks":
+            # Check for complexipy failures (complexity violations)
+            if "complexipy" in error_msg.lower():
+                issues.append(
+                    Issue(
+                        id="complexipy_violation",
+                        type=IssueType.COMPLEXITY,
+                        severity=Priority.HIGH,
+                        message="Code complexity violation detected by complexipy",
+                        stage="comprehensive",
+                    )
+                )
+
+            # Check for pyright failures (type errors)
+            if "pyright" in error_msg.lower():
+                issues.append(
+                    Issue(
+                        id="pyright_type_error",
+                        type=IssueType.TYPE_ERROR,
+                        severity=Priority.HIGH,
+                        message="Type checking errors detected by pyright",
+                        stage="comprehensive",
+                    )
+                )
+
+            # Check for bandit failures (security issues)
+            if "bandit" in error_msg.lower():
+                issues.append(
+                    Issue(
+                        id="bandit_security_issue",
+                        type=IssueType.SECURITY,
+                        severity=Priority.HIGH,
+                        message="Security vulnerabilities detected by bandit",
+                        stage="comprehensive",
                     )
-                error_msg = getattr(task_data, "error_message", "Unknown error")
-                issue = Issue(
-                    id=f"hook_failure_{task_id}",
-                    type=issue_type,
+                )
+
+            # Check for refurb failures (code quality issues)
+            if "refurb" in error_msg.lower():
+                issues.append(
+                    Issue(
+                        id="refurb_quality_issue",
+                        type=IssueType.PERFORMANCE,  # Use PERFORMANCE as closest match for refurb issues
                         severity=Priority.MEDIUM,
-                    message=error_msg,
-                    stage=task_id.replace("_hooks", ""),
+                        message="Code quality issues detected by refurb",
+                        stage="comprehensive",
                     )
-                issues.append(issue)
+                )
 
-        return issues, hook_count
+            # Check for vulture failures (dead code)
+            if "vulture" in error_msg.lower():
+                issues.append(
+                    Issue(
+                        id="vulture_dead_code",
+                        type=IssueType.DEAD_CODE,
+                        severity=Priority.MEDIUM,
+                        message="Dead code detected by vulture",
+                        stage="comprehensive",
+                    )
+                )
+
+        elif task_id == "fast_hooks":
+            # Fast hooks are typically formatting issues
+            issues.append(
+                Issue(
+                    id="fast_hooks_formatting",
+                    type=IssueType.FORMATTING,
+                    severity=Priority.LOW,
+                    message="Code formatting issues detected",
+                    stage="fast",
+                )
+            )
+
+        return issues
 
     def _log_failure_counts_if_debugging(
         self, test_count: int, hook_count: int
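
The parser is a simple keyword match over the aggregated error string, which pairs with the "Failed hooks: ..." format produced by _build_detailed_hook_error_message earlier in this release. A sketch of the mapping it implements, with Issue construction elided and the tool-to-type pairs taken directly from the code above:

# Keyword-to-IssueType mapping implemented above; a failure message
# naming several tools yields one targeted Issue per matched tool.
TOOL_ISSUE_TYPES = {
    "complexipy": "COMPLEXITY",
    "pyright": "TYPE_ERROR",
    "bandit": "SECURITY",
    "refurb": "PERFORMANCE",  # closest available category
    "vulture": "DEAD_CODE",
}

def matched_tools(error_msg: str) -> list[str]:
    msg = error_msg.lower()
    return [tool for tool in TOOL_ISSUE_TYPES if tool in msg]

print(matched_tools("2 failed, 0 errors | Failed hooks: pyright, bandit"))
# -> ['pyright', 'bandit']
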
@@ -123,7 +123,7 @@ HOOKS_REGISTRY: dict[str, list[HookMetadata]] = {
         "id": "uv-lock",
         "name": None,
         "repo": "https://github.com/astral-sh/uv-pre-commit",
-        "rev": "0.8.13",
+        "rev": "0.8.14",
         "tier": 1,
         "time_estimate": 0.5,
         "stages": None,
@@ -195,7 +195,7 @@ HOOKS_REGISTRY: dict[str, list[HookMetadata]] = {
         "id": "ruff-check",
         "name": None,
         "repo": "https://github.com/astral-sh/ruff-pre-commit",
-        "rev": "v0.12.10",
+        "rev": "v0.12.11",
         "tier": 2,
         "time_estimate": 1.5,
         "stages": None,
@@ -212,7 +212,7 @@ HOOKS_REGISTRY: dict[str, list[HookMetadata]] = {
         "id": "ruff-format",
         "name": None,
         "repo": "https://github.com/astral-sh/ruff-pre-commit",
-        "rev": "v0.12.10",
+        "rev": "v0.12.11",
         "tier": 2,
         "time_estimate": 1.0,
         "stages": None,
@@ -233,7 +233,29 @@ class PublishManagerImpl:
             self.console.print("[yellow]🔍[/yellow] Would build package")
             return True
 
+    def _clean_dist_directory(self) -> None:
+        """Clean dist directory to ensure only current version artifacts are uploaded."""
+        dist_dir = self.pkg_path / "dist"
+        if not dist_dir.exists():
+            return
+
+        try:
+            import shutil
+
+            # Remove entire dist directory and recreate it
+            shutil.rmtree(dist_dir)
+            dist_dir.mkdir(exist_ok=True)
+            self.console.print("[cyan]🧹[/cyan] Cleaned dist directory for fresh build")
+        except Exception as e:
+            self.console.print(
+                f"[yellow]⚠️[/yellow] Warning: Could not clean dist directory: {e}"
+            )
+            # Continue with build anyway - uv publish will fail with clear error
+
     def _execute_build(self) -> bool:
+        # Clean dist directory before building to avoid uploading multiple versions
+        self._clean_dist_directory()
+
         result = self._run_command(["uv", "build"])
 
         if result.returncode != 0:
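
The motivation, per the inline comment: a build writes into dist/ without removing artifacts from earlier versions, so a later publish step can upload stale wheels alongside the new ones; removing and recreating the directory guarantees a single-version payload. The clean-and-recreate invariant is easy to check in isolation (paths below are throwaway examples):

import shutil
import tempfile
from pathlib import Path

pkg_path = Path(tempfile.mkdtemp())
dist = pkg_path / "dist"
dist.mkdir()
(dist / "pkg-0.31.4-py3-none-any.whl").touch()  # simulate a stale artifact

shutil.rmtree(dist)
dist.mkdir(exist_ok=True)

assert dist.exists() and not any(dist.iterdir())  # fresh, empty dist/
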
@@ -234,11 +234,14 @@ class TestExecutor:
 
     def _handle_session_events(self, line: str, progress: TestProgress) -> bool:
         """Handle pytest session events."""
-        if "session starts" in line:
-            progress.update(collection_status="Session starting...")
+        if "session starts" in line and progress.collection_status != "Session started":
+            progress.update(collection_status="Session started")
             return True
-        elif "test session starts" in line:
-            progress.update(collection_status="Starting test collection...")
+        elif (
+            "test session starts" in line
+            and progress.collection_status != "Test collection started"
+        ):
+            progress.update(collection_status="Test collection started")
             return True
         return False
 
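Because streamed pytest output can repeat banner-like lines, the added collection_status guards make the update idempotent: the status flips at most once per phase instead of on every matching line. A reduced sketch of the guard, using a minimal stand-in for TestProgress (the real class has more fields than modeled here):

class Progress:  # stand-in for TestProgress
    def __init__(self) -> None:
        self.collection_status = ""
        self.updates = 0

    def update(self, collection_status: str) -> None:
        self.collection_status = collection_status
        self.updates += 1

p = Progress()
for line in ["== test session starts ==", "== test session starts =="]:
    if "session starts" in line and p.collection_status != "Session started":
        p.update(collection_status="Session started")

assert p.updates == 1  # the second matching line is ignored
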
@@ -308,7 +311,12 @@ class TestExecutor:
 
     def _should_refresh_display(self, progress: TestProgress) -> bool:
         """Determine if display should be refreshed."""
-        return True  # Simplified - let Rich handle refresh rate
+        # Only refresh on significant changes to reduce spam
+        return (
+            progress.is_complete
+            or progress.total_tests > 0
+            or len(progress.current_test) > 0
+        )
 
     def _mark_test_as_stuck(self, progress: TestProgress, test_name: str) -> None:
         """Mark a test as potentially stuck."""