PyPI - gitflow-analytics - Versions diffs - 1.3.6__py3-none-any.whl → 3.3.0__py3-none-any.whl - Mend

gitflow-analytics 1.3.6__py3-none-any.whl → 3.3.0__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (48)

gitflow_analytics/_version.py +1 -1
gitflow_analytics/classification/batch_classifier.py +156 -4
gitflow_analytics/cli.py +897 -179
gitflow_analytics/config/loader.py +40 -1
gitflow_analytics/config/schema.py +4 -0
gitflow_analytics/core/cache.py +20 -0
gitflow_analytics/core/data_fetcher.py +1254 -228
gitflow_analytics/core/git_auth.py +169 -0
gitflow_analytics/core/git_timeout_wrapper.py +347 -0
gitflow_analytics/core/metrics_storage.py +12 -3
gitflow_analytics/core/progress.py +219 -18
gitflow_analytics/core/subprocess_git.py +145 -0
gitflow_analytics/extractors/ml_tickets.py +3 -2
gitflow_analytics/extractors/tickets.py +93 -8
gitflow_analytics/integrations/jira_integration.py +1 -1
gitflow_analytics/integrations/orchestrator.py +47 -29
gitflow_analytics/metrics/branch_health.py +3 -2
gitflow_analytics/models/database.py +72 -1
gitflow_analytics/pm_framework/adapters/jira_adapter.py +12 -5
gitflow_analytics/pm_framework/orchestrator.py +8 -3
gitflow_analytics/qualitative/classifiers/llm/openai_client.py +24 -4
gitflow_analytics/qualitative/classifiers/llm_commit_classifier.py +3 -1
gitflow_analytics/qualitative/core/llm_fallback.py +34 -2
gitflow_analytics/reports/narrative_writer.py +118 -74
gitflow_analytics/security/__init__.py +11 -0
gitflow_analytics/security/config.py +189 -0
gitflow_analytics/security/extractors/__init__.py +7 -0
gitflow_analytics/security/extractors/dependency_checker.py +379 -0
gitflow_analytics/security/extractors/secret_detector.py +197 -0
gitflow_analytics/security/extractors/vulnerability_scanner.py +333 -0
gitflow_analytics/security/llm_analyzer.py +347 -0
gitflow_analytics/security/reports/__init__.py +5 -0
gitflow_analytics/security/reports/security_report.py +358 -0
gitflow_analytics/security/security_analyzer.py +414 -0
gitflow_analytics/tui/app.py +3 -1
gitflow_analytics/tui/progress_adapter.py +313 -0
gitflow_analytics/tui/screens/analysis_progress_screen.py +407 -46
gitflow_analytics/tui/screens/results_screen.py +219 -206
gitflow_analytics/ui/__init__.py +21 -0
gitflow_analytics/ui/progress_display.py +1477 -0
gitflow_analytics/verify_activity.py +697 -0
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/METADATA +2 -1
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/RECORD +47 -31
gitflow_analytics/cli_rich.py +0 -503
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/WHEEL +0 -0
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/entry_points.txt +0 -0
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/licenses/LICENSE +0 -0
{gitflow_analytics-1.3.6.dist-info → gitflow_analytics-3.3.0.dist-info}/top_level.txt +0 -0

gitflow_analytics/_version.py CHANGED Viewed

@@ -1,4 +1,4 @@
 """Version information for gitflow-analytics."""
-__version__ = "1.3.6"
+__version__ = "3.3.0"
 __version_info__ = tuple(int(x) for x in __version__.split("."))

gitflow_analytics/classification/batch_classifier.py CHANGED Viewed

@@ -45,6 +45,7 @@ class BatchCommitClassifier:
         batch_size: int = 50,
         confidence_threshold: float = 0.7,
         fallback_enabled: bool = True,
+        max_processing_time_minutes: int = 30,  # Maximum time for classification
     ):
         """Initialize the batch classifier.
@@ -60,6 +61,8 @@ class BatchCommitClassifier:
         self.batch_size = min(batch_size, 50)  # Limit for token constraints
         self.confidence_threshold = confidence_threshold
         self.fallback_enabled = fallback_enabled
+        self.max_processing_time_minutes = max_processing_time_minutes
+        self.classification_start_time = None
         # Initialize LLM classifier
         # Handle different config types
@@ -84,9 +87,25 @@ class BatchCommitClassifier:
             llm_config_obj = LLMConfig()
         self.llm_classifier = LLMCommitClassifier(config=llm_config_obj, cache_dir=cache_dir)
-        logger.info(
-            f"LLM Classifier initialized with API key: {'Yes' if llm_config_obj.api_key else 'No'}"
-        )
+        # Warn if no API key is configured
+        if not llm_config_obj.api_key:
+            logger.warning(
+                "No API key configured for LLM classification. "
+                "Will fall back to rule-based classification."
+            )
+            # Set a flag to skip LLM calls entirely
+            self.llm_enabled = False
+        else:
+            self.llm_enabled = True
+            logger.info(
+                f"LLM Classifier initialized with API key: Yes (model: {llm_config_obj.model})"
+            )
+        # Circuit breaker for LLM API failures
+        self.api_failure_count = 0
+        self.max_consecutive_failures = 5
+        self.circuit_breaker_open = False
         # Rule-based fallback patterns for when LLM fails
         self.fallback_patterns = {
@@ -165,6 +184,7 @@ class BatchCommitClassifier:
             Dictionary containing classification results and statistics
         """
         logger.info(f"Starting batch classification from {start_date.date()} to {end_date.date()}")
+        self.classification_start_time = datetime.utcnow()
         # Get daily batches to process
         batches_to_process = self._get_batches_to_process(
@@ -206,6 +226,18 @@ class BatchCommitClassifier:
                     f"Processing repository {repo_num}/{len(repo_batches)}: {repo_name} ({len(repo_batch_list)} batches, {repo_commit_count} commits)"
                 )
+                # Check if we've exceeded max processing time
+                if self.classification_start_time:
+                    elapsed_minutes = (
+                        datetime.utcnow() - self.classification_start_time
+                    ).total_seconds() / 60
+                    if elapsed_minutes > self.max_processing_time_minutes:
+                        logger.error(
+                            f"Classification exceeded maximum time limit of {self.max_processing_time_minutes} minutes. "
+                            f"Stopping classification to prevent hanging."
+                        )
+                        break
                 # Process this repository's batches by week for optimal context
                 weekly_batches = self._group_batches_by_week(repo_batch_list)
@@ -403,6 +435,30 @@ class BatchCommitClassifier:
                 leave=False,
             ) as batch_ctx:
                 for i in range(0, len(week_commits), self.batch_size):
+                    # Check for timeout before processing each batch
+                    if self.classification_start_time:
+                        elapsed_minutes = (
+                            datetime.utcnow() - self.classification_start_time
+                        ).total_seconds() / 60
+                        if elapsed_minutes > self.max_processing_time_minutes:
+                            logger.error(
+                                f"Classification timeout after {elapsed_minutes:.1f} minutes. "
+                                f"Processed {len(classified_commits)}/{len(week_commits)} commits."
+                            )
+                            # Use fallback for remaining commits
+                            remaining_commits = week_commits[i:]
+                            for commit in remaining_commits:
+                                classified_commits.append(
+                                    {
+                                        "commit_hash": commit["commit_hash"],
+                                        "category": "maintenance",
+                                        "confidence": 0.2,
+                                        "method": "timeout_fallback",
+                                        "error": "Classification timeout",
+                                    }
+                                )
+                            break
                     batch_num = i // self.batch_size + 1
                     batch_commits = week_commits[i : i + self.batch_size]
                     progress.set_description(
@@ -558,6 +614,13 @@ class BatchCommitClassifier:
         batch_id = str(uuid.uuid4())
         logger.info(f"Starting LLM classification for batch {batch_id} with {len(commits)} commits")
+        # Add timeout warning for large batches
+        if len(commits) > 20:
+            logger.warning(
+                f"Large batch size ({len(commits)} commits) may take longer to process. "
+                f"Consider reducing batch_size if timeouts occur."
+            )
         # Prepare batch for LLM classification
         enhanced_commits = []
         for commit in commits:
@@ -573,12 +636,68 @@ class BatchCommitClassifier:
             enhanced_commit["ticket_context"] = relevant_tickets
             enhanced_commits.append(enhanced_commit)
+        # Check if LLM is enabled before attempting classification
+        if not self.llm_enabled:
+            logger.debug(f"LLM disabled, using fallback for batch {batch_id[:8]}")
+            # Skip directly to fallback
+            fallback_results = []
+            for commit in commits:
+                category = self._fallback_classify_commit(commit)
+                fallback_results.append(
+                    {
+                        "commit_hash": commit["commit_hash"],
+                        "category": category,
+                        "confidence": 0.3,  # Low confidence for fallback
+                        "method": "fallback_only",
+                        "error": "LLM not configured",
+                        "batch_id": batch_id,
+                    }
+                )
+            return fallback_results
+        # Check circuit breaker status
+        if self.circuit_breaker_open:
+            logger.info(
+                f"Circuit breaker OPEN - Skipping LLM API call for batch {batch_id[:8]} "
+                f"after {self.api_failure_count} consecutive failures. Using fallback classification."
+            )
+            # Use fallback for all commits
+            fallback_results = []
+            for commit in commits:
+                category = self._fallback_classify_commit(commit)
+                fallback_results.append(
+                    {
+                        "commit_hash": commit["commit_hash"],
+                        "category": category,
+                        "confidence": 0.3,  # Low confidence for fallback
+                        "method": "circuit_breaker_fallback",
+                        "error": "Circuit breaker open - API repeatedly failing",
+                        "batch_id": batch_id,
+                    }
+                )
+            return fallback_results
         try:
             # Use LLM classifier with enhanced context
+            logger.debug(f"Calling LLM classifier for batch {batch_id[:8]}...")
+            start_time = datetime.utcnow()
             llm_results = self.llm_classifier.classify_commits_batch(
                 enhanced_commits, batch_id=batch_id, include_confidence=True
             )
+            elapsed = (datetime.utcnow() - start_time).total_seconds()
+            logger.info(f"LLM classification for batch {batch_id[:8]} took {elapsed:.2f}s")
+            # Reset circuit breaker on successful LLM call
+            if self.api_failure_count > 0:
+                logger.info(
+                    f"LLM API call succeeded - Resetting circuit breaker "
+                    f"(was at {self.api_failure_count} failures)"
+                )
+            self.api_failure_count = 0
+            self.circuit_breaker_open = False
             # Process LLM results and add fallbacks
             processed_results = []
             for _i, (commit, llm_result) in enumerate(zip(commits, llm_results)):
@@ -616,7 +735,40 @@ class BatchCommitClassifier:
             return processed_results
         except Exception as e:
-            logger.error(f"LLM classification failed for batch {batch_id}: {e}")
+            # Track consecutive failures for circuit breaker
+            self.api_failure_count += 1
+            logger.error(
+                f"LLM classification failed for batch {batch_id}: {e} "
+                f"(Failure {self.api_failure_count}/{self.max_consecutive_failures})"
+            )
+            # Open circuit breaker after max consecutive failures
+            if (
+                self.api_failure_count >= self.max_consecutive_failures
+                and not self.circuit_breaker_open
+            ):
+                self.circuit_breaker_open = True
+                logger.error(
+                    f"CIRCUIT BREAKER OPENED after {self.api_failure_count} consecutive API failures. "
+                    f"All subsequent batches will use fallback classification until API recovers. "
+                    f"This prevents the system from hanging on repeated timeouts."
+                )
+            # Provide more context about the failure
+            if "timeout" in str(e).lower():
+                logger.error(
+                    f"Classification timed out. Consider: \n"
+                    f"  1. Reducing batch_size (current: {self.batch_size})\n"
+                    f"  2. Increasing timeout_seconds in LLM config\n"
+                    f"  3. Checking API service status"
+                )
+            elif "connection" in str(e).lower():
+                logger.error(
+                    "Connection error. Check:\n"
+                    "  1. Internet connectivity\n"
+                    "  2. API endpoint availability\n"
+                    "  3. Firewall/proxy settings"
+                )
             # Fall back to rule-based classification for entire batch
             if self.fallback_enabled:

gitflow-analytics 1.3.6__py3-none-any.whl → 3.3.0__py3-none-any.whl

gitflow-analytics 1.3.6__py3-none-any.whl → 3.3.0__py3-none-any.whl