gitflow-analytics 1.0.1__py3-none-any.whl → 1.3.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (119)
  1. gitflow_analytics/__init__.py +11 -11
  2. gitflow_analytics/_version.py +2 -2
  3. gitflow_analytics/classification/__init__.py +31 -0
  4. gitflow_analytics/classification/batch_classifier.py +752 -0
  5. gitflow_analytics/classification/classifier.py +464 -0
  6. gitflow_analytics/classification/feature_extractor.py +725 -0
  7. gitflow_analytics/classification/linguist_analyzer.py +574 -0
  8. gitflow_analytics/classification/model.py +455 -0
  9. gitflow_analytics/cli.py +4490 -378
  10. gitflow_analytics/cli_rich.py +503 -0
  11. gitflow_analytics/config/__init__.py +43 -0
  12. gitflow_analytics/config/errors.py +261 -0
  13. gitflow_analytics/config/loader.py +904 -0
  14. gitflow_analytics/config/profiles.py +264 -0
  15. gitflow_analytics/config/repository.py +124 -0
  16. gitflow_analytics/config/schema.py +441 -0
  17. gitflow_analytics/config/validator.py +154 -0
  18. gitflow_analytics/config.py +44 -398
  19. gitflow_analytics/core/analyzer.py +1320 -172
  20. gitflow_analytics/core/branch_mapper.py +132 -132
  21. gitflow_analytics/core/cache.py +1554 -175
  22. gitflow_analytics/core/data_fetcher.py +1193 -0
  23. gitflow_analytics/core/identity.py +571 -185
  24. gitflow_analytics/core/metrics_storage.py +526 -0
  25. gitflow_analytics/core/progress.py +372 -0
  26. gitflow_analytics/core/schema_version.py +269 -0
  27. gitflow_analytics/extractors/base.py +13 -11
  28. gitflow_analytics/extractors/ml_tickets.py +1100 -0
  29. gitflow_analytics/extractors/story_points.py +77 -59
  30. gitflow_analytics/extractors/tickets.py +841 -89
  31. gitflow_analytics/identity_llm/__init__.py +6 -0
  32. gitflow_analytics/identity_llm/analysis_pass.py +231 -0
  33. gitflow_analytics/identity_llm/analyzer.py +464 -0
  34. gitflow_analytics/identity_llm/models.py +76 -0
  35. gitflow_analytics/integrations/github_integration.py +258 -87
  36. gitflow_analytics/integrations/jira_integration.py +572 -123
  37. gitflow_analytics/integrations/orchestrator.py +206 -82
  38. gitflow_analytics/metrics/activity_scoring.py +322 -0
  39. gitflow_analytics/metrics/branch_health.py +470 -0
  40. gitflow_analytics/metrics/dora.py +542 -179
  41. gitflow_analytics/models/database.py +986 -59
  42. gitflow_analytics/pm_framework/__init__.py +115 -0
  43. gitflow_analytics/pm_framework/adapters/__init__.py +50 -0
  44. gitflow_analytics/pm_framework/adapters/jira_adapter.py +1845 -0
  45. gitflow_analytics/pm_framework/base.py +406 -0
  46. gitflow_analytics/pm_framework/models.py +211 -0
  47. gitflow_analytics/pm_framework/orchestrator.py +652 -0
  48. gitflow_analytics/pm_framework/registry.py +333 -0
  49. gitflow_analytics/qualitative/__init__.py +29 -0
  50. gitflow_analytics/qualitative/chatgpt_analyzer.py +259 -0
  51. gitflow_analytics/qualitative/classifiers/__init__.py +13 -0
  52. gitflow_analytics/qualitative/classifiers/change_type.py +742 -0
  53. gitflow_analytics/qualitative/classifiers/domain_classifier.py +506 -0
  54. gitflow_analytics/qualitative/classifiers/intent_analyzer.py +535 -0
  55. gitflow_analytics/qualitative/classifiers/llm/__init__.py +35 -0
  56. gitflow_analytics/qualitative/classifiers/llm/base.py +193 -0
  57. gitflow_analytics/qualitative/classifiers/llm/batch_processor.py +383 -0
  58. gitflow_analytics/qualitative/classifiers/llm/cache.py +479 -0
  59. gitflow_analytics/qualitative/classifiers/llm/cost_tracker.py +435 -0
  60. gitflow_analytics/qualitative/classifiers/llm/openai_client.py +403 -0
  61. gitflow_analytics/qualitative/classifiers/llm/prompts.py +373 -0
  62. gitflow_analytics/qualitative/classifiers/llm/response_parser.py +287 -0
  63. gitflow_analytics/qualitative/classifiers/llm_commit_classifier.py +607 -0
  64. gitflow_analytics/qualitative/classifiers/risk_analyzer.py +438 -0
  65. gitflow_analytics/qualitative/core/__init__.py +13 -0
  66. gitflow_analytics/qualitative/core/llm_fallback.py +657 -0
  67. gitflow_analytics/qualitative/core/nlp_engine.py +382 -0
  68. gitflow_analytics/qualitative/core/pattern_cache.py +479 -0
  69. gitflow_analytics/qualitative/core/processor.py +673 -0
  70. gitflow_analytics/qualitative/enhanced_analyzer.py +2236 -0
  71. gitflow_analytics/qualitative/example_enhanced_usage.py +420 -0
  72. gitflow_analytics/qualitative/models/__init__.py +25 -0
  73. gitflow_analytics/qualitative/models/schemas.py +306 -0
  74. gitflow_analytics/qualitative/utils/__init__.py +13 -0
  75. gitflow_analytics/qualitative/utils/batch_processor.py +339 -0
  76. gitflow_analytics/qualitative/utils/cost_tracker.py +345 -0
  77. gitflow_analytics/qualitative/utils/metrics.py +361 -0
  78. gitflow_analytics/qualitative/utils/text_processing.py +285 -0
  79. gitflow_analytics/reports/__init__.py +100 -0
  80. gitflow_analytics/reports/analytics_writer.py +550 -18
  81. gitflow_analytics/reports/base.py +648 -0
  82. gitflow_analytics/reports/branch_health_writer.py +322 -0
  83. gitflow_analytics/reports/classification_writer.py +924 -0
  84. gitflow_analytics/reports/cli_integration.py +427 -0
  85. gitflow_analytics/reports/csv_writer.py +1700 -216
  86. gitflow_analytics/reports/data_models.py +504 -0
  87. gitflow_analytics/reports/database_report_generator.py +427 -0
  88. gitflow_analytics/reports/example_usage.py +344 -0
  89. gitflow_analytics/reports/factory.py +499 -0
  90. gitflow_analytics/reports/formatters.py +698 -0
  91. gitflow_analytics/reports/html_generator.py +1116 -0
  92. gitflow_analytics/reports/interfaces.py +489 -0
  93. gitflow_analytics/reports/json_exporter.py +2770 -0
  94. gitflow_analytics/reports/narrative_writer.py +2289 -158
  95. gitflow_analytics/reports/story_point_correlation.py +1144 -0
  96. gitflow_analytics/reports/weekly_trends_writer.py +389 -0
  97. gitflow_analytics/training/__init__.py +5 -0
  98. gitflow_analytics/training/model_loader.py +377 -0
  99. gitflow_analytics/training/pipeline.py +550 -0
  100. gitflow_analytics/tui/__init__.py +5 -0
  101. gitflow_analytics/tui/app.py +724 -0
  102. gitflow_analytics/tui/screens/__init__.py +8 -0
  103. gitflow_analytics/tui/screens/analysis_progress_screen.py +496 -0
  104. gitflow_analytics/tui/screens/configuration_screen.py +523 -0
  105. gitflow_analytics/tui/screens/loading_screen.py +348 -0
  106. gitflow_analytics/tui/screens/main_screen.py +321 -0
  107. gitflow_analytics/tui/screens/results_screen.py +722 -0
  108. gitflow_analytics/tui/widgets/__init__.py +7 -0
  109. gitflow_analytics/tui/widgets/data_table.py +255 -0
  110. gitflow_analytics/tui/widgets/export_modal.py +301 -0
  111. gitflow_analytics/tui/widgets/progress_widget.py +187 -0
  112. gitflow_analytics-1.3.6.dist-info/METADATA +1015 -0
  113. gitflow_analytics-1.3.6.dist-info/RECORD +122 -0
  114. gitflow_analytics-1.0.1.dist-info/METADATA +0 -463
  115. gitflow_analytics-1.0.1.dist-info/RECORD +0 -31
  116. {gitflow_analytics-1.0.1.dist-info → gitflow_analytics-1.3.6.dist-info}/WHEEL +0 -0
  117. {gitflow_analytics-1.0.1.dist-info → gitflow_analytics-1.3.6.dist-info}/entry_points.txt +0 -0
  118. {gitflow_analytics-1.0.1.dist-info → gitflow_analytics-1.3.6.dist-info}/licenses/LICENSE +0 -0
  119. {gitflow_analytics-1.0.1.dist-info → gitflow_analytics-1.3.6.dist-info}/top_level.txt +0 -0
gitflow_analytics/metrics/dora.py
@@ -1,289 +1,346 @@
 """DORA (DevOps Research and Assessment) metrics calculation."""
-from datetime import datetime
-from typing import Any, Dict, List
+
+from datetime import datetime, timedelta
+from typing import Any, Optional
 
 import numpy as np
+import pytz
 
 
 class DORAMetricsCalculator:
     """Calculate DORA metrics for software delivery performance."""
-
-    def __init__(self):
+
+    def __init__(self) -> None:
         """Initialize DORA metrics calculator."""
-        self.deployment_patterns = [
-            'deploy', 'release', 'ship', 'live', 'production', 'prod'
-        ]
-        self.failure_patterns = [
-            'revert', 'rollback', 'hotfix', 'emergency', 'incident', 'outage'
-        ]
-
-    def calculate_dora_metrics(self,
-                               commits: List[Dict[str, Any]],
-                               prs: List[Dict[str, Any]],
-                               start_date: datetime,
-                               end_date: datetime) -> Dict[str, Any]:
+        self.deployment_patterns = ["deploy", "release", "ship", "live", "production", "prod"]
+        self.failure_patterns = ["revert", "rollback", "hotfix", "emergency", "incident", "outage"]
+
+    def _normalize_timestamp_to_utc(self, timestamp: Optional[datetime]) -> Optional[datetime]:
+        """Normalize any timestamp to UTC timezone-aware datetime.
+
+        WHY: Ensures all timestamps are timezone-aware UTC to prevent
+        comparison errors when sorting mixed timezone objects.
+
+        Args:
+            timestamp: DateTime object that may be timezone-naive, timezone-aware, or None
+
+        Returns:
+            Timezone-aware datetime in UTC, or None if input is None
+        """
+        if timestamp is None:
+            return None
+
+        if timestamp.tzinfo is None:
+            # Assume naive timestamps are UTC
+            return timestamp.replace(tzinfo=pytz.UTC)
+        else:
+            # Convert timezone-aware timestamps to UTC
+            return timestamp.astimezone(pytz.UTC)
+
+    def calculate_dora_metrics(
+        self,
+        commits: list[dict[str, Any]],
+        prs: list[dict[str, Any]],
+        start_date: datetime,
+        end_date: datetime,
+    ) -> dict[str, Any]:
         """Calculate the four key DORA metrics."""
-
+
         # Identify deployments and failures
         deployments = self._identify_deployments(commits, prs)
         failures = self._identify_failures(commits, prs)
-
+
         # Calculate metrics
         deployment_frequency = self._calculate_deployment_frequency(
             deployments, start_date, end_date
         )
-
+
         lead_time = self._calculate_lead_time(prs, deployments)
-
-        change_failure_rate = self._calculate_change_failure_rate(
-            deployments, failures
-        )
-
+
+        change_failure_rate = self._calculate_change_failure_rate(deployments, failures)
+
         mttr = self._calculate_mttr(failures, commits)
-
+
        # Determine performance level
         performance_level = self._determine_performance_level(
             deployment_frequency, lead_time, change_failure_rate, mttr
         )
-
+
         return {
-            'deployment_frequency': deployment_frequency,
-            'lead_time_hours': lead_time,
-            'change_failure_rate': change_failure_rate,
-            'mttr_hours': mttr,
-            'performance_level': performance_level,
-            'total_deployments': len(deployments),
-            'total_failures': len(failures),
-            'metrics_period_weeks': (end_date - start_date).days / 7
+            "deployment_frequency": deployment_frequency,
+            "lead_time_hours": lead_time,
+            "change_failure_rate": change_failure_rate,
+            "mttr_hours": mttr,
+            "performance_level": performance_level,
+            "total_deployments": len(deployments),
+            "total_failures": len(failures),
+            "metrics_period_weeks": (end_date - start_date).days / 7,
         }
-
-    def _identify_deployments(self, commits: List[Dict[str, Any]],
-                              prs: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
+
+    def _identify_deployments(
+        self, commits: list[dict[str, Any]], prs: list[dict[str, Any]]
+    ) -> list[dict[str, Any]]:
         """Identify deployment events from commits and PRs."""
         deployments = []
-
+
         # Check commits for deployment patterns
         for commit in commits:
-            message_lower = commit['message'].lower()
+            message_lower = commit["message"].lower()
             if any(pattern in message_lower for pattern in self.deployment_patterns):
-                deployments.append({
-                    'type': 'commit',
-                    'timestamp': commit['timestamp'],
-                    'identifier': commit['hash'],
-                    'message': commit['message']
-                })
-
+                deployments.append(
+                    {
+                        "type": "commit",
+                        "timestamp": self._normalize_timestamp_to_utc(commit["timestamp"]),
+                        "identifier": commit["hash"],
+                        "message": commit["message"],
+                    }
+                )
+
         # Check PR titles and labels for deployments
         for pr in prs:
             # Check title
-            title_lower = pr.get('title', '').lower()
+            title_lower = pr.get("title", "").lower()
             if any(pattern in title_lower for pattern in self.deployment_patterns):
-                deployments.append({
-                    'type': 'pr',
-                    'timestamp': pr.get('merged_at', pr.get('created_at')),
-                    'identifier': f"PR#{pr['number']}",
-                    'message': pr['title']
-                })
+                raw_timestamp = pr.get("merged_at", pr.get("created_at"))
+                deployments.append(
+                    {
+                        "type": "pr",
+                        "timestamp": self._normalize_timestamp_to_utc(raw_timestamp),
+                        "identifier": f"PR#{pr.get('number', 'unknown')}",
+                        "message": pr["title"],
+                    }
+                )
                 continue
-
+
             # Check labels
-            labels_lower = [label.lower() for label in pr.get('labels', [])]
-            if any(any(pattern in label for pattern in self.deployment_patterns)
-                   for label in labels_lower):
-                deployments.append({
-                    'type': 'pr',
-                    'timestamp': pr.get('merged_at', pr.get('created_at')),
-                    'identifier': f"PR#{pr['number']}",
-                    'message': pr['title']
-                })
-
-        # Remove duplicates and sort by timestamp
+            labels_lower = [label.lower() for label in pr.get("labels", [])]
+            if any(
+                any(pattern in label for pattern in self.deployment_patterns)
+                for label in labels_lower
+            ):
+                raw_timestamp = pr.get("merged_at", pr.get("created_at"))
+                deployments.append(
+                    {
+                        "type": "pr",
+                        "timestamp": self._normalize_timestamp_to_utc(raw_timestamp),
+                        "identifier": f"PR#{pr.get('number', 'unknown')}",
+                        "message": pr["title"],
+                    }
+                )
+
+        # Filter out deployments with None timestamps
+        deployments = [d for d in deployments if d["timestamp"] is not None]
+
+        # Remove duplicates and sort by timestamp (now all are timezone-aware UTC)
         seen = set()
         unique_deployments = []
-        for dep in sorted(deployments, key=lambda x: x['timestamp']):
+        for dep in sorted(deployments, key=lambda x: x["timestamp"]):
             key = f"{dep['type']}:{dep['identifier']}"
             if key not in seen:
                 seen.add(key)
                 unique_deployments.append(dep)
-
+
         return unique_deployments
-
-    def _identify_failures(self, commits: List[Dict[str, Any]],
-                           prs: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
+
+    def _identify_failures(
+        self, commits: list[dict[str, Any]], prs: list[dict[str, Any]]
+    ) -> list[dict[str, Any]]:
         """Identify failure events from commits and PRs."""
         failures = []
-
+
         # Check commits for failure patterns
         for commit in commits:
-            message_lower = commit['message'].lower()
+            message_lower = commit["message"].lower()
             if any(pattern in message_lower for pattern in self.failure_patterns):
-                failures.append({
-                    'type': 'commit',
-                    'timestamp': commit['timestamp'],
-                    'identifier': commit['hash'],
-                    'message': commit['message'],
-                    'is_hotfix': 'hotfix' in message_lower or 'emergency' in message_lower
-                })
-
+                failures.append(
+                    {
+                        "type": "commit",
+                        "timestamp": self._normalize_timestamp_to_utc(commit["timestamp"]),
+                        "identifier": commit["hash"],
+                        "message": commit["message"],
+                        "is_hotfix": "hotfix" in message_lower or "emergency" in message_lower,
+                    }
+                )
+
         # Check PRs for failure patterns
         for pr in prs:
-            title_lower = pr.get('title', '').lower()
-            labels_lower = [label.lower() for label in pr.get('labels', [])]
-
-            is_failure = (
-                any(pattern in title_lower for pattern in self.failure_patterns) or
-                any(any(pattern in label for pattern in self.failure_patterns)
-                    for label in labels_lower)
+            title_lower = pr.get("title", "").lower()
+            labels_lower = [label.lower() for label in pr.get("labels", [])]
+
+            is_failure = any(pattern in title_lower for pattern in self.failure_patterns) or any(
+                any(pattern in label for pattern in self.failure_patterns) for label in labels_lower
             )
-
+
             if is_failure:
-                failures.append({
-                    'type': 'pr',
-                    'timestamp': pr.get('merged_at', pr.get('created_at')),
-                    'identifier': f"PR#{pr['number']}",
-                    'message': pr['title'],
-                    'is_hotfix': 'hotfix' in title_lower or 'emergency' in title_lower
-                })
-
+                raw_timestamp = pr.get("merged_at", pr.get("created_at"))
+                failures.append(
+                    {
+                        "type": "pr",
+                        "timestamp": self._normalize_timestamp_to_utc(raw_timestamp),
+                        "identifier": f"PR#{pr.get('number', 'unknown')}",
+                        "message": pr["title"],
+                        "is_hotfix": "hotfix" in title_lower or "emergency" in title_lower,
+                    }
+                )
+
+        # Filter out failures with None timestamps
+        failures = [f for f in failures if f["timestamp"] is not None]
+
         return failures
-
-    def _calculate_deployment_frequency(self, deployments: List[Dict[str, Any]],
-                                        start_date: datetime,
-                                        end_date: datetime) -> Dict[str, Any]:
+
+    def _calculate_deployment_frequency(
+        self, deployments: list[dict[str, Any]], start_date: datetime, end_date: datetime
+    ) -> dict[str, Any]:
         """Calculate deployment frequency metrics."""
         if not deployments:
-            return {
-                'daily_average': 0,
-                'weekly_average': 0,
-                'category': 'Low'
-            }
-
-        # Filter deployments in date range
+            return {"daily_average": 0, "weekly_average": 0, "category": "Low"}
+
+        # Normalize date range to timezone-aware UTC
+        start_date_utc = self._normalize_timestamp_to_utc(start_date)
+        end_date_utc = self._normalize_timestamp_to_utc(end_date)
+
+        # Handle case where normalization failed
+        if start_date_utc is None or end_date_utc is None:
+            return {"daily_average": 0, "weekly_average": 0, "category": "Low"}
+
+        # Filter deployments in date range (timestamps are already normalized to UTC)
         period_deployments = [
-            d for d in deployments
-            if start_date <= d['timestamp'] <= end_date
+            d for d in deployments if start_date_utc <= d["timestamp"] <= end_date_utc
         ]
-
-        days = (end_date - start_date).days
+
+        days = (end_date_utc - start_date_utc).days
         weeks = days / 7
-
+
         daily_avg = len(period_deployments) / days if days > 0 else 0
         weekly_avg = len(period_deployments) / weeks if weeks > 0 else 0
-
+
         # Categorize based on DORA standards
         if daily_avg >= 1:
-            category = 'Elite'  # Multiple deploys per day
+            category = "Elite"  # Multiple deploys per day
         elif weekly_avg >= 1:
-            category = 'High'  # Between once per day and once per week
+            category = "High"  # Between once per day and once per week
         elif weekly_avg >= 0.25:
-            category = 'Medium'  # Between once per week and once per month
+            category = "Medium"  # Between once per week and once per month
         else:
-            category = 'Low'  # Less than once per month
-
-        return {
-            'daily_average': daily_avg,
-            'weekly_average': weekly_avg,
-            'category': category
-        }
-
-    def _calculate_lead_time(self, prs: List[Dict[str, Any]],
-                             deployments: List[Dict[str, Any]]) -> float:
+            category = "Low"  # Less than once per month
+
+        return {"daily_average": daily_avg, "weekly_average": weekly_avg, "category": category}
+
+    def _calculate_lead_time(
+        self, prs: list[dict[str, Any]], deployments: list[dict[str, Any]]
+    ) -> float:
         """Calculate lead time for changes in hours."""
         if not prs:
             return 0
-
+
         lead_times = []
-
+
         for pr in prs:
-            if not pr.get('created_at') or not pr.get('merged_at'):
+            if not pr.get("created_at") or not pr.get("merged_at"):
                 continue
-
+
             # Calculate time from PR creation to merge
-            lead_time = (pr['merged_at'] - pr['created_at']).total_seconds() / 3600
+            # Normalize both timestamps to UTC
+            created_at = self._normalize_timestamp_to_utc(pr["created_at"])
+            merged_at = self._normalize_timestamp_to_utc(pr["merged_at"])
+
+            # Skip if either timestamp is None after normalization
+            if created_at is None or merged_at is None:
+                continue
+
+            lead_time = (merged_at - created_at).total_seconds() / 3600
             lead_times.append(lead_time)
-
+
         if not lead_times:
             return 0
-
+
         # Return median lead time
         return float(np.median(lead_times))
-
-    def _calculate_change_failure_rate(self, deployments: List[Dict[str, Any]],
-                                       failures: List[Dict[str, Any]]) -> float:
+
+    def _calculate_change_failure_rate(
+        self, deployments: list[dict[str, Any]], failures: list[dict[str, Any]]
+    ) -> float:
         """Calculate the percentage of deployments causing failures."""
         if not deployments:
             return 0
-
+
         # Count failures that occurred within 24 hours of a deployment
         failure_causing_deployments = 0
-
+
         for deployment in deployments:
-            deploy_time = deployment['timestamp']
-
+            deploy_time = deployment["timestamp"]  # Already normalized to UTC
+
             # Check if any failure occurred within 24 hours
             for failure in failures:
-                failure_time = failure['timestamp']
+                failure_time = failure["timestamp"]  # Already normalized to UTC
+
                 time_diff = abs((failure_time - deploy_time).total_seconds() / 3600)
-
+
                 if time_diff <= 24:  # Within 24 hours
                     failure_causing_deployments += 1
                     break
-
+
         return (failure_causing_deployments / len(deployments)) * 100
-
-    def _calculate_mttr(self, failures: List[Dict[str, Any]],
-                        commits: List[Dict[str, Any]]) -> float:
+
+    def _calculate_mttr(
+        self, failures: list[dict[str, Any]], commits: list[dict[str, Any]]
+    ) -> float:
         """Calculate mean time to recovery in hours."""
         if not failures:
             return 0
-
+
         recovery_times = []
-
+
         # For each failure, find the recovery time
-        for i, failure in enumerate(failures):
-            failure_time = failure['timestamp']
-
+        for _i, failure in enumerate(failures):
+            failure_time = failure["timestamp"]  # Already normalized to UTC
+
             # Look for recovery indicators in subsequent commits
             recovery_time = None
-
+
             # Check subsequent commits for recovery patterns
             for commit in commits:
-                if commit['timestamp'] <= failure_time:
+                commit_time = self._normalize_timestamp_to_utc(commit["timestamp"])
+
+                if commit_time <= failure_time:
                     continue
-
-                message_lower = commit['message'].lower()
-                recovery_patterns = ['fixed', 'resolved', 'recovery', 'restored']
-
+
+                message_lower = commit["message"].lower()
+                recovery_patterns = ["fixed", "resolved", "recovery", "restored"]
+
                 if any(pattern in message_lower for pattern in recovery_patterns):
-                    recovery_time = commit['timestamp']
+                    recovery_time = commit_time
                     break
-
+
             # If we found a recovery, calculate MTTR
             if recovery_time:
                 mttr = (recovery_time - failure_time).total_seconds() / 3600
                 recovery_times.append(mttr)
             # For hotfixes, assume quick recovery (2 hours)
-            elif failure.get('is_hotfix'):
+            elif failure.get("is_hotfix"):
                 recovery_times.append(2.0)
-
+
         if not recovery_times:
             # If no explicit recovery found, estimate based on failure type
             return 4.0  # Default 4 hours
-
+
         return float(np.mean(recovery_times))
-
-    def _determine_performance_level(self, deployment_freq: Dict[str, Any],
-                                     lead_time_hours: float,
-                                     change_failure_rate: float,
-                                     mttr_hours: float) -> str:
+
+    def _determine_performance_level(
+        self,
+        deployment_freq: dict[str, Any],
+        lead_time_hours: float,
+        change_failure_rate: float,
+        mttr_hours: float,
+    ) -> str:
         """Determine overall performance level based on DORA metrics."""
         scores = []
-
+
         # Deployment frequency score
-        freq_category = deployment_freq['category']
-        freq_scores = {'Elite': 4, 'High': 3, 'Medium': 2, 'Low': 1}
+        freq_category = deployment_freq["category"]
+        freq_scores = {"Elite": 4, "High": 3, "Medium": 2, "Low": 1}
         scores.append(freq_scores.get(freq_category, 1))
-
+
         # Lead time score
         if lead_time_hours < 24:  # Less than one day
             scores.append(4)  # Elite
@@ -293,7 +350,7 @@ class DORAMetricsCalculator:
             scores.append(2)  # Medium
         else:
             scores.append(1)  # Low
-
+
         # Change failure rate score
         if change_failure_rate <= 15:
             scores.append(4)  # Elite (0-15%)
@@ -303,7 +360,7 @@ class DORAMetricsCalculator:
             scores.append(2)  # Medium
         else:
             scores.append(1)  # Low
-
+
         # MTTR score
         if mttr_hours < 1:  # Less than one hour
             scores.append(4)  # Elite
@@ -313,15 +370,321 @@ class DORAMetricsCalculator:
             scores.append(2)  # Medium
         else:
             scores.append(1)  # Low
-
+
         # Average score determines overall level
         avg_score = sum(scores) / len(scores)
-
+
         if avg_score >= 3.5:
-            return 'Elite'
+            return "Elite"
         elif avg_score >= 2.5:
-            return 'High'
+            return "High"
         elif avg_score >= 1.5:
-            return 'Medium'
+            return "Medium"
         else:
-            return 'Low'
+            return "Low"
+
+    def calculate_weekly_dora_metrics(
+        self,
+        commits: list[dict[str, Any]],
+        prs: list[dict[str, Any]],
+        start_date: datetime,
+        end_date: datetime,
+    ) -> list[dict[str, Any]]:
+        """Calculate DORA metrics broken down by week.
+
+        WHY: Weekly breakdowns provide trend analysis and enable identification
+        of performance patterns over time. This helps teams track improvements
+        and identify periods of degraded performance.
+
+        DESIGN DECISION: Uses Monday-Sunday week boundaries for consistency
+        with other reporting functions. Includes rolling averages to smooth
+        out weekly variations and provide clearer trend indicators.
+
+        Args:
+            commits: List of commit data dictionaries
+            prs: List of pull request data dictionaries
+            start_date: Start of analysis period
+            end_date: End of analysis period
+
+        Returns:
+            List of weekly DORA metrics with trend analysis
+        """
+        # Normalize date range to timezone-aware UTC
+        start_date_utc = self._normalize_timestamp_to_utc(start_date)
+        end_date_utc = self._normalize_timestamp_to_utc(end_date)
+
+        if start_date_utc is None or end_date_utc is None:
+            return []
+
+        # Identify deployments and failures for the entire period
+        all_deployments = self._identify_deployments(commits, prs)
+        all_failures = self._identify_failures(commits, prs)
+
+        # Generate week boundaries
+        weeks = self._generate_week_boundaries(start_date_utc, end_date_utc)
+
+        weekly_metrics = []
+        previous_weeks_data = []  # For rolling averages
+
+        for week_start, week_end in weeks:
+            # Filter data for this week
+            week_deployments = [
+                d for d in all_deployments if week_start <= d["timestamp"] <= week_end
+            ]
+
+            week_failures = [f for f in all_failures if week_start <= f["timestamp"] <= week_end]
+
+            week_commits = [
+                c
+                for c in commits
+                if week_start <= self._normalize_timestamp_to_utc(c["timestamp"]) <= week_end
+            ]
+
+            week_prs = [
+                pr
+                for pr in prs
+                if pr.get("merged_at")
+                and week_start <= self._normalize_timestamp_to_utc(pr["merged_at"]) <= week_end
+            ]
+
+            # Calculate weekly metrics
+            deployment_frequency = len(week_deployments)
+
+            # Calculate lead time for PRs merged this week
+            lead_times = []
+            for pr in week_prs:
+                if pr.get("created_at") and pr.get("merged_at"):
+                    created_at = self._normalize_timestamp_to_utc(pr["created_at"])
+                    merged_at = self._normalize_timestamp_to_utc(pr["merged_at"])
+
+                    if created_at and merged_at:
+                        lead_time = (merged_at - created_at).total_seconds() / 3600
+                        lead_times.append(lead_time)
+
+            avg_lead_time = float(np.median(lead_times)) if lead_times else 0.0
+
+            # Calculate change failure rate
+            change_failure_rate = 0.0
+            if week_deployments:
+                failure_causing_deployments = 0
+                for deployment in week_deployments:
+                    deploy_time = deployment["timestamp"]
+
+                    # Check if any failure occurred within 24 hours
+                    for failure in week_failures:
+                        failure_time = failure["timestamp"]
+                        time_diff = abs((failure_time - deploy_time).total_seconds() / 3600)
+
+                        if time_diff <= 24:  # Within 24 hours
+                            failure_causing_deployments += 1
+                            break
+
+                change_failure_rate = (failure_causing_deployments / len(week_deployments)) * 100
+
+            # Calculate MTTR for failures this week
+            recovery_times = []
+            for failure in week_failures:
+                failure_time = failure["timestamp"]
+
+                # Look for recovery in subsequent commits within reasonable time
+                recovery_time = None
+                for commit in week_commits:
+                    commit_time = self._normalize_timestamp_to_utc(commit["timestamp"])
+
+                    if commit_time <= failure_time:
+                        continue
+
+                    message_lower = commit["message"].lower()
+                    recovery_patterns = ["fixed", "resolved", "recovery", "restored"]
+
+                    if any(pattern in message_lower for pattern in recovery_patterns):
+                        recovery_time = commit_time
+                        break
+
+                if recovery_time:
+                    mttr = (recovery_time - failure_time).total_seconds() / 3600
+                    recovery_times.append(mttr)
+                elif failure.get("is_hotfix"):
+                    recovery_times.append(2.0)  # Assume quick recovery for hotfixes
+
+            avg_mttr = float(np.mean(recovery_times)) if recovery_times else 0.0
+
+            # Store current week data
+            week_data = {
+                "week_start": week_start.strftime("%Y-%m-%d"),
+                "week_end": week_end.strftime("%Y-%m-%d"),
+                "deployment_frequency": deployment_frequency,
+                "lead_time_hours": round(avg_lead_time, 2),
+                "change_failure_rate": round(change_failure_rate, 2),
+                "mttr_hours": round(avg_mttr, 2),
+                "total_failures": len(week_failures),
+                "total_commits": len(week_commits),
+                "total_prs": len(week_prs),
+            }
+
+            # Calculate rolling averages (4-week window)
+            previous_weeks_data.append(week_data.copy())
+            if len(previous_weeks_data) > 4:
+                previous_weeks_data.pop(0)
+
+            # 4-week rolling averages
+            if len(previous_weeks_data) >= 2:
+                week_data["deployment_frequency_4w_avg"] = round(
+                    np.mean([w["deployment_frequency"] for w in previous_weeks_data]), 1
+                )
+
+                lead_times_4w = [
+                    w["lead_time_hours"] for w in previous_weeks_data if w["lead_time_hours"] > 0
+                ]
+                week_data["lead_time_4w_avg"] = round(
+                    np.mean(lead_times_4w) if lead_times_4w else 0, 1
+                )
+
+                cfr_4w = [
+                    w["change_failure_rate"]
+                    for w in previous_weeks_data
+                    if w["change_failure_rate"] > 0
+                ]
+                week_data["change_failure_rate_4w_avg"] = round(np.mean(cfr_4w) if cfr_4w else 0, 1)
+
+                mttr_4w = [w["mttr_hours"] for w in previous_weeks_data if w["mttr_hours"] > 0]
+                week_data["mttr_4w_avg"] = round(np.mean(mttr_4w) if mttr_4w else 0, 1)
+            else:
+                week_data["deployment_frequency_4w_avg"] = week_data["deployment_frequency"]
+                week_data["lead_time_4w_avg"] = week_data["lead_time_hours"]
+                week_data["change_failure_rate_4w_avg"] = week_data["change_failure_rate"]
+                week_data["mttr_4w_avg"] = week_data["mttr_hours"]
+
+            # Calculate week-over-week changes (if we have previous week)
+            if len(weekly_metrics) > 0:
+                prev_week = weekly_metrics[-1]
+
+                # Deployment frequency change
+                if prev_week["deployment_frequency"] > 0:
+                    df_change = (
+                        (week_data["deployment_frequency"] - prev_week["deployment_frequency"])
+                        / prev_week["deployment_frequency"]
+                        * 100
+                    )
+                    week_data["deployment_frequency_change_pct"] = round(df_change, 1)
+                else:
+                    week_data["deployment_frequency_change_pct"] = (
+                        0.0 if week_data["deployment_frequency"] == 0 else 100.0
+                    )
+
+                # Lead time change
+                if prev_week["lead_time_hours"] > 0:
+                    lt_change = (
+                        (week_data["lead_time_hours"] - prev_week["lead_time_hours"])
+                        / prev_week["lead_time_hours"]
+                        * 100
+                    )
+                    week_data["lead_time_change_pct"] = round(lt_change, 1)
+                else:
+                    week_data["lead_time_change_pct"] = (
+                        0.0 if week_data["lead_time_hours"] == 0 else 100.0
+                    )
+
+                # Change failure rate change
+                if prev_week["change_failure_rate"] > 0:
+                    cfr_change = (
+                        (week_data["change_failure_rate"] - prev_week["change_failure_rate"])
+                        / prev_week["change_failure_rate"]
+                        * 100
+                    )
+                    week_data["change_failure_rate_change_pct"] = round(cfr_change, 1)
+                else:
+                    week_data["change_failure_rate_change_pct"] = (
+                        0.0 if week_data["change_failure_rate"] == 0 else 100.0
+                    )
+
+                # MTTR change
+                if prev_week["mttr_hours"] > 0:
+                    mttr_change = (
+                        (week_data["mttr_hours"] - prev_week["mttr_hours"])
+                        / prev_week["mttr_hours"]
+                        * 100
+                    )
+                    week_data["mttr_change_pct"] = round(mttr_change, 1)
+                else:
+                    week_data["mttr_change_pct"] = 0.0 if week_data["mttr_hours"] == 0 else 100.0
+            else:
+                # First week - no changes to calculate
+                week_data["deployment_frequency_change_pct"] = 0.0
+                week_data["lead_time_change_pct"] = 0.0
+                week_data["change_failure_rate_change_pct"] = 0.0
+                week_data["mttr_change_pct"] = 0.0
+
+            # Add trend indicators
+            week_data["deployment_frequency_trend"] = self._get_trend_indicator(
+                week_data["deployment_frequency_change_pct"], "higher_better"
+            )
+            week_data["lead_time_trend"] = self._get_trend_indicator(
+                week_data["lead_time_change_pct"], "lower_better"
+            )
+            week_data["change_failure_rate_trend"] = self._get_trend_indicator(
+                week_data["change_failure_rate_change_pct"], "lower_better"
+            )
+            week_data["mttr_trend"] = self._get_trend_indicator(
+                week_data["mttr_change_pct"], "lower_better"
+            )
+
+            weekly_metrics.append(week_data)
+
+        return weekly_metrics
+
+    def _generate_week_boundaries(
+        self, start_date: datetime, end_date: datetime
+    ) -> list[tuple[datetime, datetime]]:
+        """Generate Monday-Sunday week boundaries for the given date range.
+
+        WHY: Consistent week boundaries ensure that weekly metrics align with
+        other reporting functions and provide predictable time buckets for analysis.
+
+        Args:
+            start_date: Start of analysis period (timezone-aware UTC)
+            end_date: End of analysis period (timezone-aware UTC)
+
+        Returns:
+            List of (week_start, week_end) tuples with Monday-Sunday boundaries
+        """
+        weeks = []
+
+        # Find the Monday of the week containing start_date
+        days_since_monday = start_date.weekday()
+        current_week_start = start_date - timedelta(days=days_since_monday)
+        current_week_start = current_week_start.replace(hour=0, minute=0, second=0, microsecond=0)
+
+        while current_week_start <= end_date:
+            week_end = current_week_start + timedelta(
+                days=6, hours=23, minutes=59, seconds=59, microseconds=999999
+            )
+
+            # Only include weeks that overlap with our analysis period
+            if week_end >= start_date:
+                weeks.append((current_week_start, week_end))
+
+            current_week_start += timedelta(days=7)
+
+        return weeks
+
+    def _get_trend_indicator(self, change_pct: float, direction: str) -> str:
+        """Get trend indicator based on change percentage and desired direction.
+
+        WHY: Provides intuitive trend indicators that account for whether
+        increases or decreases are desirable for each metric.
+
+        Args:
+            change_pct: Percentage change from previous period
+            direction: "higher_better" or "lower_better"
+
+        Returns:
+            Trend indicator: "improving", "declining", or "stable"
+        """
+        if abs(change_pct) < 5:  # Less than 5% change considered stable
+            return "stable"
+
+        if direction == "higher_better":
+            return "improving" if change_pct > 0 else "declining"
+        else:  # lower_better
+            return "improving" if change_pct < 0 else "declining"