gitflow-analytics 1.0.3__py3-none-any.whl → 1.3.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (116)
  1. gitflow_analytics/_version.py +1 -1
  2. gitflow_analytics/classification/__init__.py +31 -0
  3. gitflow_analytics/classification/batch_classifier.py +752 -0
  4. gitflow_analytics/classification/classifier.py +464 -0
  5. gitflow_analytics/classification/feature_extractor.py +725 -0
  6. gitflow_analytics/classification/linguist_analyzer.py +574 -0
  7. gitflow_analytics/classification/model.py +455 -0
  8. gitflow_analytics/cli.py +4158 -350
  9. gitflow_analytics/cli_rich.py +198 -48
  10. gitflow_analytics/config/__init__.py +43 -0
  11. gitflow_analytics/config/errors.py +261 -0
  12. gitflow_analytics/config/loader.py +905 -0
  13. gitflow_analytics/config/profiles.py +264 -0
  14. gitflow_analytics/config/repository.py +124 -0
  15. gitflow_analytics/config/schema.py +444 -0
  16. gitflow_analytics/config/validator.py +154 -0
  17. gitflow_analytics/config.py +44 -508
  18. gitflow_analytics/core/analyzer.py +1209 -98
  19. gitflow_analytics/core/cache.py +1337 -29
  20. gitflow_analytics/core/data_fetcher.py +1285 -0
  21. gitflow_analytics/core/identity.py +363 -14
  22. gitflow_analytics/core/metrics_storage.py +526 -0
  23. gitflow_analytics/core/progress.py +372 -0
  24. gitflow_analytics/core/schema_version.py +269 -0
  25. gitflow_analytics/extractors/ml_tickets.py +1100 -0
  26. gitflow_analytics/extractors/story_points.py +8 -1
  27. gitflow_analytics/extractors/tickets.py +749 -11
  28. gitflow_analytics/identity_llm/__init__.py +6 -0
  29. gitflow_analytics/identity_llm/analysis_pass.py +231 -0
  30. gitflow_analytics/identity_llm/analyzer.py +464 -0
  31. gitflow_analytics/identity_llm/models.py +76 -0
  32. gitflow_analytics/integrations/github_integration.py +175 -11
  33. gitflow_analytics/integrations/jira_integration.py +461 -24
  34. gitflow_analytics/integrations/orchestrator.py +124 -1
  35. gitflow_analytics/metrics/activity_scoring.py +322 -0
  36. gitflow_analytics/metrics/branch_health.py +470 -0
  37. gitflow_analytics/metrics/dora.py +379 -20
  38. gitflow_analytics/models/database.py +843 -53
  39. gitflow_analytics/pm_framework/__init__.py +115 -0
  40. gitflow_analytics/pm_framework/adapters/__init__.py +50 -0
  41. gitflow_analytics/pm_framework/adapters/jira_adapter.py +1845 -0
  42. gitflow_analytics/pm_framework/base.py +406 -0
  43. gitflow_analytics/pm_framework/models.py +211 -0
  44. gitflow_analytics/pm_framework/orchestrator.py +652 -0
  45. gitflow_analytics/pm_framework/registry.py +333 -0
  46. gitflow_analytics/qualitative/__init__.py +9 -10
  47. gitflow_analytics/qualitative/chatgpt_analyzer.py +259 -0
  48. gitflow_analytics/qualitative/classifiers/__init__.py +3 -3
  49. gitflow_analytics/qualitative/classifiers/change_type.py +518 -244
  50. gitflow_analytics/qualitative/classifiers/domain_classifier.py +272 -165
  51. gitflow_analytics/qualitative/classifiers/intent_analyzer.py +321 -222
  52. gitflow_analytics/qualitative/classifiers/llm/__init__.py +35 -0
  53. gitflow_analytics/qualitative/classifiers/llm/base.py +193 -0
  54. gitflow_analytics/qualitative/classifiers/llm/batch_processor.py +383 -0
  55. gitflow_analytics/qualitative/classifiers/llm/cache.py +479 -0
  56. gitflow_analytics/qualitative/classifiers/llm/cost_tracker.py +435 -0
  57. gitflow_analytics/qualitative/classifiers/llm/openai_client.py +403 -0
  58. gitflow_analytics/qualitative/classifiers/llm/prompts.py +373 -0
  59. gitflow_analytics/qualitative/classifiers/llm/response_parser.py +287 -0
  60. gitflow_analytics/qualitative/classifiers/llm_commit_classifier.py +607 -0
  61. gitflow_analytics/qualitative/classifiers/risk_analyzer.py +215 -189
  62. gitflow_analytics/qualitative/core/__init__.py +4 -4
  63. gitflow_analytics/qualitative/core/llm_fallback.py +239 -235
  64. gitflow_analytics/qualitative/core/nlp_engine.py +157 -148
  65. gitflow_analytics/qualitative/core/pattern_cache.py +214 -192
  66. gitflow_analytics/qualitative/core/processor.py +381 -248
  67. gitflow_analytics/qualitative/enhanced_analyzer.py +2236 -0
  68. gitflow_analytics/qualitative/example_enhanced_usage.py +420 -0
  69. gitflow_analytics/qualitative/models/__init__.py +7 -7
  70. gitflow_analytics/qualitative/models/schemas.py +155 -121
  71. gitflow_analytics/qualitative/utils/__init__.py +4 -4
  72. gitflow_analytics/qualitative/utils/batch_processor.py +136 -123
  73. gitflow_analytics/qualitative/utils/cost_tracker.py +142 -140
  74. gitflow_analytics/qualitative/utils/metrics.py +172 -158
  75. gitflow_analytics/qualitative/utils/text_processing.py +146 -104
  76. gitflow_analytics/reports/__init__.py +100 -0
  77. gitflow_analytics/reports/analytics_writer.py +539 -14
  78. gitflow_analytics/reports/base.py +648 -0
  79. gitflow_analytics/reports/branch_health_writer.py +322 -0
  80. gitflow_analytics/reports/classification_writer.py +924 -0
  81. gitflow_analytics/reports/cli_integration.py +427 -0
  82. gitflow_analytics/reports/csv_writer.py +1676 -212
  83. gitflow_analytics/reports/data_models.py +504 -0
  84. gitflow_analytics/reports/database_report_generator.py +427 -0
  85. gitflow_analytics/reports/example_usage.py +344 -0
  86. gitflow_analytics/reports/factory.py +499 -0
  87. gitflow_analytics/reports/formatters.py +698 -0
  88. gitflow_analytics/reports/html_generator.py +1116 -0
  89. gitflow_analytics/reports/interfaces.py +489 -0
  90. gitflow_analytics/reports/json_exporter.py +2770 -0
  91. gitflow_analytics/reports/narrative_writer.py +2287 -158
  92. gitflow_analytics/reports/story_point_correlation.py +1144 -0
  93. gitflow_analytics/reports/weekly_trends_writer.py +389 -0
  94. gitflow_analytics/training/__init__.py +5 -0
  95. gitflow_analytics/training/model_loader.py +377 -0
  96. gitflow_analytics/training/pipeline.py +550 -0
  97. gitflow_analytics/tui/__init__.py +1 -1
  98. gitflow_analytics/tui/app.py +129 -126
  99. gitflow_analytics/tui/screens/__init__.py +3 -3
  100. gitflow_analytics/tui/screens/analysis_progress_screen.py +188 -179
  101. gitflow_analytics/tui/screens/configuration_screen.py +154 -178
  102. gitflow_analytics/tui/screens/loading_screen.py +100 -110
  103. gitflow_analytics/tui/screens/main_screen.py +89 -72
  104. gitflow_analytics/tui/screens/results_screen.py +305 -281
  105. gitflow_analytics/tui/widgets/__init__.py +2 -2
  106. gitflow_analytics/tui/widgets/data_table.py +67 -69
  107. gitflow_analytics/tui/widgets/export_modal.py +76 -76
  108. gitflow_analytics/tui/widgets/progress_widget.py +41 -46
  109. gitflow_analytics-1.3.11.dist-info/METADATA +1015 -0
  110. gitflow_analytics-1.3.11.dist-info/RECORD +122 -0
  111. gitflow_analytics-1.0.3.dist-info/METADATA +0 -490
  112. gitflow_analytics-1.0.3.dist-info/RECORD +0 -62
  113. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.11.dist-info}/WHEEL +0 -0
  114. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.11.dist-info}/entry_points.txt +0 -0
  115. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.11.dist-info}/licenses/LICENSE +0 -0
  116. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.11.dist-info}/top_level.txt +0 -0
@@ -1,13 +1,12 @@
  """LLM fallback system for uncertain commit classifications using OpenRouter."""

- import asyncio
+ import hashlib
  import json
  import logging
- import time
- import uuid
- from typing import Dict, List, Optional, Tuple, Any
- import hashlib
  import os
+ import time
+ from pathlib import Path
+ from typing import Any, Optional

  from ..models.schemas import LLMConfig, QualitativeCommitData
  from ..utils.cost_tracker import CostTracker
@@ -16,23 +15,26 @@ from ..utils.text_processing import TextProcessor
  try:
      import openai
      import tiktoken
+
      OPENAI_AVAILABLE = True
  except ImportError:
      OPENAI_AVAILABLE = False
+
      # Create mock objects for type hints when not available
      class MockOpenAI:
          class OpenAI:
              pass
+
      openai = MockOpenAI()
      tiktoken = None


  class ModelRouter:
      """Smart model selection based on complexity and cost constraints."""
-
+
      def __init__(self, config: LLMConfig, cost_tracker: CostTracker):
          """Initialize model router.
-
+
          Args:
              config: LLM configuration
              cost_tracker: Cost tracking instance
@@ -40,51 +42,52 @@ class ModelRouter:
          self.config = config
          self.cost_tracker = cost_tracker
          self.logger = logging.getLogger(__name__)
-
+
      def select_model(self, complexity_score: float, batch_size: int) -> str:
          """Select appropriate model based on complexity and budget.
-
+
          Args:
              complexity_score: Complexity score (0.0 to 1.0)
              batch_size: Number of commits in batch
-
+
          Returns:
              Selected model name
          """
          # Check daily budget remaining
          remaining_budget = self.cost_tracker.check_budget_remaining()
-
+
          # If we're over budget, use free model
          if remaining_budget <= 0:
              self.logger.warning("Daily budget exceeded, using free model")
              return self.config.fallback_model
-
+
          # For simple cases or when budget is tight, use free model
          if complexity_score < 0.3 or remaining_budget < 0.50:
              return self.config.fallback_model
-
+
          # For complex cases with sufficient budget, use premium model
          if complexity_score > self.config.complexity_threshold and remaining_budget > 2.0:
              return self.config.complex_model
-
+
          # Default to primary model (Claude Haiku - fast and cheap)
          return self.config.primary_model


  class LLMFallback:
      """Strategic LLM usage for uncertain cases via OpenRouter.
-
+
      This class provides intelligent fallback to LLM processing when NLP
      classification confidence is below the threshold. It uses OpenRouter
      to access multiple models cost-effectively.
      """
-
-     def __init__(self, config: LLMConfig):
+
+     def __init__(self, config: LLMConfig, cache_dir: Optional[Path] = None):
          """Initialize LLM fallback system.
-
+
          Args:
              config: LLM configuration
-
+             cache_dir: Cache directory for cost tracking (defaults to config cache_dir)
+
          Raises:
              ImportError: If OpenAI library is not available
          """
@@ -92,36 +95,41 @@ class LLMFallback:
              raise ImportError(
                  "OpenAI library required for LLM fallback. Install with: pip install openai"
              )
-
+
          self.config = config
          self.logger = logging.getLogger(__name__)
-
+
          # Initialize OpenRouter client
          self.client = self._initialize_openrouter_client()
-
-         # Initialize utilities
-         self.cost_tracker = CostTracker(daily_budget=config.max_daily_cost)
+
+         # Initialize utilities with proper cache directory
+         cost_cache_dir = cache_dir / ".qualitative_cache" if cache_dir else None
+         self.cost_tracker = CostTracker(
+             cache_dir=cost_cache_dir, daily_budget=config.max_daily_cost
+         )
          self.model_router = ModelRouter(config, self.cost_tracker)
          self.text_processor = TextProcessor()
-
+
          # Batch processing cache
          self.batch_cache = {}
-
+
          # Token encoder for cost estimation
          try:
              self.encoding = tiktoken.get_encoding("cl100k_base")  # GPT-4 encoding
          except Exception:
              self.encoding = None
-             self.logger.warning("Could not load tiktoken encoder, token estimation may be inaccurate")
-
+             self.logger.warning(
+                 "Could not load tiktoken encoder, token estimation may be inaccurate"
+             )
+
          self.logger.info("LLM fallback system initialized with OpenRouter")
-
+
      def _initialize_openrouter_client(self) -> openai.OpenAI:
          """Initialize OpenRouter client with API key.
-
+
          Returns:
              Configured OpenAI client for OpenRouter
-
+
          Raises:
              ValueError: If API key is not configured
          """
@@ -130,117 +138,116 @@
              raise ValueError(
                  "OpenRouter API key not configured. Set OPENROUTER_API_KEY environment variable."
              )
-
+
          return openai.OpenAI(
              base_url=self.config.base_url,
              api_key=api_key,
              default_headers={
                  "HTTP-Referer": "https://github.com/bobmatnyc/gitflow-analytics",
-                 "X-Title": "GitFlow Analytics - Qualitative Analysis"
-             }
+                 "X-Title": "GitFlow Analytics - Qualitative Analysis",
+             },
          )
-
+
      def _resolve_api_key(self) -> Optional[str]:
          """Resolve OpenRouter API key from config or environment.
-
+
          Returns:
              API key string or None if not found
          """
          api_key = self.config.openrouter_api_key
-
+
          if api_key.startswith("${") and api_key.endswith("}"):
              env_var = api_key[2:-1]
              return os.environ.get(env_var)
          else:
              return api_key
-
-     def group_similar_commits(self, commits: List[Dict[str, Any]]) -> List[List[Dict[str, Any]]]:
+
+     def group_similar_commits(self, commits: list[dict[str, Any]]) -> list[list[dict[str, Any]]]:
          """Group similar commits for efficient batch processing.
-
+
          Args:
              commits: List of commit dictionaries
-
+
          Returns:
              List of commit groups
          """
          if not commits:
              return []
-
+
          groups = []
          similarity_threshold = self.config.similarity_threshold
-
+
          for commit in commits:
              # Find similar group or create new one
              placed = False
-
+
              for group in groups:
                  if len(group) >= self.config.max_group_size:
                      continue  # Group is full
-
+
                  # Calculate similarity with first commit in group
                  similarity = self.text_processor.calculate_message_similarity(
-                     commit.get('message', ''),
-                     group[0].get('message', '')
+                     commit.get("message", ""), group[0].get("message", "")
                  )
-
+
                  if similarity > similarity_threshold:
                      group.append(commit)
                      placed = True
                      break
-
+
              if not placed:
                  groups.append([commit])
-
+
          self.logger.debug(f"Grouped {len(commits)} commits into {len(groups)} groups")
          return groups
-
-     def process_group(self, commits: List[Dict[str, Any]]) -> List[QualitativeCommitData]:
+
+     def process_group(self, commits: list[dict[str, Any]]) -> list[QualitativeCommitData]:
          """Process a group of similar commits with OpenRouter.
-
+
          Args:
              commits: List of similar commit dictionaries
-
+
          Returns:
              List of QualitativeCommitData with LLM analysis
          """
          if not commits:
              return []
-
+
          start_time = time.time()
-
+
          # Check cache first
          cache_key = self._generate_group_cache_key(commits)
          if cache_key in self.batch_cache:
              self.logger.debug(f"Using cached result for {len(commits)} commits")
              template_result = self.batch_cache[cache_key]
              return self._apply_template_to_group(template_result, commits)
-
+
          # Assess complexity and select model
          complexity_score = self._assess_complexity(commits)
          selected_model = self.model_router.select_model(complexity_score, len(commits))
-
+
          self.logger.debug(
              f"Processing {len(commits)} commits with {selected_model} "
              f"(complexity: {complexity_score:.2f})"
          )
-
+
          # Build optimized prompt
          prompt = self._build_batch_classification_prompt(commits)
-
+
          # Estimate tokens and cost
          estimated_input_tokens = self._estimate_tokens(prompt)
          if not self.cost_tracker.can_afford_call(selected_model, estimated_input_tokens * 2):
              self.logger.warning("Cannot afford LLM call, using fallback model")
              selected_model = self.config.fallback_model
-
+
          # Make OpenRouter API call
          try:
              response = self._call_openrouter(prompt, selected_model)
              processing_time = time.time() - start_time
-
+
              # Parse response
              results = self._parse_llm_response(response, commits)
-
+
              # Track costs and performance
              estimated_output_tokens = self._estimate_tokens(response)
              self.cost_tracker.record_call(
@@ -249,22 +256,22 @@ class LLMFallback:
                  output_tokens=estimated_output_tokens,
                  processing_time=processing_time,
                  batch_size=len(commits),
-                 success=len(results) > 0
+                 success=len(results) > 0,
              )
-
+
              # Cache successful result
              if results:
                  self.batch_cache[cache_key] = self._create_template_from_results(results)
-
+
              # Update processing time in results
              for result in results:
                  result.processing_time_ms = (processing_time * 1000) / len(results)
-
+
              return results
-
+
          except Exception as e:
              self.logger.error(f"OpenRouter processing failed: {e}")
-
+
              # Record failed call
              self.cost_tracker.record_call(
                  model=selected_model,
@@ -273,25 +280,25 @@ class LLMFallback:
                  processing_time=time.time() - start_time,
                  batch_size=len(commits),
                  success=False,
-                 error_message=str(e)
+                 error_message=str(e),
              )
-
+
              # Try fallback model if primary failed
              if selected_model != self.config.fallback_model:
                  return self._retry_with_fallback_model(commits, prompt)
              else:
                  return self._create_fallback_results(commits)
-
+
      def _call_openrouter(self, prompt: str, model: str) -> str:
          """Make API call to OpenRouter with selected model.
-
+
          Args:
              prompt: Classification prompt
              model: Model to use
-
+
          Returns:
              Response content
-
+
          Raises:
              Exception: If API call fails
          """
@@ -300,52 +307,52 @@ class LLMFallback:
                  model=model,
                  messages=[
                      {
-                         "role": "system",
-                         "content": "You are an expert Git commit classifier. Analyze commits and respond only with valid JSON. Be concise but accurate."
+                         "role": "system",
+                         "content": "You are an expert Git commit classifier. Analyze commits and respond only with valid JSON. Be concise but accurate.",
                      },
-                     {"role": "user", "content": prompt}
+                     {"role": "user", "content": prompt},
                  ],
                  max_tokens=self.config.max_tokens,
                  temperature=self.config.temperature,
-                 stream=False
+                 stream=False,
              )
-
+
              return response.choices[0].message.content
-
+
          except Exception as e:
              self.logger.error(f"OpenRouter API call failed: {e}")
              raise
-
-     def _build_batch_classification_prompt(self, commits: List[Dict[str, Any]]) -> str:
+
+     def _build_batch_classification_prompt(self, commits: list[dict[str, Any]]) -> str:
          """Build optimized prompt for OpenRouter batch processing.
-
+
          Args:
              commits: List of commit dictionaries
-
+
          Returns:
              Formatted prompt string
          """
          # Limit to max group size for token management
-         commits_to_process = commits[:self.config.max_group_size]
-
+         commits_to_process = commits[: self.config.max_group_size]
+
          commit_data = []
          for i, commit in enumerate(commits_to_process, 1):
-             message = commit.get('message', '')[:150]  # Truncate long messages
-             files = commit.get('files_changed', [])
-
+             message = commit.get("message", "")[:150]  # Truncate long messages
+             files = commit.get("files_changed", [])
+
              # Include key file context
              files_context = ""
              if files:
                  key_files = files[:5]  # Top 5 files
                  files_context = f" | Modified: {', '.join(key_files)}"
-
+
              # Add size context
-             insertions = commit.get('insertions', 0)
-             deletions = commit.get('deletions', 0)
+             insertions = commit.get("insertions", 0)
+             deletions = commit.get("deletions", 0)
              size_context = f" | +{insertions}/-{deletions}"
-
+
              commit_data.append(f"{i}. {message}{files_context}{size_context}")
-
+
          prompt = f"""Analyze these Git commits and classify each one. Consider the commit message, modified files, and change size.

  Commits to classify:
@@ -363,134 +370,132 @@ Respond with JSON array only:
  [{{"id": 1, "change_type": "feature", "business_domain": "frontend", "risk_level": "low", "confidence": 0.9, "urgency": "routine", "complexity": "moderate"}}]"""

          return prompt
-
-     def _parse_llm_response(self, response: str, commits: List[Dict[str, Any]]) -> List[QualitativeCommitData]:
+
+     def _parse_llm_response(
+         self, response: str, commits: list[dict[str, Any]]
+     ) -> list[QualitativeCommitData]:
          """Parse LLM response into QualitativeCommitData objects.
-
+
          Args:
              response: JSON response from LLM
              commits: Original commit dictionaries
-
+
          Returns:
              List of QualitativeCommitData objects
          """
          try:
              # Clean response (remove any markdown formatting)
              cleaned_response = response.strip()
-             if cleaned_response.startswith('```json'):
+             if cleaned_response.startswith("```json"):
                  cleaned_response = cleaned_response[7:]
-             if cleaned_response.endswith('```'):
+             if cleaned_response.endswith("```"):
                  cleaned_response = cleaned_response[:-3]
              cleaned_response = cleaned_response.strip()
-
+
              classifications = json.loads(cleaned_response)
-
+
              if not isinstance(classifications, list):
                  raise ValueError("Response is not a JSON array")
-
+
              results = []
-
+
              for i, commit in enumerate(commits):
                  if i < len(classifications):
                      classification = classifications[i]
                  else:
                      # Fallback if fewer classifications than commits
                      classification = {
-                         'change_type': 'unknown',
-                         'business_domain': 'unknown',
-                         'risk_level': 'medium',
-                         'confidence': 0.5,
-                         'urgency': 'routine',
-                         'complexity': 'moderate'
+                         "change_type": "unknown",
+                         "business_domain": "unknown",
+                         "risk_level": "medium",
+                         "confidence": 0.5,
+                         "urgency": "routine",
+                         "complexity": "moderate",
                      }
-
+
                  result = QualitativeCommitData(
                      # Copy existing commit fields
-                     hash=commit.get('hash', ''),
-                     message=commit.get('message', ''),
-                     author_name=commit.get('author_name', ''),
-                     author_email=commit.get('author_email', ''),
-                     timestamp=commit.get('timestamp', time.time()),
-                     files_changed=commit.get('files_changed', []),
-                     insertions=commit.get('insertions', 0),
-                     deletions=commit.get('deletions', 0),
-
+                     hash=commit.get("hash", ""),
+                     message=commit.get("message", ""),
+                     author_name=commit.get("author_name", ""),
+                     author_email=commit.get("author_email", ""),
+                     timestamp=commit.get("timestamp", time.time()),
+                     files_changed=commit.get("files_changed", []),
+                     insertions=commit.get("insertions", 0),
+                     deletions=commit.get("deletions", 0),
                      # LLM-provided classifications
-                     change_type=classification.get('change_type', 'unknown'),
-                     change_type_confidence=classification.get('confidence', 0.5),
-                     business_domain=classification.get('business_domain', 'unknown'),
-                     domain_confidence=classification.get('confidence', 0.5),
-                     risk_level=classification.get('risk_level', 'medium'),
-                     risk_factors=classification.get('risk_factors', []),
-
+                     change_type=classification.get("change_type", "unknown"),
+                     change_type_confidence=classification.get("confidence", 0.5),
+                     business_domain=classification.get("business_domain", "unknown"),
+                     domain_confidence=classification.get("confidence", 0.5),
+                     risk_level=classification.get("risk_level", "medium"),
+                     risk_factors=classification.get("risk_factors", []),
                      # Intent signals from LLM analysis
                      intent_signals={
-                         'urgency': classification.get('urgency', 'routine'),
-                         'complexity': classification.get('complexity', 'moderate'),
-                         'confidence': classification.get('confidence', 0.5),
-                         'signals': [f"llm_classified:{classification.get('change_type', 'unknown')}"]
+                         "urgency": classification.get("urgency", "routine"),
+                         "complexity": classification.get("complexity", "moderate"),
+                         "confidence": classification.get("confidence", 0.5),
+                         "signals": [
+                             f"llm_classified:{classification.get('change_type', 'unknown')}"
+                         ],
                      },
                      collaboration_patterns={},
-                     technical_context={
-                         'llm_model': 'openrouter',
-                         'processing_method': 'batch'
-                     },
-
+                     technical_context={"llm_model": "openrouter", "processing_method": "batch"},
                      # Processing metadata
-                     processing_method='llm',
+                     processing_method="llm",
                      processing_time_ms=0,  # Set by caller
-                     confidence_score=classification.get('confidence', 0.5)
+                     confidence_score=classification.get("confidence", 0.5),
                  )
                  results.append(result)
-
+
              return results
-
+
          except (json.JSONDecodeError, KeyError, ValueError) as e:
              self.logger.error(f"Failed to parse LLM response: {e}")
              self.logger.debug(f"Raw response: {response}")
              return self._create_fallback_results(commits)
-
-     def _assess_complexity(self, commits: List[Dict[str, Any]]) -> float:
+
+     def _assess_complexity(self, commits: list[dict[str, Any]]) -> float:
          """Assess complexity of commits for model selection.
-
+
          Args:
              commits: List of commit dictionaries
-
+
          Returns:
              Complexity score (0.0 to 1.0)
          """
          if not commits:
              return 0.0
-
+
          total_complexity = 0.0
-
+
          for commit in commits:
              # Message complexity
-             message = commit.get('message', '')
+             message = commit.get("message", "")
              message_complexity = min(1.0, len(message.split()) / 20.0)
-
+
              # File change complexity
-             files_changed = len(commit.get('files_changed', []))
+             files_changed = len(commit.get("files_changed", []))
              file_complexity = min(1.0, files_changed / 15.0)
-
+
              # Size complexity
-             total_changes = commit.get('insertions', 0) + commit.get('deletions', 0)
+             total_changes = commit.get("insertions", 0) + commit.get("deletions", 0)
              size_complexity = min(1.0, total_changes / 200.0)
-
+
              # Combine complexities
-             commit_complexity = (message_complexity * 0.3 +
-                                  file_complexity * 0.4 +
-                                  size_complexity * 0.3)
+             commit_complexity = (
+                 message_complexity * 0.3 + file_complexity * 0.4 + size_complexity * 0.3
+             )
              total_complexity += commit_complexity
-
+
          return total_complexity / len(commits)
-
+
      def _estimate_tokens(self, text: str) -> int:
          """Estimate token count for text.
-
+
          Args:
              text: Text to count tokens for
-
+
          Returns:
              Estimated token count
          """
@@ -499,105 +504,104 @@ Respond with JSON array only:
                  return len(self.encoding.encode(text))
              except Exception:
                  pass
-
+
          # Fallback estimation (roughly 4 characters per token)
          return len(text) // 4
-
-     def _generate_group_cache_key(self, commits: List[Dict[str, Any]]) -> str:
+
+     def _generate_group_cache_key(self, commits: list[dict[str, Any]]) -> str:
          """Generate cache key for a group of commits.
-
+
          Args:
              commits: List of commit dictionaries
-
+
          Returns:
              Cache key string
          """
          # Create fingerprint from commit messages and file patterns
          fingerprints = []
          for commit in commits:
-             message = commit.get('message', '')
-             files = commit.get('files_changed', [])
+             message = commit.get("message", "")
+             files = commit.get("files_changed", [])
              fingerprint = self.text_processor.create_semantic_fingerprint(message, files)
              fingerprints.append(fingerprint)
-
-         combined_fingerprint = '|'.join(sorted(fingerprints))
+
+         combined_fingerprint = "|".join(sorted(fingerprints))
          return hashlib.md5(combined_fingerprint.encode()).hexdigest()
-
-     def _create_template_from_results(self, results: List[QualitativeCommitData]) -> Dict[str, Any]:
+
+     def _create_template_from_results(self, results: list[QualitativeCommitData]) -> dict[str, Any]:
          """Create a template from successful results for caching.
-
+
          Args:
              results: List of analysis results
-
+
          Returns:
              Template dictionary
          """
          if not results:
              return {}
-
+
          # Use first result as template
          template = results[0]
          return {
-             'change_type': template.change_type,
-             'business_domain': template.business_domain,
-             'risk_level': template.risk_level,
-             'confidence_score': template.confidence_score
+             "change_type": template.change_type,
+             "business_domain": template.business_domain,
+             "risk_level": template.risk_level,
+             "confidence_score": template.confidence_score,
          }
-
-     def _apply_template_to_group(self, template: Dict[str, Any],
-                                  commits: List[Dict[str, Any]]) -> List[QualitativeCommitData]:
+
+     def _apply_template_to_group(
+         self, template: dict[str, Any], commits: list[dict[str, Any]]
+     ) -> list[QualitativeCommitData]:
          """Apply cached template to a group of commits.
-
+
          Args:
              template: Cached analysis template
              commits: List of commit dictionaries
-
+
          Returns:
              List of QualitativeCommitData using template
          """
          results = []
-
+
          for commit in commits:
              result = QualitativeCommitData(
                  # Copy existing commit fields
-                 hash=commit.get('hash', ''),
-                 message=commit.get('message', ''),
-                 author_name=commit.get('author_name', ''),
-                 author_email=commit.get('author_email', ''),
-                 timestamp=commit.get('timestamp', time.time()),
-                 files_changed=commit.get('files_changed', []),
-                 insertions=commit.get('insertions', 0),
-                 deletions=commit.get('deletions', 0),
-
+                 hash=commit.get("hash", ""),
+                 message=commit.get("message", ""),
+                 author_name=commit.get("author_name", ""),
+                 author_email=commit.get("author_email", ""),
+                 timestamp=commit.get("timestamp", time.time()),
+                 files_changed=commit.get("files_changed", []),
+                 insertions=commit.get("insertions", 0),
+                 deletions=commit.get("deletions", 0),
                  # Apply template values
-                 change_type=template.get('change_type', 'unknown'),
-                 change_type_confidence=template.get('confidence_score', 0.5),
-                 business_domain=template.get('business_domain', 'unknown'),
-                 domain_confidence=template.get('confidence_score', 0.5),
-                 risk_level=template.get('risk_level', 'medium'),
+                 change_type=template.get("change_type", "unknown"),
+                 change_type_confidence=template.get("confidence_score", 0.5),
+                 business_domain=template.get("business_domain", "unknown"),
+                 domain_confidence=template.get("confidence_score", 0.5),
+                 risk_level=template.get("risk_level", "medium"),
                  risk_factors=[],
-
-                 intent_signals={'confidence': template.get('confidence_score', 0.5)},
+                 intent_signals={"confidence": template.get("confidence_score", 0.5)},
                  collaboration_patterns={},
-                 technical_context={'processing_method': 'cached_template'},
-
+                 technical_context={"processing_method": "cached_template"},
                  # Processing metadata
-                 processing_method='llm',
+                 processing_method="llm",
                  processing_time_ms=1.0,  # Very fast for cached results
-                 confidence_score=template.get('confidence_score', 0.5)
+                 confidence_score=template.get("confidence_score", 0.5),
              )
              results.append(result)
-
+
          return results
-
-     def _retry_with_fallback_model(self, commits: List[Dict[str, Any]],
-                                    prompt: str) -> List[QualitativeCommitData]:
+
+     def _retry_with_fallback_model(
+         self, commits: list[dict[str, Any]], prompt: str
+     ) -> list[QualitativeCommitData]:
          """Retry processing with fallback model.
-
+
          Args:
              commits: List of commit dictionaries
              prompt: Classification prompt
-
+
          Returns:
              List of QualitativeCommitData or fallback results
          """
@@ -608,46 +612,46 @@ Respond with JSON array only:
          except Exception as e:
              self.logger.error(f"Fallback model also failed: {e}")
              return self._create_fallback_results(commits)
-
-     def _create_fallback_results(self, commits: List[Dict[str, Any]]) -> List[QualitativeCommitData]:
+
+     def _create_fallback_results(
+         self, commits: list[dict[str, Any]]
+     ) -> list[QualitativeCommitData]:
          """Create fallback results when LLM processing fails.
-
+
          Args:
              commits: List of commit dictionaries
-
+
          Returns:
              List of QualitativeCommitData with default values
          """
          results = []
-
+
          for commit in commits:
              result = QualitativeCommitData(
                  # Basic commit info
-                 hash=commit.get('hash', ''),
-                 message=commit.get('message', ''),
-                 author_name=commit.get('author_name', ''),
-                 author_email=commit.get('author_email', ''),
-                 timestamp=commit.get('timestamp', time.time()),
-                 files_changed=commit.get('files_changed', []),
-                 insertions=commit.get('insertions', 0),
-                 deletions=commit.get('deletions', 0),
-
+                 hash=commit.get("hash", ""),
+                 message=commit.get("message", ""),
+                 author_name=commit.get("author_name", ""),
+                 author_email=commit.get("author_email", ""),
+                 timestamp=commit.get("timestamp", time.time()),
+                 files_changed=commit.get("files_changed", []),
+                 insertions=commit.get("insertions", 0),
+                 deletions=commit.get("deletions", 0),
                  # Default classifications
-                 change_type='unknown',
+                 change_type="unknown",
                  change_type_confidence=0.0,
-                 business_domain='unknown',
+                 business_domain="unknown",
                  domain_confidence=0.0,
-                 risk_level='medium',
-                 risk_factors=['llm_processing_failed'],
-                 intent_signals={'confidence': 0.0},
+                 risk_level="medium",
+                 risk_factors=["llm_processing_failed"],
+                 intent_signals={"confidence": 0.0},
                  collaboration_patterns={},
-                 technical_context={'processing_method': 'fallback'},
-
+                 technical_context={"processing_method": "fallback"},
                  # Processing metadata
-                 processing_method='llm',
+                 processing_method="llm",
                  processing_time_ms=0.0,
-                 confidence_score=0.0
+                 confidence_score=0.0,
              )
              results.append(result)
-
-         return results
+
+         return results
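
The hunks above cover gitflow_analytics/qualitative/core/llm_fallback.py (entry 63 in the file list). Most of the churn is mechanical formatter output: double-quoted strings, trailing commas, and built-in generics (list[dict[str, Any]] in place of typing.List/Dict). The one behavioral change is the new optional cache_dir parameter on LLMFallback.__init__, which routes CostTracker persistence into <cache_dir>/.qualitative_cache; omitting it passes cache_dir=None through to CostTracker. A minimal usage sketch against the 1.3.11 API follows; the LLMConfig fields shown are the ones this diff itself references, and treating its remaining fields as defaults is an assumption, not something the diff confirms.

    # Sketch only, not taken from the package: exercises the new cache_dir
    # argument visible in the __init__ diff above.
    from pathlib import Path

    from gitflow_analytics.qualitative.core.llm_fallback import LLMFallback
    from gitflow_analytics.qualitative.models.schemas import LLMConfig

    config = LLMConfig(
        # "${VAR}" values are resolved from the environment by _resolve_api_key()
        openrouter_api_key="${OPENROUTER_API_KEY}",
        max_daily_cost=5.0,  # USD; enforced by CostTracker and ModelRouter
    )

    # New in 1.3.11: cost-tracking state persists under <cache_dir>/.qualitative_cache
    fallback = LLMFallback(config, cache_dir=Path(".gitflow-cache"))

    commits = [
        {
            "message": "fix: handle empty webhook payloads",
            "files_changed": ["api/webhooks.py"],
            "insertions": 12,
            "deletions": 3,
        },
    ]

    # Similar commits are grouped, then each group is classified in one batched call
    for group in fallback.group_similar_commits(commits):
        for data in fallback.process_group(group):
            print(data.change_type, data.confidence_score)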