gitflow-analytics: 1.0.3-py3-none-any.whl → 1.3.6-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (116)
  1. gitflow_analytics/_version.py +1 -1
  2. gitflow_analytics/classification/__init__.py +31 -0
  3. gitflow_analytics/classification/batch_classifier.py +752 -0
  4. gitflow_analytics/classification/classifier.py +464 -0
  5. gitflow_analytics/classification/feature_extractor.py +725 -0
  6. gitflow_analytics/classification/linguist_analyzer.py +574 -0
  7. gitflow_analytics/classification/model.py +455 -0
  8. gitflow_analytics/cli.py +4108 -350
  9. gitflow_analytics/cli_rich.py +198 -48
  10. gitflow_analytics/config/__init__.py +43 -0
  11. gitflow_analytics/config/errors.py +261 -0
  12. gitflow_analytics/config/loader.py +904 -0
  13. gitflow_analytics/config/profiles.py +264 -0
  14. gitflow_analytics/config/repository.py +124 -0
  15. gitflow_analytics/config/schema.py +441 -0
  16. gitflow_analytics/config/validator.py +154 -0
  17. gitflow_analytics/config.py +44 -508
  18. gitflow_analytics/core/analyzer.py +1209 -98
  19. gitflow_analytics/core/cache.py +1337 -29
  20. gitflow_analytics/core/data_fetcher.py +1193 -0
  21. gitflow_analytics/core/identity.py +363 -14
  22. gitflow_analytics/core/metrics_storage.py +526 -0
  23. gitflow_analytics/core/progress.py +372 -0
  24. gitflow_analytics/core/schema_version.py +269 -0
  25. gitflow_analytics/extractors/ml_tickets.py +1100 -0
  26. gitflow_analytics/extractors/story_points.py +8 -1
  27. gitflow_analytics/extractors/tickets.py +749 -11
  28. gitflow_analytics/identity_llm/__init__.py +6 -0
  29. gitflow_analytics/identity_llm/analysis_pass.py +231 -0
  30. gitflow_analytics/identity_llm/analyzer.py +464 -0
  31. gitflow_analytics/identity_llm/models.py +76 -0
  32. gitflow_analytics/integrations/github_integration.py +175 -11
  33. gitflow_analytics/integrations/jira_integration.py +461 -24
  34. gitflow_analytics/integrations/orchestrator.py +124 -1
  35. gitflow_analytics/metrics/activity_scoring.py +322 -0
  36. gitflow_analytics/metrics/branch_health.py +470 -0
  37. gitflow_analytics/metrics/dora.py +379 -20
  38. gitflow_analytics/models/database.py +843 -53
  39. gitflow_analytics/pm_framework/__init__.py +115 -0
  40. gitflow_analytics/pm_framework/adapters/__init__.py +50 -0
  41. gitflow_analytics/pm_framework/adapters/jira_adapter.py +1845 -0
  42. gitflow_analytics/pm_framework/base.py +406 -0
  43. gitflow_analytics/pm_framework/models.py +211 -0
  44. gitflow_analytics/pm_framework/orchestrator.py +652 -0
  45. gitflow_analytics/pm_framework/registry.py +333 -0
  46. gitflow_analytics/qualitative/__init__.py +9 -10
  47. gitflow_analytics/qualitative/chatgpt_analyzer.py +259 -0
  48. gitflow_analytics/qualitative/classifiers/__init__.py +3 -3
  49. gitflow_analytics/qualitative/classifiers/change_type.py +518 -244
  50. gitflow_analytics/qualitative/classifiers/domain_classifier.py +272 -165
  51. gitflow_analytics/qualitative/classifiers/intent_analyzer.py +321 -222
  52. gitflow_analytics/qualitative/classifiers/llm/__init__.py +35 -0
  53. gitflow_analytics/qualitative/classifiers/llm/base.py +193 -0
  54. gitflow_analytics/qualitative/classifiers/llm/batch_processor.py +383 -0
  55. gitflow_analytics/qualitative/classifiers/llm/cache.py +479 -0
  56. gitflow_analytics/qualitative/classifiers/llm/cost_tracker.py +435 -0
  57. gitflow_analytics/qualitative/classifiers/llm/openai_client.py +403 -0
  58. gitflow_analytics/qualitative/classifiers/llm/prompts.py +373 -0
  59. gitflow_analytics/qualitative/classifiers/llm/response_parser.py +287 -0
  60. gitflow_analytics/qualitative/classifiers/llm_commit_classifier.py +607 -0
  61. gitflow_analytics/qualitative/classifiers/risk_analyzer.py +215 -189
  62. gitflow_analytics/qualitative/core/__init__.py +4 -4
  63. gitflow_analytics/qualitative/core/llm_fallback.py +239 -235
  64. gitflow_analytics/qualitative/core/nlp_engine.py +157 -148
  65. gitflow_analytics/qualitative/core/pattern_cache.py +214 -192
  66. gitflow_analytics/qualitative/core/processor.py +381 -248
  67. gitflow_analytics/qualitative/enhanced_analyzer.py +2236 -0
  68. gitflow_analytics/qualitative/example_enhanced_usage.py +420 -0
  69. gitflow_analytics/qualitative/models/__init__.py +7 -7
  70. gitflow_analytics/qualitative/models/schemas.py +155 -121
  71. gitflow_analytics/qualitative/utils/__init__.py +4 -4
  72. gitflow_analytics/qualitative/utils/batch_processor.py +136 -123
  73. gitflow_analytics/qualitative/utils/cost_tracker.py +142 -140
  74. gitflow_analytics/qualitative/utils/metrics.py +172 -158
  75. gitflow_analytics/qualitative/utils/text_processing.py +146 -104
  76. gitflow_analytics/reports/__init__.py +100 -0
  77. gitflow_analytics/reports/analytics_writer.py +539 -14
  78. gitflow_analytics/reports/base.py +648 -0
  79. gitflow_analytics/reports/branch_health_writer.py +322 -0
  80. gitflow_analytics/reports/classification_writer.py +924 -0
  81. gitflow_analytics/reports/cli_integration.py +427 -0
  82. gitflow_analytics/reports/csv_writer.py +1676 -212
  83. gitflow_analytics/reports/data_models.py +504 -0
  84. gitflow_analytics/reports/database_report_generator.py +427 -0
  85. gitflow_analytics/reports/example_usage.py +344 -0
  86. gitflow_analytics/reports/factory.py +499 -0
  87. gitflow_analytics/reports/formatters.py +698 -0
  88. gitflow_analytics/reports/html_generator.py +1116 -0
  89. gitflow_analytics/reports/interfaces.py +489 -0
  90. gitflow_analytics/reports/json_exporter.py +2770 -0
  91. gitflow_analytics/reports/narrative_writer.py +2287 -158
  92. gitflow_analytics/reports/story_point_correlation.py +1144 -0
  93. gitflow_analytics/reports/weekly_trends_writer.py +389 -0
  94. gitflow_analytics/training/__init__.py +5 -0
  95. gitflow_analytics/training/model_loader.py +377 -0
  96. gitflow_analytics/training/pipeline.py +550 -0
  97. gitflow_analytics/tui/__init__.py +1 -1
  98. gitflow_analytics/tui/app.py +129 -126
  99. gitflow_analytics/tui/screens/__init__.py +3 -3
  100. gitflow_analytics/tui/screens/analysis_progress_screen.py +188 -179
  101. gitflow_analytics/tui/screens/configuration_screen.py +154 -178
  102. gitflow_analytics/tui/screens/loading_screen.py +100 -110
  103. gitflow_analytics/tui/screens/main_screen.py +89 -72
  104. gitflow_analytics/tui/screens/results_screen.py +305 -281
  105. gitflow_analytics/tui/widgets/__init__.py +2 -2
  106. gitflow_analytics/tui/widgets/data_table.py +67 -69
  107. gitflow_analytics/tui/widgets/export_modal.py +76 -76
  108. gitflow_analytics/tui/widgets/progress_widget.py +41 -46
  109. gitflow_analytics-1.3.6.dist-info/METADATA +1015 -0
  110. gitflow_analytics-1.3.6.dist-info/RECORD +122 -0
  111. gitflow_analytics-1.0.3.dist-info/METADATA +0 -490
  112. gitflow_analytics-1.0.3.dist-info/RECORD +0 -62
  113. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.6.dist-info}/WHEEL +0 -0
  114. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.6.dist-info}/entry_points.txt +0 -0
  115. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.6.dist-info}/licenses/LICENSE +0 -0
  116. {gitflow_analytics-1.0.3.dist-info → gitflow_analytics-1.3.6.dist-info}/top_level.txt +0 -0
gitflow_analytics/qualitative/classifiers/change_type.py
@@ -1,214 +1,482 @@
 """Change type classifier using semantic analysis of commit messages."""
 
+import importlib.util
 import logging
 import re
-from typing import Dict, List, Tuple, Set, Any, Optional
-from pathlib import Path
+from typing import Any, Optional
 
 from ..models.schemas import ChangeTypeConfig
 
-try:
-    import spacy
+# Check if spacy is available without importing it
+SPACY_AVAILABLE = importlib.util.find_spec("spacy") is not None
+
+if SPACY_AVAILABLE:
     from spacy.tokens import Doc
-    SPACY_AVAILABLE = True
-except ImportError:
-    SPACY_AVAILABLE = False
+else:
     Doc = Any
 
 
 class ChangeTypeClassifier:
     """Classify commits by change type using semantic analysis.
-
+
     This classifier determines the type of change represented by a commit
     (feature, bugfix, refactor, etc.) by analyzing the commit message semantics
     and file patterns.
-
+
     The classification uses a combination of:
     - Semantic keyword matching with action/object/context patterns
     - File pattern analysis for additional signals
    - Rule-based patterns for common commit message formats
     """
-
+
     def __init__(self, config: ChangeTypeConfig):
         """Initialize change type classifier.
-
+
         Args:
             config: Configuration for change type classification
         """
         self.config = config
         self.logger = logging.getLogger(__name__)
-
+
         # Define semantic patterns for each change type
         self.change_patterns = {
-            'feature': {
-                'action_words': {
-                    'add', 'implement', 'create', 'build', 'introduce', 'develop',
-                    'enable', 'support', 'allow', 'provide', 'include'
+            "feature": {
+                "action_words": {
+                    "add",
+                    "implement",
+                    "create",
+                    "build",
+                    "introduce",
+                    "develop",
+                    "enable",
+                    "support",
+                    "allow",
+                    "provide",
+                    "include",
+                    "addition",
+                    "initialize",
+                    "prepare",
+                    "extend",
+                },
+                "object_words": {
+                    "feature",
+                    "functionality",
+                    "capability",
+                    "component",
+                    "module",
+                    "endpoint",
+                    "api",
+                    "service",
+                    "interface",
+                    "system",
+                    "integration",
+                    "column",
+                    "field",
+                    "property",
+                },
+                "context_words": {
+                    "new",
+                    "initial",
+                    "first",
+                    "user",
+                    "client",
+                    "support",
+                    "enhancement",
+                    "improvement",
+                    "missing",
+                    "space",
+                    "sticky",
+                },
+            },
+            "bugfix": {
+                "action_words": {
+                    "fix",
+                    "resolve",
+                    "correct",
+                    "repair",
+                    "patch",
+                    "address",
+                    "handle",
+                    "solve",
+                    "debug",
+                    "prevent",
+                    "corrected",
+                },
+                "object_words": {
+                    "bug",
+                    "issue",
+                    "problem",
+                    "error",
+                    "defect",
+                    "exception",
+                    "crash",
+                    "failure",
+                    "leak",
+                    "regression",
+                    "beacon",
+                    "beacons",
                 },
-                'object_words': {
-                    'feature', 'functionality', 'capability', 'component', 'module',
-                    'endpoint', 'api', 'service', 'interface', 'system'
+                "context_words": {
+                    "broken",
+                    "failing",
+                    "incorrect",
+                    "wrong",
+                    "invalid",
+                    "missing",
+                    "null",
+                    "undefined",
+                    "not",
+                    "allowing",
                 },
-                'context_words': {
-                    'new', 'initial', 'first', 'user', 'client', 'support',
-                    'enhancement', 'improvement'
-                }
             },
-            'bugfix': {
-                'action_words': {
-                    'fix', 'resolve', 'correct', 'repair', 'patch', 'address',
-                    'handle', 'solve', 'debug', 'prevent'
+            "refactor": {
+                "action_words": {
+                    "refactor",
+                    "restructure",
+                    "reorganize",
+                    "cleanup",
+                    "simplify",
+                    "optimize",
+                    "improve",
+                    "enhance",
+                    "streamline",
+                    "consolidate",
+                    "refine",
+                    "ensure",
+                    "replace",
+                    "improves",
                 },
-                'object_words': {
-                    'bug', 'issue', 'problem', 'error', 'defect', 'exception',
-                    'crash', 'failure', 'leak', 'regression'
+                "object_words": {
+                    "code",
+                    "structure",
+                    "architecture",
+                    "design",
+                    "logic",
+                    "method",
+                    "function",
+                    "class",
+                    "module",
+                    "combo",
+                    "behavior",
+                    "focus",
+                },
+                "context_words": {
+                    "better",
+                    "cleaner",
+                    "simpler",
+                    "efficient",
+                    "maintainable",
+                    "readable",
+                    "performance",
+                    "box",
+                    "hacking",
                 },
-                'context_words': {
-                    'broken', 'failing', 'incorrect', 'wrong', 'invalid',
-                    'missing', 'null', 'undefined'
-                }
             },
-            'refactor': {
-                'action_words': {
-                    'refactor', 'restructure', 'reorganize', 'cleanup', 'simplify',
-                    'optimize', 'improve', 'enhance', 'streamline', 'consolidate'
+            "docs": {
+                "action_words": {
+                    "update",
+                    "add",
+                    "improve",
+                    "write",
+                    "document",
+                    "clarify",
+                    "explain",
+                    "describe",
+                    "detail",
+                    "added",
+                },
+                "object_words": {
+                    "documentation",
+                    "readme",
+                    "docs",
+                    "comment",
+                    "docstring",
+                    "guide",
+                    "tutorial",
+                    "example",
+                    "specification",
+                    "translations",
+                    "spanish",
+                    "label",
                 },
-                'object_words': {
-                    'code', 'structure', 'architecture', 'design', 'logic',
-                    'method', 'function', 'class', 'module'
+                "context_words": {
+                    "explain",
+                    "clarify",
+                    "describe",
+                    "instruction",
+                    "help",
+                    "change",
+                    "dynamically",
+                    "language",
                 },
-                'context_words': {
-                    'better', 'cleaner', 'simpler', 'efficient', 'maintainable',
-                    'readable', 'performance'
-                }
             },
-            'docs': {
-                'action_words': {
-                    'update', 'add', 'improve', 'write', 'document', 'clarify',
-                    'explain', 'describe', 'detail'
+            "test": {
+                "action_words": {
+                    "add",
+                    "update",
+                    "fix",
+                    "improve",
+                    "write",
+                    "create",
+                    "enhance",
+                    "extend",
+                },
+                "object_words": {
+                    "test",
+                    "spec",
+                    "coverage",
+                    "unit",
+                    "integration",
+                    "e2e",
+                    "testing",
+                    "mock",
+                    "stub",
+                    "fixture",
                 },
-                'object_words': {
-                    'documentation', 'readme', 'docs', 'comment', 'docstring',
-                    'guide', 'tutorial', 'example', 'specification'
+                "context_words": {
+                    "testing",
+                    "verify",
+                    "validate",
+                    "check",
+                    "ensure",
+                    "coverage",
+                    "assertion",
                 },
-                'context_words': {
-                    'explain', 'clarify', 'describe', 'instruction', 'help'
-                }
             },
-            'test': {
-                'action_words': {
-                    'add', 'update', 'fix', 'improve', 'write', 'create',
-                    'enhance', 'extend'
+            "chore": {
+                "action_words": {
+                    "update",
+                    "bump",
+                    "upgrade",
+                    "configure",
+                    "setup",
+                    "install",
+                    "remove",
+                    "delete",
+                    "clean",
+                    "sync",
+                    "merge",
                 },
-                'object_words': {
-                    'test', 'spec', 'coverage', 'unit', 'integration', 'e2e',
-                    'testing', 'mock', 'stub', 'fixture'
+                "object_words": {
+                    "dependency",
+                    "package",
+                    "config",
+                    "configuration",
+                    "build",
+                    "version",
+                    "tool",
+                    "script",
+                    "workflow",
+                    "console",
+                    "log",
+                    "main",
+                },
+                "context_words": {
+                    "maintenance",
+                    "housekeeping",
+                    "routine",
+                    "automated",
+                    "ci",
+                    "cd",
+                    "pipeline",
+                    "auto",
+                    "removal",
                 },
-                'context_words': {
-                    'testing', 'verify', 'validate', 'check', 'ensure',
-                    'coverage', 'assertion'
-                }
             },
-            'chore': {
-                'action_words': {
-                    'update', 'bump', 'upgrade', 'configure', 'setup', 'install',
-                    'remove', 'delete', 'clean'
+            "security": {
+                "action_words": {
+                    "fix",
+                    "secure",
+                    "protect",
+                    "validate",
+                    "sanitize",
+                    "encrypt",
+                    "authenticate",
+                    "authorize",
+                },
+                "object_words": {
+                    "security",
+                    "vulnerability",
+                    "exploit",
+                    "xss",
+                    "csrf",
+                    "injection",
+                    "authentication",
+                    "authorization",
+                    "permission",
                 },
-                'object_words': {
-                    'dependency', 'package', 'config', 'configuration', 'build',
-                    'version', 'tool', 'script', 'workflow'
+                "context_words": {
+                    "secure",
+                    "safe",
+                    "protected",
+                    "validated",
+                    "sanitized",
+                    "encrypted",
+                    "threat",
+                    "attack",
                 },
-                'context_words': {
-                    'maintenance', 'housekeeping', 'routine', 'automated',
-                    'ci', 'cd', 'pipeline'
-                }
             },
-            'security': {
-                'action_words': {
-                    'fix', 'secure', 'protect', 'validate', 'sanitize',
-                    'encrypt', 'authenticate', 'authorize'
+            "hotfix": {
+                "action_words": {"hotfix", "fix", "patch", "urgent", "critical", "emergency"},
+                "object_words": {
+                    "production",
+                    "critical",
+                    "urgent",
+                    "emergency",
+                    "hotfix",
+                    "issue",
+                    "bug",
+                    "problem",
                 },
-                'object_words': {
-                    'security', 'vulnerability', 'exploit', 'xss', 'csrf',
-                    'injection', 'authentication', 'authorization', 'permission'
+                "context_words": {
+                    "urgent",
+                    "critical",
+                    "immediate",
+                    "production",
+                    "live",
+                    "emergency",
+                    "asap",
                 },
-                'context_words': {
-                    'secure', 'safe', 'protected', 'validated', 'sanitized',
-                    'encrypted', 'threat', 'attack'
-                }
             },
-            'hotfix': {
-                'action_words': {
-                    'hotfix', 'fix', 'patch', 'urgent', 'critical', 'emergency'
+            "config": {
+                "action_words": {
+                    "configure",
+                    "setup",
+                    "adjust",
+                    "modify",
+                    "change",
+                    "update",
+                    "tweak",
+                    "changing",
+                },
+                "object_words": {
+                    "config",
+                    "configuration",
+                    "settings",
+                    "environment",
+                    "parameter",
+                    "option",
+                    "flag",
+                    "variable",
+                    "roles",
+                    "user",
+                    "schema",
+                    "access",
+                    "levels",
                 },
-                'object_words': {
-                    'production', 'critical', 'urgent', 'emergency', 'hotfix',
-                    'issue', 'bug', 'problem'
+                "context_words": {
+                    "environment",
+                    "production",
+                    "development",
+                    "staging",
+                    "deployment",
+                    "setup",
+                    "roles",
+                    "permission",
+                    "api",
                 },
-                'context_words': {
-                    'urgent', 'critical', 'immediate', 'production', 'live',
-                    'emergency', 'asap'
-                }
             },
-            'config': {
-                'action_words': {
-                    'configure', 'setup', 'adjust', 'modify', 'change',
-                    'update', 'tweak'
+            "integration": {
+                "action_words": {
+                    "integrate",
+                    "add",
+                    "implement",
+                    "connect",
+                    "setup",
+                    "remove",
+                    "extend",
+                    "removing",
                 },
-                'object_words': {
-                    'config', 'configuration', 'settings', 'environment',
-                    'parameter', 'option', 'flag', 'variable'
+                "object_words": {
+                    "integration",
+                    "posthog",
+                    "iubenda",
+                    "auth0",
+                    "oauth",
+                    "api",
+                    "service",
+                    "third-party",
+                    "external",
+                    "mena",
                 },
-                'context_words': {
-                    'environment', 'production', 'development', 'staging',
-                    'deployment', 'setup'
-                }
-            }
+                "context_words": {
+                    "collection",
+                    "data",
+                    "privacy",
+                    "policy",
+                    "implementation",
+                    "access",
+                    "redirect",
+                },
+            },
         }
-
+
         # File pattern signals for change types
         self.file_patterns = {
-            'test': [
-                r'.*test.*\.py$', r'.*spec.*\.js$', r'.*test.*\.java$',
-                r'test_.*\.py$', r'.*_test\.go$', r'.*\.test\.(js|ts)$',
-                r'__tests__/.*', r'tests?/.*', r'spec/.*'
+            "test": [
+                r".*test.*\.py$",
+                r".*spec.*\.js$",
+                r".*test.*\.java$",
+                r"test_.*\.py$",
+                r".*_test\.go$",
+                r".*\.test\.(js|ts)$",
+                r"__tests__/.*",
+                r"tests?/.*",
+                r"spec/.*",
             ],
-            'docs': [
-                r'.*\.md$', r'.*\.rst$', r'.*\.txt$', r'README.*',
-                r'CHANGELOG.*', r'docs?/.*', r'documentation/.*'
+            "docs": [
+                r".*\.md$",
+                r".*\.rst$",
+                r".*\.txt$",
+                r"README.*",
+                r"CHANGELOG.*",
+                r"docs?/.*",
+                r"documentation/.*",
            ],
-            'config': [
-                r'.*\.ya?ml$', r'.*\.json$', r'.*\.toml$', r'.*\.ini$',
-                r'.*\.env.*', r'Dockerfile.*', r'.*config.*', r'\.github/.*'
+            "config": [
+                r".*\.ya?ml$",
+                r".*\.json$",
+                r".*\.toml$",
+                r".*\.ini$",
+                r".*\.env.*",
+                r"Dockerfile.*",
+                r".*config.*",
+                r"\.github/.*",
+            ],
+            "chore": [
+                r"package.*\.json$",
+                r"requirements.*\.txt$",
+                r"Pipfile.*",
+                r"pom\.xml$",
+                r"build\.gradle$",
+                r".*\.lock$",
             ],
-            'chore': [
-                r'package.*\.json$', r'requirements.*\.txt$', r'Pipfile.*',
-                r'pom\.xml$', r'build\.gradle$', r'.*\.lock$'
-            ]
         }
-
+
         # Compile regex patterns for efficiency
         self._compile_file_patterns()
-
+
         # Common commit message prefixes
         self.prefix_patterns = {
-            'feat': 'feature',
-            'feature': 'feature',
-            'fix': 'bugfix',
-            'bugfix': 'bugfix',
-            'refactor': 'refactor',
-            'docs': 'docs',
-            'test': 'test',
-            'chore': 'chore',
-            'security': 'security',
-            'hotfix': 'hotfix',
-            'config': 'config',
-            'style': 'chore', # Style changes are usually chores
-            'perf': 'refactor', # Performance improvements are refactoring
-            'build': 'chore',
-            'ci': 'chore'
+            "feat": "feature",
+            "feature": "feature",
+            "fix": "bugfix",
+            "bugfix": "bugfix",
+            "refactor": "refactor",
+            "docs": "docs",
+            "test": "test",
+            "chore": "chore",
+            "security": "security",
+            "hotfix": "hotfix",
+            "config": "config",
+            "integration": "integration",
+            "integrate": "integration",
+            "style": "chore",  # Style changes are usually chores
+            "perf": "refactor",  # Performance improvements are refactoring
+            "build": "chore",
+            "ci": "chore",
         }
-
+
     def _compile_file_patterns(self) -> None:
         """Compile regex patterns for file matching."""
         self.compiled_file_patterns = {}
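For reference, the "chore" file patterns added above feed `_analyze_file_patterns` (second hunk below), which scores a change type by the proportion of changed files matching its patterns. A minimal standalone sketch of that signal, under assumed names (`CHORE_PATTERNS` and `chore_file_score` are illustrative, not part of the package API):

import re

# Illustrative sketch: the new "chore" patterns from the hunk above, scored
# the way _analyze_file_patterns scores them (proportion of matching files).
CHORE_PATTERNS = [
    re.compile(p, re.IGNORECASE)
    for p in [
        r"package.*\.json$",
        r"requirements.*\.txt$",
        r"Pipfile.*",
        r"pom\.xml$",
        r"build\.gradle$",
        r".*\.lock$",
    ]
]

def chore_file_score(files: list[str]) -> float:
    """Confidence = share of changed files that look like dependency/build files."""
    if not files:
        return 0.0
    matching = sum(1 for f in files if any(p.search(f) for p in CHORE_PATTERNS))
    return min(1.0, matching / len(files))

print(chore_file_score(["package-lock.json", "src/app.ts"]))  # 0.5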
@@ -216,253 +484,259 @@ class ChangeTypeClassifier:
             self.compiled_file_patterns[change_type] = [
                 re.compile(pattern, re.IGNORECASE) for pattern in patterns
             ]
-
-    def classify(self, message: str, doc: Doc, files: List[str]) -> Tuple[str, float]:
+
+    def classify(self, message: str, doc: Doc, files: list[str]) -> tuple[str, float]:
         """Classify commit change type with confidence score.
-
+
         Args:
             message: Commit message
             doc: spaCy processed document
             files: List of changed files
-
+
         Returns:
             Tuple of (change_type, confidence_score)
         """
         if not message:
-            return 'unknown', 0.0
-
+            return "unknown", 0.0
+
         # Step 1: Check for conventional commit prefixes
         prefix_result = self._check_conventional_prefix(message)
         if prefix_result:
             change_type, confidence = prefix_result
             if confidence >= self.config.min_confidence:
                 return change_type, confidence
-
+
         # Step 2: Semantic analysis of message content
         semantic_scores = self._analyze_semantic_content(message, doc)
-
+
         # Step 3: File pattern analysis
         file_scores = self._analyze_file_patterns(files)
-
+
         # Step 4: Combine scores with weights
         combined_scores = self._combine_scores(semantic_scores, file_scores)
-
+
         # Step 5: Select best match
         if not combined_scores:
-            return 'unknown', 0.0
-
+            return "unknown", 0.0
+
         best_type = max(combined_scores.keys(), key=lambda k: combined_scores[k])
         confidence = combined_scores[best_type]
-
+
         # Apply confidence threshold
         if confidence < self.config.min_confidence:
-            return 'unknown', confidence
-
+            return "unknown", confidence
+
         return best_type, confidence
-
-    def _check_conventional_prefix(self, message: str) -> Optional[Tuple[str, float]]:
+
+    def _check_conventional_prefix(self, message: str) -> Optional[tuple[str, float]]:
         """Check for conventional commit message prefixes.
-
+
         Args:
             message: Commit message
-
+
         Returns:
             Tuple of (change_type, confidence) if found, None otherwise
         """
         # Look for conventional commit format: type(scope): description
-        conventional_pattern = r'^(\w+)(?:\([^)]*\))?\s*:\s*(.+)'
+        conventional_pattern = r"^(\w+)(?:\([^)]*\))?\s*:\s*(.+)"
         match = re.match(conventional_pattern, message.strip(), re.IGNORECASE)
-
+
         if match:
             prefix = match.group(1).lower()
             if prefix in self.prefix_patterns:
                 return self.prefix_patterns[prefix], 0.9  # High confidence for explicit prefixes
-
+
         # Check for simple prefixes at start of message
         words = message.lower().split()
         if words:
-            first_word = words[0].rstrip(':').rstrip('-')
+            first_word = words[0].rstrip(":").rstrip("-")
             if first_word in self.prefix_patterns:
                 return self.prefix_patterns[first_word], 0.8
-
+
         return None
-
-    def _analyze_semantic_content(self, message: str, doc: Doc) -> Dict[str, float]:
+
+    def _analyze_semantic_content(self, message: str, doc: Doc) -> dict[str, float]:
         """Analyze semantic content of commit message.
-
+
         Args:
             message: Commit message
             doc: spaCy processed document
-
+
         Returns:
             Dictionary of change_type -> confidence_score
         """
         if not SPACY_AVAILABLE or not doc:
             # Fallback to simple keyword matching
             return self._simple_keyword_analysis(message.lower())
-
+
         # Extract semantic features from spaCy doc
         features = self._extract_semantic_features(doc)
-
+
         # Calculate similarity to each change type
         scores = {}
         for change_type, patterns in self.change_patterns.items():
             similarity = self._calculate_semantic_similarity(features, patterns)
             if similarity > 0:
                 scores[change_type] = similarity
-
+
         return scores
-
-    def _extract_semantic_features(self, doc: Doc) -> Dict[str, Set[str]]:
+
+    def _extract_semantic_features(self, doc: Doc) -> dict[str, set[str]]:
         """Extract semantic features from spaCy document.
-
+
         Args:
             doc: spaCy processed document
-
+
         Returns:
             Dictionary of feature_type -> set_of_words
         """
         features = {
-            'verbs': set(),
-            'nouns': set(),
-            'adjectives': set(),
-            'entities': set(),
-            'lemmas': set()
+            "verbs": set(),
+            "nouns": set(),
+            "adjectives": set(),
+            "entities": set(),
+            "lemmas": set(),
         }
-
+
         for token in doc:
             if token.is_stop or token.is_punct or len(token.text) < 2:
                 continue
-
+
             lemma = token.lemma_.lower()
-            features['lemmas'].add(lemma)
-
-            if token.pos_ == 'VERB':
-                features['verbs'].add(lemma)
-            elif token.pos_ in ['NOUN', 'PROPN']:
-                features['nouns'].add(lemma)
-            elif token.pos_ == 'ADJ':
-                features['adjectives'].add(lemma)
-
+            features["lemmas"].add(lemma)
+
+            if token.pos_ == "VERB":
+                features["verbs"].add(lemma)
+            elif token.pos_ in ["NOUN", "PROPN"]:
+                features["nouns"].add(lemma)
+            elif token.pos_ == "ADJ":
+                features["adjectives"].add(lemma)
+
         # Add named entities
         for ent in doc.ents:
-            features['entities'].add(ent.text.lower())
-
+            features["entities"].add(ent.text.lower())
+
         return features
-
-    def _calculate_semantic_similarity(self, features: Dict[str, Set[str]],
-                                       patterns: Dict[str, Set[str]]) -> float:
+
+    def _calculate_semantic_similarity(
+        self, features: dict[str, set[str]], patterns: dict[str, set[str]]
+    ) -> float:
         """Calculate semantic similarity between features and patterns.
-
+
         Args:
             features: Extracted semantic features
             patterns: Change type patterns
-
+
         Returns:
             Similarity score (0.0 to 1.0)
         """
         similarity_score = 0.0
-
+
         # Action words (verbs) - highest weight
-        action_matches = len(features['verbs'].intersection(patterns['action_words']))
+        action_matches = len(features["verbs"].intersection(patterns["action_words"]))
         if action_matches > 0:
             similarity_score += action_matches * 0.5
-
-        # Object words (nouns) - medium weight
-        object_matches = len(features['nouns'].intersection(patterns['object_words']))
+
+        # Object words (nouns) - medium weight
+        object_matches = len(features["nouns"].intersection(patterns["object_words"]))
         if object_matches > 0:
             similarity_score += object_matches * 0.3
-
+
         # Context words (any lemma) - lower weight
-        all_lemmas = features['lemmas']
-        context_matches = len(all_lemmas.intersection(patterns['context_words']))
+        all_lemmas = features["lemmas"]
+        context_matches = len(all_lemmas.intersection(patterns["context_words"]))
         if context_matches > 0:
             similarity_score += context_matches * 0.2
-
+
         # Normalize by maximum possible score
-        max_possible = len(patterns['action_words']) * 0.5 + \
-                       len(patterns['object_words']) * 0.3 + \
-                       len(patterns['context_words']) * 0.2
-
+        max_possible = (
+            len(patterns["action_words"]) * 0.5
+            + len(patterns["object_words"]) * 0.3
+            + len(patterns["context_words"]) * 0.2
+        )
+
         return min(1.0, similarity_score / max_possible) if max_possible > 0 else 0.0
-
-    def _simple_keyword_analysis(self, message: str) -> Dict[str, float]:
+
+    def _simple_keyword_analysis(self, message: str) -> dict[str, float]:
         """Simple keyword-based analysis fallback.
-
+
         Args:
             message: Lowercase commit message
-
+
         Returns:
             Dictionary of change_type -> confidence_score
         """
         scores = {}
-        words = set(re.findall(r'\b\w+\b', message))
-
+        words = set(re.findall(r"\b\w+\b", message))
+
         for change_type, patterns in self.change_patterns.items():
-            all_pattern_words = patterns['action_words'] | patterns['object_words'] | patterns['context_words']
+            all_pattern_words = (
+                patterns["action_words"] | patterns["object_words"] | patterns["context_words"]
+            )
             matches = len(words.intersection(all_pattern_words))
-
+
             if matches > 0:
                 # Simple scoring based on keyword matches
                 scores[change_type] = min(1.0, matches / 5.0)  # Scale to 0-1
-
+
         return scores
-
-    def _analyze_file_patterns(self, files: List[str]) -> Dict[str, float]:
+
+    def _analyze_file_patterns(self, files: list[str]) -> dict[str, float]:
         """Analyze file patterns for change type signals.
-
+
         Args:
             files: List of changed file paths
-
+
         Returns:
             Dictionary of change_type -> confidence_score
         """
         if not files:
             return {}
-
+
         scores = {}
-
+
         for change_type, patterns in self.compiled_file_patterns.items():
             matching_files = 0
-
+
             for file_path in files:
                 for pattern in patterns:
                     if pattern.search(file_path):
                         matching_files += 1
                         break  # Don't double-count same file
-
+
             if matching_files > 0:
                 # File pattern confidence based on proportion of matching files
                 confidence = min(1.0, matching_files / len(files))
                 scores[change_type] = confidence
-
+
         return scores
-
-    def _combine_scores(self, semantic_scores: Dict[str, float],
-                        file_scores: Dict[str, float]) -> Dict[str, float]:
+
+    def _combine_scores(
+        self, semantic_scores: dict[str, float], file_scores: dict[str, float]
+    ) -> dict[str, float]:
         """Combine semantic and file pattern scores.
-
+
         Args:
             semantic_scores: Scores from semantic analysis
             file_scores: Scores from file pattern analysis
-
+
         Returns:
             Combined scores dictionary
         """
         combined = {}
         all_types = set(semantic_scores.keys()) | set(file_scores.keys())
-
+
         for change_type in all_types:
             semantic_score = semantic_scores.get(change_type, 0.0)
             file_score = file_scores.get(change_type, 0.0)
-
+
             # Weighted combination
             combined_score = (
-                semantic_score * self.config.semantic_weight +
-                file_score * self.config.file_pattern_weight
+                semantic_score * self.config.semantic_weight
+                + file_score * self.config.file_pattern_weight
             )
-
+
             if combined_score > 0:
                 combined[change_type] = combined_score
-
-        return combined
+
+        return combined
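The rewritten `classify()` resolves an explicit conventional-commit prefix first (0.9 confidence, 0.8 for a bare leading keyword) and otherwise blends semantic and file-pattern scores via `config.semantic_weight` and `config.file_pattern_weight`, gated by `config.min_confidence`. For scale, the normalized semantic similarity stays small: against the new bugfix patterns (11 action, 12 object, 10 context words), one action-word hit plus one object-word hit yields (1*0.5 + 1*0.3) / (11*0.5 + 12*0.3 + 10*0.2) = 0.8 / 11.1 ≈ 0.07 before combination. A condensed, self-contained sketch of the decision flow follows; the prefix table is abbreviated and the weight and threshold values are illustrative assumptions, not the package defaults:

import re

# Condensed sketch of classify() above. PREFIX_MAP is abbreviated and the
# default weights/threshold are assumed values for illustration only.
PREFIX_MAP = {"feat": "feature", "fix": "bugfix", "perf": "refactor", "ci": "chore"}
CONVENTIONAL = re.compile(r"^(\w+)(?:\([^)]*\))?\s*:\s*(.+)", re.IGNORECASE)

def classify(
    message: str,
    semantic: dict[str, float],
    file_signal: dict[str, float],
    semantic_weight: float = 0.7,
    file_pattern_weight: float = 0.3,
    min_confidence: float = 0.5,
) -> tuple[str, float]:
    # Step 1: an explicit conventional-commit prefix wins outright.
    match = CONVENTIONAL.match(message.strip())
    if match and match.group(1).lower() in PREFIX_MAP:
        return PREFIX_MAP[match.group(1).lower()], 0.9
    # Steps 2-4: weighted blend of semantic and file-pattern scores.
    combined = {
        t: semantic.get(t, 0.0) * semantic_weight
        + file_signal.get(t, 0.0) * file_pattern_weight
        for t in set(semantic) | set(file_signal)
    }
    if not combined:
        return "unknown", 0.0
    # Step 5: best match, gated by the confidence threshold.
    best = max(combined, key=lambda t: combined[t])
    if combined[best] < min_confidence:
        return "unknown", combined[best]
    return best, combined[best]

print(classify("feat(api): add rate limiting", {}, {}))               # ('feature', 0.9)
print(classify("clean up lockfiles", {"chore": 0.6}, {"chore": 0.5}))  # ('chore', ~0.57)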