empathy-framework 5.0.1__py3-none-any.whl → 5.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (61)
  1. {empathy_framework-5.0.1.dist-info → empathy_framework-5.1.0.dist-info}/METADATA +311 -150
  2. {empathy_framework-5.0.1.dist-info → empathy_framework-5.1.0.dist-info}/RECORD +60 -33
  3. empathy_framework-5.1.0.dist-info/licenses/LICENSE +201 -0
  4. empathy_framework-5.1.0.dist-info/licenses/LICENSE_CHANGE_ANNOUNCEMENT.md +101 -0
  5. empathy_llm_toolkit/providers.py +175 -35
  6. empathy_llm_toolkit/utils/tokens.py +150 -30
  7. empathy_os/__init__.py +1 -1
  8. empathy_os/cli/commands/batch.py +256 -0
  9. empathy_os/cli/commands/cache.py +248 -0
  10. empathy_os/cli/commands/inspect.py +1 -2
  11. empathy_os/cli/commands/metrics.py +1 -1
  12. empathy_os/cli/commands/routing.py +285 -0
  13. empathy_os/cli/commands/workflow.py +2 -1
  14. empathy_os/cli/parsers/__init__.py +6 -0
  15. empathy_os/cli/parsers/batch.py +118 -0
  16. empathy_os/cli/parsers/cache 2.py +65 -0
  17. empathy_os/cli/parsers/cache.py +65 -0
  18. empathy_os/cli/parsers/routing.py +110 -0
  19. empathy_os/cli_minimal.py +3 -3
  20. empathy_os/cli_router 2.py +416 -0
  21. empathy_os/dashboard/__init__.py +1 -2
  22. empathy_os/dashboard/app 2.py +512 -0
  23. empathy_os/dashboard/app.py +1 -1
  24. empathy_os/dashboard/simple_server 2.py +403 -0
  25. empathy_os/dashboard/standalone_server 2.py +536 -0
  26. empathy_os/dashboard/standalone_server.py +22 -11
  27. empathy_os/memory/types 2.py +441 -0
  28. empathy_os/metrics/collector.py +31 -0
  29. empathy_os/models/__init__.py +19 -0
  30. empathy_os/models/adaptive_routing 2.py +437 -0
  31. empathy_os/models/auth_cli.py +444 -0
  32. empathy_os/models/auth_strategy.py +450 -0
  33. empathy_os/models/token_estimator.py +21 -13
  34. empathy_os/project_index/scanner_parallel 2.py +291 -0
  35. empathy_os/telemetry/agent_coordination 2.py +478 -0
  36. empathy_os/telemetry/agent_coordination.py +14 -16
  37. empathy_os/telemetry/agent_tracking 2.py +350 -0
  38. empathy_os/telemetry/agent_tracking.py +18 -20
  39. empathy_os/telemetry/approval_gates 2.py +563 -0
  40. empathy_os/telemetry/approval_gates.py +27 -39
  41. empathy_os/telemetry/event_streaming 2.py +405 -0
  42. empathy_os/telemetry/event_streaming.py +22 -22
  43. empathy_os/telemetry/feedback_loop 2.py +557 -0
  44. empathy_os/telemetry/feedback_loop.py +14 -17
  45. empathy_os/workflows/__init__.py +8 -0
  46. empathy_os/workflows/autonomous_test_gen.py +569 -0
  47. empathy_os/workflows/batch_processing.py +56 -10
  48. empathy_os/workflows/bug_predict.py +45 -0
  49. empathy_os/workflows/code_review.py +92 -22
  50. empathy_os/workflows/document_gen.py +594 -62
  51. empathy_os/workflows/llm_base.py +363 -0
  52. empathy_os/workflows/perf_audit.py +69 -0
  53. empathy_os/workflows/release_prep.py +54 -0
  54. empathy_os/workflows/security_audit.py +154 -79
  55. empathy_os/workflows/test_gen.py +60 -0
  56. empathy_os/workflows/test_gen_behavioral.py +477 -0
  57. empathy_os/workflows/test_gen_parallel.py +341 -0
  58. empathy_framework-5.0.1.dist-info/licenses/LICENSE +0 -139
  59. {empathy_framework-5.0.1.dist-info → empathy_framework-5.1.0.dist-info}/WHEEL +0 -0
  60. {empathy_framework-5.0.1.dist-info → empathy_framework-5.1.0.dist-info}/entry_points.txt +0 -0
  61. {empathy_framework-5.0.1.dist-info → empathy_framework-5.1.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,363 @@
+"""Base class for LLM-enhanced workflow generation.
+
+Provides reusable patterns for hybrid LLM + template generation with:
+- Smart caching for expensive operations
+- Fallback to templates when LLM fails
+- Quality validation
+- Dashboard integration
+- Cost tracking
+
+Copyright 2026 Smart-AI-Memory
+Licensed under Apache 2.0
+"""
+
+import hashlib
+import json
+import logging
+import os
+from abc import ABC, abstractmethod
+from datetime import datetime, timedelta
+from typing import Any
+
+logger = logging.getLogger(__name__)
+
+
+class LLMWorkflowGenerator(ABC):
+    """Base class for LLM-enhanced workflow generation.
+
+    Provides hybrid approach: intelligent LLM generation with fallback templates.
+
+    Usage:
+        class TestGeneratorLLM(LLMWorkflowGenerator):
+            def _generate_with_template(self, context: dict) -> str:
+                return create_template(context)
+
+            def _validate(self, result: str) -> bool:
+                return validate_python_syntax(result)
+
+        generator = TestGeneratorLLM(model_tier="capable")
+        output = generator.generate(context, prompt)
+    """
+
+    def __init__(
+        self,
+        model_tier: str = "capable",
+        enable_cache: bool = True,
+        cache_ttl_hours: int = 24,
+    ):
+        """Initialize LLM workflow generator.
+
+        Args:
+            model_tier: Model tier to use (cheap, capable, premium)
+            enable_cache: Whether to cache LLM responses
+            cache_ttl_hours: Cache time-to-live in hours
+        """
+        self.model_tier = model_tier
+        self.enable_cache = enable_cache
+        self.cache_ttl = timedelta(hours=cache_ttl_hours)
+        self._cache: dict[str, tuple[str, datetime]] = {}
+        self._stats = {
+            "llm_requests": 0,
+            "llm_failures": 0,
+            "template_fallbacks": 0,
+            "cache_hits": 0,
+            "cache_misses": 0,
+            "total_tokens": 0,
+            "total_cost_usd": 0.0,
+        }
+
+    def generate(self, context: dict[str, Any], prompt: str) -> str:
+        """Generate output with LLM, fallback to template.
+
+        Args:
+            context: Context dict for generation
+            prompt: LLM prompt
+
+        Returns:
+            Generated output (from LLM or template)
+        """
+        # Check cache first
+        if self.enable_cache:
+            cache_key = self._make_cache_key(context, prompt)
+            cached = self._get_from_cache(cache_key)
+            if cached:
+                self._stats["cache_hits"] += 1
+                logger.debug(f"Cache hit for {cache_key[:16]}...")
+                return cached
+            self._stats["cache_misses"] += 1
+
+        # Try LLM generation
+        try:
+            self._stats["llm_requests"] += 1
+            result = self._generate_with_llm(prompt)
+
+            # Validate result
+            if self._validate(result):
+                # Cache successful result
+                if self.enable_cache:
+                    self._put_in_cache(cache_key, result)
+
+                # Track tokens and cost
+                self._update_usage_stats(result)
+
+                logger.info("LLM generation successful")
+                return result
+            else:
+                logger.warning("LLM result failed validation")
+
+        except Exception as e:
+            self._stats["llm_failures"] += 1
+            logger.warning(f"LLM generation failed: {e}")
+
+        # Fallback to template
+        self._stats["template_fallbacks"] += 1
+        logger.info("Falling back to template generation")
+        return self._generate_with_template(context)
+
+    def _generate_with_llm(self, prompt: str) -> str:
+        """Generate using LLM API.
+
+        Args:
+            prompt: LLM prompt
+
+        Returns:
+            Generated content
+
+        Raises:
+            Exception: If LLM generation fails
+        """
+        try:
+            import anthropic
+        except ImportError:
+            raise ImportError("anthropic package not installed")
+
+        # Get API key
+        api_key = os.getenv("ANTHROPIC_API_KEY")
+        if not api_key:
+            raise ValueError("ANTHROPIC_API_KEY not set")
+
+        # Get model ID for tier
+        model_id = self._get_model_id(self.model_tier)
+
+        # Call Anthropic API
+        logger.debug(f"Calling LLM with {self.model_tier} tier (model: {model_id})")
+        client = anthropic.Anthropic(api_key=api_key)
+        response = client.messages.create(
+            model=model_id,
+            max_tokens=4000,
+            messages=[{"role": "user", "content": prompt}],
+        )
+
+        if not response.content:
+            raise ValueError("Empty LLM response")
+
+        result = response.content[0].text.strip()
+
+        # Clean up markdown fences if present
+        if result.startswith("```python"):
+            result = result[len("```python") :].strip()
+        elif result.startswith("```"):
+            result = result[3:].strip()
+        if result.endswith("```"):
+            result = result[:-3].strip()
+
+        return result
+
+    def _get_model_id(self, tier: str) -> str:
+        """Get model ID for tier.
+
+        Args:
+            tier: Model tier (cheap, capable, premium)
+
+        Returns:
+            Model ID string
+        """
+        from empathy_os.models.registry import get_model
+
+        model_info = get_model("anthropic", tier)
+        if not model_info:
+            raise ValueError(f"No model found for tier: {tier}")
+
+        return model_info.model_id
+
+    def _make_cache_key(self, context: dict[str, Any], prompt: str) -> str:
+        """Create cache key from context and prompt.
+
+        Args:
+            context: Context dict
+            prompt: Prompt string
+
+        Returns:
+            Cache key (hex hash)
+        """
+        # Combine context and prompt for cache key
+        cache_data = {
+            "context": context,
+            "prompt": prompt,
+            "model_tier": self.model_tier,
+        }
+        cache_json = json.dumps(cache_data, sort_keys=True)
+        return hashlib.sha256(cache_json.encode()).hexdigest()
+
+    def _get_from_cache(self, cache_key: str) -> str | None:
+        """Get item from cache if not expired.
+
+        Args:
+            cache_key: Cache key
+
+        Returns:
+            Cached value or None if not found/expired
+        """
+        if cache_key not in self._cache:
+            return None
+
+        value, timestamp = self._cache[cache_key]
+
+        # Check if expired
+        if datetime.now() - timestamp > self.cache_ttl:
+            del self._cache[cache_key]
+            return None
+
+        return value
+
+    def _put_in_cache(self, cache_key: str, value: str):
+        """Put item in cache with current timestamp.
+
+        Args:
+            cache_key: Cache key
+            value: Value to cache
+        """
+        self._cache[cache_key] = (value, datetime.now())
+
+    def _update_usage_stats(self, result: str):
+        """Update token and cost statistics.
+
+        Args:
+            result: Generated result
+        """
+        # Rough token estimate (4 chars per token)
+        estimated_tokens = len(result) // 4
+        self._stats["total_tokens"] += estimated_tokens
+
+        # Cost estimation (based on capable tier: $3/M input, $15/M output)
+        if self.model_tier == "cheap":
+            cost_per_token = 1.0 / 1_000_000  # $1/M tokens
+        elif self.model_tier == "capable":
+            cost_per_token = 15.0 / 1_000_000  # $15/M output tokens
+        elif self.model_tier == "premium":
+            cost_per_token = 75.0 / 1_000_000  # $75/M output tokens
+        else:
+            cost_per_token = 15.0 / 1_000_000
+
+        self._stats["total_cost_usd"] += estimated_tokens * cost_per_token
+
+    def get_stats(self) -> dict[str, Any]:
+        """Get generation statistics.
+
+        Returns:
+            Dict with usage stats
+        """
+        stats = self._stats.copy()
+
+        # Calculate rates
+        total_requests = stats["llm_requests"]
+        if total_requests > 0:
+            stats["llm_success_rate"] = (
+                total_requests - stats["llm_failures"]
+            ) / total_requests
+            stats["template_fallback_rate"] = stats["template_fallbacks"] / total_requests
+        else:
+            stats["llm_success_rate"] = 0.0
+            stats["template_fallback_rate"] = 0.0
+
+        # Cache performance
+        total_cache_ops = stats["cache_hits"] + stats["cache_misses"]
+        if total_cache_ops > 0:
+            stats["cache_hit_rate"] = stats["cache_hits"] / total_cache_ops
+        else:
+            stats["cache_hit_rate"] = 0.0
+
+        return stats
+
+    def clear_cache(self):
+        """Clear the cache."""
+        self._cache.clear()
+        logger.info("Cache cleared")
+
+    @abstractmethod
+    def _generate_with_template(self, context: dict[str, Any]) -> str:
+        """Generate using template fallback.
+
+        Args:
+            context: Context dict with generation data
+
+        Returns:
+            Generated output from template
+
+        Note:
+            Subclasses must implement this method.
+        """
+        raise NotImplementedError("Subclass must implement _generate_with_template")
+
+    @abstractmethod
+    def _validate(self, result: str) -> bool:
+        """Validate generated output.
+
+        Args:
+            result: Generated output to validate
+
+        Returns:
+            True if valid, False otherwise
+
+        Note:
+            Subclasses must implement this method.
+        """
+        raise NotImplementedError("Subclass must implement _validate")
+
+
+class TestGeneratorLLM(LLMWorkflowGenerator):
+    """Example LLM-enhanced test generator.
+
+    Shows how to use the base class for test generation.
+    """
+
+    def _generate_with_template(self, context: dict[str, Any]) -> str:
+        """Fallback template generation.
+
+        Args:
+            context: Must contain 'module_name', 'module_path'
+
+        Returns:
+            Template test file
+        """
+        module_name = context.get("module_name", "unknown")
+        module_path = context.get("module_path", "unknown")
+
+        return f'''"""Behavioral tests for {module_name}.
+
+Generated by template fallback.
+
+Copyright 2026 Smart-AI-Memory
+Licensed under Apache 2.0
+"""
+
+import pytest
+
+def test_{module_name}_placeholder():
+    """Placeholder test - implement actual tests."""
+    # TODO: Implement comprehensive tests
+    pass
+'''
+
+    def _validate(self, result: str) -> bool:
+        """Validate test file has basic structure.
+
+        Args:
+            result: Generated test file content
+
+        Returns:
+            True if valid test file structure
+        """
+        # Check for basic test file structure
+        required = ["import pytest", "def test_", '"""']
+        return all(req in result for req in required) and len(result) > 100
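The new llm_base.py module above is the reusable core of the 5.1.0 workflow changes: a subclass supplies only a template fallback and a validator, and the base class handles caching, the Anthropic call, validation, fallback, and cost/stats tracking. A minimal usage sketch follows, assuming only the interface shown in the hunk above; the `ChangelogGeneratorLLM` name and its template/validator logic are hypothetical illustrations, not part of the released package.

```python
from empathy_os.workflows.llm_base import LLMWorkflowGenerator


class ChangelogGeneratorLLM(LLMWorkflowGenerator):
    """Hypothetical subclass: draft a changelog entry, with a stub as fallback."""

    def _generate_with_template(self, context: dict) -> str:
        # Deterministic fallback used when the LLM call fails or its output
        # does not pass _validate().
        return f"## {context.get('version', 'unreleased')}\n\n- TODO: describe changes\n"

    def _validate(self, result: str) -> bool:
        # Accept any non-trivial markdown-looking output.
        return result.startswith("#") and len(result) > 20


# Without ANTHROPIC_API_KEY (or the anthropic package) the base class falls
# back to the template, so this sketch still runs end to end.
generator = ChangelogGeneratorLLM(model_tier="cheap", cache_ttl_hours=1)
entry = generator.generate(
    context={"version": "5.1.0"},
    prompt="Draft a changelog entry for the 5.1.0 release of empathy-framework.",
)
print(entry)
print(generator.get_stats()["cache_hit_rate"])
```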
@@ -140,18 +140,22 @@ class PerformanceAuditWorkflow(BaseWorkflow):
     def __init__(
         self,
         min_hotspots_for_premium: int = 3,
+        enable_auth_strategy: bool = True,
         **kwargs: Any,
     ):
         """Initialize performance audit workflow.
 
         Args:
             min_hotspots_for_premium: Minimum hotspots to trigger premium optimization
+            enable_auth_strategy: Enable intelligent auth routing (default: True)
             **kwargs: Additional arguments passed to BaseWorkflow
 
         """
         super().__init__(**kwargs)
         self.min_hotspots_for_premium = min_hotspots_for_premium
+        self.enable_auth_strategy = enable_auth_strategy
         self._hotspot_count: int = 0
+        self._auth_mode_used: str | None = None
 
     def should_skip_stage(self, stage_name: str, input_data: Any) -> tuple[bool, str | None]:
         """Downgrade optimize stage if few hotspots.
@@ -199,6 +203,70 @@ class PerformanceAuditWorkflow(BaseWorkflow):
         files_scanned = 0
 
         target = Path(target_path)
+
+        # === AUTH STRATEGY INTEGRATION ===
+        if self.enable_auth_strategy:
+            try:
+                import logging
+
+                from empathy_os.models import (
+                    count_lines_of_code,
+                    get_auth_strategy,
+                    get_module_size_category,
+                )
+
+                logger = logging.getLogger(__name__)
+
+                # Calculate total LOC for the project/path
+                total_lines = 0
+                if target.is_file():
+                    total_lines = count_lines_of_code(target)
+                elif target.is_dir():
+                    # Estimate total lines for directory
+                    for ext in file_types:
+                        for file_path in target.rglob(f"*{ext}"):
+                            if any(
+                                skip in str(file_path)
+                                for skip in [".git", "node_modules", "__pycache__", "venv", "test"]
+                            ):
+                                continue
+                            try:
+                                total_lines += count_lines_of_code(file_path)
+                            except Exception:
+                                pass
+
+                if total_lines > 0:
+                    strategy = get_auth_strategy()
+                    recommended_mode = strategy.get_recommended_mode(total_lines)
+                    self._auth_mode_used = recommended_mode.value
+
+                    size_category = get_module_size_category(total_lines)
+                    logger.info(
+                        f"Performance audit target: {target_path} "
+                        f"({total_lines:,} LOC, {size_category})"
+                    )
+                    logger.info(f"Recommended auth mode: {recommended_mode.value}")
+
+                    cost_estimate = strategy.estimate_cost(total_lines, recommended_mode)
+                    if recommended_mode.value == "subscription":
+                        logger.info(
+                            f"Cost estimate: ~${cost_estimate:.4f} "
+                            "(significantly cheaper with subscription)"
+                        )
+                    else:
+                        logger.info(f"Cost estimate: ~${cost_estimate:.4f} (API-based)")
+
+            except ImportError as e:
+                import logging
+
+                logger = logging.getLogger(__name__)
+                logger.debug(f"Auth strategy not available: {e}")
+            except Exception as e:
+                import logging
+
+                logger = logging.getLogger(__name__)
+                logger.warning(f"Auth strategy detection failed: {e}")
+        # === END AUTH STRATEGY INTEGRATION ===
         if target.exists():
             for ext in file_types:
                 for file_path in target.rglob(f"*{ext}"):
@@ -468,6 +536,7 @@ Provide detailed optimization strategies."""
             "perf_score": hotspot_result.get("perf_score", 0),
             "perf_level": hotspot_result.get("perf_level", "unknown"),
             "model_tier_used": tier.value,
+            "auth_mode_used": self._auth_mode_used,
         }
 
         # Merge parsed XML data if available
@@ -60,6 +60,7 @@ class ReleasePreparationWorkflow(BaseWorkflow):
         skip_approve_if_clean: bool = True,
         use_security_crew: bool = False,
         crew_config: dict | None = None,
+        enable_auth_strategy: bool = True,
         **kwargs: Any,
     ):
         """Initialize release preparation workflow.
@@ -68,6 +69,7 @@ class ReleasePreparationWorkflow(BaseWorkflow):
             skip_approve_if_clean: Skip premium approval if all checks pass
             use_security_crew: Enable SecurityAuditCrew for comprehensive security audit
             crew_config: Configuration dict for SecurityAuditCrew
+            enable_auth_strategy: Enable intelligent auth routing (default: True)
             **kwargs: Additional arguments passed to BaseWorkflow
 
         """
@@ -75,7 +77,9 @@ class ReleasePreparationWorkflow(BaseWorkflow):
         self.skip_approve_if_clean = skip_approve_if_clean
         self.use_security_crew = use_security_crew
         self.crew_config = crew_config or {}
+        self.enable_auth_strategy = enable_auth_strategy
         self._has_blockers: bool = False
+        self._auth_mode_used: str | None = None
 
         # Dynamically configure stages based on security crew setting
         if use_security_crew:
@@ -137,6 +141,52 @@ class ReleasePreparationWorkflow(BaseWorkflow):
         Executes lint, type checking, and tests.
         """
         target_path = input_data.get("path", ".")
+
+        # === AUTH STRATEGY INTEGRATION ===
+        if self.enable_auth_strategy:
+            try:
+                import logging
+                from pathlib import Path
+
+                from empathy_os.models import (
+                    count_lines_of_code,
+                    get_auth_strategy,
+                    get_module_size_category,
+                )
+                logger = logging.getLogger(__name__)
+
+                # Calculate total LOC for project/directory
+                target = Path(target_path)
+                total_lines = 0
+                if target.is_file():
+                    total_lines = count_lines_of_code(target)
+                elif target.is_dir():
+                    for py_file in target.rglob("*.py"):
+                        try:
+                            total_lines += count_lines_of_code(py_file)
+                        except Exception:
+                            pass
+
+                if total_lines > 0:
+                    strategy = get_auth_strategy()
+                    recommended_mode = strategy.get_recommended_mode(total_lines)
+                    self._auth_mode_used = recommended_mode.value
+
+                    size_category = get_module_size_category(total_lines)
+                    logger.info(f"Release prep target: {target_path} ({total_lines:,} LOC, {size_category})")
+                    logger.info(f"Recommended auth mode: {recommended_mode.value}")
+
+                    cost_estimate = strategy.estimate_cost(total_lines, recommended_mode)
+                    if recommended_mode.value == "subscription":
+                        logger.info(f"Cost: {cost_estimate['quota_cost']}")
+                    else:
+                        logger.info(f"Cost: ~${cost_estimate['monetary_cost']:.4f}")
+
+            except Exception as e:
+                import logging
+                logger = logging.getLogger(__name__)
+                logger.warning(f"Auth strategy detection failed: {e}")
+
         checks: dict[str, dict] = {}
 
         # Lint check (ruff)
@@ -640,6 +690,10 @@ Provide a comprehensive release readiness assessment."""
             "model_tier_used": tier.value,
         }
 
+        # Include auth mode used for telemetry
+        if self._auth_mode_used:
+            result["auth_mode_used"] = self._auth_mode_used
+
         # Merge parsed XML data if available
         if parsed_data.get("xml_parsed"):
             result.update(