PyPI - empathy-framework - Versions diffs - 4.7.0__py3-none-any.whl → 4.8.0__py3-none-any.whl - Mend

empathy-framework 4.7.0py3-none-any.whl → 4.8.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86) hide show

empathy_framework-4.8.0.dist-info/METADATA +753 -0
{empathy_framework-4.7.0.dist-info → empathy_framework-4.8.0.dist-info}/RECORD +83 -37
{empathy_framework-4.7.0.dist-info → empathy_framework-4.8.0.dist-info}/WHEEL +1 -1
{empathy_framework-4.7.0.dist-info → empathy_framework-4.8.0.dist-info}/entry_points.txt +2 -1
empathy_os/__init__.py +2 -0
empathy_os/cache/hash_only.py +6 -3
empathy_os/cache/hybrid.py +6 -3
empathy_os/cli/__init__.py +128 -238
empathy_os/cli/__main__.py +5 -33
empathy_os/cli/commands/__init__.py +1 -8
empathy_os/cli/commands/help.py +331 -0
empathy_os/cli/commands/info.py +140 -0
empathy_os/cli/commands/inspect.py +437 -0
empathy_os/cli/commands/metrics.py +92 -0
empathy_os/cli/commands/orchestrate.py +184 -0
empathy_os/cli/commands/patterns.py +207 -0
empathy_os/cli/commands/provider.py +93 -81
empathy_os/cli/commands/setup.py +96 -0
empathy_os/cli/commands/status.py +235 -0
empathy_os/cli/commands/sync.py +166 -0
empathy_os/cli/commands/tier.py +121 -0
empathy_os/cli/commands/workflow.py +574 -0
empathy_os/cli/parsers/__init__.py +62 -0
empathy_os/cli/parsers/help.py +41 -0
empathy_os/cli/parsers/info.py +26 -0
empathy_os/cli/parsers/inspect.py +66 -0
empathy_os/cli/parsers/metrics.py +42 -0
empathy_os/cli/parsers/orchestrate.py +61 -0
empathy_os/cli/parsers/patterns.py +54 -0
empathy_os/cli/parsers/provider.py +40 -0
empathy_os/cli/parsers/setup.py +42 -0
empathy_os/cli/parsers/status.py +47 -0
empathy_os/cli/parsers/sync.py +31 -0
empathy_os/cli/parsers/tier.py +33 -0
empathy_os/cli/parsers/workflow.py +77 -0
empathy_os/cli/utils/__init__.py +1 -0
empathy_os/cli/utils/data.py +242 -0
empathy_os/cli/utils/helpers.py +68 -0
empathy_os/{cli.py → cli_legacy.py} +27 -27
empathy_os/cli_minimal.py +662 -0
empathy_os/cli_router.py +384 -0
empathy_os/cli_unified.py +38 -2
empathy_os/memory/__init__.py +19 -5
empathy_os/memory/short_term.py +14 -404
empathy_os/memory/types.py +437 -0
empathy_os/memory/unified.py +61 -48
empathy_os/models/fallback.py +1 -1
empathy_os/models/provider_config.py +59 -344
empathy_os/models/registry.py +31 -180
empathy_os/monitoring/alerts.py +14 -20
empathy_os/monitoring/alerts_cli.py +24 -7
empathy_os/project_index/__init__.py +2 -0
empathy_os/project_index/index.py +210 -5
empathy_os/project_index/scanner.py +45 -14
empathy_os/project_index/scanner_parallel.py +291 -0
empathy_os/socratic/ab_testing.py +1 -1
empathy_os/vscode_bridge 2.py +173 -0
empathy_os/workflows/__init__.py +31 -2
empathy_os/workflows/base.py +349 -325
empathy_os/workflows/bug_predict.py +8 -0
empathy_os/workflows/builder.py +273 -0
empathy_os/workflows/caching.py +253 -0
empathy_os/workflows/code_review_pipeline.py +1 -0
empathy_os/workflows/history.py +510 -0
empathy_os/workflows/output.py +410 -0
empathy_os/workflows/perf_audit.py +125 -19
empathy_os/workflows/progress.py +324 -22
empathy_os/workflows/progressive/README 2.md +454 -0
empathy_os/workflows/progressive/__init__ 2.py +92 -0
empathy_os/workflows/progressive/cli 2.py +242 -0
empathy_os/workflows/progressive/core 2.py +488 -0
empathy_os/workflows/progressive/orchestrator 2.py +701 -0
empathy_os/workflows/progressive/reports 2.py +528 -0
empathy_os/workflows/progressive/telemetry 2.py +280 -0
empathy_os/workflows/progressive/test_gen 2.py +514 -0
empathy_os/workflows/progressive/workflow 2.py +628 -0
empathy_os/workflows/routing.py +168 -0
empathy_os/workflows/secure_release.py +1 -0
empathy_os/workflows/security_audit.py +190 -0
empathy_os/workflows/security_audit_phase3.py +328 -0
empathy_os/workflows/telemetry_mixin.py +269 -0
empathy_framework-4.7.0.dist-info/METADATA +0 -1598
empathy_os/dashboard/__init__.py +0 -15
empathy_os/dashboard/server.py +0 -941
{empathy_framework-4.7.0.dist-info → empathy_framework-4.8.0.dist-info}/licenses/LICENSE +0 -0
{empathy_framework-4.7.0.dist-info → empathy_framework-4.8.0.dist-info}/top_level.txt +0 -0

empathy_os/workflows/routing.py ADDED Viewed

@@ -0,0 +1,168 @@
+"""Tier routing strategies for workflow execution.
+Provides pluggable routing algorithms to determine which model tier
+should handle each workflow stage.
+Copyright 2025 Smart-AI-Memory
+Licensed under Fair Source License 0.9
+"""
+from __future__ import annotations
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from empathy_os.workflows.base import ModelTier
+@dataclass
+class RoutingContext:
+    """Inputs a routing strategy consults when choosing a model tier.
+    This is a plain data holder: the dataclass stores the values exactly as
+    given and performs no validation, so the value sets listed below are
+    conventions rather than enforced constraints.
+    Attributes:
+        task_type: Type of task (analyze, generate, review, etc.)
+        input_size: Estimated input tokens
+        complexity: Task complexity (simple, moderate, complex)
+        budget_remaining: Remaining budget in USD
+        latency_sensitivity: Latency requirements (low, medium, high)
+    """
+    # Field order defines the positional order of the generated __init__.
+    task_type: str
+    input_size: int
+    complexity: str  # "simple" | "moderate" | "complex"
+    budget_remaining: float
+    latency_sensitivity: str  # "low" | "medium" | "high"
+class TierRoutingStrategy(ABC):
+    """Abstract base class for tier routing strategies.
+    Subclasses implement different routing algorithms:
+    - CostOptimizedRouting: Minimize cost
+    - PerformanceOptimizedRouting: Minimize latency
+    - BalancedRouting: Balance cost and performance
+    - HybridRouting: User-configured tier mappings
+    """
+    @abstractmethod
+    def route(self, context: RoutingContext) -> ModelTier:
+        """Route task to appropriate tier.
+        Args:
+            context: Routing context with task information
+        Returns:
+            ModelTier to use for this task
+        """
+        pass
+    @abstractmethod
+    def can_fallback(self, tier: ModelTier) -> bool:
+        """Whether fallback to cheaper tier is allowed.
+        Args:
+            tier: The tier that failed or exceeded budget
+        Returns:
+            True if fallback is allowed, False otherwise
+        """
+        pass
+class CostOptimizedRouting(TierRoutingStrategy):
+    """Route to cheapest tier that can handle the task.
+    Default strategy. Prioritizes cost savings over speed.
+    Example:
+        >>> strategy = CostOptimizedRouting()
+        >>> tier = strategy.route(context)  # CHEAP for simple tasks
+    """
+    def route(self, context: RoutingContext) -> ModelTier:
+        """Route based on task complexity, preferring cheaper tiers."""
+        from empathy_os.workflows.base import ModelTier
+        if context.complexity == "simple":
+            return ModelTier.CHEAP
+        elif context.complexity == "complex":
+            return ModelTier.PREMIUM
+        return ModelTier.CAPABLE
+    def can_fallback(self, tier: ModelTier) -> bool:
+        """Allow fallback except for CHEAP tier."""
+        from empathy_os.workflows.base import ModelTier
+        return tier != ModelTier.CHEAP
+class PerformanceOptimizedRouting(TierRoutingStrategy):
+    """Route to fastest tier regardless of cost.
+    Use for latency-sensitive workflows like interactive tools.
+    Example:
+        >>> strategy = PerformanceOptimizedRouting()
+        >>> tier = strategy.route(context)  # PREMIUM for high latency sensitivity
+    """
+    def route(self, context: RoutingContext) -> ModelTier:
+        """Route based on latency requirements."""
+        from empathy_os.workflows.base import ModelTier
+        if context.latency_sensitivity == "high":
+            return ModelTier.PREMIUM
+        return ModelTier.CAPABLE
+    def can_fallback(self, tier: ModelTier) -> bool:
+        """Never fallback - performance is priority."""
+        return False
+class BalancedRouting(TierRoutingStrategy):
+    """Balance cost and performance with budget awareness.
+    Adjusts tier selection based on remaining budget and task complexity.
+    Example:
+        >>> strategy = BalancedRouting(total_budget=50.0)
+        >>> tier = strategy.route(context)  # Adapts based on budget
+    """
+    def __init__(self, total_budget: float):
+        """Initialize with total budget.
+        Args:
+            total_budget: Total budget in USD for this workflow execution
+        Raises:
+            ValueError: If total_budget is not positive
+        """
+        if total_budget <= 0:
+            raise ValueError("total_budget must be positive")
+        self.total_budget = total_budget
+    def route(self, context: RoutingContext) -> ModelTier:
+        """Route based on budget ratio and complexity."""
+        from empathy_os.workflows.base import ModelTier
+        budget_ratio = context.budget_remaining / self.total_budget
+        # Low budget - use cheap tier
+        if budget_ratio < 0.2:
+            return ModelTier.CHEAP
+        # High budget + complex task - use premium
+        if budget_ratio > 0.7 and context.complexity == "complex":
+            return ModelTier.PREMIUM
+        # Default to capable
+        return ModelTier.CAPABLE
+    def can_fallback(self, tier: ModelTier) -> bool:
+        """Allow fallback when budget-constrained."""
+        return True

empathy_os/workflows/secure_release.py CHANGED Viewed

@@ -166,6 +166,7 @@ class SecureReleasePipeline:
                 _get_crew_audit,
                 crew_report_to_workflow_format,
             )
             adapters_available = True
         except ImportError:
             adapters_available = False

empathy_os/workflows/security_audit.py CHANGED Viewed

@@ -342,11 +342,29 @@ class SecurityAuditWorkflow(BaseWorkflow):
                                     if self._is_detection_code(line_content, match.group()):
                                         continue
+                                    # Phase 2: Skip safe SQL parameterization patterns
+                                    if vuln_type == "sql_injection":
+                                        if self._is_safe_sql_parameterization(
+                                            line_content,
+                                            match.group(),
+                                            content,
+                                        ):
+                                            continue
                                     # Skip fake/test credentials
                                     if vuln_type == "hardcoded_secret":
                                         if self._is_fake_credential(match.group()):
                                             continue
+                                    # Phase 2: Skip safe random usage (tests, demos, documented)
+                                    if vuln_type == "insecure_random":
+                                        if self._is_safe_random_usage(
+                                            line_content,
+                                            file_name,
+                                            content,
+                                        ):
+                                            continue
                                     # Skip command_injection in documentation strings
                                     if vuln_type == "command_injection":
                                         if self._is_documentation_or_string(
@@ -380,6 +398,29 @@ class SecurityAuditWorkflow(BaseWorkflow):
                     except OSError:
                         continue
+        # Phase 3: Apply AST-based filtering for command injection
+        try:
+            from .security_audit_phase3 import apply_phase3_filtering
+            # Separate command injection findings
+            cmd_findings = [f for f in findings if f["type"] == "command_injection"]
+            other_findings = [f for f in findings if f["type"] != "command_injection"]
+            # Apply Phase 3 filtering to command injection
+            filtered_cmd = apply_phase3_filtering(cmd_findings)
+            # Combine back
+            findings = other_findings + filtered_cmd
+            logger.info(
+                f"Phase 3: Filtered command_injection from {len(cmd_findings)} to {len(filtered_cmd)} "
+                f"({len(cmd_findings) - len(filtered_cmd)} false positives removed)"
+            )
+        except ImportError:
+            logger.debug("Phase 3 module not available, skipping AST-based filtering")
+        except Exception as e:
+            logger.warning(f"Phase 3 filtering failed: {e}")
         input_tokens = len(str(input_data)) // 4
         output_tokens = len(str(findings)) // 4
@@ -541,6 +582,154 @@ class SecurityAuditWorkflow(BaseWorkflow):
         return False
+    def _is_safe_sql_parameterization(self, line_content: str, match_text: str, file_content: str) -> bool:
+        """Check if SQL query uses safe parameterization despite f-string usage.
+        Phase 2 Enhancement: Detects safe patterns like:
+        - placeholders = ",".join("?" * len(ids))
+        - cursor.execute(f"... IN ({placeholders})", ids)
+        This prevents false positives for the SQLite-recommended pattern
+        of building dynamic placeholder strings.
+        Args:
+            line_content: The line containing the match (may be incomplete for multi-line)
+            match_text: The matched text
+            file_content: Full file content for context analysis
+        Returns:
+            True if this is safe parameterized SQL, False otherwise
+        """
+        # Get the position of the match in the full file content
+        match_pos = file_content.find(match_text)
+        if match_pos == -1:
+            # Try to find cursor.execute
+            match_pos = file_content.find("cursor.execute")
+            if match_pos == -1:
+                return False
+        # Extract a larger context (next 200 chars after match)
+        context = file_content[match_pos:match_pos + 200]
+        # Also get lines before the match for placeholder detection
+        lines_before = file_content[:match_pos].split("\n")
+        recent_lines = lines_before[-10:] if len(lines_before) > 10 else lines_before
+        # Pattern 1: Check if this is a placeholder-based parameterized query
+        # Look for: cursor.execute(f"... IN ({placeholders})", params)
+        if "placeholders" in context or any("placeholders" in line for line in recent_lines[-5:]):
+            # Check if context has both f-string and separate parameters
+            # Pattern: f"...{placeholders}..." followed by comma and params
+            if re.search(r'f["\'][^"\']*\{placeholders\}[^"\']*["\']\s*,\s*\w+', context):
+                return True  # Safe - has separate parameters
+            # Also check if recent lines built the placeholders
+            for prev_line in reversed(recent_lines):
+                if "placeholders" in prev_line and '"?"' in prev_line and "join" in prev_line:
+                    # Found placeholder construction
+                    # Now check if the execute has separate parameters
+                    if "," in context and any(param in context for param in ["run_ids", "ids", "params", "values", ")"]):
+                        return True
+        # Pattern 2: Check if f-string only builds SQL structure with constants
+        # Example: f"SELECT * FROM {TABLE_NAME}" where TABLE_NAME is a constant
+        f_string_vars = re.findall(r'\{(\w+)\}', context)
+        if f_string_vars:
+            # Check if all variables are constants (UPPERCASE or table/column names)
+            all_constants = all(
+                var.isupper() or "TABLE" in var.upper() or "COLUMN" in var.upper()
+                for var in f_string_vars
+            )
+            if all_constants:
+                return True  # Safe - using constants, not user data
+        # Pattern 3: Check for security note comments nearby
+        # If developers added security notes, it's likely safe
+        for prev_line in reversed(recent_lines[-3:]):
+            if "security note" in prev_line.lower() and "safe" in prev_line.lower():
+                return True
+        return False
+    def _is_safe_random_usage(self, line_content: str, file_path: str, file_content: str) -> bool:
+        """Check if random usage is in a safe context (tests, simulations, non-crypto).
+        Phase 2 Enhancement: Reduces false positives for random module usage
+        in test fixtures, A/B testing simulations, and demo code.
+        Args:
+            line_content: The line containing the match
+            file_path: Path to the file being scanned
+            file_content: Full file content for context analysis
+        Returns:
+            True if random usage is safe/documented, False if potentially insecure
+        """
+        # Check if file is a test file
+        is_test = any(pattern in file_path.lower() for pattern in ["/test", "test_", "conftest"])
+        # Check for explicit security notes nearby
+        lines = file_content.split("\n")
+        line_index = None
+        for i, line in enumerate(lines):
+            if line_content.strip() in line:
+                line_index = i
+                break
+        if line_index is not None:
+            # Check 5 lines before and after for security notes
+            context_start = max(0, line_index - 5)
+            context_end = min(len(lines), line_index + 5)
+            context = "\n".join(lines[context_start:context_end]).lower()
+            # Look for clarifying comments
+            safe_indicators = [
+                "security note",
+                "not cryptographic",
+                "not for crypto",
+                "test data",
+                "demo data",
+                "simulation",
+                "reproducible",
+                "deterministic",
+                "fixed seed",
+                "not used for security",
+                "not used for secrets",
+                "not used for tokens",
+            ]
+            if any(indicator in context for indicator in safe_indicators):
+                return True  # Documented as safe
+        # Check for common safe random patterns
+        line_lower = line_content.lower()
+        # Pattern 1: Fixed seed (reproducible tests)
+        if "random.seed(" in line_lower:
+            return True  # Fixed seed is for reproducibility, not security
+        # Pattern 2: A/B testing, simulations, demos
+        safe_contexts = [
+            "simulation",
+            "demo",
+            "a/b test",
+            "ab_test",
+            "fixture",
+            "mock",
+            "example",
+            "sample",
+        ]
+        if any(context in file_path.lower() for context in safe_contexts):
+            return True
+        # If it's a test file without crypto indicators, it's probably safe
+        if is_test:
+            crypto_indicators = ["password", "secret", "token", "key", "crypto", "auth"]
+            if not any(indicator in file_path.lower() for indicator in crypto_indicators):
+                return True
+        return False
     async def _assess(self, input_data: dict, tier: ModelTier) -> tuple[dict, int, int]:
         """Risk scoring and severity classification.
@@ -674,6 +863,7 @@ class SecurityAuditWorkflow(BaseWorkflow):
         """
         try:
             from .security_adapters import _check_crew_available
             adapters_available = True
         except ImportError:
             adapters_available = False

empathy-framework 4.7.0__py3-none-any.whl → 4.8.0__py3-none-any.whl

empathy-framework 4.7.0py3-none-any.whl → 4.8.0py3-none-any.whl