PyPI - empathy-framework - Versions diffs - 4.6.6__py3-none-any.whl → 4.7.0__py3-none-any.whl - Mend

empathy-framework 4.6.6-py3-none-any.whl → 4.7.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247)

{empathy_framework-4.6.6.dist-info → empathy_framework-4.7.0.dist-info}/METADATA +7 -6
empathy_framework-4.7.0.dist-info/RECORD +354 -0
{empathy_framework-4.6.6.dist-info → empathy_framework-4.7.0.dist-info}/top_level.txt +0 -2
empathy_healthcare_plugin/monitors/monitoring/__init__.py +9 -9
empathy_llm_toolkit/agent_factory/__init__.py +6 -6
empathy_llm_toolkit/agent_factory/adapters/wizard_adapter.py +7 -10
empathy_llm_toolkit/agents_md/__init__.py +22 -0
empathy_llm_toolkit/agents_md/loader.py +218 -0
empathy_llm_toolkit/agents_md/parser.py +271 -0
empathy_llm_toolkit/agents_md/registry.py +307 -0
empathy_llm_toolkit/commands/__init__.py +51 -0
empathy_llm_toolkit/commands/context.py +375 -0
empathy_llm_toolkit/commands/loader.py +301 -0
empathy_llm_toolkit/commands/models.py +231 -0
empathy_llm_toolkit/commands/parser.py +371 -0
empathy_llm_toolkit/commands/registry.py +429 -0
empathy_llm_toolkit/config/__init__.py +8 -8
empathy_llm_toolkit/config/unified.py +3 -7
empathy_llm_toolkit/context/__init__.py +22 -0
empathy_llm_toolkit/context/compaction.py +455 -0
empathy_llm_toolkit/context/manager.py +434 -0
empathy_llm_toolkit/hooks/__init__.py +24 -0
empathy_llm_toolkit/hooks/config.py +306 -0
empathy_llm_toolkit/hooks/executor.py +289 -0
empathy_llm_toolkit/hooks/registry.py +302 -0
empathy_llm_toolkit/hooks/scripts/__init__.py +39 -0
empathy_llm_toolkit/hooks/scripts/evaluate_session.py +201 -0
empathy_llm_toolkit/hooks/scripts/first_time_init.py +285 -0
empathy_llm_toolkit/hooks/scripts/pre_compact.py +207 -0
empathy_llm_toolkit/hooks/scripts/session_end.py +183 -0
empathy_llm_toolkit/hooks/scripts/session_start.py +163 -0
empathy_llm_toolkit/hooks/scripts/suggest_compact.py +225 -0
empathy_llm_toolkit/learning/__init__.py +30 -0
empathy_llm_toolkit/learning/evaluator.py +438 -0
empathy_llm_toolkit/learning/extractor.py +514 -0
empathy_llm_toolkit/learning/storage.py +560 -0
empathy_llm_toolkit/providers.py +4 -11
empathy_llm_toolkit/security/__init__.py +17 -17
empathy_llm_toolkit/utils/tokens.py +2 -5
empathy_os/__init__.py +202 -70
empathy_os/cache_monitor.py +5 -3
empathy_os/cli/__init__.py +11 -55
empathy_os/cli/__main__.py +29 -15
empathy_os/cli/commands/inspection.py +21 -12
empathy_os/cli/commands/memory.py +4 -12
empathy_os/cli/commands/profiling.py +198 -0
empathy_os/cli/commands/utilities.py +27 -7
empathy_os/cli.py +28 -57
empathy_os/cli_unified.py +525 -1164
empathy_os/cost_tracker.py +9 -3
empathy_os/dashboard/server.py +200 -2
empathy_os/hot_reload/__init__.py +7 -7
empathy_os/hot_reload/config.py +6 -7
empathy_os/hot_reload/integration.py +35 -35
empathy_os/hot_reload/reloader.py +57 -57
empathy_os/hot_reload/watcher.py +28 -28
empathy_os/hot_reload/websocket.py +2 -2
empathy_os/memory/__init__.py +11 -4
empathy_os/memory/claude_memory.py +1 -1
empathy_os/memory/cross_session.py +8 -12
empathy_os/memory/edges.py +6 -6
empathy_os/memory/file_session.py +770 -0
empathy_os/memory/graph.py +30 -30
empathy_os/memory/nodes.py +6 -6
empathy_os/memory/short_term.py +15 -9
empathy_os/memory/unified.py +606 -140
empathy_os/meta_workflows/agent_creator.py +3 -9
empathy_os/meta_workflows/cli_meta_workflows.py +113 -53
empathy_os/meta_workflows/form_engine.py +6 -18
empathy_os/meta_workflows/intent_detector.py +64 -24
empathy_os/meta_workflows/models.py +3 -1
empathy_os/meta_workflows/pattern_learner.py +13 -31
empathy_os/meta_workflows/plan_generator.py +55 -47
empathy_os/meta_workflows/session_context.py +2 -3
empathy_os/meta_workflows/workflow.py +20 -51
empathy_os/models/cli.py +2 -2
empathy_os/models/tasks.py +1 -2
empathy_os/models/telemetry.py +4 -1
empathy_os/models/token_estimator.py +3 -1
empathy_os/monitoring/alerts.py +938 -9
empathy_os/monitoring/alerts_cli.py +346 -183
empathy_os/orchestration/execution_strategies.py +12 -29
empathy_os/orchestration/pattern_learner.py +20 -26
empathy_os/orchestration/real_tools.py +6 -15
empathy_os/platform_utils.py +2 -1
empathy_os/plugins/__init__.py +2 -2
empathy_os/plugins/base.py +64 -64
empathy_os/plugins/registry.py +32 -32
empathy_os/project_index/index.py +49 -15
empathy_os/project_index/models.py +1 -2
empathy_os/project_index/reports.py +1 -1
empathy_os/project_index/scanner.py +1 -0
empathy_os/redis_memory.py +10 -7
empathy_os/resilience/__init__.py +1 -1
empathy_os/resilience/health.py +10 -10
empathy_os/routing/__init__.py +7 -7
empathy_os/routing/chain_executor.py +37 -37
empathy_os/routing/classifier.py +36 -36
empathy_os/routing/smart_router.py +40 -40
empathy_os/routing/{wizard_registry.py → workflow_registry.py} +47 -47
empathy_os/scaffolding/__init__.py +8 -8
empathy_os/scaffolding/__main__.py +1 -1
empathy_os/scaffolding/cli.py +28 -28
empathy_os/socratic/__init__.py +3 -19
empathy_os/socratic/ab_testing.py +25 -36
empathy_os/socratic/blueprint.py +38 -38
empathy_os/socratic/cli.py +34 -20
empathy_os/socratic/collaboration.py +30 -28
empathy_os/socratic/domain_templates.py +9 -1
empathy_os/socratic/embeddings.py +17 -13
empathy_os/socratic/engine.py +135 -70
empathy_os/socratic/explainer.py +70 -60
empathy_os/socratic/feedback.py +24 -19
empathy_os/socratic/forms.py +15 -10
empathy_os/socratic/generator.py +51 -35
empathy_os/socratic/llm_analyzer.py +25 -23
empathy_os/socratic/mcp_server.py +99 -159
empathy_os/socratic/session.py +19 -13
empathy_os/socratic/storage.py +98 -67
empathy_os/socratic/success.py +38 -27
empathy_os/socratic/visual_editor.py +51 -39
empathy_os/socratic/web_ui.py +99 -66
empathy_os/telemetry/cli.py +3 -1
empathy_os/telemetry/usage_tracker.py +1 -3
empathy_os/test_generator/__init__.py +3 -3
empathy_os/test_generator/cli.py +28 -28
empathy_os/test_generator/generator.py +64 -66
empathy_os/test_generator/risk_analyzer.py +11 -11
empathy_os/vscode_bridge.py +173 -0
empathy_os/workflows/__init__.py +212 -120
empathy_os/workflows/batch_processing.py +8 -24
empathy_os/workflows/bug_predict.py +1 -1
empathy_os/workflows/code_review.py +20 -5
empathy_os/workflows/code_review_pipeline.py +13 -8
empathy_os/workflows/keyboard_shortcuts/workflow.py +6 -2
empathy_os/workflows/manage_documentation.py +1 -0
empathy_os/workflows/orchestrated_health_check.py +6 -11
empathy_os/workflows/orchestrated_release_prep.py +3 -3
empathy_os/workflows/pr_review.py +18 -10
empathy_os/workflows/progressive/__init__.py +2 -12
empathy_os/workflows/progressive/cli.py +14 -37
empathy_os/workflows/progressive/core.py +12 -12
empathy_os/workflows/progressive/orchestrator.py +166 -144
empathy_os/workflows/progressive/reports.py +22 -31
empathy_os/workflows/progressive/telemetry.py +8 -14
empathy_os/workflows/progressive/test_gen.py +29 -48
empathy_os/workflows/progressive/workflow.py +31 -70
empathy_os/workflows/release_prep.py +21 -6
empathy_os/workflows/release_prep_crew.py +1 -0
empathy_os/workflows/secure_release.py +13 -6
empathy_os/workflows/security_audit.py +8 -3
empathy_os/workflows/test_coverage_boost_crew.py +3 -2
empathy_os/workflows/test_maintenance_crew.py +1 -0
empathy_os/workflows/test_runner.py +16 -12
empathy_software_plugin/SOFTWARE_PLUGIN_README.md +25 -703
empathy_software_plugin/cli.py +0 -122
coach_wizards/__init__.py +0 -45
coach_wizards/accessibility_wizard.py +0 -91
coach_wizards/api_wizard.py +0 -91
coach_wizards/base_wizard.py +0 -209
coach_wizards/cicd_wizard.py +0 -91
coach_wizards/code_reviewer_README.md +0 -60
coach_wizards/code_reviewer_wizard.py +0 -180
coach_wizards/compliance_wizard.py +0 -91
coach_wizards/database_wizard.py +0 -91
coach_wizards/debugging_wizard.py +0 -91
coach_wizards/documentation_wizard.py +0 -91
coach_wizards/generate_wizards.py +0 -347
coach_wizards/localization_wizard.py +0 -173
coach_wizards/migration_wizard.py +0 -91
coach_wizards/monitoring_wizard.py +0 -91
coach_wizards/observability_wizard.py +0 -91
coach_wizards/performance_wizard.py +0 -91
coach_wizards/prompt_engineering_wizard.py +0 -661
coach_wizards/refactoring_wizard.py +0 -91
coach_wizards/scaling_wizard.py +0 -90
coach_wizards/security_wizard.py +0 -92
coach_wizards/testing_wizard.py +0 -91
empathy_framework-4.6.6.dist-info/RECORD +0 -410
empathy_llm_toolkit/wizards/__init__.py +0 -43
empathy_llm_toolkit/wizards/base_wizard.py +0 -364
empathy_llm_toolkit/wizards/customer_support_wizard.py +0 -190
empathy_llm_toolkit/wizards/healthcare_wizard.py +0 -378
empathy_llm_toolkit/wizards/patient_assessment_README.md +0 -64
empathy_llm_toolkit/wizards/patient_assessment_wizard.py +0 -193
empathy_llm_toolkit/wizards/technology_wizard.py +0 -209
empathy_os/wizard_factory_cli.py +0 -170
empathy_software_plugin/wizards/__init__.py +0 -42
empathy_software_plugin/wizards/advanced_debugging_wizard.py +0 -395
empathy_software_plugin/wizards/agent_orchestration_wizard.py +0 -511
empathy_software_plugin/wizards/ai_collaboration_wizard.py +0 -503
empathy_software_plugin/wizards/ai_context_wizard.py +0 -441
empathy_software_plugin/wizards/ai_documentation_wizard.py +0 -503
empathy_software_plugin/wizards/base_wizard.py +0 -288
empathy_software_plugin/wizards/book_chapter_wizard.py +0 -519
empathy_software_plugin/wizards/code_review_wizard.py +0 -604
empathy_software_plugin/wizards/debugging/__init__.py +0 -50
empathy_software_plugin/wizards/debugging/bug_risk_analyzer.py +0 -414
empathy_software_plugin/wizards/debugging/config_loaders.py +0 -446
empathy_software_plugin/wizards/debugging/fix_applier.py +0 -469
empathy_software_plugin/wizards/debugging/language_patterns.py +0 -385
empathy_software_plugin/wizards/debugging/linter_parsers.py +0 -470
empathy_software_plugin/wizards/debugging/verification.py +0 -369
empathy_software_plugin/wizards/enhanced_testing_wizard.py +0 -537
empathy_software_plugin/wizards/memory_enhanced_debugging_wizard.py +0 -816
empathy_software_plugin/wizards/multi_model_wizard.py +0 -501
empathy_software_plugin/wizards/pattern_extraction_wizard.py +0 -422
empathy_software_plugin/wizards/pattern_retriever_wizard.py +0 -400
empathy_software_plugin/wizards/performance/__init__.py +0 -9
empathy_software_plugin/wizards/performance/bottleneck_detector.py +0 -221
empathy_software_plugin/wizards/performance/profiler_parsers.py +0 -278
empathy_software_plugin/wizards/performance/trajectory_analyzer.py +0 -429
empathy_software_plugin/wizards/performance_profiling_wizard.py +0 -305
empathy_software_plugin/wizards/prompt_engineering_wizard.py +0 -425
empathy_software_plugin/wizards/rag_pattern_wizard.py +0 -461
empathy_software_plugin/wizards/security/__init__.py +0 -32
empathy_software_plugin/wizards/security/exploit_analyzer.py +0 -290
empathy_software_plugin/wizards/security/owasp_patterns.py +0 -241
empathy_software_plugin/wizards/security/vulnerability_scanner.py +0 -604
empathy_software_plugin/wizards/security_analysis_wizard.py +0 -322
empathy_software_plugin/wizards/security_learning_wizard.py +0 -740
empathy_software_plugin/wizards/tech_debt_wizard.py +0 -726
empathy_software_plugin/wizards/testing/__init__.py +0 -27
empathy_software_plugin/wizards/testing/coverage_analyzer.py +0 -459
empathy_software_plugin/wizards/testing/quality_analyzer.py +0 -525
empathy_software_plugin/wizards/testing/test_suggester.py +0 -533
empathy_software_plugin/wizards/testing_wizard.py +0 -274
wizards/__init__.py +0 -82
wizards/admission_assessment_wizard.py +0 -644
wizards/care_plan.py +0 -321
wizards/clinical_assessment.py +0 -769
wizards/discharge_planning.py +0 -77
wizards/discharge_summary_wizard.py +0 -468
wizards/dosage_calculation.py +0 -497
wizards/incident_report_wizard.py +0 -454
wizards/medication_reconciliation.py +0 -85
wizards/nursing_assessment.py +0 -171
wizards/patient_education.py +0 -654
wizards/quality_improvement.py +0 -705
wizards/sbar_report.py +0 -324
wizards/sbar_wizard.py +0 -608
wizards/shift_handoff_wizard.py +0 -535
wizards/soap_note_wizard.py +0 -679
wizards/treatment_plan.py +0 -15
{empathy_framework-4.6.6.dist-info → empathy_framework-4.7.0.dist-info}/WHEEL +0 -0
{empathy_framework-4.6.6.dist-info → empathy_framework-4.7.0.dist-info}/entry_points.txt +0 -0
{empathy_framework-4.6.6.dist-info → empathy_framework-4.7.0.dist-info}/licenses/LICENSE +0 -0

empathy_os/workflows/progressive/orchestrator.py CHANGED Viewed

@@ -11,11 +11,7 @@ The MetaOrchestrator is responsible for:
 import logging
 from typing import Any
-from empathy_os.workflows.progressive.core import (
-    EscalationConfig,
-    Tier,
-    TierResult,
-)
+from empathy_os.workflows.progressive.core import EscalationConfig, Tier, TierResult
 logger = logging.getLogger(__name__)
@@ -50,15 +46,11 @@ class MetaOrchestrator:
         self.tier_history: dict[Tier, list[float]] = {
             Tier.CHEAP: [],
             Tier.CAPABLE: [],
-            Tier.PREMIUM: []
+            Tier.PREMIUM: [],
         }
     def should_escalate(
-        self,
-        tier: Tier,
-        result: TierResult,
-        attempt: int,
-        config: EscalationConfig
+        self, tier: Tier, result: TierResult, attempt: int, config: EscalationConfig
     ) -> tuple[bool, str]:
         """Determine if tier should escalate to next tier.
@@ -104,9 +96,7 @@ class MetaOrchestrator:
             return False, "Premium tier is final"
     def _check_cheap_escalation(
-        self,
-        result: TierResult,
-        config: EscalationConfig
+        self, result: TierResult, config: EscalationConfig
     ) -> tuple[bool, str]:
         """Check if cheap tier should escalate to capable.
@@ -127,24 +117,30 @@ class MetaOrchestrator:
         # Check syntax errors (prioritize over CQS)
         if syntax_error_count > config.cheap_to_capable_max_syntax_errors:
-            return True, f"{syntax_error_count} syntax errors exceeds limit {config.cheap_to_capable_max_syntax_errors}"
+            return (
+                True,
+                f"{syntax_error_count} syntax errors exceeds limit {config.cheap_to_capable_max_syntax_errors}",
+            )
         # Check failure rate
         if failure_rate > config.cheap_to_capable_failure_rate:
-            return True, f"Failure rate {failure_rate:.1%} exceeds threshold {config.cheap_to_capable_failure_rate:.1%}"
+            return (
+                True,
+                f"Failure rate {failure_rate:.1%} exceeds threshold {config.cheap_to_capable_failure_rate:.1%}",
+            )
         # Check CQS threshold
         if cqs < config.cheap_to_capable_min_cqs:
-            return True, f"Quality score {cqs:.1f} below threshold {config.cheap_to_capable_min_cqs}"
+            return (
+                True,
+                f"Quality score {cqs:.1f} below threshold {config.cheap_to_capable_min_cqs}",
+            )
         # All checks passed, no escalation needed
         return False, f"Quality acceptable (CQS={cqs:.1f})"
     def _check_capable_escalation(
-        self,
-        result: TierResult,
-        attempt: int,
-        config: EscalationConfig
+        self, result: TierResult, attempt: int, config: EscalationConfig
     ) -> tuple[bool, str]:
         """Check if capable tier should escalate to premium.
@@ -165,15 +161,24 @@ class MetaOrchestrator:
         # Check max attempts first
         if attempt >= config.capable_max_attempts:
-            return True, f"Max attempts ({config.capable_max_attempts}) reached without achieving target quality"
+            return (
+                True,
+                f"Max attempts ({config.capable_max_attempts}) reached without achieving target quality",
+            )
         # Check syntax errors (strict for capable tier)
         if syntax_error_count > config.capable_to_premium_max_syntax_errors:
-            return True, f"{syntax_error_count} syntax errors exceeds limit {config.capable_to_premium_max_syntax_errors}"
+            return (
+                True,
+                f"{syntax_error_count} syntax errors exceeds limit {config.capable_to_premium_max_syntax_errors}",
+            )
         # Check failure rate
         if failure_rate > config.capable_to_premium_failure_rate:
-            return True, f"Failure rate {failure_rate:.1%} exceeds threshold {config.capable_to_premium_failure_rate:.1%}"
+            return (
+                True,
+                f"Failure rate {failure_rate:.1%} exceeds threshold {config.capable_to_premium_failure_rate:.1%}",
+            )
         # Check stagnation (consecutive runs with <5% improvement)
         # Only check if we have enough history
@@ -181,7 +186,7 @@ class MetaOrchestrator:
             is_stagnant, stagnation_reason = self._detect_stagnation(
                 self.tier_history[Tier.CAPABLE],
                 config.improvement_threshold,
-                config.consecutive_stagnation_limit
+                config.consecutive_stagnation_limit,
             )
             if is_stagnant:
@@ -189,16 +194,16 @@ class MetaOrchestrator:
         # Check CQS threshold (after stagnation check)
         if cqs < config.capable_to_premium_min_cqs and attempt >= config.capable_min_attempts:
-            return True, f"Quality score {cqs:.1f} below threshold {config.capable_to_premium_min_cqs}"
+            return (
+                True,
+                f"Quality score {cqs:.1f} below threshold {config.capable_to_premium_min_cqs}",
+            )
         # No escalation needed
         return False, f"Quality acceptable (CQS={cqs:.1f}), continuing improvement"
     def _detect_stagnation(
-        self,
-        cqs_history: list[float],
-        improvement_threshold: float,
-        consecutive_limit: int
+        self, cqs_history: list[float], improvement_threshold: float, consecutive_limit: int
     ) -> tuple[bool, str]:
         """Detect if improvement has stagnated.
@@ -246,10 +251,7 @@ class MetaOrchestrator:
         return False, "No stagnation detected"
     def build_tier_prompt(
-        self,
-        tier: Tier,
-        base_task: str,
-        failure_context: dict[str, Any] | None = None
+        self, tier: Tier, base_task: str, failure_context: dict[str, Any] | None = None
     ) -> str:
         """Build XML-enhanced prompt with failure context.
@@ -304,11 +306,7 @@ class MetaOrchestrator:
   </instructions>
 </task>"""
-    def _build_capable_prompt(
-        self,
-        base_task: str,
-        failure_context: dict[str, Any] | None
-    ) -> str:
+    def _build_capable_prompt(self, base_task: str, failure_context: dict[str, Any] | None) -> str:
         """Build enhanced prompt for capable tier with failure context.
         Args:
@@ -359,12 +357,14 @@ class MetaOrchestrator:
         # Add failure pattern analysis
         if failure_patterns:
             prompt_parts.append("    <failure_analysis>")
-            prompt_parts.append(f"      <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>")
+            prompt_parts.append(
+                f"      <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>"
+            )
             prompt_parts.append("      <patterns>")
             error_types = failure_patterns.get("error_types", {})
             for error_type, count in sorted(error_types.items(), key=lambda x: -x[1]):
-                prompt_parts.append(f"        <pattern type=\"{error_type}\" count=\"{count}\" />")
+                prompt_parts.append(f'        <pattern type="{error_type}" count="{count}" />')
             prompt_parts.append("      </patterns>")
@@ -382,68 +382,74 @@ class MetaOrchestrator:
                 error = example.get("error", "Unknown error")
                 code_snippet = example.get("code", "")[:200]  # Limit snippet length
-                prompt_parts.append(f"      <example number=\"{i}\">")
+                prompt_parts.append(f'      <example number="{i}">')
                 prompt_parts.append(f"        <error>{self._escape_xml(error)}</error>")
                 if code_snippet:
-                    prompt_parts.append(f"        <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>")
+                    prompt_parts.append(
+                        f"        <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>"
+                    )
                 prompt_parts.append("      </example>")
             prompt_parts.append("    </failed_attempts>")
             prompt_parts.append("")
-        prompt_parts.extend([
-            "    <improvement_needed>",
-            "      The cheap tier struggled with these items. Analyze the failure",
-            "      patterns above and generate improved solutions that specifically",
-            "      address these issues.",
-            "    </improvement_needed>",
-            "  </context_from_previous_tier>",
-            "",
-            "  <your_task>",
-            "    Generate improved output that avoids the specific failure patterns identified above.",
-            "",
-            "    <quality_requirements>",
-            "      <pass_rate>80%+</pass_rate>",
-            "      <coverage>70%+</coverage>",
-            "      <quality_score>80+</quality_score>",
-            "    </quality_requirements>",
-            "",
-            "    <focus_areas>",
-        ])
+        prompt_parts.extend(
+            [
+                "    <improvement_needed>",
+                "      The cheap tier struggled with these items. Analyze the failure",
+                "      patterns above and generate improved solutions that specifically",
+                "      address these issues.",
+                "    </improvement_needed>",
+                "  </context_from_previous_tier>",
+                "",
+                "  <your_task>",
+                "    Generate improved output that avoids the specific failure patterns identified above.",
+                "",
+                "    <quality_requirements>",
+                "      <pass_rate>80%+</pass_rate>",
+                "      <coverage>70%+</coverage>",
+                "      <quality_score>80+</quality_score>",
+                "    </quality_requirements>",
+                "",
+                "    <focus_areas>",
+            ]
+        )
         # Add targeted focus areas based on failure patterns
         if failure_patterns:
             error_types = failure_patterns.get("error_types", {})
             if "async_errors" in error_types:
-                prompt_parts.append("      <focus area=\"async\">Proper async/await patterns and error handling</focus>")
+                prompt_parts.append(
+                    '      <focus area="async">Proper async/await patterns and error handling</focus>'
+                )
             if "mocking_errors" in error_types:
-                prompt_parts.append("      <focus area=\"mocking\">Correct mock setup and teardown</focus>")
+                prompt_parts.append(
+                    '      <focus area="mocking">Correct mock setup and teardown</focus>'
+                )
             if "syntax_errors" in error_types:
-                prompt_parts.append("      <focus area=\"syntax\">Valid Python syntax and imports</focus>")
+                prompt_parts.append(
+                    '      <focus area="syntax">Valid Python syntax and imports</focus>'
+                )
             if "other_errors" in error_types:
-                prompt_parts.append("      <focus area=\"general\">Edge cases and error handling</focus>")
+                prompt_parts.append(
+                    '      <focus area="general">Edge cases and error handling</focus>'
+                )
         else:
             # Default focus areas
-            prompt_parts.extend([
-                "      <focus area=\"syntax\">Correct syntax and structure</focus>",
-                "      <focus area=\"coverage\">Comprehensive test coverage</focus>",
-                "      <focus area=\"errors\">Proper error handling</focus>",
-                "      <focus area=\"edge_cases\">Edge case coverage</focus>",
-            ])
-        prompt_parts.extend([
-            "    </focus_areas>",
-            "  </your_task>",
-            "</task>"
-        ])
+            prompt_parts.extend(
+                [
+                    '      <focus area="syntax">Correct syntax and structure</focus>',
+                    '      <focus area="coverage">Comprehensive test coverage</focus>',
+                    '      <focus area="errors">Proper error handling</focus>',
+                    '      <focus area="edge_cases">Edge case coverage</focus>',
+                ]
+            )
+        prompt_parts.extend(["    </focus_areas>", "  </your_task>", "</task>"])
         return "\n".join(prompt_parts)
-    def _build_premium_prompt(
-        self,
-        base_task: str,
-        failure_context: dict[str, Any] | None
-    ) -> str:
+    def _build_premium_prompt(self, base_task: str, failure_context: dict[str, Any] | None) -> str:
         """Build comprehensive prompt for premium tier.
         Args:
@@ -503,25 +509,35 @@ class MetaOrchestrator:
         # Add detailed failure analysis
         if failure_patterns:
             prompt_parts.append("    <persistent_issues>")
-            prompt_parts.append(f"      <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>")
+            prompt_parts.append(
+                f"      <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>"
+            )
             prompt_parts.append("      <failure_patterns>")
             error_types = failure_patterns.get("error_types", {})
             for error_type, count in sorted(error_types.items(), key=lambda x: -x[1]):
-                prompt_parts.append(f"        <pattern type=\"{error_type}\" count=\"{count}\">")
+                prompt_parts.append(f'        <pattern type="{error_type}" count="{count}">')
                 # Add specific guidance per error type
                 if error_type == "async_errors":
-                    prompt_parts.append("          <guidance>Use proper async/await patterns, handle timeouts correctly</guidance>")
+                    prompt_parts.append(
+                        "          <guidance>Use proper async/await patterns, handle timeouts correctly</guidance>"
+                    )
                 elif error_type == "mocking_errors":
-                    prompt_parts.append("          <guidance>Ensure mocks are properly configured and reset</guidance>")
+                    prompt_parts.append(
+                        "          <guidance>Ensure mocks are properly configured and reset</guidance>"
+                    )
                 elif error_type == "syntax_errors":
-                    prompt_parts.append("          <guidance>Double-check syntax, imports, and type annotations</guidance>")
+                    prompt_parts.append(
+                        "          <guidance>Double-check syntax, imports, and type annotations</guidance>"
+                    )
                 prompt_parts.append("        </pattern>")
             prompt_parts.append("      </failure_patterns>")
-            prompt_parts.append(f"      <primary_issue>{failure_patterns.get('primary_issue', 'unknown')}</primary_issue>")
+            prompt_parts.append(
+                f"      <primary_issue>{failure_patterns.get('primary_issue', 'unknown')}</primary_issue>"
+            )
             prompt_parts.append("    </persistent_issues>")
             prompt_parts.append("")
@@ -535,67 +551,77 @@ class MetaOrchestrator:
                 code_snippet = example.get("code", "")[:300]  # More context for premium
                 quality_score = example.get("quality_score", 0)
-                prompt_parts.append(f"      <attempt number=\"{i}\" quality_score=\"{quality_score}\">")
+                prompt_parts.append(f'      <attempt number="{i}" quality_score="{quality_score}">')
                 prompt_parts.append(f"        <error>{self._escape_xml(error)}</error>")
                 if code_snippet:
-                    prompt_parts.append(f"        <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>")
+                    prompt_parts.append(
+                        f"        <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>"
+                    )
                 prompt_parts.append("      </attempt>")
             prompt_parts.append("    </capable_tier_attempts>")
             prompt_parts.append("")
-        prompt_parts.extend([
-            "  </escalation_context>",
-            "",
-            "  <expert_task>",
-            "    <critical_notice>",
-            "      You are the FINAL tier in the progressive escalation system.",
-            "      Previous tiers (cheap and capable) have attempted this task",
-            "      multiple times and could not achieve the required quality.",
-            "",
-            "      This is the last automated attempt before human review.",
-            "      Excellence is not optional - it is required.",
-            "    </critical_notice>",
-            "",
-            "    <expert_techniques>",
-            "      Apply sophisticated approaches:",
-            "      - Deep analysis of why previous attempts failed",
-            "      - Production-grade error handling and edge cases",
-            "      - Comprehensive documentation and clarity",
-            "      - Defensive programming against subtle bugs",
-        ])
+        prompt_parts.extend(
+            [
+                "  </escalation_context>",
+                "",
+                "  <expert_task>",
+                "    <critical_notice>",
+                "      You are the FINAL tier in the progressive escalation system.",
+                "      Previous tiers (cheap and capable) have attempted this task",
+                "      multiple times and could not achieve the required quality.",
+                "",
+                "      This is the last automated attempt before human review.",
+                "      Excellence is not optional - it is required.",
+                "    </critical_notice>",
+                "",
+                "    <expert_techniques>",
+                "      Apply sophisticated approaches:",
+                "      - Deep analysis of why previous attempts failed",
+                "      - Production-grade error handling and edge cases",
+                "      - Comprehensive documentation and clarity",
+                "      - Defensive programming against subtle bugs",
+            ]
+        )
         # Add specific techniques based on failure patterns
         if failure_patterns:
             error_types = failure_patterns.get("error_types", {})
             if "async_errors" in error_types:
-                prompt_parts.append("      - Advanced async patterns (asyncio.gather, proper timeouts)")
+                prompt_parts.append(
+                    "      - Advanced async patterns (asyncio.gather, proper timeouts)"
+                )
             if "mocking_errors" in error_types:
-                prompt_parts.append("      - Sophisticated mocking (pytest fixtures, proper lifecycle)")
+                prompt_parts.append(
+                    "      - Sophisticated mocking (pytest fixtures, proper lifecycle)"
+                )
             if "syntax_errors" in error_types:
                 prompt_parts.append("      - Rigorous syntax validation before submission")
-        prompt_parts.extend([
-            "    </expert_techniques>",
-            "",
-            "    <quality_requirements>",
-            "      <pass_rate>95%+</pass_rate>",
-            "      <coverage>85%+</coverage>",
-            "      <quality_score>95+</quality_score>",
-            "      <zero_syntax_errors>MANDATORY</zero_syntax_errors>",
-            "    </quality_requirements>",
-            "",
-            "    <success_criteria>",
-            "      Your implementation must:",
-            "      1. Address ALL failure patterns identified above",
-            "      2. Achieve exceptional quality scores (95+)",
-            "      3. Have zero syntax errors or runtime failures",
-            "      4. Include comprehensive edge case coverage",
-            "      5. Be production-ready with proper documentation",
-            "    </success_criteria>",
-            "  </expert_task>",
-            "</task>"
-        ])
+        prompt_parts.extend(
+            [
+                "    </expert_techniques>",
+                "",
+                "    <quality_requirements>",
+                "      <pass_rate>95%+</pass_rate>",
+                "      <coverage>85%+</coverage>",
+                "      <quality_score>95+</quality_score>",
+                "      <zero_syntax_errors>MANDATORY</zero_syntax_errors>",
+                "    </quality_requirements>",
+                "",
+                "    <success_criteria>",
+                "      Your implementation must:",
+                "      1. Address ALL failure patterns identified above",
+                "      2. Achieve exceptional quality scores (95+)",
+                "      3. Have zero syntax errors or runtime failures",
+                "      4. Include comprehensive edge case coverage",
+                "      5. Be production-ready with proper documentation",
+                "    </success_criteria>",
+                "  </expert_task>",
+                "</task>",
+            ]
+        )
         return "\n".join(prompt_parts)
@@ -613,8 +639,7 @@ class MetaOrchestrator:
             'Error: &lt;missing&gt;'
         """
         return (
-            text
-            .replace("&", "&amp;")
+            text.replace("&", "&amp;")
             .replace("<", "&lt;")
             .replace(">", "&gt;")
             .replace('"', "&quot;")
@@ -622,9 +647,7 @@ class MetaOrchestrator:
         )
     def create_agent_team(
-        self,
-        tier: Tier,
-        failure_context: dict[str, Any] | None = None
+        self, tier: Tier, failure_context: dict[str, Any] | None = None
     ) -> list[str]:
         """Create specialized agent team for tier.
@@ -658,10 +681,7 @@ class MetaOrchestrator:
         else:  # PREMIUM
             return ["generator", "analyzer", "reviewer"]
-    def analyze_failure_patterns(
-        self,
-        failures: list[dict[str, Any]]
-    ) -> dict[str, Any]:
+    def analyze_failure_patterns(self, failures: list[dict[str, Any]]) -> dict[str, Any]:
         """Analyze failure patterns to inform next tier.
         Groups failures by type and identifies common issues.
@@ -697,5 +717,7 @@ class MetaOrchestrator:
         return {
             "total_failures": len(failures),
             "error_types": error_types,
-            "primary_issue": max(error_types.items(), key=lambda x: x[1])[0] if error_types else "unknown"
+            "primary_issue": (
+                max(error_types.items(), key=lambda x: x[1])[0] if error_types else "unknown"
+            ),
         }

empathy_os/workflows/progressive/reports.py CHANGED Viewed

@@ -13,10 +13,7 @@ from pathlib import Path
 from typing import Any
 from empathy_os.config import _validate_file_path
-from empathy_os.workflows.progressive.core import (
-    ProgressiveWorkflowResult,
-    Tier,
-)
+from empathy_os.workflows.progressive.core import ProgressiveWorkflowResult, Tier
 logger = logging.getLogger(__name__)
@@ -61,7 +58,9 @@ def generate_progression_report(result: ProgressiveWorkflowResult) -> str:
     # Cost savings
     if result.cost_savings > 0:
-        report.append(f"Cost Savings: ${result.cost_savings:.2f} ({result.cost_savings_percent:.0f}% vs all-Premium)")
+        report.append(
+            f"Cost Savings: ${result.cost_savings:.2f} ({result.cost_savings_percent:.0f}% vs all-Premium)"
+        )
         report.append("")
     report.append("TIER BREAKDOWN:")
@@ -69,11 +68,7 @@ def generate_progression_report(result: ProgressiveWorkflowResult) -> str:
     # Tier-by-tier breakdown
     for tier_result in result.tier_results:
-        tier_emoji = {
-            Tier.CHEAP: "💰",
-            Tier.CAPABLE: "📊",
-            Tier.PREMIUM: "💎"
-        }[tier_result.tier]
+        tier_emoji = {Tier.CHEAP: "💰", Tier.CAPABLE: "📊", Tier.PREMIUM: "💎"}[tier_result.tier]
         report.append(f"{tier_emoji} {tier_result.tier.value.upper()} Tier ({tier_result.model})")
         report.append(f"   • Items: {len(tier_result.generated_items)}")
@@ -147,14 +142,16 @@ def save_results_to_disk(result: ProgressiveWorkflowResult, storage_path: str) -
         summary = {
             "workflow": result.workflow_name,
             "task_id": result.task_id,
-            "timestamp": result.tier_results[0].timestamp.isoformat() if result.tier_results else None,
+            "timestamp": (
+                result.tier_results[0].timestamp.isoformat() if result.tier_results else None
+            ),
             "total_cost": result.total_cost,
             "total_duration": result.total_duration,
             "cost_savings": result.cost_savings,
             "cost_savings_percent": result.cost_savings_percent,
             "success": result.success,
             "tier_count": len(result.tier_results),
-            "final_cqs": result.final_result.quality_score if result.final_result else 0
+            "final_cqs": result.final_result.quality_score if result.final_result else 0,
         }
         summary_file = validated_dir / "summary.json"
@@ -179,9 +176,9 @@ def save_results_to_disk(result: ProgressiveWorkflowResult, storage_path: str) -
                     "test_pass_rate": tier_result.failure_analysis.test_pass_rate,
                     "coverage": tier_result.failure_analysis.coverage_percent,
                     "assertion_depth": tier_result.failure_analysis.assertion_depth,
-                    "confidence": tier_result.failure_analysis.confidence_score
+                    "confidence": tier_result.failure_analysis.confidence_score,
                 },
-                "item_count": len(tier_result.generated_items)
+                "item_count": len(tier_result.generated_items),
             }
             tier_file = validated_dir / f"tier_{i}_{tier_result.tier.value}.json"
@@ -222,7 +219,9 @@ def _format_duration(seconds: float) -> str:
     return f"{minutes}m {remaining_seconds}s"
-def load_result_from_disk(task_id: str, storage_path: str = ".empathy/progressive_runs") -> dict[str, Any]:
+def load_result_from_disk(
+    task_id: str, storage_path: str = ".empathy/progressive_runs"
+) -> dict[str, Any]:
     """Load saved result from disk.
     Args:
@@ -262,11 +261,7 @@ def load_result_from_disk(task_id: str, storage_path: str = ".empathy/progressiv
     report_file = task_dir / "report.txt"
     report = report_file.read_text() if report_file.exists() else ""
-    return {
-        "summary": summary,
-        "tier_results": tier_results,
-        "report": report
-    }
+    return {"summary": summary, "tier_results": tier_results, "report": report}
 def list_saved_results(storage_path: str = ".empathy/progressive_runs") -> list[dict[str, Any]]:
@@ -311,9 +306,7 @@ def list_saved_results(storage_path: str = ".empathy/progressive_runs") -> list[
 def cleanup_old_results(
-    storage_path: str = ".empathy/progressive_runs",
-    retention_days: int = 30,
-    dry_run: bool = False
+    storage_path: str = ".empathy/progressive_runs", retention_days: int = 30, dry_run: bool = False
 ) -> tuple[int, int]:
     """Clean up old progressive workflow results.
@@ -363,6 +356,7 @@ def cleanup_old_results(
                 # Old result, delete it
                 if not dry_run:
                     import shutil
                     shutil.rmtree(task_dir)
                     logger.info(f"Deleted old result: {task_dir.name}")
                 else:
@@ -378,9 +372,7 @@ def cleanup_old_results(
     return (deleted_count, retained_count)
-def generate_cost_analytics(
-    storage_path: str = ".empathy/progressive_runs"
-) -> dict[str, Any]:
+def generate_cost_analytics(storage_path: str = ".empathy/progressive_runs") -> dict[str, Any]:
     """Generate cost optimization analytics from saved results.
     Analyzes historical progressive workflow runs to provide insights:
@@ -408,7 +400,7 @@ def generate_cost_analytics(
             "total_runs": 0,
             "total_cost": 0.0,
             "total_savings": 0.0,
-            "avg_savings_percent": 0.0
+            "avg_savings_percent": 0.0,
         }
     total_runs = len(results)
@@ -417,8 +409,7 @@ def generate_cost_analytics(
     # Calculate average savings percent (weighted by cost)
     weighted_savings = sum(
-        r.get("cost_savings_percent", 0) * r.get("total_cost", 0)
-        for r in results
+        r.get("cost_savings_percent", 0) * r.get("total_cost", 0) for r in results
     )
     avg_savings_percent = weighted_savings / total_cost if total_cost > 0 else 0
@@ -450,7 +441,7 @@ def generate_cost_analytics(
                 "runs": 0,
                 "total_cost": 0.0,
                 "total_savings": 0.0,
-                "successes": 0
+                "successes": 0,
             }
         stats = workflow_stats[workflow]
@@ -476,7 +467,7 @@ def generate_cost_analytics(
         "avg_final_cqs": round(avg_cqs, 1),
         "tier_usage": tier_usage,
         "tier_costs": tier_costs,
-        "workflow_stats": workflow_stats
+        "workflow_stats": workflow_stats,
     }

empathy-framework 4.6.6__py3-none-any.whl → 4.7.0__py3-none-any.whl

empathy-framework 4.6.6__py3-none-any.whl → 4.7.0__py3-none-any.whl