attune-ai 2.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- attune/__init__.py +358 -0
- attune/adaptive/__init__.py +13 -0
- attune/adaptive/task_complexity.py +127 -0
- attune/agent_monitoring.py +414 -0
- attune/cache/__init__.py +117 -0
- attune/cache/base.py +166 -0
- attune/cache/dependency_manager.py +256 -0
- attune/cache/hash_only.py +251 -0
- attune/cache/hybrid.py +457 -0
- attune/cache/storage.py +285 -0
- attune/cache_monitor.py +356 -0
- attune/cache_stats.py +298 -0
- attune/cli/__init__.py +152 -0
- attune/cli/__main__.py +12 -0
- attune/cli/commands/__init__.py +1 -0
- attune/cli/commands/batch.py +264 -0
- attune/cli/commands/cache.py +248 -0
- attune/cli/commands/help.py +331 -0
- attune/cli/commands/info.py +140 -0
- attune/cli/commands/inspect.py +436 -0
- attune/cli/commands/inspection.py +57 -0
- attune/cli/commands/memory.py +48 -0
- attune/cli/commands/metrics.py +92 -0
- attune/cli/commands/orchestrate.py +184 -0
- attune/cli/commands/patterns.py +207 -0
- attune/cli/commands/profiling.py +202 -0
- attune/cli/commands/provider.py +98 -0
- attune/cli/commands/routing.py +285 -0
- attune/cli/commands/setup.py +96 -0
- attune/cli/commands/status.py +235 -0
- attune/cli/commands/sync.py +166 -0
- attune/cli/commands/tier.py +121 -0
- attune/cli/commands/utilities.py +114 -0
- attune/cli/commands/workflow.py +579 -0
- attune/cli/core.py +32 -0
- attune/cli/parsers/__init__.py +68 -0
- attune/cli/parsers/batch.py +118 -0
- attune/cli/parsers/cache.py +65 -0
- attune/cli/parsers/help.py +41 -0
- attune/cli/parsers/info.py +26 -0
- attune/cli/parsers/inspect.py +66 -0
- attune/cli/parsers/metrics.py +42 -0
- attune/cli/parsers/orchestrate.py +61 -0
- attune/cli/parsers/patterns.py +54 -0
- attune/cli/parsers/provider.py +40 -0
- attune/cli/parsers/routing.py +110 -0
- attune/cli/parsers/setup.py +42 -0
- attune/cli/parsers/status.py +47 -0
- attune/cli/parsers/sync.py +31 -0
- attune/cli/parsers/tier.py +33 -0
- attune/cli/parsers/workflow.py +77 -0
- attune/cli/utils/__init__.py +1 -0
- attune/cli/utils/data.py +242 -0
- attune/cli/utils/helpers.py +68 -0
- attune/cli_legacy.py +3957 -0
- attune/cli_minimal.py +1159 -0
- attune/cli_router.py +437 -0
- attune/cli_unified.py +814 -0
- attune/config/__init__.py +66 -0
- attune/config/xml_config.py +286 -0
- attune/config.py +545 -0
- attune/coordination.py +870 -0
- attune/core.py +1511 -0
- attune/core_modules/__init__.py +15 -0
- attune/cost_tracker.py +626 -0
- attune/dashboard/__init__.py +41 -0
- attune/dashboard/app.py +512 -0
- attune/dashboard/simple_server.py +435 -0
- attune/dashboard/standalone_server.py +547 -0
- attune/discovery.py +306 -0
- attune/emergence.py +306 -0
- attune/exceptions.py +123 -0
- attune/feedback_loops.py +373 -0
- attune/hot_reload/README.md +473 -0
- attune/hot_reload/__init__.py +62 -0
- attune/hot_reload/config.py +83 -0
- attune/hot_reload/integration.py +229 -0
- attune/hot_reload/reloader.py +298 -0
- attune/hot_reload/watcher.py +183 -0
- attune/hot_reload/websocket.py +177 -0
- attune/levels.py +577 -0
- attune/leverage_points.py +441 -0
- attune/logging_config.py +261 -0
- attune/mcp/__init__.py +10 -0
- attune/mcp/server.py +506 -0
- attune/memory/__init__.py +237 -0
- attune/memory/claude_memory.py +469 -0
- attune/memory/config.py +224 -0
- attune/memory/control_panel.py +1290 -0
- attune/memory/control_panel_support.py +145 -0
- attune/memory/cross_session.py +845 -0
- attune/memory/edges.py +179 -0
- attune/memory/encryption.py +159 -0
- attune/memory/file_session.py +770 -0
- attune/memory/graph.py +570 -0
- attune/memory/long_term.py +913 -0
- attune/memory/long_term_types.py +99 -0
- attune/memory/mixins/__init__.py +25 -0
- attune/memory/mixins/backend_init_mixin.py +249 -0
- attune/memory/mixins/capabilities_mixin.py +208 -0
- attune/memory/mixins/handoff_mixin.py +208 -0
- attune/memory/mixins/lifecycle_mixin.py +49 -0
- attune/memory/mixins/long_term_mixin.py +352 -0
- attune/memory/mixins/promotion_mixin.py +109 -0
- attune/memory/mixins/short_term_mixin.py +182 -0
- attune/memory/nodes.py +179 -0
- attune/memory/redis_bootstrap.py +540 -0
- attune/memory/security/__init__.py +31 -0
- attune/memory/security/audit_logger.py +932 -0
- attune/memory/security/pii_scrubber.py +640 -0
- attune/memory/security/secrets_detector.py +678 -0
- attune/memory/short_term.py +2192 -0
- attune/memory/simple_storage.py +302 -0
- attune/memory/storage/__init__.py +15 -0
- attune/memory/storage_backend.py +167 -0
- attune/memory/summary_index.py +583 -0
- attune/memory/types.py +446 -0
- attune/memory/unified.py +182 -0
- attune/meta_workflows/__init__.py +74 -0
- attune/meta_workflows/agent_creator.py +248 -0
- attune/meta_workflows/builtin_templates.py +567 -0
- attune/meta_workflows/cli_commands/__init__.py +56 -0
- attune/meta_workflows/cli_commands/agent_commands.py +321 -0
- attune/meta_workflows/cli_commands/analytics_commands.py +442 -0
- attune/meta_workflows/cli_commands/config_commands.py +232 -0
- attune/meta_workflows/cli_commands/memory_commands.py +182 -0
- attune/meta_workflows/cli_commands/template_commands.py +354 -0
- attune/meta_workflows/cli_commands/workflow_commands.py +382 -0
- attune/meta_workflows/cli_meta_workflows.py +59 -0
- attune/meta_workflows/form_engine.py +292 -0
- attune/meta_workflows/intent_detector.py +409 -0
- attune/meta_workflows/models.py +569 -0
- attune/meta_workflows/pattern_learner.py +738 -0
- attune/meta_workflows/plan_generator.py +384 -0
- attune/meta_workflows/session_context.py +397 -0
- attune/meta_workflows/template_registry.py +229 -0
- attune/meta_workflows/workflow.py +984 -0
- attune/metrics/__init__.py +12 -0
- attune/metrics/collector.py +31 -0
- attune/metrics/prompt_metrics.py +194 -0
- attune/models/__init__.py +172 -0
- attune/models/__main__.py +13 -0
- attune/models/adaptive_routing.py +437 -0
- attune/models/auth_cli.py +444 -0
- attune/models/auth_strategy.py +450 -0
- attune/models/cli.py +655 -0
- attune/models/empathy_executor.py +354 -0
- attune/models/executor.py +257 -0
- attune/models/fallback.py +762 -0
- attune/models/provider_config.py +282 -0
- attune/models/registry.py +472 -0
- attune/models/tasks.py +359 -0
- attune/models/telemetry/__init__.py +71 -0
- attune/models/telemetry/analytics.py +594 -0
- attune/models/telemetry/backend.py +196 -0
- attune/models/telemetry/data_models.py +431 -0
- attune/models/telemetry/storage.py +489 -0
- attune/models/token_estimator.py +420 -0
- attune/models/validation.py +280 -0
- attune/monitoring/__init__.py +52 -0
- attune/monitoring/alerts.py +946 -0
- attune/monitoring/alerts_cli.py +448 -0
- attune/monitoring/multi_backend.py +271 -0
- attune/monitoring/otel_backend.py +362 -0
- attune/optimization/__init__.py +19 -0
- attune/optimization/context_optimizer.py +272 -0
- attune/orchestration/__init__.py +67 -0
- attune/orchestration/agent_templates.py +707 -0
- attune/orchestration/config_store.py +499 -0
- attune/orchestration/execution_strategies.py +2111 -0
- attune/orchestration/meta_orchestrator.py +1168 -0
- attune/orchestration/pattern_learner.py +696 -0
- attune/orchestration/real_tools.py +931 -0
- attune/pattern_cache.py +187 -0
- attune/pattern_library.py +542 -0
- attune/patterns/debugging/all_patterns.json +81 -0
- attune/patterns/debugging/workflow_20260107_1770825e.json +77 -0
- attune/patterns/refactoring_memory.json +89 -0
- attune/persistence.py +564 -0
- attune/platform_utils.py +265 -0
- attune/plugins/__init__.py +28 -0
- attune/plugins/base.py +361 -0
- attune/plugins/registry.py +268 -0
- attune/project_index/__init__.py +32 -0
- attune/project_index/cli.py +335 -0
- attune/project_index/index.py +667 -0
- attune/project_index/models.py +504 -0
- attune/project_index/reports.py +474 -0
- attune/project_index/scanner.py +777 -0
- attune/project_index/scanner_parallel.py +291 -0
- attune/prompts/__init__.py +61 -0
- attune/prompts/config.py +77 -0
- attune/prompts/context.py +177 -0
- attune/prompts/parser.py +285 -0
- attune/prompts/registry.py +313 -0
- attune/prompts/templates.py +208 -0
- attune/redis_config.py +302 -0
- attune/redis_memory.py +799 -0
- attune/resilience/__init__.py +56 -0
- attune/resilience/circuit_breaker.py +256 -0
- attune/resilience/fallback.py +179 -0
- attune/resilience/health.py +300 -0
- attune/resilience/retry.py +209 -0
- attune/resilience/timeout.py +135 -0
- attune/routing/__init__.py +43 -0
- attune/routing/chain_executor.py +433 -0
- attune/routing/classifier.py +217 -0
- attune/routing/smart_router.py +234 -0
- attune/routing/workflow_registry.py +343 -0
- attune/scaffolding/README.md +589 -0
- attune/scaffolding/__init__.py +35 -0
- attune/scaffolding/__main__.py +14 -0
- attune/scaffolding/cli.py +240 -0
- attune/scaffolding/templates/base_wizard.py.jinja2 +121 -0
- attune/scaffolding/templates/coach_wizard.py.jinja2 +321 -0
- attune/scaffolding/templates/domain_wizard.py.jinja2 +408 -0
- attune/scaffolding/templates/linear_flow_wizard.py.jinja2 +203 -0
- attune/socratic/__init__.py +256 -0
- attune/socratic/ab_testing.py +958 -0
- attune/socratic/blueprint.py +533 -0
- attune/socratic/cli.py +703 -0
- attune/socratic/collaboration.py +1114 -0
- attune/socratic/domain_templates.py +924 -0
- attune/socratic/embeddings.py +738 -0
- attune/socratic/engine.py +794 -0
- attune/socratic/explainer.py +682 -0
- attune/socratic/feedback.py +772 -0
- attune/socratic/forms.py +629 -0
- attune/socratic/generator.py +732 -0
- attune/socratic/llm_analyzer.py +637 -0
- attune/socratic/mcp_server.py +702 -0
- attune/socratic/session.py +312 -0
- attune/socratic/storage.py +667 -0
- attune/socratic/success.py +730 -0
- attune/socratic/visual_editor.py +860 -0
- attune/socratic/web_ui.py +958 -0
- attune/telemetry/__init__.py +39 -0
- attune/telemetry/agent_coordination.py +475 -0
- attune/telemetry/agent_tracking.py +367 -0
- attune/telemetry/approval_gates.py +545 -0
- attune/telemetry/cli.py +1231 -0
- attune/telemetry/commands/__init__.py +14 -0
- attune/telemetry/commands/dashboard_commands.py +696 -0
- attune/telemetry/event_streaming.py +409 -0
- attune/telemetry/feedback_loop.py +567 -0
- attune/telemetry/usage_tracker.py +591 -0
- attune/templates.py +754 -0
- attune/test_generator/__init__.py +38 -0
- attune/test_generator/__main__.py +14 -0
- attune/test_generator/cli.py +234 -0
- attune/test_generator/generator.py +355 -0
- attune/test_generator/risk_analyzer.py +216 -0
- attune/test_generator/templates/unit_test.py.jinja2 +272 -0
- attune/tier_recommender.py +384 -0
- attune/tools.py +183 -0
- attune/trust/__init__.py +28 -0
- attune/trust/circuit_breaker.py +579 -0
- attune/trust_building.py +527 -0
- attune/validation/__init__.py +19 -0
- attune/validation/xml_validator.py +281 -0
- attune/vscode_bridge.py +173 -0
- attune/workflow_commands.py +780 -0
- attune/workflow_patterns/__init__.py +33 -0
- attune/workflow_patterns/behavior.py +249 -0
- attune/workflow_patterns/core.py +76 -0
- attune/workflow_patterns/output.py +99 -0
- attune/workflow_patterns/registry.py +255 -0
- attune/workflow_patterns/structural.py +288 -0
- attune/workflows/__init__.py +539 -0
- attune/workflows/autonomous_test_gen.py +1268 -0
- attune/workflows/base.py +2667 -0
- attune/workflows/batch_processing.py +342 -0
- attune/workflows/bug_predict.py +1084 -0
- attune/workflows/builder.py +273 -0
- attune/workflows/caching.py +253 -0
- attune/workflows/code_review.py +1048 -0
- attune/workflows/code_review_adapters.py +312 -0
- attune/workflows/code_review_pipeline.py +722 -0
- attune/workflows/config.py +645 -0
- attune/workflows/dependency_check.py +644 -0
- attune/workflows/document_gen/__init__.py +25 -0
- attune/workflows/document_gen/config.py +30 -0
- attune/workflows/document_gen/report_formatter.py +162 -0
- attune/workflows/document_gen/workflow.py +1426 -0
- attune/workflows/document_manager.py +216 -0
- attune/workflows/document_manager_README.md +134 -0
- attune/workflows/documentation_orchestrator.py +1205 -0
- attune/workflows/history.py +510 -0
- attune/workflows/keyboard_shortcuts/__init__.py +39 -0
- attune/workflows/keyboard_shortcuts/generators.py +391 -0
- attune/workflows/keyboard_shortcuts/parsers.py +416 -0
- attune/workflows/keyboard_shortcuts/prompts.py +295 -0
- attune/workflows/keyboard_shortcuts/schema.py +193 -0
- attune/workflows/keyboard_shortcuts/workflow.py +509 -0
- attune/workflows/llm_base.py +363 -0
- attune/workflows/manage_docs.py +87 -0
- attune/workflows/manage_docs_README.md +134 -0
- attune/workflows/manage_documentation.py +821 -0
- attune/workflows/new_sample_workflow1.py +149 -0
- attune/workflows/new_sample_workflow1_README.md +150 -0
- attune/workflows/orchestrated_health_check.py +849 -0
- attune/workflows/orchestrated_release_prep.py +600 -0
- attune/workflows/output.py +413 -0
- attune/workflows/perf_audit.py +863 -0
- attune/workflows/pr_review.py +762 -0
- attune/workflows/progress.py +785 -0
- attune/workflows/progress_server.py +322 -0
- attune/workflows/progressive/README 2.md +454 -0
- attune/workflows/progressive/README.md +454 -0
- attune/workflows/progressive/__init__.py +82 -0
- attune/workflows/progressive/cli.py +219 -0
- attune/workflows/progressive/core.py +488 -0
- attune/workflows/progressive/orchestrator.py +723 -0
- attune/workflows/progressive/reports.py +520 -0
- attune/workflows/progressive/telemetry.py +274 -0
- attune/workflows/progressive/test_gen.py +495 -0
- attune/workflows/progressive/workflow.py +589 -0
- attune/workflows/refactor_plan.py +694 -0
- attune/workflows/release_prep.py +895 -0
- attune/workflows/release_prep_crew.py +969 -0
- attune/workflows/research_synthesis.py +404 -0
- attune/workflows/routing.py +168 -0
- attune/workflows/secure_release.py +593 -0
- attune/workflows/security_adapters.py +297 -0
- attune/workflows/security_audit.py +1329 -0
- attune/workflows/security_audit_phase3.py +355 -0
- attune/workflows/seo_optimization.py +633 -0
- attune/workflows/step_config.py +234 -0
- attune/workflows/telemetry_mixin.py +269 -0
- attune/workflows/test5.py +125 -0
- attune/workflows/test5_README.md +158 -0
- attune/workflows/test_coverage_boost_crew.py +849 -0
- attune/workflows/test_gen/__init__.py +52 -0
- attune/workflows/test_gen/ast_analyzer.py +249 -0
- attune/workflows/test_gen/config.py +88 -0
- attune/workflows/test_gen/data_models.py +38 -0
- attune/workflows/test_gen/report_formatter.py +289 -0
- attune/workflows/test_gen/test_templates.py +381 -0
- attune/workflows/test_gen/workflow.py +655 -0
- attune/workflows/test_gen.py +54 -0
- attune/workflows/test_gen_behavioral.py +477 -0
- attune/workflows/test_gen_parallel.py +341 -0
- attune/workflows/test_lifecycle.py +526 -0
- attune/workflows/test_maintenance.py +627 -0
- attune/workflows/test_maintenance_cli.py +590 -0
- attune/workflows/test_maintenance_crew.py +840 -0
- attune/workflows/test_runner.py +622 -0
- attune/workflows/tier_tracking.py +531 -0
- attune/workflows/xml_enhanced_crew.py +285 -0
- attune_ai-2.0.0.dist-info/METADATA +1026 -0
- attune_ai-2.0.0.dist-info/RECORD +457 -0
- attune_ai-2.0.0.dist-info/WHEEL +5 -0
- attune_ai-2.0.0.dist-info/entry_points.txt +26 -0
- attune_ai-2.0.0.dist-info/licenses/LICENSE +201 -0
- attune_ai-2.0.0.dist-info/licenses/LICENSE_CHANGE_ANNOUNCEMENT.md +101 -0
- attune_ai-2.0.0.dist-info/top_level.txt +5 -0
- attune_healthcare/__init__.py +13 -0
- attune_healthcare/monitors/__init__.py +9 -0
- attune_healthcare/monitors/clinical_protocol_monitor.py +315 -0
- attune_healthcare/monitors/monitoring/__init__.py +44 -0
- attune_healthcare/monitors/monitoring/protocol_checker.py +300 -0
- attune_healthcare/monitors/monitoring/protocol_loader.py +214 -0
- attune_healthcare/monitors/monitoring/sensor_parsers.py +306 -0
- attune_healthcare/monitors/monitoring/trajectory_analyzer.py +389 -0
- attune_llm/README.md +553 -0
- attune_llm/__init__.py +28 -0
- attune_llm/agent_factory/__init__.py +53 -0
- attune_llm/agent_factory/adapters/__init__.py +85 -0
- attune_llm/agent_factory/adapters/autogen_adapter.py +312 -0
- attune_llm/agent_factory/adapters/crewai_adapter.py +483 -0
- attune_llm/agent_factory/adapters/haystack_adapter.py +298 -0
- attune_llm/agent_factory/adapters/langchain_adapter.py +362 -0
- attune_llm/agent_factory/adapters/langgraph_adapter.py +333 -0
- attune_llm/agent_factory/adapters/native.py +228 -0
- attune_llm/agent_factory/adapters/wizard_adapter.py +423 -0
- attune_llm/agent_factory/base.py +305 -0
- attune_llm/agent_factory/crews/__init__.py +67 -0
- attune_llm/agent_factory/crews/code_review.py +1113 -0
- attune_llm/agent_factory/crews/health_check.py +1262 -0
- attune_llm/agent_factory/crews/refactoring.py +1128 -0
- attune_llm/agent_factory/crews/security_audit.py +1018 -0
- attune_llm/agent_factory/decorators.py +287 -0
- attune_llm/agent_factory/factory.py +558 -0
- attune_llm/agent_factory/framework.py +193 -0
- attune_llm/agent_factory/memory_integration.py +328 -0
- attune_llm/agent_factory/resilient.py +320 -0
- attune_llm/agents_md/__init__.py +22 -0
- attune_llm/agents_md/loader.py +218 -0
- attune_llm/agents_md/parser.py +271 -0
- attune_llm/agents_md/registry.py +307 -0
- attune_llm/claude_memory.py +466 -0
- attune_llm/cli/__init__.py +8 -0
- attune_llm/cli/sync_claude.py +487 -0
- attune_llm/code_health.py +1313 -0
- attune_llm/commands/__init__.py +51 -0
- attune_llm/commands/context.py +375 -0
- attune_llm/commands/loader.py +301 -0
- attune_llm/commands/models.py +231 -0
- attune_llm/commands/parser.py +371 -0
- attune_llm/commands/registry.py +429 -0
- attune_llm/config/__init__.py +29 -0
- attune_llm/config/unified.py +291 -0
- attune_llm/context/__init__.py +22 -0
- attune_llm/context/compaction.py +455 -0
- attune_llm/context/manager.py +434 -0
- attune_llm/contextual_patterns.py +361 -0
- attune_llm/core.py +907 -0
- attune_llm/git_pattern_extractor.py +435 -0
- attune_llm/hooks/__init__.py +24 -0
- attune_llm/hooks/config.py +306 -0
- attune_llm/hooks/executor.py +289 -0
- attune_llm/hooks/registry.py +302 -0
- attune_llm/hooks/scripts/__init__.py +39 -0
- attune_llm/hooks/scripts/evaluate_session.py +201 -0
- attune_llm/hooks/scripts/first_time_init.py +285 -0
- attune_llm/hooks/scripts/pre_compact.py +207 -0
- attune_llm/hooks/scripts/session_end.py +183 -0
- attune_llm/hooks/scripts/session_start.py +163 -0
- attune_llm/hooks/scripts/suggest_compact.py +225 -0
- attune_llm/learning/__init__.py +30 -0
- attune_llm/learning/evaluator.py +438 -0
- attune_llm/learning/extractor.py +514 -0
- attune_llm/learning/storage.py +560 -0
- attune_llm/levels.py +227 -0
- attune_llm/pattern_confidence.py +414 -0
- attune_llm/pattern_resolver.py +272 -0
- attune_llm/pattern_summary.py +350 -0
- attune_llm/providers.py +967 -0
- attune_llm/routing/__init__.py +32 -0
- attune_llm/routing/model_router.py +362 -0
- attune_llm/security/IMPLEMENTATION_SUMMARY.md +413 -0
- attune_llm/security/PHASE2_COMPLETE.md +384 -0
- attune_llm/security/PHASE2_SECRETS_DETECTOR_COMPLETE.md +271 -0
- attune_llm/security/QUICK_REFERENCE.md +316 -0
- attune_llm/security/README.md +262 -0
- attune_llm/security/__init__.py +62 -0
- attune_llm/security/audit_logger.py +929 -0
- attune_llm/security/audit_logger_example.py +152 -0
- attune_llm/security/pii_scrubber.py +640 -0
- attune_llm/security/secrets_detector.py +678 -0
- attune_llm/security/secrets_detector_example.py +304 -0
- attune_llm/security/secure_memdocs.py +1192 -0
- attune_llm/security/secure_memdocs_example.py +278 -0
- attune_llm/session_status.py +745 -0
- attune_llm/state.py +246 -0
- attune_llm/utils/__init__.py +5 -0
- attune_llm/utils/tokens.py +349 -0
- attune_software/SOFTWARE_PLUGIN_README.md +57 -0
- attune_software/__init__.py +13 -0
- attune_software/cli/__init__.py +120 -0
- attune_software/cli/inspect.py +362 -0
- attune_software/cli.py +574 -0
- attune_software/plugin.py +188 -0
- workflow_scaffolding/__init__.py +11 -0
- workflow_scaffolding/__main__.py +12 -0
- workflow_scaffolding/cli.py +206 -0
- workflow_scaffolding/generator.py +265 -0
|
@@ -0,0 +1,723 @@
|
|
|
1
|
+
"""Meta-orchestrator for progressive tier escalation decisions.
|
|
2
|
+
|
|
3
|
+
The MetaOrchestrator is responsible for:
|
|
4
|
+
1. Analyzing tier execution results
|
|
5
|
+
2. Making escalation decisions
|
|
6
|
+
3. Creating specialized agent teams
|
|
7
|
+
4. Building XML-enhanced prompts with failure context
|
|
8
|
+
5. Detecting stagnation patterns
|
|
9
|
+
"""
|
|
10
|
+
|
|
11
|
+
import logging
|
|
12
|
+
from typing import Any
|
|
13
|
+
|
|
14
|
+
from attune.workflows.progressive.core import EscalationConfig, Tier, TierResult
|
|
15
|
+
|
|
16
|
+
# Module-level logger, named after this module via __name__.
logger = logging.getLogger(__name__)
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class MetaOrchestrator:
|
|
20
|
+
"""Meta-agent that orchestrates progressive tier decisions.
|
|
21
|
+
|
|
22
|
+
The MetaOrchestrator acts as a higher-level intelligence that:
|
|
23
|
+
- Analyzes tier results objectively
|
|
24
|
+
- Decides when to escalate vs retry
|
|
25
|
+
- Detects stagnation patterns
|
|
26
|
+
- Creates specialized agent teams per tier
|
|
27
|
+
- Builds context-aware prompts
|
|
28
|
+
|
|
29
|
+
This separates escalation logic from workflow logic, allowing
|
|
30
|
+
workflows to focus on their domain-specific tasks.
|
|
31
|
+
|
|
32
|
+
Example:
|
|
33
|
+
>>> orchestrator = MetaOrchestrator()
|
|
34
|
+
>>> should_esc, reason = orchestrator.should_escalate(
|
|
35
|
+
... tier=Tier.CHEAP,
|
|
36
|
+
... result=cheap_result,
|
|
37
|
+
... attempt=2,
|
|
38
|
+
... config=config
|
|
39
|
+
... )
|
|
40
|
+
>>> if should_esc:
|
|
41
|
+
... print(f"Escalating: {reason}")
|
|
42
|
+
"""
|
|
43
|
+
|
|
44
|
+
def __init__(self) -> None:
    """Create an empty quality-score history for each tier."""
    # One chronological list of scores per tier. should_escalate appends to
    # these lists and the capable-tier stagnation check reads them back.
    self.tier_history: dict[Tier, list[float]] = {
        level: [] for level in (Tier.CHEAP, Tier.CAPABLE, Tier.PREMIUM)
    }
|
|
51
|
+
|
|
52
|
+
def should_escalate(
|
|
53
|
+
self, tier: Tier, result: TierResult, attempt: int, config: EscalationConfig
|
|
54
|
+
) -> tuple[bool, str]:
|
|
55
|
+
"""Determine if tier should escalate to next tier.
|
|
56
|
+
|
|
57
|
+
Multi-criteria decision based on:
|
|
58
|
+
- Quality score vs thresholds
|
|
59
|
+
- Syntax errors
|
|
60
|
+
- Failure rate
|
|
61
|
+
- Attempt count
|
|
62
|
+
- Stagnation detection (for CAPABLE tier)
|
|
63
|
+
|
|
64
|
+
Args:
|
|
65
|
+
tier: Current tier
|
|
66
|
+
result: Execution result
|
|
67
|
+
attempt: Attempt number at this tier
|
|
68
|
+
config: Escalation configuration
|
|
69
|
+
|
|
70
|
+
Returns:
|
|
71
|
+
Tuple of (should_escalate, reason)
|
|
72
|
+
|
|
73
|
+
Example:
|
|
74
|
+
>>> should_esc, reason = orchestrator.should_escalate(
|
|
75
|
+
... Tier.CHEAP, result, 2, config
|
|
76
|
+
... )
|
|
77
|
+
>>> # (True, "Quality score 65 below threshold 70")
|
|
78
|
+
"""
|
|
79
|
+
cqs = result.quality_score
|
|
80
|
+
|
|
81
|
+
# Track CQS history for stagnation detection
|
|
82
|
+
self.tier_history[tier].append(cqs)
|
|
83
|
+
|
|
84
|
+
# Check if we've met minimum attempts
|
|
85
|
+
min_attempts = config.get_min_attempts(tier)
|
|
86
|
+
if attempt < min_attempts:
|
|
87
|
+
return False, f"Only {attempt}/{min_attempts} attempts completed"
|
|
88
|
+
|
|
89
|
+
# Tier-specific threshold checks
|
|
90
|
+
if tier == Tier.CHEAP:
|
|
91
|
+
return self._check_cheap_escalation(result, config)
|
|
92
|
+
elif tier == Tier.CAPABLE:
|
|
93
|
+
return self._check_capable_escalation(result, attempt, config)
|
|
94
|
+
else: # PREMIUM
|
|
95
|
+
# Premium doesn't escalate (highest tier)
|
|
96
|
+
return False, "Premium tier is final"
|
|
97
|
+
|
|
98
|
+
def _check_cheap_escalation(
|
|
99
|
+
self, result: TierResult, config: EscalationConfig
|
|
100
|
+
) -> tuple[bool, str]:
|
|
101
|
+
"""Check if cheap tier should escalate to capable.
|
|
102
|
+
|
|
103
|
+
Args:
|
|
104
|
+
result: Cheap tier result
|
|
105
|
+
config: Escalation configuration
|
|
106
|
+
|
|
107
|
+
Returns:
|
|
108
|
+
Tuple of (should_escalate, reason)
|
|
109
|
+
"""
|
|
110
|
+
cqs = result.quality_score
|
|
111
|
+
failure_rate = 1.0 - result.success_rate
|
|
112
|
+
syntax_error_count = len(result.failure_analysis.syntax_errors)
|
|
113
|
+
|
|
114
|
+
# Check severity first (critical failures)
|
|
115
|
+
if result.failure_analysis.failure_severity == "CRITICAL":
|
|
116
|
+
return True, "Critical failures detected (consider skipping to Premium)"
|
|
117
|
+
|
|
118
|
+
# Check syntax errors (prioritize over CQS)
|
|
119
|
+
if syntax_error_count > config.cheap_to_capable_max_syntax_errors:
|
|
120
|
+
return (
|
|
121
|
+
True,
|
|
122
|
+
f"{syntax_error_count} syntax errors exceeds limit {config.cheap_to_capable_max_syntax_errors}",
|
|
123
|
+
)
|
|
124
|
+
|
|
125
|
+
# Check failure rate
|
|
126
|
+
if failure_rate > config.cheap_to_capable_failure_rate:
|
|
127
|
+
return (
|
|
128
|
+
True,
|
|
129
|
+
f"Failure rate {failure_rate:.1%} exceeds threshold {config.cheap_to_capable_failure_rate:.1%}",
|
|
130
|
+
)
|
|
131
|
+
|
|
132
|
+
# Check CQS threshold
|
|
133
|
+
if cqs < config.cheap_to_capable_min_cqs:
|
|
134
|
+
return (
|
|
135
|
+
True,
|
|
136
|
+
f"Quality score {cqs:.1f} below threshold {config.cheap_to_capable_min_cqs}",
|
|
137
|
+
)
|
|
138
|
+
|
|
139
|
+
# All checks passed, no escalation needed
|
|
140
|
+
return False, f"Quality acceptable (CQS={cqs:.1f})"
|
|
141
|
+
|
|
142
|
+
def _check_capable_escalation(
|
|
143
|
+
self, result: TierResult, attempt: int, config: EscalationConfig
|
|
144
|
+
) -> tuple[bool, str]:
|
|
145
|
+
"""Check if capable tier should escalate to premium.
|
|
146
|
+
|
|
147
|
+
Includes stagnation detection: if improvement is <5% for 2 consecutive
|
|
148
|
+
attempts, escalate even if quality is borderline acceptable.
|
|
149
|
+
|
|
150
|
+
Args:
|
|
151
|
+
result: Capable tier result
|
|
152
|
+
attempt: Attempt number
|
|
153
|
+
config: Escalation configuration
|
|
154
|
+
|
|
155
|
+
Returns:
|
|
156
|
+
Tuple of (should_escalate, reason)
|
|
157
|
+
"""
|
|
158
|
+
cqs = result.quality_score
|
|
159
|
+
failure_rate = 1.0 - result.success_rate
|
|
160
|
+
syntax_error_count = len(result.failure_analysis.syntax_errors)
|
|
161
|
+
|
|
162
|
+
# Check max attempts first
|
|
163
|
+
if attempt >= config.capable_max_attempts:
|
|
164
|
+
return (
|
|
165
|
+
True,
|
|
166
|
+
f"Max attempts ({config.capable_max_attempts}) reached without achieving target quality",
|
|
167
|
+
)
|
|
168
|
+
|
|
169
|
+
# Check syntax errors (strict for capable tier)
|
|
170
|
+
if syntax_error_count > config.capable_to_premium_max_syntax_errors:
|
|
171
|
+
return (
|
|
172
|
+
True,
|
|
173
|
+
f"{syntax_error_count} syntax errors exceeds limit {config.capable_to_premium_max_syntax_errors}",
|
|
174
|
+
)
|
|
175
|
+
|
|
176
|
+
# Check failure rate
|
|
177
|
+
if failure_rate > config.capable_to_premium_failure_rate:
|
|
178
|
+
return (
|
|
179
|
+
True,
|
|
180
|
+
f"Failure rate {failure_rate:.1%} exceeds threshold {config.capable_to_premium_failure_rate:.1%}",
|
|
181
|
+
)
|
|
182
|
+
|
|
183
|
+
# Check stagnation (consecutive runs with <5% improvement)
|
|
184
|
+
# Only check if we have enough history
|
|
185
|
+
if len(self.tier_history[Tier.CAPABLE]) >= config.consecutive_stagnation_limit + 1:
|
|
186
|
+
is_stagnant, stagnation_reason = self._detect_stagnation(
|
|
187
|
+
self.tier_history[Tier.CAPABLE],
|
|
188
|
+
config.improvement_threshold,
|
|
189
|
+
config.consecutive_stagnation_limit,
|
|
190
|
+
)
|
|
191
|
+
|
|
192
|
+
if is_stagnant:
|
|
193
|
+
return True, f"Stagnation detected: {stagnation_reason}"
|
|
194
|
+
|
|
195
|
+
# Check CQS threshold (after stagnation check)
|
|
196
|
+
if cqs < config.capable_to_premium_min_cqs and attempt >= config.capable_min_attempts:
|
|
197
|
+
return (
|
|
198
|
+
True,
|
|
199
|
+
f"Quality score {cqs:.1f} below threshold {config.capable_to_premium_min_cqs}",
|
|
200
|
+
)
|
|
201
|
+
|
|
202
|
+
# No escalation needed
|
|
203
|
+
return False, f"Quality acceptable (CQS={cqs:.1f}), continuing improvement"
|
|
204
|
+
|
|
205
|
+
def _detect_stagnation(
|
|
206
|
+
self, cqs_history: list[float], improvement_threshold: float, consecutive_limit: int
|
|
207
|
+
) -> tuple[bool, str]:
|
|
208
|
+
"""Detect if improvement has stagnated.
|
|
209
|
+
|
|
210
|
+
Stagnation is defined as N consecutive attempts with <X% improvement.
|
|
211
|
+
|
|
212
|
+
Args:
|
|
213
|
+
cqs_history: List of CQS scores (chronological)
|
|
214
|
+
improvement_threshold: Min improvement % to avoid stagnation
|
|
215
|
+
consecutive_limit: Number of consecutive stagnations before escalating
|
|
216
|
+
|
|
217
|
+
Returns:
|
|
218
|
+
Tuple of (is_stagnant, reason)
|
|
219
|
+
|
|
220
|
+
Example:
|
|
221
|
+
>>> history = [75, 76, 77, 77.5]
|
|
222
|
+
>>> is_stagnant, reason = orchestrator._detect_stagnation(
|
|
223
|
+
... history, improvement_threshold=5.0, consecutive_limit=2
|
|
224
|
+
... )
|
|
225
|
+
>>> # (True, "2 consecutive runs with <5% improvement")
|
|
226
|
+
"""
|
|
227
|
+
if len(cqs_history) < consecutive_limit + 1:
|
|
228
|
+
return False, "Insufficient history for stagnation detection"
|
|
229
|
+
|
|
230
|
+
# Check last N improvements
|
|
231
|
+
consecutive_stagnations = 0
|
|
232
|
+
|
|
233
|
+
for i in range(len(cqs_history) - 1, 0, -1):
|
|
234
|
+
current = cqs_history[i]
|
|
235
|
+
previous = cqs_history[i - 1]
|
|
236
|
+
|
|
237
|
+
improvement = current - previous
|
|
238
|
+
|
|
239
|
+
if improvement < improvement_threshold:
|
|
240
|
+
consecutive_stagnations += 1
|
|
241
|
+
|
|
242
|
+
if consecutive_stagnations >= consecutive_limit:
|
|
243
|
+
return True, (
|
|
244
|
+
f"{consecutive_stagnations} consecutive runs with "
|
|
245
|
+
f"<{improvement_threshold}% improvement"
|
|
246
|
+
)
|
|
247
|
+
else:
|
|
248
|
+
# Improvement above threshold, reset counter
|
|
249
|
+
break
|
|
250
|
+
|
|
251
|
+
return False, "No stagnation detected"
|
|
252
|
+
|
|
253
|
+
def build_tier_prompt(
    self, tier: Tier, base_task: str, failure_context: dict[str, Any] | None = None
) -> str:
    """Build the prompt for a tier by dispatching to its prompt builder.

    - CHEAP: built from the task alone; ``failure_context`` is not used
    - CAPABLE: built from the task and ``failure_context``
    - any other tier (PREMIUM): built from the task and ``failure_context``

    Args:
        tier: Which tier this prompt is for
        base_task: Base task description
        failure_context: Context from previous tier (if escalating)

    Returns:
        XML-enhanced prompt string

    Example:
        >>> prompt = orchestrator.build_tier_prompt(
        ...     Tier.CAPABLE,
        ...     "Generate tests for module.py",
        ...     failure_context={"previous_tier": Tier.CHEAP, ...}
        ... )
    """
    if tier == Tier.CHEAP:
        return self._build_cheap_prompt(base_task)

    # Both remaining builders take the same arguments; only the builder differs.
    builder = (
        self._build_capable_prompt
        if tier == Tier.CAPABLE
        else self._build_premium_prompt
    )
    return builder(base_task, failure_context)
|
|
284
|
+
|
|
285
|
+
def _build_cheap_prompt(self, base_task: str) -> str:
    """Build the baseline prompt used for the cheap tier.

    The task text is interpolated as-is into the <objective> element; no
    escaping is applied here. The quality requirements in the prompt are
    fixed literals (70%+ pass rate, 60%+ coverage, no syntax errors).

    Args:
        base_task: Task description

    Returns:
        XML-enhanced prompt
    """
    return f"""<task>
<objective>{base_task}</objective>

<quality_requirements>
<pass_rate>70%+</pass_rate>
<coverage>60%+</coverage>
<syntax>No syntax errors</syntax>
</quality_requirements>

<instructions>
Generate high-quality output that meets the quality requirements.
Focus on correctness and completeness.
</instructions>
</task>"""
|
|
308
|
+
|
|
309
|
+
def _build_capable_prompt(self, base_task: str, failure_context: dict[str, Any] | None) -> str:
|
|
310
|
+
"""Build enhanced prompt for capable tier with failure context.
|
|
311
|
+
|
|
312
|
+
Args:
|
|
313
|
+
base_task: Task description
|
|
314
|
+
failure_context: Context from cheap tier
|
|
315
|
+
|
|
316
|
+
Returns:
|
|
317
|
+
XML-enhanced prompt with failure analysis
|
|
318
|
+
"""
|
|
319
|
+
if not failure_context:
|
|
320
|
+
# No context, use enhanced base prompt
|
|
321
|
+
return f"""<task>
|
|
322
|
+
<objective>{base_task}</objective>
|
|
323
|
+
|
|
324
|
+
<quality_requirements>
|
|
325
|
+
<pass_rate>80%+</pass_rate>
|
|
326
|
+
<coverage>70%+</coverage>
|
|
327
|
+
<quality_score>80+</quality_score>
|
|
328
|
+
</quality_requirements>
|
|
329
|
+
|
|
330
|
+
<instructions>
|
|
331
|
+
Generate high-quality output with comprehensive coverage.
|
|
332
|
+
Ensure all edge cases are handled correctly.
|
|
333
|
+
</instructions>
|
|
334
|
+
</task>"""
|
|
335
|
+
|
|
336
|
+
# Extract detailed failure context
|
|
337
|
+
previous_cqs = failure_context.get("previous_cqs", 0)
|
|
338
|
+
reason = failure_context.get("reason", "Quality below threshold")
|
|
339
|
+
failures = failure_context.get("failures", [])
|
|
340
|
+
examples = failure_context.get("examples", [])
|
|
341
|
+
|
|
342
|
+
# Analyze failure patterns
|
|
343
|
+
failure_patterns = self.analyze_failure_patterns(failures) if failures else {}
|
|
344
|
+
|
|
345
|
+
# Build detailed prompt with failure analysis
|
|
346
|
+
prompt_parts = [
|
|
347
|
+
"<task>",
|
|
348
|
+
f" <objective>{base_task}</objective>",
|
|
349
|
+
"",
|
|
350
|
+
" <context_from_previous_tier>",
|
|
351
|
+
" <tier>cheap</tier>",
|
|
352
|
+
f" <quality_score>{previous_cqs:.1f}</quality_score>",
|
|
353
|
+
f" <escalation_reason>{reason}</escalation_reason>",
|
|
354
|
+
"",
|
|
355
|
+
]
|
|
356
|
+
|
|
357
|
+
# Add failure pattern analysis
|
|
358
|
+
if failure_patterns:
|
|
359
|
+
prompt_parts.append(" <failure_analysis>")
|
|
360
|
+
prompt_parts.append(
|
|
361
|
+
f" <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>"
|
|
362
|
+
)
|
|
363
|
+
prompt_parts.append(" <patterns>")
|
|
364
|
+
|
|
365
|
+
error_types = failure_patterns.get("error_types", {})
|
|
366
|
+
for error_type, count in sorted(error_types.items(), key=lambda x: -x[1]):
|
|
367
|
+
prompt_parts.append(f' <pattern type="{error_type}" count="{count}" />')
|
|
368
|
+
|
|
369
|
+
prompt_parts.append(" </patterns>")
|
|
370
|
+
|
|
371
|
+
primary_issue = failure_patterns.get("primary_issue", "unknown")
|
|
372
|
+
prompt_parts.append(f" <primary_issue>{primary_issue}</primary_issue>")
|
|
373
|
+
prompt_parts.append(" </failure_analysis>")
|
|
374
|
+
prompt_parts.append("")
|
|
375
|
+
|
|
376
|
+
# Add concrete failure examples (max 3)
|
|
377
|
+
if examples:
|
|
378
|
+
prompt_parts.append(" <failed_attempts>")
|
|
379
|
+
prompt_parts.append(" <!-- Examples of what the cheap tier produced -->")
|
|
380
|
+
|
|
381
|
+
for i, example in enumerate(examples[:3], 1):
|
|
382
|
+
error = example.get("error", "Unknown error")
|
|
383
|
+
code_snippet = example.get("code", "")[:200] # Limit snippet length
|
|
384
|
+
|
|
385
|
+
prompt_parts.append(f' <example number="{i}">')
|
|
386
|
+
prompt_parts.append(f" <error>{self._escape_xml(error)}</error>")
|
|
387
|
+
if code_snippet:
|
|
388
|
+
prompt_parts.append(
|
|
389
|
+
f" <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>"
|
|
390
|
+
)
|
|
391
|
+
prompt_parts.append(" </example>")
|
|
392
|
+
|
|
393
|
+
prompt_parts.append(" </failed_attempts>")
|
|
394
|
+
prompt_parts.append("")
|
|
395
|
+
|
|
396
|
+
prompt_parts.extend(
|
|
397
|
+
[
|
|
398
|
+
" <improvement_needed>",
|
|
399
|
+
" The cheap tier struggled with these items. Analyze the failure",
|
|
400
|
+
" patterns above and generate improved solutions that specifically",
|
|
401
|
+
" address these issues.",
|
|
402
|
+
" </improvement_needed>",
|
|
403
|
+
" </context_from_previous_tier>",
|
|
404
|
+
"",
|
|
405
|
+
" <your_task>",
|
|
406
|
+
" Generate improved output that avoids the specific failure patterns identified above.",
|
|
407
|
+
"",
|
|
408
|
+
" <quality_requirements>",
|
|
409
|
+
" <pass_rate>80%+</pass_rate>",
|
|
410
|
+
" <coverage>70%+</coverage>",
|
|
411
|
+
" <quality_score>80+</quality_score>",
|
|
412
|
+
" </quality_requirements>",
|
|
413
|
+
"",
|
|
414
|
+
" <focus_areas>",
|
|
415
|
+
]
|
|
416
|
+
)
|
|
417
|
+
|
|
418
|
+
# Add targeted focus areas based on failure patterns
|
|
419
|
+
if failure_patterns:
|
|
420
|
+
error_types = failure_patterns.get("error_types", {})
|
|
421
|
+
if "async_errors" in error_types:
|
|
422
|
+
prompt_parts.append(
|
|
423
|
+
' <focus area="async">Proper async/await patterns and error handling</focus>'
|
|
424
|
+
)
|
|
425
|
+
if "mocking_errors" in error_types:
|
|
426
|
+
prompt_parts.append(
|
|
427
|
+
' <focus area="mocking">Correct mock setup and teardown</focus>'
|
|
428
|
+
)
|
|
429
|
+
if "syntax_errors" in error_types:
|
|
430
|
+
prompt_parts.append(
|
|
431
|
+
' <focus area="syntax">Valid Python syntax and imports</focus>'
|
|
432
|
+
)
|
|
433
|
+
if "other_errors" in error_types:
|
|
434
|
+
prompt_parts.append(
|
|
435
|
+
' <focus area="general">Edge cases and error handling</focus>'
|
|
436
|
+
)
|
|
437
|
+
else:
|
|
438
|
+
# Default focus areas
|
|
439
|
+
prompt_parts.extend(
|
|
440
|
+
[
|
|
441
|
+
' <focus area="syntax">Correct syntax and structure</focus>',
|
|
442
|
+
' <focus area="coverage">Comprehensive test coverage</focus>',
|
|
443
|
+
' <focus area="errors">Proper error handling</focus>',
|
|
444
|
+
' <focus area="edge_cases">Edge case coverage</focus>',
|
|
445
|
+
]
|
|
446
|
+
)
|
|
447
|
+
|
|
448
|
+
prompt_parts.extend([" </focus_areas>", " </your_task>", "</task>"])
|
|
449
|
+
|
|
450
|
+
return "\n".join(prompt_parts)
|
|
451
|
+
|
|
452
|
+
def _build_premium_prompt(self, base_task: str, failure_context: dict[str, Any] | None) -> str:
|
|
453
|
+
"""Build comprehensive prompt for premium tier.
|
|
454
|
+
|
|
455
|
+
Args:
|
|
456
|
+
base_task: Task description
|
|
457
|
+
failure_context: Context from previous tiers
|
|
458
|
+
|
|
459
|
+
Returns:
|
|
460
|
+
XML-enhanced prompt with full escalation context
|
|
461
|
+
"""
|
|
462
|
+
if not failure_context:
|
|
463
|
+
return f"""<task>
|
|
464
|
+
<objective>{base_task}</objective>
|
|
465
|
+
|
|
466
|
+
<quality_requirements>
|
|
467
|
+
<pass_rate>95%+</pass_rate>
|
|
468
|
+
<coverage>85%+</coverage>
|
|
469
|
+
<quality_score>95+</quality_score>
|
|
470
|
+
</quality_requirements>
|
|
471
|
+
|
|
472
|
+
<expert_instructions>
|
|
473
|
+
Apply expert-level techniques to generate exceptional output.
|
|
474
|
+
This is the highest tier - excellence is expected.
|
|
475
|
+
</expert_instructions>
|
|
476
|
+
</task>"""
|
|
477
|
+
|
|
478
|
+
# Extract comprehensive escalation context
|
|
479
|
+
previous_tier = failure_context.get("previous_tier", Tier.CAPABLE)
|
|
480
|
+
previous_cqs = failure_context.get("previous_cqs", 0)
|
|
481
|
+
reason = failure_context.get("reason", "Previous tier unsuccessful")
|
|
482
|
+
failures = failure_context.get("failures", [])
|
|
483
|
+
examples = failure_context.get("examples", [])
|
|
484
|
+
|
|
485
|
+
# Analyze persistent failure patterns
|
|
486
|
+
failure_patterns = self.analyze_failure_patterns(failures) if failures else {}
|
|
487
|
+
|
|
488
|
+
prompt_parts = [
|
|
489
|
+
"<task>",
|
|
490
|
+
f" <objective>{base_task}</objective>",
|
|
491
|
+
"",
|
|
492
|
+
" <escalation_context>",
|
|
493
|
+
f" <previous_tier>{previous_tier.value}</previous_tier>",
|
|
494
|
+
f" <quality_score>{previous_cqs:.1f}</quality_score>",
|
|
495
|
+
f" <escalation_reason>{self._escape_xml(reason)}</escalation_reason>",
|
|
496
|
+
"",
|
|
497
|
+
" <progression_analysis>",
|
|
498
|
+
" This task has been escalated through multiple tiers:",
|
|
499
|
+
" 1. CHEAP tier: Initial attempt with basic models",
|
|
500
|
+
" 2. CAPABLE tier: Enhanced attempt with better models",
|
|
501
|
+
" 3. PREMIUM tier (current): Final expert-level attempt",
|
|
502
|
+
"",
|
|
503
|
+
" The fact that this reached premium tier indicates a complex",
|
|
504
|
+
" or difficult case requiring expert-level handling.",
|
|
505
|
+
" </progression_analysis>",
|
|
506
|
+
"",
|
|
507
|
+
]
|
|
508
|
+
|
|
509
|
+
# Add detailed failure analysis
|
|
510
|
+
if failure_patterns:
|
|
511
|
+
prompt_parts.append(" <persistent_issues>")
|
|
512
|
+
prompt_parts.append(
|
|
513
|
+
f" <total_failures>{failure_patterns.get('total_failures', 0)}</total_failures>"
|
|
514
|
+
)
|
|
515
|
+
prompt_parts.append(" <failure_patterns>")
|
|
516
|
+
|
|
517
|
+
error_types = failure_patterns.get("error_types", {})
|
|
518
|
+
for error_type, count in sorted(error_types.items(), key=lambda x: -x[1]):
|
|
519
|
+
prompt_parts.append(f' <pattern type="{error_type}" count="{count}">')
|
|
520
|
+
|
|
521
|
+
# Add specific guidance per error type
|
|
522
|
+
if error_type == "async_errors":
|
|
523
|
+
prompt_parts.append(
|
|
524
|
+
" <guidance>Use proper async/await patterns, handle timeouts correctly</guidance>"
|
|
525
|
+
)
|
|
526
|
+
elif error_type == "mocking_errors":
|
|
527
|
+
prompt_parts.append(
|
|
528
|
+
" <guidance>Ensure mocks are properly configured and reset</guidance>"
|
|
529
|
+
)
|
|
530
|
+
elif error_type == "syntax_errors":
|
|
531
|
+
prompt_parts.append(
|
|
532
|
+
" <guidance>Double-check syntax, imports, and type annotations</guidance>"
|
|
533
|
+
)
|
|
534
|
+
|
|
535
|
+
prompt_parts.append(" </pattern>")
|
|
536
|
+
|
|
537
|
+
prompt_parts.append(" </failure_patterns>")
|
|
538
|
+
prompt_parts.append(
|
|
539
|
+
f" <primary_issue>{failure_patterns.get('primary_issue', 'unknown')}</primary_issue>"
|
|
540
|
+
)
|
|
541
|
+
prompt_parts.append(" </persistent_issues>")
|
|
542
|
+
prompt_parts.append("")
|
|
543
|
+
|
|
544
|
+
# Add concrete examples from capable tier
|
|
545
|
+
if examples:
|
|
546
|
+
prompt_parts.append(" <capable_tier_attempts>")
|
|
547
|
+
prompt_parts.append(" <!-- Examples from the capable tier's attempts -->")
|
|
548
|
+
|
|
549
|
+
for i, example in enumerate(examples[:3], 1):
|
|
550
|
+
error = example.get("error", "Unknown error")
|
|
551
|
+
code_snippet = example.get("code", "")[:300] # More context for premium
|
|
552
|
+
quality_score = example.get("quality_score", 0)
|
|
553
|
+
|
|
554
|
+
prompt_parts.append(f' <attempt number="{i}" quality_score="{quality_score}">')
|
|
555
|
+
prompt_parts.append(f" <error>{self._escape_xml(error)}</error>")
|
|
556
|
+
if code_snippet:
|
|
557
|
+
prompt_parts.append(
|
|
558
|
+
f" <code_snippet>{self._escape_xml(code_snippet)}</code_snippet>"
|
|
559
|
+
)
|
|
560
|
+
prompt_parts.append(" </attempt>")
|
|
561
|
+
|
|
562
|
+
prompt_parts.append(" </capable_tier_attempts>")
|
|
563
|
+
prompt_parts.append("")
|
|
564
|
+
|
|
565
|
+
prompt_parts.extend(
|
|
566
|
+
[
|
|
567
|
+
" </escalation_context>",
|
|
568
|
+
"",
|
|
569
|
+
" <expert_task>",
|
|
570
|
+
" <critical_notice>",
|
|
571
|
+
" You are the FINAL tier in the progressive escalation system.",
|
|
572
|
+
" Previous tiers (cheap and capable) have attempted this task",
|
|
573
|
+
" multiple times and could not achieve the required quality.",
|
|
574
|
+
"",
|
|
575
|
+
" This is the last automated attempt before human review.",
|
|
576
|
+
" Excellence is not optional - it is required.",
|
|
577
|
+
" </critical_notice>",
|
|
578
|
+
"",
|
|
579
|
+
" <expert_techniques>",
|
|
580
|
+
" Apply sophisticated approaches:",
|
|
581
|
+
" - Deep analysis of why previous attempts failed",
|
|
582
|
+
" - Production-grade error handling and edge cases",
|
|
583
|
+
" - Comprehensive documentation and clarity",
|
|
584
|
+
" - Defensive programming against subtle bugs",
|
|
585
|
+
]
|
|
586
|
+
)
|
|
587
|
+
|
|
588
|
+
# Add specific techniques based on failure patterns
|
|
589
|
+
if failure_patterns:
|
|
590
|
+
error_types = failure_patterns.get("error_types", {})
|
|
591
|
+
if "async_errors" in error_types:
|
|
592
|
+
prompt_parts.append(
|
|
593
|
+
" - Advanced async patterns (asyncio.gather, proper timeouts)"
|
|
594
|
+
)
|
|
595
|
+
if "mocking_errors" in error_types:
|
|
596
|
+
prompt_parts.append(
|
|
597
|
+
" - Sophisticated mocking (pytest fixtures, proper lifecycle)"
|
|
598
|
+
)
|
|
599
|
+
if "syntax_errors" in error_types:
|
|
600
|
+
prompt_parts.append(" - Rigorous syntax validation before submission")
|
|
601
|
+
|
|
602
|
+
prompt_parts.extend(
|
|
603
|
+
[
|
|
604
|
+
" </expert_techniques>",
|
|
605
|
+
"",
|
|
606
|
+
" <quality_requirements>",
|
|
607
|
+
" <pass_rate>95%+</pass_rate>",
|
|
608
|
+
" <coverage>85%+</coverage>",
|
|
609
|
+
" <quality_score>95+</quality_score>",
|
|
610
|
+
" <zero_syntax_errors>MANDATORY</zero_syntax_errors>",
|
|
611
|
+
" </quality_requirements>",
|
|
612
|
+
"",
|
|
613
|
+
" <success_criteria>",
|
|
614
|
+
" Your implementation must:",
|
|
615
|
+
" 1. Address ALL failure patterns identified above",
|
|
616
|
+
" 2. Achieve exceptional quality scores (95+)",
|
|
617
|
+
" 3. Have zero syntax errors or runtime failures",
|
|
618
|
+
" 4. Include comprehensive edge case coverage",
|
|
619
|
+
" 5. Be production-ready with proper documentation",
|
|
620
|
+
" </success_criteria>",
|
|
621
|
+
" </expert_task>",
|
|
622
|
+
"</task>",
|
|
623
|
+
]
|
|
624
|
+
)
|
|
625
|
+
|
|
626
|
+
return "\n".join(prompt_parts)
|
|
627
|
+
|
|
628
|
+
def _escape_xml(self, text: str) -> str:
|
|
629
|
+
"""Escape special XML characters.
|
|
630
|
+
|
|
631
|
+
Args:
|
|
632
|
+
text: Text to escape
|
|
633
|
+
|
|
634
|
+
Returns:
|
|
635
|
+
XML-safe text
|
|
636
|
+
|
|
637
|
+
Example:
|
|
638
|
+
>>> orchestrator._escape_xml("Error: <missing>")
|
|
639
|
+
'Error: <missing>'
|
|
640
|
+
"""
|
|
641
|
+
return (
|
|
642
|
+
text.replace("&", "&")
|
|
643
|
+
.replace("<", "<")
|
|
644
|
+
.replace(">", ">")
|
|
645
|
+
.replace('"', """)
|
|
646
|
+
.replace("'", "'")
|
|
647
|
+
)
|
|
648
|
+
|
|
649
|
+
def create_agent_team(
    self, tier: Tier, failure_context: dict[str, Any] | None = None
) -> list[str]:
    """Return the agent type names that make up the team for ``tier``.

    The team grows with the tier:
    - CHEAP: Single generator agent
    - CAPABLE: Generator + Analyzer
    - PREMIUM (any other value): Generator + Analyzer + Reviewer

    Args:
        tier: Which tier
        failure_context: Context from previous tier (not consulted by the
            current implementation)

    Returns:
        List of agent types to create

    Note:
        Only agent type names are returned; no agent objects are
        created here.

    Example:
        >>> agents = orchestrator.create_agent_team(
        ...     Tier.CAPABLE,
        ...     failure_context={...}
        ... )
        >>> # ["generator", "analyzer"]
    """
    team = ["generator"]
    if tier == Tier.CHEAP:
        return team

    team.append("analyzer")
    if tier == Tier.CAPABLE:
        return team

    # Anything else is treated as PREMIUM.
    team.append("reviewer")
    return team
|
|
683
|
+
|
|
684
|
+
def analyze_failure_patterns(self, failures: list[dict[str, Any]]) -> dict[str, Any]:
    """Analyze failure patterns to inform next tier.

    Each failure is assigned to exactly one category by case-insensitive
    substring match on its ``error`` value, checked in this order:
    "async"/"await" -> ``async_errors``, "mock" -> ``mocking_errors``,
    "syntax" -> ``syntax_errors``, anything else -> ``other_errors``.
    A missing ``error`` key is treated as "unknown"; non-string values
    (for example ``None`` or an exception object) are converted with
    ``str()`` before matching.

    Args:
        failures: List of failed items with error details

    Returns:
        Dict with three keys: ``total_failures`` (number of items),
        ``error_types`` (category name -> count; only categories that
        occurred are present) and ``primary_issue`` (the most frequent
        category, the first one encountered on ties, or "unknown" when
        ``failures`` is empty).

    Example:
        >>> orchestrator.analyze_failure_patterns(
        ...     [{"error": "SyntaxError: async"}, {"error": "Mock not called"}]
        ... )
        {'total_failures': 2, 'error_types': {'async_errors': 1, 'mocking_errors': 1}, 'primary_issue': 'async_errors'}
    """
    # Group by error type
    error_types: dict[str, int] = {}

    for failure in failures:
        # Normalize once: tolerate non-string error values and avoid
        # lower-casing the same message for every category check.
        message = str(failure.get("error", "unknown")).lower()

        # Categorize error; the order of checks decides ties between keywords
        if "async" in message or "await" in message:
            category = "async_errors"
        elif "mock" in message:
            category = "mocking_errors"
        elif "syntax" in message:
            category = "syntax_errors"
        else:
            category = "other_errors"

        error_types[category] = error_types.get(category, 0) + 1

    # max() returns the first maximal key in insertion order, so ties go
    # to the category that was seen first.
    primary_issue = max(error_types, key=error_types.get) if error_types else "unknown"

    return {
        "total_failures": len(failures),
        "error_types": error_types,
        "primary_issue": primary_issue,
    }
|