PyPI - kubiya-control-plane-api - Versions diffs - 0.9.15__py3-none-any.whl - Mend

kubiya-control-plane-api 0.9.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (479) hide show

control_plane_api/LICENSE +676 -0
control_plane_api/README.md +350 -0
control_plane_api/__init__.py +4 -0
control_plane_api/__version__.py +8 -0
control_plane_api/alembic/README +1 -0
control_plane_api/alembic/env.py +121 -0
control_plane_api/alembic/script.py.mako +28 -0
control_plane_api/alembic/versions/2613c65c3dbe_initial_database_setup.py +32 -0
control_plane_api/alembic/versions/2df520d4927d_merge_heads.py +28 -0
control_plane_api/alembic/versions/43abf98d6a01_add_paused_status_to_executions.py +73 -0
control_plane_api/alembic/versions/6289854264cb_merge_multiple_heads.py +28 -0
control_plane_api/alembic/versions/6a4d4dc3d8dc_generate_execution_transitions.py +50 -0
control_plane_api/alembic/versions/87d11cf0a783_add_disconnected_status_to_worker_.py +44 -0
control_plane_api/alembic/versions/add_ephemeral_queue_support.py +85 -0
control_plane_api/alembic/versions/add_model_type_to_llm_models.py +31 -0
control_plane_api/alembic/versions/add_plan_executions_table.py +114 -0
control_plane_api/alembic/versions/add_trace_span_tables.py +154 -0
control_plane_api/alembic/versions/add_user_info_to_traces.py +36 -0
control_plane_api/alembic/versions/adjusting_foreign_keys.py +32 -0
control_plane_api/alembic/versions/b4983d976db2_initial_tables.py +1128 -0
control_plane_api/alembic/versions/d181a3b40e71_rename_custom_metadata_to_metadata_in_.py +50 -0
control_plane_api/alembic/versions/df9117888e82_add_missing_columns.py +82 -0
control_plane_api/alembic/versions/f25de6ad895a_missing_migrations.py +34 -0
control_plane_api/alembic/versions/f71305fb69b9_fix_ephemeral_queue_deletion_foreign_key.py +54 -0
control_plane_api/alembic/versions/mark_local_exec_queues_as_ephemeral.py +68 -0
control_plane_api/alembic.ini +148 -0
control_plane_api/api/index.py +12 -0
control_plane_api/app/__init__.py +11 -0
control_plane_api/app/activities/__init__.py +20 -0
control_plane_api/app/activities/agent_activities.py +384 -0
control_plane_api/app/activities/plan_generation_activities.py +499 -0
control_plane_api/app/activities/team_activities.py +424 -0
control_plane_api/app/activities/temporal_cloud_activities.py +588 -0
control_plane_api/app/config/__init__.py +35 -0
control_plane_api/app/config/api_config.py +469 -0
control_plane_api/app/config/config_loader.py +224 -0
control_plane_api/app/config/model_pricing.py +323 -0
control_plane_api/app/config/storage_config.py +159 -0
control_plane_api/app/config.py +115 -0
control_plane_api/app/controllers/__init__.py +0 -0
control_plane_api/app/controllers/execution_environment_controller.py +1315 -0
control_plane_api/app/database.py +135 -0
control_plane_api/app/exceptions.py +408 -0
control_plane_api/app/lib/__init__.py +11 -0
control_plane_api/app/lib/environment.py +65 -0
control_plane_api/app/lib/event_bus/__init__.py +17 -0
control_plane_api/app/lib/event_bus/base.py +136 -0
control_plane_api/app/lib/event_bus/manager.py +335 -0
control_plane_api/app/lib/event_bus/providers/__init__.py +6 -0
control_plane_api/app/lib/event_bus/providers/http_provider.py +166 -0
control_plane_api/app/lib/event_bus/providers/nats_provider.py +324 -0
control_plane_api/app/lib/event_bus/providers/redis_provider.py +233 -0
control_plane_api/app/lib/event_bus/providers/websocket_provider.py +497 -0
control_plane_api/app/lib/job_executor.py +330 -0
control_plane_api/app/lib/kubiya_client.py +293 -0
control_plane_api/app/lib/litellm_pricing.py +166 -0
control_plane_api/app/lib/mcp_validation.py +163 -0
control_plane_api/app/lib/nats/__init__.py +13 -0
control_plane_api/app/lib/nats/credentials_manager.py +288 -0
control_plane_api/app/lib/nats/listener.py +374 -0
control_plane_api/app/lib/planning_prompt_builder.py +153 -0
control_plane_api/app/lib/planning_tools/__init__.py +41 -0
control_plane_api/app/lib/planning_tools/agents.py +409 -0
control_plane_api/app/lib/planning_tools/agno_toolkit.py +836 -0
control_plane_api/app/lib/planning_tools/base.py +119 -0
control_plane_api/app/lib/planning_tools/cognitive_memory_tools.py +403 -0
control_plane_api/app/lib/planning_tools/context_graph_tools.py +545 -0
control_plane_api/app/lib/planning_tools/environments.py +218 -0
control_plane_api/app/lib/planning_tools/knowledge.py +204 -0
control_plane_api/app/lib/planning_tools/models.py +93 -0
control_plane_api/app/lib/planning_tools/planning_service.py +646 -0
control_plane_api/app/lib/planning_tools/resources.py +242 -0
control_plane_api/app/lib/planning_tools/teams.py +334 -0
control_plane_api/app/lib/policy_enforcer_client.py +1016 -0
control_plane_api/app/lib/redis_client.py +803 -0
control_plane_api/app/lib/sqlalchemy_utils.py +486 -0
control_plane_api/app/lib/state_transition_tools/__init__.py +7 -0
control_plane_api/app/lib/state_transition_tools/execution_context.py +388 -0
control_plane_api/app/lib/storage/__init__.py +20 -0
control_plane_api/app/lib/storage/base_provider.py +274 -0
control_plane_api/app/lib/storage/provider_factory.py +157 -0
control_plane_api/app/lib/storage/vercel_blob_provider.py +468 -0
control_plane_api/app/lib/supabase.py +71 -0
control_plane_api/app/lib/supabase_utils.py +138 -0
control_plane_api/app/lib/task_planning/__init__.py +138 -0
control_plane_api/app/lib/task_planning/agent_factory.py +308 -0
control_plane_api/app/lib/task_planning/agents.py +389 -0
control_plane_api/app/lib/task_planning/cache.py +218 -0
control_plane_api/app/lib/task_planning/entity_resolver.py +273 -0
control_plane_api/app/lib/task_planning/helpers.py +293 -0
control_plane_api/app/lib/task_planning/hooks.py +474 -0
control_plane_api/app/lib/task_planning/models.py +503 -0
control_plane_api/app/lib/task_planning/plan_validator.py +166 -0
control_plane_api/app/lib/task_planning/planning_workflow.py +2911 -0
control_plane_api/app/lib/task_planning/runner.py +656 -0
control_plane_api/app/lib/task_planning/streaming_hook.py +213 -0
control_plane_api/app/lib/task_planning/workflow.py +424 -0
control_plane_api/app/lib/templating/__init__.py +88 -0
control_plane_api/app/lib/templating/compiler.py +278 -0
control_plane_api/app/lib/templating/engine.py +178 -0
control_plane_api/app/lib/templating/parsers/__init__.py +29 -0
control_plane_api/app/lib/templating/parsers/base.py +96 -0
control_plane_api/app/lib/templating/parsers/env.py +85 -0
control_plane_api/app/lib/templating/parsers/graph.py +112 -0
control_plane_api/app/lib/templating/parsers/secret.py +87 -0
control_plane_api/app/lib/templating/parsers/simple.py +81 -0
control_plane_api/app/lib/templating/resolver.py +366 -0
control_plane_api/app/lib/templating/types.py +214 -0
control_plane_api/app/lib/templating/validator.py +201 -0
control_plane_api/app/lib/temporal_client.py +232 -0
control_plane_api/app/lib/temporal_credentials_cache.py +178 -0
control_plane_api/app/lib/temporal_credentials_service.py +203 -0
control_plane_api/app/lib/validation/__init__.py +24 -0
control_plane_api/app/lib/validation/runtime_validation.py +388 -0
control_plane_api/app/main.py +531 -0
control_plane_api/app/middleware/__init__.py +10 -0
control_plane_api/app/middleware/auth.py +645 -0
control_plane_api/app/middleware/exception_handler.py +267 -0
control_plane_api/app/middleware/prometheus_middleware.py +173 -0
control_plane_api/app/middleware/rate_limiting.py +384 -0
control_plane_api/app/middleware/request_id.py +202 -0
control_plane_api/app/models/__init__.py +40 -0
control_plane_api/app/models/agent.py +90 -0
control_plane_api/app/models/analytics.py +206 -0
control_plane_api/app/models/associations.py +107 -0
control_plane_api/app/models/auth_user.py +73 -0
control_plane_api/app/models/context.py +161 -0
control_plane_api/app/models/custom_integration.py +99 -0
control_plane_api/app/models/environment.py +64 -0
control_plane_api/app/models/execution.py +125 -0
control_plane_api/app/models/execution_transition.py +50 -0
control_plane_api/app/models/job.py +159 -0
control_plane_api/app/models/llm_model.py +78 -0
control_plane_api/app/models/orchestration.py +66 -0
control_plane_api/app/models/plan_execution.py +102 -0
control_plane_api/app/models/presence.py +49 -0
control_plane_api/app/models/project.py +61 -0
control_plane_api/app/models/project_management.py +85 -0
control_plane_api/app/models/session.py +29 -0
control_plane_api/app/models/skill.py +155 -0
control_plane_api/app/models/system_tables.py +43 -0
control_plane_api/app/models/task_planning.py +372 -0
control_plane_api/app/models/team.py +86 -0
control_plane_api/app/models/trace.py +257 -0
control_plane_api/app/models/user_profile.py +54 -0
control_plane_api/app/models/worker.py +221 -0
control_plane_api/app/models/workflow.py +161 -0
control_plane_api/app/models/workspace.py +50 -0
control_plane_api/app/observability/__init__.py +177 -0
control_plane_api/app/observability/context_logging.py +475 -0
control_plane_api/app/observability/decorators.py +337 -0
control_plane_api/app/observability/local_span_processor.py +702 -0
control_plane_api/app/observability/metrics.py +303 -0
control_plane_api/app/observability/middleware.py +246 -0
control_plane_api/app/observability/optional.py +115 -0
control_plane_api/app/observability/tracing.py +382 -0
control_plane_api/app/policies/README.md +149 -0
control_plane_api/app/policies/approved_users.rego +62 -0
control_plane_api/app/policies/business_hours.rego +51 -0
control_plane_api/app/policies/rate_limiting.rego +100 -0
control_plane_api/app/policies/tool_enforcement/README.md +336 -0
control_plane_api/app/policies/tool_enforcement/bash_command_validation.rego +71 -0
control_plane_api/app/policies/tool_enforcement/business_hours_enforcement.rego +82 -0
control_plane_api/app/policies/tool_enforcement/mcp_tool_allowlist.rego +58 -0
control_plane_api/app/policies/tool_enforcement/production_safeguards.rego +80 -0
control_plane_api/app/policies/tool_enforcement/role_based_tool_access.rego +44 -0
control_plane_api/app/policies/tool_restrictions.rego +86 -0
control_plane_api/app/routers/__init__.py +4 -0
control_plane_api/app/routers/agents.py +382 -0
control_plane_api/app/routers/agents_v2.py +1598 -0
control_plane_api/app/routers/analytics.py +1310 -0
control_plane_api/app/routers/auth.py +59 -0
control_plane_api/app/routers/client_config.py +57 -0
control_plane_api/app/routers/context_graph.py +561 -0
control_plane_api/app/routers/context_manager.py +577 -0
control_plane_api/app/routers/custom_integrations.py +490 -0
control_plane_api/app/routers/enforcer.py +132 -0
control_plane_api/app/routers/environment_context.py +252 -0
control_plane_api/app/routers/environments.py +761 -0
control_plane_api/app/routers/execution_environment.py +847 -0
control_plane_api/app/routers/executions/__init__.py +28 -0
control_plane_api/app/routers/executions/router.py +286 -0
control_plane_api/app/routers/executions/services/__init__.py +22 -0
control_plane_api/app/routers/executions/services/demo_worker_health.py +156 -0
control_plane_api/app/routers/executions/services/status_service.py +420 -0
control_plane_api/app/routers/executions/services/test_worker_health.py +480 -0
control_plane_api/app/routers/executions/services/worker_health.py +514 -0
control_plane_api/app/routers/executions/streaming/__init__.py +22 -0
control_plane_api/app/routers/executions/streaming/deduplication.py +352 -0
control_plane_api/app/routers/executions/streaming/event_buffer.py +353 -0
control_plane_api/app/routers/executions/streaming/event_formatter.py +964 -0
control_plane_api/app/routers/executions/streaming/history_loader.py +588 -0
control_plane_api/app/routers/executions/streaming/live_source.py +693 -0
control_plane_api/app/routers/executions/streaming/streamer.py +849 -0
control_plane_api/app/routers/executions.py +4888 -0
control_plane_api/app/routers/health.py +165 -0
control_plane_api/app/routers/health_v2.py +394 -0
control_plane_api/app/routers/integration_templates.py +496 -0
control_plane_api/app/routers/integrations.py +287 -0
control_plane_api/app/routers/jobs.py +1809 -0
control_plane_api/app/routers/metrics.py +517 -0
control_plane_api/app/routers/models.py +82 -0
control_plane_api/app/routers/models_v2.py +628 -0
control_plane_api/app/routers/plan_executions.py +1481 -0
control_plane_api/app/routers/plan_generation_async.py +304 -0
control_plane_api/app/routers/policies.py +669 -0
control_plane_api/app/routers/presence.py +234 -0
control_plane_api/app/routers/projects.py +987 -0
control_plane_api/app/routers/runners.py +379 -0
control_plane_api/app/routers/runtimes.py +172 -0
control_plane_api/app/routers/secrets.py +171 -0
control_plane_api/app/routers/skills.py +1010 -0
control_plane_api/app/routers/skills_definitions.py +140 -0
control_plane_api/app/routers/storage.py +456 -0
control_plane_api/app/routers/task_planning.py +611 -0
control_plane_api/app/routers/task_queues.py +650 -0
control_plane_api/app/routers/team_context.py +274 -0
control_plane_api/app/routers/teams.py +1747 -0
control_plane_api/app/routers/templates.py +248 -0
control_plane_api/app/routers/traces.py +571 -0
control_plane_api/app/routers/websocket_client.py +479 -0
control_plane_api/app/routers/websocket_executions_status.py +437 -0
control_plane_api/app/routers/websocket_gateway.py +323 -0
control_plane_api/app/routers/websocket_traces.py +576 -0
control_plane_api/app/routers/worker_queues.py +2555 -0
control_plane_api/app/routers/worker_websocket.py +419 -0
control_plane_api/app/routers/workers.py +1004 -0
control_plane_api/app/routers/workflows.py +204 -0
control_plane_api/app/runtimes/__init__.py +6 -0
control_plane_api/app/runtimes/validation.py +344 -0
control_plane_api/app/schemas/__init__.py +1 -0
control_plane_api/app/schemas/job_schemas.py +302 -0
control_plane_api/app/schemas/mcp_schemas.py +311 -0
control_plane_api/app/schemas/template_schemas.py +133 -0
control_plane_api/app/schemas/trace_schemas.py +168 -0
control_plane_api/app/schemas/worker_queue_observability_schemas.py +165 -0
control_plane_api/app/services/__init__.py +1 -0
control_plane_api/app/services/agno_planning_strategy.py +233 -0
control_plane_api/app/services/agno_service.py +838 -0
control_plane_api/app/services/claude_code_planning_service.py +203 -0
control_plane_api/app/services/context_graph_client.py +224 -0
control_plane_api/app/services/custom_integration_service.py +415 -0
control_plane_api/app/services/integration_resolution_service.py +345 -0
control_plane_api/app/services/litellm_service.py +394 -0
control_plane_api/app/services/plan_generator.py +79 -0
control_plane_api/app/services/planning_strategy.py +66 -0
control_plane_api/app/services/planning_strategy_factory.py +118 -0
control_plane_api/app/services/policy_service.py +615 -0
control_plane_api/app/services/state_transition_service.py +755 -0
control_plane_api/app/services/storage_service.py +593 -0
control_plane_api/app/services/temporal_cloud_provisioning.py +150 -0
control_plane_api/app/services/toolsets/context_graph_skill.py +432 -0
control_plane_api/app/services/trace_retention.py +354 -0
control_plane_api/app/services/worker_queue_metrics_service.py +190 -0
control_plane_api/app/services/workflow_cancellation_manager.py +135 -0
control_plane_api/app/services/workflow_operations_service.py +611 -0
control_plane_api/app/skills/__init__.py +100 -0
control_plane_api/app/skills/base.py +239 -0
control_plane_api/app/skills/builtin/__init__.py +37 -0
control_plane_api/app/skills/builtin/agent_communication/__init__.py +8 -0
control_plane_api/app/skills/builtin/agent_communication/skill.py +246 -0
control_plane_api/app/skills/builtin/code_ingestion/__init__.py +4 -0
control_plane_api/app/skills/builtin/code_ingestion/skill.py +267 -0
control_plane_api/app/skills/builtin/cognitive_memory/__init__.py +4 -0
control_plane_api/app/skills/builtin/cognitive_memory/skill.py +174 -0
control_plane_api/app/skills/builtin/contextual_awareness/__init__.py +4 -0
control_plane_api/app/skills/builtin/contextual_awareness/skill.py +387 -0
control_plane_api/app/skills/builtin/data_visualization/__init__.py +4 -0
control_plane_api/app/skills/builtin/data_visualization/skill.py +154 -0
control_plane_api/app/skills/builtin/docker/__init__.py +4 -0
control_plane_api/app/skills/builtin/docker/skill.py +104 -0
control_plane_api/app/skills/builtin/file_generation/__init__.py +4 -0
control_plane_api/app/skills/builtin/file_generation/skill.py +94 -0
control_plane_api/app/skills/builtin/file_system/__init__.py +4 -0
control_plane_api/app/skills/builtin/file_system/skill.py +110 -0
control_plane_api/app/skills/builtin/knowledge_api/__init__.py +5 -0
control_plane_api/app/skills/builtin/knowledge_api/skill.py +124 -0
control_plane_api/app/skills/builtin/python/__init__.py +4 -0
control_plane_api/app/skills/builtin/python/skill.py +92 -0
control_plane_api/app/skills/builtin/remote_filesystem/__init__.py +5 -0
control_plane_api/app/skills/builtin/remote_filesystem/skill.py +170 -0
control_plane_api/app/skills/builtin/shell/__init__.py +4 -0
control_plane_api/app/skills/builtin/shell/skill.py +161 -0
control_plane_api/app/skills/builtin/slack/__init__.py +3 -0
control_plane_api/app/skills/builtin/slack/skill.py +302 -0
control_plane_api/app/skills/builtin/workflow_executor/__init__.py +4 -0
control_plane_api/app/skills/builtin/workflow_executor/skill.py +469 -0
control_plane_api/app/skills/business_intelligence.py +189 -0
control_plane_api/app/skills/config.py +63 -0
control_plane_api/app/skills/loaders/__init__.py +14 -0
control_plane_api/app/skills/loaders/base.py +73 -0
control_plane_api/app/skills/loaders/filesystem_loader.py +199 -0
control_plane_api/app/skills/registry.py +125 -0
control_plane_api/app/utils/helpers.py +12 -0
control_plane_api/app/utils/workflow_executor.py +354 -0
control_plane_api/app/workflows/__init__.py +11 -0
control_plane_api/app/workflows/agent_execution.py +520 -0
control_plane_api/app/workflows/agent_execution_with_skills.py +223 -0
control_plane_api/app/workflows/namespace_provisioning.py +326 -0
control_plane_api/app/workflows/plan_generation.py +254 -0
control_plane_api/app/workflows/team_execution.py +442 -0
control_plane_api/scripts/seed_models.py +240 -0
control_plane_api/scripts/validate_existing_tool_names.py +492 -0
control_plane_api/shared/__init__.py +8 -0
control_plane_api/shared/version.py +17 -0
control_plane_api/test_deduplication.py +274 -0
control_plane_api/test_executor_deduplication_e2e.py +309 -0
control_plane_api/test_job_execution_e2e.py +283 -0
control_plane_api/test_real_integration.py +193 -0
control_plane_api/version.py +38 -0
control_plane_api/worker/__init__.py +0 -0
control_plane_api/worker/activities/__init__.py +0 -0
control_plane_api/worker/activities/agent_activities.py +1585 -0
control_plane_api/worker/activities/approval_activities.py +234 -0
control_plane_api/worker/activities/job_activities.py +199 -0
control_plane_api/worker/activities/runtime_activities.py +1167 -0
control_plane_api/worker/activities/skill_activities.py +282 -0
control_plane_api/worker/activities/team_activities.py +479 -0
control_plane_api/worker/agent_runtime_server.py +370 -0
control_plane_api/worker/binary_manager.py +333 -0
control_plane_api/worker/config/__init__.py +31 -0
control_plane_api/worker/config/worker_config.py +273 -0
control_plane_api/worker/control_plane_client.py +1491 -0
control_plane_api/worker/examples/analytics_integration_example.py +362 -0
control_plane_api/worker/health_monitor.py +159 -0
control_plane_api/worker/metrics.py +237 -0
control_plane_api/worker/models/__init__.py +1 -0
control_plane_api/worker/models/error_events.py +105 -0
control_plane_api/worker/models/inputs.py +89 -0
control_plane_api/worker/runtimes/__init__.py +35 -0
control_plane_api/worker/runtimes/agent_runtime/runtime.py +485 -0
control_plane_api/worker/runtimes/agno/__init__.py +34 -0
control_plane_api/worker/runtimes/agno/config.py +248 -0
control_plane_api/worker/runtimes/agno/hooks.py +385 -0
control_plane_api/worker/runtimes/agno/mcp_builder.py +195 -0
control_plane_api/worker/runtimes/agno/runtime.py +1063 -0
control_plane_api/worker/runtimes/agno/utils.py +163 -0
control_plane_api/worker/runtimes/base.py +979 -0
control_plane_api/worker/runtimes/claude_code/__init__.py +38 -0
control_plane_api/worker/runtimes/claude_code/cleanup.py +184 -0
control_plane_api/worker/runtimes/claude_code/client_pool.py +529 -0
control_plane_api/worker/runtimes/claude_code/config.py +829 -0
control_plane_api/worker/runtimes/claude_code/hooks.py +482 -0
control_plane_api/worker/runtimes/claude_code/litellm_proxy.py +1702 -0
control_plane_api/worker/runtimes/claude_code/mcp_builder.py +467 -0
control_plane_api/worker/runtimes/claude_code/mcp_discovery.py +558 -0
control_plane_api/worker/runtimes/claude_code/runtime.py +1546 -0
control_plane_api/worker/runtimes/claude_code/tool_mapper.py +403 -0
control_plane_api/worker/runtimes/claude_code/utils.py +149 -0
control_plane_api/worker/runtimes/factory.py +173 -0
control_plane_api/worker/runtimes/model_utils.py +107 -0
control_plane_api/worker/runtimes/validation.py +93 -0
control_plane_api/worker/services/__init__.py +1 -0
control_plane_api/worker/services/agent_communication_tools.py +908 -0
control_plane_api/worker/services/agent_executor.py +485 -0
control_plane_api/worker/services/agent_executor_v2.py +793 -0
control_plane_api/worker/services/analytics_collector.py +457 -0
control_plane_api/worker/services/analytics_service.py +464 -0
control_plane_api/worker/services/approval_tools.py +310 -0
control_plane_api/worker/services/approval_tools_agno.py +207 -0
control_plane_api/worker/services/cancellation_manager.py +177 -0
control_plane_api/worker/services/code_ingestion_tools.py +465 -0
control_plane_api/worker/services/contextual_awareness_tools.py +405 -0
control_plane_api/worker/services/data_visualization.py +834 -0
control_plane_api/worker/services/event_publisher.py +531 -0
control_plane_api/worker/services/jira_tools.py +257 -0
control_plane_api/worker/services/remote_filesystem_tools.py +498 -0
control_plane_api/worker/services/runtime_analytics.py +328 -0
control_plane_api/worker/services/session_service.py +365 -0
control_plane_api/worker/services/skill_context_enhancement.py +181 -0
control_plane_api/worker/services/skill_factory.py +471 -0
control_plane_api/worker/services/system_prompt_enhancement.py +410 -0
control_plane_api/worker/services/team_executor.py +715 -0
control_plane_api/worker/services/team_executor_v2.py +1866 -0
control_plane_api/worker/services/tool_enforcement.py +254 -0
control_plane_api/worker/services/workflow_executor/__init__.py +52 -0
control_plane_api/worker/services/workflow_executor/event_processor.py +287 -0
control_plane_api/worker/services/workflow_executor/event_publisher.py +210 -0
control_plane_api/worker/services/workflow_executor/executors/__init__.py +15 -0
control_plane_api/worker/services/workflow_executor/executors/base.py +270 -0
control_plane_api/worker/services/workflow_executor/executors/json_executor.py +50 -0
control_plane_api/worker/services/workflow_executor/executors/python_executor.py +50 -0
control_plane_api/worker/services/workflow_executor/models.py +142 -0
control_plane_api/worker/services/workflow_executor_tools.py +1748 -0
control_plane_api/worker/skills/__init__.py +12 -0
control_plane_api/worker/skills/builtin/context_graph_search/README.md +213 -0
control_plane_api/worker/skills/builtin/context_graph_search/__init__.py +5 -0
control_plane_api/worker/skills/builtin/context_graph_search/agno_impl.py +808 -0
control_plane_api/worker/skills/builtin/context_graph_search/skill.yaml +67 -0
control_plane_api/worker/skills/builtin/contextual_awareness/__init__.py +4 -0
control_plane_api/worker/skills/builtin/contextual_awareness/agno_impl.py +62 -0
control_plane_api/worker/skills/builtin/data_visualization/agno_impl.py +18 -0
control_plane_api/worker/skills/builtin/data_visualization/skill.yaml +84 -0
control_plane_api/worker/skills/builtin/docker/agno_impl.py +65 -0
control_plane_api/worker/skills/builtin/docker/skill.yaml +60 -0
control_plane_api/worker/skills/builtin/file_generation/agno_impl.py +47 -0
control_plane_api/worker/skills/builtin/file_generation/skill.yaml +64 -0
control_plane_api/worker/skills/builtin/file_system/agno_impl.py +32 -0
control_plane_api/worker/skills/builtin/file_system/skill.yaml +54 -0
control_plane_api/worker/skills/builtin/knowledge_api/__init__.py +4 -0
control_plane_api/worker/skills/builtin/knowledge_api/agno_impl.py +50 -0
control_plane_api/worker/skills/builtin/knowledge_api/skill.yaml +66 -0
control_plane_api/worker/skills/builtin/python/agno_impl.py +25 -0
control_plane_api/worker/skills/builtin/python/skill.yaml +60 -0
control_plane_api/worker/skills/builtin/schema_fix_mixin.py +260 -0
control_plane_api/worker/skills/builtin/shell/agno_impl.py +31 -0
control_plane_api/worker/skills/builtin/shell/skill.yaml +60 -0
control_plane_api/worker/skills/builtin/slack/__init__.py +3 -0
control_plane_api/worker/skills/builtin/slack/agno_impl.py +1282 -0
control_plane_api/worker/skills/builtin/slack/skill.yaml +276 -0
control_plane_api/worker/skills/builtin/workflow_executor/agno_impl.py +62 -0
control_plane_api/worker/skills/builtin/workflow_executor/skill.yaml +79 -0
control_plane_api/worker/skills/loaders/__init__.py +5 -0
control_plane_api/worker/skills/loaders/base.py +23 -0
control_plane_api/worker/skills/loaders/filesystem_loader.py +357 -0
control_plane_api/worker/skills/registry.py +208 -0
control_plane_api/worker/tests/__init__.py +1 -0
control_plane_api/worker/tests/conftest.py +12 -0
control_plane_api/worker/tests/e2e/__init__.py +0 -0
control_plane_api/worker/tests/e2e/test_context_graph_real_api.py +338 -0
control_plane_api/worker/tests/e2e/test_context_graph_templates_e2e.py +523 -0
control_plane_api/worker/tests/e2e/test_enforcement_e2e.py +344 -0
control_plane_api/worker/tests/e2e/test_execution_flow.py +571 -0
control_plane_api/worker/tests/e2e/test_single_execution_mode.py +656 -0
control_plane_api/worker/tests/integration/__init__.py +0 -0
control_plane_api/worker/tests/integration/test_builtin_skills_fixes.py +245 -0
control_plane_api/worker/tests/integration/test_context_graph_search_integration.py +365 -0
control_plane_api/worker/tests/integration/test_control_plane_integration.py +308 -0
control_plane_api/worker/tests/integration/test_hook_enforcement_integration.py +579 -0
control_plane_api/worker/tests/integration/test_scheduled_job_workflow.py +237 -0
control_plane_api/worker/tests/integration/test_system_prompt_enhancement_integration.py +343 -0
control_plane_api/worker/tests/unit/__init__.py +0 -0
control_plane_api/worker/tests/unit/test_builtin_skill_autoload.py +396 -0
control_plane_api/worker/tests/unit/test_context_graph_search.py +450 -0
control_plane_api/worker/tests/unit/test_context_graph_templates.py +403 -0
control_plane_api/worker/tests/unit/test_control_plane_client.py +401 -0
control_plane_api/worker/tests/unit/test_control_plane_client_jobs.py +345 -0
control_plane_api/worker/tests/unit/test_job_activities.py +353 -0
control_plane_api/worker/tests/unit/test_skill_context_enhancement.py +321 -0
control_plane_api/worker/tests/unit/test_system_prompt_enhancement.py +415 -0
control_plane_api/worker/tests/unit/test_tool_enforcement.py +324 -0
control_plane_api/worker/utils/__init__.py +1 -0
control_plane_api/worker/utils/chunk_batcher.py +330 -0
control_plane_api/worker/utils/environment.py +65 -0
control_plane_api/worker/utils/error_publisher.py +260 -0
control_plane_api/worker/utils/event_batcher.py +256 -0
control_plane_api/worker/utils/logging_config.py +335 -0
control_plane_api/worker/utils/logging_helper.py +326 -0
control_plane_api/worker/utils/parameter_validator.py +120 -0
control_plane_api/worker/utils/retry_utils.py +60 -0
control_plane_api/worker/utils/streaming_utils.py +665 -0
control_plane_api/worker/utils/tool_validation.py +332 -0
control_plane_api/worker/utils/workspace_manager.py +163 -0
control_plane_api/worker/websocket_client.py +393 -0
control_plane_api/worker/worker.py +1297 -0
control_plane_api/worker/workflows/__init__.py +0 -0
control_plane_api/worker/workflows/agent_execution.py +909 -0
control_plane_api/worker/workflows/scheduled_job_wrapper.py +332 -0
control_plane_api/worker/workflows/team_execution.py +611 -0
kubiya_control_plane_api-0.9.15.dist-info/METADATA +354 -0
kubiya_control_plane_api-0.9.15.dist-info/RECORD +479 -0
kubiya_control_plane_api-0.9.15.dist-info/WHEEL +5 -0
kubiya_control_plane_api-0.9.15.dist-info/entry_points.txt +5 -0
kubiya_control_plane_api-0.9.15.dist-info/licenses/LICENSE +676 -0
kubiya_control_plane_api-0.9.15.dist-info/top_level.txt +3 -0
scripts/__init__.py +1 -0
scripts/migrations.py +39 -0
scripts/seed_worker_queues.py +128 -0
scripts/setup_agent_runtime.py +142 -0
worker_internal/__init__.py +1 -0
worker_internal/planner/__init__.py +1 -0
worker_internal/planner/activities.py +1499 -0
worker_internal/planner/agent_tools.py +197 -0
worker_internal/planner/event_models.py +148 -0
worker_internal/planner/event_publisher.py +67 -0
worker_internal/planner/models.py +199 -0
worker_internal/planner/retry_logic.py +134 -0
worker_internal/planner/worker.py +300 -0
worker_internal/planner/workflows.py +970 -0

control_plane_api/app/services/state_transition_service.py ADDED Viewed

@@ -0,0 +1,755 @@
+"""
+State Transition Service
+Provides intelligent state transition decisions for executions using an Agno AI agent.
+Analyzes execution context and determines the appropriate next state with reasoning.
+"""
+import os
+import time
+import asyncio
+from typing import Dict, Any, Literal, Optional
+from datetime import datetime, timezone
+from pydantic import BaseModel, Field
+import structlog
+from agno.agent import Agent
+from agno.models.litellm import LiteLLM
+from control_plane_api.app.lib.state_transition_tools.execution_context import ExecutionContextTools
+from control_plane_api.app.database import get_db
+from control_plane_api.app.models.execution import Execution
+from control_plane_api.app.models.execution_transition import ExecutionTransition
+from sqlalchemy.orm import Session
+logger = structlog.get_logger()
+class StateTransitionDecision(BaseModel):
+    """
+    Structured output from the state transition AI agent
+    """
+    recommended_state: Literal["running", "waiting_for_input", "completed", "failed"] = Field(
+        description="The recommended state to transition to"
+    )
+    confidence: Literal["low", "medium", "high"] = Field(
+        description="Confidence level in this decision"
+    )
+    reasoning: str = Field(
+        description="Detailed explanation of why this state was chosen"
+    )
+    decision_factors: Dict[str, Any] = Field(
+        description="Key factors that influenced this decision",
+        default_factory=dict
+    )
+    should_continue_automatically: bool = Field(
+        description="Whether the execution should continue without user input",
+        default=False
+    )
+    estimated_user_action_needed: bool = Field(
+        description="Whether user action or input is likely needed",
+        default=False
+    )
+class StateTransitionService:
+    """
+    Service for intelligent state transition decisions using Agno AI agent
+    """
+    def __init__(self, organization_id: Optional[str] = None):
+        """
+        Initialize state transition service
+        Args:
+            organization_id: Organization context for filtering
+        """
+        self.organization_id = organization_id
+        # Get LiteLLM configuration
+        self.litellm_api_url = (
+            os.getenv("LITELLM_API_URL")
+            or os.getenv("LITELLM_API_BASE")
+            or "https://llm-proxy.kubiya.ai"
+        ).strip()
+        self.litellm_api_key = os.getenv("LITELLM_API_KEY", "").strip()
+        if not self.litellm_api_key:
+            raise ValueError("LITELLM_API_KEY environment variable not set")
+        # Get model from env var or use default
+        self.model = os.getenv("STATE_TRANSITION_MODEL", "kubiya/claude-sonnet-4").strip()
+        # Get control plane URL for tools
+        self.control_plane_url = os.getenv("CONTROL_PLANE_API_URL", "http://localhost:8000")
+        logger.info(
+            "state_transition_service_initialized",
+            model=self.model,
+            litellm_api_url=self.litellm_api_url,
+            organization_id=organization_id,
+        )
+    def _create_transition_agent(self) -> Agent:
+        """
+        Create an Agno agent for state transition decisions
+        Returns:
+            Configured Agent instance
+        """
+        # Initialize context tools
+        context_tools = ExecutionContextTools(
+            base_url=self.control_plane_url,
+            organization_id=self.organization_id,
+        )
+        # Create agent with structured output
+        agent = Agent(
+            name="State Transition Analyzer",
+            role="Expert in analyzing execution states and determining optimal transitions",
+            model=LiteLLM(
+                id=f"openai/{self.model}",
+                api_base=self.litellm_api_url,
+                api_key=self.litellm_api_key,
+            ),
+            output_schema=StateTransitionDecision,
+            tools=[context_tools],
+            instructions=[
+                "You are an expert at analyzing execution states and determining optimal state transitions.",
+                "",
+                "**Your Task:**",
+                "Analyze the execution context and recommend the appropriate next state.",
+                "",
+                "**Available States:**",
+                "1. **completed**: Task is fully done",
+                "   - finish_reason = 'stop' or 'end_turn'",
+                "   - Response contains completion signals ('done', 'finished', 'completed', 'success')",
+                "   - No pending tool calls or error conditions",
+                "   - User's intent has been clearly satisfied",
+                "   - No follow-up questions or clarifications needed",
+                "",
+                "2. **waiting_for_input**: Needs user input",
+                "   - Asking questions or clarifications",
+                "   - Ambiguous requirements need resolution",
+                "   - Waiting for approval or feedback",
+                "   - finish_reason = 'stop' but task not fully complete",
+                "   - Agent explicitly asked user for input",
+                "",
+                "3. **failed**: Unrecoverable error",
+                "   - finish_reason = 'error'",
+                "   - Repeated tool failures (>3 consecutive failures)",
+                "   - Error message indicates blocker (auth, permissions, not found)",
+                "   - Cannot proceed without external intervention",
+                "   - Use the check_error_recoverability tool to assess errors",
+                "",
+                "4. **running**: Continue automatically",
+                "   - finish_reason = 'tool_use' (still actively working)",
+                "   - Multi-step task in progress",
+                "   - No user input needed yet",
+                "   - Can make autonomous progress",
+                "   - Agent is gathering information or executing tasks",
+                "",
+                "**Decision Process:**",
+                "1. Use get_execution_details() to understand the execution",
+                "2. Use get_recent_turns() to see the latest activity",
+                "3. Analyze the most recent turn's finish_reason",
+                "4. Check if there are errors with check_error_recoverability()",
+                "5. Review tool call patterns if needed with get_tool_call_patterns()",
+                "6. Make a confident decision based on all context",
+                "",
+                "**Important Guidelines:**",
+                "- Be decisive - don't overthink simple cases",
+                "- finish_reason='stop' usually means waiting_for_input or completed",
+                "- finish_reason='tool_use' usually means running (continue)",
+                "- finish_reason='error' usually means failed (unless recoverable)",
+                "- Look for completion signals in the response text",
+                "- If the agent asked a question, it's usually waiting_for_input",
+                "- If unsure between completed and waiting_for_input, prefer waiting_for_input (safer)",
+                "",
+                "**Output Requirements:**",
+                "- Provide clear, concise reasoning (2-4 sentences)",
+                "- Set confidence based on clarity of signals",
+                "- Include key decision factors (finish_reason, error status, completion signals, etc.)",
+                "- Be specific about why you chose this state",
+            ],
+            markdown=False,
+            add_history_to_context=False,
+            retries=2,
+        )
+        logger.info(
+            "state_transition_agent_created",
+            model=self.model,
+            tools_count=1,
+        )
+        return agent
+    async def analyze_and_transition(
+        self,
+        execution_id: str,
+        turn_number: int,
+        turn_data: Any,
+    ) -> StateTransitionDecision:
+        """
+        Analyze execution context and determine state transition
+        Args:
+            execution_id: The execution ID
+            turn_number: The turn number
+            turn_data: Turn metrics data
+        Returns:
+            StateTransitionDecision with recommendation and reasoning
+        """
+        start_time = time.time()
+        try:
+            logger.info(
+                "analyzing_state_transition",
+                execution_id=execution_id,
+                turn_number=turn_number,
+                finish_reason=turn_data.finish_reason if turn_data else None,
+            )
+            # Create agent
+            agent = self._create_transition_agent()
+            # Build analysis prompt
+            prompt = self._build_analysis_prompt(execution_id, turn_number, turn_data)
+            # Run agent (synchronous run in async wrapper)
+            response = await asyncio.to_thread(agent.run, prompt)
+            # Extract decision from response
+            decision = response.content if isinstance(response.content, StateTransitionDecision) else response.content
+            # Calculate decision time
+            decision_time_ms = int((time.time() - start_time) * 1000)
+            logger.info(
+                "state_transition_decision_made",
+                execution_id=execution_id,
+                turn_number=turn_number,
+                from_state="running",
+                to_state=decision.recommended_state,
+                confidence=decision.confidence,
+                decision_time_ms=decision_time_ms,
+            )
+            # Record transition in database
+            await self._record_transition(
+                execution_id=execution_id,
+                turn_number=turn_number,
+                from_state="running",
+                to_state=decision.recommended_state,
+                decision=decision,
+                decision_time_ms=decision_time_ms,
+            )
+            # Update execution status
+            await self._update_execution_status(
+                execution_id=execution_id,
+                new_status=decision.recommended_state,
+            )
+            return decision
+        except Exception as e:
+            decision_time_ms = int((time.time() - start_time) * 1000)
+            logger.error(
+                "state_transition_analysis_failed",
+                execution_id=execution_id,
+                turn_number=turn_number,
+                error=str(e),
+                decision_time_ms=decision_time_ms,
+            )
+            raise
+    def _build_analysis_prompt(
+        self,
+        execution_id: str,
+        turn_number: int,
+        turn_data: Any,
+    ) -> str:
+        """
+        Build the analysis prompt for the AI agent
+        Args:
+            execution_id: The execution ID
+            turn_number: The turn number
+            turn_data: Turn metrics data
+        Returns:
+            Formatted prompt string
+        """
+        finish_reason = turn_data.finish_reason if turn_data else "unknown"
+        error_message = turn_data.error_message if turn_data else None
+        response_preview = turn_data.response_preview if turn_data else None
+        tools_called = turn_data.tools_called_count if turn_data else 0
+        prompt = f"""
+# State Transition Analysis Request
+## Execution Information
+- Execution ID: {execution_id}
+- Turn Number: {turn_number}
+- Finish Reason: {finish_reason}
+- Tools Called This Turn: {tools_called}
+## Recent Turn Details
+"""
+        if response_preview:
+            prompt += f"\n**Response Preview:**\n{response_preview[:500]}\n"
+        if error_message:
+            prompt += f"\n**Error Message:**\n{error_message[:300]}\n"
+        prompt += """
+## Your Task
+Analyze this execution and determine the appropriate next state.
+**Steps:**
+1. Call get_execution_details() to understand the execution context
+2. Call get_recent_turns() to see the recent activity pattern
+3. If there's an error, call check_error_recoverability() to assess it
+4. Based on all context, recommend the next state with clear reasoning
+**Focus on:**
+- The finish_reason is a critical signal
+- Look for completion indicators in the response
+- Check if the agent is asking questions
+- Assess error recoverability if present
+- Consider if the task can continue autonomously
+Be decisive and provide a clear recommendation.
+"""
+        return prompt
+    async def _append_system_message_to_session(
+        self,
+        execution_id: str,
+        to_state: str,
+        reasoning: str,
+        confidence: str,
+        db: Optional[Session] = None,
+    ) -> None:
+        """
+        Append a system message to the session history about the state transition
+        Thin wrapper: forwards every argument, plus this service's organization_id,
+        to the module-level _append_system_message_to_session_helper.
+        Args:
+            execution_id: The execution ID
+            to_state: The new state
+            reasoning: The AI reasoning for the transition
+            confidence: The confidence level
+            db: Optional database session (if already open); passed through unchanged
+        """
+        # NOTE(review): db defaults to None and is forwarded as-is; confirm the helper
+        # copes with a missing session before relying on the default.
+        await _append_system_message_to_session_helper(
+            db=db,
+            execution_id=execution_id,
+            to_state=to_state,
+            reasoning=reasoning,
+            confidence=confidence,
+            organization_id=self.organization_id,
+        )
+    async def _record_transition(
+        self,
+        execution_id: str,
+        turn_number: int,
+        from_state: str,
+        to_state: str,
+        decision: StateTransitionDecision,
+        decision_time_ms: int,
+    ) -> None:
+        """
+        Record state transition in database using SQLAlchemy
+        Args:
+            execution_id: The execution ID
+            turn_number: The turn number
+            from_state: The previous state
+            to_state: The new state
+            decision: The AI decision object
+            decision_time_ms: Time taken to make decision
+        """
+        try:
+            # Get database session in async context
+            from control_plane_api.app.database import get_session_local
+            SessionLocal = get_session_local()
+            db = SessionLocal()
+            try:
+                # Get organization from execution
+                execution = db.query(Execution).filter(Execution.id == execution_id).first()
+                if not execution:
+                    logger.warning("execution_not_found_for_transition", execution_id=execution_id)
+                    return
+                organization_id = execution.organization_id
+                # Create transition record
+                transition_record = ExecutionTransition(
+                    organization_id=organization_id,
+                    execution_id=execution_id,
+                    turn_number=turn_number,
+                    from_state=from_state,
+                    to_state=to_state,
+                    reasoning=decision.reasoning,
+                    confidence=decision.confidence,
+                    decision_factors=decision.decision_factors,
+                    ai_model=self.model,
+                    decision_time_ms=decision_time_ms,
+                    is_manual_override=False,
+                )
+                db.add(transition_record)
+                db.commit()
+                db.refresh(transition_record)
+                logger.info(
+                    "transition_recorded",
+                    execution_id=execution_id,
+                    turn_number=turn_number,
+                    transition_id=str(transition_record.id),
+                )
+                # Add system message to session history
+                await self._append_system_message_to_session(
+                    execution_id=execution_id,
+                    to_state=to_state,
+                    reasoning=decision.reasoning,
+                    confidence=decision.confidence,
+                    db=db,
+                )
+            finally:
+                db.close()
+        except Exception as e:
+            logger.error(
+                "record_transition_failed",
+                execution_id=execution_id,
+                error=str(e),
+            )
+            # Don't raise - recording failure shouldn't block state transition
+    async def _update_execution_status(
+        self,
+        execution_id: str,
+        new_status: str,
+    ) -> None:
+        """
+        Update execution status in database using SQLAlchemy
+        Args:
+            execution_id: The execution ID
+            new_status: The new status to set
+        """
+        try:
+            from control_plane_api.app.database import get_session_local
+            SessionLocal = get_session_local()
+            db = SessionLocal()
+            try:
+                execution = db.query(Execution).filter(Execution.id == execution_id).first()
+                if execution:
+                    execution.status = new_status.lower()
+                    # Add completed_at if transitioning to completed or failed
+                    if new_status in ["completed", "failed"]:
+                        execution.completed_at = datetime.now(timezone.utc)
+                    db.commit()
+                    logger.info(
+                        "execution_status_updated",
+                        execution_id=execution_id,
+                        new_status=new_status,
+                    )
+                    # Push status event to Redis for live streaming
+                    try:
+                        from control_plane_api.app.lib.redis_client import get_redis_client
+                        import json
+                        redis_client = get_redis_client()
+                        if redis_client:
+                            status_event = {
+                                "event_type": "status",
+                                "status": new_status.lower(),
+                                "execution_id": execution_id,
+                                "source": "state_transition_service",
+                                "timestamp": datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")
+                            }
+                            redis_key = f"execution:{execution_id}:events"
+                            # Use asyncio.create_task for async Redis push
+                            import asyncio
+                            loop = asyncio.get_event_loop()
+                            if loop.is_running():
+                                asyncio.create_task(redis_client.lpush(redis_key, json.dumps(status_event)))
+                            else:
+                                loop.run_until_complete(redis_client.lpush(redis_key, json.dumps(status_event)))
+                            logger.info(
+                                "status_event_pushed_to_redis",
+                                execution_id=execution_id,
+                                status=new_status,
+                            )
+                    except Exception as redis_error:
+                        logger.warning(
+                            "redis_status_push_failed",
+                            execution_id=execution_id,
+                            status=new_status,
+                            error=str(redis_error),
+                        )
+                        # Don't raise - Redis push failure shouldn't block state transition
+                else:
+                    logger.warning(
+                        "execution_not_found_for_status_update",
+                        execution_id=execution_id,
+                        new_status=new_status,
+                    )
+            finally:
+                db.close()
+        except Exception as e:
+            logger.error(
+                "update_execution_status_failed",
+                execution_id=execution_id,
+                new_status=new_status,
+                error=str(e),
+            )
+            # Don't raise - status update failure shouldn't block the transition
+async def update_execution_state_safe(
+    execution_id: str,
+    state: str,
+    reasoning: str,
+) -> None:
+    """
+    Safely update execution state with fallback reasoning using SQLAlchemy
+    Used when AI decision fails or times out.
+    Args:
+        execution_id: The execution ID
+        state: The state to set
+        reasoning: Why this fallback state was chosen
+    """
+    try:
+        from control_plane_api.app.database import get_session_local
+        SessionLocal = get_session_local()
+        db = SessionLocal()
+        try:
+            # Get execution
+            execution = db.query(Execution).filter(Execution.id == execution_id).first()
+            if not execution:
+                logger.warning("execution_not_found_for_safe_update", execution_id=execution_id)
+                return
+            # Update execution status
+            execution.status = state.lower()
+            if state in ["completed", "failed"]:
+                execution.completed_at = datetime.now(timezone.utc)
+            db.commit()
+            logger.info(
+                "fallback_state_update_committed",
+                execution_id=execution_id,
+                state=state,
+            )
+            # Push status event to Redis for live streaming
+            try:
+                from control_plane_api.app.lib.redis_client import get_redis_client
+                import json
+                import asyncio
+                redis_client = get_redis_client()
+                if redis_client:
+                    status_event = {
+                        "event_type": "status",
+                        "status": state.lower(),
+                        "execution_id": execution_id,
+                        "source": "state_transition_fallback",
+                        "timestamp": datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")
+                    }
+                    redis_key = f"execution:{execution_id}:events"
+                    # Use asyncio for async Redis push
+                    loop = asyncio.get_event_loop()
+                    if loop.is_running():
+                        asyncio.create_task(redis_client.lpush(redis_key, json.dumps(status_event)))
+                    else:
+                        loop.run_until_complete(redis_client.lpush(redis_key, json.dumps(status_event)))
+                    logger.info(
+                        "fallback_status_event_pushed_to_redis",
+                        execution_id=execution_id,
+                        status=state,
+                    )
+            except Exception as redis_error:
+                logger.warning(
+                    "fallback_redis_status_push_failed",
+                    execution_id=execution_id,
+                    status=state,
+                    error=str(redis_error),
+                )
+                # Don't raise - Redis push failure shouldn't block fallback state transition
+            # Record fallback transition
+            transition_record = ExecutionTransition(
+                organization_id=execution.organization_id,
+                execution_id=execution_id,
+                turn_number=0,  # Unknown turn number
+                from_state="running",
+                to_state=state,
+                reasoning=f"FALLBACK: {reasoning}",
+                confidence="low",
+                decision_factors={"fallback": True, "reason": reasoning},
+                ai_model="fallback",
+                decision_time_ms=0,
+                is_manual_override=False,
+            )
+            db.add(transition_record)
+            db.commit()
+            # Add system message to session history
+            await _append_system_message_to_session_helper(
+                db=db,
+                execution_id=execution_id,
+                to_state=state,
+                reasoning=f"FALLBACK: {reasoning}",
+                confidence="low",
+                organization_id=execution.organization_id,
+            )
+            logger.info(
+                "fallback_state_update",
+                execution_id=execution_id,
+                state=state,
+                reasoning=reasoning,
+            )
+        finally:
+            db.close()
+    except Exception as e:
+        logger.error(
+            "fallback_state_update_failed",
+            execution_id=execution_id,
+            state=state,
+            error=str(e),
+        )
+async def _append_system_message_to_session_helper(
+    db: Session,
+    execution_id: str,
+    to_state: str,
+    reasoning: str,
+    confidence: str,
+    organization_id: Optional[str] = None,
+) -> None:
+    """
+    Helper function to append system message to session using SQLAlchemy (used by fallback too)
+    Args:
+        db: SQLAlchemy database session
+        execution_id: The execution ID
+        to_state: The new state
+        reasoning: The reasoning for the transition
+        confidence: The confidence level
+        organization_id: Optional organization ID for filtering
+    """
+    try:
+        # Check if Session model exists, if not skip (sessions may not be migrated yet)
+        try:
+            from control_plane_api.app.models.session import Session as SessionModel
+        except ImportError:
+            logger.debug(
+                "session_model_not_available",
+                execution_id=execution_id,
+                note="Skipping session message append - Session model not yet migrated"
+            )
+            return
+        # Get the current session
+        if organization_id:
+            session = db.query(SessionModel).filter(
+                SessionModel.execution_id == execution_id,
+                SessionModel.organization_id == organization_id
+            ).first()
+        else:
+            # Fallback to execution_id only if organization_id not provided (backward compatibility)
+            session = db.query(SessionModel).filter(SessionModel.execution_id == execution_id).first()
+        if not session:
+            logger.warning(
+                "session_not_found_for_transition_message",
+                execution_id=execution_id
+            )
+            return
+        messages = session.messages or []
+        # Create system message about the transition
+        state_emoji = {
+            "completed": "✅",
+            "waiting_for_input": "⏸️",
+            "failed": "❌",
+            "running": "▶️"
+        }.get(to_state, "🔄")
+        state_display = to_state.replace("_", " ").title()
+        system_message = {
+            "role": "system",
+            "content": f"{state_emoji} **State Transition: {state_display}**\n\n{reasoning}\n\n*Confidence: {confidence}*",
+            "timestamp": datetime.now(timezone.utc).isoformat(),
+            "message_id": f"{execution_id}_system_transition_{int(datetime.now(timezone.utc).timestamp() * 1000000)}",
+        }
+        # Append the system message
+        messages.append(system_message)
+        # Update the session
+        session.messages = messages
+        session.updated_at = datetime.now(timezone.utc)
+        db.commit()
+        logger.info(
+            "system_message_appended_to_session",
+            execution_id=execution_id,
+            to_state=to_state,
+        )
+    except Exception as e:
+        logger.error(
+            "append_system_message_failed",
+            execution_id=execution_id,
+            error=str(e),
+        )
+        # Don't raise - message failure shouldn't block state transition