pyworkflow-engine 0.1.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dashboard/backend/app/__init__.py +1 -0
- dashboard/backend/app/config.py +32 -0
- dashboard/backend/app/controllers/__init__.py +6 -0
- dashboard/backend/app/controllers/run_controller.py +86 -0
- dashboard/backend/app/controllers/workflow_controller.py +33 -0
- dashboard/backend/app/dependencies/__init__.py +5 -0
- dashboard/backend/app/dependencies/storage.py +50 -0
- dashboard/backend/app/repositories/__init__.py +6 -0
- dashboard/backend/app/repositories/run_repository.py +80 -0
- dashboard/backend/app/repositories/workflow_repository.py +27 -0
- dashboard/backend/app/rest/__init__.py +8 -0
- dashboard/backend/app/rest/v1/__init__.py +12 -0
- dashboard/backend/app/rest/v1/health.py +33 -0
- dashboard/backend/app/rest/v1/runs.py +133 -0
- dashboard/backend/app/rest/v1/workflows.py +41 -0
- dashboard/backend/app/schemas/__init__.py +23 -0
- dashboard/backend/app/schemas/common.py +16 -0
- dashboard/backend/app/schemas/event.py +24 -0
- dashboard/backend/app/schemas/hook.py +25 -0
- dashboard/backend/app/schemas/run.py +54 -0
- dashboard/backend/app/schemas/step.py +28 -0
- dashboard/backend/app/schemas/workflow.py +31 -0
- dashboard/backend/app/server.py +87 -0
- dashboard/backend/app/services/__init__.py +6 -0
- dashboard/backend/app/services/run_service.py +240 -0
- dashboard/backend/app/services/workflow_service.py +155 -0
- dashboard/backend/main.py +18 -0
- docs/concepts/cancellation.mdx +362 -0
- docs/concepts/continue-as-new.mdx +434 -0
- docs/concepts/events.mdx +266 -0
- docs/concepts/fault-tolerance.mdx +370 -0
- docs/concepts/hooks.mdx +552 -0
- docs/concepts/limitations.mdx +167 -0
- docs/concepts/schedules.mdx +775 -0
- docs/concepts/sleep.mdx +312 -0
- docs/concepts/steps.mdx +301 -0
- docs/concepts/workflows.mdx +255 -0
- docs/guides/cli.mdx +942 -0
- docs/guides/configuration.mdx +560 -0
- docs/introduction.mdx +155 -0
- docs/quickstart.mdx +279 -0
- examples/__init__.py +1 -0
- examples/celery/__init__.py +1 -0
- examples/celery/durable/docker-compose.yml +55 -0
- examples/celery/durable/pyworkflow.config.yaml +12 -0
- examples/celery/durable/workflows/__init__.py +122 -0
- examples/celery/durable/workflows/basic.py +87 -0
- examples/celery/durable/workflows/batch_processing.py +102 -0
- examples/celery/durable/workflows/cancellation.py +273 -0
- examples/celery/durable/workflows/child_workflow_patterns.py +240 -0
- examples/celery/durable/workflows/child_workflows.py +202 -0
- examples/celery/durable/workflows/continue_as_new.py +260 -0
- examples/celery/durable/workflows/fault_tolerance.py +210 -0
- examples/celery/durable/workflows/hooks.py +211 -0
- examples/celery/durable/workflows/idempotency.py +112 -0
- examples/celery/durable/workflows/long_running.py +99 -0
- examples/celery/durable/workflows/retries.py +101 -0
- examples/celery/durable/workflows/schedules.py +209 -0
- examples/celery/transient/01_basic_workflow.py +91 -0
- examples/celery/transient/02_fault_tolerance.py +257 -0
- examples/celery/transient/__init__.py +20 -0
- examples/celery/transient/pyworkflow.config.yaml +25 -0
- examples/local/__init__.py +1 -0
- examples/local/durable/01_basic_workflow.py +94 -0
- examples/local/durable/02_file_storage.py +132 -0
- examples/local/durable/03_retries.py +169 -0
- examples/local/durable/04_long_running.py +119 -0
- examples/local/durable/05_event_log.py +145 -0
- examples/local/durable/06_idempotency.py +148 -0
- examples/local/durable/07_hooks.py +334 -0
- examples/local/durable/08_cancellation.py +233 -0
- examples/local/durable/09_child_workflows.py +198 -0
- examples/local/durable/10_child_workflow_patterns.py +265 -0
- examples/local/durable/11_continue_as_new.py +249 -0
- examples/local/durable/12_schedules.py +198 -0
- examples/local/durable/__init__.py +1 -0
- examples/local/transient/01_quick_tasks.py +87 -0
- examples/local/transient/02_retries.py +130 -0
- examples/local/transient/03_sleep.py +141 -0
- examples/local/transient/__init__.py +1 -0
- pyworkflow/__init__.py +256 -0
- pyworkflow/aws/__init__.py +68 -0
- pyworkflow/aws/context.py +234 -0
- pyworkflow/aws/handler.py +184 -0
- pyworkflow/aws/testing.py +310 -0
- pyworkflow/celery/__init__.py +41 -0
- pyworkflow/celery/app.py +198 -0
- pyworkflow/celery/scheduler.py +315 -0
- pyworkflow/celery/tasks.py +1746 -0
- pyworkflow/cli/__init__.py +132 -0
- pyworkflow/cli/__main__.py +6 -0
- pyworkflow/cli/commands/__init__.py +1 -0
- pyworkflow/cli/commands/hooks.py +640 -0
- pyworkflow/cli/commands/quickstart.py +495 -0
- pyworkflow/cli/commands/runs.py +773 -0
- pyworkflow/cli/commands/scheduler.py +130 -0
- pyworkflow/cli/commands/schedules.py +794 -0
- pyworkflow/cli/commands/setup.py +703 -0
- pyworkflow/cli/commands/worker.py +413 -0
- pyworkflow/cli/commands/workflows.py +1257 -0
- pyworkflow/cli/output/__init__.py +1 -0
- pyworkflow/cli/output/formatters.py +321 -0
- pyworkflow/cli/output/styles.py +121 -0
- pyworkflow/cli/utils/__init__.py +1 -0
- pyworkflow/cli/utils/async_helpers.py +30 -0
- pyworkflow/cli/utils/config.py +130 -0
- pyworkflow/cli/utils/config_generator.py +344 -0
- pyworkflow/cli/utils/discovery.py +53 -0
- pyworkflow/cli/utils/docker_manager.py +651 -0
- pyworkflow/cli/utils/interactive.py +364 -0
- pyworkflow/cli/utils/storage.py +115 -0
- pyworkflow/config.py +329 -0
- pyworkflow/context/__init__.py +63 -0
- pyworkflow/context/aws.py +230 -0
- pyworkflow/context/base.py +416 -0
- pyworkflow/context/local.py +930 -0
- pyworkflow/context/mock.py +381 -0
- pyworkflow/core/__init__.py +0 -0
- pyworkflow/core/exceptions.py +353 -0
- pyworkflow/core/registry.py +313 -0
- pyworkflow/core/scheduled.py +328 -0
- pyworkflow/core/step.py +494 -0
- pyworkflow/core/workflow.py +294 -0
- pyworkflow/discovery.py +248 -0
- pyworkflow/engine/__init__.py +0 -0
- pyworkflow/engine/events.py +879 -0
- pyworkflow/engine/executor.py +682 -0
- pyworkflow/engine/replay.py +273 -0
- pyworkflow/observability/__init__.py +19 -0
- pyworkflow/observability/logging.py +234 -0
- pyworkflow/primitives/__init__.py +33 -0
- pyworkflow/primitives/child_handle.py +174 -0
- pyworkflow/primitives/child_workflow.py +372 -0
- pyworkflow/primitives/continue_as_new.py +101 -0
- pyworkflow/primitives/define_hook.py +150 -0
- pyworkflow/primitives/hooks.py +97 -0
- pyworkflow/primitives/resume_hook.py +210 -0
- pyworkflow/primitives/schedule.py +545 -0
- pyworkflow/primitives/shield.py +96 -0
- pyworkflow/primitives/sleep.py +100 -0
- pyworkflow/runtime/__init__.py +21 -0
- pyworkflow/runtime/base.py +179 -0
- pyworkflow/runtime/celery.py +310 -0
- pyworkflow/runtime/factory.py +101 -0
- pyworkflow/runtime/local.py +706 -0
- pyworkflow/scheduler/__init__.py +9 -0
- pyworkflow/scheduler/local.py +248 -0
- pyworkflow/serialization/__init__.py +0 -0
- pyworkflow/serialization/decoder.py +146 -0
- pyworkflow/serialization/encoder.py +162 -0
- pyworkflow/storage/__init__.py +54 -0
- pyworkflow/storage/base.py +612 -0
- pyworkflow/storage/config.py +185 -0
- pyworkflow/storage/dynamodb.py +1315 -0
- pyworkflow/storage/file.py +827 -0
- pyworkflow/storage/memory.py +549 -0
- pyworkflow/storage/postgres.py +1161 -0
- pyworkflow/storage/schemas.py +486 -0
- pyworkflow/storage/sqlite.py +1136 -0
- pyworkflow/utils/__init__.py +0 -0
- pyworkflow/utils/duration.py +177 -0
- pyworkflow/utils/schedule.py +391 -0
- pyworkflow_engine-0.1.7.dist-info/METADATA +687 -0
- pyworkflow_engine-0.1.7.dist-info/RECORD +196 -0
- pyworkflow_engine-0.1.7.dist-info/WHEEL +5 -0
- pyworkflow_engine-0.1.7.dist-info/entry_points.txt +2 -0
- pyworkflow_engine-0.1.7.dist-info/licenses/LICENSE +21 -0
- pyworkflow_engine-0.1.7.dist-info/top_level.txt +5 -0
- tests/examples/__init__.py +0 -0
- tests/integration/__init__.py +0 -0
- tests/integration/test_cancellation.py +330 -0
- tests/integration/test_child_workflows.py +439 -0
- tests/integration/test_continue_as_new.py +428 -0
- tests/integration/test_dynamodb_storage.py +1146 -0
- tests/integration/test_fault_tolerance.py +369 -0
- tests/integration/test_schedule_storage.py +484 -0
- tests/unit/__init__.py +0 -0
- tests/unit/backends/__init__.py +1 -0
- tests/unit/backends/test_dynamodb_storage.py +1554 -0
- tests/unit/backends/test_postgres_storage.py +1281 -0
- tests/unit/backends/test_sqlite_storage.py +1460 -0
- tests/unit/conftest.py +41 -0
- tests/unit/test_cancellation.py +364 -0
- tests/unit/test_child_workflows.py +680 -0
- tests/unit/test_continue_as_new.py +441 -0
- tests/unit/test_event_limits.py +316 -0
- tests/unit/test_executor.py +320 -0
- tests/unit/test_fault_tolerance.py +334 -0
- tests/unit/test_hooks.py +495 -0
- tests/unit/test_registry.py +261 -0
- tests/unit/test_replay.py +420 -0
- tests/unit/test_schedule_schemas.py +285 -0
- tests/unit/test_schedule_utils.py +286 -0
- tests/unit/test_scheduled_workflow.py +274 -0
- tests/unit/test_step.py +353 -0
- tests/unit/test_workflow.py +243 -0
|
@@ -0,0 +1,369 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Integration tests for fault tolerance features.
|
|
3
|
+
|
|
4
|
+
Tests cover the full workflow recovery flow after simulated worker failures.
|
|
5
|
+
"""
|
|
6
|
+
|
|
7
|
+
from datetime import UTC, datetime
|
|
8
|
+
|
|
9
|
+
import pytest
|
|
10
|
+
|
|
11
|
+
from pyworkflow import (
|
|
12
|
+
reset_config,
|
|
13
|
+
workflow,
|
|
14
|
+
)
|
|
15
|
+
from pyworkflow.engine.events import (
|
|
16
|
+
EventType,
|
|
17
|
+
create_step_completed_event,
|
|
18
|
+
create_workflow_interrupted_event,
|
|
19
|
+
create_workflow_started_event,
|
|
20
|
+
)
|
|
21
|
+
from pyworkflow.serialization.encoder import serialize, serialize_args, serialize_kwargs
|
|
22
|
+
from pyworkflow.storage.memory import InMemoryStorageBackend
|
|
23
|
+
from pyworkflow.storage.schemas import RunStatus, WorkflowRun
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
@pytest.fixture
def storage():
    """A fresh, empty in-memory storage backend for every test."""
    backend = InMemoryStorageBackend()
    return backend
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
@pytest.fixture(autouse=True)
def reset_pyworkflow_config():
    """Start every test from a pristine configuration and restore it after."""
    reset_config()  # setup: drop any config left behind by earlier tests
    yield
    reset_config()  # teardown: leave no configuration state behind
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
class TestRecoveryDetection:
    """Tests for detecting recovery scenarios."""

    @pytest.mark.asyncio
    async def test_detect_running_workflow_as_recovery_scenario(self, storage):
        """A workflow in RUNNING status should be detected as recovery scenario."""
        # A run left in RUNNING with no live worker is what a crash looks like.
        crashed = WorkflowRun(
            run_id="test_run",
            workflow_name="test_workflow",
            status=RunStatus.RUNNING,
            created_at=datetime.now(UTC),
            started_at=datetime.now(UTC),
            input_args=serialize_args(),
            input_kwargs=serialize_kwargs(),
            recovery_attempts=0,
            max_recovery_attempts=3,
            recover_on_worker_loss=True,
        )
        await storage.create_run(crashed)

        # The stored run still reports RUNNING and opts in to recovery.
        fetched = await storage.get_run("test_run")
        assert fetched.status == RunStatus.RUNNING
        assert fetched.recover_on_worker_loss is True

    @pytest.mark.asyncio
    async def test_recovery_disabled_workflow(self, storage):
        """Workflow with recover_on_worker_loss=False should not auto-recover."""
        opted_out = WorkflowRun(
            run_id="test_run",
            workflow_name="test_workflow",
            status=RunStatus.RUNNING,
            created_at=datetime.now(UTC),
            input_args=serialize_args(),
            input_kwargs=serialize_kwargs(),
            recovery_attempts=0,
            max_recovery_attempts=3,
            recover_on_worker_loss=False,  # recovery explicitly disabled
        )
        await storage.create_run(opted_out)

        fetched = await storage.get_run("test_run")
        assert fetched.recover_on_worker_loss is False
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
class TestInterruptedEventRecording:
    """Tests for recording WORKFLOW_INTERRUPTED events."""

    @pytest.mark.asyncio
    async def test_record_interrupted_event(self, storage):
        """Should record WORKFLOW_INTERRUPTED event on recovery."""
        await storage.create_run(
            WorkflowRun(
                run_id="test_run",
                workflow_name="test_workflow",
                status=RunStatus.RUNNING,
                created_at=datetime.now(UTC),
                input_args=serialize_args(),
                input_kwargs=serialize_kwargs(),
            )
        )

        # History: workflow start, one completed step, then a simulated crash.
        history = [
            create_workflow_started_event(
                run_id="test_run",
                workflow_name="test_workflow",
                args=serialize_args(),
                kwargs=serialize_kwargs(),
            ),
            create_step_completed_event(
                run_id="test_run",
                step_id="step_1",
                result=serialize(42),
                step_name="test_step",
            ),
            create_workflow_interrupted_event(
                run_id="test_run",
                reason="worker_lost",
                worker_id="worker_1",
                last_event_sequence=2,
                error="Worker process terminated",
                recovery_attempt=1,
                recoverable=True,
            ),
        ]
        for event in history:
            await storage.record_event(event)

        # All three events made it into the log.
        stored = await storage.get_events("test_run")
        assert len(stored) == 3

        # Exactly one interruption, carrying the crash metadata.
        interruptions = [e for e in stored if e.type == EventType.WORKFLOW_INTERRUPTED]
        assert len(interruptions) == 1
        assert interruptions[0].data["reason"] == "worker_lost"
        assert interruptions[0].data["recovery_attempt"] == 1
|
|
143
|
+
|
|
144
|
+
class TestRecoveryAttemptTracking:
    """Tests for tracking recovery attempts."""

    @pytest.mark.asyncio
    async def test_increment_recovery_attempts(self, storage):
        """Should increment recovery_attempts on each recovery."""
        await storage.create_run(
            WorkflowRun(
                run_id="test_run",
                workflow_name="test_workflow",
                status=RunStatus.RUNNING,
                created_at=datetime.now(UTC),
                input_args=serialize_args(),
                input_kwargs=serialize_kwargs(),
                recovery_attempts=0,
                max_recovery_attempts=3,
            )
        )

        # Three consecutive recoveries; the persisted counter must track each.
        for attempt in (1, 2, 3):
            await storage.update_run_recovery_attempts("test_run", attempt)
            refreshed = await storage.get_run("test_run")
            assert refreshed.recovery_attempts == attempt

    @pytest.mark.asyncio
    async def test_max_recovery_attempts_exceeded(self, storage):
        """Should mark workflow as FAILED when max attempts exceeded."""
        await storage.create_run(
            WorkflowRun(
                run_id="test_run",
                workflow_name="test_workflow",
                status=RunStatus.RUNNING,
                created_at=datetime.now(UTC),
                input_args=serialize_args(),
                input_kwargs=serialize_kwargs(),
                recovery_attempts=3,  # already at the configured limit
                max_recovery_attempts=3,
            )
        )

        # What the engine would do once the limit is hit.
        await storage.update_run_status(
            run_id="test_run",
            status=RunStatus.FAILED,
            error="Exceeded max recovery attempts (3)",
        )

        failed = await storage.get_run("test_run")
        assert failed.status == RunStatus.FAILED
        assert "max recovery attempts" in failed.error.lower()
|
|
202
|
+
|
|
203
|
+
|
|
204
|
+
class TestEventReplayWithInterruption:
    """Tests for event replay after interruption."""

    @pytest.mark.asyncio
    async def test_replay_preserves_step_results_after_interruption(self, storage):
        """Step results should be preserved and replayable after interruption."""
        from pyworkflow.context import LocalContext
        from pyworkflow.engine.replay import replay_events

        # History of a workflow that finished two steps, then lost its worker.
        history = [
            create_workflow_started_event(
                run_id="test_run",
                workflow_name="test_workflow",
                args=serialize_args("arg1"),
                kwargs=serialize_kwargs(key="value"),
            ),
            create_step_completed_event(
                run_id="test_run",
                step_id="step_1",
                result=serialize({"processed": True}),
                step_name="step_1",
            ),
            create_step_completed_event(
                run_id="test_run",
                step_id="step_2",
                result=serialize(100),
                step_name="step_2",
            ),
            create_workflow_interrupted_event(
                run_id="test_run",
                reason="worker_lost",
                recovery_attempt=1,
            ),
        ]

        # Persist with explicit, monotonically increasing sequence numbers.
        for sequence, event in enumerate(history, start=1):
            event.sequence = sequence
            await storage.record_event(event)

        replayable = await storage.get_events("test_run")

        ctx = LocalContext(
            run_id="test_run",
            workflow_name="test_workflow",
            storage=storage,
            event_log=replayable,
            durable=True,
        )
        await replay_events(ctx, replayable)

        # Both step results survive the interruption and are visible on replay.
        assert ctx.get_step_result("step_1") == {"processed": True}
        assert ctx.get_step_result("step_2") == 100
|
|
261
|
+
|
|
262
|
+
|
|
263
|
+
class TestStatusTransitions:
    """Tests for workflow status transitions during recovery."""

    @staticmethod
    def _run(status, **extra):
        """Build a minimal WorkflowRun named test_run in the given status."""
        return WorkflowRun(
            run_id="test_run",
            workflow_name="test_workflow",
            status=status,
            created_at=datetime.now(UTC),
            input_args=serialize_args(),
            input_kwargs=serialize_kwargs(),
            **extra,
        )

    @pytest.mark.asyncio
    async def test_running_to_interrupted(self, storage):
        """RUNNING -> INTERRUPTED transition."""
        await storage.create_run(self._run(RunStatus.RUNNING))

        await storage.update_run_status(
            run_id="test_run",
            status=RunStatus.INTERRUPTED,
        )

        assert (await storage.get_run("test_run")).status == RunStatus.INTERRUPTED

    @pytest.mark.asyncio
    async def test_interrupted_to_running_on_recovery(self, storage):
        """INTERRUPTED -> RUNNING transition on recovery."""
        await storage.create_run(self._run(RunStatus.INTERRUPTED, recovery_attempts=1))

        # Recovery kicks the workflow back into execution.
        await storage.update_run_status(
            run_id="test_run",
            status=RunStatus.RUNNING,
        )

        assert (await storage.get_run("test_run")).status == RunStatus.RUNNING

    @pytest.mark.asyncio
    async def test_interrupted_to_failed_on_max_attempts(self, storage):
        """INTERRUPTED -> FAILED when max attempts exceeded."""
        await storage.create_run(
            self._run(
                RunStatus.INTERRUPTED,
                recovery_attempts=3,
                max_recovery_attempts=3,
            )
        )

        await storage.update_run_status(
            run_id="test_run",
            status=RunStatus.FAILED,
            error="Exceeded max recovery attempts",
        )

        assert (await storage.get_run("test_run")).status == RunStatus.FAILED
|
|
333
|
+
|
|
334
|
+
|
|
335
|
+
class TestWorkflowDecoratorRecoveryConfig:
    """Tests for the recovery options accepted by the @workflow decorator."""

    def test_workflow_decorator_stores_recovery_config(self):
        """Explicit recovery settings land on the wrapped function."""

        @workflow(
            name="test_recovery_config_1",
            recover_on_worker_loss=True,
            max_recovery_attempts=5,
        )
        async def my_workflow():
            pass

        assert my_workflow.__workflow_recover_on_worker_loss__ is True
        assert my_workflow.__workflow_max_recovery_attempts__ == 5

    def test_workflow_decorator_defaults_none(self):
        """Recovery settings default to None when the decorator omits them."""

        @workflow(name="test_recovery_config_2")
        async def my_workflow():
            pass

        assert my_workflow.__workflow_recover_on_worker_loss__ is None
        assert my_workflow.__workflow_max_recovery_attempts__ is None

    def test_workflow_decorator_disable_recovery(self):
        """Recovery can be switched off explicitly."""

        @workflow(name="test_recovery_config_3", recover_on_worker_loss=False)
        async def my_workflow():
            pass

        assert my_workflow.__workflow_recover_on_worker_loss__ is False
|