pyworkflow-engine 0.1.22__py3-none-any.whl → 0.1.24__py3-none-any.whl
This diff shows the changes between publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- pyworkflow/__init__.py +1 -1
- pyworkflow/celery/app.py +18 -0
- pyworkflow/celery/tasks.py +61 -71
- pyworkflow/storage/base.py +36 -0
- pyworkflow/storage/cassandra.py +34 -0
- pyworkflow/storage/dynamodb.py +34 -0
- pyworkflow/storage/file.py +52 -0
- pyworkflow/storage/memory.py +37 -0
- pyworkflow/storage/migrations/__init__.py +15 -0
- pyworkflow/storage/migrations/base.py +299 -0
- pyworkflow/storage/mysql.py +186 -5
- pyworkflow/storage/postgres.py +197 -6
- pyworkflow/storage/sqlite.py +171 -5
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/METADATA +1 -1
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/RECORD +19 -17
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/WHEEL +0 -0
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/entry_points.txt +0 -0
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/licenses/LICENSE +0 -0
- {pyworkflow_engine-0.1.22.dist-info → pyworkflow_engine-0.1.24.dist-info}/top_level.txt +0 -0
pyworkflow/__init__.py
CHANGED
pyworkflow/celery/app.py
CHANGED
@@ -151,6 +151,8 @@ def create_celery_app(
     sentinel_master_name: str | None = None,
     broker_transport_options: dict[str, Any] | None = None,
     result_backend_transport_options: dict[str, Any] | None = None,
+    worker_max_memory_per_child: int | None = None,
+    worker_max_tasks_per_child: int | None = None,
 ) -> Celery:
     """
     Create and configure a Celery application for PyWorkflow.
@@ -162,6 +164,8 @@ def create_celery_app(
         sentinel_master_name: Redis Sentinel master name. Priority: parameter > PYWORKFLOW_CELERY_SENTINEL_MASTER env var > "mymaster"
         broker_transport_options: Additional transport options for the broker (merged with defaults)
         result_backend_transport_options: Additional transport options for the result backend (merged with defaults)
+        worker_max_memory_per_child: Max memory per worker child process (KB). Priority: parameter > PYWORKFLOW_WORKER_MAX_MEMORY env var > None (no limit)
+        worker_max_tasks_per_child: Max tasks per worker child before recycling. Priority: parameter > PYWORKFLOW_WORKER_MAX_TASKS env var > None (no limit)
 
     Returns:
         Configured Celery application
@@ -170,6 +174,8 @@ def create_celery_app(
         PYWORKFLOW_CELERY_BROKER: Celery broker URL (used if broker_url param not provided)
         PYWORKFLOW_CELERY_RESULT_BACKEND: Result backend URL (used if result_backend param not provided)
         PYWORKFLOW_CELERY_SENTINEL_MASTER: Sentinel master name (used if sentinel_master_name param not provided)
+        PYWORKFLOW_WORKER_MAX_MEMORY: Max memory per worker child (KB) (used if worker_max_memory_per_child param not provided)
+        PYWORKFLOW_WORKER_MAX_TASKS: Max tasks per worker child (used if worker_max_tasks_per_child param not provided)
 
     Examples:
         # Default configuration (uses env vars if set, otherwise localhost Redis)
@@ -202,6 +208,14 @@ def create_celery_app(
         or "redis://localhost:6379/1"
     )
 
+    # Worker memory limits (KB) - prevents memory leaks from accumulating
+    # Priority: parameter > env var > None (no limit by default)
+    max_memory_env = os.getenv("PYWORKFLOW_WORKER_MAX_MEMORY")
+    max_memory = worker_max_memory_per_child or (int(max_memory_env) if max_memory_env else None)
+
+    max_tasks_env = os.getenv("PYWORKFLOW_WORKER_MAX_TASKS")
+    max_tasks = worker_max_tasks_per_child or (int(max_tasks_env) if max_tasks_env else None)
+
     # Detect broker and backend types
     is_sentinel_broker = is_sentinel_url(broker_url)
     is_sentinel_backend = is_sentinel_url(result_backend)
@@ -310,6 +324,10 @@ def create_celery_app(
         # Logging
         worker_log_format="[%(asctime)s: %(levelname)s/%(processName)s] %(message)s",
         worker_task_log_format="[%(asctime)s: %(levelname)s/%(processName)s] [%(task_name)s(%(task_id)s)] %(message)s",
+        # Worker memory management - prevents memory leaks from accumulating
+        # When set, workers are recycled after exceeding these limits
+        worker_max_memory_per_child=max_memory,  # KB, None = no limit
+        worker_max_tasks_per_child=max_tasks,  # None = no limit
     )
 
     # Configure singleton locking for Redis or Sentinel brokers
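
A usage sketch for the new worker-recycling options (the function, parameter names, and env vars are from this diff; the Redis URLs and limit values are illustrative):

    import os

    from pyworkflow.celery.app import create_celery_app

    # Explicit parameters take priority over the environment variables.
    app = create_celery_app(
        broker_url="redis://localhost:6379/0",
        result_backend="redis://localhost:6379/1",
        worker_max_memory_per_child=200_000,  # KB, so roughly 200 MB per child
        worker_max_tasks_per_child=1_000,     # recycle a child after 1000 tasks
    )

    # Equivalent environment-based configuration (picked up when the
    # parameters are omitted); both default to None, i.e. no recycling.
    os.environ["PYWORKFLOW_WORKER_MAX_MEMORY"] = "200000"  # KB
    os.environ["PYWORKFLOW_WORKER_MAX_TASKS"] = "1000"
    app = create_celery_app()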
pyworkflow/celery/tasks.py
CHANGED
@@ -11,7 +11,6 @@ These tasks enable:
 
 import asyncio
 import random
-import traceback
 import uuid
 from collections.abc import Callable
 from datetime import UTC, datetime
@@ -172,10 +171,9 @@ def execute_step_task(
         raise FatalError(f"Step '{step_name}' not found in registry")
 
     # Ignore processing step if already completed (idempotency)
-
-    already_completed = …
-
-        for evt in events
+    # Use has_event() for efficient EXISTS check instead of loading all events
+    already_completed = run_async(
+        storage.has_event(run_id, EventType.STEP_COMPLETED.value, step_id=step_id)
     )
     if already_completed:
         logger.warning(
@@ -398,10 +396,9 @@ async def _record_step_completion_and_resume(
     await storage.connect()
 
     # Idempotency check: skip if step already completed
-
-    already_completed = …
-
-        for evt in events
+    # Use has_event() for efficient EXISTS check instead of loading all events
+    already_completed = await storage.has_event(
+        run_id, EventType.STEP_COMPLETED.value, step_id=step_id
     )
     if already_completed:
         logger.info(
@@ -414,26 +411,23 @@ async def _record_step_completion_and_resume(
 
     # Wait for WORKFLOW_SUSPENDED event before recording STEP_COMPLETED
     # This prevents race conditions where both events get the same sequence number
+    # Use has_event() for memory-efficient polling instead of loading all events
     max_wait_attempts = 50  # 50 * 10ms = 500ms max wait
     wait_interval = 0.01  # 10ms between checks
 
-    for …
-        has_suspended = …
-
-            and evt.data.get("step_id") == step_id
-            for evt in events
+    for _attempt in range(max_wait_attempts):
+        has_suspended = await storage.has_event(
+            run_id, EventType.WORKFLOW_SUSPENDED.value, step_id=step_id
         )
        if has_suspended:
            break

-        # Wait and …
        await asyncio.sleep(wait_interval)
-        events = await storage.get_events(run_id)
 
     # Also check if step was already completed by another task during wait
-    already_completed = …
-
-        for evt in events
+    already_completed = await storage.has_event(
+        run_id, EventType.STEP_COMPLETED.value, step_id=step_id
     )
     if already_completed:
         logger.info(
@@ -506,17 +500,18 @@ async def _record_step_failure_and_resume(
     await storage.connect()
 
     # Idempotency check: skip if step already completed or terminally failed
-
-
-
-
-
-
-
-
-
+    # Use has_event() for efficient EXISTS check instead of loading all events
+    # Note: For STEP_FAILED with is_retryable check, we use has_event for STEP_COMPLETED
+    # and separately check STEP_FAILED (non-retryable failures are rare, so this is still efficient)
+    already_completed = await storage.has_event(
+        run_id, EventType.STEP_COMPLETED.value, step_id=step_id
+    )
+    # For terminal failures, we check separately (is_retryable=false in data)
+    # This is less common, so checking completion first is the fast path
+    already_failed_terminal = await storage.has_event(
+        run_id, EventType.STEP_FAILED.value, step_id=step_id, is_retryable="False"
     )
-    if …
+    if already_completed or already_failed_terminal:
         logger.info(
             "Step already completed/failed by another task, skipping",
             run_id=run_id,
@@ -527,33 +522,28 @@ async def _record_step_failure_and_resume(
 
     # Wait for WORKFLOW_SUSPENDED event before recording STEP_FAILED
     # This prevents race conditions where both events get the same sequence number
+    # Use has_event() for memory-efficient polling instead of loading all events
     max_wait_attempts = 50  # 50 * 10ms = 500ms max wait
     wait_interval = 0.01  # 10ms between checks
 
-    for …
-        has_suspended = …
-
-            and evt.data.get("step_id") == step_id
-            for evt in events
+    for _attempt in range(max_wait_attempts):
+        has_suspended = await storage.has_event(
+            run_id, EventType.WORKFLOW_SUSPENDED.value, step_id=step_id
        )
        if has_suspended:
            break

-        # Wait and …
        await asyncio.sleep(wait_interval)
-        events = await storage.get_events(run_id)
 
     # Also check if step was already handled by another task during wait
-
-
-
-
-
-            and not evt.data.get("is_retryable", True)
-        )
-        for evt in events
+    already_completed = await storage.has_event(
+        run_id, EventType.STEP_COMPLETED.value, step_id=step_id
+    )
+    already_failed_terminal = await storage.has_event(
+        run_id, EventType.STEP_FAILED.value, step_id=step_id, is_retryable="False"
     )
-    if …
+    if already_completed or already_failed_terminal:
         logger.info(
             "Step already completed/failed by another task during wait, skipping",
             run_id=run_id,
@@ -891,13 +881,13 @@ async def _execute_child_workflow_on_worker(
 
     # For step dispatch suspensions, check if step already completed/failed
     if step_id and e.reason.startswith("step_dispatch:"):
-
-
-            evt.type in (EventType.STEP_COMPLETED, EventType.STEP_FAILED)
-            and evt.data.get("step_id") == step_id
-            for evt in events
+        step_completed = await storage.has_event(
+            child_run_id, EventType.STEP_COMPLETED.value, step_id=step_id
         )
-
+        step_failed = await storage.has_event(
+            child_run_id, EventType.STEP_FAILED.value, step_id=step_id
+        )
+        if step_completed or step_failed:
             logger.info(
                 "Child step finished before suspension completed, scheduling resume",
                 child_run_id=child_run_id,
@@ -1144,8 +1134,8 @@ async def _handle_workflow_recovery(
         return False
 
     # Get last event sequence
-
-    last_event_sequence = …
+    latest_event = await storage.get_latest_event(run.run_id)
+    last_event_sequence = latest_event.sequence if latest_event else None
 
     # Record interruption event
     interrupted_event = create_workflow_interrupted_event(
@@ -1287,13 +1277,13 @@ async def _recover_workflow_on_worker(
 
     # For step dispatch suspensions, check if step already completed/failed
     if step_id and e.reason.startswith("step_dispatch:"):
-
-
-            evt.type in (EventType.STEP_COMPLETED, EventType.STEP_FAILED)
-            and evt.data.get("step_id") == step_id
-            for evt in events
+        step_completed = await storage.has_event(
+            run_id, EventType.STEP_COMPLETED.value, step_id=step_id
         )
-
+        step_failed = await storage.has_event(
+            run_id, EventType.STEP_FAILED.value, step_id=step_id
+        )
+        if step_completed or step_failed:
             logger.info(
                 "Step finished before recovery suspension completed, scheduling resume",
                 run_id=run_id,
@@ -1679,13 +1669,13 @@ async def _start_workflow_on_worker(
     # For step dispatch suspensions, check if step already completed/failed (race condition)
     # If so, schedule resume immediately
     if step_id and e.reason.startswith("step_dispatch:"):
-
-
-            evt.type in (EventType.STEP_COMPLETED, EventType.STEP_FAILED)
-            and evt.data.get("step_id") == step_id
-            for evt in events
+        step_completed = await storage.has_event(
+            run_id, EventType.STEP_COMPLETED.value, step_id=step_id
         )
-
+        step_failed = await storage.has_event(
+            run_id, EventType.STEP_FAILED.value, step_id=step_id
+        )
+        if step_completed or step_failed:
             logger.info(
                 "Step finished before suspension completed, scheduling resume",
                 run_id=run_id,
@@ -2269,13 +2259,13 @@ async def _resume_workflow_on_worker(
 
     # For step dispatch suspensions, check if step already completed/failed
     if step_id and e.reason.startswith("step_dispatch:"):
-
-
-
-
-
+        step_completed = await storage.has_event(
+            run_id, EventType.STEP_COMPLETED.value, step_id=step_id
+        )
+        step_failed = await storage.has_event(
+            run_id, EventType.STEP_FAILED.value, step_id=step_id
         )
-        if …
+        if step_completed or step_failed:
             logger.info(
                 "Step finished before resume suspension completed, scheduling resume",
                 run_id=run_id,
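
The recurring change in this file swaps event-log scans for the new existence check. A minimal before/after sketch of the pattern; the "before" is reconstructed from the removed fragments above and is approximate:

    # Before (approximate): load the full event log and scan it in Python.
    events = await storage.get_events(run_id)
    already_completed = any(
        evt.type == EventType.STEP_COMPLETED and evt.data.get("step_id") == step_id
        for evt in events
    )

    # After: ask the backend directly; SQL backends can answer with a single
    # EXISTS query instead of materializing every event.
    already_completed = await storage.has_event(
        run_id, EventType.STEP_COMPLETED.value, step_id=step_id
    )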
pyworkflow/storage/base.py
CHANGED
@@ -203,6 +203,42 @@ class StorageBackend(ABC):
         """
         pass
 
+    @abstractmethod
+    async def has_event(
+        self,
+        run_id: str,
+        event_type: str,
+        **filters: str,
+    ) -> bool:
+        """
+        Check if an event exists matching the criteria.
+
+        This is a memory-efficient alternative to get_events() when you only
+        need to check for existence. Uses SQL EXISTS queries in SQL backends
+        for O(1) memory usage instead of loading all events.
+
+        Args:
+            run_id: Workflow run identifier
+            event_type: Event type to check for (e.g., "step_completed")
+            **filters: Additional filters to match against event data fields.
+                For example, step_id="abc" will check data->>'step_id' = 'abc'
+
+        Returns:
+            True if a matching event exists, False otherwise
+
+        Example:
+            # Check if step completed
+            exists = await storage.has_event(
+                run_id, "step_completed", step_id="step_123"
+            )
+
+            # Check if workflow suspended for a specific step
+            exists = await storage.has_event(
+                run_id, "workflow_suspended", step_id="step_123"
+            )
+        """
+        pass
+
     @abstractmethod
     async def get_latest_event(
         self,
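
The SQL backends (mysql.py, postgres.py, sqlite.py in the file list above) are not expanded in this view. Purely as an illustration of the EXISTS technique the docstring describes, a PostgreSQL-style implementation might look like the sketch below; the events table schema and the asyncpg pool attribute are assumptions, not taken from the package:

    async def has_event(self, run_id: str, event_type: str, **filters: str) -> bool:
        # Hypothetical schema: events(run_id TEXT, type TEXT, data JSONB).
        conditions = ["run_id = $1", "type = $2"]
        params: list[str] = [run_id, event_type]
        for key, value in filters.items():
            params.append(value)
            # Filter keys arrive as Python identifiers (kwargs), so interpolating
            # them into the statement is safe; values still use bind parameters.
            conditions.append(f"data->>'{key}' = ${len(params)}")
        query = "SELECT EXISTS (SELECT 1 FROM events WHERE " + " AND ".join(conditions) + ")"
        row = await self._pool.fetchrow(query, *params)  # hypothetical connection pool
        return bool(row[0])

Because EXISTS stops at the first matching row, memory use stays constant however long the event log grows, which is the motivation the base-class docstring gives.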
pyworkflow/storage/cassandra.py
CHANGED
@@ -896,6 +896,40 @@ class CassandraStorageBackend(StorageBackend):
 
         return None
 
+    async def has_event(
+        self,
+        run_id: str,
+        event_type: str,
+        **filters: str,
+    ) -> bool:
+        """
+        Check if an event exists matching the criteria.
+
+        Loads events of the specified type and filters in Python for efficiency.
+
+        Args:
+            run_id: Workflow run identifier
+            event_type: Event type to check for
+            **filters: Additional filters for event data fields
+
+        Returns:
+            True if a matching event exists, False otherwise
+        """
+        # Load only events of the specific type
+        events = await self.get_events(run_id, event_types=[event_type])
+
+        # Filter in Python
+        for event in events:
+            match = True
+            for key, value in filters.items():
+                if str(event.data.get(key)) != str(value):
+                    match = False
+                    break
+            if match:
+                return True
+
+        return False
+
     # Step Operations
 
     async def create_step(self, step: StepExecution) -> None:
pyworkflow/storage/dynamodb.py
CHANGED
@@ -588,6 +588,40 @@ class DynamoDBStorageBackend(StorageBackend):
 
         return self._item_to_event(self._item_to_dict(items[0]))
 
+    async def has_event(
+        self,
+        run_id: str,
+        event_type: str,
+        **filters: str,
+    ) -> bool:
+        """
+        Check if an event exists matching the criteria.
+
+        Loads events of the specified type and filters in Python for efficiency.
+
+        Args:
+            run_id: Workflow run identifier
+            event_type: Event type to check for
+            **filters: Additional filters for event data fields
+
+        Returns:
+            True if a matching event exists, False otherwise
+        """
+        # Load only events of the specific type
+        events = await self.get_events(run_id, event_types=[event_type])
+
+        # Filter in Python
+        for event in events:
+            match = True
+            for key, value in filters.items():
+                if str(event.data.get(key)) != str(value):
+                    match = False
+                    break
+            if match:
+                return True
+
+        return False
+
     # Step Operations
 
     async def create_step(self, step: StepExecution) -> None:
pyworkflow/storage/file.py
CHANGED
@@ -373,6 +373,58 @@ class FileStorageBackend(StorageBackend):
         events = await self.get_events(run_id, event_types=[event_type] if event_type else None)
         return events[-1] if events else None
 
+    async def has_event(
+        self,
+        run_id: str,
+        event_type: str,
+        **filters: str,
+    ) -> bool:
+        """
+        Check if an event exists using file-based iteration with early termination.
+
+        Reads the events file line by line and returns as soon as a match is found,
+        avoiding loading the entire event log into memory.
+
+        Args:
+            run_id: Workflow run identifier
+            event_type: Event type to check for
+            **filters: Additional filters for event data fields
+
+        Returns:
+            True if a matching event exists, False otherwise
+        """
+        events_file = self.events_dir / f"{run_id}.jsonl"
+
+        if not events_file.exists():
+            return False
+
+        def _check() -> bool:
+            with events_file.open("r") as f:
+                for line in f:
+                    if not line.strip():
+                        continue
+
+                    data = json.loads(line)
+
+                    # Check event type
+                    if data["type"] != event_type:
+                        continue
+
+                    # Check all data filters
+                    match = True
+                    event_data = data.get("data", {})
+                    for key, value in filters.items():
+                        if str(event_data.get(key)) != str(value):
+                            match = False
+                            break
+
+                    if match:
+                        return True
+
+            return False
+
+        return await asyncio.to_thread(_check)
+
     # Step Operations
 
     async def create_step(self, step: StepExecution) -> None:
pyworkflow/storage/memory.py
CHANGED
@@ -250,6 +250,43 @@ class InMemoryStorageBackend(StorageBackend):
         # Return event with highest sequence
         return max(events, key=lambda e: e.sequence or 0)
 
+    async def has_event(
+        self,
+        run_id: str,
+        event_type: str,
+        **filters: str,
+    ) -> bool:
+        """
+        Check if an event exists by loading events of the specific type and filtering.
+
+        This approach:
+        1. Uses the event_types filter to load only events of the target type
+        2. Filters in Python on the loaded data
+        3. Significantly reduces memory vs loading ALL events
+
+        Args:
+            run_id: Workflow run identifier
+            event_type: Event type to check for
+            **filters: Additional filters for event data fields
+
+        Returns:
+            True if a matching event exists, False otherwise
+        """
+        # Load only events of the specific type
+        events = await self.get_events(run_id, event_types=[event_type])
+
+        # Filter in Python
+        for event in events:
+            match = True
+            for key, value in filters.items():
+                if str(event.data.get(key)) != str(value):
+                    match = False
+                    break
+            if match:
+                return True
+
+        return False
+
     # Step Operations
 
     async def create_step(self, step: StepExecution) -> None:
pyworkflow/storage/migrations/__init__.py
ADDED
@@ -0,0 +1,15 @@
+"""
+Database schema migration framework for PyWorkflow storage backends.
+
+This module provides a migration framework that allows storage backends to
+evolve their schema over time while maintaining backward compatibility with
+existing databases.
+"""
+
+from pyworkflow.storage.migrations.base import (
+    Migration,
+    MigrationRegistry,
+    MigrationRunner,
+)
+
+__all__ = ["Migration", "MigrationRegistry", "MigrationRunner"]