pyworkflow-engine 0.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (196) hide show
  1. dashboard/backend/app/__init__.py +1 -0
  2. dashboard/backend/app/config.py +32 -0
  3. dashboard/backend/app/controllers/__init__.py +6 -0
  4. dashboard/backend/app/controllers/run_controller.py +86 -0
  5. dashboard/backend/app/controllers/workflow_controller.py +33 -0
  6. dashboard/backend/app/dependencies/__init__.py +5 -0
  7. dashboard/backend/app/dependencies/storage.py +50 -0
  8. dashboard/backend/app/repositories/__init__.py +6 -0
  9. dashboard/backend/app/repositories/run_repository.py +80 -0
  10. dashboard/backend/app/repositories/workflow_repository.py +27 -0
  11. dashboard/backend/app/rest/__init__.py +8 -0
  12. dashboard/backend/app/rest/v1/__init__.py +12 -0
  13. dashboard/backend/app/rest/v1/health.py +33 -0
  14. dashboard/backend/app/rest/v1/runs.py +133 -0
  15. dashboard/backend/app/rest/v1/workflows.py +41 -0
  16. dashboard/backend/app/schemas/__init__.py +23 -0
  17. dashboard/backend/app/schemas/common.py +16 -0
  18. dashboard/backend/app/schemas/event.py +24 -0
  19. dashboard/backend/app/schemas/hook.py +25 -0
  20. dashboard/backend/app/schemas/run.py +54 -0
  21. dashboard/backend/app/schemas/step.py +28 -0
  22. dashboard/backend/app/schemas/workflow.py +31 -0
  23. dashboard/backend/app/server.py +87 -0
  24. dashboard/backend/app/services/__init__.py +6 -0
  25. dashboard/backend/app/services/run_service.py +240 -0
  26. dashboard/backend/app/services/workflow_service.py +155 -0
  27. dashboard/backend/main.py +18 -0
  28. docs/concepts/cancellation.mdx +362 -0
  29. docs/concepts/continue-as-new.mdx +434 -0
  30. docs/concepts/events.mdx +266 -0
  31. docs/concepts/fault-tolerance.mdx +370 -0
  32. docs/concepts/hooks.mdx +552 -0
  33. docs/concepts/limitations.mdx +167 -0
  34. docs/concepts/schedules.mdx +775 -0
  35. docs/concepts/sleep.mdx +312 -0
  36. docs/concepts/steps.mdx +301 -0
  37. docs/concepts/workflows.mdx +255 -0
  38. docs/guides/cli.mdx +942 -0
  39. docs/guides/configuration.mdx +560 -0
  40. docs/introduction.mdx +155 -0
  41. docs/quickstart.mdx +279 -0
  42. examples/__init__.py +1 -0
  43. examples/celery/__init__.py +1 -0
  44. examples/celery/durable/docker-compose.yml +55 -0
  45. examples/celery/durable/pyworkflow.config.yaml +12 -0
  46. examples/celery/durable/workflows/__init__.py +122 -0
  47. examples/celery/durable/workflows/basic.py +87 -0
  48. examples/celery/durable/workflows/batch_processing.py +102 -0
  49. examples/celery/durable/workflows/cancellation.py +273 -0
  50. examples/celery/durable/workflows/child_workflow_patterns.py +240 -0
  51. examples/celery/durable/workflows/child_workflows.py +202 -0
  52. examples/celery/durable/workflows/continue_as_new.py +260 -0
  53. examples/celery/durable/workflows/fault_tolerance.py +210 -0
  54. examples/celery/durable/workflows/hooks.py +211 -0
  55. examples/celery/durable/workflows/idempotency.py +112 -0
  56. examples/celery/durable/workflows/long_running.py +99 -0
  57. examples/celery/durable/workflows/retries.py +101 -0
  58. examples/celery/durable/workflows/schedules.py +209 -0
  59. examples/celery/transient/01_basic_workflow.py +91 -0
  60. examples/celery/transient/02_fault_tolerance.py +257 -0
  61. examples/celery/transient/__init__.py +20 -0
  62. examples/celery/transient/pyworkflow.config.yaml +25 -0
  63. examples/local/__init__.py +1 -0
  64. examples/local/durable/01_basic_workflow.py +94 -0
  65. examples/local/durable/02_file_storage.py +132 -0
  66. examples/local/durable/03_retries.py +169 -0
  67. examples/local/durable/04_long_running.py +119 -0
  68. examples/local/durable/05_event_log.py +145 -0
  69. examples/local/durable/06_idempotency.py +148 -0
  70. examples/local/durable/07_hooks.py +334 -0
  71. examples/local/durable/08_cancellation.py +233 -0
  72. examples/local/durable/09_child_workflows.py +198 -0
  73. examples/local/durable/10_child_workflow_patterns.py +265 -0
  74. examples/local/durable/11_continue_as_new.py +249 -0
  75. examples/local/durable/12_schedules.py +198 -0
  76. examples/local/durable/__init__.py +1 -0
  77. examples/local/transient/01_quick_tasks.py +87 -0
  78. examples/local/transient/02_retries.py +130 -0
  79. examples/local/transient/03_sleep.py +141 -0
  80. examples/local/transient/__init__.py +1 -0
  81. pyworkflow/__init__.py +256 -0
  82. pyworkflow/aws/__init__.py +68 -0
  83. pyworkflow/aws/context.py +234 -0
  84. pyworkflow/aws/handler.py +184 -0
  85. pyworkflow/aws/testing.py +310 -0
  86. pyworkflow/celery/__init__.py +41 -0
  87. pyworkflow/celery/app.py +198 -0
  88. pyworkflow/celery/scheduler.py +315 -0
  89. pyworkflow/celery/tasks.py +1746 -0
  90. pyworkflow/cli/__init__.py +132 -0
  91. pyworkflow/cli/__main__.py +6 -0
  92. pyworkflow/cli/commands/__init__.py +1 -0
  93. pyworkflow/cli/commands/hooks.py +640 -0
  94. pyworkflow/cli/commands/quickstart.py +495 -0
  95. pyworkflow/cli/commands/runs.py +773 -0
  96. pyworkflow/cli/commands/scheduler.py +130 -0
  97. pyworkflow/cli/commands/schedules.py +794 -0
  98. pyworkflow/cli/commands/setup.py +703 -0
  99. pyworkflow/cli/commands/worker.py +413 -0
  100. pyworkflow/cli/commands/workflows.py +1257 -0
  101. pyworkflow/cli/output/__init__.py +1 -0
  102. pyworkflow/cli/output/formatters.py +321 -0
  103. pyworkflow/cli/output/styles.py +121 -0
  104. pyworkflow/cli/utils/__init__.py +1 -0
  105. pyworkflow/cli/utils/async_helpers.py +30 -0
  106. pyworkflow/cli/utils/config.py +130 -0
  107. pyworkflow/cli/utils/config_generator.py +344 -0
  108. pyworkflow/cli/utils/discovery.py +53 -0
  109. pyworkflow/cli/utils/docker_manager.py +651 -0
  110. pyworkflow/cli/utils/interactive.py +364 -0
  111. pyworkflow/cli/utils/storage.py +115 -0
  112. pyworkflow/config.py +329 -0
  113. pyworkflow/context/__init__.py +63 -0
  114. pyworkflow/context/aws.py +230 -0
  115. pyworkflow/context/base.py +416 -0
  116. pyworkflow/context/local.py +930 -0
  117. pyworkflow/context/mock.py +381 -0
  118. pyworkflow/core/__init__.py +0 -0
  119. pyworkflow/core/exceptions.py +353 -0
  120. pyworkflow/core/registry.py +313 -0
  121. pyworkflow/core/scheduled.py +328 -0
  122. pyworkflow/core/step.py +494 -0
  123. pyworkflow/core/workflow.py +294 -0
  124. pyworkflow/discovery.py +248 -0
  125. pyworkflow/engine/__init__.py +0 -0
  126. pyworkflow/engine/events.py +879 -0
  127. pyworkflow/engine/executor.py +682 -0
  128. pyworkflow/engine/replay.py +273 -0
  129. pyworkflow/observability/__init__.py +19 -0
  130. pyworkflow/observability/logging.py +234 -0
  131. pyworkflow/primitives/__init__.py +33 -0
  132. pyworkflow/primitives/child_handle.py +174 -0
  133. pyworkflow/primitives/child_workflow.py +372 -0
  134. pyworkflow/primitives/continue_as_new.py +101 -0
  135. pyworkflow/primitives/define_hook.py +150 -0
  136. pyworkflow/primitives/hooks.py +97 -0
  137. pyworkflow/primitives/resume_hook.py +210 -0
  138. pyworkflow/primitives/schedule.py +545 -0
  139. pyworkflow/primitives/shield.py +96 -0
  140. pyworkflow/primitives/sleep.py +100 -0
  141. pyworkflow/runtime/__init__.py +21 -0
  142. pyworkflow/runtime/base.py +179 -0
  143. pyworkflow/runtime/celery.py +310 -0
  144. pyworkflow/runtime/factory.py +101 -0
  145. pyworkflow/runtime/local.py +706 -0
  146. pyworkflow/scheduler/__init__.py +9 -0
  147. pyworkflow/scheduler/local.py +248 -0
  148. pyworkflow/serialization/__init__.py +0 -0
  149. pyworkflow/serialization/decoder.py +146 -0
  150. pyworkflow/serialization/encoder.py +162 -0
  151. pyworkflow/storage/__init__.py +54 -0
  152. pyworkflow/storage/base.py +612 -0
  153. pyworkflow/storage/config.py +185 -0
  154. pyworkflow/storage/dynamodb.py +1315 -0
  155. pyworkflow/storage/file.py +827 -0
  156. pyworkflow/storage/memory.py +549 -0
  157. pyworkflow/storage/postgres.py +1161 -0
  158. pyworkflow/storage/schemas.py +486 -0
  159. pyworkflow/storage/sqlite.py +1136 -0
  160. pyworkflow/utils/__init__.py +0 -0
  161. pyworkflow/utils/duration.py +177 -0
  162. pyworkflow/utils/schedule.py +391 -0
  163. pyworkflow_engine-0.1.7.dist-info/METADATA +687 -0
  164. pyworkflow_engine-0.1.7.dist-info/RECORD +196 -0
  165. pyworkflow_engine-0.1.7.dist-info/WHEEL +5 -0
  166. pyworkflow_engine-0.1.7.dist-info/entry_points.txt +2 -0
  167. pyworkflow_engine-0.1.7.dist-info/licenses/LICENSE +21 -0
  168. pyworkflow_engine-0.1.7.dist-info/top_level.txt +5 -0
  169. tests/examples/__init__.py +0 -0
  170. tests/integration/__init__.py +0 -0
  171. tests/integration/test_cancellation.py +330 -0
  172. tests/integration/test_child_workflows.py +439 -0
  173. tests/integration/test_continue_as_new.py +428 -0
  174. tests/integration/test_dynamodb_storage.py +1146 -0
  175. tests/integration/test_fault_tolerance.py +369 -0
  176. tests/integration/test_schedule_storage.py +484 -0
  177. tests/unit/__init__.py +0 -0
  178. tests/unit/backends/__init__.py +1 -0
  179. tests/unit/backends/test_dynamodb_storage.py +1554 -0
  180. tests/unit/backends/test_postgres_storage.py +1281 -0
  181. tests/unit/backends/test_sqlite_storage.py +1460 -0
  182. tests/unit/conftest.py +41 -0
  183. tests/unit/test_cancellation.py +364 -0
  184. tests/unit/test_child_workflows.py +680 -0
  185. tests/unit/test_continue_as_new.py +441 -0
  186. tests/unit/test_event_limits.py +316 -0
  187. tests/unit/test_executor.py +320 -0
  188. tests/unit/test_fault_tolerance.py +334 -0
  189. tests/unit/test_hooks.py +495 -0
  190. tests/unit/test_registry.py +261 -0
  191. tests/unit/test_replay.py +420 -0
  192. tests/unit/test_schedule_schemas.py +285 -0
  193. tests/unit/test_schedule_utils.py +286 -0
  194. tests/unit/test_scheduled_workflow.py +274 -0
  195. tests/unit/test_step.py +353 -0
  196. tests/unit/test_workflow.py +243 -0
@@ -0,0 +1,827 @@
1
+ """
2
+ File-based storage backend using JSON files.
3
+
4
+ This backend stores workflow data in local JSON files, suitable for:
5
+ - Development and testing
6
+ - Single-machine deployments
7
+ - Low-volume production use
8
+
9
+ Data is stored in a directory structure:
10
+ base_path/
11
+ runs/
12
+ {run_id}.json
13
+ events/
14
+ {run_id}.jsonl (append-only)
15
+ steps/
16
+ {step_id}.json
17
+ hooks/
18
+ {hook_id}.json
19
+ schedules/
20
+ {schedule_id}.json
21
+ _token_index.json (token -> hook_id mapping)
22
+ """
23
+
24
+ import asyncio
25
+ import json
26
+ from datetime import UTC, datetime
27
+ from pathlib import Path
28
+
29
+ from filelock import FileLock
30
+
31
+ from pyworkflow.engine.events import Event, EventType
32
+ from pyworkflow.storage.base import StorageBackend
33
+ from pyworkflow.storage.schemas import (
34
+ Hook,
35
+ HookStatus,
36
+ RunStatus,
37
+ Schedule,
38
+ ScheduleStatus,
39
+ StepExecution,
40
+ WorkflowRun,
41
+ )
42
+
43
+
44
class FileStorageBackend(StorageBackend):
    """
    File-based storage backend using JSON files.

    Runs, steps, hooks, and schedules are stored one-JSON-file-per-record
    under subdirectories of the base path; events are append-only JSON
    Lines files. Thread-safe using per-record file locks (kept under a
    ``.locks`` directory) for concurrent access, with blocking file I/O
    dispatched off the event loop via ``asyncio.to_thread``.
    """
50
+
51
+ def __init__(self, base_path: str = "./pyworkflow_data"):
52
+ """
53
+ Initialize file storage backend.
54
+
55
+ Args:
56
+ base_path: Base directory for storing workflow data
57
+ """
58
+ self.base_path = Path(base_path)
59
+ self.runs_dir = self.base_path / "runs"
60
+ self.events_dir = self.base_path / "events"
61
+ self.steps_dir = self.base_path / "steps"
62
+ self.hooks_dir = self.base_path / "hooks"
63
+ self.schedules_dir = self.base_path / "schedules"
64
+ self.locks_dir = self.base_path / ".locks"
65
+ self._token_index_file = self.base_path / "_token_index.json"
66
+
67
+ # Create directories
68
+ for dir_path in [
69
+ self.runs_dir,
70
+ self.events_dir,
71
+ self.steps_dir,
72
+ self.hooks_dir,
73
+ self.schedules_dir,
74
+ self.locks_dir,
75
+ ]:
76
+ dir_path.mkdir(parents=True, exist_ok=True)
77
+
78
+ # Workflow Run Operations
79
+
80
+ async def create_run(self, run: WorkflowRun) -> None:
81
+ """Create a new workflow run record."""
82
+ run_file = self.runs_dir / f"{run.run_id}.json"
83
+
84
+ if run_file.exists():
85
+ raise ValueError(f"Workflow run {run.run_id} already exists")
86
+
87
+ data = run.to_dict()
88
+
89
+ # Use file lock for thread safety
90
+ lock_file = self.locks_dir / f"{run.run_id}.lock"
91
+ lock = FileLock(str(lock_file))
92
+
93
+ def _write() -> None:
94
+ with lock:
95
+ run_file.write_text(json.dumps(data, indent=2))
96
+
97
+ await asyncio.to_thread(_write)
98
+
99
+ async def get_run(self, run_id: str) -> WorkflowRun | None:
100
+ """Retrieve a workflow run by ID."""
101
+ run_file = self.runs_dir / f"{run_id}.json"
102
+
103
+ if not run_file.exists():
104
+ return None
105
+
106
+ lock_file = self.locks_dir / f"{run_id}.lock"
107
+ lock = FileLock(str(lock_file))
108
+
109
+ def _read() -> dict | None:
110
+ with lock:
111
+ if not run_file.exists():
112
+ return None
113
+ content = run_file.read_text()
114
+ if not content.strip():
115
+ # File exists but is empty (race condition) - treat as not found
116
+ return None
117
+ return json.loads(content)
118
+
119
+ data = await asyncio.to_thread(_read)
120
+ return WorkflowRun.from_dict(data) if data else None
121
+
122
+ async def get_run_by_idempotency_key(self, key: str) -> WorkflowRun | None:
123
+ """Retrieve a workflow run by idempotency key."""
124
+
125
+ def _search() -> dict | None:
126
+ for run_file in self.runs_dir.glob("*.json"):
127
+ data = json.loads(run_file.read_text())
128
+ if data.get("idempotency_key") == key:
129
+ return data
130
+ return None
131
+
132
+ data = await asyncio.to_thread(_search)
133
+ return WorkflowRun.from_dict(data) if data else None
134
+
135
+ async def update_run_status(
136
+ self,
137
+ run_id: str,
138
+ status: RunStatus,
139
+ result: str | None = None,
140
+ error: str | None = None,
141
+ ) -> None:
142
+ """Update workflow run status."""
143
+ run_file = self.runs_dir / f"{run_id}.json"
144
+
145
+ if not run_file.exists():
146
+ raise ValueError(f"Workflow run {run_id} not found")
147
+
148
+ lock_file = self.locks_dir / f"{run_id}.lock"
149
+ lock = FileLock(str(lock_file))
150
+
151
+ def _update() -> None:
152
+ with lock:
153
+ data = json.loads(run_file.read_text())
154
+ data["status"] = status.value
155
+ data["updated_at"] = datetime.now(UTC).isoformat()
156
+
157
+ if result is not None:
158
+ data["result"] = result
159
+
160
+ if error is not None:
161
+ data["error"] = error
162
+
163
+ if status == RunStatus.COMPLETED:
164
+ data["completed_at"] = datetime.now(UTC).isoformat()
165
+
166
+ run_file.write_text(json.dumps(data, indent=2))
167
+
168
+ await asyncio.to_thread(_update)
169
+
170
+ async def update_run_recovery_attempts(
171
+ self,
172
+ run_id: str,
173
+ recovery_attempts: int,
174
+ ) -> None:
175
+ """Update the recovery attempts counter for a workflow run."""
176
+ run_file = self.runs_dir / f"{run_id}.json"
177
+
178
+ if not run_file.exists():
179
+ raise ValueError(f"Workflow run {run_id} not found")
180
+
181
+ lock_file = self.locks_dir / f"{run_id}.lock"
182
+ lock = FileLock(str(lock_file))
183
+
184
+ def _update() -> None:
185
+ with lock:
186
+ data = json.loads(run_file.read_text())
187
+ data["recovery_attempts"] = recovery_attempts
188
+ data["updated_at"] = datetime.now(UTC).isoformat()
189
+ run_file.write_text(json.dumps(data, indent=2))
190
+
191
+ await asyncio.to_thread(_update)
192
+
193
+ async def list_runs(
194
+ self,
195
+ query: str | None = None,
196
+ status: RunStatus | None = None,
197
+ start_time: datetime | None = None,
198
+ end_time: datetime | None = None,
199
+ limit: int = 100,
200
+ cursor: str | None = None,
201
+ ) -> tuple[list[WorkflowRun], str | None]:
202
+ """List workflow runs with optional filtering and cursor-based pagination."""
203
+
204
+ def _list() -> tuple[list[dict], str | None]:
205
+ runs = []
206
+ query_lower = query.lower() if query else None
207
+
208
+ for run_file in self.runs_dir.glob("*.json"):
209
+ data = json.loads(run_file.read_text())
210
+
211
+ # Apply query filter (case-insensitive substring in workflow_name or input_kwargs)
212
+ if query_lower:
213
+ workflow_name = data.get("workflow_name", "").lower()
214
+ input_kwargs = json.dumps(data.get("input_kwargs", {})).lower()
215
+ if query_lower not in workflow_name and query_lower not in input_kwargs:
216
+ continue
217
+
218
+ # Apply status filter
219
+ if status and data.get("status") != status.value:
220
+ continue
221
+
222
+ # Apply time filters (based on started_at)
223
+ started_at_str = data.get("started_at")
224
+ if started_at_str:
225
+ started_at = datetime.fromisoformat(started_at_str)
226
+ # Make timezone-aware comparison if needed
227
+ if start_time and started_at < start_time:
228
+ continue
229
+ if end_time and started_at >= end_time:
230
+ continue
231
+ elif start_time or end_time:
232
+ # If run hasn't started yet and we have time filters, skip it
233
+ continue
234
+
235
+ runs.append(data)
236
+
237
+ # Sort by (created_at DESC, run_id DESC) for deterministic ordering
238
+ runs.sort(key=lambda r: (r.get("created_at", ""), r.get("run_id", "")), reverse=True)
239
+
240
+ # Apply cursor-based pagination
241
+ if cursor:
242
+ # Find the cursor position and start after it
243
+ cursor_found = False
244
+ filtered_runs = []
245
+ for run in runs:
246
+ if cursor_found:
247
+ filtered_runs.append(run)
248
+ elif run.get("run_id") == cursor:
249
+ cursor_found = True
250
+ runs = filtered_runs
251
+
252
+ # Apply limit and determine next_cursor
253
+ if len(runs) > limit:
254
+ result_runs = runs[:limit]
255
+ next_cursor = result_runs[-1].get("run_id") if result_runs else None
256
+ else:
257
+ result_runs = runs[:limit]
258
+ next_cursor = None
259
+
260
+ return result_runs, next_cursor
261
+
262
+ run_data_list, next_cursor = await asyncio.to_thread(_list)
263
+ return [WorkflowRun.from_dict(data) for data in run_data_list], next_cursor
264
+
265
+ # Event Log Operations
266
+
267
    async def record_event(self, event: Event) -> None:
        """
        Record an event to the append-only event log.

        Side effect: mutates ``event.sequence`` in place before writing, so
        the caller's Event object reflects the assigned log position.

        NOTE(review): the next sequence number is derived by counting the
        existing non-blank lines on every append, making each write O(n)
        in the log length - presumably acceptable for the low-volume use
        this backend targets.
        """
        events_file = self.events_dir / f"{event.run_id}.jsonl"
        lock_file = self.locks_dir / f"events_{event.run_id}.lock"
        lock = FileLock(str(lock_file))

        def _append() -> None:
            with lock:
                # Get next sequence number (1 + count of non-blank lines).
                sequence = 1
                if events_file.exists():
                    with events_file.open("r") as f:
                        for line in f:
                            if line.strip():
                                sequence += 1

                event.sequence = sequence

                # Append event as a single JSON Lines record.
                event_data = {
                    "event_id": event.event_id,
                    "run_id": event.run_id,
                    "type": event.type.value,
                    "sequence": event.sequence,
                    "timestamp": event.timestamp.isoformat(),
                    "data": event.data,
                }

                with events_file.open("a") as f:
                    f.write(json.dumps(event_data) + "\n")

        await asyncio.to_thread(_append)
299
+
300
+ async def get_events(
301
+ self,
302
+ run_id: str,
303
+ event_types: list[str] | None = None,
304
+ ) -> list[Event]:
305
+ """Retrieve all events for a workflow run."""
306
+ events_file = self.events_dir / f"{run_id}.jsonl"
307
+
308
+ if not events_file.exists():
309
+ return []
310
+
311
+ def _read() -> list[Event]:
312
+ events = []
313
+ with events_file.open("r") as f:
314
+ for line in f:
315
+ if not line.strip():
316
+ continue
317
+
318
+ data = json.loads(line)
319
+
320
+ # Apply type filter
321
+ if event_types and data["type"] not in event_types:
322
+ continue
323
+
324
+ events.append(
325
+ Event(
326
+ event_id=data["event_id"],
327
+ run_id=data["run_id"],
328
+ type=EventType(data["type"]),
329
+ sequence=data["sequence"],
330
+ timestamp=datetime.fromisoformat(data["timestamp"]),
331
+ data=data["data"],
332
+ )
333
+ )
334
+
335
+ return sorted(events, key=lambda e: e.sequence or 0)
336
+
337
+ return await asyncio.to_thread(_read)
338
+
339
+ async def get_latest_event(
340
+ self,
341
+ run_id: str,
342
+ event_type: str | None = None,
343
+ ) -> Event | None:
344
+ """Get the latest event for a run."""
345
+ events = await self.get_events(run_id, event_types=[event_type] if event_type else None)
346
+ return events[-1] if events else None
347
+
348
+ # Step Operations
349
+
350
+ async def create_step(self, step: StepExecution) -> None:
351
+ """Create a step execution record."""
352
+ step_file = self.steps_dir / f"{step.step_id}.json"
353
+
354
+ if step_file.exists():
355
+ raise ValueError(f"Step {step.step_id} already exists")
356
+
357
+ data = step.to_dict()
358
+
359
+ def _write() -> None:
360
+ step_file.write_text(json.dumps(data, indent=2))
361
+
362
+ await asyncio.to_thread(_write)
363
+
364
+ async def get_step(self, step_id: str) -> StepExecution | None:
365
+ """Retrieve a step execution by ID."""
366
+ step_file = self.steps_dir / f"{step_id}.json"
367
+
368
+ if not step_file.exists():
369
+ return None
370
+
371
+ def _read() -> dict:
372
+ return json.loads(step_file.read_text())
373
+
374
+ data = await asyncio.to_thread(_read)
375
+ return StepExecution.from_dict(data)
376
+
377
+ async def update_step_status(
378
+ self,
379
+ step_id: str,
380
+ status: str,
381
+ result: str | None = None,
382
+ error: str | None = None,
383
+ ) -> None:
384
+ """Update step execution status."""
385
+ step_file = self.steps_dir / f"{step_id}.json"
386
+
387
+ if not step_file.exists():
388
+ raise ValueError(f"Step {step_id} not found")
389
+
390
+ def _update() -> None:
391
+ data = json.loads(step_file.read_text())
392
+ data["status"] = status
393
+ data["updated_at"] = datetime.utcnow().isoformat()
394
+
395
+ if result is not None:
396
+ data["result"] = result
397
+
398
+ if error is not None:
399
+ data["error"] = error
400
+
401
+ if status == "completed":
402
+ data["completed_at"] = datetime.utcnow().isoformat()
403
+
404
+ step_file.write_text(json.dumps(data, indent=2))
405
+
406
+ await asyncio.to_thread(_update)
407
+
408
+ async def list_steps(self, run_id: str) -> list[StepExecution]:
409
+ """List all steps for a workflow run."""
410
+
411
+ def _list() -> list[dict]:
412
+ steps = []
413
+ for step_file in self.steps_dir.glob("*.json"):
414
+ data = json.loads(step_file.read_text())
415
+ if data.get("run_id") == run_id:
416
+ steps.append(data)
417
+
418
+ # Sort by created_at
419
+ steps.sort(key=lambda s: s.get("created_at", ""))
420
+ return steps
421
+
422
+ step_data_list = await asyncio.to_thread(_list)
423
+ return [StepExecution.from_dict(data) for data in step_data_list]
424
+
425
+ # Hook Operations
426
+
427
+ def _load_token_index(self) -> dict:
428
+ """Load the token -> hook_id index."""
429
+ if self._token_index_file.exists():
430
+ return json.loads(self._token_index_file.read_text())
431
+ return {}
432
+
433
+ def _save_token_index(self, index: dict) -> None:
434
+ """Save the token -> hook_id index."""
435
+ self._token_index_file.write_text(json.dumps(index, indent=2))
436
+
437
+ async def create_hook(self, hook: Hook) -> None:
438
+ """Create a hook record."""
439
+ hook_file = self.hooks_dir / f"{hook.hook_id}.json"
440
+ lock_file = self.locks_dir / "token_index.lock"
441
+ lock = FileLock(str(lock_file))
442
+
443
+ data = hook.to_dict()
444
+
445
+ def _write() -> None:
446
+ with lock:
447
+ hook_file.write_text(json.dumps(data, indent=2))
448
+ # Update token index
449
+ index = self._load_token_index()
450
+ index[hook.token] = hook.hook_id
451
+ self._save_token_index(index)
452
+
453
+ await asyncio.to_thread(_write)
454
+
455
+ async def get_hook(self, hook_id: str) -> Hook | None:
456
+ """Retrieve a hook by ID."""
457
+ hook_file = self.hooks_dir / f"{hook_id}.json"
458
+
459
+ if not hook_file.exists():
460
+ return None
461
+
462
+ def _read() -> dict:
463
+ return json.loads(hook_file.read_text())
464
+
465
+ data = await asyncio.to_thread(_read)
466
+ return Hook.from_dict(data)
467
+
468
+ async def get_hook_by_token(self, token: str) -> Hook | None:
469
+ """Retrieve a hook by its token."""
470
+
471
+ def _lookup() -> str | None:
472
+ index = self._load_token_index()
473
+ return index.get(token)
474
+
475
+ hook_id = await asyncio.to_thread(_lookup)
476
+ if hook_id:
477
+ return await self.get_hook(hook_id)
478
+ return None
479
+
480
+ async def update_hook_status(
481
+ self,
482
+ hook_id: str,
483
+ status: HookStatus,
484
+ payload: str | None = None,
485
+ ) -> None:
486
+ """Update hook status and optionally payload."""
487
+ hook_file = self.hooks_dir / f"{hook_id}.json"
488
+
489
+ if not hook_file.exists():
490
+ raise ValueError(f"Hook {hook_id} not found")
491
+
492
+ lock_file = self.locks_dir / f"hook_{hook_id}.lock"
493
+ lock = FileLock(str(lock_file))
494
+
495
+ def _update() -> None:
496
+ with lock:
497
+ data = json.loads(hook_file.read_text())
498
+ data["status"] = status.value
499
+
500
+ if payload is not None:
501
+ data["payload"] = payload
502
+
503
+ if status == HookStatus.RECEIVED:
504
+ data["received_at"] = datetime.now(UTC).isoformat()
505
+
506
+ hook_file.write_text(json.dumps(data, indent=2))
507
+
508
+ await asyncio.to_thread(_update)
509
+
510
+ async def list_hooks(
511
+ self,
512
+ run_id: str | None = None,
513
+ status: HookStatus | None = None,
514
+ limit: int = 100,
515
+ offset: int = 0,
516
+ ) -> list[Hook]:
517
+ """List hooks with optional filtering."""
518
+
519
+ def _list() -> list[dict]:
520
+ hooks = []
521
+ for hook_file in self.hooks_dir.glob("*.json"):
522
+ data = json.loads(hook_file.read_text())
523
+
524
+ # Apply filters
525
+ if run_id and data.get("run_id") != run_id:
526
+ continue
527
+ if status and data.get("status") != status.value:
528
+ continue
529
+
530
+ hooks.append(data)
531
+
532
+ # Sort by created_at descending
533
+ hooks.sort(key=lambda h: h.get("created_at", ""), reverse=True)
534
+
535
+ # Apply pagination
536
+ return hooks[offset : offset + limit]
537
+
538
+ hook_data_list = await asyncio.to_thread(_list)
539
+ return [Hook.from_dict(data) for data in hook_data_list]
540
+
541
+ # Cancellation Flag Operations
542
+
543
+ async def set_cancellation_flag(self, run_id: str) -> None:
544
+ """Set a cancellation flag for a workflow run."""
545
+ cancel_file = self.runs_dir / f"{run_id}.cancel"
546
+ lock_file = self.locks_dir / f"{run_id}_cancel.lock"
547
+ lock = FileLock(str(lock_file))
548
+
549
+ def _write() -> None:
550
+ with lock:
551
+ cancel_file.write_text(datetime.now(UTC).isoformat())
552
+
553
+ await asyncio.to_thread(_write)
554
+
555
+ async def check_cancellation_flag(self, run_id: str) -> bool:
556
+ """Check if a cancellation flag is set for a workflow run."""
557
+ cancel_file = self.runs_dir / f"{run_id}.cancel"
558
+
559
+ def _check() -> bool:
560
+ return cancel_file.exists()
561
+
562
+ return await asyncio.to_thread(_check)
563
+
564
+ async def clear_cancellation_flag(self, run_id: str) -> None:
565
+ """Clear the cancellation flag for a workflow run."""
566
+ cancel_file = self.runs_dir / f"{run_id}.cancel"
567
+ lock_file = self.locks_dir / f"{run_id}_cancel.lock"
568
+ lock = FileLock(str(lock_file))
569
+
570
+ def _clear() -> None:
571
+ with lock:
572
+ if cancel_file.exists():
573
+ cancel_file.unlink()
574
+
575
+ await asyncio.to_thread(_clear)
576
+
577
+ # Continue-As-New Chain Operations
578
+
579
+ async def update_run_continuation(
580
+ self,
581
+ run_id: str,
582
+ continued_to_run_id: str,
583
+ ) -> None:
584
+ """Update the continuation link for a workflow run."""
585
+ run_file = self.runs_dir / f"{run_id}.json"
586
+
587
+ if not run_file.exists():
588
+ raise ValueError(f"Workflow run {run_id} not found")
589
+
590
+ lock_file = self.locks_dir / f"{run_id}.lock"
591
+ lock = FileLock(str(lock_file))
592
+
593
+ def _update() -> None:
594
+ with lock:
595
+ data = json.loads(run_file.read_text())
596
+ data["continued_to_run_id"] = continued_to_run_id
597
+ data["updated_at"] = datetime.now(UTC).isoformat()
598
+ run_file.write_text(json.dumps(data, indent=2))
599
+
600
+ await asyncio.to_thread(_update)
601
+
602
+ async def get_workflow_chain(
603
+ self,
604
+ run_id: str,
605
+ ) -> list[WorkflowRun]:
606
+ """Get all runs in a continue-as-new chain."""
607
+ run = await self.get_run(run_id)
608
+ if not run:
609
+ return []
610
+
611
+ # Walk backwards to find the start of the chain
612
+ current = run
613
+ while current.continued_from_run_id:
614
+ prev = await self.get_run(current.continued_from_run_id)
615
+ if not prev:
616
+ break
617
+ current = prev
618
+
619
+ # Build chain from start to end
620
+ chain = [current]
621
+ while current.continued_to_run_id:
622
+ next_run = await self.get_run(current.continued_to_run_id)
623
+ if not next_run:
624
+ break
625
+ chain.append(next_run)
626
+ current = next_run
627
+
628
+ return chain
629
+
630
+ # Child Workflow Operations
631
+
632
+ async def get_children(
633
+ self,
634
+ parent_run_id: str,
635
+ status: RunStatus | None = None,
636
+ ) -> list[WorkflowRun]:
637
+ """Get all child workflow runs for a parent workflow."""
638
+
639
+ def _list() -> list[dict]:
640
+ children = []
641
+ for run_file in self.runs_dir.glob("*.json"):
642
+ data = json.loads(run_file.read_text())
643
+
644
+ # Filter by parent_run_id
645
+ if data.get("parent_run_id") != parent_run_id:
646
+ continue
647
+
648
+ # Filter by status if provided
649
+ if status and data.get("status") != status.value:
650
+ continue
651
+
652
+ children.append(data)
653
+
654
+ # Sort by created_at
655
+ children.sort(key=lambda r: r.get("created_at", ""))
656
+ return children
657
+
658
+ child_data_list = await asyncio.to_thread(_list)
659
+ return [WorkflowRun.from_dict(data) for data in child_data_list]
660
+
661
+ async def get_parent(self, run_id: str) -> WorkflowRun | None:
662
+ """Get the parent workflow run for a child workflow."""
663
+ run = await self.get_run(run_id)
664
+ if run and run.parent_run_id:
665
+ return await self.get_run(run.parent_run_id)
666
+ return None
667
+
668
+ async def get_nesting_depth(self, run_id: str) -> int:
669
+ """Get the nesting depth for a workflow."""
670
+ run = await self.get_run(run_id)
671
+ return run.nesting_depth if run else 0
672
+
673
+ # Schedule Operations
674
+
675
+ async def create_schedule(self, schedule: Schedule) -> None:
676
+ """Create a new schedule record."""
677
+ schedule_file = self.schedules_dir / f"{schedule.schedule_id}.json"
678
+
679
+ if schedule_file.exists():
680
+ raise ValueError(f"Schedule {schedule.schedule_id} already exists")
681
+
682
+ data = schedule.to_dict()
683
+
684
+ lock_file = self.locks_dir / f"schedule_{schedule.schedule_id}.lock"
685
+ lock = FileLock(str(lock_file))
686
+
687
+ def _write() -> None:
688
+ with lock:
689
+ schedule_file.write_text(json.dumps(data, indent=2))
690
+
691
+ await asyncio.to_thread(_write)
692
+
693
+ async def get_schedule(self, schedule_id: str) -> Schedule | None:
694
+ """Retrieve a schedule by ID."""
695
+ schedule_file = self.schedules_dir / f"{schedule_id}.json"
696
+
697
+ if not schedule_file.exists():
698
+ return None
699
+
700
+ lock_file = self.locks_dir / f"schedule_{schedule_id}.lock"
701
+ lock = FileLock(str(lock_file))
702
+
703
+ def _read() -> dict | None:
704
+ with lock:
705
+ if not schedule_file.exists():
706
+ return None
707
+ return json.loads(schedule_file.read_text())
708
+
709
+ data = await asyncio.to_thread(_read)
710
+ return Schedule.from_dict(data) if data else None
711
+
712
+ async def update_schedule(self, schedule: Schedule) -> None:
713
+ """Update an existing schedule."""
714
+ schedule_file = self.schedules_dir / f"{schedule.schedule_id}.json"
715
+
716
+ if not schedule_file.exists():
717
+ raise ValueError(f"Schedule {schedule.schedule_id} does not exist")
718
+
719
+ data = schedule.to_dict()
720
+
721
+ lock_file = self.locks_dir / f"schedule_{schedule.schedule_id}.lock"
722
+ lock = FileLock(str(lock_file))
723
+
724
+ def _write() -> None:
725
+ with lock:
726
+ schedule_file.write_text(json.dumps(data, indent=2))
727
+
728
+ await asyncio.to_thread(_write)
729
+
730
+ async def delete_schedule(self, schedule_id: str) -> None:
731
+ """Mark a schedule as deleted (soft delete)."""
732
+ schedule = await self.get_schedule(schedule_id)
733
+
734
+ if not schedule:
735
+ raise ValueError(f"Schedule {schedule_id} does not exist")
736
+
737
+ schedule.status = ScheduleStatus.DELETED
738
+ schedule.updated_at = datetime.now(UTC)
739
+ await self.update_schedule(schedule)
740
+
741
+ async def list_schedules(
742
+ self,
743
+ workflow_name: str | None = None,
744
+ status: ScheduleStatus | None = None,
745
+ limit: int = 100,
746
+ offset: int = 0,
747
+ ) -> list[Schedule]:
748
+ """List schedules with optional filtering."""
749
+
750
+ def _list() -> list[dict]:
751
+ schedules = []
752
+ for schedule_file in self.schedules_dir.glob("*.json"):
753
+ try:
754
+ data = json.loads(schedule_file.read_text())
755
+
756
+ # Apply filters
757
+ if workflow_name and data.get("workflow_name") != workflow_name:
758
+ continue
759
+ if status and data.get("status") != status.value:
760
+ continue
761
+
762
+ schedules.append(data)
763
+ except (json.JSONDecodeError, KeyError):
764
+ continue
765
+
766
+ # Sort by created_at descending
767
+ schedules.sort(key=lambda x: x.get("created_at", ""), reverse=True)
768
+
769
+ # Apply pagination
770
+ return schedules[offset : offset + limit]
771
+
772
+ schedule_data_list = await asyncio.to_thread(_list)
773
+ return [Schedule.from_dict(data) for data in schedule_data_list]
774
+
775
    async def get_due_schedules(self, now: datetime) -> list[Schedule]:
        """
        Get all schedules that are due to run.

        A schedule is due when it is ACTIVE and its ``next_run_time`` is at
        or before *now*. Results are sorted by ``next_run_time`` ascending.

        NOTE(review): due-ness is decided by comparing ISO-8601 strings
        lexicographically, which is only correct if every stored
        ``next_run_time`` and *now* use the same timezone/offset format -
        confirm all writers stamp timestamps consistently.
        """
        now_iso = now.isoformat()

        def _list_due() -> list[dict]:
            due_schedules = []
            for schedule_file in self.schedules_dir.glob("*.json"):
                try:
                    data = json.loads(schedule_file.read_text())

                    # Check criteria: ACTIVE, has a next_run_time, and due.
                    if data.get("status") != ScheduleStatus.ACTIVE.value:
                        continue
                    next_run = data.get("next_run_time")
                    if not next_run:
                        continue
                    if next_run > now_iso:
                        continue

                    due_schedules.append(data)
                except (json.JSONDecodeError, KeyError):
                    # Unreadable record - skip it rather than fail the scan.
                    continue

            # Sort by next_run_time ascending
            due_schedules.sort(key=lambda x: x.get("next_run_time", ""))
            return due_schedules

        schedule_data_list = await asyncio.to_thread(_list_due)
        return [Schedule.from_dict(data) for data in schedule_data_list]
804
+
805
+ async def add_running_run(self, schedule_id: str, run_id: str) -> None:
806
+ """Add a run_id to the schedule's running_run_ids list."""
807
+ schedule = await self.get_schedule(schedule_id)
808
+
809
+ if not schedule:
810
+ raise ValueError(f"Schedule {schedule_id} does not exist")
811
+
812
+ if run_id not in schedule.running_run_ids:
813
+ schedule.running_run_ids.append(run_id)
814
+ schedule.updated_at = datetime.now(UTC)
815
+ await self.update_schedule(schedule)
816
+
817
+ async def remove_running_run(self, schedule_id: str, run_id: str) -> None:
818
+ """Remove a run_id from the schedule's running_run_ids list."""
819
+ schedule = await self.get_schedule(schedule_id)
820
+
821
+ if not schedule:
822
+ raise ValueError(f"Schedule {schedule_id} does not exist")
823
+
824
+ if run_id in schedule.running_run_ids:
825
+ schedule.running_run_ids.remove(run_id)
826
+ schedule.updated_at = datetime.now(UTC)
827
+ await self.update_schedule(schedule)