hatchet-sdk 1.12.3__py3-none-any.whl → 1.13.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

Files changed (48)
  1. hatchet_sdk/__init__.py +46 -40
  2. hatchet_sdk/clients/admin.py +18 -23
  3. hatchet_sdk/clients/dispatcher/action_listener.py +4 -3
  4. hatchet_sdk/clients/dispatcher/dispatcher.py +1 -4
  5. hatchet_sdk/clients/event_ts.py +2 -1
  6. hatchet_sdk/clients/events.py +16 -12
  7. hatchet_sdk/clients/listeners/durable_event_listener.py +4 -2
  8. hatchet_sdk/clients/listeners/pooled_listener.py +2 -2
  9. hatchet_sdk/clients/listeners/run_event_listener.py +7 -8
  10. hatchet_sdk/clients/listeners/workflow_listener.py +14 -6
  11. hatchet_sdk/clients/rest/api_response.py +3 -2
  12. hatchet_sdk/clients/rest/tenacity_utils.py +6 -8
  13. hatchet_sdk/config.py +2 -0
  14. hatchet_sdk/connection.py +10 -4
  15. hatchet_sdk/context/context.py +170 -46
  16. hatchet_sdk/context/worker_context.py +4 -7
  17. hatchet_sdk/contracts/dispatcher_pb2.py +38 -38
  18. hatchet_sdk/contracts/dispatcher_pb2.pyi +4 -2
  19. hatchet_sdk/contracts/events_pb2.py +13 -13
  20. hatchet_sdk/contracts/events_pb2.pyi +4 -2
  21. hatchet_sdk/contracts/v1/workflows_pb2.py +1 -1
  22. hatchet_sdk/contracts/v1/workflows_pb2.pyi +2 -2
  23. hatchet_sdk/exceptions.py +99 -1
  24. hatchet_sdk/features/cron.py +2 -2
  25. hatchet_sdk/features/filters.py +3 -3
  26. hatchet_sdk/features/runs.py +4 -4
  27. hatchet_sdk/features/scheduled.py +8 -9
  28. hatchet_sdk/hatchet.py +65 -64
  29. hatchet_sdk/opentelemetry/instrumentor.py +20 -20
  30. hatchet_sdk/runnables/action.py +1 -2
  31. hatchet_sdk/runnables/contextvars.py +19 -0
  32. hatchet_sdk/runnables/task.py +37 -29
  33. hatchet_sdk/runnables/types.py +9 -8
  34. hatchet_sdk/runnables/workflow.py +57 -42
  35. hatchet_sdk/utils/proto_enums.py +4 -4
  36. hatchet_sdk/utils/timedelta_to_expression.py +2 -3
  37. hatchet_sdk/utils/typing.py +11 -17
  38. hatchet_sdk/waits.py +6 -5
  39. hatchet_sdk/worker/action_listener_process.py +33 -13
  40. hatchet_sdk/worker/runner/run_loop_manager.py +15 -11
  41. hatchet_sdk/worker/runner/runner.py +102 -92
  42. hatchet_sdk/worker/runner/utils/capture_logs.py +72 -31
  43. hatchet_sdk/worker/worker.py +29 -25
  44. hatchet_sdk/workflow_run.py +4 -2
  45. {hatchet_sdk-1.12.3.dist-info → hatchet_sdk-1.13.0.dist-info}/METADATA +1 -1
  46. {hatchet_sdk-1.12.3.dist-info → hatchet_sdk-1.13.0.dist-info}/RECORD +48 -48
  47. {hatchet_sdk-1.12.3.dist-info → hatchet_sdk-1.13.0.dist-info}/WHEEL +0 -0
  48. {hatchet_sdk-1.12.3.dist-info → hatchet_sdk-1.13.0.dist-info}/entry_points.txt +0 -0
hatchet_sdk/utils/typing.py CHANGED
@@ -1,20 +1,11 @@
 import sys
-from typing import (
-    Any,
-    Awaitable,
-    Coroutine,
-    Generator,
-    Mapping,
-    Type,
-    TypeAlias,
-    TypeGuard,
-    TypeVar,
-)
+from collections.abc import Awaitable, Coroutine, Generator
+from typing import Any, Literal, TypeAlias, TypeGuard, TypeVar
 
 from pydantic import BaseModel
 
 
-def is_basemodel_subclass(model: Any) -> TypeGuard[Type[BaseModel]]:
+def is_basemodel_subclass(model: Any) -> TypeGuard[type[BaseModel]]:
     try:
         return issubclass(model, BaseModel)
     except TypeError:
@@ -22,18 +13,21 @@ def is_basemodel_subclass(model: Any) -> TypeGuard[Type[BaseModel]]:
 
 
 class TaskIOValidator(BaseModel):
-    workflow_input: Type[BaseModel] | None = None
-    step_output: Type[BaseModel] | None = None
+    workflow_input: type[BaseModel] | None = None
+    step_output: type[BaseModel] | None = None
 
 
-JSONSerializableMapping = Mapping[str, Any]
+JSONSerializableMapping = dict[str, Any]
 
 
 _T_co = TypeVar("_T_co", covariant=True)
 
 if sys.version_info >= (3, 12):
-    AwaitableLike: TypeAlias = Awaitable[_T_co]  # noqa: Y047
-    CoroutineLike: TypeAlias = Coroutine[Any, Any, _T_co]  # noqa: Y047
+    AwaitableLike: TypeAlias = Awaitable[_T_co]
+    CoroutineLike: TypeAlias = Coroutine[Any, Any, _T_co]
 else:
     AwaitableLike: TypeAlias = Generator[Any, None, _T_co] | Awaitable[_T_co]
     CoroutineLike: TypeAlias = Generator[Any, None, _T_co] | Coroutine[Any, Any, _T_co]
+
+STOP_LOOP_TYPE = Literal["STOP_LOOP"]
+STOP_LOOP: STOP_LOOP_TYPE = "STOP_LOOP"  # Sentinel object to stop the loop
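The STOP_LOOP sentinel, previously duplicated in action_listener_process.py and run_loop_manager.py (removed there later in this diff), now has a single home here. Typing the sentinel as a Literal lets queue consumers narrow the element type after an equality check. A minimal sketch of the pattern; the queue and consumer below are illustrative, not SDK code:

```python
from queue import Queue
from typing import Literal

STOP_LOOP_TYPE = Literal["STOP_LOOP"]
STOP_LOOP: STOP_LOOP_TYPE = "STOP_LOOP"  # sentinel pushed by producers to end the loop

def consume(q: "Queue[int | STOP_LOOP_TYPE]") -> None:
    while True:
        item = q.get()
        if item == STOP_LOOP:
            break  # checkers like pyright narrow `item` to int past this check
        print(f"processing {item}")

q: "Queue[int | STOP_LOOP_TYPE]" = Queue()
q.put(1)
q.put(STOP_LOOP)
consume(q)
```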
hatchet_sdk/waits.py CHANGED
@@ -6,6 +6,7 @@ from uuid import uuid4
 
 from pydantic import BaseModel, Field
 
+from hatchet_sdk.config import ClientConfig
 from hatchet_sdk.contracts.v1.shared.condition_pb2 import Action as ProtoAction
 from hatchet_sdk.contracts.v1.shared.condition_pb2 import (
     BaseMatchCondition,
@@ -53,7 +54,7 @@ class Condition(ABC):
 
     @abstractmethod
     def to_proto(
-        self,
+        self, config: ClientConfig
     ) -> UserEventMatchCondition | ParentOverrideMatchCondition | SleepMatchCondition:
         pass
 
@@ -71,7 +72,7 @@ class SleepCondition(Condition):
 
         self.duration = duration
 
-    def to_proto(self) -> SleepMatchCondition:
+    def to_proto(self, config: ClientConfig) -> SleepMatchCondition:
         return SleepMatchCondition(
             base=self.base.to_proto(),
             sleep_for=timedelta_to_expr(self.duration),
@@ -95,10 +96,10 @@ class UserEventCondition(Condition):
         self.event_key = event_key
         self.expression = expression
 
-    def to_proto(self) -> UserEventMatchCondition:
+    def to_proto(self, config: ClientConfig) -> UserEventMatchCondition:
         return UserEventMatchCondition(
             base=self.base.to_proto(),
-            user_event_key=self.event_key,
+            user_event_key=config.apply_namespace(self.event_key),
         )
 
 
@@ -124,7 +125,7 @@ class ParentCondition(Condition):
 
         self.parent = parent
 
-    def to_proto(self) -> ParentOverrideMatchCondition:
+    def to_proto(self, config: ClientConfig) -> ParentOverrideMatchCondition:
         return ParentOverrideMatchCondition(
             base=self.base.to_proto(),
             parent_readable_id=self.parent.name,
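Condition.to_proto now takes the ClientConfig so that UserEventCondition can apply the tenant namespace to event keys, matching how published events are keyed. The implementation of apply_namespace is not part of this diff; a hedged sketch of what such a helper typically does, with the class stub and prefixing rule assumed:

```python
class ClientConfig:
    # Illustrative stand-in for hatchet_sdk.config.ClientConfig; only the
    # namespacing behavior is sketched, and the exact rule is an assumption.
    def __init__(self, namespace: str = "") -> None:
        self.namespace = namespace

    def apply_namespace(self, key: str) -> str:
        # Prefix the key with the namespace unless it is already prefixed.
        if not self.namespace or key.startswith(self.namespace):
            return key
        return f"{self.namespace}{key}"

print(ClientConfig(namespace="dev_").apply_namespace("order:created"))
# dev_order:created
```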
hatchet_sdk/worker/action_listener_process.py CHANGED
@@ -4,9 +4,10 @@ import signal
 import time
 from dataclasses import dataclass
 from multiprocessing import Queue
-from typing import Any, Literal
+from typing import Any
 
 import grpc
+from grpc.aio import UnaryUnaryCall
 
 from hatchet_sdk.client import Client
 from hatchet_sdk.clients.dispatcher.action_listener import (
@@ -19,6 +20,9 @@ from hatchet_sdk.config import ClientConfig
 from hatchet_sdk.contracts.dispatcher_pb2 import (
     GROUP_KEY_EVENT_TYPE_STARTED,
     STEP_EVENT_TYPE_STARTED,
+    ActionEventResponse,
+    GroupKeyActionEvent,
+    StepActionEvent,
 )
 from hatchet_sdk.logger import logger
 from hatchet_sdk.runnables.action import Action, ActionType
@@ -29,6 +33,7 @@ from hatchet_sdk.runnables.contextvars import (
     ctx_workflow_run_id,
 )
 from hatchet_sdk.utils.backoff import exp_backoff_sleep
+from hatchet_sdk.utils.typing import STOP_LOOP, STOP_LOOP_TYPE
 
 ACTION_EVENT_RETRY_COUNT = 5
 
@@ -41,9 +46,6 @@ class ActionEvent:
     should_not_retry: bool
 
 
-STOP_LOOP_TYPE = Literal["STOP_LOOP"]
-STOP_LOOP: STOP_LOOP_TYPE = "STOP_LOOP"  # Sentinel object to stop the loop
-
 BLOCKED_THREAD_WARNING = "THE TIME TO START THE TASK RUN IS TOO LONG, THE EVENT LOOP MAY BE BLOCKED. See https://docs.hatchet.run/blog/warning-event-loop-blocked for details and debugging help."
 
 
@@ -56,9 +58,9 @@ class WorkerActionListenerProcess:
         config: ClientConfig,
         action_queue: "Queue[Action]",
         event_queue: "Queue[ActionEvent | STOP_LOOP_TYPE]",
-        handle_kill: bool = True,
-        debug: bool = False,
-        labels: dict[str, str | int] = {},
+        handle_kill: bool,
+        debug: bool,
+        labels: dict[str, str | int],
     ) -> None:
         self.name = name
         self.actions = actions
@@ -75,6 +77,14 @@
         self.action_loop_task: asyncio.Task[None] | None = None
         self.event_send_loop_task: asyncio.Task[None] | None = None
         self.running_step_runs: dict[str, float] = {}
+        self.step_action_events: set[
+            asyncio.Task[UnaryUnaryCall[StepActionEvent, ActionEventResponse] | None]
+        ] = set()
+        self.group_key_action_events: set[
+            asyncio.Task[
+                UnaryUnaryCall[GroupKeyActionEvent, ActionEventResponse] | None
+            ]
+        ] = set()
 
         if self.debug:
             logger.setLevel(logging.DEBUG)
@@ -144,20 +154,21 @@
                 break
 
             logger.debug(f"tx: event: {event.action.action_id}/{event.type}")
-            asyncio.create_task(self.send_event(event))
+            t = asyncio.create_task(self.send_event(event))
+            self.step_action_events.add(t)
+            t.add_done_callback(lambda t: self.step_action_events.discard(t))
 
     async def start_blocked_main_loop(self) -> None:
         threshold = 1
         while not self.killing:
             count = 0
-            for _, start_time in self.running_step_runs.items():
+            for start_time in self.running_step_runs.values():
                 diff = self.now() - start_time
                 if diff > threshold:
                     count += 1
 
             if count > 0:
                 logger.warning(f"{BLOCKED_THREAD_WARNING}: Waiting Steps {count}")
-                print(asyncio.current_task())
             await asyncio.sleep(1)
 
     async def send_event(self, event: ActionEvent, retry_attempt: int = 1) -> None:
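start_blocked_main_loop is the watchdog behind BLOCKED_THREAD_WARNING above: it compares wall-clock time against the recorded start times of pending step runs, and the stray print(asyncio.current_task()) debug line is now removed. A self-contained sketch of the underlying idea, detecting a blocked loop by measuring how late asyncio.sleep resumes (illustrative only, not the SDK's exact code):

```python
import asyncio
import time

async def watchdog(interval: float = 1.0, tolerance: float = 0.5) -> None:
    while True:
        start = time.monotonic()
        await asyncio.sleep(interval)
        # If sync work blocked the loop thread, sleep() resumes late.
        lag = time.monotonic() - start - interval
        if lag > tolerance:
            print(f"event loop was blocked for ~{lag:.2f}s")

async def main() -> None:
    wd = asyncio.create_task(watchdog())
    await asyncio.sleep(0.1)
    time.sleep(2)  # simulate blocking synchronous work on the loop thread
    await asyncio.sleep(1.5)  # let the watchdog wake up and report
    wd.cancel()

asyncio.run(main())
```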
@@ -187,7 +198,7 @@
                             self.now()
                         )
 
-                    asyncio.create_task(
+                    send_started_event_task = asyncio.create_task(
                         self.dispatcher_client.send_step_action_event(
                             event.action,
                             event.type,
@@ -195,14 +206,23 @@
                             event.should_not_retry,
                         )
                     )
+
+                    self.step_action_events.add(send_started_event_task)
+                    send_started_event_task.add_done_callback(
+                        lambda t: self.step_action_events.discard(t)
+                    )
                 case ActionType.CANCEL_STEP_RUN:
                     logger.debug("unimplemented event send")
                 case ActionType.START_GET_GROUP_KEY:
-                    asyncio.create_task(
+                    get_group_key_task = asyncio.create_task(
                         self.dispatcher_client.send_group_key_action_event(
                             event.action, event.type, event.payload
                         )
                     )
+                    self.group_key_action_events.add(get_group_key_task)
+                    get_group_key_task.add_done_callback(
+                        lambda t: self.group_key_action_events.discard(t)
+                    )
                 case _:
                     logger.error("unknown action type for event send")
         except Exception as e:
@@ -317,7 +337,7 @@ def worker_action_listener_process(*args: Any, **kwargs: Any) -> None:
         process = WorkerActionListenerProcess(*args, **kwargs)
         await process.start()
         # Keep the process running
-        while not process.killing:
+        while not process.killing:  # noqa: ASYNC110
            await asyncio.sleep(0.1)
 
     asyncio.run(run())
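The recurring change in this file is that every asyncio.create_task result is now stored in a set and discarded on completion. The event loop holds only weak references to tasks, so a fire-and-forget task can be garbage-collected before it finishes; keeping a strong reference until the done-callback fires is the pattern the asyncio documentation recommends. A runnable distillation:

```python
import asyncio

background_tasks: set[asyncio.Task[None]] = set()

async def send(msg: str) -> None:
    await asyncio.sleep(0.1)
    print(f"sent {msg}")

async def main() -> None:
    for i in range(3):
        t = asyncio.create_task(send(f"event-{i}"))
        background_tasks.add(t)  # strong reference keeps the task alive
        t.add_done_callback(background_tasks.discard)  # drop it once done
    await asyncio.gather(*background_tasks)

asyncio.run(main())
```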
hatchet_sdk/worker/runner/run_loop_manager.py CHANGED
@@ -1,19 +1,17 @@
 import asyncio
 import logging
 from multiprocessing import Queue
-from typing import Any, Literal, TypeVar
+from typing import Any, TypeVar
 
 from hatchet_sdk.client import Client
 from hatchet_sdk.config import ClientConfig
 from hatchet_sdk.logger import logger
 from hatchet_sdk.runnables.action import Action
 from hatchet_sdk.runnables.task import Task
+from hatchet_sdk.utils.typing import STOP_LOOP, STOP_LOOP_TYPE
 from hatchet_sdk.worker.action_listener_process import ActionEvent
 from hatchet_sdk.worker.runner.runner import Runner
-from hatchet_sdk.worker.runner.utils.capture_logs import capture_logs
-
-STOP_LOOP_TYPE = Literal["STOP_LOOP"]
-STOP_LOOP: STOP_LOOP_TYPE = "STOP_LOOP"
+from hatchet_sdk.worker.runner.utils.capture_logs import AsyncLogSender, capture_logs
 
 T = TypeVar("T")
 
@@ -28,10 +26,10 @@ class WorkerActionRunLoopManager:
         action_queue: "Queue[Action | STOP_LOOP_TYPE]",
         event_queue: "Queue[ActionEvent]",
         loop: asyncio.AbstractEventLoop,
-        handle_kill: bool = True,
-        debug: bool = False,
-        labels: dict[str, str | int] = {},
-        lifespan_context: Any | None = None,
+        handle_kill: bool,
+        debug: bool,
+        labels: dict[str, str | int] | None,
+        lifespan_context: Any | None,
     ) -> None:
         self.name = name
         self.action_registry = action_registry
@@ -52,15 +50,19 @@
         self.runner: Runner | None = None
 
         self.client = Client(config=self.config, debug=self.debug)
+        self.start_loop_manager_task: asyncio.Task[None] | None = None
+        self.log_sender = AsyncLogSender(self.client.event)
+        self.log_task = self.loop.create_task(self.log_sender.consume())
+
         self.start()
 
     def start(self) -> None:
-        k = self.loop.create_task(self.aio_start())  # noqa: F841
+        self.start_loop_manager_task = self.loop.create_task(self.aio_start())
 
     async def aio_start(self, retry_count: int = 1) -> None:
         await capture_logs(
             self.client.log_interceptor,
-            self.client.event,
+            self.log_sender,
             self._async_start,
         )()
 
@@ -75,6 +77,7 @@
         self.killing = True
 
         self.action_queue.put(STOP_LOOP)
+        self.log_sender.publish(STOP_LOOP)
 
     async def wait_for_tasks(self) -> None:
         if self.runner:
@@ -89,6 +92,7 @@
             self.action_registry,
             self.labels,
             self.lifespan_context,
+            self.log_sender,
         )
 
         logger.debug(f"'{self.name}' waiting for {list(self.action_registry.keys())}")
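As in the listener process, the `= {}` and related defaults are gone from this constructor: a mutable default is evaluated once at function definition time and shared by every call that omits the argument, so making the parameters required (or `None`, as with labels here) sidesteps the pitfall. The classic failure mode, shown with hypothetical helpers:

```python
def register_bad(worker: str, labels: dict[str, str] = {}) -> dict[str, str]:
    labels[worker] = "registered"  # mutates the single shared default dict
    return labels

print(register_bad("a"))  # {'a': 'registered'}
print(register_bad("b"))  # {'a': 'registered', 'b': 'registered'}  <- leaked state

def register_good(worker: str, labels: dict[str, str] | None = None) -> dict[str, str]:
    labels = labels if labels is not None else {}  # fresh dict per call
    labels[worker] = "registered"
    return labels
```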
hatchet_sdk/worker/runner/runner.py CHANGED
@@ -1,14 +1,14 @@
 import asyncio
-import contextvars
 import ctypes
 import functools
 import json
-import traceback
+from collections.abc import Callable
 from concurrent.futures import ThreadPoolExecutor
+from contextlib import suppress
 from enum import Enum
 from multiprocessing import Queue
 from threading import Thread, current_thread
-from typing import Any, Callable, Dict, Literal, cast, overload
+from typing import Any, Literal, cast, overload
 
 from pydantic import BaseModel
 
@@ -30,7 +30,7 @@ from hatchet_sdk.contracts.dispatcher_pb2 import (
     STEP_EVENT_TYPE_FAILED,
     STEP_EVENT_TYPE_STARTED,
 )
-from hatchet_sdk.exceptions import NonRetryableException
+from hatchet_sdk.exceptions import NonRetryableException, TaskRunError
 from hatchet_sdk.features.runs import RunsClient
 from hatchet_sdk.logger import logger
 from hatchet_sdk.runnables.action import Action, ActionKey, ActionType
@@ -40,12 +40,17 @@ from hatchet_sdk.runnables.contextvars import (
     ctx_worker_id,
     ctx_workflow_run_id,
     spawn_index_lock,
+    task_count,
     workflow_spawn_indices,
 )
 from hatchet_sdk.runnables.task import Task
 from hatchet_sdk.runnables.types import R, TWorkflowInput
 from hatchet_sdk.worker.action_listener_process import ActionEvent
-from hatchet_sdk.worker.runner.utils.capture_logs import copy_context_vars
+from hatchet_sdk.worker.runner.utils.capture_logs import (
+    AsyncLogSender,
+    ContextVarToCopy,
+    copy_context_vars,
+)
 
 
 class WorkerStatus(Enum):
@@ -61,10 +66,11 @@
         event_queue: "Queue[ActionEvent]",
         config: ClientConfig,
         slots: int,
-        handle_kill: bool = True,
-        action_registry: dict[str, Task[TWorkflowInput, R]] = {},
-        labels: dict[str, str | int] = {},
-        lifespan_context: Any | None = None,
+        handle_kill: bool,
+        action_registry: dict[str, Task[TWorkflowInput, R]],
+        labels: dict[str, str | int] | None,
+        lifespan_context: Any | None,
+        log_sender: AsyncLogSender,
     ):
         # We store the config so we can dynamically create clients for the dispatcher client.
         self.config = config
@@ -72,13 +78,14 @@
         self.slots = slots
         self.tasks: dict[ActionKey, asyncio.Task[Any]] = {}  # Store run ids and futures
         self.contexts: dict[ActionKey, Context] = {}  # Store run ids and contexts
-        self.action_registry = action_registry
+        self.action_registry = action_registry or {}
 
         self.event_queue = event_queue
 
         # The thread pool is used for synchronous functions which need to run concurrently
         self.thread_pool = ThreadPoolExecutor(max_workers=slots)
-        self.threads: Dict[ActionKey, Thread] = {}  # Store run ids and threads
+        self.threads: dict[ActionKey, Thread] = {}  # Store run ids and threads
+        self.running_tasks = set[asyncio.Task[Exception | None]]()
 
         self.killing = False
         self.handle_kill = handle_kill
@@ -101,10 +108,11 @@
         self.durable_event_listener = DurableEventListener(self.config)
 
         self.worker_context = WorkerContext(
-            labels=labels, client=Client(config=config).dispatcher
+            labels=labels or {}, client=Client(config=config).dispatcher
         )
 
         self.lifespan_context = lifespan_context
+        self.log_sender = log_sender
 
         if self.config.enable_thread_pool_monitoring:
             self.start_background_monitoring()
@@ -116,67 +124,68 @@
         if self.worker_context.id() is None:
             self.worker_context._worker_id = action.worker_id
 
+        t: asyncio.Task[Exception | None] | None = None
         match action.action_type:
             case ActionType.START_STEP_RUN:
                 log = f"run: start step: {action.action_id}/{action.step_run_id}"
                 logger.info(log)
-                asyncio.create_task(self.handle_start_step_run(action))
+                t = asyncio.create_task(self.handle_start_step_run(action))
             case ActionType.CANCEL_STEP_RUN:
                 log = f"cancel: step run: {action.action_id}/{action.step_run_id}/{action.retry_count}"
                 logger.info(log)
-                asyncio.create_task(self.handle_cancel_action(action))
+                t = asyncio.create_task(self.handle_cancel_action(action))
             case ActionType.START_GET_GROUP_KEY:
                 log = f"run: get group key: {action.action_id}/{action.get_group_key_run_id}"
                 logger.info(log)
-                asyncio.create_task(self.handle_start_group_key_run(action))
+                t = asyncio.create_task(self.handle_start_group_key_run(action))
             case _:
                 log = f"unknown action type: {action.action_type}"
                 logger.error(log)
 
+        if t is not None:
+            self.running_tasks.add(t)
+            t.add_done_callback(lambda task: self.running_tasks.discard(task))
+
     def step_run_callback(self, action: Action) -> Callable[[asyncio.Task[Any]], None]:
         def inner_callback(task: asyncio.Task[Any]) -> None:
             self.cleanup_run_id(action.key)
 
-            errored = False
-            cancelled = task.cancelled()
-            output = None
+            if task.cancelled():
+                return
 
-            # Get the output from the future
             try:
-                if not cancelled:
-                    output = task.result()
+                output = task.result()
             except Exception as e:
-                errored = True
-
                 should_not_retry = isinstance(e, NonRetryableException)
 
+                exc = TaskRunError.from_exception(e)
+
                 # This except is coming from the application itself, so we want to send that to the Hatchet instance
                 self.event_queue.put(
                     ActionEvent(
                         action=action,
                         type=STEP_EVENT_TYPE_FAILED,
-                        payload=str(pretty_format_exception(f"{e}", e)),
+                        payload=exc.serialize(),
                        should_not_retry=should_not_retry,
                     )
                 )
 
                 logger.error(
-                    f"failed step run: {action.action_id}/{action.step_run_id}"
+                    f"failed step run: {action.action_id}/{action.step_run_id}\n{exc.serialize()}"
                 )
 
-            if not errored and not cancelled:
-                self.event_queue.put(
-                    ActionEvent(
-                        action=action,
-                        type=STEP_EVENT_TYPE_COMPLETED,
-                        payload=self.serialize_output(output),
-                        should_not_retry=False,
-                    )
-                )
+                return
 
-                logger.info(
-                    f"finished step run: {action.action_id}/{action.step_run_id}"
+            self.event_queue.put(
+                ActionEvent(
+                    action=action,
+                    type=STEP_EVENT_TYPE_COMPLETED,
+                    payload=self.serialize_output(output),
+                    should_not_retry=False,
                 )
+            )
+
+            logger.info(f"finished step run: {action.action_id}/{action.step_run_id}")
 
         return inner_callback
 
@@ -186,51 +195,46 @@
         def inner_callback(task: asyncio.Task[Any]) -> None:
             self.cleanup_run_id(action.key)
 
-            errored = False
-            cancelled = task.cancelled()
-            output = None
+            if task.cancelled():
+                return
 
-            # Get the output from the future
             try:
-                if not cancelled:
-                    output = task.result()
+                output = task.result()
             except Exception as e:
-                errored = True
+                exc = TaskRunError.from_exception(e)
+
                 self.event_queue.put(
                     ActionEvent(
                         action=action,
                         type=GROUP_KEY_EVENT_TYPE_FAILED,
-                        payload=str(pretty_format_exception(f"{e}", e)),
+                        payload=exc.serialize(),
                        should_not_retry=False,
                     )
                 )
 
                 logger.error(
-                    f"failed step run: {action.action_id}/{action.step_run_id}"
+                    f"failed step run: {action.action_id}/{action.step_run_id}\n{exc.serialize()}"
                 )
 
-            if not errored and not cancelled:
-                self.event_queue.put(
-                    ActionEvent(
-                        action=action,
-                        type=GROUP_KEY_EVENT_TYPE_COMPLETED,
-                        payload=self.serialize_output(output),
-                        should_not_retry=False,
-                    )
-                )
+                return
 
-                logger.info(
-                    f"finished step run: {action.action_id}/{action.step_run_id}"
+            self.event_queue.put(
+                ActionEvent(
+                    action=action,
+                    type=GROUP_KEY_EVENT_TYPE_COMPLETED,
+                    payload=self.serialize_output(output),
+                    should_not_retry=False,
                 )
+            )
+
+            logger.info(f"finished step run: {action.action_id}/{action.step_run_id}")
 
         return inner_callback
 
     def thread_action_func(
         self, ctx: Context, task: Task[TWorkflowInput, R], action: Action
     ) -> R:
-        if action.step_run_id:
-            self.threads[action.key] = current_thread()
-        elif action.get_group_key_run_id:
+        if action.step_run_id or action.get_group_key_run_id:
             self.threads[action.key] = current_thread()
 
         return task.call(ctx)
@@ -250,28 +254,36 @@
         try:
             if task.is_async_function:
                 return await task.aio_call(ctx)
-            else:
-                pfunc = functools.partial(
-                    # we must copy the context vars to the new thread, as only asyncio natively supports
-                    # contextvars
-                    copy_context_vars,
-                    contextvars.copy_context().items(),
-                    self.thread_action_func,
-                    ctx,
-                    task,
-                    action,
-                )
-
-                loop = asyncio.get_event_loop()
-                return await loop.run_in_executor(self.thread_pool, pfunc)
-        except Exception as e:
-            logger.error(
-                pretty_format_exception(
-                    f"exception raised in action ({action.action_id}, retry={action.retry_count}):\n{e}",
-                    e,
-                )
+            pfunc = functools.partial(
+                # we must copy the context vars to the new thread, as only asyncio natively supports
+                # contextvars
+                copy_context_vars,
+                [
+                    ContextVarToCopy(
+                        name="ctx_step_run_id",
+                        value=action.step_run_id,
+                    ),
+                    ContextVarToCopy(
+                        name="ctx_workflow_run_id",
+                        value=action.workflow_run_id,
+                    ),
+                    ContextVarToCopy(
+                        name="ctx_worker_id",
+                        value=action.worker_id,
+                    ),
+                    ContextVarToCopy(
+                        name="ctx_action_key",
+                        value=action.key,
+                    ),
+                ],
+                self.thread_action_func,
+                ctx,
+                task,
+                action,
             )
-            raise e
+
+            loop = asyncio.get_event_loop()
+            return await loop.run_in_executor(self.thread_pool, pfunc)
         finally:
             self.cleanup_run_id(action.key)
@@ -295,7 +307,7 @@
         while True:
             await self.log_thread_pool_status()
 
-            for key in self.threads.keys():
+            for key in self.threads:
                 if key not in self.tasks:
                     logger.debug(f"Potential zombie thread found for key {key}")
 
@@ -350,6 +362,7 @@
             worker=self.worker_context,
             runs_client=self.runs_client,
             lifespan_context=self.lifespan_context,
+            log_sender=self.log_sender,
         )
 
     ## IMPORTANT: Keep this method's signature in sync with the wrapper in the OTel instrumentor
@@ -361,7 +374,8 @@
 
         if action_func:
             context = self.create_context(
-                action, True if action_func.is_durable else False
+                action,
+                True if action_func.is_durable else False,  # noqa: SIM210
             )
 
             self.contexts[action.key] = context
@@ -382,11 +396,12 @@
             task.add_done_callback(self.step_run_callback(action))
             self.tasks[action.key] = task
 
-            try:
+            task_count.increment()
+
+            ## FIXME: Handle cancelled exceptions and other special exceptions
+            ## that we don't want to suppress here
+            with suppress(Exception):
                 await task
-            except Exception:
-                # do nothing, this should be caught in the callback
-                pass
 
             ## Once the step run completes, we need to remove the workflow spawn index
             ## so we don't leak memory
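contextlib.suppress(Exception) is the idiomatic equivalent of the try/except/pass it replaces here (results and errors are handled by the done-callback attached above, and the remaining caveat is carried in the diff's own FIXME). For reference:

```python
from contextlib import suppress

# Equivalent to: try: int("not a number")  except ValueError: pass
with suppress(ValueError):
    int("not a number")
print("execution continues")
```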
@@ -444,7 +459,7 @@
         res = ctypes.pythonapi.PyThreadState_SetAsyncExc(ctypes.c_long(ident), exc)
         if res == 0:
             raise ValueError("Invalid thread ID")
-        elif res != 1:
+        if res != 1:
             logger.error("PyThreadState_SetAsyncExc failed")
 
         # Call with exception set to 0 is needed to cleanup properly.
@@ -505,8 +520,3 @@
             logger.info(f"waiting for {running} tasks to finish...")
             await asyncio.sleep(1)
             running = len(self.tasks.keys())
-
-
-def pretty_format_exception(message: str, e: Exception) -> str:
-    trace = "".join(traceback.format_exception(type(e), e, e.__traceback__))
-    return f"{message}\n{trace}"
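pretty_format_exception is deleted because failures are now wrapped in TaskRunError (part of the +99 lines added to hatchet_sdk/exceptions.py in this release) and shipped to the server as a serialized payload. The real class is not visible in this diff; a hypothetical reconstruction of the general shape such a wrapper takes, for orientation only:

```python
import traceback

class TaskRunError(Exception):
    # Hypothetical sketch; the actual fields and wire format live in
    # hatchet_sdk/exceptions.py and are not shown in this diff.
    def __init__(self, exc_type: str, message: str, stack_trace: str) -> None:
        super().__init__(message)
        self.exc_type = exc_type
        self.message = message
        self.stack_trace = stack_trace

    @classmethod
    def from_exception(cls, e: Exception) -> "TaskRunError":
        return cls(
            exc_type=type(e).__name__,
            message=str(e),
            stack_trace="".join(traceback.format_exception(e)),
        )

    def serialize(self) -> str:
        return f"{self.exc_type}: {self.message}\n{self.stack_trace}"
```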