modal 1.0.3.dev10__py3-none-any.whl → 1.2.3.dev7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of modal might be problematic.

Files changed (160)
  1. modal/__init__.py +0 -2
  2. modal/__main__.py +3 -4
  3. modal/_billing.py +80 -0
  4. modal/_clustered_functions.py +7 -3
  5. modal/_clustered_functions.pyi +15 -3
  6. modal/_container_entrypoint.py +51 -69
  7. modal/_functions.py +508 -240
  8. modal/_grpc_client.py +171 -0
  9. modal/_load_context.py +105 -0
  10. modal/_object.py +81 -21
  11. modal/_output.py +58 -45
  12. modal/_partial_function.py +48 -73
  13. modal/_pty.py +7 -3
  14. modal/_resolver.py +26 -46
  15. modal/_runtime/asgi.py +4 -3
  16. modal/_runtime/container_io_manager.py +358 -220
  17. modal/_runtime/container_io_manager.pyi +296 -101
  18. modal/_runtime/execution_context.py +18 -2
  19. modal/_runtime/execution_context.pyi +64 -7
  20. modal/_runtime/gpu_memory_snapshot.py +262 -57
  21. modal/_runtime/user_code_imports.py +28 -58
  22. modal/_serialization.py +90 -6
  23. modal/_traceback.py +42 -1
  24. modal/_tunnel.pyi +380 -12
  25. modal/_utils/async_utils.py +84 -29
  26. modal/_utils/auth_token_manager.py +111 -0
  27. modal/_utils/blob_utils.py +181 -58
  28. modal/_utils/deprecation.py +19 -0
  29. modal/_utils/function_utils.py +91 -47
  30. modal/_utils/grpc_utils.py +89 -66
  31. modal/_utils/mount_utils.py +26 -1
  32. modal/_utils/name_utils.py +17 -3
  33. modal/_utils/task_command_router_client.py +536 -0
  34. modal/_utils/time_utils.py +34 -6
  35. modal/app.py +256 -88
  36. modal/app.pyi +909 -92
  37. modal/billing.py +5 -0
  38. modal/builder/2025.06.txt +18 -0
  39. modal/builder/PREVIEW.txt +18 -0
  40. modal/builder/base-images.json +58 -0
  41. modal/cli/_download.py +19 -3
  42. modal/cli/_traceback.py +3 -2
  43. modal/cli/app.py +4 -4
  44. modal/cli/cluster.py +15 -7
  45. modal/cli/config.py +5 -3
  46. modal/cli/container.py +7 -6
  47. modal/cli/dict.py +22 -16
  48. modal/cli/entry_point.py +12 -5
  49. modal/cli/environment.py +5 -4
  50. modal/cli/import_refs.py +3 -3
  51. modal/cli/launch.py +102 -5
  52. modal/cli/network_file_system.py +11 -12
  53. modal/cli/profile.py +3 -2
  54. modal/cli/programs/launch_instance_ssh.py +94 -0
  55. modal/cli/programs/run_jupyter.py +1 -1
  56. modal/cli/programs/run_marimo.py +95 -0
  57. modal/cli/programs/vscode.py +1 -1
  58. modal/cli/queues.py +57 -26
  59. modal/cli/run.py +91 -23
  60. modal/cli/secret.py +48 -22
  61. modal/cli/token.py +7 -8
  62. modal/cli/utils.py +4 -7
  63. modal/cli/volume.py +31 -25
  64. modal/client.py +15 -85
  65. modal/client.pyi +183 -62
  66. modal/cloud_bucket_mount.py +5 -3
  67. modal/cloud_bucket_mount.pyi +197 -5
  68. modal/cls.py +200 -126
  69. modal/cls.pyi +446 -68
  70. modal/config.py +29 -11
  71. modal/container_process.py +319 -19
  72. modal/container_process.pyi +190 -20
  73. modal/dict.py +290 -71
  74. modal/dict.pyi +835 -83
  75. modal/environments.py +15 -27
  76. modal/environments.pyi +46 -24
  77. modal/exception.py +14 -2
  78. modal/experimental/__init__.py +194 -40
  79. modal/experimental/flash.py +618 -0
  80. modal/experimental/flash.pyi +380 -0
  81. modal/experimental/ipython.py +11 -7
  82. modal/file_io.py +29 -36
  83. modal/file_io.pyi +251 -53
  84. modal/file_pattern_matcher.py +56 -16
  85. modal/functions.pyi +673 -92
  86. modal/gpu.py +1 -1
  87. modal/image.py +528 -176
  88. modal/image.pyi +1572 -145
  89. modal/io_streams.py +458 -128
  90. modal/io_streams.pyi +433 -52
  91. modal/mount.py +216 -151
  92. modal/mount.pyi +225 -78
  93. modal/network_file_system.py +45 -62
  94. modal/network_file_system.pyi +277 -56
  95. modal/object.pyi +93 -17
  96. modal/parallel_map.py +942 -129
  97. modal/parallel_map.pyi +294 -15
  98. modal/partial_function.py +0 -2
  99. modal/partial_function.pyi +234 -19
  100. modal/proxy.py +17 -8
  101. modal/proxy.pyi +36 -3
  102. modal/queue.py +270 -65
  103. modal/queue.pyi +817 -57
  104. modal/runner.py +115 -101
  105. modal/runner.pyi +205 -49
  106. modal/sandbox.py +512 -136
  107. modal/sandbox.pyi +845 -111
  108. modal/schedule.py +1 -1
  109. modal/secret.py +300 -70
  110. modal/secret.pyi +589 -34
  111. modal/serving.py +7 -11
  112. modal/serving.pyi +7 -8
  113. modal/snapshot.py +11 -8
  114. modal/snapshot.pyi +25 -4
  115. modal/token_flow.py +4 -4
  116. modal/token_flow.pyi +28 -8
  117. modal/volume.py +416 -158
  118. modal/volume.pyi +1117 -121
  119. {modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/METADATA +10 -9
  120. modal-1.2.3.dev7.dist-info/RECORD +195 -0
  121. modal_docs/mdmd/mdmd.py +17 -4
  122. modal_proto/api.proto +534 -79
  123. modal_proto/api_grpc.py +337 -1
  124. modal_proto/api_pb2.py +1522 -968
  125. modal_proto/api_pb2.pyi +1619 -134
  126. modal_proto/api_pb2_grpc.py +699 -4
  127. modal_proto/api_pb2_grpc.pyi +226 -14
  128. modal_proto/modal_api_grpc.py +175 -154
  129. modal_proto/sandbox_router.proto +145 -0
  130. modal_proto/sandbox_router_grpc.py +105 -0
  131. modal_proto/sandbox_router_pb2.py +149 -0
  132. modal_proto/sandbox_router_pb2.pyi +333 -0
  133. modal_proto/sandbox_router_pb2_grpc.py +203 -0
  134. modal_proto/sandbox_router_pb2_grpc.pyi +75 -0
  135. modal_proto/task_command_router.proto +144 -0
  136. modal_proto/task_command_router_grpc.py +105 -0
  137. modal_proto/task_command_router_pb2.py +149 -0
  138. modal_proto/task_command_router_pb2.pyi +333 -0
  139. modal_proto/task_command_router_pb2_grpc.py +203 -0
  140. modal_proto/task_command_router_pb2_grpc.pyi +75 -0
  141. modal_version/__init__.py +1 -1
  142. modal/requirements/PREVIEW.txt +0 -16
  143. modal/requirements/base-images.json +0 -26
  144. modal-1.0.3.dev10.dist-info/RECORD +0 -179
  145. modal_proto/modal_options_grpc.py +0 -3
  146. modal_proto/options.proto +0 -19
  147. modal_proto/options_grpc.py +0 -3
  148. modal_proto/options_pb2.py +0 -35
  149. modal_proto/options_pb2.pyi +0 -20
  150. modal_proto/options_pb2_grpc.py +0 -4
  151. modal_proto/options_pb2_grpc.pyi +0 -7
  152. /modal/{requirements → builder}/2023.12.312.txt +0 -0
  153. /modal/{requirements → builder}/2023.12.txt +0 -0
  154. /modal/{requirements → builder}/2024.04.txt +0 -0
  155. /modal/{requirements → builder}/2024.10.txt +0 -0
  156. /modal/{requirements → builder}/README.md +0 -0
  157. {modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/WHEEL +0 -0
  158. {modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/entry_points.txt +0 -0
  159. {modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/licenses/LICENSE +0 -0
  160. {modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/top_level.txt +0 -0
@@ -9,13 +9,25 @@ import synchronicity.combined_types
  import typing
  import typing_extensions

- class UserException(Exception): ...
- class Sentinel: ...
+ class UserException(Exception):
+ """Used to shut down the task gracefully."""
+
+ ...
+
+ class Sentinel:
+ """Used to get type-stubs to work with this object."""
+
+ ...

  class IOContext:
+ """Context object for managing input, function calls, and function executions
+ in a batched or single input context.
+ """
+
  input_ids: list[str]
  retry_counts: list[int]
  function_call_ids: list[str]
+ attempt_tokens: list[str]
  function_inputs: list[modal_proto.api_pb2.FunctionInput]
  finalized_function: modal._runtime.user_code_imports.FinalizedFunction
  _cancel_issued: bool
@@ -26,32 +38,56 @@ class IOContext:
  input_ids: list[str],
  retry_counts: list[int],
  function_call_ids: list[str],
+ attempt_tokens: list[str],
  finalized_function: modal._runtime.user_code_imports.FinalizedFunction,
  function_inputs: list[modal_proto.api_pb2.FunctionInput],
  is_batched: bool,
  client: modal.client._Client,
- ): ...
+ ):
+ """Initialize self. See help(type(self)) for accurate signature."""
+ ...
+
  @classmethod
  async def create(
  cls,
  client: modal.client._Client,
  finalized_functions: dict[str, modal._runtime.user_code_imports.FinalizedFunction],
- inputs: list[tuple[str, int, str, modal_proto.api_pb2.FunctionInput]],
+ inputs: list[tuple[str, int, str, str, modal_proto.api_pb2.FunctionInput]],
  is_batched: bool,
  ) -> IOContext: ...
  def set_cancel_callback(self, cb: collections.abc.Callable[[], None]): ...
  def cancel(self): ...
  def _args_and_kwargs(self) -> tuple[tuple[typing.Any, ...], dict[str, list[typing.Any]]]: ...
- def call_finalized_function(self) -> typing.Any: ...
- def validate_output_data(self, data: typing.Any) -> list[typing.Any]: ...
+ def _generator_output_format(self) -> int: ...
+ def _prepare_batch_output(self, data: typing.Any) -> list[typing.Any]: ...
+ def call_function_sync(self) -> list[typing.Any]: ...
+ async def call_function_async(self) -> list[typing.Any]: ...
+ def call_generator_sync(self) -> typing.Generator[typing.Any, None, None]: ...
+ def call_generator_async(self) -> collections.abc.AsyncGenerator[typing.Any, None]: ...
+ async def output_items_cancellation(self, started_at: float): ...
+ def _determine_output_format(self, input_format: int) -> int: ...
+ async def output_items_exception(
+ self, started_at: float, task_id: str, exc: BaseException
+ ) -> list[modal_proto.api_pb2.FunctionPutOutputsItem]: ...
+ def output_items_generator_done(
+ self, started_at: float, items_total: int
+ ) -> list[modal_proto.api_pb2.FunctionPutOutputsItem]: ...
+ async def output_items(
+ self, started_at: float, data: list[typing.Any]
+ ) -> list[modal_proto.api_pb2.FunctionPutOutputsItem]: ...

  class InputSlots:
+ """A semaphore that allows dynamically adjusting the concurrency."""
+
  active: int
  value: int
  waiter: typing.Optional[asyncio.Future]
  closed: bool

- def __init__(self, value: int) -> None: ...
+ def __init__(self, value: int) -> None:
+ """Initialize self. See help(type(self)) for accurate signature."""
+ ...
+
  async def acquire(self) -> None: ...
  def _wake_waiter(self) -> None: ...
  def release(self) -> None: ...
@@ -59,11 +95,18 @@ class InputSlots:
  async def close(self) -> None: ...

  class _ContainerIOManager:
+ """Synchronizes all RPC calls and network operations for a running container.
+
+ TODO: maybe we shouldn't synchronize the whole class.
+ Then we could potentially move a bunch of the global functions onto it.
+ """
+
  task_id: str
  function_id: str
  app_id: str
  function_def: modal_proto.api_pb2.Function
  checkpoint_id: typing.Optional[str]
+ input_plane_server_url: typing.Optional[str]
  calls_completed: int
  total_user_time: float
  current_input_id: typing.Optional[str]
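
The new `InputSlots` stub describes a semaphore whose capacity can be adjusted while it is in use, which is what the dynamic input-concurrency methods further down rely on. As a rough sketch of that idea only (the class below and its `set_value` method are illustrative assumptions, not Modal's implementation), a resizable async semaphore can look like this:

import asyncio
from typing import Optional

class AdjustableSlots:
    # Illustrative only: a semaphore-like object whose capacity ("value") can be
    # changed while tasks already hold or are waiting for slots.
    def __init__(self, value: int) -> None:
        self.active = 0  # slots currently held
        self.value = value  # current capacity
        self.waiter: Optional[asyncio.Future] = None
        self.closed = False

    async def acquire(self) -> None:
        # Wait until a slot frees up, then claim it.
        while self.active >= self.value and not self.closed:
            if self.waiter is None or self.waiter.done():
                self.waiter = asyncio.get_running_loop().create_future()
            await self.waiter
        self.active += 1

    def release(self) -> None:
        self.active -= 1
        self._wake_waiter()

    def set_value(self, value: int) -> None:
        # Growing wakes a waiter immediately; shrinking just lets active slots
        # drain, so `active` may temporarily exceed `value`.
        self.value = value
        self._wake_waiter()

    def _wake_waiter(self) -> None:
        if self.waiter is not None and not self.waiter.done():
            self.waiter.set_result(None)

    async def close(self) -> None:
        self.closed = True
        self._wake_waiter()

Under that shape, `set_input_concurrency()` on the manager would amount to calling something like the hypothetical `set_value()` above, which is consistent with the docstring's note that active slots can exceed the allotted count after a reduction.
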
@@ -81,7 +124,6 @@ class _ContainerIOManager:
  _is_interactivity_enabled: bool
  _fetching_inputs: bool
  _client: modal.client._Client
- _GENERATOR_STOP_SENTINEL: typing.ClassVar[Sentinel]
  _singleton: typing.ClassVar[typing.Optional[_ContainerIOManager]]

  def _init(self, container_args: modal_proto.api_pb2.ContainerArguments, client: modal.client._Client): ...
@@ -90,9 +132,15 @@ class _ContainerIOManager:
  @staticmethod
  def __new__(
  cls, container_args: modal_proto.api_pb2.ContainerArguments, client: modal.client._Client
- ) -> _ContainerIOManager: ...
+ ) -> _ContainerIOManager:
+ """Create and return a new object. See help(type) for accurate signature."""
+ ...
+
  @classmethod
- def _reset_singleton(cls): ...
+ def _reset_singleton(cls):
+ """Only used for tests."""
+ ...
+
  async def hello(self): ...
  async def _run_heartbeat_loop(self): ...
  async def _heartbeat_handle_cancellations(self) -> bool: ...
@@ -100,46 +148,82 @@ class _ContainerIOManager:
  def stop_heartbeat(self): ...
  def dynamic_concurrency_manager(self) -> typing.AsyncContextManager[None]: ...
  async def _dynamic_concurrency_loop(self): ...
- def serialize_data_format(self, obj: typing.Any, data_format: int) -> bytes: ...
- async def format_blob_data(self, data: bytes) -> dict[str, typing.Any]: ...
- def get_data_in(self, function_call_id: str) -> collections.abc.AsyncIterator[typing.Any]: ...
+ def get_data_in(
+ self, function_call_id: str, attempt_token: typing.Optional[str]
+ ) -> collections.abc.AsyncIterator[typing.Any]:
+ """Read from the `data_in` stream of a function call."""
+ ...
+
  async def put_data_out(
- self, function_call_id: str, start_index: int, data_format: int, serialized_messages: list[typing.Any]
- ) -> None: ...
- async def generator_output_task(
- self, function_call_id: str, data_format: int, message_rx: asyncio.queues.Queue
- ) -> None: ...
- async def _queue_create(self, size: int) -> asyncio.queues.Queue: ...
- async def _queue_put(self, queue: asyncio.queues.Queue, value: typing.Any) -> None: ...
+ self,
+ function_call_id: str,
+ attempt_token: str,
+ start_index: int,
+ data_format: int,
+ serialized_messages: list[typing.Any],
+ ) -> None:
+ """Put data onto the `data_out` stream of a function call.
+
+ This is used for generator outputs, which includes web endpoint responses. Note that this
+ was introduced as a performance optimization in client version 0.57, so older clients will
+ still use the previous Postgres-backed system based on `FunctionPutOutputs()`.
+ """
+ ...
+
+ def generator_output_sender(
+ self, function_call_id: str, attempt_token: str, data_format: int, message_rx: asyncio.queues.Queue
+ ) -> typing.AsyncContextManager[None]:
+ """Runs background task that feeds generator outputs into a function call's `data_out` stream."""
+ ...
+
+ async def _queue_create(self, size: int) -> asyncio.queues.Queue:
+ """Create a queue, on the synchronicity event loop (needed on Python 3.8 and 3.9)."""
+ ...
+
+ async def _queue_put(self, queue: asyncio.queues.Queue, value: typing.Any) -> None:
+ """Put a value onto a queue, using the synchronicity event loop."""
+ ...
+
  def get_average_call_time(self) -> float: ...
  def get_max_inputs_to_fetch(self): ...
  def _generate_inputs(
  self, batch_max_size: int, batch_wait_ms: int
- ) -> collections.abc.AsyncIterator[list[tuple[str, int, str, modal_proto.api_pb2.FunctionInput]]]: ...
+ ) -> collections.abc.AsyncIterator[list[tuple[str, int, str, str, modal_proto.api_pb2.FunctionInput]]]: ...
  def run_inputs_outputs(
  self,
  finalized_functions: dict[str, modal._runtime.user_code_imports.FinalizedFunction],
  batch_max_size: int = 0,
  batch_wait_ms: int = 0,
  ) -> collections.abc.AsyncIterator[IOContext]: ...
- async def _push_outputs(
- self,
- io_context: IOContext,
- started_at: float,
- data_format: int,
- results: list[modal_proto.api_pb2.GenericResult],
- ) -> None: ...
- def serialize_exception(self, exc: BaseException) -> bytes: ...
- def serialize_traceback(self, exc: BaseException) -> tuple[typing.Optional[bytes], typing.Optional[bytes]]: ...
- def handle_user_exception(self) -> typing.AsyncContextManager[None]: ...
- def handle_input_exception(self, io_context: IOContext, started_at: float) -> typing.AsyncContextManager[None]: ...
+ async def _send_outputs(self, started_at: float, outputs: list[modal_proto.api_pb2.FunctionPutOutputsItem]) -> None:
+ """Send pre-built output items with retry and chunking."""
+ ...
+
+ def handle_user_exception(self) -> typing.AsyncContextManager[None]:
+ """Sets the task as failed in a way where it's not retried.
+
+ Used for handling exceptions from container lifecycle methods at the moment, which should
+ trigger a task failure state.
+ """
+ ...
+
+ def handle_input_exception(self, io_context: IOContext, started_at: float) -> typing.AsyncContextManager[None]:
+ """Handle an exception while processing a function input."""
+ ...
+
  def exit_context(self, started_at, input_ids: list[str]): ...
- async def push_outputs(
- self, io_context: IOContext, started_at: float, data: typing.Any, data_format: int
- ) -> None: ...
+ async def push_outputs(self, io_context: IOContext, started_at: float, output_data: list[typing.Any]) -> None: ...
  async def memory_restore(self) -> None: ...
- async def memory_snapshot(self) -> None: ...
- async def volume_commit(self, volume_ids: list[str]) -> None: ...
+ async def memory_snapshot(self) -> None:
+ """Message server indicating that function is ready to be checkpointed."""
+ ...
+
+ async def volume_commit(self, volume_ids: list[str]) -> None:
+ """Perform volume commit for given `volume_ids`.
+ Only used on container exit to persist uncommitted changes on behalf of user.
+ """
+ ...
+
  async def interact(self, from_breakpoint: bool = False): ...
  @property
  def target_concurrency(self) -> int: ...
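
The hunk above replaces `generator_output_task` with `generator_output_sender`, whose return type is a context manager rather than a bare coroutine; together with the queue helpers, this suggests a background task that drains a queue of generator outputs for the lifetime of a `with` block. A generic sketch of that pattern (the names `send_batch`, `_STOP`, and the overall wiring are illustrative assumptions, not Modal's code):

import asyncio
import contextlib

_STOP = object()  # sentinel placed on the queue to mark end-of-stream

async def send_batch(messages: list) -> None:
    # Stand-in for the RPC that would push serialized messages to `data_out`.
    await asyncio.sleep(0)

@contextlib.asynccontextmanager
async def generator_output_sender(message_rx: asyncio.Queue):
    # Drain the queue in the background while the caller's generator runs.
    async def drain() -> None:
        while True:
            msg = await message_rx.get()
            if msg is _STOP:
                break
            await send_batch([msg])

    task = asyncio.create_task(drain())
    try:
        yield
    finally:
        await message_rx.put(_STOP)  # signal completion
        await task  # propagate any send errors

async def main() -> None:
    queue: asyncio.Queue = asyncio.Queue()
    async with generator_output_sender(queue):
        for item in ("a", "b", "c"):
            await queue.put(item)

asyncio.run(main())
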
@@ -148,20 +232,41 @@ class _ContainerIOManager:
  @property
  def input_concurrency_enabled(self) -> int: ...
  @classmethod
- def get_input_concurrency(cls) -> int: ...
+ def get_input_concurrency(cls) -> int:
+ """Returns the number of usable input slots.
+
+ If concurrency is reduced, active slots can exceed allotted slots. Returns the larger value
+ in this case.
+ """
+ ...
+
  @classmethod
- def set_input_concurrency(cls, concurrency: int): ...
+ def set_input_concurrency(cls, concurrency: int):
+ """Edit the number of input slots.
+
+ This disables the background loop which automatically adjusts concurrency
+ within [target_concurrency, max_concurrency].
+ """
+ ...
+
  @classmethod
  def stop_fetching_inputs(cls): ...

  SUPERSELF = typing.TypeVar("SUPERSELF", covariant=True)

  class ContainerIOManager:
+ """Synchronizes all RPC calls and network operations for a running container.
+
+ TODO: maybe we shouldn't synchronize the whole class.
+ Then we could potentially move a bunch of the global functions onto it.
+ """
+
  task_id: str
  function_id: str
  app_id: str
  function_def: modal_proto.api_pb2.Function
  checkpoint_id: typing.Optional[str]
+ input_plane_server_url: typing.Optional[str]
  calls_completed: int
  total_user_time: float
  current_input_id: typing.Optional[str]
@@ -179,15 +284,19 @@ class ContainerIOManager:
  _is_interactivity_enabled: bool
  _fetching_inputs: bool
  _client: modal.client.Client
- _GENERATOR_STOP_SENTINEL: typing.ClassVar[Sentinel]
  _singleton: typing.ClassVar[typing.Optional[ContainerIOManager]]

- def __init__(self, /, *args, **kwargs): ...
+ def __init__(self, /, *args, **kwargs):
+ """Initialize self. See help(type(self)) for accurate signature."""
+ ...
+
  def _init(self, container_args: modal_proto.api_pb2.ContainerArguments, client: modal.client.Client): ...
  @property
  def heartbeat_condition(self) -> asyncio.locks.Condition: ...
  @classmethod
- def _reset_singleton(cls): ...
+ def _reset_singleton(cls):
+ """Only used for tests."""
+ ...

  class __hello_spec(typing_extensions.Protocol[SUPERSELF]):
  def __call__(self, /): ...
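
From here on, each wrapped method in the stub is described by a `*_spec` Protocol exposing both a blocking `__call__` and an `aio` variant, which is how synchronicity-wrapped Modal objects are typically called either directly or via `.aio(...)`. A minimal sketch of that dual interface (purely illustrative; the real library dispatches onto a dedicated background event loop rather than calling `asyncio.run`):

import asyncio
from typing import Any, Awaitable, Callable

class BlockingAndAsync:
    # Wraps an async function so callers can invoke it synchronously
    # or await it via `.aio(...)`.
    def __init__(self, fn: Callable[..., Awaitable[Any]]) -> None:
        self._fn = fn

    def __call__(self, *args: Any, **kwargs: Any) -> Any:
        return asyncio.run(self._fn(*args, **kwargs))  # blocking entry point

    def aio(self, *args: Any, **kwargs: Any) -> Awaitable[Any]:
        return self._fn(*args, **kwargs)  # async entry point

async def _fetch_greeting(name: str) -> str:
    await asyncio.sleep(0)  # stand-in for an RPC
    return f"hello, {name}"

fetch_greeting = BlockingAndAsync(_fetch_greeting)
print(fetch_greeting("modal"))       # blocking usage
# await fetch_greeting.aio("modal")  # async usage, from inside a running event loop
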
@@ -229,45 +338,92 @@ class ContainerIOManager:

  _dynamic_concurrency_loop: ___dynamic_concurrency_loop_spec[typing_extensions.Self]

- def serialize_data_format(self, obj: typing.Any, data_format: int) -> bytes: ...
-
- class __format_blob_data_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, data: bytes) -> dict[str, typing.Any]: ...
- async def aio(self, /, data: bytes) -> dict[str, typing.Any]: ...
-
- format_blob_data: __format_blob_data_spec[typing_extensions.Self]
-
  class __get_data_in_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, function_call_id: str) -> typing.Iterator[typing.Any]: ...
- def aio(self, /, function_call_id: str) -> collections.abc.AsyncIterator[typing.Any]: ...
+ def __call__(
+ self, /, function_call_id: str, attempt_token: typing.Optional[str]
+ ) -> typing.Iterator[typing.Any]:
+ """Read from the `data_in` stream of a function call."""
+ ...
+
+ def aio(
+ self, /, function_call_id: str, attempt_token: typing.Optional[str]
+ ) -> collections.abc.AsyncIterator[typing.Any]:
+ """Read from the `data_in` stream of a function call."""
+ ...

  get_data_in: __get_data_in_spec[typing_extensions.Self]

  class __put_data_out_spec(typing_extensions.Protocol[SUPERSELF]):
  def __call__(
- self, /, function_call_id: str, start_index: int, data_format: int, serialized_messages: list[typing.Any]
- ) -> None: ...
+ self,
+ /,
+ function_call_id: str,
+ attempt_token: str,
+ start_index: int,
+ data_format: int,
+ serialized_messages: list[typing.Any],
+ ) -> None:
+ """Put data onto the `data_out` stream of a function call.
+
+ This is used for generator outputs, which includes web endpoint responses. Note that this
+ was introduced as a performance optimization in client version 0.57, so older clients will
+ still use the previous Postgres-backed system based on `FunctionPutOutputs()`.
+ """
+ ...
+
  async def aio(
- self, /, function_call_id: str, start_index: int, data_format: int, serialized_messages: list[typing.Any]
- ) -> None: ...
+ self,
+ /,
+ function_call_id: str,
+ attempt_token: str,
+ start_index: int,
+ data_format: int,
+ serialized_messages: list[typing.Any],
+ ) -> None:
+ """Put data onto the `data_out` stream of a function call.
+
+ This is used for generator outputs, which includes web endpoint responses. Note that this
+ was introduced as a performance optimization in client version 0.57, so older clients will
+ still use the previous Postgres-backed system based on `FunctionPutOutputs()`.
+ """
+ ...

  put_data_out: __put_data_out_spec[typing_extensions.Self]

- class __generator_output_task_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, function_call_id: str, data_format: int, message_rx: asyncio.queues.Queue) -> None: ...
- async def aio(self, /, function_call_id: str, data_format: int, message_rx: asyncio.queues.Queue) -> None: ...
+ class __generator_output_sender_spec(typing_extensions.Protocol[SUPERSELF]):
+ def __call__(
+ self, /, function_call_id: str, attempt_token: str, data_format: int, message_rx: asyncio.queues.Queue
+ ) -> synchronicity.combined_types.AsyncAndBlockingContextManager[None]:
+ """Runs background task that feeds generator outputs into a function call's `data_out` stream."""
+ ...

- generator_output_task: __generator_output_task_spec[typing_extensions.Self]
+ def aio(
+ self, /, function_call_id: str, attempt_token: str, data_format: int, message_rx: asyncio.queues.Queue
+ ) -> typing.AsyncContextManager[None]:
+ """Runs background task that feeds generator outputs into a function call's `data_out` stream."""
+ ...
+
+ generator_output_sender: __generator_output_sender_spec[typing_extensions.Self]

  class ___queue_create_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, size: int) -> asyncio.queues.Queue: ...
- async def aio(self, /, size: int) -> asyncio.queues.Queue: ...
+ def __call__(self, /, size: int) -> asyncio.queues.Queue:
+ """Create a queue, on the synchronicity event loop (needed on Python 3.8 and 3.9)."""
+ ...
+
+ async def aio(self, /, size: int) -> asyncio.queues.Queue:
+ """Create a queue, on the synchronicity event loop (needed on Python 3.8 and 3.9)."""
+ ...

  _queue_create: ___queue_create_spec[typing_extensions.Self]

  class ___queue_put_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, queue: asyncio.queues.Queue, value: typing.Any) -> None: ...
- async def aio(self, /, queue: asyncio.queues.Queue, value: typing.Any) -> None: ...
+ def __call__(self, /, queue: asyncio.queues.Queue, value: typing.Any) -> None:
+ """Put a value onto a queue, using the synchronicity event loop."""
+ ...
+
+ async def aio(self, /, queue: asyncio.queues.Queue, value: typing.Any) -> None:
+ """Put a value onto a queue, using the synchronicity event loop."""
+ ...

  _queue_put: ___queue_put_spec[typing_extensions.Self]

@@ -277,10 +433,10 @@ class ContainerIOManager:
  class ___generate_inputs_spec(typing_extensions.Protocol[SUPERSELF]):
  def __call__(
  self, /, batch_max_size: int, batch_wait_ms: int
- ) -> typing.Iterator[list[tuple[str, int, str, modal_proto.api_pb2.FunctionInput]]]: ...
+ ) -> typing.Iterator[list[tuple[str, int, str, str, modal_proto.api_pb2.FunctionInput]]]: ...
  def aio(
  self, /, batch_max_size: int, batch_wait_ms: int
- ) -> collections.abc.AsyncIterator[list[tuple[str, int, str, modal_proto.api_pb2.FunctionInput]]]: ...
+ ) -> collections.abc.AsyncIterator[list[tuple[str, int, str, str, modal_proto.api_pb2.FunctionInput]]]: ...

  _generate_inputs: ___generate_inputs_spec[typing_extensions.Self]

@@ -302,50 +458,54 @@ class ContainerIOManager:

  run_inputs_outputs: __run_inputs_outputs_spec[typing_extensions.Self]

- class ___push_outputs_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(
- self,
- /,
- io_context: IOContext,
- started_at: float,
- data_format: int,
- results: list[modal_proto.api_pb2.GenericResult],
- ) -> None: ...
- async def aio(
- self,
- /,
- io_context: IOContext,
- started_at: float,
- data_format: int,
- results: list[modal_proto.api_pb2.GenericResult],
- ) -> None: ...
+ class ___send_outputs_spec(typing_extensions.Protocol[SUPERSELF]):
+ def __call__(self, /, started_at: float, outputs: list[modal_proto.api_pb2.FunctionPutOutputsItem]) -> None:
+ """Send pre-built output items with retry and chunking."""
+ ...

- _push_outputs: ___push_outputs_spec[typing_extensions.Self]
+ async def aio(self, /, started_at: float, outputs: list[modal_proto.api_pb2.FunctionPutOutputsItem]) -> None:
+ """Send pre-built output items with retry and chunking."""
+ ...

- def serialize_exception(self, exc: BaseException) -> bytes: ...
- def serialize_traceback(self, exc: BaseException) -> tuple[typing.Optional[bytes], typing.Optional[bytes]]: ...
+ _send_outputs: ___send_outputs_spec[typing_extensions.Self]

  class __handle_user_exception_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /) -> synchronicity.combined_types.AsyncAndBlockingContextManager[None]: ...
- def aio(self, /) -> typing.AsyncContextManager[None]: ...
+ def __call__(self, /) -> synchronicity.combined_types.AsyncAndBlockingContextManager[None]:
+ """Sets the task as failed in a way where it's not retried.
+
+ Used for handling exceptions from container lifecycle methods at the moment, which should
+ trigger a task failure state.
+ """
+ ...
+
+ def aio(self, /) -> typing.AsyncContextManager[None]:
+ """Sets the task as failed in a way where it's not retried.
+
+ Used for handling exceptions from container lifecycle methods at the moment, which should
+ trigger a task failure state.
+ """
+ ...

  handle_user_exception: __handle_user_exception_spec[typing_extensions.Self]

  class __handle_input_exception_spec(typing_extensions.Protocol[SUPERSELF]):
  def __call__(
  self, /, io_context: IOContext, started_at: float
- ) -> synchronicity.combined_types.AsyncAndBlockingContextManager[None]: ...
- def aio(self, /, io_context: IOContext, started_at: float) -> typing.AsyncContextManager[None]: ...
+ ) -> synchronicity.combined_types.AsyncAndBlockingContextManager[None]:
+ """Handle an exception while processing a function input."""
+ ...
+
+ def aio(self, /, io_context: IOContext, started_at: float) -> typing.AsyncContextManager[None]:
+ """Handle an exception while processing a function input."""
+ ...

  handle_input_exception: __handle_input_exception_spec[typing_extensions.Self]

  def exit_context(self, started_at, input_ids: list[str]): ...

  class __push_outputs_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, io_context: IOContext, started_at: float, data: typing.Any, data_format: int) -> None: ...
- async def aio(
- self, /, io_context: IOContext, started_at: float, data: typing.Any, data_format: int
- ) -> None: ...
+ def __call__(self, /, io_context: IOContext, started_at: float, output_data: list[typing.Any]) -> None: ...
+ async def aio(self, /, io_context: IOContext, started_at: float, output_data: list[typing.Any]) -> None: ...

  push_outputs: __push_outputs_spec[typing_extensions.Self]

@@ -356,14 +516,28 @@ class ContainerIOManager:
  memory_restore: __memory_restore_spec[typing_extensions.Self]

  class __memory_snapshot_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /) -> None: ...
- async def aio(self, /) -> None: ...
+ def __call__(self, /) -> None:
+ """Message server indicating that function is ready to be checkpointed."""
+ ...
+
+ async def aio(self, /) -> None:
+ """Message server indicating that function is ready to be checkpointed."""
+ ...

  memory_snapshot: __memory_snapshot_spec[typing_extensions.Self]

  class __volume_commit_spec(typing_extensions.Protocol[SUPERSELF]):
- def __call__(self, /, volume_ids: list[str]) -> None: ...
- async def aio(self, /, volume_ids: list[str]) -> None: ...
+ def __call__(self, /, volume_ids: list[str]) -> None:
+ """Perform volume commit for given `volume_ids`.
+ Only used on container exit to persist uncommitted changes on behalf of user.
+ """
+ ...
+
+ async def aio(self, /, volume_ids: list[str]) -> None:
+ """Perform volume commit for given `volume_ids`.
+ Only used on container exit to persist uncommitted changes on behalf of user.
+ """
+ ...

  volume_commit: __volume_commit_spec[typing_extensions.Self]

@@ -380,13 +554,34 @@ class ContainerIOManager:
  @property
  def input_concurrency_enabled(self) -> int: ...
  @classmethod
- def get_input_concurrency(cls) -> int: ...
+ def get_input_concurrency(cls) -> int:
+ """Returns the number of usable input slots.
+
+ If concurrency is reduced, active slots can exceed allotted slots. Returns the larger value
+ in this case.
+ """
+ ...
+
  @classmethod
- def set_input_concurrency(cls, concurrency: int): ...
+ def set_input_concurrency(cls, concurrency: int):
+ """Edit the number of input slots.
+
+ This disables the background loop which automatically adjusts concurrency
+ within [target_concurrency, max_concurrency].
+ """
+ ...
+
  @classmethod
  def stop_fetching_inputs(cls): ...

- def check_fastapi_pydantic_compatibility(exc: ImportError) -> None: ...
+ def check_fastapi_pydantic_compatibility(exc: ImportError) -> None:
+ """Add a helpful note to an exception that is likely caused by a pydantic<>fastapi version incompatibility.
+
+ We need this becasue the legacy set of container requirements (image_builder_version=2023.12) contains a
+ version of fastapi that is not forwards-compatible with pydantic 2.0+, and users commonly run into issues
+ building an image that specifies a more recent version only for pydantic.
+ """
+ ...

  MAX_OUTPUT_BATCH_SIZE: int
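
The new `check_fastapi_pydantic_compatibility` docstring describes attaching a hint to an `ImportError` that likely comes from a fastapi/pydantic version mismatch. One way such a hint is commonly attached (a sketch; the helper name, message text, and fallback below are illustrative assumptions, not Modal's code) is `BaseException.add_note` on Python 3.11+, with a best-effort fallback for older interpreters:

import traceback

def add_compatibility_hint(exc: ImportError, hint: str) -> None:
    # Attach a human-readable hint so it shows up alongside the traceback.
    if hasattr(exc, "add_note"):  # Python 3.11+
        exc.add_note(hint)
    else:  # fold the hint into the message on older interpreters
        exc.args = (f"{exc.args[0]}\n{hint}",) if exc.args else (hint,)

try:
    raise ImportError("cannot import name 'SomeSymbol' from 'pydantic'")
except ImportError as exc:
    add_compatibility_hint(
        exc,
        "This often indicates a fastapi release that predates pydantic 2.0+; "
        "pin mutually compatible fastapi and pydantic versions in your image.",
    )
    traceback.print_exception(exc)  # notes added via add_note are rendered with the traceback
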
 
@@ -72,22 +72,38 @@ def current_function_call_id() -> Optional[str]:
  return None


- def _set_current_context_ids(input_ids: list[str], function_call_ids: list[str]) -> Callable[[], None]:
- assert len(input_ids) == len(function_call_ids) and len(input_ids) > 0
+ def current_attempt_token() -> Optional[str]:
+ # This ContextVar isn't useful to expose to users.
+ try:
+ return _current_attempt_token.get()
+ except LookupError:
+ return None
+
+
+ def _set_current_context_ids(
+ input_ids: list[str], function_call_ids: list[str], attempt_tokens: list[str]
+ ) -> Callable[[], None]:
+ assert len(input_ids) == len(function_call_ids) == len(attempt_tokens) and input_ids
+
  input_id = input_ids[0]
  function_call_id = function_call_ids[0]
+ attempt_token = attempt_tokens[0]
+
  input_token = _current_input_id.set(input_id)
  function_call_token = _current_function_call_id.set(function_call_id)
+ attempt_token_token = _current_attempt_token.set(attempt_token)

  def _reset_current_context_ids():
  _current_input_id.reset(input_token)
  _current_function_call_id.reset(function_call_token)
+ _current_attempt_token.reset(attempt_token_token)

  return _reset_current_context_ids


  _current_input_id: ContextVar = ContextVar("_current_input_id")
  _current_function_call_id: ContextVar = ContextVar("_current_function_call_id")
+ _current_attempt_token: ContextVar = ContextVar("_current_attempt_token")

  _is_currently_importing = False # we set this to True while a container is importing user code
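
This last hunk (apparently from `modal/_runtime/execution_context.py`, which shows +18 -2 in the file list) extends the runtime's context bookkeeping with a third variable for the attempt token. The set-then-reset-with-token idiom it relies on is standard `contextvars` behavior: `ContextVar.set()` returns a token that restores the previous value. A self-contained sketch of the same pattern with generic names (not Modal's module):

from contextvars import ContextVar
from typing import Callable, Optional

_current_request_id: ContextVar[str] = ContextVar("_current_request_id")

def current_request_id() -> Optional[str]:
    try:
        return _current_request_id.get()
    except LookupError:  # nothing has been set in this context yet
        return None

def set_current_request_id(request_id: str) -> Callable[[], None]:
    # ContextVar.set() returns a Token that restores the *previous* value,
    # which makes temporary overrides (and nested calls) safe to unwind.
    token = _current_request_id.set(request_id)

    def reset() -> None:
        _current_request_id.reset(token)

    return reset

reset = set_current_request_id("req-123")
assert current_request_id() == "req-123"
reset()
assert current_request_id() is None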