PyPI - modal - Versions diffs - 1.0.3.dev10__py3-none-any.whl → 1.2.3.dev7__py3-none-any.whl - Mend

modal 1.0.3.dev10__py3-none-any.whl → 1.2.3.dev7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of modal might be problematic. Click here for more details.

Files changed (160) hide show

modal/__init__.py +0 -2
modal/__main__.py +3 -4
modal/_billing.py +80 -0
modal/_clustered_functions.py +7 -3
modal/_clustered_functions.pyi +15 -3
modal/_container_entrypoint.py +51 -69
modal/_functions.py +508 -240
modal/_grpc_client.py +171 -0
modal/_load_context.py +105 -0
modal/_object.py +81 -21
modal/_output.py +58 -45
modal/_partial_function.py +48 -73
modal/_pty.py +7 -3
modal/_resolver.py +26 -46
modal/_runtime/asgi.py +4 -3
modal/_runtime/container_io_manager.py +358 -220
modal/_runtime/container_io_manager.pyi +296 -101
modal/_runtime/execution_context.py +18 -2
modal/_runtime/execution_context.pyi +64 -7
modal/_runtime/gpu_memory_snapshot.py +262 -57
modal/_runtime/user_code_imports.py +28 -58
modal/_serialization.py +90 -6
modal/_traceback.py +42 -1
modal/_tunnel.pyi +380 -12
modal/_utils/async_utils.py +84 -29
modal/_utils/auth_token_manager.py +111 -0
modal/_utils/blob_utils.py +181 -58
modal/_utils/deprecation.py +19 -0
modal/_utils/function_utils.py +91 -47
modal/_utils/grpc_utils.py +89 -66
modal/_utils/mount_utils.py +26 -1
modal/_utils/name_utils.py +17 -3
modal/_utils/task_command_router_client.py +536 -0
modal/_utils/time_utils.py +34 -6
modal/app.py +256 -88
modal/app.pyi +909 -92
modal/billing.py +5 -0
modal/builder/2025.06.txt +18 -0
modal/builder/PREVIEW.txt +18 -0
modal/builder/base-images.json +58 -0
modal/cli/_download.py +19 -3
modal/cli/_traceback.py +3 -2
modal/cli/app.py +4 -4
modal/cli/cluster.py +15 -7
modal/cli/config.py +5 -3
modal/cli/container.py +7 -6
modal/cli/dict.py +22 -16
modal/cli/entry_point.py +12 -5
modal/cli/environment.py +5 -4
modal/cli/import_refs.py +3 -3
modal/cli/launch.py +102 -5
modal/cli/network_file_system.py +11 -12
modal/cli/profile.py +3 -2
modal/cli/programs/launch_instance_ssh.py +94 -0
modal/cli/programs/run_jupyter.py +1 -1
modal/cli/programs/run_marimo.py +95 -0
modal/cli/programs/vscode.py +1 -1
modal/cli/queues.py +57 -26
modal/cli/run.py +91 -23
modal/cli/secret.py +48 -22
modal/cli/token.py +7 -8
modal/cli/utils.py +4 -7
modal/cli/volume.py +31 -25
modal/client.py +15 -85
modal/client.pyi +183 -62
modal/cloud_bucket_mount.py +5 -3
modal/cloud_bucket_mount.pyi +197 -5
modal/cls.py +200 -126
modal/cls.pyi +446 -68
modal/config.py +29 -11
modal/container_process.py +319 -19
modal/container_process.pyi +190 -20
modal/dict.py +290 -71
modal/dict.pyi +835 -83
modal/environments.py +15 -27
modal/environments.pyi +46 -24
modal/exception.py +14 -2
modal/experimental/__init__.py +194 -40
modal/experimental/flash.py +618 -0
modal/experimental/flash.pyi +380 -0
modal/experimental/ipython.py +11 -7
modal/file_io.py +29 -36
modal/file_io.pyi +251 -53
modal/file_pattern_matcher.py +56 -16
modal/functions.pyi +673 -92
modal/gpu.py +1 -1
modal/image.py +528 -176
modal/image.pyi +1572 -145
modal/io_streams.py +458 -128
modal/io_streams.pyi +433 -52
modal/mount.py +216 -151
modal/mount.pyi +225 -78
modal/network_file_system.py +45 -62
modal/network_file_system.pyi +277 -56
modal/object.pyi +93 -17
modal/parallel_map.py +942 -129
modal/parallel_map.pyi +294 -15
modal/partial_function.py +0 -2
modal/partial_function.pyi +234 -19
modal/proxy.py +17 -8
modal/proxy.pyi +36 -3
modal/queue.py +270 -65
modal/queue.pyi +817 -57
modal/runner.py +115 -101
modal/runner.pyi +205 -49
modal/sandbox.py +512 -136
modal/sandbox.pyi +845 -111
modal/schedule.py +1 -1
modal/secret.py +300 -70
modal/secret.pyi +589 -34
modal/serving.py +7 -11
modal/serving.pyi +7 -8
modal/snapshot.py +11 -8
modal/snapshot.pyi +25 -4
modal/token_flow.py +4 -4
modal/token_flow.pyi +28 -8
modal/volume.py +416 -158
modal/volume.pyi +1117 -121
{modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/METADATA +10 -9
modal-1.2.3.dev7.dist-info/RECORD +195 -0
modal_docs/mdmd/mdmd.py +17 -4
modal_proto/api.proto +534 -79
modal_proto/api_grpc.py +337 -1
modal_proto/api_pb2.py +1522 -968
modal_proto/api_pb2.pyi +1619 -134
modal_proto/api_pb2_grpc.py +699 -4
modal_proto/api_pb2_grpc.pyi +226 -14
modal_proto/modal_api_grpc.py +175 -154
modal_proto/sandbox_router.proto +145 -0
modal_proto/sandbox_router_grpc.py +105 -0
modal_proto/sandbox_router_pb2.py +149 -0
modal_proto/sandbox_router_pb2.pyi +333 -0
modal_proto/sandbox_router_pb2_grpc.py +203 -0
modal_proto/sandbox_router_pb2_grpc.pyi +75 -0
modal_proto/task_command_router.proto +144 -0
modal_proto/task_command_router_grpc.py +105 -0
modal_proto/task_command_router_pb2.py +149 -0
modal_proto/task_command_router_pb2.pyi +333 -0
modal_proto/task_command_router_pb2_grpc.py +203 -0
modal_proto/task_command_router_pb2_grpc.pyi +75 -0
modal_version/__init__.py +1 -1
modal/requirements/PREVIEW.txt +0 -16
modal/requirements/base-images.json +0 -26
modal-1.0.3.dev10.dist-info/RECORD +0 -179
modal_proto/modal_options_grpc.py +0 -3
modal_proto/options.proto +0 -19
modal_proto/options_grpc.py +0 -3
modal_proto/options_pb2.py +0 -35
modal_proto/options_pb2.pyi +0 -20
modal_proto/options_pb2_grpc.py +0 -4
modal_proto/options_pb2_grpc.pyi +0 -7
/modal/{requirements → builder}/2023.12.312.txt +0 -0
/modal/{requirements → builder}/2023.12.txt +0 -0
/modal/{requirements → builder}/2024.04.txt +0 -0
/modal/{requirements → builder}/2024.10.txt +0 -0
/modal/{requirements → builder}/README.md +0 -0
{modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/WHEEL +0 -0
{modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/entry_points.txt +0 -0
{modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/licenses/LICENSE +0 -0
{modal-1.0.3.dev10.dist-info → modal-1.2.3.dev7.dist-info}/top_level.txt +0 -0

modal/_partial_function.py CHANGED Viewed

@@ -19,7 +19,7 @@ from ._functions import _Function
 from ._utils.async_utils import synchronizer
 from ._utils.deprecation import deprecation_warning
 from ._utils.function_utils import callable_has_non_self_params
-from .config import logger
+from .config import config, logger
 from .exception import InvalidError
 MAX_MAX_BATCH_SIZE = 1000
@@ -31,7 +31,6 @@ if typing.TYPE_CHECKING:
 class _PartialFunctionFlags(enum.IntFlag):
     # Lifecycle method flags
-    BUILD = 1  # Deprecated, will be removed
     ENTER_PRE_SNAPSHOT = 2
     ENTER_POST_SNAPSHOT = 4
     EXIT = 8
@@ -55,8 +54,7 @@ class _PartialFunctionFlags(enum.IntFlag):
     @staticmethod
     def lifecycle_flags() -> int:
         return (
-            _PartialFunctionFlags.BUILD  # Deprecated, will be removed
-            | _PartialFunctionFlags.ENTER_PRE_SNAPSHOT
+            _PartialFunctionFlags.ENTER_PRE_SNAPSHOT
             | _PartialFunctionFlags.ENTER_POST_SNAPSHOT
             | _PartialFunctionFlags.EXIT
         )
@@ -95,6 +93,26 @@ NullaryFuncOrMethod = Union[Callable[[], Any], Callable[[Any], Any]]
 NullaryMethod = Callable[[Any], Any]
+def verify_concurrent_params(params: _PartialFunctionParams, is_flash: bool = False) -> None:
+    def _verify_concurrent_params_with_flash_settings(params: _PartialFunctionParams) -> None:
+        if params.max_concurrent_inputs is not None:
+            raise TypeError(
+                "@modal.concurrent(max_inputs=...) is not yet supported for Flash functions. "
+                "Use `@modal.concurrent(target_inputs=...)` instead."
+            )
+        if params.target_concurrent_inputs is None:
+            raise TypeError("`@modal.concurrent()` missing required argument: `target_inputs`.")
+    def _verify_concurrent_params(params: _PartialFunctionParams) -> None:
+        if params.max_concurrent_inputs is None:
+            raise TypeError("`@modal.concurrent()` missing required argument: `max_inputs`.")
+    if is_flash:
+        _verify_concurrent_params_with_flash_settings(params)
+    else:
+        _verify_concurrent_params(params)
 class _PartialFunction(typing.Generic[P, ReturnType, OriginalReturnType]):
     """Object produced by a decorator in the `modal` namespace
@@ -284,7 +302,7 @@ class _MethodDecoratorType:
 # TODO(elias): fix support for coroutine type unwrapping for methods (static typing)
 def _method(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     # Set this to True if it's a non-generator function returning
     # a [sync/async] generator object
@@ -339,7 +357,7 @@ def _parse_custom_domains(custom_domains: Optional[Iterable[str]] = None) -> lis
 def _fastapi_endpoint(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     method: str = "GET",  # REST method for the created endpoint.
     label: Optional[str] = None,  # Label for created endpoint. Final subdomain will be <workspace>--<label>.modal.run.
@@ -380,6 +398,7 @@ def _fastapi_endpoint(
         method=method,
         web_endpoint_docs=docs,
         requested_suffix=label or "",
+        ephemeral_suffix=config.get("dev_suffix"),
         async_mode=api_pb2.WEBHOOK_ASYNC_MODE_AUTO,
         custom_domains=_parse_custom_domains(custom_domains),
         requires_proxy_auth=requires_proxy_auth,
@@ -402,7 +421,7 @@ def _fastapi_endpoint(
 def _web_endpoint(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     method: str = "GET",  # REST method for the created endpoint.
     label: Optional[str] = None,  # Label for created endpoint. Final subdomain will be <workspace>--<label>.modal.run.
@@ -448,6 +467,7 @@ def _web_endpoint(
         method=method,
         web_endpoint_docs=docs,
         requested_suffix=label or "",
+        ephemeral_suffix=config.get("dev_suffix"),
         async_mode=api_pb2.WEBHOOK_ASYNC_MODE_AUTO,
         custom_domains=_parse_custom_domains(custom_domains),
         requires_proxy_auth=requires_proxy_auth,
@@ -470,7 +490,7 @@ def _web_endpoint(
 def _asgi_app(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     label: Optional[str] = None,  # Label for created endpoint. Final subdomain will be <workspace>--<label>.modal.run.
     custom_domains: Optional[Iterable[str]] = None,  # Deploy this endpoint on a custom domain.
@@ -507,6 +527,7 @@ def _asgi_app(
     webhook_config = api_pb2.WebhookConfig(
         type=api_pb2.WEBHOOK_TYPE_ASGI_APP,
         requested_suffix=label or "",
+        ephemeral_suffix=config.get("dev_suffix"),
         async_mode=api_pb2.WEBHOOK_ASYNC_MODE_AUTO,
         custom_domains=_parse_custom_domains(custom_domains),
         requires_proxy_auth=requires_proxy_auth,
@@ -527,7 +548,7 @@ def _asgi_app(
 def _wsgi_app(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     label: Optional[str] = None,  # Label for created endpoint. Final subdomain will be <workspace>--<label>.modal.run.
     custom_domains: Optional[Iterable[str]] = None,  # Deploy this endpoint on a custom domain.
@@ -538,7 +559,7 @@ def _wsgi_app(
     Web Server Gateway Interface (WSGI) is a standard for synchronous Python web apps.
     It has been [succeeded by the ASGI interface](https://asgi.readthedocs.io/en/latest/introduction.html#wsgi-compatibility)
     which is compatible with ASGI and supports additional functionality such as web sockets.
-    Modal supports ASGI via [`asgi_app`](/docs/reference/modal.asgi_app).
+    Modal supports ASGI via [`asgi_app`](https://modal.com/docs/reference/modal.asgi_app).
     **Usage:**
@@ -564,6 +585,7 @@ def _wsgi_app(
     webhook_config = api_pb2.WebhookConfig(
         type=api_pb2.WEBHOOK_TYPE_WSGI_APP,
         requested_suffix=label or "",
+        ephemeral_suffix=config.get("dev_suffix"),
         async_mode=api_pb2.WEBHOOK_ASYNC_MODE_AUTO,
         custom_domains=_parse_custom_domains(custom_domains),
         requires_proxy_auth=requires_proxy_auth,
@@ -625,6 +647,7 @@ def _web_server(
     webhook_config = api_pb2.WebhookConfig(
         type=api_pb2.WEBHOOK_TYPE_WEB_SERVER,
         requested_suffix=label or "",
+        ephemeral_suffix=config.get("dev_suffix"),
         async_mode=api_pb2.WEBHOOK_ASYNC_MODE_AUTO,
         custom_domains=_parse_custom_domains(custom_domains),
         web_server_port=port,
@@ -646,61 +669,8 @@ def _web_server(
     return wrapper
-def _build(
-    _warn_parentheses_missing=None, *, force: bool = False, timeout: int = 86400
-) -> Callable[[Union[_PartialFunction, NullaryMethod]], _PartialFunction]:
-    """mdmd:hidden
-    Decorator for methods that execute at _build time_ to create a new Image layer.
-    **Deprecated**: This function is deprecated. We recommend using `modal.Volume`
-    to store large assets (such as model weights) instead of writing them to the
-    Image during the build process. For other use cases, you can replace this
-    decorator with the `Image.run_function` method.
-    **Usage**
-    ```python notest
-    @app.cls(gpu="A10G")
-    class AlpacaLoRAModel:
-        @build()
-        def download_models(self):
-            model = LlamaForCausalLM.from_pretrained(
-                base_model,
-            )
-            PeftModel.from_pretrained(model, lora_weights)
-            LlamaTokenizer.from_pretrained(base_model)
-    ```
-    """
-    if _warn_parentheses_missing is not None:
-        raise InvalidError(
-            "Positional arguments are not allowed. Did you forget parentheses? Suggestion: `@modal.build()`."
-        )
-    deprecation_warning(
-        (2025, 1, 15),
-        "The `@modal.build` decorator is deprecated and will be removed in a future release."
-        "\n\nWe now recommend storing large assets (such as model weights) using a `modal.Volume`"
-        " instead of writing them directly into the `modal.Image` filesystem."
-        " For other use cases we recommend using `Image.run_function` instead."
-        "\n\nSee https://modal.com/docs/guide/modal-1-0-migration for more information.",
-    )
-    flags = _PartialFunctionFlags.BUILD
-    params = _PartialFunctionParams(force_build=force, build_timeout=timeout)
-    def wrapper(obj: Union[_PartialFunction, NullaryMethod]) -> _PartialFunction:
-        if isinstance(obj, _PartialFunction):
-            pf = obj.stack(flags, params)
-        else:
-            pf = _PartialFunction(obj, flags, params)
-        pf.validate_obj_compatibility("build")
-        return pf
-    return wrapper
 def _enter(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     snap: bool = False,
 ) -> Callable[[Union[_PartialFunction, NullaryMethod]], _PartialFunction]:
@@ -751,7 +721,7 @@ def _exit(_warn_parentheses_missing=None) -> Callable[[NullaryMethod], _PartialF
 def _batched(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
     max_batch_size: int,
     wait_ms: int,
@@ -789,12 +759,12 @@ def _batched(
         )
     if max_batch_size < 1:
         raise InvalidError("max_batch_size must be a positive integer.")
-    if max_batch_size >= MAX_MAX_BATCH_SIZE:
-        raise InvalidError(f"max_batch_size must be less than {MAX_MAX_BATCH_SIZE}.")
+    if max_batch_size > MAX_MAX_BATCH_SIZE:
+        raise InvalidError(f"max_batch_size cannot be greater than {MAX_MAX_BATCH_SIZE}.")
     if wait_ms < 0:
         raise InvalidError("wait_ms must be a non-negative integer.")
-    if wait_ms >= MAX_BATCH_WAIT_MS:
-        raise InvalidError(f"wait_ms must be less than {MAX_BATCH_WAIT_MS}.")
+    if wait_ms > MAX_BATCH_WAIT_MS:
+        raise InvalidError(f"wait_ms cannot be greater than {MAX_BATCH_WAIT_MS}.")
     flags = _PartialFunctionFlags.CALLABLE_INTERFACE | _PartialFunctionFlags.BATCHED
     params = _PartialFunctionParams(batch_max_size=max_batch_size, batch_wait_ms=wait_ms)
@@ -813,9 +783,9 @@ def _batched(
 def _concurrent(
-    _warn_parentheses_missing=None,
+    _warn_parentheses_missing=None,  # mdmd:line-hidden
     *,
-    max_inputs: int,  # Hard limit on each container's input concurrency
+    max_inputs: Optional[int] = None,  # Hard limit on each container's input concurrency
     target_inputs: Optional[int] = None,  # Input concurrency that Modal's autoscaler should target
 ) -> Callable[
     [Union[Callable[P, ReturnType], _PartialFunction[P, ReturnType, ReturnType]]],
@@ -867,7 +837,7 @@ def _concurrent(
             "Positional arguments are not allowed. Did you forget parentheses? Suggestion: `@modal.concurrent()`."
         )
-    if target_inputs and target_inputs > max_inputs:
+    if max_inputs is not None and target_inputs is not None and target_inputs > max_inputs:
         raise InvalidError("`target_inputs` parameter cannot be greater than `max_inputs`.")
     flags = _PartialFunctionFlags.CONCURRENT
@@ -891,7 +861,12 @@ def _concurrent(
 # NOTE: clustered is currently exposed through modal.experimental, not the top-level namespace
-def _clustered(size: int, broadcast: bool = True, rdma: bool = False):
+def _clustered(
+    size: int, broadcast: bool = True, rdma: bool = False
+) -> Callable[
+    [Union[Callable[P, ReturnType], _PartialFunction[P, ReturnType, ReturnType]]],
+    _PartialFunction[P, ReturnType, ReturnType],
+]:
     """Provision clusters of colocated and networked containers for the Function.
     Parameters:

modal/_pty.py CHANGED Viewed

@@ -7,8 +7,11 @@ from typing import Optional
 from modal_proto import api_pb2
-def get_winsz(fd) -> tuple[Optional[int], Optional[int]]:
+def get_winsz(fd=None) -> tuple[Optional[int], Optional[int]]:
     try:
+        if fd is None:
+            fd = sys.stdin.fileno()
         import fcntl
         import struct
         import termios
@@ -40,8 +43,8 @@ def raw_terminal():
         termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
-def get_pty_info(shell: bool) -> api_pb2.PTYInfo:
-    rows, cols = get_winsz(sys.stdin.fileno())
+def get_pty_info(shell: bool, no_terminate_on_idle_stdin: bool = False) -> api_pb2.PTYInfo:
+    rows, cols = get_winsz()
     return api_pb2.PTYInfo(
         enabled=True,  # TODO(erikbern): deprecated
         winsz_rows=rows,
@@ -50,4 +53,5 @@ def get_pty_info(shell: bool) -> api_pb2.PTYInfo:
         env_colorterm=os.environ.get("COLORTERM"),
         env_term_program=os.environ.get("TERM_PROGRAM"),
         pty_type=api_pb2.PTYInfo.PTY_TYPE_SHELL if shell else api_pb2.PTYInfo.PTY_TYPE_FUNCTION,
+        no_terminate_on_idle_stdin=no_terminate_on_idle_stdin,
     )

modal/_resolver.py CHANGED Viewed

@@ -8,19 +8,16 @@ from asyncio import Future
 from collections.abc import Hashable
 from typing import TYPE_CHECKING, Optional
-from grpclib import GRPCError, Status
+import modal._object
+from modal._traceback import suppress_tb_frames
 from modal_proto import api_pb2
+from ._load_context import LoadContext
 from ._utils.async_utils import TaskContext
-from .client import _Client
-from .exception import NotFoundError
 if TYPE_CHECKING:
     from rich.tree import Tree
-    import modal._object
 class StatusRow:
     def __init__(self, progress: "typing.Optional[Tree]"):
@@ -50,19 +47,10 @@ class StatusRow:
 class Resolver:
     _local_uuid_to_future: dict[str, Future]
-    _environment_name: Optional[str]
-    _app_id: Optional[str]
     _deduplication_cache: dict[Hashable, Future]
-    _client: _Client
     _build_start: float
-    def __init__(
-        self,
-        client: _Client,
-        *,
-        environment_name: Optional[str] = None,
-        app_id: Optional[str] = None,
-    ):
+    def __init__(self):
         try:
             # TODO(michael) If we don't clean this up more thoroughly, it would probably
             # be good to have a single source of truth for "rich is installed" rather than
@@ -77,9 +65,6 @@ class Resolver:
         self._local_uuid_to_future = {}
         self._tree = tree
-        self._client = client
-        self._app_id = app_id
-        self._environment_name = environment_name
         self._deduplication_cache = {}
         with tempfile.TemporaryFile() as temp_file:
@@ -87,27 +72,24 @@ class Resolver:
             # to the mtime on mounted files, and want those measurements to have the same resolution.
             self._build_start = os.fstat(temp_file.fileno()).st_mtime
-    @property
-    def app_id(self) -> Optional[str]:
-        return self._app_id
-    @property
-    def client(self):
-        return self._client
-    @property
-    def environment_name(self):
-        return self._environment_name
     @property
     def build_start(self) -> float:
         return self._build_start
-    async def preload(self, obj, existing_object_id: Optional[str]):
+    async def preload(
+        self, obj: "modal._object._Object", parent_load_context: "LoadContext", existing_object_id: Optional[str]
+    ):
         if obj._preload is not None:
-            await obj._preload(obj, self, existing_object_id)
+            load_context = obj._load_context_overrides.merged_with(parent_load_context)
+            await obj._preload(obj, self, load_context, existing_object_id)
-    async def load(self, obj: "modal._object._Object", existing_object_id: Optional[str] = None):
+    async def load(
+        self,
+        obj: "modal._object._Object",
+        parent_load_context: "LoadContext",
+        *,
+        existing_object_id: Optional[str] = None,
+    ):
         if obj._is_hydrated and obj._is_another_app:
             # No need to reload this, it won't typically change
             if obj.local_uuid not in self._local_uuid_to_future:
@@ -131,25 +113,23 @@ class Resolver:
             cached_future = self._deduplication_cache.get(deduplication_key)
             if cached_future:
                 hydrated_object = await cached_future
-                obj._hydrate(hydrated_object.object_id, self._client, hydrated_object._get_metadata())
+                # Use the client from the already-hydrated object
+                obj._hydrate(hydrated_object.object_id, hydrated_object.client, hydrated_object._get_metadata())
                 return obj
         if not cached_future:
             # don't run any awaits within this if-block to prevent race conditions
             async def loader():
-                # Wait for all its dependencies
+                load_context = await obj._load_context_overrides.merged_with(parent_load_context).apply_defaults()
                 # TODO(erikbern): do we need existing_object_id for those?
-                await TaskContext.gather(*[self.load(dep) for dep in obj.deps()])
+                await TaskContext.gather(*[self.load(dep, load_context) for dep in obj.deps()])
                 # Load the object itself
                 if not obj._load:
                     raise Exception(f"Object {obj} has no loader function")
-                try:
-                    await obj._load(obj, self, existing_object_id)
-                except GRPCError as exc:
-                    if exc.status == Status.NOT_FOUND:
-                        raise NotFoundError(exc.message)
-                    raise
+                await obj._load(obj, self, load_context, existing_object_id)
                 # Check that the id of functions didn't change
                 # Persisted refs are ignored because their life cycle is managed independently.
@@ -169,9 +149,9 @@ class Resolver:
             self._local_uuid_to_future[obj.local_uuid] = cached_future
             if deduplication_key is not None:
                 self._deduplication_cache[deduplication_key] = cached_future
-        # TODO(elias): print original exception/trace rather than the Resolver-internal trace
-        return await cached_future
+        with suppress_tb_frames(2):
+            # skip current frame + `loader()` closure frame from above
+            return await cached_future
     def objects(self) -> list["modal._object._Object"]:
         unique_objects: dict[str, "modal._object._Object"] = {}

modal/_runtime/asgi.py CHANGED Viewed

@@ -16,7 +16,7 @@ from modal.config import logger
 from modal.exception import ExecutionError, InvalidError
 from modal.experimental import stop_fetching_inputs
-from .execution_context import current_function_call_id
+from .execution_context import current_attempt_token, current_function_call_id
 FIRST_MESSAGE_TIMEOUT_SECONDS = 5.0
@@ -106,6 +106,7 @@ def asgi_app_wrapper(asgi_app, container_io_manager) -> tuple[Callable[..., Asyn
             raise ExecutionError("Unpexected state in ASGI scope")
         scope["state"] = state
         function_call_id = current_function_call_id()
+        attempt_token = current_attempt_token()
         assert function_call_id, "internal error: function_call_id not set in asgi_app() scope"
         messages_from_app: asyncio.Queue[dict[str, Any]] = asyncio.Queue(1)
@@ -119,7 +120,7 @@ def asgi_app_wrapper(asgi_app, container_io_manager) -> tuple[Callable[..., Asyn
         async def handle_first_input_timeout():
             if scope["type"] == "http":
-                await messages_from_app.put({"type": "http.response.start", "status": 502})
+                await messages_from_app.put({"type": "http.response.start", "status": 408})
                 await messages_from_app.put(
                     {
                         "type": "http.response.body",
@@ -142,7 +143,7 @@ def asgi_app_wrapper(asgi_app, container_io_manager) -> tuple[Callable[..., Asyn
             # This initial message, "http.request" or "websocket.connect", should be sent
             # immediately after starting the ASGI app's function call. If it is not received, that
             # indicates a request cancellation or other abnormal circumstance.
-            message_gen = container_io_manager.get_data_in.aio(function_call_id)
+            message_gen = container_io_manager.get_data_in.aio(function_call_id, attempt_token)
             first_message_task = asyncio.create_task(message_gen.__anext__())
             try:

modal 1.0.3.dev10__py3-none-any.whl → 1.2.3.dev7__py3-none-any.whl

Potentially problematic release.

modal 1.0.3.dev10__py3-none-any.whl → 1.2.3.dev7__py3-none-any.whl