modal 1.1.5.dev66__py3-none-any.whl → 1.3.1.dev8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of modal might be problematic. See the package registry's advisory listing for more details.

Files changed (143)
  1. modal/__init__.py +4 -4
  2. modal/__main__.py +4 -29
  3. modal/_billing.py +84 -0
  4. modal/_clustered_functions.py +1 -3
  5. modal/_container_entrypoint.py +33 -208
  6. modal/_functions.py +171 -138
  7. modal/_grpc_client.py +191 -0
  8. modal/_ipython.py +16 -6
  9. modal/_load_context.py +106 -0
  10. modal/_object.py +72 -21
  11. modal/_output.py +12 -14
  12. modal/_partial_function.py +31 -4
  13. modal/_resolver.py +44 -57
  14. modal/_runtime/container_io_manager.py +30 -28
  15. modal/_runtime/container_io_manager.pyi +42 -44
  16. modal/_runtime/gpu_memory_snapshot.py +9 -7
  17. modal/_runtime/user_code_event_loop.py +80 -0
  18. modal/_runtime/user_code_imports.py +236 -10
  19. modal/_serialization.py +2 -1
  20. modal/_traceback.py +4 -13
  21. modal/_tunnel.py +16 -11
  22. modal/_tunnel.pyi +25 -3
  23. modal/_utils/async_utils.py +337 -10
  24. modal/_utils/auth_token_manager.py +1 -4
  25. modal/_utils/blob_utils.py +29 -22
  26. modal/_utils/function_utils.py +20 -21
  27. modal/_utils/grpc_testing.py +6 -3
  28. modal/_utils/grpc_utils.py +223 -64
  29. modal/_utils/mount_utils.py +26 -1
  30. modal/_utils/name_utils.py +2 -3
  31. modal/_utils/package_utils.py +0 -1
  32. modal/_utils/rand_pb_testing.py +8 -1
  33. modal/_utils/task_command_router_client.py +524 -0
  34. modal/_vendor/cloudpickle.py +144 -48
  35. modal/app.py +285 -105
  36. modal/app.pyi +216 -53
  37. modal/billing.py +5 -0
  38. modal/builder/2025.06.txt +6 -3
  39. modal/builder/PREVIEW.txt +2 -1
  40. modal/builder/base-images.json +4 -2
  41. modal/cli/_download.py +19 -3
  42. modal/cli/cluster.py +4 -2
  43. modal/cli/config.py +3 -1
  44. modal/cli/container.py +5 -4
  45. modal/cli/dict.py +5 -2
  46. modal/cli/entry_point.py +26 -2
  47. modal/cli/environment.py +2 -16
  48. modal/cli/launch.py +1 -76
  49. modal/cli/network_file_system.py +5 -20
  50. modal/cli/programs/run_jupyter.py +1 -1
  51. modal/cli/programs/vscode.py +1 -1
  52. modal/cli/queues.py +5 -4
  53. modal/cli/run.py +24 -204
  54. modal/cli/secret.py +1 -2
  55. modal/cli/shell.py +375 -0
  56. modal/cli/utils.py +1 -13
  57. modal/cli/volume.py +11 -17
  58. modal/client.py +16 -125
  59. modal/client.pyi +94 -144
  60. modal/cloud_bucket_mount.py +3 -1
  61. modal/cloud_bucket_mount.pyi +4 -0
  62. modal/cls.py +101 -64
  63. modal/cls.pyi +9 -8
  64. modal/config.py +21 -1
  65. modal/container_process.py +288 -12
  66. modal/container_process.pyi +99 -38
  67. modal/dict.py +72 -33
  68. modal/dict.pyi +88 -57
  69. modal/environments.py +16 -8
  70. modal/environments.pyi +6 -2
  71. modal/exception.py +154 -16
  72. modal/experimental/__init__.py +24 -53
  73. modal/experimental/flash.py +161 -74
  74. modal/experimental/flash.pyi +97 -49
  75. modal/file_io.py +50 -92
  76. modal/file_io.pyi +117 -89
  77. modal/functions.pyi +70 -87
  78. modal/image.py +82 -47
  79. modal/image.pyi +51 -30
  80. modal/io_streams.py +500 -149
  81. modal/io_streams.pyi +279 -189
  82. modal/mount.py +60 -46
  83. modal/mount.pyi +41 -17
  84. modal/network_file_system.py +19 -11
  85. modal/network_file_system.pyi +72 -39
  86. modal/object.pyi +114 -22
  87. modal/parallel_map.py +42 -44
  88. modal/parallel_map.pyi +9 -17
  89. modal/partial_function.pyi +4 -2
  90. modal/proxy.py +14 -6
  91. modal/proxy.pyi +10 -2
  92. modal/queue.py +45 -38
  93. modal/queue.pyi +88 -52
  94. modal/runner.py +96 -96
  95. modal/runner.pyi +44 -27
  96. modal/sandbox.py +225 -107
  97. modal/sandbox.pyi +226 -60
  98. modal/secret.py +58 -56
  99. modal/secret.pyi +28 -13
  100. modal/serving.py +7 -11
  101. modal/serving.pyi +7 -8
  102. modal/snapshot.py +29 -15
  103. modal/snapshot.pyi +18 -10
  104. modal/token_flow.py +1 -1
  105. modal/token_flow.pyi +4 -6
  106. modal/volume.py +102 -55
  107. modal/volume.pyi +125 -66
  108. {modal-1.1.5.dev66.dist-info → modal-1.3.1.dev8.dist-info}/METADATA +10 -9
  109. modal-1.3.1.dev8.dist-info/RECORD +189 -0
  110. modal_proto/api.proto +141 -70
  111. modal_proto/api_grpc.py +42 -26
  112. modal_proto/api_pb2.py +1123 -1103
  113. modal_proto/api_pb2.pyi +331 -83
  114. modal_proto/api_pb2_grpc.py +80 -48
  115. modal_proto/api_pb2_grpc.pyi +26 -18
  116. modal_proto/modal_api_grpc.py +175 -174
  117. modal_proto/task_command_router.proto +164 -0
  118. modal_proto/task_command_router_grpc.py +138 -0
  119. modal_proto/task_command_router_pb2.py +180 -0
  120. modal_proto/{sandbox_router_pb2.pyi → task_command_router_pb2.pyi} +148 -57
  121. modal_proto/task_command_router_pb2_grpc.py +272 -0
  122. modal_proto/task_command_router_pb2_grpc.pyi +100 -0
  123. modal_version/__init__.py +1 -1
  124. modal_version/__main__.py +1 -1
  125. modal/cli/programs/launch_instance_ssh.py +0 -94
  126. modal/cli/programs/run_marimo.py +0 -95
  127. modal-1.1.5.dev66.dist-info/RECORD +0 -191
  128. modal_proto/modal_options_grpc.py +0 -3
  129. modal_proto/options.proto +0 -19
  130. modal_proto/options_grpc.py +0 -3
  131. modal_proto/options_pb2.py +0 -35
  132. modal_proto/options_pb2.pyi +0 -20
  133. modal_proto/options_pb2_grpc.py +0 -4
  134. modal_proto/options_pb2_grpc.pyi +0 -7
  135. modal_proto/sandbox_router.proto +0 -125
  136. modal_proto/sandbox_router_grpc.py +0 -89
  137. modal_proto/sandbox_router_pb2.py +0 -128
  138. modal_proto/sandbox_router_pb2_grpc.py +0 -169
  139. modal_proto/sandbox_router_pb2_grpc.pyi +0 -63
  140. {modal-1.1.5.dev66.dist-info → modal-1.3.1.dev8.dist-info}/WHEEL +0 -0
  141. {modal-1.1.5.dev66.dist-info → modal-1.3.1.dev8.dist-info}/entry_points.txt +0 -0
  142. {modal-1.1.5.dev66.dist-info → modal-1.3.1.dev8.dist-info}/licenses/LICENSE +0 -0
  143. {modal-1.1.5.dev66.dist-info → modal-1.3.1.dev8.dist-info}/top_level.txt +0 -0
@@ -1,12 +1,16 @@
1
1
  # Copyright Modal Labs 2022
2
2
  import asyncio
3
3
  import concurrent.futures
4
+ import contextlib
4
5
  import functools
5
6
  import inspect
6
7
  import itertools
8
+ import os
7
9
  import sys
8
10
  import time
11
+ import types
9
12
  import typing
13
+ import warnings
10
14
  from collections.abc import AsyncGenerator, AsyncIterable, Awaitable, Iterable, Iterator
11
15
  from contextlib import asynccontextmanager
12
16
  from dataclasses import dataclass
@@ -22,10 +26,14 @@ from typing import (
22
26
 
23
27
  import synchronicity
24
28
  from synchronicity.async_utils import Runner
29
+ from synchronicity.combined_types import MethodWithAio
25
30
  from synchronicity.exceptions import NestedEventLoops
26
31
  from typing_extensions import ParamSpec, assert_type
27
32
 
28
- from ..exception import InvalidError
33
+ from modal._ipython import is_interactive_ipython
34
+ from modal._utils.deprecation import deprecation_warning
35
+
36
+ from ..exception import AsyncUsageWarning, InvalidError
29
37
  from .logger import logger
30
38
 
31
39
  T = TypeVar("T")
@@ -36,7 +44,285 @@ if sys.platform == "win32":
36
44
  # quick workaround for deadlocks on shutdown - need to investigate further
37
45
  asyncio.set_event_loop_policy(asyncio.WindowsSelectorEventLoopPolicy())
38
46
 
39
- synchronizer = synchronicity.Synchronizer()
47
+
48
+ def rewrite_sync_to_async(code_line: str, original_func: Callable) -> tuple[bool, str]:
49
+ """
50
+ Rewrite a blocking call to use async/await syntax.
51
+
52
+ Handles four patterns:
53
+ 1. __aiter__: for x in obj -> async for x in obj
54
+ 2. __aenter__: with obj as x -> async with obj as x
55
+ 3. Async generators in for loops: for x in obj.method(...) -> async for x in obj.method(...)
56
+ 4. Regular methods: obj.method() -> await obj.method.aio()
57
+
58
+ Args:
59
+ code_line: The line of code containing the blocking call
60
+ original_func: The original function object being called
61
+
62
+ Returns:
63
+ A tuple of (success, rewritten_code):
64
+ - success: True if the pattern was found and rewritten, False if falling back to generic
65
+ - rewritten_code: The rewritten code or a generic suggestion
66
+ """
67
+ import re
68
+
69
+ func_name = original_func.__name__ # type: ignore
70
+
71
+ # Check if this is an async generator function
72
+ is_async_gen = inspect.isasyncgenfunction(original_func)
73
+
74
+ # Handle __aiter__ pattern: for x in obj -> async for x in obj
75
+ if func_name == "__aiter__" and code_line.startswith("for "):
76
+ suggestion = code_line.replace("for ", "async for ", 1)
77
+ return (True, suggestion)
78
+
79
+ # Handle __aenter__ pattern: with obj as x -> async with obj as x
80
+ if func_name == "__aenter__" and code_line.startswith("with "):
81
+ suggestion = code_line.replace("with ", "async with ", 1)
82
+ return (True, suggestion)
83
+
84
+ # Handle __setitem__ pattern: dct['key'] = value -> suggest alternative
85
+ if func_name == "__setitem__":
86
+ # Try to extract the object and key from the bracket syntax
87
+ setitem_match = re.match(r"(\w+)\[([^\]]+)\]\s*=\s*(.+)", code_line.strip())
88
+ if setitem_match:
89
+ obj, key, value = setitem_match.groups()
90
+ suggestion = (
91
+ f"You can't use `{obj}[{key}] = {value}` syntax asynchronously - "
92
+ f"there may be an alternative api, e.g. {obj}.put.aio({key}, {value})"
93
+ )
94
+ return (False, suggestion)
95
+ return (False, f"await ...{func_name}.aio(...)")
96
+
97
+ # Handle __getitem__ pattern: dct['key'] -> suggest alternative
98
+ if func_name == "__getitem__":
99
+ # Try to extract the object and key from the bracket syntax
100
+ getitem_match = re.match(r"(\w+)\[([^\]]+)\]$", code_line.strip())
101
+ if getitem_match:
102
+ obj, key = getitem_match.groups()
103
+ suggestion = (
104
+ f"You can't use `{obj}[{key}]` syntax asynchronously - "
105
+ f"there may be an alternative api, e.g. {obj}.get.aio({key})"
106
+ )
107
+ return (False, suggestion)
108
+ return (False, f"await ...{func_name}.aio(...)")
109
+
110
+ # Handle async generator methods in for loops: for x in obj.method(...) -> async for x in obj.method(...)
111
+ if is_async_gen and code_line.strip().startswith("for "):
112
+ # Pattern: for <var> in <expr>.<method>(<args>):
113
+ for_pattern = rf"(for\s+\w+\s+in\s+.*\.){re.escape(func_name)}(\s*\()"
114
+ for_match = re.search(for_pattern, code_line)
115
+
116
+ if for_match:
117
+ # Just replace "for" with "async for" - no .aio() needed for async generators
118
+ suggestion = code_line.replace("for ", "async for ", 1)
119
+ return (True, suggestion)
120
+
121
+ # Handle regular method calls and property access
122
+ # First check if it's a property access (no parentheses after the name)
123
+ property_pattern = rf"\.{re.escape(func_name)}(?!\s*\()"
124
+ property_match = re.search(property_pattern, code_line)
125
+
126
+ if property_match:
127
+ # This is a property access, rewrite to use await without .aio()
128
+ # Find the start of the expression (skip statement keywords and assignments)
129
+ statement_start = 0
130
+ prefix_match = re.match(r"^(\s*(?:\w+\s*=|return|yield|raise)\s+)", code_line)
131
+ if prefix_match:
132
+ statement_start = len(prefix_match.group(1))
133
+
134
+ before_expr = code_line[:statement_start]
135
+ after_prefix = code_line[statement_start:]
136
+
137
+ # Just add await before the expression for properties
138
+ suggestion = before_expr + "await " + after_prefix.lstrip()
139
+ return (True, suggestion)
140
+
141
+ # Try to find a method call (with parentheses)
142
+ method_pattern = rf"\.{re.escape(func_name)}\s*\("
143
+ method_match = re.search(method_pattern, code_line)
144
+
145
+ if not method_match:
146
+ # Can't find the function call or property
147
+ return (False, f"await ...{func_name}.aio(...)")
148
+
149
+ # Safety check: don't attempt rewrite for complex expressions
150
+ unsafe_keywords = ["if", "elif", "while", "and", "or", "not", "in", "is", "for"]
151
+
152
+ # Check if line contains control flow keywords (might be too complex)
153
+ for keyword in unsafe_keywords:
154
+ if re.search(rf"\b{keyword}\b", code_line):
155
+ # Fall back to generic suggestion for complex expressions
156
+ return (False, f"await ...{func_name}.aio(...)")
157
+
158
+ # Find the start of the object expression that leads to the method call
159
+ # We need to find where the object/chain starts, e.g., in "2 * foo.bar.method()" we want "foo"
160
+ # Work backwards from the method match to find the start of the identifier chain
161
+ method_start = method_match.start()
162
+
163
+ # Find the start of the identifier chain (the object being called)
164
+ # Walk backwards to find identifiers and dots that form the chain
165
+ expr_start = method_start
166
+ i = method_start - 1
167
+ while i >= 0:
168
+ c = code_line[i]
169
+ if c.isalnum() or c == "_" or c == ".":
170
+ expr_start = i
171
+ i -= 1
172
+ elif c.isspace():
173
+ # Skip whitespace within the chain (though unusual)
174
+ i -= 1
175
+ else:
176
+ # Found a non-identifier character, stop
177
+ break
178
+
179
+ # Now expr_start points to the start of the object chain (e.g., "foo" in "foo.method()")
180
+ # But we need to check if the identifier we found is actually a keyword like return/yield/raise
181
+ # In that case, skip over it and find the actual object
182
+ before_obj = code_line[:expr_start]
183
+ obj_and_rest = code_line[expr_start:]
184
+
185
+ # Check if what we found starts with a statement keyword
186
+ keyword_match = re.match(r"^(return|yield|raise)\s+", obj_and_rest)
187
+ if keyword_match:
188
+ # The "object" we found is actually a keyword, adjust to skip it
189
+ keyword_len = len(keyword_match.group(0))
190
+ before_obj = code_line[: expr_start + keyword_len]
191
+ obj_and_rest = code_line[expr_start + keyword_len :]
192
+
193
+ # Add .aio() after the method name and await before the object
194
+ rewritten_expr = re.sub(rf"(\.{re.escape(func_name)})\s*\(", r"\1.aio(", obj_and_rest, count=1)
195
+ suggestion = before_obj + "await " + rewritten_expr
196
+
197
+ return (True, suggestion)
198
+
199
+
200
+ @dataclass
201
+ class _CallFrame:
202
+ """Simple dataclass to hold call frame information."""
203
+
204
+ filename: str
205
+ lineno: int
206
+ line: Optional[str]
207
+
208
+
209
+ def _extract_user_call_frame():
210
+ """
211
+ Extract the call frame from user code by filtering out frames from synchronicity and asyncio.
212
+
213
+ Returns a _CallFrame with the filename, line number, and source line, or None if not found.
214
+ """
215
+ import linecache
216
+ import os
217
+
218
+ # Get the current call stack
219
+ stack = inspect.stack()
220
+
221
+ # Get the absolute path of this module to filter it out
222
+ this_file = os.path.abspath(__file__)
223
+
224
+ # Filter out frames from synchronicity, asyncio, and this module
225
+ for frame_info in stack:
226
+ filename = frame_info.filename
227
+ # Skip frames from synchronicity, asyncio packages, and this module
228
+ # Use path separators to ensure we're matching packages, not just filenames containing these words
229
+ if (
230
+ os.path.sep + "synchronicity" + os.path.sep in filename
231
+ or os.path.sep + "asyncio" + os.path.sep in filename
232
+ or os.path.abspath(filename) == this_file
233
+ ):
234
+ continue
235
+
236
+ # Found a user frame
237
+ line = linecache.getline(filename, frame_info.lineno)
238
+ return _CallFrame(filename=filename, lineno=frame_info.lineno, line=line if line else None)
239
+
240
+ # Fallback if we can't find a suitable frame
241
+ return None
242
+
243
+
244
+ def _blocking_in_async_warning(original_func: types.FunctionType):
245
+ if is_interactive_ipython():
246
+ # in notebooks or interactive sessions where sync usage is expected
247
+ # even if it's actually running in an event loop
248
+ return
249
+
250
+ import warnings
251
+
252
+ # Skip warnings for __aexit__ and __anext__ - the __aenter__ and __aiter__ warnings are sufficient
253
+ if original_func:
254
+ func_name = getattr(original_func, "__name__", str(original_func))
255
+ if func_name in ("__aexit__", "__anext__"):
256
+ # These dunders would typically already have caused a warning on the __aenter__ or __aiter__ respectively
257
+ return
258
+
259
+ # Extract the call frame from the stack
260
+ call_frame = _extract_user_call_frame()
261
+
262
+ # Build detailed warning message with location and function first
263
+ message_parts = [
264
+ "A blocking Modal interface is being used in an async context.",
265
+ "\n\nThis may cause performance issues or bugs.",
266
+ " Consider rewriting to use Modal's async interfaces:",
267
+ "\nhttps://modal.com/docs/guide/async",
268
+ ]
269
+
270
+ # Generate intelligent suggestion based on the context
271
+ suggestion = None
272
+ code_line = None
273
+
274
+ if original_func and call_frame and call_frame.line:
275
+ code_line = call_frame.line.strip()
276
+ # Use the unified rewrite function for all patterns
277
+ _, suggestion = rewrite_sync_to_async(code_line, original_func)
278
+
279
+ # Add suggestion in "change X to Y" format
280
+ if suggestion and code_line:
281
+ # this is a bit ugly, but the warnings formatter will show the offending source line
282
+ # on the last line regardless what we do, so we add this to not make it look out of place
283
+ message_parts.append(f"\n\nSuggested rewrite:\n {suggestion}\n\nOriginal line:")
284
+
285
+ # Use warn_explicit to provide precise location information from the call frame
286
+ if call_frame:
287
+ # Extract module name from filename, or use a default
288
+ module_name = os.path.splitext(os.path.basename(call_frame.filename))[0]
289
+
290
+ warnings.warn_explicit(
291
+ "".join(message_parts),
292
+ AsyncUsageWarning,
293
+ filename=call_frame.filename,
294
+ lineno=call_frame.lineno,
295
+ module=module_name,
296
+ )
297
+ else:
298
+ # Fallback to regular warn if no frame information available
299
+ warnings.warn("".join(message_parts), AsyncUsageWarning)
300
+
301
+
302
+ def _safe_blocking_in_async_warning(original_func: types.FunctionType):
303
+ """
304
+ Safety wrapper around _blocking_in_async_warning to ensure it never raises exceptions.
305
+
306
+ This is non-critical functionality (just a warning), so we don't want it to break user code.
307
+ However, if the warning has been configured to be treated as an error (via filterwarnings),
308
+ we should let that propagate.
309
+ """
310
+ from ..config import config
311
+
312
+ if not config.get("async_warnings"):
313
+ return
314
+ try:
315
+ _blocking_in_async_warning(original_func)
316
+ except AsyncUsageWarning:
317
+ # Re-raise the warning if it's been configured as an error
318
+ raise
319
+ except Exception:
320
+ # Silently ignore any other errors in the warning system
321
+ # We don't want the warning mechanism itself to cause problems
322
+ pass
323
+
324
+
325
+ synchronizer = synchronicity.Synchronizer(blocking_in_async_callback=_safe_blocking_in_async_warning)
40
326
 
41
327
 
42
328
  def synchronize_api(obj, target_module=None):
@@ -51,6 +337,10 @@ def synchronize_api(obj, target_module=None):
51
337
  return synchronizer.create_blocking(obj, blocking_name, target_module=target_module)
52
338
 
53
339
 
340
+ # Used for testing to configure the `n_attempts` that `retry` will use.
341
+ RETRY_N_ATTEMPTS_OVERRIDE: Optional[int] = None
342
+
343
+
54
344
  def retry(direct_fn=None, *, n_attempts=3, base_delay=0, delay_factor=2, timeout=90):
55
345
  """Decorator that calls an async function multiple times, with a given timeout.
56
346
 
@@ -75,8 +365,13 @@ def retry(direct_fn=None, *, n_attempts=3, base_delay=0, delay_factor=2, timeout
75
365
  def decorator(fn):
76
366
  @functools.wraps(fn)
77
367
  async def f_wrapped(*args, **kwargs):
368
+ if RETRY_N_ATTEMPTS_OVERRIDE is not None:
369
+ local_n_attempts = RETRY_N_ATTEMPTS_OVERRIDE
370
+ else:
371
+ local_n_attempts = n_attempts
372
+
78
373
  delay = base_delay
79
- for i in range(n_attempts):
374
+ for i in range(local_n_attempts):
80
375
  t0 = time.time()
81
376
  try:
82
377
  return await asyncio.wait_for(fn(*args, **kwargs), timeout=timeout)
@@ -84,12 +379,12 @@ def retry(direct_fn=None, *, n_attempts=3, base_delay=0, delay_factor=2, timeout
84
379
  logger.debug(f"Function {fn} was cancelled")
85
380
  raise
86
381
  except Exception as e:
87
- if i >= n_attempts - 1:
382
+ if i >= local_n_attempts - 1:
88
383
  raise
89
384
  logger.debug(
90
385
  f"Failed invoking function {fn}: {e}"
91
386
  f" (took {time.time() - t0}s, sleeping {delay}s"
92
- f" and trying {n_attempts - i - 1} more times)"
387
+ f" and trying {local_n_attempts - i - 1} more times)"
93
388
  )
94
389
  await asyncio.sleep(delay)
95
390
  delay *= delay_factor
@@ -125,7 +420,8 @@ class TaskContext:
125
420
  _loops: set[asyncio.Task]
126
421
 
127
422
  def __init__(self, grace: Optional[float] = None):
128
- self._grace = grace
423
+ self._grace = grace # grace is the time we want for tasks to finish before cancelling them
424
+ self._cancellation_grace: float = 1.0 # extra graceperiod for the cancellation itself to "bubble up"
129
425
  self._loops = set()
130
426
 
131
427
  async def start(self):
@@ -157,22 +453,29 @@ class TaskContext:
157
453
  # still needs to be handled
158
454
  # (https://stackoverflow.com/a/63356323/2475114)
159
455
  if gather_future:
160
- try:
456
+ with contextlib.suppress(asyncio.CancelledError):
161
457
  await gather_future
162
- except asyncio.CancelledError:
163
- pass
164
458
 
459
+ cancelled_tasks: list[asyncio.Task] = []
165
460
  for task in self._tasks:
166
461
  if task.done() and not task.cancelled():
167
462
  # Raise any exceptions if they happened.
168
463
  # Only tasks without a done_callback will still be present in self._tasks
169
464
  task.result()
170
465
 
171
- if task.done() or task in self._loops: # Note: Legacy code, we can probably cancel loops.
466
+ if task.done():
172
467
  continue
173
468
 
174
469
  # Cancel any remaining unfinished tasks.
175
470
  task.cancel()
471
+ cancelled_tasks.append(task)
472
+
473
+ cancellation_gather = asyncio.gather(*cancelled_tasks, return_exceptions=True)
474
+ try:
475
+ await asyncio.wait_for(cancellation_gather, timeout=self._cancellation_grace)
476
+ except asyncio.TimeoutError:
477
+ warnings.warn(f"Internal warning: Tasks did not cancel in a timely manner: {cancelled_tasks}")
478
+
176
479
  await asyncio.sleep(0) # wake up coroutines waiting for cancellations
177
480
 
178
481
  async def __aexit__(self, exc_type, value, tb):
@@ -370,6 +673,7 @@ class _WarnIfGeneratorIsNotConsumed:
370
673
  self.function_name = function_name
371
674
  self.iterated = False
372
675
  self.warned = False
676
+ self.__wrapped__ = gen
373
677
 
374
678
  def __aiter__(self):
375
679
  self.iterated = True
@@ -878,3 +1182,26 @@ async def async_chain(*generators: AsyncGenerator[T, None]) -> AsyncGenerator[T,
878
1182
  logger.exception(f"Error closing async generator: {e}")
879
1183
  if first_exception is not None:
880
1184
  raise first_exception
1185
+
1186
+
1187
+ def deprecate_aio_usage(deprecation_date: tuple[int, int, int], readable_sync_call: str):
1188
+ # Note: Currently only works on methods, not top level functions
1189
+ def deco(sync_implementation):
1190
+ if isinstance(sync_implementation, classmethod):
1191
+ sync_implementation = sync_implementation.__func__
1192
+ is_classmethod = True
1193
+ else:
1194
+ is_classmethod = False
1195
+
1196
+ async def _async_proxy(*args, **kwargs):
1197
+ deprecation_warning(
1198
+ deprecation_date,
1199
+ f"""The async constructor {readable_sync_call}.aio(...) will be deprecated in a future version of Modal.
1200
+ Please use {readable_sync_call}(...) instead (it doesn't perform any IO, and is safe in async contexts)
1201
+ """,
1202
+ )
1203
+ return sync_implementation(*args, **kwargs)
1204
+
1205
+ return MethodWithAio(sync_implementation, _async_proxy, synchronizer, is_classmethod=is_classmethod)
1206
+
1207
+ return deco
@@ -9,7 +9,6 @@ from typing import Any
9
9
  from modal.exception import ExecutionError
10
10
  from modal_proto import api_pb2, modal_api_grpc
11
11
 
12
- from .grpc_utils import retry_transient_errors
13
12
  from .logger import logger
14
13
 
15
14
 
@@ -66,9 +65,7 @@ class _AuthTokenManager:
66
65
  # new token. Once we have a new token, the other coroutines will unblock and return from here.
67
66
  if self._token and not self._needs_refresh():
68
67
  return
69
- resp: api_pb2.AuthTokenGetResponse = await retry_transient_errors(
70
- self._stub.AuthTokenGet, api_pb2.AuthTokenGetRequest()
71
- )
68
+ resp: api_pb2.AuthTokenGetResponse = await self._stub.AuthTokenGet(api_pb2.AuthTokenGetRequest())
72
69
  if not resp.token:
73
70
  # Not expected
74
71
  raise ExecutionError(
@@ -4,7 +4,6 @@ import dataclasses
4
4
  import hashlib
5
5
  import os
6
6
  import platform
7
- import random
8
7
  import time
9
8
  from collections.abc import AsyncIterator
10
9
  from contextlib import AbstractContextManager, contextmanager
@@ -27,7 +26,6 @@ from modal_proto.modal_api_grpc import ModalClientModal
27
26
 
28
27
  from ..exception import ExecutionError
29
28
  from .async_utils import TaskContext, retry
30
- from .grpc_utils import retry_transient_errors
31
29
  from .hash_utils import UploadHashes, get_upload_hashes
32
30
  from .http_utils import ClientSessionRegistry
33
31
  from .logger import logger
@@ -59,10 +57,8 @@ MULTIPART_UPLOAD_THRESHOLD = 1024**3
59
57
  # For block based storage like volumefs2: the size of a block
60
58
  BLOCK_SIZE: int = 8 * 1024 * 1024
61
59
 
62
- HEALTHY_R2_UPLOAD_PERCENTAGE = 0.95
63
60
 
64
-
65
- @retry(n_attempts=5, base_delay=0.5, timeout=None)
61
+ @retry(n_attempts=3, base_delay=0.3, timeout=None)
66
62
  async def _upload_to_s3_url(
67
63
  upload_url,
68
64
  payload: "BytesIOSegmentPayload",
@@ -153,12 +149,13 @@ async def perform_multipart_upload(
153
149
  part_etags = await TaskContext.gather(*upload_coros)
154
150
 
155
151
  # The body of the complete_multipart_upload command needs some data in xml format:
156
- completion_body = "<CompleteMultipartUpload>\n"
152
+ completion_parts = ["<CompleteMultipartUpload>"]
157
153
  for part_number, etag in enumerate(part_etags, 1):
158
- completion_body += f"""<Part>\n<PartNumber>{part_number}</PartNumber>\n<ETag>"{etag}"</ETag>\n</Part>\n"""
159
- completion_body += "</CompleteMultipartUpload>"
154
+ completion_parts.append(f"""<Part>\n<PartNumber>{part_number}</PartNumber>\n<ETag>"{etag}"</ETag>\n</Part>""")
155
+ completion_parts.append("</CompleteMultipartUpload>")
156
+ completion_body = "\n".join(completion_parts)
160
157
 
161
- # etag of combined object should be md5 hex of concatendated md5 *bytes* from parts + `-{num_parts}`
158
+ # etag of combined object should be md5 hex of concatenated md5 *bytes* from parts + `-{num_parts}`
162
159
  bin_hash_parts = [bytes.fromhex(etag) for etag in part_etags]
163
160
 
164
161
  expected_multipart_etag = hashlib.md5(b"".join(bin_hash_parts)).hexdigest() + f"-{len(part_etags)}"
@@ -191,13 +188,10 @@ def get_content_length(data: BinaryIO) -> int:
191
188
  async def _blob_upload_with_fallback(
192
189
  items, blob_ids: list[str], callback, content_length: int
193
190
  ) -> tuple[str, bool, int]:
191
+ """Try uploading to each provider in order, with fallback on failure."""
194
192
  r2_throughput_bytes_s = 0
195
193
  r2_failed = False
196
194
  for idx, (item, blob_id) in enumerate(zip(items, blob_ids)):
197
- # We want to default to R2 95% of the time and S3 5% of the time.
198
- # To ensure the failure path is continuously exercised.
199
- if idx == 0 and len(items) > 1 and random.random() > HEALTHY_R2_UPLOAD_PERCENTAGE:
200
- continue
201
195
  try:
202
196
  if blob_id.endswith(":r2"):
203
197
  t0 = time.monotonic_ns()
@@ -207,7 +201,7 @@ async def _blob_upload_with_fallback(
207
201
  else:
208
202
  await callback(item)
209
203
  return blob_id, r2_failed, r2_throughput_bytes_s
210
- except Exception as _:
204
+ except Exception:
211
205
  if blob_id.endswith(":r2"):
212
206
  r2_failed = True
213
207
  # Ignore all errors except the last one, since we're out of fallback options.
@@ -229,7 +223,7 @@ async def _blob_upload(
229
223
  content_sha256_base64=upload_hashes.sha256_base64,
230
224
  content_length=content_length,
231
225
  )
232
- resp = await retry_transient_errors(stub.BlobCreate, req)
226
+ resp = await stub.BlobCreate(req)
233
227
 
234
228
  if resp.WhichOneof("upload_types_oneof") == "multiparts":
235
229
 
@@ -335,7 +329,7 @@ async def blob_download(blob_id: str, stub: ModalClientModal) -> bytes:
335
329
  logger.debug(f"Downloading large blob {blob_id}")
336
330
  t0 = time.time()
337
331
  req = api_pb2.BlobGetRequest(blob_id=blob_id)
338
- resp = await retry_transient_errors(stub.BlobGet, req)
332
+ resp = await stub.BlobGet(req)
339
333
  data = await _download_from_url(resp.download_url)
340
334
  size_mib = len(data) / 1024 / 1024
341
335
  dur_s = max(time.time() - t0, 0.001) # avoid division by zero
@@ -348,7 +342,7 @@ async def blob_download(blob_id: str, stub: ModalClientModal) -> bytes:
348
342
 
349
343
  async def blob_iter(blob_id: str, stub: ModalClientModal) -> AsyncIterator[bytes]:
350
344
  req = api_pb2.BlobGetRequest(blob_id=blob_id)
351
- resp = await retry_transient_errors(stub.BlobGet, req)
345
+ resp = await stub.BlobGet(req)
352
346
  download_url = resp.download_url
353
347
  async with ClientSessionRegistry.get_session().get(download_url) as s3_resp:
354
348
  # S3 signal to slow down request rate.
@@ -372,11 +366,17 @@ class FileUploadSpec:
372
366
  mount_filename: str
373
367
 
374
368
  use_blob: bool
375
- content: Optional[bytes] # typically None if using blob, required otherwise
376
369
  sha256_hex: str
377
370
  md5_hex: str
378
371
  mode: int # file permission bits (last 12 bits of st_mode)
379
372
  size: int
373
+ content: Optional[bytes] = None # Set for very small files to avoid double-read
374
+
375
+ def read_content(self) -> bytes:
376
+ """Read content from source."""
377
+ with self.source() as fp:
378
+ fp.seek(0)
379
+ return fp.read()
380
380
 
381
381
 
382
382
  def _get_file_upload_spec(
@@ -385,6 +385,7 @@ def _get_file_upload_spec(
385
385
  mount_filename: PurePosixPath,
386
386
  mode: int,
387
387
  ) -> FileUploadSpec:
388
+ content = None
388
389
  with source() as fp:
389
390
  # Current position is ignored - we always upload from position 0
390
391
  fp.seek(0, os.SEEK_END)
@@ -395,12 +396,18 @@ def _get_file_upload_spec(
395
396
  # TODO(dano): remove the placeholder md5 once we stop requiring md5 for blobs
396
397
  md5_hex = "baadbaadbaadbaadbaadbaadbaadbaad" if size > MULTIPART_UPLOAD_THRESHOLD else None
397
398
  use_blob = True
398
- content = None
399
399
  hashes = get_upload_hashes(fp, md5_hex=md5_hex)
400
400
  else:
401
401
  use_blob = False
402
- content = fp.read()
403
- hashes = get_upload_hashes(content)
402
+ # For very small files (< 256 KiB), read content once and cache it
403
+ # This avoids double-read penalty while limiting memory usage
404
+ if size < 256 * 1024: # 256 KiB threshold
405
+ fp.seek(0)
406
+ content = fp.read()
407
+ hashes = get_upload_hashes(content)
408
+ else:
409
+ # For medium files (256 KiB - 4 MiB), compute hashes without caching content
410
+ hashes = get_upload_hashes(fp)
404
411
 
405
412
  return FileUploadSpec(
406
413
  source=source,
@@ -408,11 +415,11 @@ def _get_file_upload_spec(
408
415
  source_is_path=isinstance(source_description, Path),
409
416
  mount_filename=mount_filename.as_posix(),
410
417
  use_blob=use_blob,
411
- content=content,
412
418
  sha256_hex=hashes.sha256_hex(),
413
419
  md5_hex=hashes.md5_hex(),
414
420
  mode=mode & 0o7777,
415
421
  size=size,
422
+ content=content,
416
423
  )
417
424
 
418
425