modal 1.1.4.dev16__py3-none-any.whl → 1.1.4.dev17__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- modal/client.pyi +2 -2
- modal/experimental/flash.py +33 -12
- modal/functions.pyi +6 -6
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/METADATA +1 -1
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/RECORD +10 -10
- modal_version/__init__.py +1 -1
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/WHEEL +0 -0
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/entry_points.txt +0 -0
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/licenses/LICENSE +0 -0
- {modal-1.1.4.dev16.dist-info → modal-1.1.4.dev17.dist-info}/top_level.txt +0 -0
modal/client.pyi
CHANGED
@@ -33,7 +33,7 @@ class _Client:
|
|
33
33
|
server_url: str,
|
34
34
|
client_type: int,
|
35
35
|
credentials: typing.Optional[tuple[str, str]],
|
36
|
-
version: str = "1.1.4.dev16",
|
36
|
+
version: str = "1.1.4.dev17",
|
37
37
|
):
|
38
38
|
"""mdmd:hidden
|
39
39
|
The Modal client object is not intended to be instantiated directly by users.
|
@@ -164,7 +164,7 @@ class Client:
|
|
164
164
|
server_url: str,
|
165
165
|
client_type: int,
|
166
166
|
credentials: typing.Optional[tuple[str, str]],
|
167
|
-
version: str = "1.1.4.dev16",
|
167
|
+
version: str = "1.1.4.dev17",
|
168
168
|
):
|
169
169
|
"""mdmd:hidden
|
170
170
|
The Modal client object is not intended to be instantiated directly by users.
|
modal/experimental/flash.py
CHANGED
@@ -213,8 +213,8 @@ class _FlashPrometheusAutoscaler:
|
|
213
213
|
)
|
214
214
|
|
215
215
|
logger.warning(
|
216
|
-
f"[Modal Flash] Scaling to {actual_target_containers} containers. Autoscaling decision "
|
217
|
-
f"made in {time.time() - autoscaling_time} seconds."
|
216
|
+
f"[Modal Flash] Scaling to {actual_target_containers=} containers. "
|
217
|
+
f" Autoscaling decision made in {time.time() - autoscaling_time} seconds."
|
218
218
|
)
|
219
219
|
|
220
220
|
await self.autoscaling_decisions_dict.put(
|
@@ -223,9 +223,7 @@ class _FlashPrometheusAutoscaler:
|
|
223
223
|
)
|
224
224
|
await self.autoscaling_decisions_dict.put("current_replicas", actual_target_containers)
|
225
225
|
|
226
|
-
await self.cls.update_autoscaler(
|
227
|
-
min_containers=actual_target_containers,
|
228
|
-
)
|
226
|
+
await self.cls.update_autoscaler(min_containers=actual_target_containers)
|
229
227
|
|
230
228
|
if time.time() - autoscaling_time < self.autoscaling_interval_seconds:
|
231
229
|
await asyncio.sleep(self.autoscaling_interval_seconds - (time.time() - autoscaling_time))
|
@@ -239,6 +237,8 @@ class _FlashPrometheusAutoscaler:
|
|
239
237
|
await asyncio.sleep(self.autoscaling_interval_seconds)
|
240
238
|
|
241
239
|
async def _compute_target_containers(self, current_replicas: int) -> int:
|
240
|
+
# current_replicas is the number of live containers + cold starting containers (not yet live)
|
241
|
+
# containers is the number of live containers that are registered in flash dns
|
242
242
|
containers = await self._get_all_containers()
|
243
243
|
if len(containers) > current_replicas:
|
244
244
|
logger.info(
|
@@ -271,11 +271,17 @@ class _FlashPrometheusAutoscaler:
|
|
271
271
|
sum_metric += container_metrics[target_metric][0].value
|
272
272
|
containers_with_metrics += 1
|
273
273
|
|
274
|
+
# n_containers_missing_metric is the number of unhealthy containers + number of cold starting containers
|
274
275
|
n_containers_missing_metric = current_replicas - containers_with_metrics
|
276
|
+
# n_containers_unhealthy is the number of live containers that are not emitting metrics i.e. unhealthy
|
277
|
+
n_containers_unhealthy = len(containers) - containers_with_metrics
|
278
|
+
|
279
|
+
# Scale up assuming that every unhealthy container is at 2x the target metric value.
|
280
|
+
scale_up_target_metric_value = (sum_metric + n_containers_unhealthy * target_metric_value) / (
|
281
|
+
(containers_with_metrics + n_containers_unhealthy) or 1
|
282
|
+
)
|
275
283
|
|
276
|
-
# Scale
|
277
|
-
# value of the metric when scaling up and the maximum value of the metric when scaling down.
|
278
|
-
scale_up_target_metric_value = sum_metric / (containers_with_metrics or 1)
|
284
|
+
# Scale down assuming that every container (including cold starting containers) are at the target metric value.
|
279
285
|
scale_down_target_metric_value = (
|
280
286
|
sum_metric + n_containers_missing_metric * target_metric_value
|
281
287
|
) / current_replicas
|
@@ -290,9 +296,14 @@ class _FlashPrometheusAutoscaler:
|
|
290
296
|
desired_replicas = math.ceil(current_replicas * scale_down_ratio)
|
291
297
|
|
292
298
|
logger.warning(
|
293
|
-
f"[Modal Flash] Current replicas: {current_replicas},
|
294
|
-
f"
|
295
|
-
f"
|
299
|
+
f"[Modal Flash] Current replicas: {current_replicas}, "
|
300
|
+
f"target metric value: {target_metric_value}, "
|
301
|
+
f"current sum of metric values: {sum_metric}, "
|
302
|
+
f"number of containers with metrics: {containers_with_metrics}, "
|
303
|
+
f"number of containers unhealthy: {n_containers_unhealthy}, "
|
304
|
+
f"number of containers missing metric (includes unhealthy): {n_containers_missing_metric}, "
|
305
|
+
f"scale up ratio: {scale_up_ratio}, "
|
306
|
+
f"scale down ratio: {scale_down_ratio}, "
|
296
307
|
f"desired replicas: {desired_replicas}"
|
297
308
|
)
|
298
309
|
|
@@ -312,9 +323,19 @@ class _FlashPrometheusAutoscaler:
|
|
312
323
|
logger.warning(f"[Modal Flash] Error getting metrics from {url}: {e}")
|
313
324
|
return None
|
314
325
|
|
326
|
+
# Read body with timeout/error handling and parse Prometheus metrics
|
327
|
+
try:
|
328
|
+
text_body = await response.text()
|
329
|
+
except asyncio.TimeoutError:
|
330
|
+
logger.warning(f"[Modal Flash] Timeout reading metrics body from {url}")
|
331
|
+
return None
|
332
|
+
except Exception as e:
|
333
|
+
logger.warning(f"[Modal Flash] Error reading metrics body from {url}: {e}")
|
334
|
+
return None
|
335
|
+
|
315
336
|
# Parse the text-based Prometheus metrics format
|
316
337
|
metrics: dict[str, list[Sample]] = defaultdict(list)
|
317
|
-
for family in text_string_to_metric_families(await response.text()):
|
338
|
+
for family in text_string_to_metric_families(text_body):
|
318
339
|
for sample in family.samples:
|
319
340
|
metrics[sample.name] += [sample]
|
320
341
|
|
modal/functions.pyi
CHANGED
@@ -433,7 +433,7 @@ class Function(
|
|
433
433
|
|
434
434
|
_call_generator: ___call_generator_spec[typing_extensions.Self]
|
435
435
|
|
436
|
-
class __remote_spec(typing_extensions.Protocol[
|
436
|
+
class __remote_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
|
437
437
|
def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> ReturnType_INNER:
|
438
438
|
"""Calls the function remotely, executing it with the given arguments and returning the execution's result."""
|
439
439
|
...
|
@@ -442,7 +442,7 @@ class Function(
|
|
442
442
|
"""Calls the function remotely, executing it with the given arguments and returning the execution's result."""
|
443
443
|
...
|
444
444
|
|
445
|
-
remote: __remote_spec[modal._functions.
|
445
|
+
remote: __remote_spec[modal._functions.P, modal._functions.ReturnType, typing_extensions.Self]
|
446
446
|
|
447
447
|
class __remote_gen_spec(typing_extensions.Protocol[SUPERSELF]):
|
448
448
|
def __call__(self, /, *args, **kwargs) -> typing.Generator[typing.Any, None, None]:
|
@@ -469,7 +469,7 @@ class Function(
|
|
469
469
|
"""
|
470
470
|
...
|
471
471
|
|
472
|
-
class ___experimental_spawn_spec(typing_extensions.Protocol[
|
472
|
+
class ___experimental_spawn_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
|
473
473
|
def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> FunctionCall[ReturnType_INNER]:
|
474
474
|
"""[Experimental] Calls the function with the given arguments, without waiting for the results.
|
475
475
|
|
@@ -493,7 +493,7 @@ class Function(
|
|
493
493
|
...
|
494
494
|
|
495
495
|
_experimental_spawn: ___experimental_spawn_spec[
|
496
|
-
modal._functions.
|
496
|
+
modal._functions.P, modal._functions.ReturnType, typing_extensions.Self
|
497
497
|
]
|
498
498
|
|
499
499
|
class ___spawn_map_inner_spec(typing_extensions.Protocol[P_INNER, SUPERSELF]):
|
@@ -502,7 +502,7 @@ class Function(
|
|
502
502
|
|
503
503
|
_spawn_map_inner: ___spawn_map_inner_spec[modal._functions.P, typing_extensions.Self]
|
504
504
|
|
505
|
-
class __spawn_spec(typing_extensions.Protocol[
|
505
|
+
class __spawn_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
|
506
506
|
def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> FunctionCall[ReturnType_INNER]:
|
507
507
|
"""Calls the function with the given arguments, without waiting for the results.
|
508
508
|
|
@@ -523,7 +523,7 @@ class Function(
|
|
523
523
|
"""
|
524
524
|
...
|
525
525
|
|
526
|
-
spawn: __spawn_spec[modal._functions.
|
526
|
+
spawn: __spawn_spec[modal._functions.P, modal._functions.ReturnType, typing_extensions.Self]
|
527
527
|
|
528
528
|
def get_raw_f(self) -> collections.abc.Callable[..., typing.Any]:
|
529
529
|
"""Return the inner Python object wrapped by this Modal Function."""
|
@@ -22,7 +22,7 @@ modal/app.py,sha256=hJU3DGzP5GwYRmBj57XajljkQtLxkKftxXih2TYRcKo,48047
|
|
22
22
|
modal/app.pyi,sha256=0U2xVKD3yfHe5l2bcihTDjPl__tzOvx1AIYOTebu-5o,43375
|
23
23
|
modal/call_graph.py,sha256=1g2DGcMIJvRy-xKicuf63IVE98gJSnQsr8R_NVMptNc,2581
|
24
24
|
modal/client.py,sha256=kyAIVB3Ay-XKJizQ_1ufUFB__EagV0MLmHJpyYyJ7J0,18636
|
25
|
-
modal/client.pyi,sha256=
|
25
|
+
modal/client.pyi,sha256=lxLNas06tmdopgkHnv71sy6XFQF5iYnRYkW7QoveobU,15831
|
26
26
|
modal/cloud_bucket_mount.py,sha256=YOe9nnvSr4ZbeCn587d7_VhE9IioZYRvF9VYQTQux08,5914
|
27
27
|
modal/cloud_bucket_mount.pyi,sha256=-qSfYAQvIoO_l2wsCCGTG5ZUwQieNKXdAO00yP1-LYU,7394
|
28
28
|
modal/cls.py,sha256=1mBcExFrLDTZwkD3Dzu8F26_CL0CGktOV9pE60Y8g_E,40689
|
@@ -39,7 +39,7 @@ modal/file_io.py,sha256=OSKr77TujcXGJW1iikzYiHckLSmv07QBgBHcxxYEkoI,21456
|
|
39
39
|
modal/file_io.pyi,sha256=xtO6Glf_BFwDE7QiQQo24QqcMf_Vv-iz7WojcGVlLBU,15932
|
40
40
|
modal/file_pattern_matcher.py,sha256=A_Kdkej6q7YQyhM_2-BvpFmPqJ0oHb54B6yf9VqvPVE,8116
|
41
41
|
modal/functions.py,sha256=kcNHvqeGBxPI7Cgd57NIBBghkfbeFJzXO44WW0jSmao,325
|
42
|
-
modal/functions.pyi,sha256=
|
42
|
+
modal/functions.pyi,sha256=h1oPAvbErW_i1Glzf_HsQenG-uH4KZk7X6razFbif6M,38890
|
43
43
|
modal/gpu.py,sha256=Fe5ORvVPDIstSq1xjmM6OoNgLYFWvogP9r5BgmD3hYg,6769
|
44
44
|
modal/image.py,sha256=nXN9k_6gApHFy8-Bk_XT2Zu3jsDsGVrC3QcuiDC4yRY,103543
|
45
45
|
modal/image.pyi,sha256=vKdb5PpYM8wcpq9PQegeVMjrPLzAipuV4q994NZiL84,69325
|
@@ -150,10 +150,10 @@ modal/cli/programs/run_jupyter.py,sha256=44Lpvqk2l3hH-uOkmAOzw60NEsfB5uaRDWDKVsh
|
|
150
150
|
modal/cli/programs/run_marimo.py,sha256=HyZ2za0NYqg31-mGxFQxUIAJ3Q-jRaMocEwWwI5-cdw,2887
|
151
151
|
modal/cli/programs/vscode.py,sha256=KbTAaIXyQBVCDXxXjmBHmKpgXkUw0q4R4KkJvUjCYgk,3380
|
152
152
|
modal/experimental/__init__.py,sha256=dPBPpxsmjZMLF3YjRrXoTvT01pl65wxi4UdFZsOem3w,15082
|
153
|
-
modal/experimental/flash.py,sha256=
|
153
|
+
modal/experimental/flash.py,sha256=gydlThBSPgS8HA53Lwi0gUAFVtpdXu20IYAQXJSoTP0,21092
|
154
154
|
modal/experimental/flash.pyi,sha256=A8_qJGtGoXEzKDdHbvhmCw7oqfneFEvJQK3ZdTOvUdU,10830
|
155
155
|
modal/experimental/ipython.py,sha256=TrCfmol9LGsRZMeDoeMPx3Hv3BFqQhYnmD_iH0pqdhk,2904
|
156
|
-
modal-1.1.4.dev16.dist-info/licenses/LICENSE,sha256=psuoW8kuDP96RQsdhzwOqi6fyWv0ct8CR6Jr7He_P_k,10173
|
156
|
+
modal-1.1.4.dev17.dist-info/licenses/LICENSE,sha256=psuoW8kuDP96RQsdhzwOqi6fyWv0ct8CR6Jr7He_P_k,10173
|
157
157
|
modal_docs/__init__.py,sha256=svYKtV8HDwDCN86zbdWqyq5T8sMdGDj0PVlzc2tIxDM,28
|
158
158
|
modal_docs/gen_cli_docs.py,sha256=c1yfBS_x--gL5bs0N4ihMwqwX8l3IBWSkBAKNNIi6bQ,3801
|
159
159
|
modal_docs/gen_reference_docs.py,sha256=d_CQUGQ0rfw28u75I2mov9AlS773z9rG40-yq5o7g2U,6359
|
@@ -176,10 +176,10 @@ modal_proto/options_pb2.pyi,sha256=l7DBrbLO7q3Ir-XDkWsajm0d0TQqqrfuX54i4BMpdQg,1
|
|
176
176
|
modal_proto/options_pb2_grpc.py,sha256=1oboBPFxaTEXt9Aw7EAj8gXHDCNMhZD2VXqocC9l_gk,159
|
177
177
|
modal_proto/options_pb2_grpc.pyi,sha256=CImmhxHsYnF09iENPoe8S4J-n93jtgUYD2JPAc0yJSI,247
|
178
178
|
modal_proto/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
179
|
-
modal_version/__init__.py,sha256=
|
179
|
+
modal_version/__init__.py,sha256=N2wz9sFgRKKg4OHYFwU3AVZM3zIM6izEe5fPZoeS-LU,121
|
180
180
|
modal_version/__main__.py,sha256=2FO0yYQQwDTh6udt1h-cBnGd1c4ZyHnHSI4BksxzVac,105
|
181
|
-
modal-1.1.4.
|
182
|
-
modal-1.1.4.dev16.dist-info/WHEEL,sha256=1tXe9gY0PYatrMPMDd6jXqjfpz_B-Wqm32CPfRC58XU,91
|
183
|
-
modal-1.1.4.dev16.dist-info/entry_points.txt,sha256=An-wYgeEUnm6xzrAP9_NTSTSciYvvEWsMZILtYrvpAI,46
|
184
|
-
modal-1.1.4.dev16.dist-info/top_level.txt,sha256=4BWzoKYREKUZ5iyPzZpjqx4G8uB5TWxXPDwibLcVa7k,43
|
185
|
-
modal-1.1.4.dev16.dist-info/RECORD,,
|
181
|
+
modal-1.1.4.dev17.dist-info/METADATA,sha256=otNiNfsuOjyFRzVqMRsj9VBaXbc62iXHds0Hoee0L_4,2460
|
182
|
+
modal-1.1.4.dev17.dist-info/WHEEL,sha256=1tXe9gY0PYatrMPMDd6jXqjfpz_B-Wqm32CPfRC58XU,91
|
183
|
+
modal-1.1.4.dev17.dist-info/entry_points.txt,sha256=An-wYgeEUnm6xzrAP9_NTSTSciYvvEWsMZILtYrvpAI,46
|
184
|
+
modal-1.1.4.dev17.dist-info/top_level.txt,sha256=4BWzoKYREKUZ5iyPzZpjqx4G8uB5TWxXPDwibLcVa7k,43
|
185
|
+
modal-1.1.4.dev17.dist-info/RECORD,,
|
modal_version/__init__.py
CHANGED
File without changes
|
File without changes
|
File without changes
|
File without changes
|