modal 1.1.4.dev16__py3-none-any.whl → 1.1.4.dev17__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
modal/client.pyi CHANGED
@@ -33,7 +33,7 @@ class _Client:
33
33
  server_url: str,
34
34
  client_type: int,
35
35
  credentials: typing.Optional[tuple[str, str]],
36
- version: str = "1.1.4.dev16",
36
+ version: str = "1.1.4.dev17",
37
37
  ):
38
38
  """mdmd:hidden
39
39
  The Modal client object is not intended to be instantiated directly by users.
@@ -164,7 +164,7 @@ class Client:
164
164
  server_url: str,
165
165
  client_type: int,
166
166
  credentials: typing.Optional[tuple[str, str]],
167
- version: str = "1.1.4.dev16",
167
+ version: str = "1.1.4.dev17",
168
168
  ):
169
169
  """mdmd:hidden
170
170
  The Modal client object is not intended to be instantiated directly by users.
@@ -213,8 +213,8 @@ class _FlashPrometheusAutoscaler:
213
213
  )
214
214
 
215
215
  logger.warning(
216
- f"[Modal Flash] Scaling to {actual_target_containers} containers. Autoscaling decision "
217
- f"made in {time.time() - autoscaling_time} seconds."
216
+ f"[Modal Flash] Scaling to {actual_target_containers=} containers. "
217
+ f" Autoscaling decision made in {time.time() - autoscaling_time} seconds."
218
218
  )
219
219
 
220
220
  await self.autoscaling_decisions_dict.put(
@@ -223,9 +223,7 @@ class _FlashPrometheusAutoscaler:
223
223
  )
224
224
  await self.autoscaling_decisions_dict.put("current_replicas", actual_target_containers)
225
225
 
226
- await self.cls.update_autoscaler(
227
- min_containers=actual_target_containers,
228
- )
226
+ await self.cls.update_autoscaler(min_containers=actual_target_containers)
229
227
 
230
228
  if time.time() - autoscaling_time < self.autoscaling_interval_seconds:
231
229
  await asyncio.sleep(self.autoscaling_interval_seconds - (time.time() - autoscaling_time))
@@ -239,6 +237,8 @@ class _FlashPrometheusAutoscaler:
239
237
  await asyncio.sleep(self.autoscaling_interval_seconds)
240
238
 
241
239
  async def _compute_target_containers(self, current_replicas: int) -> int:
240
+ # current_replicas is the number of live containers + cold starting containers (not yet live)
241
+ # containers is the number of live containers that are registered in flash dns
242
242
  containers = await self._get_all_containers()
243
243
  if len(containers) > current_replicas:
244
244
  logger.info(
@@ -271,11 +271,17 @@ class _FlashPrometheusAutoscaler:
271
271
  sum_metric += container_metrics[target_metric][0].value
272
272
  containers_with_metrics += 1
273
273
 
274
+ # n_containers_missing_metric is the number of unhealthy containers + number of cold starting containers
274
275
  n_containers_missing_metric = current_replicas - containers_with_metrics
276
+ # n_containers_unhealthy is the number of live containers that are not emitting metrics i.e. unhealthy
277
+ n_containers_unhealthy = len(containers) - containers_with_metrics
278
+
279
+ # Scale up assuming that every unhealthy container is at the target metric value.
280
+ scale_up_target_metric_value = (sum_metric + n_containers_unhealthy * target_metric_value) / (
281
+ (containers_with_metrics + n_containers_unhealthy) or 1
282
+ )
275
283
 
276
- # Scale up / down conservatively: Any container that is missing the metric is assumed to be at the minimum
277
- # value of the metric when scaling up and the maximum value of the metric when scaling down.
278
- scale_up_target_metric_value = sum_metric / (containers_with_metrics or 1)
284
+ # Scale down assuming that every container missing the metric (including cold starting containers) is at the target metric value.
279
285
  scale_down_target_metric_value = (
280
286
  sum_metric + n_containers_missing_metric * target_metric_value
281
287
  ) / current_replicas
@@ -290,9 +296,14 @@ class _FlashPrometheusAutoscaler:
290
296
  desired_replicas = math.ceil(current_replicas * scale_down_ratio)
291
297
 
292
298
  logger.warning(
293
- f"[Modal Flash] Current replicas: {current_replicas}, target metric value: {target_metric_value}, "
294
- f"current sum of metric values: {sum_metric}, number of containers missing metric: "
295
- f"{n_containers_missing_metric}, scale up ratio: {scale_up_ratio}, scale down ratio: {scale_down_ratio}, "
299
+ f"[Modal Flash] Current replicas: {current_replicas}, "
300
+ f"target metric value: {target_metric_value}, "
301
+ f"current sum of metric values: {sum_metric}, "
302
+ f"number of containers with metrics: {containers_with_metrics}, "
303
+ f"number of containers unhealthy: {n_containers_unhealthy}, "
304
+ f"number of containers missing metric (includes unhealthy): {n_containers_missing_metric}, "
305
+ f"scale up ratio: {scale_up_ratio}, "
306
+ f"scale down ratio: {scale_down_ratio}, "
296
307
  f"desired replicas: {desired_replicas}"
297
308
  )
298
309
 
@@ -312,9 +323,19 @@ class _FlashPrometheusAutoscaler:
312
323
  logger.warning(f"[Modal Flash] Error getting metrics from {url}: {e}")
313
324
  return None
314
325
 
326
+ # Read body with timeout/error handling and parse Prometheus metrics
327
+ try:
328
+ text_body = await response.text()
329
+ except asyncio.TimeoutError:
330
+ logger.warning(f"[Modal Flash] Timeout reading metrics body from {url}")
331
+ return None
332
+ except Exception as e:
333
+ logger.warning(f"[Modal Flash] Error reading metrics body from {url}: {e}")
334
+ return None
335
+
315
336
  # Parse the text-based Prometheus metrics format
316
337
  metrics: dict[str, list[Sample]] = defaultdict(list)
317
- for family in text_string_to_metric_families(await response.text()):
338
+ for family in text_string_to_metric_families(text_body):
318
339
  for sample in family.samples:
319
340
  metrics[sample.name] += [sample]
320
341
 
modal/functions.pyi CHANGED
@@ -433,7 +433,7 @@ class Function(
433
433
 
434
434
  _call_generator: ___call_generator_spec[typing_extensions.Self]
435
435
 
436
- class __remote_spec(typing_extensions.Protocol[ReturnType_INNER, P_INNER, SUPERSELF]):
436
+ class __remote_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
437
437
  def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> ReturnType_INNER:
438
438
  """Calls the function remotely, executing it with the given arguments and returning the execution's result."""
439
439
  ...
@@ -442,7 +442,7 @@ class Function(
442
442
  """Calls the function remotely, executing it with the given arguments and returning the execution's result."""
443
443
  ...
444
444
 
445
- remote: __remote_spec[modal._functions.ReturnType, modal._functions.P, typing_extensions.Self]
445
+ remote: __remote_spec[modal._functions.P, modal._functions.ReturnType, typing_extensions.Self]
446
446
 
447
447
  class __remote_gen_spec(typing_extensions.Protocol[SUPERSELF]):
448
448
  def __call__(self, /, *args, **kwargs) -> typing.Generator[typing.Any, None, None]:
@@ -469,7 +469,7 @@ class Function(
469
469
  """
470
470
  ...
471
471
 
472
- class ___experimental_spawn_spec(typing_extensions.Protocol[ReturnType_INNER, P_INNER, SUPERSELF]):
472
+ class ___experimental_spawn_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
473
473
  def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> FunctionCall[ReturnType_INNER]:
474
474
  """[Experimental] Calls the function with the given arguments, without waiting for the results.
475
475
 
@@ -493,7 +493,7 @@ class Function(
493
493
  ...
494
494
 
495
495
  _experimental_spawn: ___experimental_spawn_spec[
496
- modal._functions.ReturnType, modal._functions.P, typing_extensions.Self
496
+ modal._functions.P, modal._functions.ReturnType, typing_extensions.Self
497
497
  ]
498
498
 
499
499
  class ___spawn_map_inner_spec(typing_extensions.Protocol[P_INNER, SUPERSELF]):
@@ -502,7 +502,7 @@ class Function(
502
502
 
503
503
  _spawn_map_inner: ___spawn_map_inner_spec[modal._functions.P, typing_extensions.Self]
504
504
 
505
- class __spawn_spec(typing_extensions.Protocol[ReturnType_INNER, P_INNER, SUPERSELF]):
505
+ class __spawn_spec(typing_extensions.Protocol[P_INNER, ReturnType_INNER, SUPERSELF]):
506
506
  def __call__(self, /, *args: P_INNER.args, **kwargs: P_INNER.kwargs) -> FunctionCall[ReturnType_INNER]:
507
507
  """Calls the function with the given arguments, without waiting for the results.
508
508
 
@@ -523,7 +523,7 @@ class Function(
523
523
  """
524
524
  ...
525
525
 
526
- spawn: __spawn_spec[modal._functions.ReturnType, modal._functions.P, typing_extensions.Self]
526
+ spawn: __spawn_spec[modal._functions.P, modal._functions.ReturnType, typing_extensions.Self]
527
527
 
528
528
  def get_raw_f(self) -> collections.abc.Callable[..., typing.Any]:
529
529
  """Return the inner Python object wrapped by this Modal Function."""
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: modal
3
- Version: 1.1.4.dev16
3
+ Version: 1.1.4.dev17
4
4
  Summary: Python client library for Modal
5
5
  Author-email: Modal Labs <support@modal.com>
6
6
  License: Apache-2.0
@@ -22,7 +22,7 @@ modal/app.py,sha256=hJU3DGzP5GwYRmBj57XajljkQtLxkKftxXih2TYRcKo,48047
22
22
  modal/app.pyi,sha256=0U2xVKD3yfHe5l2bcihTDjPl__tzOvx1AIYOTebu-5o,43375
23
23
  modal/call_graph.py,sha256=1g2DGcMIJvRy-xKicuf63IVE98gJSnQsr8R_NVMptNc,2581
24
24
  modal/client.py,sha256=kyAIVB3Ay-XKJizQ_1ufUFB__EagV0MLmHJpyYyJ7J0,18636
25
- modal/client.pyi,sha256=oevgdxlsUFTyEK2NVmRDzB75uqZcOZrIFZEYQRJAmAg,15831
25
+ modal/client.pyi,sha256=lxLNas06tmdopgkHnv71sy6XFQF5iYnRYkW7QoveobU,15831
26
26
  modal/cloud_bucket_mount.py,sha256=YOe9nnvSr4ZbeCn587d7_VhE9IioZYRvF9VYQTQux08,5914
27
27
  modal/cloud_bucket_mount.pyi,sha256=-qSfYAQvIoO_l2wsCCGTG5ZUwQieNKXdAO00yP1-LYU,7394
28
28
  modal/cls.py,sha256=1mBcExFrLDTZwkD3Dzu8F26_CL0CGktOV9pE60Y8g_E,40689
@@ -39,7 +39,7 @@ modal/file_io.py,sha256=OSKr77TujcXGJW1iikzYiHckLSmv07QBgBHcxxYEkoI,21456
39
39
  modal/file_io.pyi,sha256=xtO6Glf_BFwDE7QiQQo24QqcMf_Vv-iz7WojcGVlLBU,15932
40
40
  modal/file_pattern_matcher.py,sha256=A_Kdkej6q7YQyhM_2-BvpFmPqJ0oHb54B6yf9VqvPVE,8116
41
41
  modal/functions.py,sha256=kcNHvqeGBxPI7Cgd57NIBBghkfbeFJzXO44WW0jSmao,325
42
- modal/functions.pyi,sha256=vXmQ5-tlrxSV8E8eI0yEF2HUeF0Bd6VyQVxMCW3SpBE,38890
42
+ modal/functions.pyi,sha256=h1oPAvbErW_i1Glzf_HsQenG-uH4KZk7X6razFbif6M,38890
43
43
  modal/gpu.py,sha256=Fe5ORvVPDIstSq1xjmM6OoNgLYFWvogP9r5BgmD3hYg,6769
44
44
  modal/image.py,sha256=nXN9k_6gApHFy8-Bk_XT2Zu3jsDsGVrC3QcuiDC4yRY,103543
45
45
  modal/image.pyi,sha256=vKdb5PpYM8wcpq9PQegeVMjrPLzAipuV4q994NZiL84,69325
@@ -150,10 +150,10 @@ modal/cli/programs/run_jupyter.py,sha256=44Lpvqk2l3hH-uOkmAOzw60NEsfB5uaRDWDKVsh
150
150
  modal/cli/programs/run_marimo.py,sha256=HyZ2za0NYqg31-mGxFQxUIAJ3Q-jRaMocEwWwI5-cdw,2887
151
151
  modal/cli/programs/vscode.py,sha256=KbTAaIXyQBVCDXxXjmBHmKpgXkUw0q4R4KkJvUjCYgk,3380
152
152
  modal/experimental/__init__.py,sha256=dPBPpxsmjZMLF3YjRrXoTvT01pl65wxi4UdFZsOem3w,15082
153
- modal/experimental/flash.py,sha256=7U6VuQ-7Y0HQximH4nHYq_4HDkdgRL60DE_-KRhj-Q0,19910
153
+ modal/experimental/flash.py,sha256=gydlThBSPgS8HA53Lwi0gUAFVtpdXu20IYAQXJSoTP0,21092
154
154
  modal/experimental/flash.pyi,sha256=A8_qJGtGoXEzKDdHbvhmCw7oqfneFEvJQK3ZdTOvUdU,10830
155
155
  modal/experimental/ipython.py,sha256=TrCfmol9LGsRZMeDoeMPx3Hv3BFqQhYnmD_iH0pqdhk,2904
156
- modal-1.1.4.dev16.dist-info/licenses/LICENSE,sha256=psuoW8kuDP96RQsdhzwOqi6fyWv0ct8CR6Jr7He_P_k,10173
156
+ modal-1.1.4.dev17.dist-info/licenses/LICENSE,sha256=psuoW8kuDP96RQsdhzwOqi6fyWv0ct8CR6Jr7He_P_k,10173
157
157
  modal_docs/__init__.py,sha256=svYKtV8HDwDCN86zbdWqyq5T8sMdGDj0PVlzc2tIxDM,28
158
158
  modal_docs/gen_cli_docs.py,sha256=c1yfBS_x--gL5bs0N4ihMwqwX8l3IBWSkBAKNNIi6bQ,3801
159
159
  modal_docs/gen_reference_docs.py,sha256=d_CQUGQ0rfw28u75I2mov9AlS773z9rG40-yq5o7g2U,6359
@@ -176,10 +176,10 @@ modal_proto/options_pb2.pyi,sha256=l7DBrbLO7q3Ir-XDkWsajm0d0TQqqrfuX54i4BMpdQg,1
176
176
  modal_proto/options_pb2_grpc.py,sha256=1oboBPFxaTEXt9Aw7EAj8gXHDCNMhZD2VXqocC9l_gk,159
177
177
  modal_proto/options_pb2_grpc.pyi,sha256=CImmhxHsYnF09iENPoe8S4J-n93jtgUYD2JPAc0yJSI,247
178
178
  modal_proto/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
179
- modal_version/__init__.py,sha256=QXpaiTjNP06yYihxFZ9XCmnyWZlsEF8DBHKKo7w2_9Y,121
179
+ modal_version/__init__.py,sha256=N2wz9sFgRKKg4OHYFwU3AVZM3zIM6izEe5fPZoeS-LU,121
180
180
  modal_version/__main__.py,sha256=2FO0yYQQwDTh6udt1h-cBnGd1c4ZyHnHSI4BksxzVac,105
181
- modal-1.1.4.dev16.dist-info/METADATA,sha256=Q23DVkB7U7xPfrKgcE6akJkZ9neMGjDucWJ4j9F6-Tw,2460
182
- modal-1.1.4.dev16.dist-info/WHEEL,sha256=1tXe9gY0PYatrMPMDd6jXqjfpz_B-Wqm32CPfRC58XU,91
183
- modal-1.1.4.dev16.dist-info/entry_points.txt,sha256=An-wYgeEUnm6xzrAP9_NTSTSciYvvEWsMZILtYrvpAI,46
184
- modal-1.1.4.dev16.dist-info/top_level.txt,sha256=4BWzoKYREKUZ5iyPzZpjqx4G8uB5TWxXPDwibLcVa7k,43
185
- modal-1.1.4.dev16.dist-info/RECORD,,
181
+ modal-1.1.4.dev17.dist-info/METADATA,sha256=otNiNfsuOjyFRzVqMRsj9VBaXbc62iXHds0Hoee0L_4,2460
182
+ modal-1.1.4.dev17.dist-info/WHEEL,sha256=1tXe9gY0PYatrMPMDd6jXqjfpz_B-Wqm32CPfRC58XU,91
183
+ modal-1.1.4.dev17.dist-info/entry_points.txt,sha256=An-wYgeEUnm6xzrAP9_NTSTSciYvvEWsMZILtYrvpAI,46
184
+ modal-1.1.4.dev17.dist-info/top_level.txt,sha256=4BWzoKYREKUZ5iyPzZpjqx4G8uB5TWxXPDwibLcVa7k,43
185
+ modal-1.1.4.dev17.dist-info/RECORD,,
modal_version/__init__.py CHANGED
@@ -1,4 +1,4 @@
1
1
  # Copyright Modal Labs 2025
2
2
  """Supplies the current version of the modal client library."""
3
3
 
4
- __version__ = "1.1.4.dev16"
4
+ __version__ = "1.1.4.dev17"