torchmonarch-nightly 2025.6.29__cp313-cp313-manylinux2014_x86_64.whl → 2025.7.1__cp313-cp313-manylinux2014_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
monarch/_rust_bindings.so CHANGED
Binary file
monarch/actor_mesh.py CHANGED
@@ -521,8 +521,21 @@ class _Actor:
521
521
  return None
522
522
 
523
523
  if self.instance is None:
524
+ # This could happen because of the following reasons. Both
525
+ # indicate a possible bug in the framework:
526
+ # 1. the execution of the previous message for "__init__" failed,
527
+ # but that error is not surfaced to the caller.
528
+ # - TODO(T229200522): there is a known bug. fix it.
529
+ # 2. this message is delivered to this actor before the previous
530
+ # message of "__init__" is delivered. Out-of-order delivery
531
+ # should never happen. It indicates either a bug in the
532
+ # message delivery mechanism, or the framework accidentally
533
+ # mixed the usage of cast and direct send.
524
534
  raise AssertionError(
525
- "__init__ failed earlier and no Actor object is available"
535
+ f"""
536
+ actor object is missing when executing method {message.method}
537
+ on actor {mailbox.actor_id}
538
+ """
526
539
  )
527
540
  the_method = getattr(self.instance, message.method)._method
528
541
 
Binary file
@@ -9,6 +9,7 @@ import ctypes
9
9
  import sys
10
10
 
11
11
  import click
12
+ from monarch._rust_bindings.monarch_extension.blocking import blocking_function
12
13
 
13
14
  from monarch._rust_bindings.monarch_extension.panic import panicking_function
14
15
 
@@ -36,6 +37,11 @@ class ErrorActor(Actor):
36
37
  """Endpoint that calls a Rust function that panics."""
37
38
  panicking_function()
38
39
 
40
+ @endpoint
41
+ async def cause_stuck(self) -> None:
42
+ """Endpoint that causes the process to hang indefinitely."""
43
+ blocking_function()
44
+
39
45
  @endpoint
40
46
  async def await_then_error(self) -> None:
41
47
  await asyncio.sleep(0.1)
@@ -171,6 +177,28 @@ async def _error_unmonitored():
171
177
  await asyncio.sleep(300)
172
178
 
173
179
 
180
+ """
181
+ TODO: This test should be enabled when stop() is fully implemented.
182
+ async def _error_unmonitored():
183
+ print("I actually ran")
184
+ sys.stdout.flush()
185
+
186
+ proc = await proc_mesh(gpus=1)
187
+ actor = await proc.spawn("error_actor", ErrorActor)
188
+
189
+ # fire and forget
190
+ send(actor.cause_stuck, (), {}, None, "all")
191
+ proc_mesh.stop()
192
+
193
+ # Wait. Eventually a supervision event will get propagated and the process
194
+ # will exit.
195
+ #
196
+ # If an event is not delivered, the test will time out before this sleep
197
+ # finishes.
198
+ await asyncio.sleep(300)
199
+ """
200
+
201
+
174
202
  @main.command("error-unmonitored")
175
203
  def error_unmonitored():
176
204
  asyncio.run(_error_unmonitored())
@@ -434,6 +434,7 @@ class DebugeeActor(Actor):
434
434
  return _debugee_actor_internal(rank)
435
435
 
436
436
 
437
+ @pytest.mark.oss_skip # pyre-ignore[56] TODO T229449782
437
438
  async def test_debug() -> None:
438
439
  input_mock = AsyncMock()
439
440
  input_mock.side_effect = [
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: torchmonarch-nightly
3
- Version: 2025.6.29
3
+ Version: 2025.7.1
4
4
  Summary: Monarch: Single controller library
5
5
  Author: Meta
6
6
  Author-email: oncall+monarch@xmail.facebook.com
@@ -1,7 +1,7 @@
1
1
  monarch/__init__.py,sha256=iUvWHc0-7Q2tovRoRxOIiA3TsefMXCbWl-jEfQ2djew,6897
2
- monarch/_rust_bindings.so,sha256=9cUwsCXdRE_hw101yv6QOQ3n2FwUKURjVkhqrVYqBTI,43742616
2
+ monarch/_rust_bindings.so,sha256=U-ZaYneJGkTj3JtIL5JQAZ_PDlU2urIw6bLbtPaxZR0,44319160
3
3
  monarch/_testing.py,sha256=jOIOG6jcZBzvEvG_DwSnwCkaMVXvSun6sJAG6nXemww,7859
4
- monarch/actor_mesh.py,sha256=QqKHVTJk9H_I-v7GoxgOdOL8-ymnRpGvNFdda0-cNrE,24534
4
+ monarch/actor_mesh.py,sha256=-IEXcIGdpVWzEV3CNeWhNJb4siMRBtnwDCtQydz7Db0,25369
5
5
  monarch/allocator.py,sha256=l0_mN43AH3K2aCchb5fk8ml95rvdgR31nRC_PqRmZWg,7865
6
6
  monarch/bootstrap_main.py,sha256=RCUQhJk07yMFiKp6HzQuqZFUpkgsT9kVEyimiwjn6_E,1827
7
7
  monarch/cached_remote_function.py,sha256=kYdB6r4OHx_T_uX4q3tCNcp1t2DJwF8tPTIahUiT2pU,8785
@@ -12,7 +12,7 @@ monarch/future.py,sha256=g1VYJl8ReBBS6VbikwWilnFqEr5qJDiSKid92AnWFV4,2058
12
12
  monarch/gradient_generator.py,sha256=Rl3dmXGceTdCc1mYBg2JciR88ywGPnW7TVkL86KwqEA,6366
13
13
  monarch/memory.py,sha256=ol86dBhFAJqg78iF25-BuK0wuwj1onR8FIioZ_B0gjw,1377
14
14
  monarch/mesh_controller.py,sha256=JIg2-MIGhqeFCXn793j8ivEu5-8ePksu--H_Pv0-Ltk,10377
15
- monarch/monarch_controller,sha256=6hzB3c6q4SEgxWIK_fAqANlfnCy4rcX0AwDkLcz9PYY,21723584
15
+ monarch/monarch_controller,sha256=5E5TBqZB-_dRrKZqrKSvATydY65ujHHWE6dR5lfXlAY,22426416
16
16
  monarch/notebook.py,sha256=zu9MKDFKf1-rCM2TqFSRJjMBeiWuKcJSyUFLvoZRQzs,25949
17
17
  monarch/opaque_module.py,sha256=oajOu_WD1hD4hxE8HDdO-tvWY7KDHWd7VaAhJEa5L2I,10446
18
18
  monarch/opaque_object.py,sha256=IVpll4pyuKZMo_EnPh4s0qnx8RlAcJrJ1yoLX6E75wQ,2782
@@ -133,7 +133,7 @@ monarch_supervisor/python_executable.py,sha256=WfCiK3wdAvm9Jxx5jgjGF991NgGc9-oHU
133
133
  tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
134
134
  tests/dispatch_bench.py,sha256=sU_m-8KAjQgYTsxI5khV664NdgLLutidni69Rtowk98,3933
135
135
  tests/dispatch_bench_helper.py,sha256=1ORgAMrRgjAjmmWeCHLLQd_bda9mJk0rS2ucEbRu28s,633
136
- tests/error_test_binary.py,sha256=BRj13wAROsUWx4jcxc07HYN2n-xyBNhnnRAhjqah-A0,5582
136
+ tests/error_test_binary.py,sha256=vfbBI6fkWTPo-Gksi2YGPw8wSxfdOHlSALpHQ6e2MIE,6386
137
137
  tests/sleep_binary.py,sha256=XfLYaAfwm9xgzM-svs8fhAeFhwYIg6SyVEnx4e6wbUw,1009
138
138
  tests/test_actor_error.py,sha256=hMpaJDkvowBM_fKuitQdKmq3iyvySaom8KNLmxEsZ-o,9534
139
139
  tests/test_alloc.py,sha256=D6DdQbtOZEvvnnc7LV-WyWFMk0Xb77eblH6Oz90zJTA,745
@@ -146,7 +146,7 @@ tests/test_future.py,sha256=cXzaNi2YDwVyjR541ScXmgktX1YFsKzbl8wep0DMVbk,3032
146
146
  tests/test_grad_generator.py,sha256=p4Pm4kMEeGldt2jUVAkGKCB0mLccKI28pltH6OTGbQA,3412
147
147
  tests/test_mock_cuda.py,sha256=5hisElxeLJ5MHw3KM9gwxBiXiMaG-Rm382u3AsQcDOI,3068
148
148
  tests/test_pdb_actor.py,sha256=5KJhuhcZDPWMdjC6eAtDdwnz1W7jNFXvIrMSFaCWaPw,3858
149
- tests/test_python_actors.py,sha256=0kF3LQpvPnAqT6xbNaBQxaG3gsMyBzzM4Ou7om9ZhoE,20069
149
+ tests/test_python_actors.py,sha256=EXGiWBFscJtFbOk7hESJqSCSuW1SC6UlXIIzEOfwAYI,20126
150
150
  tests/test_remote_functions.py,sha256=5nxYB8dfA9NT9f9Od9O3htgQtPbiRNiXZ1Kgtn75sOQ,50056
151
151
  tests/test_rust_backend.py,sha256=94S3R995ZkyIhEiBsM5flcjf5X7bscEAHBtInbTRFe8,7776
152
152
  tests/test_signal_safe_block_on.py,sha256=bmal0XgzJowZXJV6T1Blow5a-vZluYWusCThLMGxyTE,3336
@@ -157,9 +157,9 @@ tests/simulator/test_profiling.py,sha256=TGYCfzTLdkpIwnOuO6KApprmrgPIRQe60KRX3wk
157
157
  tests/simulator/test_simulator.py,sha256=LO8lA0ssY-OGEBL5ipEu74f97Y765TEwfUOv-DtIptM,14568
158
158
  tests/simulator/test_task.py,sha256=ipqBDuDAysuo1xOB9S5psaFvwe6VATD43IovCTSs0t4,2327
159
159
  tests/simulator/test_worker.py,sha256=QrWWIJ3HDgDLkBPRc2mwYPlOQoXQcj1qRfc0WUfKkFY,3507
160
- torchmonarch_nightly-2025.6.29.dist-info/licenses/LICENSE,sha256=e0Eotbf_rHOYPuEUlppIbvwy4SN98CZnl_hqwvbDA4Q,1530
161
- torchmonarch_nightly-2025.6.29.dist-info/METADATA,sha256=pfxXahOAFVZWSQpbC-6VgvxpOnSxa8Acic1RsONWV6U,2780
162
- torchmonarch_nightly-2025.6.29.dist-info/WHEEL,sha256=OlISbtpDcfagPrLwG7WtpcZbPTUnoKPnwphA_26fNqE,104
163
- torchmonarch_nightly-2025.6.29.dist-info/entry_points.txt,sha256=sqfQ16oZqjEvttUI-uj9BBXIIE6jt05bYFSmy-2hyXI,106
164
- torchmonarch_nightly-2025.6.29.dist-info/top_level.txt,sha256=E-ZssZzyM17glpVrh-S9--qJ-w9p2EjuYOuNw9tQ4Eg,33
165
- torchmonarch_nightly-2025.6.29.dist-info/RECORD,,
160
+ torchmonarch_nightly-2025.7.1.dist-info/licenses/LICENSE,sha256=e0Eotbf_rHOYPuEUlppIbvwy4SN98CZnl_hqwvbDA4Q,1530
161
+ torchmonarch_nightly-2025.7.1.dist-info/METADATA,sha256=69r1r82Eei3iFcfZuQho0RtfcgLoS31nXUf3vg_R1XQ,2779
162
+ torchmonarch_nightly-2025.7.1.dist-info/WHEEL,sha256=OlISbtpDcfagPrLwG7WtpcZbPTUnoKPnwphA_26fNqE,104
163
+ torchmonarch_nightly-2025.7.1.dist-info/entry_points.txt,sha256=sqfQ16oZqjEvttUI-uj9BBXIIE6jt05bYFSmy-2hyXI,106
164
+ torchmonarch_nightly-2025.7.1.dist-info/top_level.txt,sha256=E-ZssZzyM17glpVrh-S9--qJ-w9p2EjuYOuNw9tQ4Eg,33
165
+ torchmonarch_nightly-2025.7.1.dist-info/RECORD,,