torchmonarch-nightly 2025.6.29__cp313-cp313-manylinux2014_x86_64.whl → 2025.7.1__cp313-cp313-manylinux2014_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- monarch/_rust_bindings.so +0 -0
- monarch/actor_mesh.py +14 -1
- monarch/monarch_controller +0 -0
- tests/error_test_binary.py +28 -0
- tests/test_python_actors.py +1 -0
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/METADATA +1 -1
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/RECORD +11 -11
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/WHEEL +0 -0
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/entry_points.txt +0 -0
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/licenses/LICENSE +0 -0
- {torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/top_level.txt +0 -0
monarch/_rust_bindings.so
CHANGED
Binary file
|
monarch/actor_mesh.py
CHANGED
@@ -521,8 +521,21 @@ class _Actor:
|
|
521
521
|
return None
|
522
522
|
|
523
523
|
if self.instance is None:
|
524
|
+
# This could happen because of the following reasons. Both
|
525
|
+
# indicates a possible bug in the framework:
|
526
|
+
# 1. the execution of the previous message for "__init__" failed,
|
527
|
+
# but that error is not surfaced to the caller.
|
528
|
+
# - TODO(T229200522): there is a known bug. fix it.
|
529
|
+
# 2. this message is delivered to this actor before the previous
|
530
|
+
# message of "__init__" is delivered. Out-of-order delivery
|
531
|
+
# should never happen. It indicates either a bug in the
|
532
|
+
# message delivery mechanism, or the framework accidentally
|
533
|
+
# mixed the usage of cast and direct send.
|
524
534
|
raise AssertionError(
|
525
|
-
"
|
535
|
+
f"""
|
536
|
+
actor object is missing when executing method {message.method}
|
537
|
+
on actor {mailbox.actor_id}
|
538
|
+
"""
|
526
539
|
)
|
527
540
|
the_method = getattr(self.instance, message.method)._method
|
528
541
|
|
monarch/monarch_controller
CHANGED
Binary file
|
tests/error_test_binary.py
CHANGED
@@ -9,6 +9,7 @@ import ctypes
|
|
9
9
|
import sys
|
10
10
|
|
11
11
|
import click
|
12
|
+
from monarch._rust_bindings.monarch_extension.blocking import blocking_function
|
12
13
|
|
13
14
|
from monarch._rust_bindings.monarch_extension.panic import panicking_function
|
14
15
|
|
@@ -36,6 +37,11 @@ class ErrorActor(Actor):
|
|
36
37
|
"""Endpoint that calls a Rust function that panics."""
|
37
38
|
panicking_function()
|
38
39
|
|
40
|
+
@endpoint
|
41
|
+
async def cause_stuck(self) -> None:
|
42
|
+
"""Endpoint that causes the process to hang indefinitely."""
|
43
|
+
blocking_function()
|
44
|
+
|
39
45
|
@endpoint
|
40
46
|
async def await_then_error(self) -> None:
|
41
47
|
await asyncio.sleep(0.1)
|
@@ -171,6 +177,28 @@ async def _error_unmonitored():
|
|
171
177
|
await asyncio.sleep(300)
|
172
178
|
|
173
179
|
|
180
|
+
"""
|
181
|
+
TODO: This test should be enabled when stop() is fully implemented.
|
182
|
+
async def _error_unmonitored():
|
183
|
+
print("I actually ran")
|
184
|
+
sys.stdout.flush()
|
185
|
+
|
186
|
+
proc = await proc_mesh(gpus=1)
|
187
|
+
actor = await proc.spawn("error_actor", ErrorActor)
|
188
|
+
|
189
|
+
# fire and forget
|
190
|
+
send(actor.cause_stuck, (), {}, None, "all")
|
191
|
+
proc_mesh.stop()
|
192
|
+
|
193
|
+
# Wait. Eventually a supervision event will get propagated and the process
|
194
|
+
# will exit.
|
195
|
+
#
|
196
|
+
# If an event is not delivered, the test will time out before this sleep
|
197
|
+
# finishes.
|
198
|
+
await asyncio.sleep(300)
|
199
|
+
"""
|
200
|
+
|
201
|
+
|
174
202
|
@main.command("error-unmonitored")
|
175
203
|
def error_unmonitored():
|
176
204
|
asyncio.run(_error_unmonitored())
|
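tests/test_python_actors.py
CHANGED
[diff body not captured in this extract]
|
{torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/RECORD
CHANGED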
@@ -1,7 +1,7 @@
|
|
1
1
|
monarch/__init__.py,sha256=iUvWHc0-7Q2tovRoRxOIiA3TsefMXCbWl-jEfQ2djew,6897
|
2
|
-
monarch/_rust_bindings.so,sha256=
|
2
|
+
monarch/_rust_bindings.so,sha256=U-ZaYneJGkTj3JtIL5JQAZ_PDlU2urIw6bLbtPaxZR0,44319160
|
3
3
|
monarch/_testing.py,sha256=jOIOG6jcZBzvEvG_DwSnwCkaMVXvSun6sJAG6nXemww,7859
|
4
|
-
monarch/actor_mesh.py,sha256
|
4
|
+
monarch/actor_mesh.py,sha256=-IEXcIGdpVWzEV3CNeWhNJb4siMRBtnwDCtQydz7Db0,25369
|
5
5
|
monarch/allocator.py,sha256=l0_mN43AH3K2aCchb5fk8ml95rvdgR31nRC_PqRmZWg,7865
|
6
6
|
monarch/bootstrap_main.py,sha256=RCUQhJk07yMFiKp6HzQuqZFUpkgsT9kVEyimiwjn6_E,1827
|
7
7
|
monarch/cached_remote_function.py,sha256=kYdB6r4OHx_T_uX4q3tCNcp1t2DJwF8tPTIahUiT2pU,8785
|
@@ -12,7 +12,7 @@ monarch/future.py,sha256=g1VYJl8ReBBS6VbikwWilnFqEr5qJDiSKid92AnWFV4,2058
|
|
12
12
|
monarch/gradient_generator.py,sha256=Rl3dmXGceTdCc1mYBg2JciR88ywGPnW7TVkL86KwqEA,6366
|
13
13
|
monarch/memory.py,sha256=ol86dBhFAJqg78iF25-BuK0wuwj1onR8FIioZ_B0gjw,1377
|
14
14
|
monarch/mesh_controller.py,sha256=JIg2-MIGhqeFCXn793j8ivEu5-8ePksu--H_Pv0-Ltk,10377
|
15
|
-
monarch/monarch_controller,sha256=
|
15
|
+
monarch/monarch_controller,sha256=5E5TBqZB-_dRrKZqrKSvATydY65ujHHWE6dR5lfXlAY,22426416
|
16
16
|
monarch/notebook.py,sha256=zu9MKDFKf1-rCM2TqFSRJjMBeiWuKcJSyUFLvoZRQzs,25949
|
17
17
|
monarch/opaque_module.py,sha256=oajOu_WD1hD4hxE8HDdO-tvWY7KDHWd7VaAhJEa5L2I,10446
|
18
18
|
monarch/opaque_object.py,sha256=IVpll4pyuKZMo_EnPh4s0qnx8RlAcJrJ1yoLX6E75wQ,2782
|
@@ -133,7 +133,7 @@ monarch_supervisor/python_executable.py,sha256=WfCiK3wdAvm9Jxx5jgjGF991NgGc9-oHU
|
|
133
133
|
tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
134
134
|
tests/dispatch_bench.py,sha256=sU_m-8KAjQgYTsxI5khV664NdgLLutidni69Rtowk98,3933
|
135
135
|
tests/dispatch_bench_helper.py,sha256=1ORgAMrRgjAjmmWeCHLLQd_bda9mJk0rS2ucEbRu28s,633
|
136
|
-
tests/error_test_binary.py,sha256=
|
136
|
+
tests/error_test_binary.py,sha256=vfbBI6fkWTPo-Gksi2YGPw8wSxfdOHlSALpHQ6e2MIE,6386
|
137
137
|
tests/sleep_binary.py,sha256=XfLYaAfwm9xgzM-svs8fhAeFhwYIg6SyVEnx4e6wbUw,1009
|
138
138
|
tests/test_actor_error.py,sha256=hMpaJDkvowBM_fKuitQdKmq3iyvySaom8KNLmxEsZ-o,9534
|
139
139
|
tests/test_alloc.py,sha256=D6DdQbtOZEvvnnc7LV-WyWFMk0Xb77eblH6Oz90zJTA,745
|
@@ -146,7 +146,7 @@ tests/test_future.py,sha256=cXzaNi2YDwVyjR541ScXmgktX1YFsKzbl8wep0DMVbk,3032
|
|
146
146
|
tests/test_grad_generator.py,sha256=p4Pm4kMEeGldt2jUVAkGKCB0mLccKI28pltH6OTGbQA,3412
|
147
147
|
tests/test_mock_cuda.py,sha256=5hisElxeLJ5MHw3KM9gwxBiXiMaG-Rm382u3AsQcDOI,3068
|
148
148
|
tests/test_pdb_actor.py,sha256=5KJhuhcZDPWMdjC6eAtDdwnz1W7jNFXvIrMSFaCWaPw,3858
|
149
|
-
tests/test_python_actors.py,sha256=
|
149
|
+
tests/test_python_actors.py,sha256=EXGiWBFscJtFbOk7hESJqSCSuW1SC6UlXIIzEOfwAYI,20126
|
150
150
|
tests/test_remote_functions.py,sha256=5nxYB8dfA9NT9f9Od9O3htgQtPbiRNiXZ1Kgtn75sOQ,50056
|
151
151
|
tests/test_rust_backend.py,sha256=94S3R995ZkyIhEiBsM5flcjf5X7bscEAHBtInbTRFe8,7776
|
152
152
|
tests/test_signal_safe_block_on.py,sha256=bmal0XgzJowZXJV6T1Blow5a-vZluYWusCThLMGxyTE,3336
|
@@ -157,9 +157,9 @@ tests/simulator/test_profiling.py,sha256=TGYCfzTLdkpIwnOuO6KApprmrgPIRQe60KRX3wk
|
|
157
157
|
tests/simulator/test_simulator.py,sha256=LO8lA0ssY-OGEBL5ipEu74f97Y765TEwfUOv-DtIptM,14568
|
158
158
|
tests/simulator/test_task.py,sha256=ipqBDuDAysuo1xOB9S5psaFvwe6VATD43IovCTSs0t4,2327
|
159
159
|
tests/simulator/test_worker.py,sha256=QrWWIJ3HDgDLkBPRc2mwYPlOQoXQcj1qRfc0WUfKkFY,3507
|
160
|
-
torchmonarch_nightly-2025.
|
161
|
-
torchmonarch_nightly-2025.
|
162
|
-
torchmonarch_nightly-2025.
|
163
|
-
torchmonarch_nightly-2025.
|
164
|
-
torchmonarch_nightly-2025.
|
165
|
-
torchmonarch_nightly-2025.
|
160
|
+
torchmonarch_nightly-2025.7.1.dist-info/licenses/LICENSE,sha256=e0Eotbf_rHOYPuEUlppIbvwy4SN98CZnl_hqwvbDA4Q,1530
|
161
|
+
torchmonarch_nightly-2025.7.1.dist-info/METADATA,sha256=69r1r82Eei3iFcfZuQho0RtfcgLoS31nXUf3vg_R1XQ,2779
|
162
|
+
torchmonarch_nightly-2025.7.1.dist-info/WHEEL,sha256=OlISbtpDcfagPrLwG7WtpcZbPTUnoKPnwphA_26fNqE,104
|
163
|
+
torchmonarch_nightly-2025.7.1.dist-info/entry_points.txt,sha256=sqfQ16oZqjEvttUI-uj9BBXIIE6jt05bYFSmy-2hyXI,106
|
164
|
+
torchmonarch_nightly-2025.7.1.dist-info/top_level.txt,sha256=E-ZssZzyM17glpVrh-S9--qJ-w9p2EjuYOuNw9tQ4Eg,33
|
165
|
+
torchmonarch_nightly-2025.7.1.dist-info/RECORD,,
|
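{torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/WHEEL
RENAMED
File without changes
|
{torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/entry_points.txt
RENAMED
File without changes
|
{torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/licenses/LICENSE
RENAMED
File without changes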
|
{torchmonarch_nightly-2025.6.29.dist-info → torchmonarch_nightly-2025.7.1.dist-info}/top_level.txt
RENAMED
File without changes
|