torchx-nightly 2025.6.18__py3-none-any.whl → 2025.6.20__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of torchx-nightly might be problematic. Click here for more details.
- torchx/components/dist.py +3 -3
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/METADATA +1 -1
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/RECORD +7 -7
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/LICENSE +0 -0
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/WHEEL +0 -0
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/entry_points.txt +0 -0
- {torchx_nightly-2025.6.18.dist-info → torchx_nightly-2025.6.20.dist-info}/top_level.txt +0 -0
torchx/components/dist.py
CHANGED
|
@@ -132,9 +132,6 @@ def spmd(
|
|
|
132
132
|
j: {nnodes}x{nproc_per_node}. For GPU hosts omitting nproc_per_node will infer it from the GPU count on the host
|
|
133
133
|
env: environment variables to be passed to the run (e.g. ENV1=v1,ENV2=v2,ENV3=v3)
|
|
134
134
|
max_retries: the number of scheduler retries allowed
|
|
135
|
-
rdzv_port: the port on rank0's host to use for hosting the c10d store used for rendezvous.
|
|
136
|
-
Only takes effect when running multi-node. When running single node, this parameter
|
|
137
|
-
is ignored and a random free port is chosen.
|
|
138
135
|
mounts: (for docker based runs only) mounts to mount into the worker environment/container
|
|
139
136
|
(ex. type=<bind/volume>,src=/host,dst=/job[,readonly]).
|
|
140
137
|
debug: whether to run with preset debug flags enabled
|
|
@@ -174,6 +171,7 @@ def ddp(
|
|
|
174
171
|
max_retries: int = 0,
|
|
175
172
|
rdzv_port: int = 29500,
|
|
176
173
|
rdzv_backend: str = "c10d",
|
|
174
|
+
rdzv_conf: Optional[str] = None,
|
|
177
175
|
mounts: Optional[List[str]] = None,
|
|
178
176
|
debug: bool = False,
|
|
179
177
|
tee: int = 3,
|
|
@@ -208,6 +206,7 @@ def ddp(
|
|
|
208
206
|
Only takes effect when running multi-node. When running single node, this parameter
|
|
209
207
|
is ignored and a random free port is chosen.
|
|
210
208
|
rdzv_backend: the rendezvous backend to use. Only takes effect when running multi-node.
|
|
209
|
+
rdzv_conf: the additional rendezvous configuration to use (ex. join_timeout=600,close_timeout=600,timeout=600).
|
|
211
210
|
mounts: mounts to mount into the worker environment/container (ex. type=<bind/volume>,src=/host,dst=/job[,readonly]).
|
|
212
211
|
See scheduler documentation for more info.
|
|
213
212
|
debug: whether to run with preset debug flags enabled
|
|
@@ -258,6 +257,7 @@ def ddp(
|
|
|
258
257
|
"torchrun",
|
|
259
258
|
"--rdzv_backend",
|
|
260
259
|
rdzv_backend,
|
|
260
|
+
*(["--rdzv_conf", rdzv_conf] if rdzv_conf is not None else []),
|
|
261
261
|
"--rdzv_endpoint",
|
|
262
262
|
rdzv_endpoint,
|
|
263
263
|
"--rdzv_id",
|
|
@@ -24,7 +24,7 @@ torchx/cli/colors.py,sha256=yLMes7e_UoLAfhxE0W6edhc58t83UHAlnCN2ANPeuXw,568
|
|
|
24
24
|
torchx/cli/main.py,sha256=1Jf2cnO6Y2W69Adt88avmNPVrL6ZR4Hkff6GVB4293k,3484
|
|
25
25
|
torchx/components/__init__.py,sha256=6Sb8RWRGObajkH7eFSKv5bHaN5bzTqJiSEmrIIo3OIc,12121
|
|
26
26
|
torchx/components/component_test_base.py,sha256=22iNSdVa_qTW3SMM30Pw5UEWlK4DZVw0C03EqYiaLOI,4150
|
|
27
|
-
torchx/components/dist.py,sha256=
|
|
27
|
+
torchx/components/dist.py,sha256=9jECk3jjQ4Yh4oWDK8vnQ7kcI0-OWCbbwj8uvBdI9FU,14588
|
|
28
28
|
torchx/components/interpret.py,sha256=g8gkKdDJvsBfX1ZrpVT7n2bMEtmwRV_1AqDyAnnQ_aA,697
|
|
29
29
|
torchx/components/metrics.py,sha256=1gbp8BfzZWGa7PD1db5vRADlONzmae4qSBUUdCWayr0,2814
|
|
30
30
|
torchx/components/serve.py,sha256=uxIC5gU2ecg0EJIPX_oEPzNNOXRAre4j2eXusrgwGAI,2156
|
|
@@ -115,9 +115,9 @@ torchx/workspace/__init__.py,sha256=FqN8AN4VhR1C_SBY10MggQvNZmyanbbuPuE-JCjkyUY,
|
|
|
115
115
|
torchx/workspace/api.py,sha256=PtDkGTC5lX03pRoYpuMz2KCmM1ZOycRP1UknqvNb97Y,6341
|
|
116
116
|
torchx/workspace/dir_workspace.py,sha256=npNW_IjUZm_yS5r-8hrRkH46ndDd9a_eApT64m1S1T4,2268
|
|
117
117
|
torchx/workspace/docker_workspace.py,sha256=PFu2KQNVC-0p2aKJ-W_BKA9ZOmXdCY2ABEkCExp3udQ,10269
|
|
118
|
-
torchx_nightly-2025.6.18.dist-info/LICENSE,sha256=WVHfXhFC0Ia8LTKt_nJVYobdqTJVg_4J3Crrfm2A8KQ,1721
|
|
119
|
-
torchx_nightly-2025.6.
|
|
120
|
-
torchx_nightly-2025.6.18.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
|
121
|
-
torchx_nightly-2025.6.18.dist-info/entry_points.txt,sha256=T328AMXeKI3JZnnxfkEew2ZcMN1oQDtkXjMz7lkV-P4,169
|
|
122
|
-
torchx_nightly-2025.6.18.dist-info/top_level.txt,sha256=pxew3bc2gsiViS0zADs0jb6kC5v8o_Yy_85fhHj_J1A,7
|
|
123
|
-
torchx_nightly-2025.6.18.dist-info/RECORD,,
|
|
118
|
+
torchx_nightly-2025.6.20.dist-info/LICENSE,sha256=WVHfXhFC0Ia8LTKt_nJVYobdqTJVg_4J3Crrfm2A8KQ,1721
|
|
119
|
+
torchx_nightly-2025.6.20.dist-info/METADATA,sha256=dLZF00f12ZkXgCz2pkxO3My4t78eMek-C63BX2E7I6M,6120
|
|
120
|
+
torchx_nightly-2025.6.20.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
|
121
|
+
torchx_nightly-2025.6.20.dist-info/entry_points.txt,sha256=T328AMXeKI3JZnnxfkEew2ZcMN1oQDtkXjMz7lkV-P4,169
|
|
122
|
+
torchx_nightly-2025.6.20.dist-info/top_level.txt,sha256=pxew3bc2gsiViS0zADs0jb6kC5v8o_Yy_85fhHj_J1A,7
|
|
123
|
+
torchx_nightly-2025.6.20.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|