@@ -61,7 +61,7 @@ def __init__(
61
61
max_retries : int = 0 ,
62
62
mounts : Optional [List [str ]] = None ,
63
63
rdzv_port : int = 29500 ,
64
- rdzv_backend : str = "c10d" ,
64
+ rdzv_backend : str = None ,
65
65
scheduler_args : Optional [Dict [str , str ]] = None ,
66
66
image : Optional [str ] = None ,
67
67
):
@@ -106,7 +106,9 @@ def _dry_run(self, cluster: "Cluster"):
106
106
env = self .env ,
107
107
max_retries = self .max_retries ,
108
108
rdzv_port = self .rdzv_port ,
109
- rdzv_backend = self .rdzv_backend ,
109
+ rdzv_backend = self .rdzv_backend
110
+ if self .rdzv_backend is not None
111
+ else "static" ,
110
112
mounts = self .mounts ,
111
113
),
112
114
scheduler = cluster .torchx_scheduler ,
@@ -145,7 +147,9 @@ def _dry_run_no_cluster(self):
145
147
env = self .env , # should this still exist?
146
148
max_retries = self .max_retries ,
147
149
rdzv_port = self .rdzv_port , # should this still exist?
148
- rdzv_backend = self .rdzv_backend ,
150
+ rdzv_backend = self .rdzv_backend
151
+ if self .rdzv_backend is not None
152
+ else "c10d" ,
149
153
mounts = self .mounts ,
150
154
image = self .image
151
155
if self .image is not None
0 commit comments