We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ad74bb3, commit 7638439 (Copy full SHA for 7638439)
src/lightning/pytorch/strategies/deepspeed.py
@@ -366,7 +366,7 @@ def _init_deepspeed_distributed(self) -> None:
366
f"MEMBER: {self.global_rank + 1}/{self.world_size}"
367
)
368
self._process_group_backend = self._get_process_group_backend()
369
- deepspeed.init_distributed(self._process_group_backend, distributed_port=self.cluster_environment.main_port)
+ deepspeed.init_distributed(self._process_group_backend, distributed_port=self.cluster_environment.main_port, timeout=self._timeout)
370
371
def _set_node_environment_variables(self) -> None:
372
assert self.cluster_environment is not None
0 commit comments