We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d1df979, commit 443f61a (Copy full SHA for 443f61a)
launcher/src/main.rs
@@ -499,6 +499,9 @@ fn shard_manager(
499
env.push(("MASTER_PORT".into(), master_port.to_string().into()));
500
env.push(("NCCL_ASYNC_ERROR_HANDLING".into(), "1".into()));
501
502
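+ // Ask PyTorch's NCCL backend to avoid record-stream tracking of collective inputs (affects CUDA allocation lifetime); see https://discuss.pytorch.org/t/cuda-allocation-lifetime-for-inputs-to-distributed-all-reduce/191573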
503
+ env.push(("TORCH_NCCL_AVOID_RECORD_STREAMS".into(), "1".into()));
504
+
505
// Enable the fast GPU loading path in safetensors
506
env.push(("SAFETENSORS_FAST_GPU".into(), "1".into()));
507
0 commit comments