Skip to content
Open
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 3 additions & 1 deletion torchft/manager.py
Original file line number Diff line number Diff line change
Expand Up @@ -730,7 +730,9 @@ def _async_quorum(
f"resetting fr recording for quorum id {self._quorum_id}"
)
self._update_fr_path()
- torch._C._distributed_c10d._reset_fr_recording_nccl() # pyre-ignore
+ # Only reset FR recording if available (requires NCCL Flight Recorder support)
+ if hasattr(torch._C._distributed_c10d, "_reset_fr_recording_nccl"):
+     torch._C._distributed_c10d._reset_fr_recording_nccl() # pyre-ignore
except Exception as e:
self._logger.exception(f"got exception in pg configure: {e}")
self.report_error(e)
Expand Down
Loading