We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8d826a3 · commit de3d371 · Copy full SHA for de3d371
colossalai/zero/low_level/low_level_optim.py
@@ -371,7 +371,7 @@ def _run_reduction(self):
371
for i, sz in enumerate(bucket_store.sizes):
372
grp = bucket_store.torch_pg if len(bucket_store.sizes) == 1 else bucket_store.torch_pg[i]
373
flat_grads_list = list(cur_flat_grads.split(len(cur_flat_grads) // sz))
374
- received_grad = torch.zeros_like(flat_grads_list[0])
+ received_grad = torch.empty_like(flat_grads_list[0])
375
if self._fp8_communication:
376
reduce_scatter_fp8(
377
received_grad,
0 commit comments