We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b03774f · commit 97d8cb5 · Copy full SHA for 97d8cb5
tests/test_cute_dsl_blockscaled_gemm_allreduce_two_shot.py
@@ -38,7 +38,7 @@ def create_mc_tensor(torch_tensor_cpu, dtype, is_dynamic_layout=True):
38
dtype=torch_tensor_cpu.dtype
39
)
40
41
- torch_symm_tensor_lmn.copy_(torch_tensor_cpu)
+ torch_symm_tensor_lmn.copy_(torch_tensor_cpu_lmn)
42
torch_symm_tensor = torch_symm_tensor_lmn.permute(1, 2, 0)
43
symm = symm_mem.rendezvous(torch_symm_tensor, group=dist.group.WORLD.group_name)
44
mc_ptr = symm.multicast_ptr
0 commit comments