Skip to content

Commit 31b4061

Browse files
committed
compile
1 parent e8aedb3 commit 31b4061

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

csrc/deepep/ops2/op_kernel/a2/moe_distribute_dispatch_a2_pipeline.h

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -503,7 +503,7 @@ __aicore__ inline void MoeDistributeDispatchA2Pipeline<TemplateMC2TypeA2Pipeline
503 503
continue;
504 504
}
505 505
GlobalTensor<uint8_t> dstRankRecvRingU8Tensor;
506 -
dstRankRecvRingU8Tensor.SetGlobalBuffer((__gm__ uint8_t *) (hccl_.GetWindowsInAddr(rankId_)) + halfWinSize_ / 2);
506 +
dstRankRecvRingU8Tensor.SetGlobalBuffer((__gm__ uint8_t *) (hccl_.GetWindowsInAddr(localDstRank)) + halfWinSize_ / 2);
507 507
LocalTensor<uint32_t> localHccsHeadTailTensor;
508 508
GlobalTensor<uint32_t> globalHccsHeadTailTensor;
509 509
globalHccsHeadTailTensor.SetGlobalBuffer((__gm__ uint32_t *)hccsHeadTailGM[localDstRank]);
@@ -525,7 +525,7 @@ __aicore__ inline void MoeDistributeDispatchA2Pipeline<TemplateMC2TypeA2Pipeline
525 525
}
526 526
}
527 527
SyncFunc<AscendC::HardEvent::S_MTE3>();
528 -
DataCopyPad(dstRankRecvRingU8Tensor[tokenStructLen_ * index], tokenStructInRdmaTensor_,
528 +
DataCopyPad(dstRankRecvRingU8Tensor[hccsItemNum * localDstRank + tokenStructLen_ * index], tokenStructInRdmaTensor_,
529 529
tokenStructParams);
530 530
DataCopyPad(rdmaRecvRingU8Tensor_[(i * rdmaItemNum + rdmaHead) * tokenStructLen_], tokenStructInRdmaTensor_,
531 531
tokenStructParams);

0 commit comments

Comments
 (0)