@@ -5310,18 +5310,18 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
53105310 case AMDGPU::S_MAX_U32:
53115311 case AMDGPU::S_MAX_I32:
53125312 case AMDGPU::S_AND_B32:
5313- case AMDGPU::S_AND_B64:
5314- case AMDGPU::S_OR_B32:
5315- case AMDGPU::S_OR_B64: {
5313+ case AMDGPU::S_OR_B32: {
53165314 // Idempotent operations.
53175315 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B32), DstReg).addReg(SrcReg);
53185316 RetBB = &BB;
53195317 break;
53205318 }
5321- case AMDGPU::V_CMP_LT_U64_e64: // umin
5322- case AMDGPU::V_CMP_LT_I64_e64: // min
5323- case AMDGPU::V_CMP_GT_U64_e64: // umax
5324- case AMDGPU::V_CMP_GT_I64_e64: { // max
5319+ case AMDGPU::V_CMP_LT_U64_e64: // umin
5320+ case AMDGPU::V_CMP_LT_I64_e64: // min
5321+ case AMDGPU::V_CMP_GT_U64_e64: // umax
5322+ case AMDGPU::V_CMP_GT_I64_e64: // max
5323+ case AMDGPU::S_AND_B64:
5324+ case AMDGPU::S_OR_B64: {
53255325 // Idempotent operations.
53265326 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B64), DstReg).addReg(SrcReg);
53275327 RetBB = &BB;
@@ -5365,7 +5365,7 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
53655365 .addReg(NewAccumulator->getOperand(0).getReg())
53665366 .addImm(1)
53675367 .setOperandDead(3); // Dead scc
5368- if (is32BitOpc ) {
5368+ if (Opc == AMDGPU::S_XOR_B32 ) {
53695369 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MUL_I32), DstReg)
53705370 .addReg(SrcReg)
53715371 .addReg(ParityRegister);
0 commit comments