@@ -5395,18 +5395,18 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
53955395 case AMDGPU::S_MAX_U32:
53965396 case AMDGPU::S_MAX_I32:
53975397 case AMDGPU::S_AND_B32:
5398- case AMDGPU::S_AND_B64:
5399- case AMDGPU::S_OR_B32:
5400- case AMDGPU::S_OR_B64: {
5398+ case AMDGPU::S_OR_B32: {
54015399 // Idempotent operations.
54025400 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B32), DstReg).addReg(SrcReg);
54035401 RetBB = &BB;
54045402 break;
54055403 }
5406- case AMDGPU::V_CMP_LT_U64_e64: // umin
5407- case AMDGPU::V_CMP_LT_I64_e64: // min
5408- case AMDGPU::V_CMP_GT_U64_e64: // umax
5409- case AMDGPU::V_CMP_GT_I64_e64: { // max
5404+ case AMDGPU::V_CMP_LT_U64_e64: // umin
5405+ case AMDGPU::V_CMP_LT_I64_e64: // min
5406+ case AMDGPU::V_CMP_GT_U64_e64: // umax
5407+ case AMDGPU::V_CMP_GT_I64_e64: // max
5408+ case AMDGPU::S_AND_B64:
5409+ case AMDGPU::S_OR_B64: {
54105410 // Idempotent operations.
54115411 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B64), DstReg).addReg(SrcReg);
54125412 RetBB = &BB;
@@ -5459,7 +5459,7 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
54595459 .addReg(NewAccumulator->getOperand(0).getReg())
54605460 .addImm(1)
54615461 .setOperandDead(3); // Dead scc
5462- if (is32BitOpc ) {
5462+ if (Opc == AMDGPU::S_XOR_B32 ) {
54635463 BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MUL_I32), DstReg)
54645464 .addReg(SrcReg)
54655465 .addReg(ParityRegister);
0 commit comments