Skip to content

Commit e5b6539

Browse files
committed
Review comments
Change-Id: I36ddacfdb0806e988e0d8bc0c9ad018dc7e57e6f
1 parent f6cb3c5 commit e5b6539

File tree

2 files changed

+16
-14
lines changed

2 files changed

+16
-14
lines changed

llvm/lib/CodeGen/TargetInstrInfo.cpp

Lines changed: 11 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -476,9 +476,6 @@ static const TargetRegisterClass *canFoldCopy(const MachineInstr &MI,
476476
if (FoldOp.getSubReg() || LiveOp.getSubReg())
477477
return nullptr;
478478

479-
if (LiveOp.isUndef())
480-
return nullptr;
481-
482479
Register FoldReg = FoldOp.getReg();
483480
Register LiveReg = LiveOp.getReg();
484481

@@ -775,12 +772,18 @@ MachineInstr *TargetInstrInfo::foldMemoryOperand(MachineInstr &MI,
775772

776773
const MachineOperand &MO = MI.getOperand(1 - Ops[0]);
777774
MachineBasicBlock::iterator Pos = MI;
778-
779-
if (Flags == MachineMemOperand::MOStore)
780-
storeRegToStackSlot(*MBB, Pos, MO.getReg(), MO.isKill(), FI, RC, TRI,
781-
Register());
782-
else
775+
if (Flags == MachineMemOperand::MOStore) {
776+
if (MO.isUndef()) {
777+
// If this is an undef copy, we do not need to bother we inserting spill
778+
// code.
779+
BuildMI(*MBB, Pos, MI.getDebugLoc(), get(TargetOpcode::KILL)).add(MO);
780+
} else {
781+
storeRegToStackSlot(*MBB, Pos, MO.getReg(), MO.isKill(), FI, RC, TRI,
782+
Register());
783+
}
784+
} else
783785
loadRegFromStackSlot(*MBB, Pos, MO.getReg(), FI, RC, TRI, Register());
786+
784787
return &*--Pos;
785788
}
786789

llvm/test/CodeGen/AMDGPU/regalloc-undef-copy-fold.mir

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -41,14 +41,13 @@ body: |
4141
bb.0:
4242
; CHECK-LABEL: name: foo
4343
; CHECK: INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 10 /* regdef */, def %10, 10 /* regdef */, def %1, 10 /* regdef */, def %2, 10 /* regdef */, def $vgpr0_vgpr1_vgpr2_vgpr3, 10 /* regdef */, implicit-def $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15
44-
; CHECK-NEXT: [[COPY:%[0-9]+]]:av_128 = COPY undef $vgpr0_vgpr1_vgpr2_vgpr3
45-
; CHECK-NEXT: SI_SPILL_AV128_SAVE [[COPY]], %stack.2, $sgpr32, 0, implicit $exec :: (store (s128) into %stack.2, align 4, addrspace 5)
44+
; CHECK-NEXT: KILL undef $vgpr0_vgpr1_vgpr2_vgpr3
4645
; CHECK-NEXT: SI_SPILL_AV160_SAVE %2, %stack.1, $sgpr32, 0, implicit $exec :: (store (s160) into %stack.1, align 4, addrspace 5)
4746
; CHECK-NEXT: SI_SPILL_AV256_SAVE %1, %stack.3, $sgpr32, 0, implicit $exec :: (store (s256) into %stack.3, align 4, addrspace 5)
48-
; CHECK-NEXT: [[COPY1:%[0-9]+]]:vreg_512 = COPY %10
49-
; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY1]], %stack.0, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.0, align 4, addrspace 5)
50-
; CHECK-NEXT: [[COPY2:%[0-9]+]]:vreg_512 = COPY $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15
51-
; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY2]], %stack.6, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.6, align 4, addrspace 5)
47+
; CHECK-NEXT: [[COPY:%[0-9]+]]:vreg_512 = COPY %10
48+
; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY]], %stack.0, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.0, align 4, addrspace 5)
49+
; CHECK-NEXT: [[COPY1:%[0-9]+]]:vreg_512 = COPY $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15
50+
; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY1]], %stack.6, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.6, align 4, addrspace 5)
5251
; CHECK-NEXT: INLINEASM &"; clobber", 1 /* sideeffect attdialect */, 10 /* regdef */, implicit-def early-clobber $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15_vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23_vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31
5352
; CHECK-NEXT: [[SI_SPILL_V512_RESTORE:%[0-9]+]]:vreg_512 = SI_SPILL_V512_RESTORE %stack.6, $sgpr32, 0, implicit $exec :: (load (s512) from %stack.6, align 4, addrspace 5)
5453
; CHECK-NEXT: $agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15_agpr16 = COPY [[SI_SPILL_V512_RESTORE]]

0 commit comments

Comments
 (0)