Skip to content

Commit fa7263c

Browse files
committed
Switch to getOccupancyWithNumVGPRs
1 parent 09be8bf commit fa7263c

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2610,8 +2610,8 @@ bool SIInsertWaitcnts::runOnMachineFunction(MachineFunction &MF) {
2610 2610
// waveslot limited kernel runs slower with the deallocation.
2611 2611
if (!ReleaseVGPRInsts.empty() &&
2612 2612
(MF.getFrameInfo().hasCalls() ||
2613-
AMDGPU::IsaInfo::getTotalNumVGPRs(ST) /
2614-
TRI->getNumUsedPhysRegs(*MRI, AMDGPU::VGPR_32RegClass) <
2613+
ST->getOccupancyWithNumVGPRs(
2614+
TRI->getNumUsedPhysRegs(*MRI, AMDGPU::VGPR_32RegClass)) <
2615 2615
AMDGPU::IsaInfo::getMaxWavesPerEU(ST))) {
2616 2616
for (MachineInstr *MI : ReleaseVGPRInsts) {
2617 2617
if (ST->requiresNopBeforeDeallocVGPRs()) {

0 commit comments

Comments
 (0)