Skip to content

Commit 024cc97

Browse files
committed
Fix merge issue in rtl.cpp
1 parent 65f0ae0 commit 024cc97

File tree

1 file changed

+1
-13
lines changed
  • offload/plugins-nextgen/amdgpu/src

1 file changed

+1
-13
lines changed

offload/plugins-nextgen/amdgpu/src/rtl.cpp

Lines changed: 1 addition & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -5128,8 +5128,7 @@ Error AMDGPUKernelTy::launchImpl(GenericDeviceTy &GenericDevice,
5128 5128
return Err;
5129 5129

5130 5130
// Only COV5 implicitargs needs to be set. COV4 implicitargs are not used.
5131-
if (ImplArgs &&
5132-
getImplicitArgsSize() == sizeof(hsa_utils::AMDGPUImplicitArgsTy)) {
5131+
if (ImplArgs) {
5133 5132
DP("Setting fields of ImplicitArgs for COV5\n");
5134 5133
ImplArgs->BlockCountX = NumBlocks[0];
5135 5134
ImplArgs->BlockCountY = NumBlocks[1];
@@ -5144,17 +5143,6 @@ Error AMDGPUKernelTy::launchImpl(GenericDeviceTy &GenericDevice,
5144 5143
(uint64_t)AMDGPUDevice.getPreAllocatedDeviceMemoryPool();
5145 5144
ImplArgs->DynamicLdsSize = KernelArgs.DynCGroupMem;
5146 5145
}
5147-
// Set the COV5+ implicit arguments to the appropriate values.
5148-
ImplArgs->BlockCountX = NumBlocks[0];
5149-
ImplArgs->BlockCountY = NumBlocks[1];
5150-
ImplArgs->BlockCountZ = NumBlocks[2];
5151-
ImplArgs->GroupSizeX = NumThreads[0];
5152-
ImplArgs->GroupSizeY = NumThreads[1];
5153-
ImplArgs->GroupSizeZ = NumThreads[2];
5154-
ImplArgs->GridDims = NumBlocks[2] * NumThreads[2] > 1
5155-
? 3
5156-
: 1 + (NumBlocks[1] * NumThreads[1] != 1);
5157-
ImplArgs->DynamicLdsSize = KernelArgs.DynCGroupMem;
5158 5146

5159 5147
// Get required OMPT-related data
5160 5148
auto LocalOmptEventInfo = getOrNullOmptEventInfo(AsyncInfoWrapper);

0 commit comments

Comments
 (0)