Skip to content

Commit 4e31ba9

Browse files
committed
Change low trip count to 16000 and min threads for low trip count to 32
OMPX_LowTripCount("LIBOMPTARGET_AMDGPU_LOW_TRIPCOUNT", 16000),
OMPX_SmallBlockSize("LIBOMPTARGET_MIN_THREADS_FOR_LOW_TRIP_COUNT", 32),

Change-Id: I19b8b10e219c91015079aeee6080d487acf3c694
1 parent 92c9e9a commit 4e31ba9

File tree

1 file changed

+2
-2
lines changed
  • offload/plugins-nextgen/amdgpu/src

1 file changed

+2
-2
lines changed

offload/plugins-nextgen/amdgpu/src/rtl.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2760,8 +2760,8 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
2760 2760    "LIBOMPTARGET_AMDGPU_BIG_JUMP_LOOP_TEAMS_PER_CU", 0),
2761 2761    OMPX_BigJumpLoopMaxTotalTeams(
2762 2762    "LIBOMPTARGET_AMDGPU_BIG_JUMP_LOOP_MAX_TOTAL_TEAMS", 1024 * 1024),
2763      -  OMPX_LowTripCount("LIBOMPTARGET_AMDGPU_LOW_TRIPCOUNT", 2000),
2764      -  OMPX_SmallBlockSize("LIBOMPTARGET_MIN_THREADS_FOR_LOW_TRIP_COUNT", 8),
     2763 +  OMPX_LowTripCount("LIBOMPTARGET_AMDGPU_LOW_TRIPCOUNT", 16000),
     2764 +  OMPX_SmallBlockSize("LIBOMPTARGET_MIN_THREADS_FOR_LOW_TRIP_COUNT", 32),
2765 2765    OMPX_NumBlocksForLowTripcount("LIBOMPTARGET_BLOCKS_FOR_LOW_TRIP_COUNT",
2766 2766    0),
2767 2767    OMPX_WavesPerCUForLowTripcount(

0 commit comments

Comments
 (0)