Skip to content

Commit dbd8049

Browse files
committed
[OpenMP][plugin] Improve 521.miniswp: set the default for
LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU from 0 to 6.

| time   | base  | new   | improvement |
|--------|-------|-------|-------------|
| mi300x | 64.4  | 55.3  | 16.5%       |
| mi300a | 118.9 | 96.1  | 23.7%       |
| mi250  | 178.1 | 151.4 | 17.7%       |
1 parent a1caab7 commit dbd8049

File tree

1 file changed

+1
-1
lines changed
  • offload/plugins-nextgen/amdgpu/src

1 file changed

+1
-1
lines changed

offload/plugins-nextgen/amdgpu/src/rtl.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2906,7 +2906,7 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
2906 2906   OMPX_QueueSize("LIBOMPTARGET_AMDGPU_HSA_QUEUE_SIZE", 512),
2907 2907   OMPX_DefaultTeamsPerCU("LIBOMPTARGET_AMDGPU_TEAMS_PER_CU", 4),
2908 2908   OMPX_GenericSpmdTeamsPerCU(
2909      - "LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU", 0),
     2909 + "LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU", 6),
2910 2910   OMPX_BigJumpLoopTeamsPerCU(
2911 2911   "LIBOMPTARGET_AMDGPU_BIG_JUMP_LOOP_TEAMS_PER_CU", 0),
2912 2912   OMPX_BigJumpLoopMaxTotalTeams(

0 commit comments

Comments
 (0)