Skip to content

Commit b34d2e7

Browse files
committed
[OpenMP][plugin] Improve 521.miniswp: set the default for
LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU from 0 to 6.

Measured time before (base) and after (new) the change:

device    base    new     improvement
mi300x    64.4    55.3    16.5%
mi300a    118.9   96.1    23.7%
mi250     178.1   151.4   17.7%
1 parent 8ef0c44 commit b34d2e7

File tree

1 file changed

+1
-1
lines changed
  • offload/plugins-nextgen/amdgpu/src

1 file changed

+1
-1
lines changed

offload/plugins-nextgen/amdgpu/src/rtl.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2655,7 +2655,7 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
2655 2655    OMPX_QueueSize("LIBOMPTARGET_AMDGPU_HSA_QUEUE_SIZE", 512),
2656 2656    OMPX_DefaultTeamsPerCU("LIBOMPTARGET_AMDGPU_TEAMS_PER_CU", 6),
2657 2657    OMPX_GenericSpmdTeamsPerCU(
2658      -  "LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU", 0),
     2658 +  "LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU", 6),
2659 2659    OMPX_BigJumpLoopTeamsPerCU(
2660 2660    "LIBOMPTARGET_AMDGPU_BIG_JUMP_LOOP_TEAMS_PER_CU", 0),
2661 2661    OMPX_LowTripCount("LIBOMPTARGET_AMDGPU_LOW_TRIPCOUNT", 2000),

0 commit comments

Comments
 (0)