@@ -2655,7 +2655,7 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
2655
2655
OMPX_QueueSize (" LIBOMPTARGET_AMDGPU_HSA_QUEUE_SIZE" , 512 ),
2656
2656
OMPX_DefaultTeamsPerCU (" LIBOMPTARGET_AMDGPU_TEAMS_PER_CU" , 6 ),
2657
2657
OMPX_GenericSpmdTeamsPerCU (
2658
- " LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU" , 0 ),
2658
+ " LIBOMPTARGET_AMDGPU_GENERIC_SPMD_TEAMS_PER_CU" , 6 ),
2659
2659
OMPX_BigJumpLoopTeamsPerCU (
2660
2660
" LIBOMPTARGET_AMDGPU_BIG_JUMP_LOOP_TEAMS_PER_CU" , 0 ),
2661
2661
OMPX_LowTripCount (" LIBOMPTARGET_AMDGPU_LOW_TRIPCOUNT" , 2000 ),
@@ -2676,7 +2676,7 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
2676
2676
OMPX_StreamBusyWait (" LIBOMPTARGET_AMDGPU_STREAM_BUSYWAIT" , 2000000 ),
2677
2677
OMPX_UseMultipleSdmaEngines (
2678
2678
// Setting the default to true here appears to solve a random SDMA problem.
2679
- " LIBOMPTARGET_AMDGPU_USE_MULTIPLE_SDMA_ENGINES" , false ),
2679
+ " LIBOMPTARGET_AMDGPU_USE_MULTIPLE_SDMA_ENGINES" , true ),
2680
2680
OMPX_ApuMaps (" OMPX_APU_MAPS" , false ),
2681
2681
OMPX_EnableGFX90ACoarseGrainUsmMaps (
2682
2682
" OMPX_ENABLE_GFX90A_COARSE_GRAIN_USM_MAPS" , false ),
0 commit comments