Skip to content

Commit 81604b4

Browse files
committed
dpl-workflow.sh: use different MI100 serialization workaround with better performance
1 parent d22033c commit 81604b4

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

prodtests/full-system-test/dpl-workflow.sh

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -270,7 +270,8 @@ if [[ $GPUTYPE == "HIP" ]]; then
270270
TIMESLICEOFFSET=$(($GPU_FIRST_ID + ($NUMAGPUIDS != 0 ? ($NGPUS * $NUMAID) : 0)))
271271
GPU_CONFIG+=" --environment \"ROCR_VISIBLE_DEVICES={timeslice${TIMESLICEOFFSET}}\""
272272
fi
273-
[[ $EPNSYNCMODE == 1 || ! -z ${OPTIMIZED_PARALLEL_ASYNC:-} ]] && [[ ${EPN_NODE_MI100:-} == "1" ]] && [[ ${DISABLE_MI100_SERIALIZATION:-0} != 1 ]] && GPU_CONFIG_KEY+="GPU_proc.serializeGPU=3;"
273+
# Serialization workaround for MI100 nodes: remove it once the problem is fixed in ROCm, and then also remove the DISABLE_MI100_SERIALIZATION flag in the O2DPG parse script
274+
[[ $EPNSYNCMODE == 1 || ! -z ${OPTIMIZED_PARALLEL_ASYNC:-} ]] && [[ ${EPN_NODE_MI100:-} == "1" ]] && [[ ${DISABLE_MI100_SERIALIZATION:-0} != 1 ]] && GPU_CONFIG_KEY+="GPU_proc.amdMI100SerializationWorkaround=1;"
274275
#export HSA_TOOLS_LIB=/opt/rocm/lib/librocm-debug-agent.so.2
275276
else
276277
GPU_CONFIG_KEY+="GPU_proc.deviceNum=-2;"

0 commit comments

Comments
 (0)