Skip to content

Commit de31829

Browse files
committed
dpl-workflow.sh: add env variable to use full MI100 serialization in online
1 parent c864689 commit de31829

File tree

1 file changed

+7
-2
lines changed

1 file changed

+7
-2
lines changed

prodtests/full-system-test/dpl-workflow.sh

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -278,8 +278,13 @@ if [[ $GPUTYPE == "HIP" ]]; then
278278
GPU_CONFIG+=" --environment \"ROCR_VISIBLE_DEVICES={timeslice${TIMESLICEOFFSET}}\""
279279
fi
280280
# Serialization workaround for MI100 nodes: remove it again once the problem is fixed in ROCm, and then also remove the DISABLE_MI100_SERIALIZATION flag in the O2DPG parse script
281-
[[ $EPNSYNCMODE == 1 ]] && [[ ${EPN_NODE_MI100:-} == "1" ]] && [[ ${DISABLE_MI100_SERIALIZATION:-0} != 1 ]] && GPU_CONFIG_KEY+="GPU_proc.amdMI100SerializationWorkaround=1;"
282-
[[ -n ${OPTIMIZED_PARALLEL_ASYNC:-} ]] && [[ ${EPN_NODE_MI100:-} == "1" ]] && [[ ${DISABLE_MI100_SERIALIZATION:-0} != 1 ]] && GPU_CONFIG_KEY+="GPU_proc.serializeGPU=3;"
281+
if [[ ${EPN_NODE_MI100:-} == "1" && ${DISABLE_MI100_SERIALIZATION:-0} != 1 ]]; then
282+
if [[ -n ${OPTIMIZED_PARALLEL_ASYNC:-} ]] || [[ $EPNSYNCMODE == 1 && ${FULL_MI100_SERIALIZATION:-0} == 1 ]]; then
283+
GPU_CONFIG_KEY+="GPU_proc.serializeGPU=3;"
284+
elif [[ $EPNSYNCMODE == 1 ]]; then
285+
GPU_CONFIG_KEY+="GPU_proc.amdMI100SerializationWorkaround=1;"
286+
fi
287+
fi
283288
#export HSA_TOOLS_LIB=/opt/rocm/lib/librocm-debug-agent.so.2
284289
else
285290
GPU_CONFIG_KEY+="GPU_proc.deviceNum=-2;"

0 commit comments

Comments
 (0)