Skip to content

Commit cee2a83

Browse files
Reduce number of iterations for ncu profiling
1 parent 1a8011f commit cee2a83

File tree

1 file changed

+4
-5
lines changed

1 file changed

+4
-5
lines changed

.github/workflows/standalone-benchmark.yml

Lines changed: 4 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -97,17 +97,16 @@ jobs:
97 97
source /etc/profile.d/modules.sh
98 98
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
99 99
cd ${STANDALONE_DIR}
100-
ncu --set none --metrics gpu__time_duration.avg --export ${{ matrix.name }} --clock-control none --force-overwrite ${TIMING_CA} --runs 42 --debug 1 --PROCdebugMarkdown 1 # Generates ${{ matrix.name }}.ncu-rep
100+
ncu --set none --metrics gpu__time_duration.avg --export ${{ matrix.name }} --clock-control none --force-overwrite ${TIMING_CA} --runs 21 --debug 1 --PROCdebugMarkdown 1 # Generates ${{ matrix.name }}.ncu-rep
101 101
ncu --import ${STANDALONE_DIR}/${{ matrix.name }}.ncu-rep --print-units base --csv > /root/${PROFILER_CSV}
102 102
rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
103-
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_ncu.py --runs 42 --input /root/${PROFILER_CSV} --output /root/${PROFILER_CSV}
103+
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_ncu.py --runs 21 --input /root/${PROFILER_CSV} --output /root/${PROFILER_CSV}
104 104
105 105
- name: Profiler - Nsight Systems
106 106
if: ${{ matrix.name == 'nvidia-l40s' }}
107 107
run: |
108-
curl -fL --retry 3 -o ${STANDALONE_DIR}/nsys.rpm https://developer.nvidia.com/downloads/assets/tools/secure/nsight-systems/2026_2/NsightSystems-linux-cli-public-2026.2.1.210-3763964.rpm
109-
dnf install -y ${STANDALONE_DIR}/nsys.rpm
110-
rm -f ${STANDALONE_DIR}/nsys.rpm
108+
dnf config-manager --add-repo "https://developer.download.nvidia.com/devtools/repos/rhel$(source /etc/os-release; echo ${VERSION_ID%%.*})/$(rpm --eval '%{_arch}' | sed s/aarch/arm/)/"
109+
dnf install -y nsight-systems-cli-2026.2.1
111 110
source /etc/profile.d/modules.sh
112 111
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
113 112
cd ${STANDALONE_DIR}

0 commit comments

Comments
 (0)