2121 runner : cern-nextgen-h100
2222 cmake_args : -DENABLE_CUDA=1 -DENABLE_HIP=0 -DCUDA_COMPUTETARGET=90
2323 profiler : nsys profile -o nvidia-h100
24- profiler_post : nsys stats --report cuda_gpu_kern_sum --force-export=true --format csv nvidia-h100.nsys-rep >
24+ profiler_post : nsys stats --report cuda_gpu_kern_sum --timeunit us --force-export=true --format csv nvidia-h100.nsys-rep >
2525 - name : nvidia-l40s
2626 vendor : nvidia
2727 runner : cern-nextgen-l40s
@@ -107,7 +107,7 @@ jobs:
107107 source /etc/profile.d/modules.sh
108108 module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
109109 cd ${STANDALONE_DIR}
110- ${{ matrix.profiler }} ${STANDALONE_DIR}/ca -e 50kHz -g --memSize 15000000000 --sync --debug 1 --runs 42 --runsInit 0 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
110+ ${{ matrix.profiler }} ${STANDALONE_DIR}/ca -e 50kHz -g --memSize 15000000000 --sync --debug 1 --runs 42 --runsInit 2 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
111111 ${{ matrix.profiler_post }} /root/${PROFILER_CSV}
112112 rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
113113
@@ -116,7 +116,7 @@ jobs:
116116 source /etc/profile.d/modules.sh
117117 module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
118118 python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_${{ matrix.vendor }}.py --runs 42 --input /root/${PROFILER_CSV} --output /root/reduced_${PROFILER_CSV}
119- python3 ${GITHUB_WORKSPACE}/.github/scripts/merge_runs.py --discard 0 --input /root/${BENCHMARK_CSV} --output /root/reduced_${BENCHMARK_CSV}
119+ python3 ${GITHUB_WORKSPACE}/.github/scripts/merge_runs.py --discard 2 --input /root/${BENCHMARK_CSV} --output /root/reduced_${BENCHMARK_CSV}
120120 #python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --baseline ${STANDALONE_DIR}/baseline/${PROFILER_CSV} --current /root/${PROFILER_CSV} >> ${GITHUB_STEP_SUMMARY}
121121 #echo -e "\n\n" >> ${GITHUB_STEP_SUMMARY}
122122 #python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --baseline ${STANDALONE_DIR}/baseline/${BENCHMARK_CSV} --current /root/${BENCHMARK_CSV} >> ${GITHUB_STEP_SUMMARY}
0 commit comments