@@ -104,8 +104,8 @@ jobs:
104104 source /etc/profile.d/modules.sh
105105 module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
106106 cd ${STANDALONE_DIR}
107- ${TIMING_CA} --debug 1 --runs ${{ matrix.standalone_runs }} --runsInit 2 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
108- python3 ${GITHUB_WORKSPACE}/.github/scripts/merge_runs.py --discard 2 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
107+ ${TIMING_CA} --debug 1 --runs ${{ matrix.standalone_runs }} --runsInit 0 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
108+ python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_standalone.py --discard 0 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
109109
110110 - name: Profiler - Nsight Compute
111111 if: ${{ matrix.name == 'nvidia-h100' }}
@@ -117,7 +117,7 @@ jobs:
117117 ncu --set none --metrics gpu__time_duration.avg --export ${{ matrix.name }} --clock-control none --force-overwrite ${TIMING_CA} --runs ${{ matrix.profiler_runs }} --debug 1 --PROCdebugMarkdown 1 # Generates ${{ matrix.name }}.ncu-rep
118118 ncu --import ${STANDALONE_DIR}/${{ matrix.name }}.ncu-rep --print-units base --csv > /root/${PROFILER_CSV}
119119 rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
120- python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_ncu.py --runs ${{ matrix.profiler_runs }} --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
120+ python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_ncu.py --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
121121
122122 - name: Profiler - Nsight Systems
123123 if: ${{ matrix.name == 'nvidia-l40s' }}
@@ -130,7 +130,7 @@ jobs:
130130 nsys profile -o ${{ matrix.name }} ${TIMING_CA} --runs ${{ matrix.profiler_runs }} --debug 1 --PROCdebugMarkdown 1 # Generates ${{ matrix.name }}.nsys-rep
131131 nsys stats --report cuda_gpu_kern_sum --timeunit usec --force-export=true --format csv ${{ matrix.name }}.nsys-rep > /root/${PROFILER_CSV}
132132 rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
133- python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_nsys.py --runs ${{ matrix.profiler_runs }} --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
133+ python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_nsys.py --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
134134
135135 - name: Profiler - rocprofv2
136136 if: ${{ matrix.name == 'amd-mi300x' || matrix.name == 'amd-w7900' }}
@@ -141,23 +141,23 @@ jobs:
141141 rocprofv2 --output-directory /root --output-file-name ${{ matrix.name }} ${TIMING_CA} --runs ${{ matrix.standalone_runs }} --debug 1 --PROCdebugMarkdown 1 # Generates results_${{ matrix.name }}.csv
142142 rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
143143 mv /root/results_${{ matrix.name }}.csv /root/${PROFILER_CSV}
144- python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_rocprofv2.py --runs ${{ matrix.profiler_runs }} --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
144+ python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_rocprofv2.py --input /root/${PROFILER_CSV} --output /root/summary_${PROFILER_CSV}
145145
146146 - name: Upload Artifact
147147 uses: actions/upload-artifact@v6
148148 with:
149149 name: ${{ matrix.name }}-artifact
150150 path: "/root/*.csv"
151151
152- - name: Display table on GitHub web
153- run: |
154- source /etc/profile.d/modules.sh
155- module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
156- mkdir -p ${STANDALONE_DIR}/baseline
157- curl -fL --retry 3 -o ${STANDALONE_DIR}/baseline/summary_${PROFILER_CSV} https://cernbox.cern.ch/remote.php/dav/public-files/SfYXgQOHFga2w75/baseline/summary_${PROFILER_CSV}
158- curl -fL --retry 3 -o ${STANDALONE_DIR}/baseline/summary_${BENCHMARK_CSV} https://cernbox.cern.ch/remote.php/dav/public-files/SfYXgQOHFga2w75/baseline/summary_${BENCHMARK_CSV}
159- python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --runs ${{ matrix.profiler_runs }} --baseline ${STANDALONE_DIR}/baseline/summary_${PROFILER_CSV} --current /root/summary_${PROFILER_CSV} >> ${GITHUB_STEP_SUMMARY}
160- echo -e "\n\n" >> ${GITHUB_STEP_SUMMARY}
161- python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --runs ${{ matrix.standalone_runs }} --baseline ${STANDALONE_DIR}/baseline/summary_${BENCHMARK_CSV} --current /root/summary_${BENCHMARK_CSV} >> ${GITHUB_STEP_SUMMARY}
162- rm -rf ${STANDALONE_DIR}/baseline
163- if: ${{ matrix.name != 'cpu' }}
152+ # - name: Display table on GitHub web
153+ # run: |
154+ # source /etc/profile.d/modules.sh
155+ # module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
156+ # mkdir -p ${STANDALONE_DIR}/baseline
157+ # curl -fL --retry 3 -o ${STANDALONE_DIR}/baseline/summary_${PROFILER_CSV} https://cernbox.cern.ch/remote.php/dav/public-files/SfYXgQOHFga2w75/baseline/summary_${PROFILER_CSV}
158+ # curl -fL --retry 3 -o ${STANDALONE_DIR}/baseline/summary_${BENCHMARK_CSV} https://cernbox.cern.ch/remote.php/dav/public-files/SfYXgQOHFga2w75/baseline/summary_${BENCHMARK_CSV}
159+ # python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --runs ${{ matrix.profiler_runs }} --baseline ${STANDALONE_DIR}/baseline/summary_${PROFILER_CSV} --current /root/summary_${PROFILER_CSV} >> ${GITHUB_STEP_SUMMARY}
160+ # echo -e "\n\n" >> ${GITHUB_STEP_SUMMARY}
161+ # python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --runs ${{ matrix.standalone_runs }} --baseline ${STANDALONE_DIR}/baseline/summary_${BENCHMARK_CSV} --current /root/summary_${BENCHMARK_CSV} >> ${GITHUB_STEP_SUMMARY}
162+ # rm -rf ${STANDALONE_DIR}/baseline
163+ # if: ${{ matrix.name != 'cpu' }}
0 commit comments