Skip to content

Commit f5d8b0c

Browse files
Update
1 parent cbc795e commit f5d8b0c

4 files changed

Lines changed: 8 additions & 8 deletions

File tree

.github/scripts/merge_runs.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
22 22

23 23
data = [["name", "time", "stdev"]]
24 24
for name, time_list in time_dict.items():
25-
mean = statistics.mean(time_list[args.discard:])
25+
mean = int(statistics.mean(time_list[args.discard:]))
26 26
runs = len(time_list[args.discard:])
27 27
stdev = 0.0 if runs == 1 else statistics.stdev(time_list[args.discard:])
28 28
data.append([name, mean, stdev])

.github/scripts/profiler_amd.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
25 25
data = [["name", "time", "stdev"]]
26 26
for name, time_list in time_dict.items():
27 27
count = len(time_list) / args.runs
28-
mean = statistics.mean(time_list) * count
28+
mean = int(statistics.mean(time_list) * count)
29 29
stdev = 0 if args.runs == 1 else statistics.stdev(time_list) * count
30 30
data.append([name, mean, stdev])
31 31

.github/scripts/profiler_nvidia.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,8 +18,8 @@
18 18
if row:
19 19
full_name = row[8]
20 20
instances = int(row[2])
21-
time = int(row[1]) / 1000.0
22-
sigma = float(row[7]) / 1000.0
21+
time = int(row[1])
22+
sigma = float(row[7])
23 23
if len(full_name) > 5 and full_name[:5] == "krnl_":
24 24
name = full_name[5:]
25 25
ntsi_list.append([name, time, sigma, instances])
@@ -29,7 +29,7 @@
29 29
data = [["name", "time", "stdev"]]
30 30
for name, time, sigma, instances in ntsi_list:
31 31
count = instances / args.runs
32-
mean = time * count
32+
mean = int(time * count)
33 33
stdev = sigma * count
34 34
data.append([name, mean, stdev])
35 35

.github/workflows/standalone-benchmark.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ jobs:
21 21
runner: cern-nextgen-h100
22 22
cmake_args: -DENABLE_CUDA=1 -DENABLE_HIP=0 -DCUDA_COMPUTETARGET=90
23 23
profiler: nsys profile -o nvidia-h100
24-
profiler_post: nsys stats --report cuda_gpu_kern_sum --force-export=true --format csv nvidia-h100.nsys-rep >
24+
profiler_post: nsys stats --report cuda_gpu_kern_sum --timeunit us --force-export=true --format csv nvidia-h100.nsys-rep >
25 25
- name: nvidia-l40s
26 26
vendor: nvidia
27 27
runner: cern-nextgen-l40s
@@ -107,7 +107,7 @@ jobs:
107 107
source /etc/profile.d/modules.sh
108 108
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
109 109
cd ${STANDALONE_DIR}
110-
${{ matrix.profiler }} ${STANDALONE_DIR}/ca -e 50kHz -g --memSize 15000000000 --sync --debug 1 --runs 42 --runsInit 0 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
110+
${{ matrix.profiler }} ${STANDALONE_DIR}/ca -e 50kHz -g --memSize 15000000000 --sync --debug 1 --runs 42 --runsInit 2 --PROCdebugMarkdown 1 --PROCresetTimers 1 --PROCdebugCSV /root/${BENCHMARK_CSV}
111 111
${{ matrix.profiler_post }} /root/${PROFILER_CSV}
112 112
rm -rf ${STANDALONE_DIR}/events/50kHz ${STANDALONE_DIR}/build
113 113
@@ -116,7 +116,7 @@ jobs:
116 116
source /etc/profile.d/modules.sh
117 117
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
118 118
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_${{ matrix.vendor }}.py --runs 42 --input /root/${PROFILER_CSV} --output /root/reduced_${PROFILER_CSV}
119-
python3 ${GITHUB_WORKSPACE}/.github/scripts/merge_runs.py --discard 0 --input /root/${BENCHMARK_CSV} --output /root/reduced_${BENCHMARK_CSV}
119+
python3 ${GITHUB_WORKSPACE}/.github/scripts/merge_runs.py --discard 2 --input /root/${BENCHMARK_CSV} --output /root/reduced_${BENCHMARK_CSV}
120 120
#python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --baseline ${STANDALONE_DIR}/baseline/${PROFILER_CSV} --current /root/${PROFILER_CSV} >> ${GITHUB_STEP_SUMMARY}
121 121
#echo -e "\n\n" >> ${GITHUB_STEP_SUMMARY}
122 122
#python3 ${GITHUB_WORKSPACE}/.github/scripts/csv_to_md.py --baseline ${STANDALONE_DIR}/baseline/${BENCHMARK_CSV} --current /root/${BENCHMARK_CSV} >> ${GITHUB_STEP_SUMMARY}

0 commit comments

Comments (0)