Skip to content

Commit 649e52a

Browse files
Use --debug 1 only for CPU
1 parent a909199 commit 649e52a

3 files changed

Lines changed: 7 additions & 7 deletions

File tree

.github/workflows/standalone-benchmark.yml

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ jobs:
1717
name: [cpu, nvidia-h100, nvidia-l40s, amd-mi300x, amd-w7900]
1818
include:
1919
- name: cpu
20-
runner: cern-nextgen-mi300x
20+
runner: cern-nextgen-cpuintensive
2121
cmake_args: -DENABLE_CUDA=0 -DENABLE_HIP=0
2222
profiler_runs: 42
2323
standalone_runs: 42
@@ -53,7 +53,7 @@ jobs:
5353
STANDALONE_DIR: /root/standalone
5454
BENCHMARK_CSV: standalone_${{ matrix.name }}.csv
5555
PROFILER_CSV: profiler_${{ matrix.name }}.csv
56-
TIMING_CA: ./ca -e 50kHz ${{ matrix.cpu_gpu }} --seed 0 --sync --runsInit 0 --PROCresetTimers 1 --PROCdebugMarkdown 1 --debug 1 # Add --runs 42 for benchmark runs
56+
TIMING_CA: ./ca -e 50kHz ${{ matrix.cpu_gpu }} --seed 0 --sync --runsInit 0 --PROCresetTimers 1 --PROCdebugMarkdown 1 # Add --runs 42 for benchmark runs
5757
LD_LIBRARY_PATH: /usr/local/cuda-13.0/compat
5858

5959
name: ${{ matrix.name }}
@@ -99,13 +99,13 @@ jobs:
9999
env:
100100
DETERMINISTIC_MODE: OFF
101101

102-
- name: Benchmark Track Reconstruction
102+
- name: Standalone Benchmark Track
103103
run: |
104104
source /etc/profile.d/modules.sh
105105
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
106106
cd ${STANDALONE_DIR}
107-
${TIMING_CA} --runs ${{ matrix.standalone_runs }} --PROCdebugCSV /root/${BENCHMARK_CSV}
108-
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_standalone.py --discard 0 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
107+
${TIMING_CA} --runs ${{ matrix.standalone_runs }} --PROCdebugCSV /root/${BENCHMARK_CSV} --debug 1
108+
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_standalone.py --discard 2 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
109109
110110
- name: Profiler - Nsight Compute
111111
if: ${{ matrix.name == 'nvidia-h100' }}

GPU/GPUTracking/SectorTracker/GPUTPCTrack.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
2121

2222
namespace o2::gpu
2323
{
24-
constexpr MemLayout::Flag GPUTPCTrackLayout = MemLayout::Flag::aos;
24+
constexpr MemLayout::Flag GPUTPCTrackLayout = MemLayout::Flag::soa;
2525

2626
/**
2727
* @class GPUTPCTrack

GPU/GPUTracking/SectorTracker/GPUTPCTracklet.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
2121

2222
namespace o2::gpu
2323
{
24-
constexpr MemLayout::Flag GPUTPCTrackletLayout = MemLayout::Flag::aos;
24+
constexpr MemLayout::Flag GPUTPCTrackletLayout = MemLayout::Flag::soa;
2525

2626
/**
2727
* @class GPUTPCTracklet

0 commit comments

Comments (0)