Skip to content

Commit 6e2c039

Browse files
Use --debug only with standalone
1 parent 1472ee8 commit 6e2c039

2 files changed

Lines changed: 10 additions & 10 deletions

File tree

.github/workflows/standalone-benchmark.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -53,7 +53,7 @@ jobs:
5353
STANDALONE_DIR: /root/standalone
5454
BENCHMARK_CSV: standalone_${{ matrix.name }}.csv
5555
PROFILER_CSV: profiler_${{ matrix.name }}.csv
56-
TIMING_CA: ./ca -e 50kHz ${{ matrix.cpu_gpu }} --seed 0 --sync --runsInit 0 --PROCresetTimers 1 --PROCdebugMarkdown 1 --debug 1 # Add --runs 42 for benchmark runs
56+
TIMING_CA: ./ca -e 50kHz ${{ matrix.cpu_gpu }} --seed 0 --sync --runsInit 0 --PROCresetTimers 1 --PROCdebugMarkdown 1 # Add --runs 42 for benchmark runs
5757
LD_LIBRARY_PATH: /usr/local/cuda-13.0/compat
5858

5959
name: ${{ matrix.name }}
@@ -99,13 +99,13 @@ jobs:
9999
env:
100100
DETERMINISTIC_MODE: OFF
101101

102-
- name: Benchmark Track Reconstruction
102+
- name: Standalone Benchmark Track
103103
run: |
104104
source /etc/profile.d/modules.sh
105105
module load ninja/fortran-v1.11.1.g9-15 Vc/1.4.5-10 boost/v1.83.0-alice2-57 fmt/11.1.2-14 CMake/v3.31.6-10 ms_gsl/4.2.1-3 Clang/v20.1.7-9 TBB/v2022.3.0-3 ROOT/v6-36-04-alice9-15 ONNXRuntime/v1.22.0-71 GLFW/3.3.2-25
106106
cd ${STANDALONE_DIR}
107-
${TIMING_CA} --runs ${{ matrix.standalone_runs }} --PROCdebugCSV /root/${BENCHMARK_CSV}
108-
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_standalone.py --discard 0 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
107+
${TIMING_CA} --runs ${{ matrix.standalone_runs }} --PROCdebugCSV /root/${BENCHMARK_CSV} --debug 1
108+
python3 ${GITHUB_WORKSPACE}/.github/scripts/profiler_standalone.py --discard 2 --input /root/${BENCHMARK_CSV} --output /root/summary_${BENCHMARK_CSV}
109109
110110
- name: Profiler - Nsight Compute
111111
if: ${{ matrix.name == 'nvidia-h100' }}

GPU/Common/MemLayout.h

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -292,20 +292,20 @@ struct interface<S, F, Flag::soa> { using type = wrapper<S, F>; };
292292

293293
#define MEMLAYOUT_APPLY_UNARY(...)\
294294
template <class Function>\
295-
constexpr auto apply(Function&& f) { return f(__VA_ARGS__); }\
295+
__attribute__((flatten)) constexpr auto apply(Function&& f) { return f(__VA_ARGS__); }\
296296
template <class Function>\
297-
constexpr auto apply(Function&& f) const { return f(__VA_ARGS__); }\
297+
__attribute__((flatten)) constexpr auto apply(Function&& f) const { return f(__VA_ARGS__); }\
298298

299299
#define MEMLAYOUT_EXPAND(m) f(m, other.m)
300300

301301
#define MEMLAYOUT_APPLY_BINARY(STRUCT_NAME, ...)\
302302
template <template <class> class F_other, class Function>\
303-
constexpr STRUCT_NAME apply(STRUCT_NAME<F_other>& other, Function&& f) { return {__VA_ARGS__}; }\
303+
__attribute__((flatten)) constexpr STRUCT_NAME apply(STRUCT_NAME<F_other>& other, Function&& f) { return {__VA_ARGS__}; }\
304304
template <template <class> class F_other, class Function>\
305-
constexpr STRUCT_NAME apply(STRUCT_NAME<F_other>& other, Function&& f) const { return {__VA_ARGS__}; }\
305+
__attribute__((flatten)) constexpr STRUCT_NAME apply(STRUCT_NAME<F_other>& other, Function&& f) const { return {__VA_ARGS__}; }\
306306
template <template <class> class F_other, class Function>\
307-
constexpr STRUCT_NAME apply(const STRUCT_NAME<F_other>& other, Function&& f) { return {__VA_ARGS__}; }\
307+
__attribute__((flatten)) constexpr STRUCT_NAME apply(const STRUCT_NAME<F_other>& other, Function&& f) { return {__VA_ARGS__}; }\
308308
template <template <class> class F_other, class Function>\
309-
constexpr STRUCT_NAME apply(const STRUCT_NAME<F_other>& other, Function&& f) const { return {__VA_ARGS__}; }\
309+
__attribute__((flatten)) constexpr STRUCT_NAME apply(const STRUCT_NAME<F_other>& other, Function&& f) const { return {__VA_ARGS__}; }\
310310

311311
#endif // MEMLAYOUT_H

0 commit comments

Comments
 (0)