@@ -1637,18 +1637,18 @@ pipeline {
16371637 -D CMAKE_CXX_COMPILER="${ params.BUILD_COMPILER} " \
16381638 -D CMAKE_BUILD_TYPE=Release \
16391639 -D GPU_TARGETS="gfx90a" \
1640- -D GEMM_DATATYPE ="fp8;fp16" \
1641- -D GEMM_LAYOUT ="rcr;rrr;crr;ccr" \
1640+ -D GEMM_UNIVERSAL_DATATYPE ="fp8;fp16" \
1641+ -D GEMM_UNIVERSAL_LAYOUT ="rcr;rrr;crr;ccr" \
16421642 -D GEMM_STREAMK_DATATYPE="fp8;fp16" \
16431643 -D GEMM_STREAMK_LAYOUT="rcr" \
16441644 -D GEMM_MULTI_D_DATATYPE="fp16" \
16451645 -D GEMM_MULTI_D_LAYOUT="rcrr;rrrr;crrr;ccrr" \
16461646 -D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
16471647 -D GEMM_PRESHUFFLE_LAYOUT="rcr" .. && \
1648- ninja -j64 benchmark_gemm_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1649- python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1650- python3 ../tile_engine/ops/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1651- python3 ../tile_engine/ops/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1648+ ninja -j ${ nthreads() } benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1649+ python3 ../tile_engine/ops/gemm/gemm_universal/ gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1650+ python3 ../tile_engine/ops/gemm/ gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1651+ python3 ../tile_engine/ops/gemm/ gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
16521652 }
16531653 steps{
16541654 buildHipClangJobAndReboot(setup_args :setup_args, build_type : ' Release' , execute_cmd : execute_args)
@@ -1668,18 +1668,18 @@ pipeline {
16681668 -D CMAKE_CXX_COMPILER="${ params.BUILD_COMPILER} " \
16691669 -D CMAKE_BUILD_TYPE=Release \
16701670 -D GPU_TARGETS="gfx942" \
1671- -D GEMM_DATATYPE ="fp8;fp16" \
1672- -D GEMM_LAYOUT ="rcr;rrr;crr;ccr" \
1671+ -D GEMM_UNIVERSAL_DATATYPE ="fp8;fp16" \
1672+ -D GEMM_UNIVERSAL_LAYOUT ="rcr;rrr;crr;ccr" \
16731673 -D GEMM_STREAMK_DATATYPE="fp8;fp16" \
16741674 -D GEMM_STREAMK_LAYOUT="rcr" \
16751675 -D GEMM_MULTI_D_DATATYPE="fp16" \
16761676 -D GEMM_MULTI_D_LAYOUT="rcrr;rrrr;crrr;ccrr" \
16771677 -D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
16781678 -D GEMM_PRESHUFFLE_LAYOUT="rcr" .. && \
1679- ninja -j64 benchmark_gemm_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1680- python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1681- python3 ../tile_engine/ops/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1682- python3 ../tile_engine/ops/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1679+ ninja -j ${ nthreads() } benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1680+ python3 ../tile_engine/ops/gemm/gemm_universal/ gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1681+ python3 ../tile_engine/ops/gemm/ gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1682+ python3 ../tile_engine/ops/gemm/ gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
16831683 }
16841684 steps{
16851685 buildHipClangJobAndReboot(setup_args :setup_args, build_type : ' Release' , execute_cmd : execute_args)
@@ -1699,10 +1699,10 @@ pipeline {
16991699 -D CMAKE_CXX_COMPILER="${ params.BUILD_COMPILER} " \
17001700 -D CMAKE_BUILD_TYPE=Release \
17011701 -D GPU_TARGETS="gfx1201" \
1702- -D GEMM_DATATYPE ="fp16" \
1703- -D GEMM_LAYOUT ="rcr;rrr;crr;ccr" .. && \
1704- ninja -j64 benchmark_gemm_all && \
1705- python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1702+ -D GEMM_UNIVERSAL_DATATYPE ="fp16" \
1703+ -D GEMM_UNIVERSAL_LAYOUT ="rcr;rrr;crr;ccr" .. && \
1704+ ninja -j ${ nthreads() } benchmark_gemm_universal_all && \
1705+ python3 ../tile_engine/ops/gemm/gemm_universal/ gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
17061706 }
17071707 steps{
17081708 buildHipClangJobAndReboot(setup_args :setup_args, build_type : ' Release' , execute_cmd : execute_args)
0 commit comments