Skip to content

Commit e22622f

Browse files
[TILE ENGINE] Restructure to Base class of GEMM (#3434)
1 parent 0fd2b2f commit e22622f

41 files changed

Lines changed: 2243 additions & 3455 deletions

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

Jenkinsfile

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -1637,18 +1637,18 @@ pipeline {
16371637
-D CMAKE_CXX_COMPILER="${params.BUILD_COMPILER}" \
16381638
-D CMAKE_BUILD_TYPE=Release \
16391639
-D GPU_TARGETS="gfx90a" \
1640-
-D GEMM_DATATYPE="fp8;fp16" \
1641-
-D GEMM_LAYOUT="rcr;rrr;crr;ccr" \
1640+
-D GEMM_UNIVERSAL_DATATYPE="fp8;fp16" \
1641+
-D GEMM_UNIVERSAL_LAYOUT="rcr;rrr;crr;ccr" \
16421642
-D GEMM_STREAMK_DATATYPE="fp8;fp16" \
16431643
-D GEMM_STREAMK_LAYOUT="rcr" \
16441644
-D GEMM_MULTI_D_DATATYPE="fp16" \
16451645
-D GEMM_MULTI_D_LAYOUT="rcrr;rrrr;crrr;ccrr" \
16461646
-D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
16471647
-D GEMM_PRESHUFFLE_LAYOUT="rcr" .. && \
1648-
ninja -j64 benchmark_gemm_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1649-
python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1650-
python3 ../tile_engine/ops/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1651-
python3 ../tile_engine/ops/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1648+
ninja -j${nthreads()} benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1649+
python3 ../tile_engine/ops/gemm/gemm_universal/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1650+
python3 ../tile_engine/ops/gemm/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1651+
python3 ../tile_engine/ops/gemm/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
16521652
}
16531653
steps{
16541654
buildHipClangJobAndReboot(setup_args:setup_args, build_type: 'Release', execute_cmd: execute_args)
@@ -1668,18 +1668,18 @@ pipeline {
16681668
-D CMAKE_CXX_COMPILER="${params.BUILD_COMPILER}" \
16691669
-D CMAKE_BUILD_TYPE=Release \
16701670
-D GPU_TARGETS="gfx942" \
1671-
-D GEMM_DATATYPE="fp8;fp16" \
1672-
-D GEMM_LAYOUT="rcr;rrr;crr;ccr" \
1671+
-D GEMM_UNIVERSAL_DATATYPE="fp8;fp16" \
1672+
-D GEMM_UNIVERSAL_LAYOUT="rcr;rrr;crr;ccr" \
16731673
-D GEMM_STREAMK_DATATYPE="fp8;fp16" \
16741674
-D GEMM_STREAMK_LAYOUT="rcr" \
16751675
-D GEMM_MULTI_D_DATATYPE="fp16" \
16761676
-D GEMM_MULTI_D_LAYOUT="rcrr;rrrr;crrr;ccrr" \
16771677
-D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
16781678
-D GEMM_PRESHUFFLE_LAYOUT="rcr" .. && \
1679-
ninja -j64 benchmark_gemm_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1680-
python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1681-
python3 ../tile_engine/ops/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1682-
python3 ../tile_engine/ops/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1679+
ninja -j${nthreads()} benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1680+
python3 ../tile_engine/ops/gemm/gemm_universal/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1681+
python3 ../tile_engine/ops/gemm/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1682+
python3 ../tile_engine/ops/gemm/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
16831683
}
16841684
steps{
16851685
buildHipClangJobAndReboot(setup_args:setup_args, build_type: 'Release', execute_cmd: execute_args)
@@ -1699,10 +1699,10 @@ pipeline {
16991699
-D CMAKE_CXX_COMPILER="${params.BUILD_COMPILER}" \
17001700
-D CMAKE_BUILD_TYPE=Release \
17011701
-D GPU_TARGETS="gfx1201" \
1702-
-D GEMM_DATATYPE="fp16" \
1703-
-D GEMM_LAYOUT="rcr;rrr;crr;ccr" .. && \
1704-
ninja -j64 benchmark_gemm_all && \
1705-
python3 ../tile_engine/ops/gemm/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1702+
-D GEMM_UNIVERSAL_DATATYPE="fp16" \
1703+
-D GEMM_UNIVERSAL_LAYOUT="rcr;rrr;crr;ccr" .. && \
1704+
ninja -j${nthreads()} benchmark_gemm_universal_all && \
1705+
python3 ../tile_engine/ops/gemm/gemm_universal/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
17061706
}
17071707
steps{
17081708
buildHipClangJobAndReboot(setup_args:setup_args, build_type: 'Release', execute_cmd: execute_args)

tile_engine/CMakeLists.txt

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,4 +5,6 @@ include_directories(BEFORE
55
${CMAKE_CURRENT_LIST_DIR}/include
66
)
77

8-
add_subdirectory(ops)
8+
add_subdirectory(ops/gemm)
9+
add_subdirectory(ops/gemm_streamk)
10+

tile_engine/ops/CMakeLists.txt

Lines changed: 0 additions & 7 deletions
This file was deleted.

tile_engine/ops/commons/test_benchmark.sh

Lines changed: 0 additions & 105 deletions
This file was deleted.

tile_engine/ops/commons/test_validation.py

Lines changed: 0 additions & 144 deletions
This file was deleted.

0 commit comments

Comments (0)