@@ -574,6 +574,8 @@ def cmake_build(Map conf=[:]){
574574 def setup_cmd
575575 def build_cmd
576576 def execute_cmd = conf. get(" execute_cmd" , " " )
577+ // resolve the node's GPU architecture once; arch_name is reused below in the build-trace, analysis-log and package artifact names
578+ def arch_name = check_arch_name()
577579 if (! setup_args. contains(" NO_CK_BUILD" )){
578580 if (params. NINJA_BUILD_TRACE ) {
579581 echo " running ninja build trace"
@@ -646,15 +648,15 @@ def cmake_build(Map conf=[:]){
646648
647649 // run tests except when NO_CK_BUILD or BUILD_LEGACY_OS are set
648650 if (! setup_args. contains(" NO_CK_BUILD" ) && ! params. BUILD_LEGACY_OS ){
649- sh " python3 ../script/ninja_json_converter.py .ninja_log --legacy-format --output ck_build_trace_${ check_arch_name() } .json"
650- archiveArtifacts " ck_build_trace_${ check_arch_name() } .json"
651- sh " python3 ../script/parse_ninja_trace.py ck_build_trace_${ check_arch_name() } .json"
651+ sh " python3 ../script/ninja_json_converter.py .ninja_log --legacy-format --output ck_build_trace_${ arch_name } .json"
652+ archiveArtifacts " ck_build_trace_${ arch_name } .json"
653+ sh " python3 ../script/parse_ninja_trace.py ck_build_trace_${ arch_name } .json"
652654 if (params. NINJA_BUILD_TRACE || params. BUILD_INSTANCES_ONLY ){
653655 if (params. NINJA_FTIME_TRACE ) {
654656 echo " running ClangBuildAnalyzer"
655657 sh " /ClangBuildAnalyzer/build/ClangBuildAnalyzer --all . clang_build.log"
656- sh " /ClangBuildAnalyzer/build/ClangBuildAnalyzer --analyze clang_build.log > clang_build_analysis_${ check_arch_name() } .log"
657- archiveArtifacts " clang_build_analysis_${ check_arch_name() } .log"
658+ sh " /ClangBuildAnalyzer/build/ClangBuildAnalyzer --analyze clang_build.log > clang_build_analysis_${ arch_name } .log"
659+ archiveArtifacts " clang_build_analysis_${ arch_name } .log"
658660 }
659661
660662
@@ -672,8 +674,8 @@ def cmake_build(Map conf=[:]){
672674 if (params. BUILD_PACKAGES ){
673675 echo " Build ckProfiler packages"
674676 sh ' ninja -j64 package'
675- sh " mv composablekernel-ckprofiler_*.deb composablekernel-ckprofiler_1.2.0_amd64_${ check_arch_name() } .deb"
676- stash includes : " composablekernel-ckprofiler**.deb" , name : " profiler_package_${ check_arch_name() } "
677+ sh " mv composablekernel-ckprofiler_*.deb composablekernel-ckprofiler_1.2.0_amd64_${ arch_name } .deb"
678+ stash includes : " composablekernel-ckprofiler**.deb" , name : " profiler_package_${ arch_name } "
677679 }
678680 }
679681 if (params. BUILD_INSTANCES_ONLY ){
@@ -699,16 +701,14 @@ def cmake_build(Map conf=[:]){
699701 if (params. BUILD_PACKAGES ){
700702 echo " Build ckProfiler packages"
701703 sh ' ninja -j64 package'
702- sh " mv composablekernel-ckprofiler_*.deb composablekernel-ckprofiler_1.2.0_amd64_${ check_arch_name() } .deb"
703- stash includes : " composablekernel-ckprofiler**.deb" , name : " profiler_package_${ check_arch_name() } "
704+ sh " mv composablekernel-ckprofiler_*.deb composablekernel-ckprofiler_1.2.0_amd64_${ arch_name } .deb"
705+ stash includes : " composablekernel-ckprofiler**.deb" , name : " profiler_package_${ arch_name } "
704706 }
705707 }
706708 }
707709 }
708710 }
709711
710- // check the node gpu architecture
711- def arch_name = check_arch_name()
712712 if (params. RUN_CK_TILE_FMHA_TESTS ){
713713 try {
714714 archiveArtifacts " perf_fmha_*.log"
@@ -1201,8 +1201,8 @@ pipeline {
12011201 description : " Run the ck_tile FMHA tests (default: OFF)" )
12021202 booleanParam(
12031203 name : " RUN_TILE_ENGINE_BASIC_TESTS" ,
1204- defaultValue : false ,
1205- description : " Run the tile_engine_basic tests (default: OFF )" )
1204+ defaultValue : true ,
1205+ description : " Run the tile_engine_basic tests (default: ON )" )
12061206 booleanParam(
12071207 name : " RUN_TILE_ENGINE_GEMM_TESTS" ,
12081208 defaultValue : false ,
@@ -1650,7 +1650,10 @@ pipeline {
16501650 -D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
16511651 -D GEMM_PRESHUFFLE_LAYOUT="rcr" \
16521652 -D GEMM_PRESHUFFLE_CONFIG_FILE="default_ci_config.json" .. && \
1653- ninja -j${ nthreads()} benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all """
1653+ ninja -j${ nthreads()} benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all && \
1654+ python3 ../tile_engine/ops/gemm/gemm_universal/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1655+ python3 ../tile_engine/ops/gemm/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1656+ python3 ../tile_engine/ops/gemm/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
16541657 }
16551658 steps{
16561659 buildHipClangJobAndReboot(setup_args :setup_args, build_type : ' Release' , execute_cmd : execute_args)
@@ -1667,37 +1670,6 @@ pipeline {
16671670 }
16681671 parallel
16691672 {
1670- stage(" Run TILE_ENGINE_GEMM Tests on gfx90a" )
1671- {
1672- when {
1673- beforeAgent true
1674- expression { params. RUN_TILE_ENGINE_GEMM_TESTS . toBoolean() }
1675- }
1676- agent{ label rocmnode(" gfx90a" ) }
1677- environment{
1678- setup_args = " NO_CK_BUILD"
1679- execute_args = """ cmake -G Ninja -D CMAKE_PREFIX_PATH=/opt/rocm \
1680- -D CMAKE_CXX_COMPILER="${ params.BUILD_COMPILER} " \
1681- -D CMAKE_BUILD_TYPE=Release \
1682- -D GPU_TARGETS="gfx90a" \
1683- -D GEMM_UNIVERSAL_DATATYPE="fp8;fp16" \
1684- -D GEMM_UNIVERSAL_LAYOUT="rcr;rrr;crr;ccr" \
1685- -D GEMM_STREAMK_DATATYPE="fp8;fp16" \
1686- -D GEMM_STREAMK_LAYOUT="rcr" \
1687- -D GEMM_MULTI_D_DATATYPE="fp16" \
1688- -D GEMM_MULTI_D_LAYOUT="rcrr;rrrr;crrr;ccrr" \
1689- -D GEMM_PRESHUFFLE_DATATYPE="fp16;fp8;bf16;bf8" \
1690- -D GEMM_PRESHUFFLE_LAYOUT="rcr" .. && \
1691- ninja -j${ nthreads()} benchmark_gemm_universal_all benchmark_gemm_preshuffle_all benchmark_gemm_multi_d_all benchmark_gemm_streamk_all && \
1692- python3 ../tile_engine/ops/gemm/gemm_universal/gemm_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1693- python3 ../tile_engine/ops/gemm/gemm_preshuffle/gemm_preshuffle_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json && \
1694- python3 ../tile_engine/ops/gemm/gemm_multi_d/gemm_multi_d_benchmark.py . --problem-sizes "1024,1024,1024" --warmup 5 --repeat 5 --verbose --json results.json """
1695- }
1696- steps{
1697- buildHipClangJobAndReboot(setup_args :setup_args, build_type : ' Release' , execute_cmd : execute_args)
1698- cleanWs()
1699- }
1700- }
17011673 stage(" Run TILE_ENGINE_GEMM Tests on gfx942" )
17021674 {
17031675 when {
0 commit comments