Skip to content

Commit c9911ff

Browse files
authored
Merge pull request #80 from ROCm/revert_trload_dispatch
Revert "Avoid to use qr_ks_vs_tr_load_async pipeline for MTile <= 64 …
2 parents 5f0419a + 112cb18 commit c9911ff

2 files changed

Lines changed: 2 additions & 4 deletions

File tree

xformers/csrc/attention/hip_fmha/ck_tiled_fmha_batched_infer_dispatch.h

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -160,8 +160,7 @@ struct batched_infer_mask_bias_dropout_dispatch {
160160
}
161161
} else {
162162
// use qr_async_trload pipeline if seqlen <= switch_seqlen_threshold
163-
// for MTile <= 64, qr_ks_vs_whole_k_prefetch gives better performance
164-
if constexpr (MaxK == 128 && MTile > 64) {
163+
if constexpr (MaxK == 128) {
165164
using FmhaTraits = ck_tile::TileFmhaTraits<
166165
false, // kPadSeqLenQ,
167166
false, // kPadSeqLenK,

xformers/csrc/attention/hip_fmha/ck_tiled_fmha_grouped_infer_dispatch.h

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -160,8 +160,7 @@ struct grouped_infer_mask_bias_dropout_dispatch {
160160
}
161161
} else {
162162
// use qr_async_trload pipeline if seqlen <= switch_seqlen_threshold
163-
// for MTile <= 64, qr_ks_vs_whole_k_prefetch gives better performance
164-
if constexpr (MaxK == 128 && MTile > 64) {
163+
if constexpr (MaxK == 128) {
165164
using FmhaTraits = ck_tile::TileFmhaTraits<
166165
false, // kPadSeqLenQ,
167166
false, // kPadSeqLenK,

0 commit comments

Comments
 (0)