Skip to content

Commit d6c7576

Browse files
merrymeerkat, copybara-github
authored and committed
internal change
PiperOrigin-RevId: 879546918
1 parent 8d9b992 commit d6c7576

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

gemma/flash_attention.cc

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -944,8 +944,8 @@ static HWY_INLINE void QDotKTilexUpTo8TransposedKDoubleWidth(
944944
for (size_t i = 0; i < qkv_dim; ++i) {
945945
VQ_T k_vec1, k_vec2;
946946
if constexpr (HWY_TARGET == HWY_AVX2) {
947-
hwy::Prefetch(k_transposed_span.ptr + (i + 3) * gcpp::KVCache::kTileSize);
948-
hwy::Prefetch(k_transposed_span.ptr + (i + 4) * gcpp::KVCache::kTileSize);
947+
hwy::Prefetch(k_transposed_span.ptr +
948+
(i + 20) * gcpp::KVCache::kTileSize);
949949
}
950950
Decompress2(df, k_transposed_span, i * gcpp::KVCache::kTileSize, k_vec1,
951951
k_vec2);

0 commit comments

Comments
 (0)