Skip to content

Commit fd73ac7

Browse files
arthw authored and iamwavecut committed
sycl : handle other FA case (ggml-org#21377)
1 parent 3cea813 commit fd73ac7

1 file changed

Lines changed: 10 additions & 0 deletions

File tree

ggml/src/ggml-sycl/fattn-tile.hpp

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1252,6 +1252,16 @@ static void launch_fattn_tile_switch_ncols1(ggml_backend_sycl_context & ctx, ggm
1252 1252
return;
1253 1253
}
1254 1254

1255+
{
1256+
constexpr int cols_per_block = ncols2*2;
1257+
const int nwarps = ggml_sycl_fattn_tile_get_nthreads (DKQ, DV, cols_per_block, cc) / warp_size;
1258+
const int nbatch_fa = ggml_sycl_fattn_tile_get_nbatch_fa(DKQ, DV, cols_per_block, cc);
1259+
launch_fattn<DV, cols_per_block/ncols2, ncols2,
1260+
flash_attn_tile<DKQ, DV, cols_per_block / ncols2, ncols2, use_logit_softcap, warp_size>, warp_size>
1261+
(ctx, dst, nwarps, nbytes_shared, nbatch_fa, true, true, false);
1262+
return;
1263+
}
1264+
1255 1265
GGML_ABORT("fatal error");
1256 1266
}
1257 1267

0 commit comments

Comments
 (0)