Skip to content

Commit 8de69c9

Browse files
committed
Update fattn.cu
1 parent 9b72584 commit 8de69c9

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

ggml/src/ggml-cuda/fattn.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -471,7 +471,7 @@ static best_fattn_kernel ggml_cuda_get_best_fattn_kernel(const int device, const
471 471   case GGML_TYPE_Q4_0:
472 472   case GGML_TYPE_Q8_0:
473 473   #ifdef GGML_CUDA_FA_ALL_QUANTS
474     - if (K->ne[0] != 128 && K->ne[0] != 64) {
    474 + if (K->ne[0] != 256 && K->ne[0] != 128 && K->ne[0] != 64) {
475 475   return BEST_FATTN_KERNEL_NONE;
476 476   }
477 477   #else
@@ -492,7 +492,7 @@ static best_fattn_kernel ggml_cuda_get_best_fattn_kernel(const int device, const
492 492   case GGML_TYPE_Q5_1:
493 493   case GGML_TYPE_Q4_0:
494 494   case GGML_TYPE_Q8_0:
495     - if (K->ne[0] != 128) {
    495 + if (K->ne[0] != 256 && K->ne[0] != 128) {
496 496   return BEST_FATTN_KERNEL_NONE;
497 497   }
498 498   break;

0 commit comments

Comments
 (0)