File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -638,8 +638,16 @@ void ggml_cuda_op_kvarn_store(ggml_backend_cuda_context & ctx, ggml_tensor * dst
638638 const size_t smpbo = ggml_cuda_info ().devices [ctx.device ].smpbo ;
639639
640640 if (!force_low_shmem && smpbo >= KVAR_N_SHARED_BYTES ) {
641- #if !defined(GGML_USE_MUSA)
642- CUDA_CHECK (cudaFuncSetAttribute (reinterpret_cast <const void *>(kvarn_store_kernel_hishmem), cudaFuncAttributeMaxDynamicSharedMemorySize, KVAR_N_SHARED_BYTES ));
641+ #if defined(GGML_USE_HIP)
642+ CUDA_CHECK (hipFuncSetAttribute (
643+ reinterpret_cast <const void *>(&kvarn_store_kernel_hishmem),
644+ hipFuncAttributeMaxDynamicSharedMemorySize,
645+ KVAR_N_SHARED_BYTES ));
646+ #elif !defined(GGML_USE_MUSA)
647+ CUDA_CHECK (cudaFuncSetAttribute (
648+ kvarn_store_kernel_hishmem,
649+ cudaFuncAttributeMaxDynamicSharedMemorySize,
650+ KVAR_N_SHARED_BYTES ));
643651#endif
644652 kvarn_store_kernel_hishmem<<<current->ne[1 ], KVAR_N_DIM , KVAR_N_SHARED_BYTES , ctx.stream()>>> (
645653 (const float *) current->data ,
You can’t perform that action at this time.
0 commit comments