Skip to content

Commit 043f2a1

Browse files
authored
support moe for sm103 (PaddlePaddle#7238)
1 parent 757bafe commit 043f2a1

2 files changed

Lines changed: 3 additions & 3 deletions

File tree

custom_ops/gpu_ops/cutlass_kernels/moe_gemm/fused_moe_cutlass_kernel.h

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -635,7 +635,7 @@ struct MoeFCGemm {
635635
static constexpr bool compile_needed =
636636
platform::is_same<KernelArch, arch::Sm75>::value;
637637
KernelRunner<compile_needed>::run_kernel(params, shared_storage);
638-
#elif defined(__CUDA_ARCH__) && (__CUDA_ARCH__ >= 800) && (__CUDA_ARCH__ < 1010)
638+
#elif defined(__CUDA_ARCH__) && (__CUDA_ARCH__ >= 800) && (__CUDA_ARCH__ < 1100)
639639
static constexpr bool compile_needed =
640640
platform::is_same<KernelArch, arch::Sm80>::value;
641641
KernelRunner<compile_needed>::run_kernel(params, shared_storage);
@@ -1060,7 +1060,7 @@ struct Wint2xMoeFCGemm : public MoeFCGemm<Mma_,
10601060
CUTLASS_DEVICE
10611061
void operator()(Params const& params,
10621062
SharedStorage& shared_storage) { // NOLINT
1063-
#if defined(__CUDA_ARCH__) && (__CUDA_ARCH__ >= 800) && (__CUDA_ARCH__ < 1010)
1063+
#if defined(__CUDA_ARCH__) && (__CUDA_ARCH__ >= 800) && (__CUDA_ARCH__ < 1100)
10641064
KernelRunner<WintQuantMethod::kWeightOnlyInt2, true>::run_kernel(
10651065
params, shared_storage);
10661066
#else

custom_ops/gpu_ops/cutlass_kernels/moe_gemm/fused_moe_gemm_kernels_template.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -709,7 +709,7 @@ void MoeGemmRunner<T, WeightQuantTraits>::dispatch_to_arch<EpilogueTag>(
709709
dispatch_moe_gemm_to_cutlass_macro(cutlass::arch::Sm70);
710710
} else if (sm_ >= 75 && sm_ < 80) {
711711
dispatch_moe_gemm_to_cutlass_macro(cutlass::arch::Sm75);
712-
} else if (sm_ >= 80 && sm_ < 101) {
712+
} else if (sm_ >= 80 && sm_ < 104) {
713713
dispatch_moe_gemm_to_cutlass_macro(cutlass::arch::Sm80);
714714
} else {
715715
throw std::runtime_error(

0 commit comments

Comments
 (0)