We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 1e11c9b, commit 8f1b28c (Copy full SHA for 8f1b28c)
modelopt/torch/quantization/plugins/vllm.py
@@ -336,7 +336,7 @@ def _setup(self):
336
self.parallel_state = create_parallel_state()
337
338
if getattr(self, "invoke_fused_moe_kernel_func", None) is None: # pragma: no cover
339
- for name in ("invoke_fused_moe_kernel", "invoke_fused_moe_triton_kernel"):
+ for name in ("invoke_fused_moe_kernel", "dispatch_fused_moe_kernel"):
340
if hasattr(vllm_fused_moe_package, name):
341
self.invoke_fused_moe_kernel_func = name
342
break
0 commit comments