Skip to content

Commit a45e569

Browse files
upgrade triton moe config fix.
1 parent fb123b0 commit a45e569

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

fastdeploy/model_executor/layers/moe/fused_moe_triton_backend.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2361,4 +2361,4 @@ def apply_ep_prefill(
2361 | 2361 |       def apply_ep_decode(
2362 | 2362 |           self, layer, x, gate, topk_ids_hookfunc=None, shared_experts=None, fc1_latent_proj=None, fc2_latent_proj=None
2363 | 2363 |       ):
2364 |      | -         return self._apply_ep_no_deepep(layer, x, gate, topk_ids_hookfunc)
     | 2364 | +         raise NotImplementedError("TritonMoEMethod does not support EP decode yet.")

0 commit comments

Comments
 (0)