Skip to content

Commit 9f1ab8c

Browse files
committed
code check
1 parent 360847d commit 9f1ab8c

1 file changed

Lines changed: 5 additions & 5 deletions

File tree

fastdeploy/model_executor/layers/moe/fused_moe_cutlass_backend.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -94,11 +94,11 @@ def compute_ffn(
94 94
Paddle Cutlass compute Fused MoE.
95 95
"""
96 96
if fastdeploy.envs.FD_USE_PHI_MOE_PERMUTE:
97-
out = deep_batch_gemm(permute_input, getattr(layer, self.added_weight_attrs[0]), expert_idx_per_token)
98-
out = paddle.nn.functional.swiglu(out)
99-
ffn_out_without_down_proj_bias = deep_batch_gemm(
100-
out, getattr(layer, self.added_weight_attrs[1]), expert_idx_per_token
101-
)
97+
out = deep_batch_gemm(permute_input, getattr(layer, self.added_weight_attrs[0]), expert_idx_per_token)
98+
out = paddle.nn.functional.swiglu(out)
99+
ffn_out_without_down_proj_bias = deep_batch_gemm(
100+
out, getattr(layer, self.added_weight_attrs[1]), expert_idx_per_token
101+
)
102 102
else:
103 103
ffn_out_without_down_proj_bias = fastdeploy.model_executor.ops.gpu.moe_expert_ffn(
104 104
permute_input,

0 commit comments

Comments (0)