File tree Expand file tree Collapse file tree
gptqmodel/models/definitions
Original file line number | Diff line number | Diff line change
44# Contact: qubitium@modelcloud.ai, x.com/qubitium
55
66from ..base import BaseQModel
7- from ..moe_lifecycle import GateUpDownMoELifecycleHooks
7+ from ..moe_lifecycle import W1W3W2MoELifecycleHooks
88
99
1010class MiniMaxM2GPTQ (BaseQModel ):
@@ -21,8 +21,8 @@ class MiniMaxM2GPTQ(BaseQModel):
2121
2222 dynamic_expert_index = "num_local_experts"
2323
24- # MoE lifecycle hooks for gate_proj/up_proj/down_proj pattern
25- moe_lifecycle_hooks = GateUpDownMoELifecycleHooks ()
24+ # MoE lifecycle hooks for w1/w3/w2 pattern
25+ moe_lifecycle_hooks = W1W3W2MoELifecycleHooks ()
2626
2727 module_tree = [
2828 "model" ,
@@ -39,11 +39,11 @@ class MiniMaxM2GPTQ(BaseQModel):
3939 "o_proj:1" ,
4040 ),
4141 "post_attention_layernorm" : ("post_attention_layernorm:!" ,),
42- "mlp:moe" : { # MoE module
42+ "block_sparse_moe:moe" : { # MoE module
4343 "gate" : ("gate:!" ,),
4444 "e_score_correction_bias" : ("e_score_correction_bias:!" ,),
4545 "experts" : {
46- "#" : ("gate_proj:0" , "up_proj:0" , "down_proj:1" ),
46+ "#" : ("w1:0" , "w3:0" , "w2:1" ),
4747 },
4848 },
4949 },
You can’t perform that action at this time.
0 commit comments