We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c850500 commit 7f6cc4bCopy full SHA for 7f6cc4b
1 file changed
src/transformers/models/gemma4/configuration_gemma4.py
@@ -132,6 +132,9 @@ class Gemma4TextConfig(PreTrainedConfig):
132
"layers.*.mlp.gate_proj": "colwise",
133
"layers.*.mlp.up_proj": "colwise",
134
"layers.*.mlp.down_proj": "rowwise",
135
+ "layers.*.experts.gate_up_proj": "packed_colwise",
136
+ "layers.*.experts.down_proj": "rowwise",
137
+ "layers.*.experts": "moe_tp_experts",
138
}
139
base_model_pp_plan = {
140
"embed_tokens": (["input_ids"], ["inputs_embeds"]),
0 commit comments