We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent efbee87 commit a2b9861 Copy full SHA for a2b9861
1 file changed
src/maxtext/configs/inference/vllm.yml
@@ -70,6 +70,8 @@ logical_axis_rules: [
70
['kv', []],
71
['embed', ['expert', 'attn_dp_expert']],
72
['embed', ['attn_dp_expert']],
73
+ ['embed_moe', ['expert', 'attn_dp_expert']],
74
+ ['embed_moe', ['attn_dp_expert']],
75
['embed_tensor_transpose', ['attn_dp', 'model']],
76
['embed_no_exp', []],
77
['embed_no_exp_moe', []],
0 commit comments