File tree Expand file tree Collapse file tree 1 file changed +6
-6
lines changed
modelopt/torch/quantization Expand file tree Collapse file tree 1 file changed +6
-6
lines changed Original file line number Diff line number Diff line change 163163}
164164
165165_mamba_moe_disabled_quantizer_cfg = {
166- "*fc1_latent_proj*" : {"enable" : False }, # Skip Latent MOE
167- "*fc2_latent_proj*" : {"enable" : False }, # Skip Latent MOE
168- "*q_proj*" : {"enable" : False }, # Skip QKV Linear
169- "*k_proj*" : {"enable" : False }, # Skip QKV Linear
170- "*v_proj*" : {"enable" : False }, # Skip QKV Linear
171- "*o_proj*" : {"enable" : False }, # Skip QKV Output Projection
166+ "*fc1_latent_proj*" : {"enable" : False }, # Skip Latent MOE
167+ "*fc2_latent_proj*" : {"enable" : False }, # Skip Latent MOE
168+ "*q_proj*" : {"enable" : False }, # Skip QKV Linear
169+ "*k_proj*" : {"enable" : False }, # Skip QKV Linear
170+ "*v_proj*" : {"enable" : False }, # Skip QKV Linear
171+ "*o_proj*" : {"enable" : False }, # Skip QKV Output Projection
172172}
173173
174174INT8_DEFAULT_CFG = {
You can’t perform that action at this time.
0 commit comments