File tree Expand file tree Collapse file tree
modelopt/torch/quantization/plugins Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -576,22 +576,23 @@ def top_k(self, value):
576576except ImportError :
577577 pass
578578
579- try :
580- from transformers .models .qwen3_omni_moe .modeling_qwen3_omni_moe import (
581- Qwen3OmniMoeTalkerTextSparseMoeBlock ,
582- Qwen3OmniMoeThinkerTextSparseMoeBlock ,
583- )
584-
585- if Qwen3OmniMoeTalkerTextSparseMoeBlock not in QuantModuleRegistry :
586- QuantModuleRegistry .register (
587- {Qwen3OmniMoeTalkerTextSparseMoeBlock : "hf.Qwen3OmniMoeTalkerTextSparseMoeBlock" }
588- )(_QuantSparseMoe )
589- if Qwen3OmniMoeThinkerTextSparseMoeBlock not in QuantModuleRegistry :
590- QuantModuleRegistry .register (
591- {Qwen3OmniMoeThinkerTextSparseMoeBlock : "hf.Qwen3OmniMoeThinkerTextSparseMoeBlock" }
592- )(_QuantSparseMoe )
593- except ImportError :
594- pass
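579+ # Qwen3-Omni MoE registration is disabled by default. Uncomment the block below to register the Talker/Thinker sparse MoE blocks with _QuantSparseMoe so that tokens are forwarded to all MoE experts for full calibration.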
580+ # try:
581+ # from transformers.models.qwen3_omni_moe.modeling_qwen3_omni_moe import (
582+ # Qwen3OmniMoeTalkerTextSparseMoeBlock,
583+ # Qwen3OmniMoeThinkerTextSparseMoeBlock,
584+ # )
585+
586+ # if Qwen3OmniMoeTalkerTextSparseMoeBlock not in QuantModuleRegistry:
587+ # QuantModuleRegistry.register(
588+ # {Qwen3OmniMoeTalkerTextSparseMoeBlock: "hf.Qwen3OmniMoeTalkerTextSparseMoeBlock"}
589+ # )(_QuantSparseMoe)
590+ # if Qwen3OmniMoeThinkerTextSparseMoeBlock not in QuantModuleRegistry:
591+ # QuantModuleRegistry.register(
592+ # {Qwen3OmniMoeThinkerTextSparseMoeBlock: "hf.Qwen3OmniMoeThinkerTextSparseMoeBlock"}
593+ # )(_QuantSparseMoe)
594+ # except ImportError:
595+ # pass
595596
596597
597598class _QuantGptOssExperts (_QuantFunctionalMixin ):
You can’t perform that action at this time.
0 commit comments