Clarify active MoE AutoQuant ratio

meenchen · meenchen · commit 93c41382d9a8 · 2026-06-01T21:01:29.000-07:00
Signed-off-by: weimingc <17592131+meenchen@users.noreply.github.com>
diff --git a/examples/llm_ptq/hf_ptq.py b/examples/llm_ptq/hf_ptq.py
@@ -1418,7 +1418,9 @@ def parse_args() -> argparse.Namespace:
         help=(
             "Routed MoE expert active ratio for --auto_quantize_cost_model active_moe. "
             "For top-k MoE this is top_k / num_experts. If omitted, common model config "
-            "fields such as num_experts_per_tok and num_experts are used when available."
+            "fields such as num_experts_per_tok and num_experts are used when available. "
+            "This only affects AutoQuant cost accounting and does not change calibration "
+            "routing; use --moe_calib_experts_ratio to control calibration expert coverage."
         ),
     )
     parser.add_argument(