We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e490b85 · commit 93c4138 · Copy full SHA for 93c4138
1 file changed
examples/llm_ptq/hf_ptq.py
@@ -1418,7 +1418,9 @@ def parse_args() -> argparse.Namespace:
1418
help=(
1419
"Routed MoE expert active ratio for --auto_quantize_cost_model active_moe. "
1420
"For top-k MoE this is top_k / num_experts. If omitted, common model config "
1421
- "fields such as num_experts_per_tok and num_experts are used when available."
+ "fields such as num_experts_per_tok and num_experts are used when available. "
1422
+ "This only affects AutoQuant cost accounting and does not change calibration "
1423
+ "routing; use --moe_calib_experts_ratio to control calibration expert coverage."
1424
),
1425
)
1426
parser.add_argument(
0 commit comments