We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 07d3877 commit 5bdbd31 (Copy full SHA for 5bdbd31)
1 file changed
benchmarks/dsr1_fp4_mi355x_slurm.sh
@@ -10,6 +10,7 @@
10
# RANDOM_RANGE_RATIO
11
# RESULT_FILENAME
12
export SGLANG_USE_AITER=1
13
+export ROCM_QUICK_REDUCE_QUANTIZATION=INT4
14
SERVER_LOG=$(mktemp /tmp/server-XXXXXX.log)
15
16
PREFILL_SIZE=196608
0 commit comments