We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents a470d47 + 5bdbd31 · commit e0706e6 (Copy full SHA for e0706e6)
2 files changed
benchmarks/dsr1_fp4_mi355x_docker.sh
@@ -11,6 +11,7 @@
11
# RESULT_FILENAME
12
# NUM_PROMPTS
13
export SGLANG_USE_AITER=1
14
+export ROCM_QUICK_REDUCE_QUANTIZATION=INT4
15
16
PREFILL_SIZE=196608
17
if [[ "$ISL" == "8192" && "$OSL" == "1024" ]]; then
benchmarks/dsr1_fp4_mi355x_slurm.sh
@@ -10,6 +10,7 @@
10
# RANDOM_RANGE_RATIO
SERVER_LOG=$(mktemp /tmp/server-XXXXXX.log)
0 commit comments