We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3ce54ef, commit 2e3262c (Copy full SHA for 2e3262c)
1 file changed
tests/e2e/benchmarking/bm_qwen3_coder.sh
@@ -140,6 +140,8 @@ start_time=$(date +%s)
140
# If needed, replace "--async-scheduling" with "--no-async-scheduling"
141
export USE_MOE_EP_KERNEL=${use_moe_ep_kernel}
142
export MODEL_IMPL_TYPE=vllm
143
+# TODO: Remove this once batched rpa is the default
144
+export USE_BATCHED_RPA_KERNEL=1
145
146
echo "bench_serving commit: $(git -C bench_serving rev-parse HEAD)"
147
0 commit comments