We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ed94d7e, commit dc6d76d (Copy full SHA for dc6d76d)
1 file changed
benchmarks/gptoss_fp4_h100_docker.sh
@@ -29,7 +29,7 @@ vllm serve $MODEL --host=0.0.0.0 --port=$PORT \
29
--gpu-memory-utilization=0.9 \
30
--tensor-parallel-size=$TP \
31
--max-num-seqs=$CONC \
32
---disable-log-requests > $SERVER_LOG 2>&1 &
+--disable-log-requests
33
34
set +x
35
until curl --output /dev/null --silent --head --fail http://localhost:$PORT/health; do
0 commit comments