We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 533d354 commit f41bd71 (Copy full SHA for f41bd71)
1 file changed
benchmarks/gptoss_fp4_h100_docker.sh
@@ -31,13 +31,12 @@ vllm serve $MODEL --host=0.0.0.0 --port=$PORT \
31
--max-num-seqs=$CONC \
32
--disable-log-requests 2>&1 | tee $(mktemp /tmp/server-XXXXXX.log) &
33
34
+# Show server logs until the server is up, then stop showing them
35
VLLM_PID=$!
36
set +x
-
37
until curl --output /dev/null --silent --fail http://localhost:$PORT/health; do
38
sleep 5
39
done
40
41
pkill -P $$ tee 2>/dev/null
42
43
pip install -q datasets pandas
0 commit comments