Skip to content

Commit 1d92a47

Browse files
committed
cleaning up mi355x
1 parent 51d4fe3 commit 1d92a47

2 files changed

Lines changed: 9 additions & 52 deletions

File tree

benchmarks/gptoss_fp4_mi355x_docker.sh

Lines changed: 9 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,8 @@ export VLLM_USE_AITER_UNIFIED_ATTENTION=1
2222
export VLLM_ROCM_USE_AITER_MHA=0
2323
export VLLM_ROCM_USE_AITER_FUSED_MOE_A16W4=1
2424

25+
SERVER_LOG=$(mktemp /tmp/server-XXXXXX.log)
26+
2527
set -x
2628
vllm serve $MODEL --port $PORT \
2729
--tensor-parallel-size=$TP \
@@ -32,18 +34,20 @@ vllm serve $MODEL --port $PORT \
3234
--block-size=64 \
3335
--no-enable-prefix-caching \
3436
--disable-log-requests \
35-
--async-scheduling | tee $(mktemp /tmp/server-XXXXXX.log) &
37+
--async-scheduling > $SERVER_LOG 2>&1 &
3638

37-
# Show server logs til' it is up, then stop showing
39+
# Show logs until server is ready
40+
tail -f $SERVER_LOG &
41+
TAIL_PID=$!
3842
set +x
39-
until curl --output /dev/null --silent --fail http://localhost:$PORT/health; do
43+
until curl --output /dev/null --silent --fail http://0.0.0.0:$PORT/health; do
4044
sleep 5
4145
done
42-
pkill -P $$ tee 2>/dev/null
46+
kill $TAIL_PID
4347

48+
set -x
4449
BENCH_SERVING_DIR=$(mktemp -d /tmp/bmk-XXXXXX)
4550
git clone https://github.com/kimbochen/bench_serving.git $BENCH_SERVING_DIR
46-
set -x
4751
python3 $BENCH_SERVING_DIR/benchmark_serving.py \
4852
--model=$MODEL --backend=vllm --base-url="http://localhost:$PORT" \
4953
--dataset-name=random \

runners/launch_mi355x-amd.sh

Lines changed: 0 additions & 47 deletions
Original file line numberDiff line numberDiff line change
@@ -17,11 +17,7 @@
1717
HF_HUB_CACHE_MOUNT="/nfsdata/hf_hub_cache-1/" # Temp solution
1818
PORT=8888
1919

20-
# network_name="bmk-net"
2120
server_name="bmk-server"
22-
# client_name="bmk-client"
23-
24-
# docker network create $network_name
2521

2622
set -x
2723
docker run --rm --ipc=host --shm-size=16g --network=host --name=$server_name \
@@ -35,50 +31,7 @@ docker run --rm --ipc=host --shm-size=16g --network=host --name=$server_name \
3531
$IMAGE \
3632
benchmarks/"${EXP_NAME%%_*}_${PRECISION}_mi355x_docker.sh"
3733

38-
# set +x
39-
# while IFS= read -r line; do
40-
# printf '%s\n' "$line"
41-
# if [[ "$line" =~ Application\ startup\ complete ]]; then
42-
# break
43-
# fi
44-
# done < <(docker logs -f --tail=0 $server_name 2>&1)
45-
46-
# if [[ "$MODEL" == "amd/DeepSeek-R1-0528-MXFP4-Preview" || "$MODEL" == "deepseek-ai/DeepSeek-R1-0528" ]]; then
47-
# if [[ "$OSL" == "8192" ]]; then
48-
# NUM_PROMPTS=$(( CONC * 20 ))
49-
# else
50-
# NUM_PROMPTS=$(( CONC * 50 ))
51-
# fi
52-
# else
53-
# NUM_PROMPTS=$(( CONC * 10 ))
54-
# fi
55-
56-
# git clone https://github.com/kimbochen/bench_serving.git
57-
58-
# set -x
59-
# docker run --rm --network=$network_name --name=$client_name \
60-
# -v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
61-
# -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
62-
# --entrypoint=python3 \
63-
# $IMAGE \
64-
# bench_serving/benchmark_serving.py \
65-
# --model=$MODEL --backend=vllm --base-url="http://$server_name:$PORT" \
66-
# --dataset-name=random \
67-
# --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
68-
# --num-prompts=$NUM_PROMPTS \
69-
# --max-concurrency=$CONC \
70-
# --request-rate=inf --ignore-eos \
71-
# --save-result --percentile-metrics="ttft,tpot,itl,e2el" \
72-
# --result-dir=/workspace/ --result-filename=$RESULT_FILENAME.json
73-
7434
if ls gpucore.* 1> /dev/null 2>&1; then
7535
echo "gpucore files exist. not good"
7636
rm -f gpucore.*
7737
fi
78-
79-
80-
# while [ -n "$(docker ps -aq)" ]; do
81-
# docker stop $server_name
82-
# # docker network rm $network_name
83-
# sleep 5
84-
# done

0 commit comments

Comments
 (0)