@@ -5,52 +5,16 @@ sudo sh -c 'echo 0 > /proc/sys/kernel/numa_balancing'
55HF_HUB_CACHE_MOUNT=" /shareddata/hf_hub_cache_$( hostname) /"
66PORT=8888
77
8- network_name=" bmk-net"
98server_name=" bmk-server"
10- client_name=" bmk-client"
11-
12- docker network create $network_name
139
1410set -x
15- docker run --rm -d -- ipc=host --shm-size=16g --network= $network_name --name=$server_name \
11+ docker run --rm -- ipc=host --shm-size=16g --name=$server_name \
1612--privileged --cap-add=CAP_SYS_ADMIN --device=/dev/kfd --device=/dev/dri --device=/dev/mem \
1713--cap-add=SYS_PTRACE --security-opt seccomp=unconfined \
1814-v $HF_HUB_CACHE_MOUNT :$HF_HUB_CACHE \
1915-v $GITHUB_WORKSPACE :/workspace/ -w /workspace/ \
2016-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e PORT=$PORT \
21- -e ISL -e OSL \
17+ -e ISL -e OSL -e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RANDOM_RANGE_RATIO -e RESULT_FILENAME \
2218--entrypoint=/bin/bash \
2319$IMAGE \
2420benchmarks/" ${EXP_NAME%% _* } _${PRECISION} _mi300x_docker.sh"
25-
26- set +x
27- while IFS= read -r line; do
28- printf ' %s\n' " $line "
29- if [[ " $line " =~ Application\ startup\ complete ]]; then
30- break
31- fi
32- done < <( docker logs -f --tail=0 $server_name 2>&1 )
33-
34- git clone https://github.com/kimbochen/bench_serving.git
35-
36- set -x
37- docker run --rm --network=$network_name --name=$client_name \
38- -v $GITHUB_WORKSPACE :/workspace/ -w /workspace/ \
39- -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
40- --entrypoint=python3 \
41- $IMAGE \
42- bench_serving/benchmark_serving.py \
43- --model=$MODEL --backend=vllm --base-url=http://$server_name :$PORT \
44- --dataset-name=random \
45- --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
46- --num-prompts=$(( $CONC * 10 )) \
47- --max-concurrency=$CONC \
48- --request-rate=inf --ignore-eos \
49- --save-result --percentile-metrics=" ttft,tpot,itl,e2el" \
50- --result-dir=/workspace/ --result-filename=$RESULT_FILENAME .json
51-
52- while [ -n " $( docker ps -aq) " ]; do
53- docker stop $server_name
54- docker network rm $network_name
55- sleep 5
56- done
0 commit comments