@@ -4,7 +4,7 @@ HF_HUB_CACHE_MOUNT="/home/ubuntu/hf_hub_cache/"
44PORT=8888
55
66server_name="bmk-server"
7- client_name="bmk-client"
7+ # client_name="bmk-client"
88
99set -x
1010docker run --rm -d --network=host --name=$server_name \
@@ -17,38 +17,38 @@ docker run --rm -d --network=host --name=$server_name \
1717$IMAGE \
1818benchmarks/"${EXP_NAME%%_*}_${PRECISION}_h100_docker.sh"
1919
20- set +x
21- while IFS= read -r line; do
22- printf '%s\n' "$line"
23- if [[ "$line" =~ Application\ startup\ complete ]]; then
24- break
25- fi
26- done < <(docker logs -f --tail=0 $server_name 2>&1)
27-
28- if ! docker ps --format "{{.Names}}" | grep -q "$server_name"; then
29- echo "Server container launch failed."
30- exit 1
31- fi
32-
33- git clone https://github.com/kimbochen/bench_serving.git
34-
35- set -x
36- docker run --rm --network=host --name=$client_name \
37- -v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
38- -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
39- --entrypoint=/bin/bash \
40- $IMAGE \
41- -lc "pip install -q datasets pandas && \
42- python3 bench_serving/benchmark_serving.py \
43- --model=$MODEL \
44- --backend=vllm \
45- --base-url=\"http://localhost:$PORT\" \
46- --dataset-name=random \
47- --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
48- --num-prompts=$(( $CONC * 10 )) --max-concurrency=$CONC \
49- --request-rate=inf --ignore-eos \
50- --save-result --percentile-metrics='ttft,tpot,itl,e2el' \
51- --result-dir=/workspace/ \
52- --result-filename=$RESULT_FILENAME.json"
20+ # set +x
21+ # while IFS= read -r line; do
22+ # printf '%s\n' "$line"
23+ # if [[ "$line" =~ Application\ startup\ complete ]]; then
24+ # break
25+ # fi
26+ # done < <(docker logs -f --tail=0 $server_name 2>&1)
27+
28+ # if ! docker ps --format "{{.Names}}" | grep -q "$server_name"; then
29+ # echo "Server container launch failed."
30+ # exit 1
31+ # fi
32+
33+ # git clone https://github.com/kimbochen/bench_serving.git
34+
35+ # set -x
36+ # docker run --rm --network=host --name=$client_name \
37+ # -v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
38+ # -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
39+ # --entrypoint=/bin/bash \
40+ # $IMAGE \
41+ # -lc "pip install -q datasets pandas && \
42+ # python3 bench_serving/benchmark_serving.py \
43+ # --model=$MODEL \
44+ # --backend=vllm \
45+ # --base-url=\"http://localhost:$PORT\" \
46+ # --dataset-name=random \
47+ # --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
48+ # --num-prompts=$(( $CONC * 10 )) --max-concurrency=$CONC \
49+ # --request-rate=inf --ignore-eos \
50+ # --save-result --percentile-metrics='ttft,tpot,itl,e2el' \
51+ # --result-dir=/workspace/ \
52+ # --result-filename=$RESULT_FILENAME.json"
5353
5454docker stop $server_name
0 commit comments