@@ -4,7 +4,6 @@ HF_HUB_CACHE_MOUNT="/home/ubuntu/hf_hub_cache/"
 PORT=8888
 
 server_name="bmk-server"
- # client_name="bmk-client"
 
 set -x
 docker run --rm --network=host --name=$server_name \
@@ -16,39 +15,3 @@ docker run --rm --network=host --name=$server_name \
 --entrypoint=/bin/bash \
 $IMAGE \
 benchmarks/"${EXP_NAME%%_*}_${PRECISION}_h100_docker.sh"
-
- # set +x
- # while IFS= read -r line; do
- # printf '%s\n' "$line"
- # if [[ "$line" =~ Application\ startup\ complete ]]; then
- # break
- # fi
- # done < <(docker logs -f --tail=0 $server_name 2>&1)
-
- # if ! docker ps --format "{{.Names}}" | grep -q "$server_name"; then
- # echo "Server container launch failed."
- # exit 1
- # fi
-
- # git clone https://github.com/kimbochen/bench_serving.git
-
- # set -x
- # docker run --rm --network=host --name=$client_name \
- # -v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
- # -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
- # --entrypoint=/bin/bash \
- # $IMAGE \
- # -lc "pip install -q datasets pandas && \
- # python3 bench_serving/benchmark_serving.py \
- # --model=$MODEL \
- # --backend=vllm \
- # --base-url=\"http://localhost:$PORT\" \
- # --dataset-name=random \
- # --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
- # --num-prompts=$(( $CONC * 10 )) --max-concurrency=$CONC \
- # --request-rate=inf --ignore-eos \
- # --save-result --percentile-metrics='ttft,tpot,itl,e2el' \
- # --result-dir=/workspace/ \
- # --result-filename=$RESULT_FILENAME.json"
-
- # docker stop $server_name
0 commit comments