# Path of the Hugging Face hub cache directory on the NFS share.
# NOTE(review): the consumer of this variable is outside the visible part of
# the script (presumably a docker volume mount) — confirm before renaming.
HF_HUB_CACHE_MOUNT="/nfsdata/hf_hub_cache-1/" # Temp solution
# Port number used by the benchmark run.
# NOTE(review): not referenced in the visible lines; presumably read by the
# benchmark script started inside the container — confirm.
PORT=8888
1919
20- # network_name="bmk-net"
# Container name handed to `docker run --name=...` below. It must not contain
# whitespace: the expansion there is unquoted, so a leading space would split
# the option into an empty `--name=` plus a stray positional argument.
server_name="bmk-server"
22- # client_name="bmk-client"
23-
24- # docker network create $network_name
2521
2622set -x
2723docker run --rm --ipc=host --shm-size=16g --network=host --name=$server_name \
@@ -35,50 +31,7 @@ docker run --rm --ipc=host --shm-size=16g --network=host --name=$server_name \
3531$IMAGE \
3632benchmarks/" ${EXP_NAME%% _* } _${PRECISION} _mi355x_docker.sh"
3733
38- # set +x
39- # while IFS= read -r line; do
40- # printf '%s\n' "$line"
41- # if [[ "$line" =~ Application\ startup\ complete ]]; then
42- # break
43- # fi
44- # done < <(docker logs -f --tail=0 $server_name 2>&1)
45-
46- # if [[ "$MODEL" == "amd/DeepSeek-R1-0528-MXFP4-Preview" || "$MODEL" == "deepseek-ai/DeepSeek-R1-0528" ]]; then
47- # if [[ "$OSL" == "8192" ]]; then
48- # NUM_PROMPTS=$(( CONC * 20 ))
49- # else
50- # NUM_PROMPTS=$(( CONC * 50 ))
51- # fi
52- # else
53- # NUM_PROMPTS=$(( CONC * 10 ))
54- # fi
55-
56- # git clone https://github.com/kimbochen/bench_serving.git
57-
58- # set -x
59- # docker run --rm --network=$network_name --name=$client_name \
60- # -v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
61- # -e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
62- # --entrypoint=python3 \
63- # $IMAGE \
64- # bench_serving/benchmark_serving.py \
65- # --model=$MODEL --backend=vllm --base-url="http://$server_name:$PORT" \
66- # --dataset-name=random \
67- # --random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
68- # --num-prompts=$NUM_PROMPTS \
69- # --max-concurrency=$CONC \
70- # --request-rate=inf --ignore-eos \
71- # --save-result --percentile-metrics="ttft,tpot,itl,e2el" \
72- # --result-dir=/workspace/ --result-filename=$RESULT_FILENAME.json
73-
#######################################
# Report and delete GPU core dump files (gpucore.*) found in the current
# working directory.
# Arguments: none
# Outputs:   prints a one-line notice to stdout when at least one dump exists
# Returns:   0 whether or not any file matched
#######################################
cleanup_gpucore_files() {
  local dump
  # Test the glob directly instead of parsing `ls` output. When nothing
  # matches, the pattern stays literal and the existence test rejects it.
  for dump in gpucore.*; do
    if [ -e "$dump" ] || [ -L "$dump" ]; then
      echo "gpucore files exist. not good"
      # `--` keeps a file name starting with '-' from being read as an option.
      rm -f -- gpucore.*
      return 0
    fi
  done
  return 0
}

cleanup_gpucore_files
78-
79-
80- # while [ -n "$(docker ps -aq)" ]; do
81- # docker stop $server_name
82- # # docker network rm $network_name
83- # sleep 5
84- # done
0 commit comments