Skip to content

Commit 0717ec9

Browse files
committed
updating mi300 pt 2
1 parent 131b572 commit 0717ec9

3 files changed

Lines changed: 5 additions & 77 deletions

File tree

runners/launch_mi300x-amd.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,7 @@ PORT=8888
88
server_name="bmk-server"
99

1010
set -x
11-
docker run --rm --ipc=host --shm-size=16g --name=$server_name \
11+
docker run --rm --ipc=host --shm-size=16g --network=host --name=$server_name \
1212
--privileged --cap-add=CAP_SYS_ADMIN --device=/dev/kfd --device=/dev/dri --device=/dev/mem \
1313
--cap-add=SYS_PTRACE --security-opt seccomp=unconfined \
1414
-v $HF_HUB_CACHE_MOUNT:$HF_HUB_CACHE \

runners/launch_mi300x-cr.sh

Lines changed: 2 additions & 38 deletions
Original file line number | Diff line number | Diff line change
@@ -5,52 +5,16 @@ sudo sh -c 'echo 0 > /proc/sys/kernel/numa_balancing'
55
HF_HUB_CACHE_MOUNT="/mnt/vdb/gha_cache/hf_hub_cache/"
66
PORT=8888
77

8-
network_name="bmk-net"
98
server_name="bmk-server"
10-
client_name="bmk-client"
11-
12-
docker network create $network_name
139

1410
set -x
15-
docker run --rm -d --ipc=host --shm-size=16g --network=$network_name --name=$server_name \
11+
docker run --rm -d --ipc=host --shm-size=16g --network=host --name=$server_name \
1612
--privileged --cap-add=CAP_SYS_ADMIN --device=/dev/kfd --device=/dev/dri --device=/dev/mem \
1713
--cap-add=SYS_PTRACE --security-opt seccomp=unconfined \
1814
-v $HF_HUB_CACHE_MOUNT:$HF_HUB_CACHE \
1915
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
2016
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e PORT=$PORT \
21-
-e ISL -e OSL \
17+
-e ISL -e OSL -e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RANDOM_RANGE_RATIO -e RESULT_FILENAME \
2218
--entrypoint=/bin/bash \
2319
$IMAGE \
2420
benchmarks/"${EXP_NAME%%_*}_${PRECISION}_mi300x_docker.sh"
25-
26-
set +x
27-
while IFS= read -r line; do
28-
printf '%s\n' "$line"
29-
if [[ "$line" =~ Application\ startup\ complete ]]; then
30-
break
31-
fi
32-
done < <(docker logs -f --tail=0 $server_name 2>&1)
33-
34-
git clone https://github.com/kimbochen/bench_serving.git
35-
36-
set -x
37-
docker run --rm --network=$network_name --name=$client_name \
38-
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
39-
-e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
40-
--entrypoint=python3 \
41-
$IMAGE \
42-
bench_serving/benchmark_serving.py \
43-
--model=$MODEL --backend=vllm --base-url=http://$server_name:$PORT \
44-
--dataset-name=random \
45-
--random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
46-
--num-prompts=$(( $CONC * 10 )) \
47-
--max-concurrency=$CONC \
48-
--request-rate=inf --ignore-eos \
49-
--save-result --percentile-metrics="ttft,tpot,itl,e2el" \
50-
--result-dir=/workspace/ --result-filename=$RESULT_FILENAME.json
51-
52-
while [ -n "$(docker ps -aq)" ]; do
53-
docker stop $server_name
54-
docker network rm $network_name
55-
sleep 5
56-
done

runners/launch_mi300x-oci.sh

Lines changed: 2 additions & 38 deletions
Original file line number | Diff line number | Diff line change
@@ -3,52 +3,16 @@
33
HF_HUB_CACHE_MOUNT="$HOME/hf_hub_cache/"
44
PORT=8888
55

6-
network_name="bmk-net"
76
server_name="bmk-server"
8-
client_name="bmk-client"
9-
10-
docker network create $network_name
117

128
set -x
13-
docker run --rm -d --ipc=host --shm-size=16g --network=$network_name --name=$server_name \
9+
docker run --rm -d --ipc=host --shm-size=16g --network=host --name=$server_name \
1410
--privileged --cap-add=CAP_SYS_ADMIN --device=/dev/kfd --device=/dev/dri --device=/dev/mem \
1511
--cap-add=SYS_PTRACE --security-opt seccomp=unconfined \
1612
-v $HF_HUB_CACHE_MOUNT:$HF_HUB_CACHE \
1713
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
1814
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e PORT=$PORT \
19-
-e ISL -e OSL \
15+
-e ISL -e OSL -e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RANDOM_RANGE_RATIO -e RESULT_FILENAME \
2016
--entrypoint=/bin/bash \
2117
$IMAGE \
2218
benchmarks/"${EXP_NAME%%_*}_${PRECISION}_mi300x_docker.sh"
23-
24-
set +x
25-
while IFS= read -r line; do
26-
printf '%s\n' "$line"
27-
if [[ "$line" =~ Application\ startup\ complete ]]; then
28-
break
29-
fi
30-
done < <(docker logs -f --tail=0 $server_name 2>&1)
31-
32-
git clone https://github.com/kimbochen/bench_serving.git
33-
34-
set -x
35-
docker run --rm --network=$network_name --name=$client_name \
36-
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
37-
-e HF_TOKEN -e PYTHONPYCACHEPREFIX=/tmp/pycache/ \
38-
--entrypoint=python3 \
39-
$IMAGE \
40-
bench_serving/benchmark_serving.py \
41-
--model=$MODEL --backend=vllm --base-url=http://$server_name:$PORT \
42-
--dataset-name=random \
43-
--random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
44-
--num-prompts=$(( $CONC * 10 )) \
45-
--max-concurrency=$CONC \
46-
--request-rate=inf --ignore-eos \
47-
--save-result --percentile-metrics="ttft,tpot,itl,e2el" \
48-
--result-dir=/workspace/ --result-filename=$RESULT_FILENAME.json
49-
50-
while [ -n "$(docker ps -aq)" ]; do
51-
docker stop $server_name
52-
docker network rm $network_name
53-
sleep 5
54-
done

0 commit comments

Comments (0)