Skip to content

Commit 28534c7

Browse files
Pass EP_SIZE environment variable to Docker containers in B200 runner scripts
Co-authored-by: functionstackx <47992694+functionstackx@users.noreply.github.com>
1 parent a21de78 commit 28534c7

2 files changed

Lines changed: 2 additions & 2 deletions

File tree

runners/launch_b200-nvd.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,7 @@ docker run --rm -d --init --network host --name $server_name \
3030
--runtime nvidia --gpus all --ipc host --privileged --shm-size=16g --ulimit memlock=-1 --ulimit stack=67108864 \
3131
-v $HF_HUB_CACHE_MOUNT:$HF_HUB_CACHE \
3232
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
33-
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT \
33+
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT -e EP_SIZE \
3434
-e NCCL_GRAPH_REGISTER=0 \
3535
-e TORCH_CUDA_ARCH_LIST="10.0" -e CUDA_DEVICE_ORDER=PCI_BUS_ID -e CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" \
3636
--entrypoint=/bin/bash \

runners/launch_b200-tg.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ docker run --rm -d --network host --name $server_name \
1212
--runtime nvidia --gpus all --ipc host --privileged --shm-size=16g --ulimit memlock=-1 --ulimit stack=67108864 \
1313
-v $HF_HUB_CACHE_MOUNT:$HF_HUB_CACHE \
1414
-v $GITHUB_WORKSPACE:/workspace/ -w /workspace/ \
15-
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT \
15+
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT -e EP_SIZE \
1616
-e TORCH_CUDA_ARCH_LIST="10.0" -e CUDA_DEVICE_ORDER=PCI_BUS_ID -e CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" \
1717
--entrypoint=/bin/bash \
1818
$(echo "$IMAGE" | sed 's/#/\//') \

0 commit comments

Comments
 (0)