Skip to content

Commit 287015d

Browse files
Merge pull request #160 from coreweave/jperlman/vllm0.20.2
feat(vllm-tensorizer): Bump vLLM to v0.20.2 on CUDA 13.2 / Ubuntu 24.04
2 parents c0ffa83 + 202ef09 commit 287015d

3 files changed

Lines changed: 25 additions & 17 deletions

File tree

Lines changed: 13 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,13 @@
1-
vllm-commit:
2-
- 'v0.20.0'
3-
flashinfer-commit:
4-
- 'v0.6.8'
5-
lmcache-commit:
6-
- 'v0.4.2'
7-
builder-base-image:
8-
- 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda12.9.1-ubuntu22.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
9-
final-base-image:
10-
- 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda12.9.1-ubuntu22.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
1+
include:
2+
- vllm-commit: 'v0.20.2'
3+
flashinfer-commit: 'v0.6.8'
4+
lmcache-commit: 'v0.4.2'
5+
builder-base-image: 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda13.2.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
6+
final-base-image: 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda13.2.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
7+
tag-suffix: 'v0.20.2-cuda13.2.1-ubuntu24.04'
8+
- vllm-commit: 'v0.20.2'
9+
flashinfer-commit: 'v0.6.8'
10+
lmcache-commit: 'v0.4.2'
11+
builder-base-image: 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda12.9.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
12+
final-base-image: 'ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda12.9.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1'
13+
tag-suffix: 'v0.20.2-cuda12.9.1-ubuntu24.04'

.github/workflows/vllm-tensorizer.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@ jobs:
2121
with:
2222
image-name: vllm-tensorizer
2323
folder: vllm-tensorizer
24-
tag-suffix: ${{ matrix.vllm-commit }}
24+
tag-suffix: ${{ matrix.tag-suffix }}
2525
build-contexts: |
2626
common=common
2727
object-storage-secrets: true

vllm-tensorizer/Dockerfile

Lines changed: 11 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
# syntax=docker/dockerfile:1.10
2-
ARG BUILDER_BASE_IMAGE="ghcr.io/coreweave/ml-containers/torch:17ad6db-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.10.0-vision0.25.0-audio2.10.0-abi1"
3-
ARG FINAL_BASE_IMAGE="ghcr.io/coreweave/ml-containers/torch:17ad6db-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.10.0-vision0.25.0-audio2.10.0-abi1"
2+
ARG BUILDER_BASE_IMAGE="ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda13.2.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1"
3+
ARG FINAL_BASE_IMAGE="ghcr.io/coreweave/ml-containers/torch:bc8c66e-nccl-cuda13.2.1-ubuntu24.04-nccl2.30.4-1-torch2.11.0-vision0.26.0-audio2.11.0-abi1"
44
ARG SCCACHE_VERSION="0.14.0"
55

66
FROM alpine/curl:8.17.0 AS sccache-downloader
@@ -22,9 +22,10 @@ RUN ldconfig
2222

2323
RUN apt-get -qq update && \
2424
apt-get -qq install -y --no-install-recommends \
25-
python3-pip git ninja-build cmake gcc-12 g++-12 && \
25+
git ninja-build cmake gcc-12 g++-12 && \
2626
apt-get clean && \
27-
pip3 install -U --no-cache-dir pip packaging 'setuptools>=77.0.3,<81.0.0' wheel setuptools_scm regex build
27+
rm -f /usr/lib/python3.*/EXTERNALLY-MANAGED && \
28+
python3 -m pip install -U --no-cache-dir pip packaging 'setuptools>=77.0.3,<81.0.0' wheel setuptools_scm regex build
2829

2930
# Create the /wheels directory
3031
WORKDIR /wheels
@@ -164,7 +165,7 @@ RUN --mount=type=bind,from=flashinfer-downloader,source=/git/flashinfer,target=/
164165
python3 -m pip install --no-cache-dir \
165166
requests nvidia-ml-py ninja tqdm filelock \
166167
'nvidia-cudnn-frontend>=1.13.0,<1.19.0' \
167-
"cuda-python~=${CUDA_VERSION}" \
168+
"cuda-python~=${CUDA_VERSION%.*}" \
168169
"nvidia-nvshmem-cu${CUDA_VERSION%%.*}<3.6" \
169170
'apache-tvm-ffi==0.1.9' && \
170171
export FLASHINFER_LOCAL_VERSION="$(sed -E 's@([[:digit:]]+)\.([[:digit:]]+).*$@cu\1\2@')" \
@@ -264,7 +265,11 @@ FROM ${FINAL_BASE_IMAGE} AS base
264265

265266
WORKDIR /workspace
266267

267-
RUN apt-get -qq update && apt-get install -y --no-install-recommends curl libsodium23 libnuma-dev && apt-get clean
268+
RUN apt-get -qq update && \
269+
apt-get install -y --no-install-recommends curl libsodium23 libnuma-dev && \
270+
apt-get purge -y python3-jwt && \
271+
apt-get clean && \
272+
rm -f /usr/lib/python3.*/EXTERNALLY-MANAGED
268273

269274
RUN --mount=type=bind,from=freezer,target=/tmp/frozen \
270275
/tmp/frozen/freeze.sh torch torchaudio torchvision xformers > /tmp/constraints.txt && \

0 commit comments

Comments
 (0)