Skip to content

Commit 9a0288b

Browse files
authored
Merge pull request #147 from coreweave/rwang/vllm19
feat(vllm-tensorizer): Add Vllm 0.19.0 support for gemma4
2 parents 09f8ada + 5cd4881 commit 9a0288b

2 files changed

Lines changed: 9 additions & 3 deletions

File tree

.github/configurations/vllm-tensorizer.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
vllm-commit:
2-
- 'v0.18.1'
2+
- 'v0.19.0'
33
flashinfer-commit:
44
- 'v0.6.6'
55
lmcache-commit:
6-
- 'v0.4.1'
6+
- 'v0.4.2'
77
builder-base-image:
88
- 'ghcr.io/coreweave/ml-containers/torch:1a21fa8-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.7-1-torch2.10.0-vision0.25.0-audio2.10.0-abi1'
99
final-base-image:

vllm-tensorizer/Dockerfile

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -241,14 +241,20 @@ COPY --link --from=nixl-builder /usr/lib/python3/dist-packages/nixl.pth /usr/lib
241241
# Copied from vLLM's Dockerfile
242242
ARG TARGETPLATFORM
243243

244+
# Ray was removed as a default dependency by vLLM in v0.18, but it is still required
245+
# for the multi-node setup.
246+
247+
# Gemma 4 needs transformers >= 5.5.0, but vLLM v0.19.0 is packaged with transformers 4.x.
248+
# We must explicitly update it until vLLM updates their dependency.
249+
244250
RUN if [ "$TARGETPLATFORM" = "linux/arm64" ]; then \
245251
BITSANDBYTES_VER='0.42.0'; \
246252
else \
247253
BITSANDBYTES_VER='0.46.1'; \
248254
fi && \
249255
python3 -m pip install --no-cache-dir \
250256
accelerate hf_transfer 'modelscope!=1.15.0' "bitsandbytes>=${BITSANDBYTES_VER:?}" 'timm>=1.0.17' \
251-
'runai-model-streamer[s3,gcs]>=0.15.3' "ray[cgraph]>=2.48.0" -c /tmp/constraints.txt && \
257+
'runai-model-streamer[s3,gcs]>=0.15.3' "ray[cgraph]>=2.48.0" "transformers>=5.5.0" -c /tmp/constraints.txt && \
252258
rm /tmp/constraints.txt
253259

254260
EXPOSE 8080

0 commit comments

Comments
 (0)