Skip to content

Commit ba3ab1e

Browse files
kajalj22 and claude committed
Upgrade vllm deps: torch 2.11, flashinfer 0.6.8.post1, restore transformers override
- Bump torch 2.10.0 -> 2.11.0, torchaudio 2.10.0 -> 2.11.0
- Bump flashinfer-python/cubin 0.6.4 -> 0.6.8.post1 for vllm 0.20.0
- Restore transformers==5.3.0 override (vllm 0.20.0 excludes 5.0-5.5.0 but our codebase needs 5.3.0; override lets uv resolve it)
- Pin core transformers back to ==5.3.0

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
Signed-off-by: Kajal Jain <kajalj@nvidia.com>
1 parent 5bdbeb0 commit ba3ab1e

2 files changed

Lines changed: 1145 additions & 890 deletions

File tree

pyproject.toml

Lines changed: 12 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ dependencies = [
2525
"setuptools",
2626
"pip", # Required for frozen environments; uv venv --seed may not reliably install pip
2727
"ninja", # for flash-attn parallel build
28-
"torch==2.10.0",
28+
"torch==2.11.0",
2929
"triton; sys_platform == 'linux' and (platform_machine == 'x86_64' or platform_machine == 'aarch64')",
3030
"colored==2.2.3",
3131
"ray[default]==2.54.0",
@@ -49,7 +49,7 @@ dependencies = [
4949
"sympy>=1.14.0",
5050
"pillow>=12.1.1",
5151
"torchvision==0.26.0",
52-
"transformers>=5.3.0",
52+
"transformers==5.3.0",
5353
"num2words>=0.5.14", # for SmolVLM
5454
"mlflow>=3.11.1",
5555
"nvidia-nvshmem-cu13; sys_platform == 'linux' and (platform_machine == 'x86_64' or platform_machine == 'aarch64')", # for deep_ep build
@@ -101,8 +101,8 @@ vllm = [
101101
"vllm @ https://github.com/vllm-project/vllm/releases/download/v0.20.0/vllm-0.20.0-cp38-abi3-manylinux_2_35_x86_64.whl ; sys_platform == 'linux' and platform_machine == 'x86_64'",
102102
"vllm==0.20.0 ; sys_platform != 'linux' or (platform_machine != 'aarch64' and platform_machine != 'x86_64')",
103103
"num2words>=0.5.14",
104-
"flashinfer-python==0.6.4",
105-
"flashinfer-cubin==0.6.4",
104+
"flashinfer-python==0.6.8.post1",
105+
"flashinfer-cubin==0.6.8.post1",
106106
"nvidia-cutlass-dsl>=4.4.0.dev1",
107107
]
108108
sglang = [
@@ -142,7 +142,7 @@ nemo_gym = ["nemo_gym"]
142142
# This is a default group so that we install these even with bare `uv sync`
143143
build = [
144144
# Build requirement for TE
145-
"torch==2.10.0",
145+
"torch==2.11.0",
146146
# Build requirement for TE
147147
"setuptools",
148148
"packaging",
@@ -270,23 +270,26 @@ override-dependencies = [
270270
"opencv-python-headless>=4.11.0",
271271
"timm<=1.0.22",
272272
"nvidia-modelopt[torch]>=0.39.0",
273-
"torch==2.10.0",
274-
"torchaudio==2.10.0",
273+
"torch==2.11.0",
274+
"torchaudio==2.11.0",
275275
# sglang requires a different llguidance version than vllm, so enforce vllm's version since it's newer
276276
"llguidance>=1.3.0,<1.4.0",
277277
# Override setuptools range in other dependencies to address CVE GHSA-58pv-8j8x-9vj2
278278
"setuptools>=80.10.2",
279279
"deep_ep @ git+https://github.com/deepseek-ai/DeepEP.git@bfded34800dfec415b71503f8205181de90b2480",
280-
# Note: flashinfer versions are pinned per-extra (vllm uses 0.6.4, sglang uses 0.6.7.post2)
280+
# Note: flashinfer versions are pinned per-extra (vllm uses 0.6.8.post1, sglang uses 0.6.7.post2)
281281
# since vllm and sglang extras are mutually exclusive and have different requirements.
282-
# Override megatron-core's flashinfer~=0.5.0 constraint to allow both vllm (0.6.4) and sglang (0.6.7.post2)
282+
# Override megatron-core's flashinfer~=0.5.0 constraint to allow both vllm (0.6.8.post1) and sglang (0.6.7.post2)
283283
"flashinfer-python>=0.5.0",
284284
"flashinfer-cubin>=0.5.0",
285285
# sglang 0.5.10 requires nvidia-cutlass-dsl>=4.4.1 (via flashinfer 0.6.7.post2 which uses CUTLASS 4.4.2).
286286
# Override to >=4.4.1 so uv can resolve to a version satisfying both vllm and sglang.
287287
"nvidia-cutlass-dsl>=4.4.1",
288288
# Relax megatron-core workspace member's opentelemetry-api ceiling (<1.34) for protobuf 6.x compat with ray
289289
"opentelemetry-api>=1.33.1",
290+
# vLLM 0.20.0 excludes transformers 5.0-5.5.0 but our codebase needs 5.3.0.
291+
# Override so uv can still resolve transformers==5.3.0 despite vllm's exclusion (overrides apply to the whole resolution, including the vllm extra).
292+
"transformers==5.3.0",
290293
# Override until we can upgrade the sglang version to address CVE GHSA-7rgv-gqhr-fxg3
291294
"xgrammar==0.1.33",
292295
# Override dependencies to address CVEs

0 commit comments

Comments
 (0)