Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
12 changes: 12 additions & 0 deletions pkgs/development/python-modules/vllm/0007-drop-quack-reqs.patch
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
diff --git a/requirements/cuda.txt b/requirements/cuda.txt
index 22477dc82..84fe34730 100644
--- a/requirements/cuda.txt
+++ b/requirements/cuda.txt
@@ -11,7 +11,3 @@ torchaudio==2.10.0
torchvision==0.25.0 # Required for phi3v processor. See https://github.com/pytorch/vision?tab=readme-ov-file#installation for corresponding version
# FlashInfer should be updated together with the Dockerfile
flashinfer-python==0.6.4
-
-# QuACK and Cutlass DSL for FA4 (cute-DSL implementation)
-nvidia-cutlass-dsl>=4.4.0.dev1
-quack-kernels>=0.2.7
12 changes: 10 additions & 2 deletions pkgs/development/python-modules/vllm/default.nix
Original file line number Diff line number Diff line change
Expand Up @@ -178,8 +178,8 @@ let
triton-kernels = fetchFromGitHub {
owner = "triton-lang";
repo = "triton";
tag = "v3.5.0";
hash = "sha256-F6T0n37Lbs+B7UHNYzoIQHjNNv3TcMtoXjNrT8ZUlxY=";
tag = "v3.6.0";
hash = "sha256-JFSpQn+WsNnh7CAPlcpOcUp0nyKXNbJEANdXqmkt4Tc=";
};

# grep for GIT_TAG in the following file
Expand Down Expand Up @@ -354,6 +354,9 @@ buildPythonPackage.override { stdenv = torch.stdenv; } (finalAttrs: {
./0003-propagate-pythonpath.patch
./0005-drop-intel-reqs.patch
./0006-drop-rocm-extra-reqs.patch
# QuACK and Cutlass DSL appear to be required only for FA4,
# which in our case handles its own deps, so drop them from requirements/cuda.txt
./0007-drop-quack-reqs.patch
];

postPatch = ''
Expand Down Expand Up @@ -582,6 +585,11 @@ buildPythonPackage.override { stdenv = torch.stdenv; } (finalAttrs: {
pythonRelaxDeps = true;

pythonImportsCheck = [ "vllm" ];
makeWrapperArgs = lib.optionals cudaSupport [
"--set"
"VLLM_NCCL_SO_PATH"
"${cudaPackages.nccl}/lib/libnccl.so"
];

passthru = {
# make internal dependency available to overlays
Expand Down
Loading