From 0684551ce4c241cff6822629b97330714ed67a14 Mon Sep 17 00:00:00 2001 From: anakin87 Date: Mon, 18 May 2026 09:25:55 +0200 Subject: [PATCH] test: make vLLM wheel detection more robust --- .github/workflows/vllm.yml | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/.github/workflows/vllm.yml b/.github/workflows/vllm.yml index 5b395ea3db..5c6ea0917d 100644 --- a/.github/workflows/vllm.yml +++ b/.github/workflows/vllm.yml @@ -84,15 +84,19 @@ jobs: run: | # vLLM on PyPI is GPU-only and requires CUDA, so it won't run on CPU-only systems. # CPU wheels are not published to PyPI; they are only available as direct downloads from GitHub releases. - # We fetch the latest release and install the appropriate x86 CPU wheel. + # We query the latest release's assets and pick the x86_64 CPU wheel, since the manylinux/ABI + # tags in the filename can change between releases. # The --torch-backend cpu flag ensures uv installs PyTorch from the official CPU-only index, # since the required torch+cpu builds are also not available on PyPI. - VLLM_VERSION="$(curl -s https://api.github.com/repos/vllm-project/vllm/releases/latest | jq -r .tag_name | sed 's/^v//')" - export VLLM_VERSION - echo "Installing vLLM ${VLLM_VERSION} (CPU)" - hatch run -- uv pip install \ - "https://github.com/vllm-project/vllm/releases/download/v${VLLM_VERSION}/vllm-${VLLM_VERSION}+cpu-cp38-abi3-manylinux_2_35_x86_64.whl" \ - --torch-backend cpu + VLLM_WHEEL_URL="$(curl -s https://api.github.com/repos/vllm-project/vllm/releases/latest \ + | jq -r '.assets[] | select(.name | test("\\+cpu.*x86_64\\.whl$")) | .browser_download_url' \ + | head -n1)" + if [ -z "${VLLM_WHEEL_URL}" ]; then + echo "Could not find a CPU x86_64 wheel in the latest vLLM release" >&2 + exit 1 + fi + echo "Installing ${VLLM_WHEEL_URL}" + hatch run -- uv pip install "${VLLM_WHEEL_URL}" --torch-backend cpu - name: Start vLLM chat server run: |