File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -76,10 +76,17 @@ jobs:
7676
7777 - name : Install vLLM (CPU)
7878 run : |
79+ # vLLM on PyPI is GPU-only and requires CUDA, so it won't run on CPU-only systems.
80+ # CPU wheels are not published to PyPI; they are only available as direct downloads from GitHub releases.
81+ # We query the GitHub API for the latest release tag and install the matching x86_64 CPU wheel.
82+ # The --torch-backend cpu flag ensures uv installs PyTorch from the official CPU-only index,
83+ # since the required torch+cpu builds are also not available on PyPI.
7984 VLLM_VERSION="$(curl -s https://api.github.com/repos/vllm-project/vllm/releases/latest | jq -r .tag_name | sed 's/^v//')"
8085 export VLLM_VERSION
8186 echo "Installing vLLM ${VLLM_VERSION} (CPU)"
82- hatch run -- uv pip install "https://github.com/vllm-project/vllm/releases/download/v${VLLM_VERSION}/vllm-${VLLM_VERSION}+cpu-cp38-abi3-manylinux_2_35_x86_64.whl" --extra-index-url https://download.pytorch.org/whl/cpu --index-strategy unsafe-best-match
87+ hatch run -- uv pip install \
88+ "https://github.com/vllm-project/vllm/releases/download/v${VLLM_VERSION}/vllm-${VLLM_VERSION}+cpu-cp38-abi3-manylinux_2_35_x86_64.whl" \
89+ --torch-backend cpu
8390
8491 - name : Start vLLM server
8592 env :
94101 --enable-auto-tool-choice \
95102 --tool-call-parser hermes &
96103
97- # Wait for the vLLM server to be ready with a timeout of 600 seconds
98- timeout=600
104+ # Wait for the vLLM server to be ready with a timeout of 300 seconds
105+ timeout=300
99106 while [ $timeout -gt 0 ] && ! curl -sSf http://localhost:8000/health > /dev/null 2>&1; do
100107 echo "Waiting for vLLM server to start..."
101108 sleep 10
Original file line number Diff line number Diff line change @@ -23,7 +23,7 @@ classifiers = [
2323 " Programming Language :: Python :: Implementation :: CPython" ,
2424 " Programming Language :: Python :: Implementation :: PyPy" ,
2525]
26- dependencies = [" haystack-ai" , " openai" ]
26+ dependencies = [" haystack-ai>=2.23.0 " , " openai" ]
2727
2828[project .urls ]
2929Documentation = " https://github.com/deepset-ai/haystack-core-integrations/tree/main/integrations/vllm#readme"
You can’t perform that action at this time.
0 commit comments