We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent cd60d84 commit 63124fa · Copy full SHA for 63124fa
1 file changed
.github/workflows/vllm.yml
@@ -79,10 +79,11 @@ jobs:
79
VLLM_VERSION="$(curl -s https://api.github.com/repos/vllm-project/vllm/releases/latest | jq -r .tag_name | sed 's/^v//')"
80
export VLLM_VERSION
81
echo "Installing vLLM ${VLLM_VERSION} (CPU)"
82
- hatch run -- uv pip install "vllm==${VLLM_VERSION}" --extra-index-url "https://wheels.vllm.ai/releases/${VLLM_VERSION}/cpu/"
+ hatch run -- uv pip install "vllm==${VLLM_VERSION}" --extra-index-url "https://wheels.vllm.ai/releases/${VLLM_VERSION}/cpu/" --index-strategy unsafe-best-match
83
84
- name: Start vLLM server
85
env:
86
+ VLLM_TARGET_DEVICE: "cpu"
87
VLLM_CPU_KVCACHE_SPACE: "4"
88
run: |
89
nohup hatch run -- vllm serve ${{ env.VLLM_MODEL }} \
0 commit comments