Skip to content

Commit 098af75

Browse files
committed
[NV] llm-d: add /usr/local/cuda/compat to LIBRARY_PATH for DeepGEMM JIT link
Signed-off-by: Ezra Silvera <ezra@il.ibm.com>
1 parent 4138df9 commit 098af75

1 file changed

Lines changed: 7 additions & 0 deletions

File tree

benchmarks/multi_node/llm-d/server.sh

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -107,6 +107,13 @@ export NCCL_SOCKET_IFNAME=${NCCL_SOCKET_IFNAME:-$DEFAULT_IFACE}
107107
export VLLM_SKIP_P2P_CHECK=1
108108
export VLLM_RANDOMIZE_DP_DUMMY_INPUTS=1
109109
export VLLM_USE_DEEP_GEMM=1
110+
# DeepGEMM JIT-compiles CUDA kernels at warmup and links against
111+
# libcuda.so.1. In ghcr.io/llm-d/llm-d-cuda the lib lives under
112+
# /usr/local/cuda/compat/, which is in LD_LIBRARY_PATH (runtime) but
113+
# NOT in LIBRARY_PATH (link time). Prepend it so ld can resolve
114+
# -l:libcuda.so.1. The /usr/lib/x86_64-linux-gnu fallback covers
115+
# NVIDIA Container Toolkit injection paths on Linux hosts.
116+
# Append the inherited LIBRARY_PATH only when it is non-empty. An
# unconditional trailing ':' would leave an empty entry, which GCC
# interprets as the current working directory at link time.
export LIBRARY_PATH="/usr/local/cuda/compat:/usr/lib/x86_64-linux-gnu${LIBRARY_PATH:+:${LIBRARY_PATH}}"
110117
export VLLM_NIXL_SIDE_CHANNEL_HOST="$HOST_IP"
111118
export VLLM_LOGGING_LEVEL=${VLLM_LOGGING_LEVEL:-INFO}
112119

0 commit comments

Comments
 (0)