# Excerpt from benchmarks/multi_node/llm-d
# Diff hunk: @@ -107,6 +107,13 @@ (context: export NCCL_SOCKET_IFNAME=${NCCL_SOCKET_IFNAME:-$DEFAULT_IFACE})
# vLLM runtime environment for the multi-node llm-d benchmark.
# Reads:   HOST_IP (set outside this section), LIBRARY_PATH and
#          VLLM_LOGGING_LEVEL (both optional, taken from the caller's env).
# Exports: the VLLM_* switches below plus an extended LIBRARY_PATH.
export VLLM_SKIP_P2P_CHECK=1
export VLLM_RANDOMIZE_DP_DUMMY_INPUTS=1
export VLLM_USE_DEEP_GEMM=1

# DeepGEMM JIT-compiles CUDA kernels at warmup and links against
# libcuda.so.1. In ghcr.io/llm-d/llm-d-cuda the lib lives under
# /usr/local/cuda/compat/, which is in LD_LIBRARY_PATH (runtime) but
# NOT in LIBRARY_PATH (link time). Prepend it so ld can resolve
# -l:libcuda.so.1. The /usr/lib/x86_64-linux-gnu fallback covers
# NVIDIA Container Toolkit injection paths on Linux hosts.
#
# The caller's LIBRARY_PATH is appended only when it is non-empty: an
# unconditional ":${LIBRARY_PATH}" would leave a trailing ':' (an empty
# search entry, which the compiler driver treats as the current directory).
export LIBRARY_PATH="/usr/local/cuda/compat:/usr/lib/x86_64-linux-gnu${LIBRARY_PATH:+:${LIBRARY_PATH}}"

# HOST_IP is expected to be defined earlier in the script.
export VLLM_NIXL_SIDE_CHANNEL_HOST="${HOST_IP}"
# Keep a log level supplied by the caller; fall back to INFO otherwise.
export VLLM_LOGGING_LEVEL="${VLLM_LOGGING_LEVEL:-INFO}"
You can’t perform that action at this time.
0 commit comments