File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -20,4 +20,4 @@ cmake .. -DGGML_SYCL=ON -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx -DLLAMA
2020# cmake --build . --config Release --target llama-bench
2121
2222# build all binaries
23- cmake --build . --config Release -j -v
23+ cmake --build . --config Release -j$(( ($(nproc) + 1 ) / 2 )) -v
Original file line number Diff line number Diff line change @@ -23,9 +23,9 @@ if [ $# -gt 0 ]; then
2323 GGML_SYCL_DEVICE=$1
2424 echo " use $GGML_SYCL_DEVICE as main GPU"
2525 # use single GPU only
26- ZES_ENABLE_SYSMAN=1 ./build/bin/llama-completion -m ${MODEL_FILE} -no-cnv -p " ${INPUT_PROMPT} " -n 400 -e -ngl ${NGL} -s 0 -c ${CONTEXT} -mg $GGML_SYCL_DEVICE -sm none ${LOAD_MODE}
26+ ZES_ENABLE_SYSMAN=1 ./build/bin/llama-completion -m ${MODEL_FILE} -no-cnv -p " ${INPUT_PROMPT} " -n 200 -e -ngl ${NGL} -s 0 -c ${CONTEXT} -mg $GGML_SYCL_DEVICE -sm none ${LOAD_MODE}
2727
2828else
2929 # use multiple GPUs with same max compute units
30- ZES_ENABLE_SYSMAN=1 ./build/bin/llama-completion -m ${MODEL_FILE} -no-cnv -p " ${INPUT_PROMPT} " -n 400 -e -ngl ${NGL} -s 0 -c ${CONTEXT} ${LOAD_MODE}
30+ ZES_ENABLE_SYSMAN=1 ./build/bin/llama-completion -m ${MODEL_FILE} -no-cnv -p " ${INPUT_PROMPT} " -n 200 -e -ngl ${NGL} -s 0 -c ${CONTEXT} ${LOAD_MODE}
3131fi
You can’t perform that action at this time.
0 commit comments