# Global build arguments, declared ahead of the first FROM.
# An ARG declared before FROM is only visible to FROM lines; any stage that
# needs one of these values must redeclare it with its own ARG instruction.
#
# ONEAPI_VERSION selects the tag of the intel/deep-learning-essentials image
# that the stages in this file are based on.
ARG ONEAPI_VERSION=2025.3.3-0-devel-ubuntu24.04
# Image metadata inputs. Each keeps the placeholder "N/A" unless it is
# overridden at build time with --build-arg.
ARG BUILD_DATE=N/A
ARG APP_VERSION=N/A
ARG APP_REVISION=N/A

## Build Image

# Build stage: starts from the oneAPI development image selected by
# ONEAPI_VERSION.
FROM intel/deep-learning-essentials:$ONEAPI_VERSION AS build

# NOTE(review): GGML_SYCL_F16 is presumably consumed by a build step later in
# this stage that is not visible here - confirm.
ARG GGML_SYCL_F16=OFF
# Release and Ubuntu suffix of the oneAPI Level Zero packages fetched below.
ARG LEVEL_ZERO_VERSION=1.28.2
ARG LEVEL_ZERO_UBUNTU_VERSION=u24.04
# Install the build prerequisites, then download the pinned level-zero and
# level-zero-devel .deb packages from the GitHub release and install them.
# "%2B" in the URLs is the URL-encoded "+" of the package file name.
# --force-overwrite lets dpkg replace files already owned by another package
# (presumably copies shipped with the base image - confirm).
# The downloaded .deb files are deleted in the same layer.
RUN apt-get update && \
    apt-get install -y git libssl-dev wget ca-certificates && \
    cd /tmp && \
    wget -q "https://github.com/oneapi-src/level-zero/releases/download/v${LEVEL_ZERO_VERSION}/level-zero_${LEVEL_ZERO_VERSION}%2B${LEVEL_ZERO_UBUNTU_VERSION}_amd64.deb" -O level-zero.deb && \
    wget -q "https://github.com/oneapi-src/level-zero/releases/download/v${LEVEL_ZERO_VERSION}/level-zero-devel_${LEVEL_ZERO_VERSION}%2B${LEVEL_ZERO_UBUNTU_VERSION}_amd64.deb" -O level-zero-devel.deb && \
    apt-get -o Dpkg::Options::="--force-overwrite" install -y ./level-zero.deb ./level-zero-devel.deb && \
    rm -f /tmp/level-zero.deb /tmp/level-zero-devel.deb

# Subsequent instructions of this stage run relative to /app.
WORKDIR /app

@@ -26,18 +36,32 @@ RUN mkdir -p /app/lib && \
# Assemble /app/full: the built binaries from build/bin, the top-level Python
# scripts, the conversion and gguf-py directories, the requirements files, and
# .devops/tools.sh (installed as tools.sh).
# Relative paths resolve against the stage's current working directory
# (presumably /app with the source tree copied in - confirm against the lines
# not visible here).
RUN mkdir -p /app/full \
    && cp build/bin/* /app/full \
    && cp *.py /app/full \
    && cp -r conversion /app/full \
    && cp -r gguf-py /app/full \
    && cp -r requirements /app/full \
    && cp requirements.txt /app/full \
    && cp .devops/tools.sh /app/full/tools.sh

# Base stage: starts again from the same oneAPI image as the build stage.
FROM intel/deep-learning-essentials:$ONEAPI_VERSION AS base

# Redeclared inside the stage so the values are usable by LABEL below; ARGs
# declared before the first FROM are not visible inside a stage otherwise.
ARG BUILD_DATE=N/A
ARG APP_VERSION=N/A
ARG APP_REVISION=N/A
ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
# Image metadata using the org.opencontainers.image.* label keys.
LABEL org.opencontainers.image.created=$BUILD_DATE \
      org.opencontainers.image.version=$APP_VERSION \
      org.opencontainers.image.revision=$APP_REVISION \
      org.opencontainers.image.title="llama.cpp" \
      org.opencontainers.image.description="LLM inference in C/C++" \
      org.opencontainers.image.url=$IMAGE_URL \
      org.opencontainers.image.source=$IMAGE_SOURCE

# Pinned versions for the Intel GPU packages downloaded by the next RUN step.
# IGC_VERSION is the intel-graphics-compiler release tag and IGC_VERSION_FULL
# the version string embedded in its .deb file names.
# NOTE(review): the compute-runtime and IGDGMM pins are presumably used the
# same way further down that RUN step, which is not fully visible - confirm.
ARG IGC_VERSION=v2.20.5
ARG IGC_VERSION_FULL=2_2.20.5+19972
ARG COMPUTE_RUNTIME_VERSION=25.40.35563.10
ARG COMPUTE_RUNTIME_VERSION_FULL=25.40.35563.10-0
ARG IGDGMM_VERSION=22.8.2
4165RUN mkdir /tmp/neo/ && cd /tmp/neo/ \
4266 && wget https://github.com/intel/intel-graphics-compiler/releases/download/$IGC_VERSION/intel-igc-core-${IGC_VERSION_FULL}_amd64.deb \
4367 && wget https://github.com/intel/intel-graphics-compiler/releases/download/$IGC_VERSION/intel-igc-opencl-${IGC_VERSION_FULL}_amd64.deb \
@@ -109,4 +133,3 @@ WORKDIR /app
# Health probe: curl -f exits non-zero when the /health endpoint on port 8080
# answers with an HTTP error status, which marks the container unhealthy.
# No interval/timeout options are given, so Docker's defaults apply.
HEALTHCHECK CMD [ "curl" , "-f" , "http://localhost:8080/health" ]

# Exec-form entrypoint: the server binary is started directly, without a
# wrapping shell.
ENTRYPOINT [ "/app/llama-server" ]