File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 55# Define the CANN base image for easier version updates later
66ARG CHIP_TYPE=910b
77ARG CANN_BASE_IMAGE=quay.io/ascend/cann:8.5.0-${CHIP_TYPE}-openeuler24.03-py3.11
8+ ARG BUILD_DATE=N/A
9+ ARG APP_VERSION=N/A
10+ ARG APP_REVISION=N/A
811
912# ==============================================================================
1013# BUILD STAGE
@@ -67,6 +70,19 @@ RUN mkdir -p /app/full && \
6770# ==============================================================================
6871FROM ${CANN_BASE_IMAGE} AS base
6972
73+ ARG BUILD_DATE=N/A
74+ ARG APP_VERSION=N/A
75+ ARG APP_REVISION=N/A
76+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
77+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
78+ LABEL org.opencontainers.image.created=$BUILD_DATE \
79+ org.opencontainers.image.version=$APP_VERSION \
80+ org.opencontainers.image.revision=$APP_REVISION \
81+ org.opencontainers.image.title="llama.cpp" \
82+ org.opencontainers.image.description="LLM inference in C/C++" \
83+ org.opencontainers.image.url=$IMAGE_URL \
84+ org.opencontainers.image.source=$IMAGE_SOURCE
85+
7086# -- Install runtime dependencies --
7187RUN yum install -y libgomp curl && \
7288 yum clean all && \
Original file line number Diff line number Diff line change 11ARG UBUNTU_VERSION=24.04
2+ ARG BUILD_DATE=N/A
3+ ARG APP_VERSION=N/A
4+ ARG APP_REVISION=N/A
25
36FROM ubuntu:$UBUNTU_VERSION AS build
47
@@ -35,6 +38,19 @@ RUN mkdir -p /app/full \
3538# # Base image
3639FROM ubuntu:$UBUNTU_VERSION AS base
3740
41+ ARG BUILD_DATE=N/A
42+ ARG APP_VERSION=N/A
43+ ARG APP_REVISION=N/A
44+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
45+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
46+ LABEL org.opencontainers.image.created=$BUILD_DATE \
47+ org.opencontainers.image.version=$APP_VERSION \
48+ org.opencontainers.image.revision=$APP_REVISION \
49+ org.opencontainers.image.title="llama.cpp" \
50+ org.opencontainers.image.description="LLM inference in C/C++" \
51+ org.opencontainers.image.url=$IMAGE_URL \
52+ org.opencontainers.image.source=$IMAGE_SOURCE
53+
3854RUN apt-get update \
3955 && apt-get install -y libgomp1 curl \
4056 && apt autoremove -y \
Original file line number Diff line number Diff line change @@ -6,6 +6,10 @@ ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VER
66
77ARG BASE_CUDA_RUN_CONTAINER=nvidia/cuda:${CUDA_VERSION}-runtime-ubuntu${UBUNTU_VERSION}
88
9+ ARG BUILD_DATE=N/A
10+ ARG APP_VERSION=N/A
11+ ARG APP_REVISION=N/A
12+
913FROM ${BASE_CUDA_DEV_CONTAINER} AS build
1014
1115# CUDA architecture to build for (defaults to all supported archs)
@@ -40,6 +44,19 @@ RUN mkdir -p /app/full \
4044# # Base image
4145FROM ${BASE_CUDA_RUN_CONTAINER} AS base
4246
47+ ARG BUILD_DATE=N/A
48+ ARG APP_VERSION=N/A
49+ ARG APP_REVISION=N/A
50+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
51+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
52+ LABEL org.opencontainers.image.created=$BUILD_DATE \
53+ org.opencontainers.image.version=$APP_VERSION \
54+ org.opencontainers.image.revision=$APP_REVISION \
55+ org.opencontainers.image.title="llama.cpp" \
56+ org.opencontainers.image.description="LLM inference in C/C++" \
57+ org.opencontainers.image.url=$IMAGE_URL \
58+ org.opencontainers.image.source=$IMAGE_SOURCE
59+
4360RUN apt-get update \
4461 && apt-get install -y libgomp1 curl \
4562 && apt autoremove -y \
Original file line number Diff line number Diff line change 11ARG ONEAPI_VERSION=2025.3.3-0-devel-ubuntu24.04
2+ ARG BUILD_DATE=N/A
3+ ARG APP_VERSION=N/A
4+ ARG APP_REVISION=N/A
25
36# # Build Image
47
@@ -40,6 +43,19 @@ RUN mkdir -p /app/full \
4043
4144FROM intel/deep-learning-essentials:$ONEAPI_VERSION AS base
4245
46+ ARG BUILD_DATE=N/A
47+ ARG APP_VERSION=N/A
48+ ARG APP_REVISION=N/A
49+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
50+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
51+ LABEL org.opencontainers.image.created=$BUILD_DATE \
52+ org.opencontainers.image.version=$APP_VERSION \
53+ org.opencontainers.image.revision=$APP_REVISION \
54+ org.opencontainers.image.title="llama.cpp" \
55+ org.opencontainers.image.description="LLM inference in C/C++" \
56+ org.opencontainers.image.url=$IMAGE_URL \
57+ org.opencontainers.image.source=$IMAGE_SOURCE
58+
4359ARG IGC_VERSION=v2.20.5
4460ARG IGC_VERSION_FULL=2_2.20.5+19972
4561ARG COMPUTE_RUNTIME_VERSION=25.40.35563.10
Original file line number Diff line number Diff line change 11ARG ASCEND_VERSION=8.5.0-910b-openeuler22.03-py3.10
2+ ARG BUILD_DATE=N/A
3+ ARG APP_VERSION=N/A
4+ ARG APP_REVISION=N/A
25
36FROM ascendai/cann:$ASCEND_VERSION AS build
47
@@ -28,6 +31,20 @@ RUN echo "Building with static libs" && \
2831
2932# TODO: use image with NNRT
3033FROM ascendai/cann:$ASCEND_VERSION AS runtime
34+
35+ ARG BUILD_DATE=N/A
36+ ARG APP_VERSION=N/A
37+ ARG APP_REVISION=N/A
38+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
39+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
40+ LABEL org.opencontainers.image.created=$BUILD_DATE \
41+ org.opencontainers.image.version=$APP_VERSION \
42+ org.opencontainers.image.revision=$APP_REVISION \
43+ org.opencontainers.image.title="llama.cpp" \
44+ org.opencontainers.image.description="LLM inference in C/C++" \
45+ org.opencontainers.image.url=$IMAGE_URL \
46+ org.opencontainers.image.source=$IMAGE_SOURCE
47+
3148COPY --from=build /app/build/bin/llama-cli /app/build/bin/llama-completion /
3249
3350ENV LC_ALL=C.utf8
Original file line number Diff line number Diff line change @@ -6,6 +6,10 @@ ARG BASE_MUSA_DEV_CONTAINER=mthreads/musa:${MUSA_VERSION}-devel-ubuntu${UBUNTU_V
66
77ARG BASE_MUSA_RUN_CONTAINER=mthreads/musa:${MUSA_VERSION}-runtime-ubuntu${UBUNTU_VERSION}-amd64
88
9+ ARG BUILD_DATE=N/A
10+ ARG APP_VERSION=N/A
11+ ARG APP_REVISION=N/A
12+
913FROM ${BASE_MUSA_DEV_CONTAINER} AS build
1014
1115# MUSA architecture to build for (defaults to all supported archs)
@@ -45,6 +49,19 @@ RUN mkdir -p /app/full \
4549# # Base image
4650FROM ${BASE_MUSA_RUN_CONTAINER} AS base
4751
52+ ARG BUILD_DATE=N/A
53+ ARG APP_VERSION=N/A
54+ ARG APP_REVISION=N/A
55+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
56+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
57+ LABEL org.opencontainers.image.created=$BUILD_DATE \
58+ org.opencontainers.image.version=$APP_VERSION \
59+ org.opencontainers.image.revision=$APP_REVISION \
60+ org.opencontainers.image.title="llama.cpp" \
61+ org.opencontainers.image.description="LLM inference in C/C++" \
62+ org.opencontainers.image.url=$IMAGE_URL \
63+ org.opencontainers.image.source=$IMAGE_SOURCE
64+
4865RUN apt-get update \
4966 && apt-get install -y libgomp1 curl \
5067 && apt autoremove -y \
Original file line number Diff line number Diff line change @@ -18,6 +18,10 @@ ARG LIBZE1_VERSION=1.27.0-1~24.04~ppa2
1818ARG http_proxy=
1919ARG https_proxy=
2020
21+ ARG BUILD_DATE=N/A
22+ ARG APP_VERSION=N/A
23+ ARG APP_REVISION=N/A
24+
2125# # Build Image
2226FROM ubuntu:${UBUNTU_VERSION} AS build
2327
@@ -88,6 +92,18 @@ FROM ubuntu:${UBUNTU_VERSION} AS base
8892# Pass proxy args to runtime stage
8993ARG http_proxy
9094ARG https_proxy
95+ ARG BUILD_DATE=N/A
96+ ARG APP_VERSION=N/A
97+ ARG APP_REVISION=N/A
98+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
99+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
100+ LABEL org.opencontainers.image.created=$BUILD_DATE \
101+ org.opencontainers.image.version=$APP_VERSION \
102+ org.opencontainers.image.revision=$APP_REVISION \
103+ org.opencontainers.image.title="llama.cpp" \
104+ org.opencontainers.image.description="LLM inference in C/C++" \
105+ org.opencontainers.image.url=$IMAGE_URL \
106+ org.opencontainers.image.source=$IMAGE_SOURCE
91107
92108RUN apt-get update \
93109 && apt-get install -y libgomp1 libtbb12 curl wget ocl-icd-libopencl1 \
Original file line number Diff line number Diff line change @@ -7,6 +7,10 @@ ARG AMDGPU_VERSION=7.2.1
77# Target the ROCm build image
88ARG BASE_ROCM_DEV_CONTAINER=rocm/dev-ubuntu-${UBUNTU_VERSION}:${ROCM_VERSION}-complete
99
10+ ARG BUILD_DATE=N/A
11+ ARG APP_VERSION=N/A
12+ ARG APP_REVISION=N/A
13+
1014# ## Build image
1115FROM ${BASE_ROCM_DEV_CONTAINER} AS build
1216
@@ -57,6 +61,19 @@ RUN mkdir -p /app/full \
5761# # Base image
5862FROM ${BASE_ROCM_DEV_CONTAINER} AS base
5963
64+ ARG BUILD_DATE=N/A
65+ ARG APP_VERSION=N/A
66+ ARG APP_REVISION=N/A
67+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
68+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
69+ LABEL org.opencontainers.image.created=$BUILD_DATE \
70+ org.opencontainers.image.version=$APP_VERSION \
71+ org.opencontainers.image.revision=$APP_REVISION \
72+ org.opencontainers.image.title="llama.cpp" \
73+ org.opencontainers.image.description="LLM inference in C/C++" \
74+ org.opencontainers.image.url=$IMAGE_URL \
75+ org.opencontainers.image.source=$IMAGE_SOURCE
76+
6077RUN apt-get update \
6178 && apt-get install -y libgomp1 curl \
6279 && apt autoremove -y \
Original file line number Diff line number Diff line change 11ARG GCC_VERSION=15.2.0
22ARG UBUNTU_VERSION=24.04
3+ ARG BUILD_DATE=N/A
4+ ARG APP_VERSION=N/A
5+ ARG APP_REVISION=N/A
36
47# ## Build Llama.cpp stage
58FROM gcc:${GCC_VERSION} AS build
@@ -52,6 +55,19 @@ COPY --from=build /opt/llama.cpp/gguf-py /llama.cpp/gguf-py
5255# ## Base image
5356FROM ubuntu:${UBUNTU_VERSION} AS base
5457
58+ ARG BUILD_DATE=N/A
59+ ARG APP_VERSION=N/A
60+ ARG APP_REVISION=N/A
61+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
62+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
63+ LABEL org.opencontainers.image.created=$BUILD_DATE \
64+ org.opencontainers.image.version=$APP_VERSION \
65+ org.opencontainers.image.revision=$APP_REVISION \
66+ org.opencontainers.image.title="llama.cpp" \
67+ org.opencontainers.image.description="LLM inference in C/C++" \
68+ org.opencontainers.image.url=$IMAGE_URL \
69+ org.opencontainers.image.source=$IMAGE_SOURCE
70+
5571RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
5672 --mount=type=cache,target=/var/lib/apt/lists,sharing=locked \
5773 apt update -y && \
Original file line number Diff line number Diff line change 11ARG UBUNTU_VERSION=26.04
2+ ARG BUILD_DATE=N/A
3+ ARG APP_VERSION=N/A
4+ ARG APP_REVISION=N/A
25
36FROM ubuntu:$UBUNTU_VERSION AS build
47
@@ -31,6 +34,19 @@ RUN mkdir -p /app/full \
3134# # Base image
3235FROM ubuntu:$UBUNTU_VERSION AS base
3336
37+ ARG BUILD_DATE=N/A
38+ ARG APP_VERSION=N/A
39+ ARG APP_REVISION=N/A
40+ ARG IMAGE_URL=https://github.com/ggml-org/llama.cpp
41+ ARG IMAGE_SOURCE=https://github.com/ggml-org/llama.cpp
42+ LABEL org.opencontainers.image.created=$BUILD_DATE \
43+ org.opencontainers.image.version=$APP_VERSION \
44+ org.opencontainers.image.revision=$APP_REVISION \
45+ org.opencontainers.image.title="llama.cpp" \
46+ org.opencontainers.image.description="LLM inference in C/C++" \
47+ org.opencontainers.image.url=$IMAGE_URL \
48+ org.opencontainers.image.source=$IMAGE_SOURCE
49+
3450RUN apt-get update \
3551 && apt-get install -y libgomp1 curl libvulkan1 mesa-vulkan-drivers \
3652 libglvnd0 libgl1 libglx0 libegl1 libgles2 \
You can’t perform that action at this time.
0 commit comments