Skip to content

Commit 2b61ea2

Browse files
authored
Merge pull request #146 from TheTom/sync/upstream-b9190-mtp
sync: upstream master b9190 + MTP/spec stack (DO NOT MERGE — tester review)
2 parents 5aeb2fd + eef2db4 commit 2b61ea2

1,278 files changed

Lines changed: 117661 additions & 71756 deletions

File tree

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

.devops/intel.Dockerfile

Lines changed: 14 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,19 @@
1-
ARG ONEAPI_VERSION=2025.3.2-0-devel-ubuntu24.04
1+
ARG ONEAPI_VERSION=2025.3.3-0-devel-ubuntu24.04
22

33
## Build Image
44

55
FROM intel/deep-learning-essentials:$ONEAPI_VERSION AS build
66

77
ARG GGML_SYCL_F16=OFF
8+
ARG LEVEL_ZERO_VERSION=1.28.2
9+
ARG LEVEL_ZERO_UBUNTU_VERSION=u24.04
810
RUN apt-get update && \
9-
apt-get install -y git libssl-dev
11+
apt-get install -y git libssl-dev wget ca-certificates && \
12+
cd /tmp && \
13+
wget -q "https://github.com/oneapi-src/level-zero/releases/download/v${LEVEL_ZERO_VERSION}/level-zero_${LEVEL_ZERO_VERSION}%2B${LEVEL_ZERO_UBUNTU_VERSION}_amd64.deb" -O level-zero.deb && \
14+
wget -q "https://github.com/oneapi-src/level-zero/releases/download/v${LEVEL_ZERO_VERSION}/level-zero-devel_${LEVEL_ZERO_VERSION}%2B${LEVEL_ZERO_UBUNTU_VERSION}_amd64.deb" -O level-zero-devel.deb && \
15+
apt-get -o Dpkg::Options::="--force-overwrite" install -y ./level-zero.deb ./level-zero-devel.deb && \
16+
rm -f /tmp/level-zero.deb /tmp/level-zero-devel.deb
1017

1118
WORKDIR /app
1219

@@ -33,11 +40,11 @@ RUN mkdir -p /app/full \
3340

3441
FROM intel/deep-learning-essentials:$ONEAPI_VERSION AS base
3542

36-
ARG IGC_VERSION=v2.30.1
37-
ARG IGC_VERSION_FULL=2_2.30.1+20950
38-
ARG COMPUTE_RUNTIME_VERSION=26.09.37435.1
39-
ARG COMPUTE_RUNTIME_VERSION_FULL=26.09.37435.1-0
40-
ARG IGDGMM_VERSION=22.9.0
43+
ARG IGC_VERSION=v2.20.5
44+
ARG IGC_VERSION_FULL=2_2.20.5+19972
45+
ARG COMPUTE_RUNTIME_VERSION=25.40.35563.10
46+
ARG COMPUTE_RUNTIME_VERSION_FULL=25.40.35563.10-0
47+
ARG IGDGMM_VERSION=22.8.2
4148
RUN mkdir /tmp/neo/ && cd /tmp/neo/ \
4249
&& wget https://github.com/intel/intel-graphics-compiler/releases/download/$IGC_VERSION/intel-igc-core-${IGC_VERSION_FULL}_amd64.deb \
4350
&& wget https://github.com/intel/intel-graphics-compiler/releases/download/$IGC_VERSION/intel-igc-opencl-${IGC_VERSION_FULL}_amd64.deb \
@@ -109,4 +116,3 @@ WORKDIR /app
109116
HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ]
110117

111118
ENTRYPOINT [ "/app/llama-server" ]
112-

.devops/nix/package.nix

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -147,7 +147,6 @@ effectiveStdenv.mkDerivation (finalAttrs: {
147147
ninja
148148
pkg-config
149149
git
150-
spirv-headers
151150
]
152151
++ optionals useCuda [
153152
cudaPackages.cuda_nvcc

.devops/openvino.Dockerfile

Lines changed: 48 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,19 @@ ARG OPENVINO_VERSION_MAJOR=2026.0
22
ARG OPENVINO_VERSION_FULL=2026.0.0.20965.c6d6a13a886
33
ARG UBUNTU_VERSION=24.04
44

5-
# Optional proxy build arguments - empty by default
5+
# Intel GPU driver versions. https://github.com/intel/compute-runtime/releases
6+
ARG IGC_VERSION=v2.30.1
7+
ARG IGC_VERSION_FULL=2_2.30.1+20950
8+
ARG COMPUTE_RUNTIME_VERSION=26.09.37435.1
9+
ARG COMPUTE_RUNTIME_VERSION_FULL=26.09.37435.1-0
10+
ARG IGDGMM_VERSION=22.9.0
11+
12+
# Intel NPU driver versions. https://github.com/intel/linux-npu-driver/releases
13+
ARG NPU_DRIVER_VERSION=v1.32.0
14+
ARG NPU_DRIVER_FULL=v1.32.0.20260402-23905121947
15+
ARG LIBZE1_VERSION=1.27.0-1~24.04~ppa2
16+
17+
# Optional proxy build arguments
618
ARG http_proxy=
719
ARG https_proxy=
820

@@ -78,13 +90,47 @@ ARG http_proxy
7890
ARG https_proxy
7991

8092
RUN apt-get update \
81-
&& apt-get install -y libgomp1 libtbb12 curl \
93+
&& apt-get install -y libgomp1 libtbb12 curl wget ocl-icd-libopencl1 \
8294
&& apt autoremove -y \
8395
&& apt clean -y \
8496
&& rm -rf /tmp/* /var/tmp/* \
8597
&& find /var/cache/apt/archives /var/lib/apt/lists -not -name lock -type f -delete \
8698
&& find /var/cache -type f -delete
8799

100+
# Install GPU drivers
101+
ARG IGC_VERSION
102+
ARG IGC_VERSION_FULL
103+
ARG COMPUTE_RUNTIME_VERSION
104+
ARG COMPUTE_RUNTIME_VERSION_FULL
105+
ARG IGDGMM_VERSION
106+
RUN mkdir /tmp/neo/ && cd /tmp/neo/ \
107+
&& wget https://github.com/intel/intel-graphics-compiler/releases/download/${IGC_VERSION}/intel-igc-core-${IGC_VERSION_FULL}_amd64.deb \
108+
&& wget https://github.com/intel/intel-graphics-compiler/releases/download/${IGC_VERSION}/intel-igc-opencl-${IGC_VERSION_FULL}_amd64.deb \
109+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/intel-ocloc-dbgsym_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.ddeb \
110+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/intel-ocloc_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.deb \
111+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/intel-opencl-icd-dbgsym_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.ddeb \
112+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/intel-opencl-icd_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.deb \
113+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/libigdgmm12_${IGDGMM_VERSION}_amd64.deb \
114+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/libze-intel-gpu1-dbgsym_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.ddeb \
115+
&& wget https://github.com/intel/compute-runtime/releases/download/${COMPUTE_RUNTIME_VERSION}/libze-intel-gpu1_${COMPUTE_RUNTIME_VERSION_FULL}_amd64.deb \
116+
&& dpkg --install *.deb \
117+
&& rm -rf /tmp/neo/
118+
119+
# Install NPU drivers
120+
ARG NPU_DRIVER_VERSION
121+
ARG NPU_DRIVER_FULL
122+
ARG LIBZE1_VERSION
123+
RUN mkdir /tmp/npu/ && cd /tmp/npu/ \
124+
&& wget https://github.com/intel/linux-npu-driver/releases/download/${NPU_DRIVER_VERSION}/linux-npu-driver-${NPU_DRIVER_FULL}-ubuntu2404.tar.gz \
125+
&& tar -xf linux-npu-driver-${NPU_DRIVER_FULL}-ubuntu2404.tar.gz \
126+
&& dpkg --install *.deb \
127+
&& rm -rf /tmp/npu/
128+
129+
RUN cd /tmp \
130+
&& wget https://snapshot.ppa.launchpadcontent.net/kobuk-team/intel-graphics/ubuntu/20260324T100000Z/pool/main/l/level-zero-loader/libze1_${LIBZE1_VERSION}_amd64.deb \
131+
&& dpkg --install libze1_${LIBZE1_VERSION}_amd64.deb \
132+
&& rm libze1_${LIBZE1_VERSION}_amd64.deb
133+
88134
COPY --from=build /app/lib/ /app/
89135

90136
### Full (all binaries)

.editorconfig

Lines changed: 1 addition & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -45,15 +45,7 @@ insert_final_newline = unset
4545
trim_trailing_whitespace = unset
4646
insert_final_newline = unset
4747

48-
[tools/server/webui/**]
49-
indent_style = unset
50-
indent_size = unset
51-
end_of_line = unset
52-
charset = unset
53-
trim_trailing_whitespace = unset
54-
insert_final_newline = unset
55-
56-
[tools/server/public/**]
48+
[tools/ui/**]
5749
indent_style = unset
5850
indent_size = unset
5951
end_of_line = unset

.gitattributes

Lines changed: 0 additions & 4 deletions
This file was deleted.

.github/ISSUE_TEMPLATE/010-bug-compilation.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,8 @@ body:
1212
after recreating the CMake build directory and with `-DGGML_CCACHE=OFF`.
1313
If the compilation succeeds with ccache disabled you should be able to permanently fix the issue
1414
by clearing `~/.cache/ccache` (on Linux).
15+
16+
Please fill out this template yourself, copypasting language model outputs is [strictly prohibited](https://github.com/ggml-org/llama.cpp/blob/master/CONTRIBUTING.md#ai-usage-policy).
1517
- type: textarea
1618
id: commit
1719
attributes:

.github/ISSUE_TEMPLATE/011-bug-results.yml

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
name: Bug (model use)
2-
description: Something goes wrong when using a model (in general, not specific to a single llama.cpp module).
2+
description: Something goes wrong when running a model (crashes, garbled outputs, etc.).
33
title: "Eval bug: "
44
labels: ["bug-unconfirmed", "model evaluation"]
55
body:
@@ -12,6 +12,8 @@ body:
1212
If you encountered the issue while using an external UI (e.g. ollama),
1313
please reproduce your issue using one of the examples/binaries in this repository.
1414
The `llama-completion` binary can be used for simple and reproducible model inference.
15+
16+
Please fill out this template yourself, copypasting language model outputs is [strictly prohibited](https://github.com/ggml-org/llama.cpp/blob/master/CONTRIBUTING.md#ai-usage-policy).
1517
- type: textarea
1618
id: version
1719
attributes:

.github/ISSUE_TEMPLATE/019-bug-misc.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,8 @@ body:
1010
This issue template is intended for miscellaneous bugs that don't fit into any other category.
1111
If you encountered the issue while using an external UI (e.g. ollama),
1212
please reproduce your issue using one of the examples/binaries in this repository.
13+
14+
Please fill out this template yourself, copypasting language model outputs is [strictly prohibited](https://github.com/ggml-org/llama.cpp/blob/master/CONTRIBUTING.md#ai-usage-policy).
1315
- type: textarea
1416
id: version
1517
attributes:

.github/ISSUE_TEMPLATE/020-enhancement.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,8 @@ body:
88
value: |
99
[Please post your idea first in Discussion if there is not yet a consensus for this enhancement request. This will help to keep this issue tracker focused on enhancements that the community has agreed needs to be implemented.](https://github.com/ggml-org/llama.cpp/discussions/categories/ideas)
1010
11+
Please fill out this template yourself, copypasting language model outputs is [strictly prohibited](https://github.com/ggml-org/llama.cpp/blob/master/CONTRIBUTING.md#ai-usage-policy).
12+
1113
- type: checkboxes
1214
id: prerequisites
1315
attributes:

.github/ISSUE_TEMPLATE/030-research.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,8 @@ body:
88
value: |
99
Don't forget to check for any [duplicate research issue tickets](https://github.com/ggml-org/llama.cpp/issues?q=is%3Aopen+is%3Aissue+label%3A%22research+%F0%9F%94%AC%22)
1010
11+
Please fill out this template yourself, copypasting language model outputs is [strictly prohibited](https://github.com/ggml-org/llama.cpp/blob/master/CONTRIBUTING.md#ai-usage-policy).
12+
1113
- type: checkboxes
1214
id: research-stage
1315
attributes:

0 commit comments

Comments
 (0)