Skip to content

Commit 00c0c4c

Browse files
committed
Merge branch 'master' into pr/19493
2 parents e1141d1 + 277ff5f commit 00c0c4c

113 files changed

Lines changed: 44737 additions & 7785 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.devops/cuda-new.Dockerfile

Lines changed: 0 additions & 97 deletions
This file was deleted.

.devops/nix/package.nix

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@
1616
rocmPackages,
1717
vulkan-headers,
1818
vulkan-loader,
19-
curl,
19+
openssl,
2020
shaderc,
2121
useBlas ?
2222
builtins.all (x: !x) [
@@ -160,7 +160,8 @@ effectiveStdenv.mkDerivation (finalAttrs: {
160160
++ optionals useMpi [ mpi ]
161161
++ optionals useRocm rocmBuildInputs
162162
++ optionals useBlas [ blas ]
163-
++ optionals useVulkan vulkanBuildInputs;
163+
++ optionals useVulkan vulkanBuildInputs
164+
++ [ openssl ];
164165

165166
cmakeFlags =
166167
[

.devops/rocm.Dockerfile

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
ARG UBUNTU_VERSION=24.04
22

33
# This needs to generally match the container host's environment.
4-
ARG ROCM_VERSION=7.2
5-
ARG AMDGPU_VERSION=7.2
4+
ARG ROCM_VERSION=7.2.1
5+
ARG AMDGPU_VERSION=7.2.1
66

77
# Target the ROCm build image
88
ARG BASE_ROCM_DEV_CONTAINER=rocm/dev-ubuntu-${UBUNTU_VERSION}:${ROCM_VERSION}-complete
@@ -12,11 +12,11 @@ FROM ${BASE_ROCM_DEV_CONTAINER} AS build
1212

1313
# Unless otherwise specified, we make a fat build.
1414
# This is mostly tied to rocBLAS supported archs.
15-
# check https://rocm.docs.amd.com/projects/install-on-linux/en/docs-7.2.0/reference/system-requirements.html
15+
# check https://rocm.docs.amd.com/projects/install-on-linux/en/docs-7.2.1/reference/system-requirements.html
1616
# check https://rocm.docs.amd.com/projects/radeon-ryzen/en/latest/docs/compatibility/compatibilityrad/native_linux/native_linux_compatibility.html
1717
# check https://rocm.docs.amd.com/projects/radeon-ryzen/en/latest/docs/compatibility/compatibilityryz/native_linux/native_linux_compatibility.html
1818

19-
ARG ROCM_DOCKER_ARCH='gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1151;gfx1150;gfx1200;gfx1201'
19+
ARG ROCM_DOCKER_ARCH='gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1151;gfx1150;gfx1200;gfx1201'
2020

2121
# Set ROCm architectures
2222
ENV AMDGPU_TARGETS=${ROCM_DOCKER_ARCH}

.github/labeler.yml

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,6 +27,11 @@ IBM zDNN:
2727
- any-glob-to-any-file:
2828
- ggml/include/ggml-zdnn.h
2929
- ggml/src/ggml-zdnn/**
30+
AMD ZenDNN:
31+
- changed-files:
32+
- any-glob-to-any-file:
33+
- ggml/include/ggml-zendnn.h
34+
- ggml/src/ggml-zendnn/**
3035
documentation:
3136
- changed-files:
3237
- any-glob-to-any-file:

.github/workflows/build.yml

Lines changed: 19 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -150,16 +150,15 @@ jobs:
150150
- name: Dawn Dependency
151151
id: dawn-depends
152152
run: |
153-
DAWN_VERSION="v2.0.0"
154-
DAWN_OWNER="reeselevine"
153+
DAWN_VERSION="v20260317.182325"
154+
DAWN_OWNER="google"
155155
DAWN_REPO="dawn"
156-
DAWN_ASSET_NAME="Dawn-5e9a4865b1635796ccc77dd30057f2b4002a1355-macos-latest-Release"
157-
echo "Fetching release asset from https://github.com/${DAWN_OWNER}/${DAWN_REPO}/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.zip"
158-
curl -L -o artifact.zip \
159-
"https://github.com/${DAWN_OWNER}/${DAWN_REPO}/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.zip"
156+
DAWN_ASSET_NAME="Dawn-18eb229ef5f707c1464cc581252e7603c73a3ef0-macos-latest-Release"
157+
echo "Fetching release asset from https://github.com/google/dawn/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.tar.gz"
158+
curl -L -o artifact.tar.gz \
159+
"https://github.com/google/dawn/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.tar.gz"
160160
mkdir dawn
161-
unzip artifact.zip
162-
tar -xvf ${DAWN_ASSET_NAME}.tar.gz -C dawn --strip-components=1
161+
tar -xvf artifact.tar.gz -C dawn --strip-components=1
163162
164163
- name: Build
165164
id: cmake_build
@@ -384,16 +383,15 @@ jobs:
384383
id: dawn-depends
385384
run: |
386385
sudo apt-get install -y libxrandr-dev libxinerama-dev libxcursor-dev mesa-common-dev libx11-xcb-dev libxi-dev
387-
DAWN_VERSION="v2.0.0"
388-
DAWN_OWNER="reeselevine"
386+
DAWN_VERSION="v20260317.182325"
387+
DAWN_OWNER="google"
389388
DAWN_REPO="dawn"
390-
DAWN_ASSET_NAME="Dawn-5e9a4865b1635796ccc77dd30057f2b4002a1355-ubuntu-latest-Release"
391-
echo "Fetching release asset from https://github.com/${DAWN_OWNER}/${DAWN_REPO}/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.zip"
392-
curl -L -o artifact.zip \
393-
"https://github.com/${DAWN_OWNER}/${DAWN_REPO}/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.zip"
389+
DAWN_ASSET_NAME="Dawn-18eb229ef5f707c1464cc581252e7603c73a3ef0-ubuntu-latest-Release"
390+
echo "Fetching release asset from https://github.com/google/dawn/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.tar.gz"
391+
curl -L -o artifact.tar.gz \
392+
"https://github.com/google/dawn/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.tar.gz"
394393
mkdir dawn
395-
unzip artifact.zip
396-
tar -xvf ${DAWN_ASSET_NAME}.tar.gz -C dawn --strip-components=1
394+
tar -xvf artifact.tar.gz -C dawn --strip-components=1
397395
398396
- name: Build
399397
id: cmake_build
@@ -427,7 +425,7 @@ jobs:
427425
428426
- name: Fetch emdawnwebgpu
429427
run: |
430-
DAWN_TAG="v20251027.212519"
428+
DAWN_TAG="v20260317.182325"
431429
EMDAWN_PKG="emdawnwebgpu_pkg-${DAWN_TAG}.zip"
432430
echo "Downloading ${EMDAWN_PKG}"
433431
curl -L -o emdawn.zip \
@@ -474,6 +472,7 @@ jobs:
474472
cmake -B build -S . \
475473
-DCMAKE_HIP_COMPILER="$(hipconfig -l)/clang" \
476474
-DGGML_HIP_ROCWMMA_FATTN=ON \
475+
-DGPU_TARGETS="gfx1030" \
477476
-DGGML_HIP=ON
478477
cmake --build build --config Release -j $(nproc)
479478
@@ -943,7 +942,7 @@ jobs:
943942
- name: Grab rocWMMA package
944943
id: grab_rocwmma
945944
run: |
946-
curl -o rocwmma.deb "https://repo.radeon.com/rocm/apt/7.2/pool/main/r/rocwmma-dev/rocwmma-dev_2.2.0.70200-43~24.04_amd64.deb"
945+
curl -o rocwmma.deb "https://repo.radeon.com/rocm/apt/7.2.1/pool/main/r/rocwmma-dev/rocwmma-dev_2.2.0.70201-81~24.04_amd64.deb"
947946
7z x rocwmma.deb
948947
7z x data.tar
949948
@@ -986,12 +985,13 @@ jobs:
986985
cmake -G "Unix Makefiles" -B build -S . `
987986
-DCMAKE_C_COMPILER="${env:HIP_PATH}\bin\clang.exe" `
988987
-DCMAKE_CXX_COMPILER="${env:HIP_PATH}\bin\clang++.exe" `
989-
-DCMAKE_CXX_FLAGS="-I$($PWD.Path.Replace('\', '/'))/opt/rocm-7.2.0/include/" `
988+
-DCMAKE_CXX_FLAGS="-I$($PWD.Path.Replace('\', '/'))/opt/rocm-7.2.1/include/" `
990989
-DCMAKE_BUILD_TYPE=Release `
991990
-DLLAMA_BUILD_BORINGSSL=ON `
992991
-DROCM_DIR="${env:HIP_PATH}" `
993992
-DGGML_HIP=ON `
994993
-DGGML_HIP_ROCWMMA_FATTN=ON `
994+
-DGPU_TARGETS="gfx1100" `
995995
-DGGML_RPC=ON
996996
cmake --build build -j ${env:NUMBER_OF_PROCESSORS}
997997

.github/workflows/docker.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -73,10 +73,10 @@ jobs:
7373
{ "tag": "cpu", "dockerfile": ".devops/cpu.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": false, "runs_on": "ubuntu-24.04" },
7474
{ "tag": "cpu", "dockerfile": ".devops/cpu.Dockerfile", "platforms": "linux/arm64", "full": true, "light": true, "server": true, "free_disk_space": false, "runs_on": "ubuntu-24.04-arm" },
7575
{ "tag": "cpu", "dockerfile": ".devops/s390x.Dockerfile", "platforms": "linux/s390x", "full": true, "light": true, "server": true, "free_disk_space": false, "runs_on": "ubuntu-24.04-s390x" },
76-
{ "tag": "cuda cuda12", "dockerfile": ".devops/cuda.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
77-
{ "tag": "cuda cuda12", "dockerfile": ".devops/cuda.Dockerfile", "platforms": "linux/arm64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04-arm" },
78-
{ "tag": "cuda13", "dockerfile": ".devops/cuda-new.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
79-
{ "tag": "cuda13", "dockerfile": ".devops/cuda-new.Dockerfile", "platforms": "linux/arm64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04-arm" },
76+
{ "tag": "cuda cuda12", "dockerfile": ".devops/cuda.Dockerfile", "cuda_version": "12.9.1", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
77+
{ "tag": "cuda cuda12", "dockerfile": ".devops/cuda.Dockerfile", "cuda_version": "12.9.1", "platforms": "linux/arm64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04-arm" },
78+
{ "tag": "cuda13", "dockerfile": ".devops/cuda.Dockerfile", "cuda_version": "13.1.1", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
79+
{ "tag": "cuda13", "dockerfile": ".devops/cuda.Dockerfile", "cuda_version": "13.1.1", "platforms": "linux/arm64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04-arm" },
8080
{ "tag": "musa", "dockerfile": ".devops/musa.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
8181
{ "tag": "intel", "dockerfile": ".devops/intel.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": true, "runs_on": "ubuntu-24.04" },
8282
{ "tag": "vulkan", "dockerfile": ".devops/vulkan.Dockerfile", "platforms": "linux/amd64", "full": true, "light": true, "server": true, "free_disk_space": false, "runs_on": "ubuntu-24.04" },

.github/workflows/hip-quality-check.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ env:
3535
jobs:
3636
ubuntu-22-hip-quality-check:
3737
runs-on: ubuntu-22.04
38-
container: rocm/dev-ubuntu-22.04:7.2
38+
container: rocm/dev-ubuntu-22.04:7.2.1
3939
steps:
4040
- name: Clone
4141
id: checkout
@@ -59,7 +59,7 @@ jobs:
5959
run: |
6060
cmake -B build -S . \
6161
-DCMAKE_HIP_COMPILER="$(hipconfig -l)/clang" \
62-
-DGPU_TARGETS=gfx908 \
62+
-DGPU_TARGETS=gfx942 \
6363
-DGGML_HIP=ON \
6464
-DGGML_HIP_EXPORT_METRICS=Off \
6565
-DCMAKE_HIP_FLAGS="-Werror -Wno-tautological-compare" \

.github/workflows/release.yml

Lines changed: 12 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -639,8 +639,8 @@ jobs:
639639
strategy:
640640
matrix:
641641
include:
642-
- ROCM_VERSION: "7.2"
643-
gpu_targets: "gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1151;gfx1150;gfx1200;gfx1201"
642+
- ROCM_VERSION: "7.2.1"
643+
gpu_targets: "gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1151;gfx1150;gfx1200;gfx1201"
644644
build: 'x64'
645645

646646
steps:
@@ -662,7 +662,7 @@ jobs:
662662
sudo apt install -y build-essential git cmake wget
663663
664664
- name: Setup Legacy ROCm
665-
if: matrix.ROCM_VERSION == '7.2'
665+
if: matrix.ROCM_VERSION == '7.2.1'
666666
id: legacy_env
667667
run: |
668668
sudo mkdir --parents --mode=0755 /etc/apt/keyrings
@@ -683,7 +683,7 @@ jobs:
683683
sudo apt-get install -y libssl-dev rocm-hip-sdk
684684
685685
- name: Setup TheRock
686-
if: matrix.ROCM_VERSION != '7.2'
686+
if: matrix.ROCM_VERSION != '7.2.1'
687687
id: therock_env
688688
run: |
689689
wget https://repo.amd.com/rocm/tarball/therock-dist-linux-gfx1151-${{ matrix.ROCM_VERSION }}.tar.gz
@@ -699,7 +699,6 @@ jobs:
699699
run: |
700700
cmake -B build -S . \
701701
-DCMAKE_HIP_COMPILER="$(hipconfig -l)/clang" \
702-
-DCMAKE_HIP_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600" \
703702
-DCMAKE_BUILD_TYPE=Release \
704703
-DGGML_BACKEND_DL=ON \
705704
-DGGML_NATIVE=OFF \
@@ -717,17 +716,20 @@ jobs:
717716
id: tag
718717
uses: ./.github/actions/get-tag-name
719718

719+
- name: Get ROCm short version
720+
run: echo "ROCM_VERSION_SHORT=$(echo '${{ matrix.ROCM_VERSION }}' | cut -d '.' -f 1,2)" >> $GITHUB_ENV
721+
720722
- name: Pack artifacts
721723
id: pack_artifacts
722724
run: |
723725
cp LICENSE ./build/bin/
724-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ matrix.ROCM_VERSION }}-${{ matrix.build }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
726+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ env.ROCM_VERSION_SHORT }}-${{ matrix.build }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
725727
726728
- name: Upload artifacts
727729
uses: actions/upload-artifact@v6
728730
with:
729-
path: llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ matrix.ROCM_VERSION }}-${{ matrix.build }}.tar.gz
730-
name: llama-bin-ubuntu-rocm-${{ matrix.ROCM_VERSION }}-${{ matrix.build }}.tar.gz
731+
path: llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ env.ROCM_VERSION_SHORT }}-${{ matrix.build }}.tar.gz
732+
name: llama-bin-ubuntu-rocm-${{ env.ROCM_VERSION_SHORT }}-${{ matrix.build }}.tar.gz
731733

732734
windows-hip:
733735
runs-on: windows-2022
@@ -749,7 +751,7 @@ jobs:
749751
- name: Grab rocWMMA package
750752
id: grab_rocwmma
751753
run: |
752-
curl -o rocwmma.deb "https://repo.radeon.com/rocm/apt/7.2/pool/main/r/rocwmma-dev/rocwmma-dev_2.2.0.70200-43~24.04_amd64.deb"
754+
curl -o rocwmma.deb "https://repo.radeon.com/rocm/apt/7.2.1/pool/main/r/rocwmma-dev/rocwmma-dev_2.2.0.70201-81~24.04_amd64.deb"
753755
7z x rocwmma.deb
754756
7z x data.tar
755757
@@ -806,7 +808,7 @@ jobs:
806808
cmake -G "Unix Makefiles" -B build -S . `
807809
-DCMAKE_C_COMPILER="${env:HIP_PATH}\bin\clang.exe" `
808810
-DCMAKE_CXX_COMPILER="${env:HIP_PATH}\bin\clang++.exe" `
809-
-DCMAKE_CXX_FLAGS="-I$($PWD.Path.Replace('\', '/'))/opt/rocm-7.2.0/include/ -Wno-ignored-attributes -Wno-nested-anon-types" `
811+
-DCMAKE_CXX_FLAGS="-I$($PWD.Path.Replace('\', '/'))/opt/rocm-7.2.1/include/ -Wno-ignored-attributes -Wno-nested-anon-types" `
810812
-DCMAKE_BUILD_TYPE=Release `
811813
-DGGML_BACKEND_DL=ON `
812814
-DGGML_NATIVE=OFF `

0 commit comments

Comments
 (0)