5555 LLAMA_LOG_TIMESTAMPS : 1
5656
5757jobs :
determine-tag:
  # Resolves the tag name once and publishes it as the `tag_name` job output;
  # other jobs read it through needs.determine-tag.outputs.tag_name.
  name: Determine tag name
  runs-on: ubuntu-slim

  outputs:
    # Forwarded from the `name` output of the step with id `tag` below.
    tag_name: ${{ steps.tag.outputs.name }}

  steps:
    - name: Clone
      uses: actions/checkout@v6
      with:
        # 0 = fetch the full history instead of a shallow clone
        # (presumably required by the get-tag-name action - confirm).
        fetch-depth: 0

    - name: Determine tag name
      id: tag
      uses: ./.github/actions/get-tag-name
      env:
        # head_ref is only set for pull-request events; ref_name is the fallback.
        BRANCH_NAME: ${{ github.head_ref || github.ref_name }}
73+
5874 ggml-ci-nvidia-cuda :
75+ needs : determine-tag
5976 runs-on : [self-hosted, Linux, NVIDIA]
6077
6178 steps :
@@ -65,11 +82,14 @@ jobs:
6582
6683 - name : Test
6784 id : ggml-ci
85+ env :
86+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
6887 run : |
6988 nvidia-smi
7089 GG_BUILD_CUDA=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
7190
7291 ggml-ci-nvidia-vulkan-cm :
92+ needs : determine-tag
7393 runs-on : [self-hosted, Linux, NVIDIA]
7494
7595 steps :
@@ -79,11 +99,14 @@ jobs:
7999
80100 - name : Test
81101 id : ggml-ci
102+ env :
103+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
82104 run : |
83105 vulkaninfo --summary
84106 GG_BUILD_VULKAN=1 GGML_VK_DISABLE_COOPMAT2=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
85107
86108 ggml-ci-nvidia-vulkan-cm2 :
109+ needs : determine-tag
87110 runs-on : [self-hosted, Linux, NVIDIA, COOPMAT2]
88111
89112 steps :
@@ -93,39 +116,40 @@ jobs:
93116
94117 - name : Test
95118 id : ggml-ci
119+ env :
120+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
96121 run : |
97122 vulkaninfo --summary
98123 GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
99124
ggml-ci-nvidia-webgpu:
  # Runs ci/run.sh with the WebGPU backend on the self-hosted NVIDIA Linux
  # runner, using a prebuilt Dawn release unpacked into $GITHUB_WORKSPACE/dawn.
  # Waits for determine-tag so HF_UI_VERSION can be passed to the test step,
  # matching every other job in this workflow that invokes ci/run.sh.
  needs: determine-tag
  runs-on: [self-hosted, Linux, NVIDIA]

  steps:
    - name: Clone
      id: checkout
      uses: actions/checkout@v6

    - name: Dawn Dependency
      id: dawn-depends
      run: |
        DAWN_VERSION="v20260317.182325"
        DAWN_OWNER="google"
        DAWN_REPO="dawn"
        DAWN_ASSET_NAME="Dawn-18eb229ef5f707c1464cc581252e7603c73a3ef0-ubuntu-latest-Release"
        # Build the URL once from the variables above so the logged URL and the
        # downloaded URL cannot drift apart.
        DAWN_URL="https://github.com/${DAWN_OWNER}/${DAWN_REPO}/releases/download/${DAWN_VERSION}/${DAWN_ASSET_NAME}.tar.gz"
        echo "Fetching release asset from ${DAWN_URL}"
        # --fail: exit non-zero on an HTTP error instead of saving the error
        # page as artifact.tar.gz and failing later inside tar.
        curl --fail -L -o artifact.tar.gz "${DAWN_URL}"
        mkdir dawn
        tar -xvf artifact.tar.gz -C dawn --strip-components=1

    - name: Test
      id: ggml-ci
      env:
        HF_UI_VERSION: ${{ needs.determine-tag.outputs.tag_name }}
      run: |
        GG_BUILD_WEBGPU=1 \
        GG_BUILD_WEBGPU_DAWN_PREFIX="$GITHUB_WORKSPACE/dawn" \
        GG_BUILD_WEBGPU_DAWN_DIR="$GITHUB_WORKSPACE/dawn/lib64/cmake/Dawn" \
        bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
129153
130154 # TODO: provision AMX-compatible machine
131155 # ggml-ci-cpu-amx:
@@ -172,6 +196,7 @@ jobs:
172196 # GG_BUILD_ROCM=1 GG_BUILD_AMDGPU_TARGETS="gfx1101" bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
173197
174198 ggml-ci-mac-metal :
199+ needs : determine-tag
175200 runs-on : [self-hosted, macOS, ARM64]
176201
177202 steps :
@@ -181,10 +206,13 @@ jobs:
181206
182207 - name : Test
183208 id : ggml-ci
209+ env :
210+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
184211 run : |
185212 GG_BUILD_METAL=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
186213
187214 ggml-ci-mac-webgpu :
215+ needs : determine-tag
188216 runs-on : [self-hosted, macOS, ARM64]
189217
190218 steps :
@@ -207,11 +235,14 @@ jobs:
207235
208236 - name : Test
209237 id : ggml-ci
238+ env :
239+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
210240 run : |
211241 GG_BUILD_WEBGPU=1 GG_BUILD_WEBGPU_DAWN_PREFIX="$GITHUB_WORKSPACE/dawn" \
212242 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
213243
214244 ggml-ci-mac-vulkan :
245+ needs : determine-tag
215246 runs-on : [self-hosted, macOS, ARM64]
216247
217248 steps :
@@ -221,11 +252,14 @@ jobs:
221252
222253 - name : Test
223254 id : ggml-ci
255+ env :
256+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
224257 run : |
225258 vulkaninfo --summary
226259 GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
227260
228261 ggml-ci-linux-intel-vulkan :
262+ needs : determine-tag
229263 runs-on : [self-hosted, Linux, Intel]
230264
231265 steps :
@@ -237,11 +271,14 @@ jobs:
237271
238272 - name : Test
239273 id : ggml-ci
274+ env :
275+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
240276 run : |
241277 vulkaninfo --summary
242278 GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
243279
244280 ggml-ci-win-intel-vulkan :
281+ needs : determine-tag
245282 runs-on : [self-hosted, Windows, X64, Intel]
246283
247284 steps :
@@ -256,13 +293,15 @@ jobs:
256293 MSYSTEM : UCRT64
257294 CHERE_INVOKING : 1
258295 PATH : C:\msys64\ucrt64\bin;C:\msys64\usr\bin;C:\Windows\System32;${{ env.PATH }}
296+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
259297 run : |
260298 vulkaninfo --summary
261299 # Skip python related tests with GG_BUILD_LOW_PERF=1 since Windows MSYS2 UCRT64 currently fails to create
262300 # a valid python environment for testing
263301 LLAMA_FATAL_WARNINGS=OFF GG_BUILD_NINJA=1 GG_BUILD_VULKAN=1 GG_BUILD_LOW_PERF=1 ./ci/run.sh ./results/llama.cpp ./mnt/llama.cpp
264302
265303 ggml-ci-intel-openvino-gpu-low-perf :
304+ needs : determine-tag
266305 runs-on : [self-hosted, Linux, Intel, OpenVINO]
267306
268307 concurrency :
@@ -294,6 +333,8 @@ jobs:
294333
295334 - name : Test
296335 id : ggml-ci
336+ env :
337+ HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
297338 run : |
298339 source ./openvino_toolkit/setupvars.sh
299340 GG_BUILD_OPENVINO=1 GGML_OPENVINO_DEVICE=GPU GG_BUILD_LOW_PERF=1 bash ./ci/run.sh ./tmp/results ./tmp/mnt
0 commit comments