3131 description : " SGLang version"
3232 required : false
3333 type : string
34- # This can be removed once we have llama.cpp built for MUSA and CANN.
35- buildMusaCann :
36- description : " Build MUSA and CANN images"
37- required : false
38- type : boolean
39- default : false
4034 imagesOnly :
4135 description : " Only build and push Docker images (skip CLI releases, pinata bump, docs update, and CE packaging)"
4236 required : false
@@ -243,7 +237,6 @@ jobs:
243237 LLAMA_SERVER_VERSION : ${{ inputs.llamaServerVersion }}
244238 VLLM_VERSION : ${{ inputs.vllmVersion }}
245239 SGLANG_VERSION : ${{ inputs.sglangVersion }}
246- BUILD_MUSA_CANN : ${{ inputs.buildMusaCann || 'false' }}
247240 steps :
248241 - name : Checkout repo
249242 uses : actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd
@@ -272,15 +265,7 @@ jobs:
272265 echo "docker/model-runner:$RELEASE_TAG-rocm" >> "$GITHUB_OUTPUT"
273266 echo "docker/model-runner:latest-rocm" >> "$GITHUB_OUTPUT"
274267 echo 'EOF' >> "$GITHUB_OUTPUT"
275- echo "musa<<EOF" >> "$GITHUB_OUTPUT"
276- echo "docker/model-runner:$RELEASE_TAG-musa" >> "$GITHUB_OUTPUT"
277- echo "docker/model-runner:latest-musa" >> "$GITHUB_OUTPUT"
278- echo 'EOF' >> "$GITHUB_OUTPUT"
279- echo "cann<<EOF" >> "$GITHUB_OUTPUT"
280- echo "docker/model-runner:$RELEASE_TAG-cann" >> "$GITHUB_OUTPUT"
281- echo "docker/model-runner:latest-cann" >> "$GITHUB_OUTPUT"
282- echo 'EOF' >> "$GITHUB_OUTPUT"
283-
268+
284269 - name : Load versions
285270 shell : bash
286271 run : |
@@ -293,6 +278,21 @@ jobs:
293278 echo "VLLM_VERSION=${VLLM_VERSION:-$VERSIONS_VLLM}" >> "$GITHUB_ENV"
294279 echo "SGLANG_VERSION=${SGLANG_VERSION:-$VERSIONS_SGLANG}" >> "$GITHUB_ENV"
295280
281+ - name : Resolve llama.cpp upstream images
282+ id : llama-images
283+ shell : bash
284+ run : |
285+ CPU_IMAGE=$(bash scripts/resolve-llama-upstream-image.sh \
286+ "$LLAMA_SERVER_VERSION" cpu)
287+ CUDA_IMAGE=$(bash scripts/resolve-llama-upstream-image.sh \
288+ "$LLAMA_SERVER_VERSION" cuda)
289+ ROCM_IMAGE=$(bash scripts/resolve-llama-upstream-image.sh \
290+ "$LLAMA_SERVER_VERSION" rocm)
291+
292+ echo "cpu=$CPU_IMAGE" >> "$GITHUB_OUTPUT"
293+ echo "cuda=$CUDA_IMAGE" >> "$GITHUB_OUTPUT"
294+ echo "rocm=$ROCM_IMAGE" >> "$GITHUB_OUTPUT"
295+
296296 - name : Log in to DockerHub
297297 uses : docker/login-action@4907a6ddec9925e35a0a9e82d7399ccc52663121
298298 with :
@@ -315,6 +315,8 @@ jobs:
315315 platforms : linux/amd64, linux/arm64
316316 build-args : |
317317 "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
318+ "LLAMA_SERVER_VARIANT=cpu"
319+ "LLAMA_UPSTREAM_IMAGE=${{ steps.llama-images.outputs.cpu }}"
318320 "VERSION=${{ env.RELEASE_TAG }}"
319321 push : true
320322 sbom : true
@@ -330,7 +332,7 @@ jobs:
330332 build-args : |
331333 "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
332334 "LLAMA_SERVER_VARIANT=cuda"
333- "BASE_IMAGE=nvidia/cuda:12.9.0-runtime-ubuntu24.04 "
335+ "LLAMA_UPSTREAM_IMAGE=${{ steps.llama-images.outputs.cuda }} "
334336 "VERSION=${{ env.RELEASE_TAG }}"
335337 push : true
336338 sbom : true
@@ -346,7 +348,7 @@ jobs:
346348 build-args : |
347349 "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
348350 "LLAMA_SERVER_VARIANT=cuda"
349- "BASE_IMAGE=nvidia/cuda:13.0.2-runtime-ubuntu24.04 "
351+ "LLAMA_UPSTREAM_IMAGE=${{ steps.llama-images.outputs.cuda }} "
350352 "VLLM_VERSION=${{ env.VLLM_VERSION }}"
351353 "VERSION=${{ env.RELEASE_TAG }}"
352354 push : true
@@ -363,7 +365,7 @@ jobs:
363365 build-args : |
364366 "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
365367 "LLAMA_SERVER_VARIANT=cuda"
366- "BASE_IMAGE=nvidia/cuda:12.9.0-runtime-ubuntu24.04 "
368+ "LLAMA_UPSTREAM_IMAGE=${{ steps.llama-images.outputs.cuda }} "
367369 "SGLANG_VERSION=${{ env.SGLANG_VERSION }}"
368370 "VERSION=${{ env.RELEASE_TAG }}"
369371 push : true
@@ -380,47 +382,13 @@ jobs:
380382 build-args : |
381383 "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
382384 "LLAMA_SERVER_VARIANT=rocm"
383- "BASE_IMAGE=rocm/dev-ubuntu-22.04 "
385+ "LLAMA_UPSTREAM_IMAGE=${{ steps.llama-images.outputs.rocm }} "
384386 "VERSION=${{ env.RELEASE_TAG }}"
385387 push : true
386388 sbom : true
387389 provenance : mode=max
388390 tags : ${{ steps.tags.outputs.rocm }}
389391
390- - name : Build MUSA image
391- if : ${{ env.BUILD_MUSA_CANN == 'true' }}
392- uses : docker/build-push-action@bcafcacb16a39f128d818304e6c9c0c18556b85f
393- with :
394- file : Dockerfile
395- target : final-llamacpp
396- platforms : linux/amd64
397- build-args : |
398- "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
399- "LLAMA_SERVER_VARIANT=musa"
400- "BASE_IMAGE=mthreads/musa:rc4.3.0-runtime-ubuntu22.04-amd64"
401- "VERSION=${{ env.RELEASE_TAG }}"
402- push : true
403- sbom : true
404- provenance : mode=max
405- tags : ${{ steps.tags.outputs.musa }}
406-
407- - name : Build CANN image
408- if : ${{ env.BUILD_MUSA_CANN == 'true' }}
409- uses : docker/build-push-action@bcafcacb16a39f128d818304e6c9c0c18556b85f
410- with :
411- file : Dockerfile
412- target : final-llamacpp
413- platforms : linux/arm64, linux/amd64
414- build-args : |
415- "LLAMA_SERVER_VERSION=${{ env.LLAMA_SERVER_VERSION }}"
416- "LLAMA_SERVER_VARIANT=cann"
417- "BASE_IMAGE=ascendai/cann:8.2.rc2-910b-ubuntu22.04-py3.11"
418- "VERSION=${{ env.RELEASE_TAG }}"
419- push : true
420- sbom : true
421- provenance : mode=max
422- tags : ${{ steps.tags.outputs.cann }}
423-
424392 # ---------------------------------------------------------------------------
425393 # Release CLI for Docker Desktop — build, sign & push CLI + Desktop module image
426394 # ---------------------------------------------------------------------------
0 commit comments