7373 needs : pre-check
7474 uses : ./.github/workflows/lint-and-test.yml
7575
76- test-build-npu :
77- timeout-minutes : 15
76+ test-build-vllm-ascend :
77+ timeout-minutes : 25
7878 runs-on : ubuntu-24.04-arm
7979 steps :
8080 - uses : actions/checkout@v4
@@ -88,16 +88,17 @@ jobs:
8888 uses : docker/build-push-action@v5
8989 with :
9090 context : .
91- file : ./docker/Dockerfile.vllm_npu
92- build-args : " ENABLE_SPARSE=false"
91+ file : ./docker/Dockerfile.ucm-vllm-ascend.a2-v0.17.0
92+ build-args : |
93+ PIP_INDEX_URL=https://pypi.org/simple
9394 tags : ucm-npu:latest
9495 push : false
9596 load : false
9697 cache-from : type=gha,scope=npu
9798 cache-to : type=gha,mode=max,scope=npu
9899
99- test-build-npu -sparse :
100- timeout-minutes : 15
100+ test-build-vllm-ascend -sparse :
101+ timeout-minutes : 25
101102 runs-on : ubuntu-24.04-arm
102103 steps :
103104 - uses : actions/checkout@v4
@@ -111,14 +112,63 @@ jobs:
111112 uses : docker/build-push-action@v5
112113 with :
113114 context : .
114- file : ./docker/Dockerfile.vllm_npu_v0110
115- build-args : " ENABLE_SPARSE=true"
115+ file : ./docker/Dockerfile.ucm-vllm-ascend.a2-v0.11.0
116+ build-args : |
117+ PIP_INDEX_URL=https://pypi.org/simple
116118 tags : ucm-npu-sparse:latest
117119 push : false
118120 load : false
119121 cache-from : type=gha,scope=npu
120122 cache-to : type=gha,mode=max,scope=npu
121123
124+ test-build-sglang :
125+ timeout-minutes : 25
126+ runs-on : ubuntu-24.04
127+ steps :
128+ - uses : actions/checkout@v4
129+ with :
130+ fetch-depth : 0
131+
132+ - name : Set up Docker Buildx
133+ uses : docker/setup-buildx-action@v3
134+
135+ - name : Build Image
136+ uses : docker/build-push-action@v5
137+ with :
138+ context : .
139+ file : ./docker/Dockerfile.ucm-sglang-cuda-v0.5.5
140+ build-args : |
141+ PIP_INDEX_URL=https://pypi.org/simple
142+ tags : ucm-sglang:latest
143+ push : false
144+ load : false
145+ cache-from : type=gha,scope=gpu
146+ cache-to : type=gha,mode=max,scope=gpu
147+
148+ test-build-mindie :
149+ timeout-minutes : 25
150+ runs-on : ubuntu-24.04-arm
151+ steps :
152+ - uses : actions/checkout@v4
153+ with :
154+ fetch-depth : 0
155+
156+ - name : Set up Docker Buildx
157+ uses : docker/setup-buildx-action@v3
158+
159+ - name : Build Image
160+ uses : docker/build-push-action@v5
161+ with :
162+ context : .
163+ file : ./docker/Dockerfile.ucm-mindie-ascend.a2-v2
164+ build-args : |
165+ PIP_INDEX_URL=https://pypi.org/simple
166+ tags : ucm-mindie:latest
167+ push : false
168+ load : false
169+ cache-from : type=gha,scope=npu
170+ cache-to : type=gha,mode=max,scope=npu
171+
122172 test-e2e-pc-gpu :
123173 timeout-minutes : 25
124174 runs-on : ["gpu-test-in-docker"]
@@ -159,9 +209,10 @@ jobs:
159209 sudo -E docker build --network=host \
160210 --build-arg http_proxy="${http_proxy:-}" \
161211 --build-arg https_proxy="${https_proxy:-}" \
162- --build-arg ENABLE_SPARSE=false \
212+ --build-arg no_proxy="repo.huaweicloud.com,${no_proxy:-}" \
213+ --build-arg PIP_INDEX_URL=https://repo.huaweicloud.com/repository/pypi/simple \
163214 -t ucm-e2etest-online-inference:${{ steps.version.outputs.version }} \
164- -f ./docker/Dockerfile.vllm_gpu ./
215+ -f ./docker/Dockerfile.ucm-vllm-cuda-v0.17.0 ./
165216 - name : Test E2E Online Inference in Docker
166217 run : |
167218 sudo chmod -R 777 /workspace/test_results/
@@ -228,9 +279,10 @@ jobs:
228279 sudo -E docker build --network=host \
229280 --build-arg http_proxy="${http_proxy:-}" \
230281 --build-arg https_proxy="${https_proxy:-}" \
231- --build-arg ENABLE_SPARSE=true \
282+ --build-arg no_proxy="repo.huaweicloud.com,${no_proxy:-}" \
283+ --build-arg PIP_INDEX_URL=https://repo.huaweicloud.com/repository/pypi/simple \
232284 -t ucm-e2etest-gpu-sparse:${{ steps.version.outputs.version }} \
233- -f ./docker/Dockerfile.vllm_gpu_v0110 ./
285+ -f ./docker/Dockerfile.ucm-vllm-cuda-v0.11.0 ./
234286 - name : Test E2E in Docker
235287 run : |
236288 sudo chmod -R 777 /workspace/test_results/
@@ -296,9 +348,10 @@ jobs:
296348 sudo -E docker build --network=host \
297349 --build-arg http_proxy="${http_proxy:-}" \
298350 --build-arg https_proxy="${https_proxy:-}" \
299- --build-arg ENABLE_SPARSE=true \
351+ --build-arg no_proxy="repo.huaweicloud.com,${no_proxy:-}" \
352+ --build-arg PIP_INDEX_URL=https://repo.huaweicloud.com/repository/pypi/simple \
300353 -t ucm-e2etest-gpu-sparse:${{ steps.version.outputs.version }} \
301- -f ./docker/Dockerfile.vllm_gpu_v0110 ./
354+ -f ./docker/Dockerfile.ucm-vllm-cuda-v0.11.0 ./
302355 - name : Test E2E in Docker
303356 run : |
304357 sudo chmod -R 777 /workspace/test_results/
0 commit comments