Fix QNN AAR #4783
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
Matrix: test-models-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds
3s
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
| google-gemma-3-4b-it-cuda-non-quantized (Expired) | 7.22 GB | sha256:af36a3c48f7edc1c7b15021119e6ce885d93f47dffc940a73b31b2eb01026652 | |
| google-gemma-3-4b-it-cuda-quantized-int4-tile-packed (Expired) | 3.36 GB | sha256:bb3cbade7845cd9cb62aa00ddc492bec7dbbf7569f685ef8040023824b134809 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized (Expired) | 6.82 GB | sha256:2ac05fd35c81f89e43602b5211bcd8301dac4d7ce7a3d2eb340bd1bb4d9ce52f | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed (Expired) | 2.89 GB | sha256:6d963622dadf61a949c996db23a691e041806cda97475bd35bcfe8f33f07d313 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only (Expired) | 6.14 GB | sha256:31831ea901d47d41a8674b61489c455d7ce86db2984b703fb9c50fc55c82b6c4 | |
| openai-whisper-large-v3-turbo-cuda-non-quantized (Expired) | 1.18 GB | sha256:ef69d954ac07d1eba51d4d313cd0b77b797cc617735c889a3269732529b7379e | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed (Expired) | 491 MB | sha256:f466406338080fbeafc38cc43bcd4ce33fa49fd197513b882e683c05615b01e8 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only (Expired) | 485 MB | sha256:e29970fb472f2a8296b46b57414fda928cec02f400abfce698e8bfacba2ccfc5 | |
| openai-whisper-small-cuda-non-quantized (Expired) | 361 MB | sha256:4b6c224ce32f3c9f859eb0b7d746c747d1129dc3f0d6615746809e14461bb524 | |
| openai-whisper-small-cuda-quantized-int4-tile-packed (Expired) | 172 MB | sha256:7cb6be810fb9b020422a40aa16fd66e406da472f07eeec3785f0e3042d43549d | |
| openai-whisper-small-cuda-quantized-int4-weight-only (Expired) | 270 MB | sha256:5235b1629e0ec62ab16b8e4860851f1d5111e1dee567b209efd430256f707940 | |