@@ -56,18 +56,21 @@ jobs:
5656 match_pattern : " ^DCO$|^linux$" # Wait for DCO and Unit tests / linux to pass
5757 delay : 300s
5858
59- # #### PyTorch Example Tests #####
59+ # #### PyTorch Example Tests (speculative_decoding requires 26.01 image) #####
# torch-pr: runs the example tests through the reusable _example_tests_runner.yml
# workflow, once per matrix entry, after check-file-changes and wait-checks.
6060 torch-pr :
6161 needs : [check-file-changes, wait-checks]
# Runs only for refs under refs/heads/pull-request/ and only when
# check-file-changes reported any_changed == 'true'.
6262 if : startsWith(github.ref, 'refs/heads/pull-request/') && needs.check-file-changes.outputs.any_changed == 'true'
6363 strategy :
# fail-fast is disabled so one failing example does not cancel the other entries.
6464 fail-fast : false
6565 matrix :
6666 example : [llm_distill, llm_qat, llm_sparsity]
# The include entry adds speculative_decoding as an extra matrix entry that
# carries its own docker_image (26.01); the three examples listed above define
# no docker_image of their own.
67+ include :
68+ - example : speculative_decoding
69+ docker_image : " nvcr.io/nvidia/pytorch:26.01-py3"
6770 uses : ./.github/workflows/_example_tests_runner.yml
6871 secrets : inherit
6972 with :
# Removed line: the image used to be fixed at 25.06 for every entry.
70- docker_image : " nvcr.io/nvidia/pytorch:25.06-py3"
# Added line: use the matrix entry's docker_image when it is set, otherwise
# fall back to the 25.06 image through the || operator.
# NOTE(review): the leading space inside the quoted image / extras strings looks
# like an artifact of this diff rendering — confirm the real file has none.
73+ docker_image : ${{ matrix.docker_image || ' nvcr.io/nvidia/pytorch:25.06-py3' }}
7174 example : ${{ matrix.example }}
7275 pip_install_extras : " [hf,dev-test]"
7376 runner : linux-amd64-gpu-l4-latest-1
@@ -78,36 +81,17 @@ jobs:
7881 fail-fast : false
7982 matrix :
8083 example : [llm_distill, llm_qat, llm_sparsity]
84+ include :
85+ - example : speculative_decoding
86+ docker_image : " nvcr.io/nvidia/pytorch:26.01-py3"
8187 uses : ./.github/workflows/_example_tests_runner.yml
8288 secrets : inherit
8389 with :
84- docker_image : " nvcr.io/nvidia/pytorch:25.06-py3"
90+ docker_image : ${{ matrix.docker_image || ' nvcr.io/nvidia/pytorch:25.06-py3' }}
8591 example : ${{ matrix.example }}
8692 pip_install_extras : " [hf,dev-test]"
8793 runner : linux-amd64-gpu-h100-latest-2
8894
89- # #### Speculative Decoding Example Tests (requires 26.01 image) #####
90- speculative-decoding-pr :
91- needs : [check-file-changes, wait-checks]
92- if : startsWith(github.ref, 'refs/heads/pull-request/') && needs.check-file-changes.outputs.any_changed == 'true'
93- uses : ./.github/workflows/_example_tests_runner.yml
94- secrets : inherit
95- with :
96- docker_image : " nvcr.io/nvidia/pytorch:26.01-py3"
97- example : speculative_decoding
98- pip_install_extras : " [hf,dev-test]"
99- runner : linux-amd64-gpu-l4-latest-1
100-
101- speculative-decoding-non-pr :
102- if : ${{ !startsWith(github.ref, 'refs/heads/pull-request/') }}
103- uses : ./.github/workflows/_example_tests_runner.yml
104- secrets : inherit
105- with :
106- docker_image : " nvcr.io/nvidia/pytorch:26.01-py3"
107- example : speculative_decoding
108- pip_install_extras : " [hf,dev-test]"
109- runner : linux-amd64-gpu-h100-latest-2
110-
11195 # #### TensorRT-LLM Example Tests #####
11296 trtllm-pr :
11397 needs : [check-file-changes, wait-checks]
@@ -172,15 +156,14 @@ jobs:
172156 example-pr-required-check :
173157 # Run even if example tests are skipped
174158 if : ${{ startsWith(github.ref, 'refs/heads/pull-request/') && always() }}
175- needs : [check-file-changes, torch-pr, speculative-decoding-pr, trtllm-pr, onnx-pr]
159+ needs : [check-file-changes, torch-pr, trtllm-pr, onnx-pr]
176160 runs-on : ubuntu-latest
177161 steps :
178162 - name : Required GPU tests did not succeed
179163 if : |
180164 needs.check-file-changes.result != 'success' ||
181165 (needs.check-file-changes.outputs.any_changed == 'true' && (
182166 needs.torch-pr.result != 'success' ||
183- needs.speculative-decoding-pr.result != 'success' ||
184167 needs.trtllm-pr.result != 'success' ||
185168 needs.onnx-pr.result != 'success'
186169 ))
0 commit comments