6060 torch-pr :
6161 needs : [check-file-changes, wait-checks]
6262 if : startsWith(github.ref, 'refs/heads/pull-request/') && needs.check-file-changes.outputs.any_changed == 'true'
63- strategy :
63+ strategy : &torch_strategy
6464 fail-fast : false
6565 matrix :
6666 example : [llm_distill, llm_qat, llm_sparsity]
@@ -72,25 +72,21 @@ jobs:
7272 with :
7373 docker_image : " nvcr.io/nvidia/pytorch:${{ matrix.docker_image || '26.01' }}-py3"
7474 example : ${{ matrix.example }}
75+ timeout_minutes : 30
7576 pip_install_extras : " [hf,dev-test]"
76- runner : linux-amd64-gpu-l4 -latest-1
77+ runner : linux-amd64-gpu-h100 -latest-1
7778
7879 torch-non-pr :
7980 if : ${{ !startsWith(github.ref, 'refs/heads/pull-request/') }}
80- strategy :
81- fail-fast : false
82- matrix :
83- example : [llm_distill, llm_qat, llm_sparsity]
84- include :
85- - example : speculative_decoding
86- docker_image : " 26.01"
81+ strategy : *torch_strategy
8782 uses : ./.github/workflows/_example_tests_runner.yml
8883 secrets : inherit
8984 with :
9085 docker_image : " nvcr.io/nvidia/pytorch:${{ matrix.docker_image || '26.01' }}-py3"
9186 example : ${{ matrix.example }}
87+ timeout_minutes : 30
9288 pip_install_extras : " [hf,dev-test]"
93- runner : linux-amd64-gpu-h100 -latest-2
89+ runner : linux-amd64-gpu-rtxpro6000 -latest-2
9490
9591 # #### TensorRT-LLM Example Tests #####
9692 trtllm-pr :
@@ -99,14 +95,14 @@ jobs:
9995 strategy :
10096 fail-fast : false
10197 matrix :
102- example : [llm_ptq] # vlm_ptq temporarily disabled due to pipeline error
98+ example : [llm_ptq, vlm_ptq]
10399 uses : ./.github/workflows/_example_tests_runner.yml
104100 secrets : inherit
105101 with :
106- docker_image : " nvcr.io/nvidia/tensorrt-llm/release:1.2.0rc6.post3 "
102+ docker_image : " nvcr.io/nvidia/tensorrt-llm/release:1.3.0rc5 "
107103 example : ${{ matrix.example }}
108104 pip_install_extras : " [hf,dev-test]"
109- runner : linux-amd64-gpu-h100 -latest-1
105+ runner : linux-amd64-gpu-rtxpro6000 -latest-1
110106
111107 trtllm-non-pr :
112108 if : ${{ !startsWith(github.ref, 'refs/heads/pull-request/') }}
@@ -117,16 +113,16 @@ jobs:
117113 uses : ./.github/workflows/_example_tests_runner.yml
118114 secrets : inherit
119115 with :
120- docker_image : " nvcr.io/nvidia/tensorrt-llm/release:1.2.0rc6.post3 "
116+ docker_image : " nvcr.io/nvidia/tensorrt-llm/release:1.3.0rc5 "
121117 example : ${{ matrix.example }}
122118 pip_install_extras : " [hf,dev-test]"
123- runner : linux-amd64-gpu-h100 -latest-2
119+ runner : linux-amd64-gpu-rtxpro6000 -latest-2
124120
125121 # #### ONNX/TensorRT Example Tests #####
126122 onnx-pr :
127123 needs : [check-file-changes, wait-checks]
128124 if : startsWith(github.ref, 'refs/heads/pull-request/') && needs.check-file-changes.outputs.any_changed == 'true'
129- strategy :
125+ strategy : &onnx_strategy
130126 fail-fast : false
131127 matrix :
132128 example : [diffusers, torch_onnx]
@@ -140,17 +136,14 @@ jobs:
140136
141137 onnx-non-pr :
142138 if : ${{ !startsWith(github.ref, 'refs/heads/pull-request/') }}
143- strategy :
144- fail-fast : false
145- matrix :
146- example : [diffusers, torch_onnx]
139+ strategy : *onnx_strategy
147140 uses : ./.github/workflows/_example_tests_runner.yml
148141 secrets : inherit
149142 with :
150143 docker_image : " nvcr.io/nvidia/tensorrt:26.01-py3"
151144 example : ${{ matrix.example }}
152145 pip_install_extras : " [all,dev-test]"
153- runner : linux-amd64-gpu-l4 -latest-1
146+ runner : linux-amd64-gpu-rtxpro6000 -latest-2
154147
155148 # #### Required Check for PR #####
156149 example-pr-required-check :
0 commit comments