@@ -173,7 +173,7 @@ dsr1-fp8-h200-trt:
173173 - { tp: 8, ep: 8, dp-attn: true, conc-start: 64, conc-end: 64 }
174174
175175gptoss-fp4-b200-trt :
176- image : nvcr.io#nvidia/tensorrt-llm/release:1.2.0rc0.post1
176+ image : nvcr.io#nvidia/tensorrt-llm/release:1.2.0rc2
177177 model : openai/gpt-oss-120b
178178 model-prefix : gptoss
179179 runner : b200-trt
@@ -185,23 +185,27 @@ gptoss-fp4-b200-trt:
185185 - isl : 1024
186186 osl : 1024
187187 search-space :
188+ - { tp: 2, dp-attn: true, conc-start: 32, conc-end: 128 }
189+ - { tp: 4, dp-attn: true, conc-start: 32, conc-end: 64 }
188190 - { tp: 1, conc-start: 64, conc-end: 128 }
189- - { tp: 2, conc-start: 4, conc-end: 128 }
190- - { tp: 4, conc-start: 4, conc-end: 128 }
191+ - { tp: 2, conc-start: 4, conc-end: 32 }
192+ - { tp: 4, conc-start: 4, conc-end: 64 }
191193 - { tp: 8, conc-start: 4, conc-end: 8 }
192194 - isl : 1024
193195 osl : 8192
194196 search-space :
195197 - { tp: 1, conc-start: 64, conc-end: 128 }
198+ - { tp: 2, dp-attn: true, conc-start: 64, conc-end: 128 }
196199 - { tp: 2, conc-start: 4, conc-end: 128 }
197200 - { tp: 4, conc-start: 4, conc-end: 128 }
198201 - { tp: 8, conc-start: 4, conc-end: 16 }
199202 - isl : 8192
200203 osl : 1024
201204 search-space :
202205 - { tp: 1, conc-start: 64, conc-end: 128 }
206+ - { tp: 2, dp-attn: true, conc-start: 64, conc-end: 128 }
203207 - { tp: 2, conc-start: 4, conc-end: 128 }
204- - { tp: 4, conc-start: 4, conc-end: 128 }
208+ - { tp: 4, conc-start: 4, conc-end: 32 }
205209 - { tp: 8, conc-start: 4, conc-end: 8 }
206210
207211gptoss-fp4-b200-vllm :
0 commit comments