diff --git a/.github/configs/nvidia-master.yaml b/.github/configs/nvidia-master.yaml index 8dcf9f45c..419a98c09 100644 --- a/.github/configs/nvidia-master.yaml +++ b/.github/configs/nvidia-master.yaml @@ -4196,7 +4196,7 @@ dsr1-fp8-h100-dynamo-trt: dp-attn: true gptoss-fp4-b200-trt: - image: nvcr.io#nvidia/tensorrt-llm/release:1.2.0rc2.post2 + image: nvcr.io#nvidia/tensorrt-llm/release:1.3.0rc14 model: openai/gpt-oss-120b model-prefix: gptoss runner: b200 diff --git a/perf-changelog.yaml b/perf-changelog.yaml index 29e7490f3..8a2bc8fe8 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -2820,3 +2820,9 @@ description: - "Update TensorRT-LLM image from v1.3.0rc11 (34d old) to v1.3.0rc14 (latest pre-release)" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1491 + +- config-keys: + - gptoss-fp4-b200-trt + description: + - "Update TensorRT-LLM image from v1.2.0rc2.post2 (102d old) to v1.3.0rc14 (latest pre-release)" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1490