From 08256647093b1f67b9f4edaf73b75c7dda07ca80 Mon Sep 17 00:00:00 2001 From: Chenghao Zhang <211069071+nvchenghaoz@users.noreply.github.com> Date: Mon, 22 Jun 2026 16:39:50 -0700 Subject: [PATCH] disable the pipeline cache by default Signed-off-by: Chenghao Zhang <211069071+nvchenghaoz@users.noreply.github.com> --- tensorrt_llm/_torch/auto_deploy/config/default.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensorrt_llm/_torch/auto_deploy/config/default.yaml b/tensorrt_llm/_torch/auto_deploy/config/default.yaml index 6952ff96c64c..694f7eb10fdd 100644 --- a/tensorrt_llm/_torch/auto_deploy/config/default.yaml +++ b/tensorrt_llm/_torch/auto_deploy/config/default.yaml @@ -144,7 +144,7 @@ transforms: allreduce_strategy: NCCL pipeline_cache: stage: sharding - enabled: true + enabled: false root: null ############################################################################################ # MOVE MODEL AND LOAD WEIGHTS