diff --git a/tensorrt_llm/_torch/auto_deploy/config/default.yaml b/tensorrt_llm/_torch/auto_deploy/config/default.yaml
index 6952ff96c64c..694f7eb10fdd 100644
--- a/tensorrt_llm/_torch/auto_deploy/config/default.yaml
+++ b/tensorrt_llm/_torch/auto_deploy/config/default.yaml
@@ -144,7 +144,7 @@ transforms:
     allreduce_strategy: NCCL
   pipeline_cache:
     stage: sharding
-    enabled: true
+    enabled: false
     root: null
   ############################################################################################
   # MOVE MODEL AND LOAD WEIGHTS