diff --git a/angelslim/models/llm/deepseek.py b/angelslim/models/llm/deepseek.py index 587961bb..e01ce125 100644 --- a/angelslim/models/llm/deepseek.py +++ b/angelslim/models/llm/deepseek.py @@ -163,7 +163,7 @@ def get_qdq_module(self, layer, name): quant_algo=self.quant_config.quant_algo, weight=weight, weight_scale=weight_scale, - group_size=self.quant_config.quant_algo_info["w_group_size"], + group_size=self.quant_config.quant_algo_info.get("w_group_size", 128), bias=layer.bias, input_scale=act_scale, )