fix(gguf): correct mismatched-shape error message in check_quantized_param_shape (#13504)

Ricardo-M-L · web-flow · commit 6a65a3735b53 · 2026-05-20T12:03:10.000-10:00
fix(gguf): correct mismatched-shape error message

`check_quantized_param_shape` compares `inferred_shape` against `current_param_shape`, but the error message printed `inferred_shape` vs. `loaded_param_shape`. Because `inferred_shape` is itself derived from `loaded_param_shape`, the reported mismatch was effectively self-referential and gave no signal about the model's expected shape.

Print `current_param_shape` (what the model expected) vs. `inferred_shape` (what the quantized weight decodes to) so that both sides of the comparison are actually visible. Noted by @Vargol in #13001.
diff --git a/src/diffusers/quantizers/gguf/gguf_quantizer.py b/src/diffusers/quantizers/gguf/gguf_quantizer.py
@@ -85,7 +85,8 @@ def check_quantized_param_shape(self, param_name, current_param, loaded_param):
         inferred_shape = _quant_shape_from_byte_shape(loaded_param_shape, type_size, block_size)
         if inferred_shape != current_param_shape:
             raise ValueError(
-                f"{param_name} has an expected quantized shape of: {inferred_shape}, but received shape: {loaded_param_shape}"
+                f"{param_name} has an expected shape of: {current_param_shape}, but the loaded GGUF weight decodes "
+                f"to shape: {inferred_shape}"
             )
 
         return True

Original file line number	Diff line number	Diff line change
`@@ -85,7 +85,8 @@ def check_quantized_param_shape(self, param_name, current_param, loaded_param):`
`85`	`85`	`inferred_shape = _quant_shape_from_byte_shape(loaded_param_shape, type_size, block_size)`
`86`	`86`	`if inferred_shape != current_param_shape:`
`87`	`87`	`raise ValueError(`
`88`		`- f"{param_name} has an expected quantized shape of: {inferred_shape}, but received shape: {loaded_param_shape}"`
	`88`	`+ f"{param_name} has an expected shape of: {current_param_shape}, but the loaded GGUF weight decodes "`
	`89`	`+ f"to shape: {inferred_shape}"`
`89`	`90`	`)`
`90`	`91`
`91`	`92`	`return True`