Skip to content

Commit f3feefa

Browse files
committed
Move check inside scales branch
1 parent ce5c29a commit f3feefa

1 file changed

Lines changed: 1 addition & 2 deletions

File tree

ggml/src/ggml-cuda/quantize.cu

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -139,9 +139,8 @@ static __global__ void quantize_mmq_nvfp4(
139 139
uint8_t fp8_code = first_fp8_code;
140 140
float subblock_scale = test_scale;
141 141

142-
const int n_test_offsets = scales ? 1 : 5;
143-
144 142
if (scales == nullptr) {
143+
const int n_test_offsets = 5;
145 144
# pragma unroll // Check +/- 2 to find best code to reduce NVFP4 activation loss unless input scales define the scale.
146 145
for (int i = 1; i < n_test_offsets; i++) {
147 146
const int test_code = first_fp8_code + test_offsets[i];

0 commit comments

Comments
 (0)