Skip to content

Commit 5521b2e

Browse files
committed
CUDA: fix bug in rms_norm fusion
1 parent 009b709 commit 5521b2e

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

ggml/src/ggml-cuda/norm.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -187,7 +187,7 @@ static __global__ void rms_norm_f32(const float * x, float * dst,
187 | 187 |   dst[col] = scale * x[col] * mul[mul_col];
188 | 188 |   } else if constexpr (do_add) {
189 | 189 |   const int add_col = col % add_ncols;
190 |     | - dst[col] += add[add_col];
    | 190 | + dst[col] = scale * x[col] + add[add_col];
191 | 191 |   } else {
192 | 192 |   dst[col] = scale * x[col];
193 | 193 |   }

0 commit comments

Comments
 (0)