Skip to content

Commit ce5c29a

Browse files
committed
Temporarily assert that in_scale is there for debugging purposes
1 parent e529ad8 commit ce5c29a

1 file changed

Lines changed: 4 additions & 0 deletions

File tree

ggml/src/ggml-cuda/mmq.cu

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -126,6 +126,10 @@ void ggml_cuda_mul_mat_q(
126126
const ggml_tensor * scale_activations = src0->type == GGML_TYPE_NVFP4 ? (ids ? dst->src[4] : dst->src[3]) : nullptr;
127127
const float * scale_activations_d = scale_activations ? (const float *) scale_activations->data : nullptr;
128128
const int64_t n_scale_activations = scale_activations ? ggml_nelements(scale_activations) : 0;
129+
if (use_native_fp4)
130+
{
131+
GGML_ASSERT(scale_activations != nullptr);
132+
}
129133

130134
if (!ids) {
131135
const size_t nbytes_src1_q8_1 = ne13*ne12 * ne11*ne10_padded * sizeof(block_q8_1)/QK8_1 +

0 commit comments

Comments (0)