@@ -381,10 +381,10 @@ void gemv_4bit_inference_fp16(
381381
382382#if 1
383383void gemm_4bit_inference_bf16 (
384- int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype, float * out,
384+ int m, int n, int k, int l, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype, float * out,
385385 int lda, int ldb, int ldc, int blocksize, sycl::queue* stream
386386) {
387- gemm_4bit_inference_cutlass_dequant<sycl::ext::oneapi::bfloat16, 16 >(m, n, k, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
387+ gemm_4bit_inference_cutlass_dequant<sycl::ext::oneapi::bfloat16, 16 >(m, n, k, l, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
388388}
389389#endif
390390
@@ -826,10 +826,10 @@ void cgemv_4bit_inference_fp16(
826826
827827#if 1
828828void cgemv_4bit_inference_bf16 (
829- int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype,
829+ int m, int n, int k, int l, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype,
830830 float * out, int lda, int ldb, int ldc, int blocksize, sycl::queue* stream
831831) {
832- gemm_4bit_inference_bf16 (m, n, k, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
832+ gemm_4bit_inference_bf16 (m, n, k, l, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
833833}
834834#else
835835void cgemv_4bit_inference_bf16(
0 commit comments