@@ -381,7 +381,7 @@ void gemv_4bit_inference_fp16(
381381
382382#if 1
383383void gemm_4bit_inference_bf16 (
384- int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, sycl::ext::oneapi::bfloat16 *absmax, float *datatype, float * out,
384+ int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype, float * out,
385385 int lda, int ldb, int ldc, int blocksize, sycl::queue* stream
386386) {
387387 gemm_4bit_inference_cutlass_dequant<sycl::ext::oneapi::bfloat16, 16 >(m, n, k, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
@@ -826,7 +826,7 @@ void cgemv_4bit_inference_fp16(
826826
827827#if 1
828828void cgemv_4bit_inference_bf16 (
829- int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, sycl::ext::oneapi::bfloat16 *absmax, float *datatype,
829+ int m, int n, int k, sycl::ext::oneapi::bfloat16 * A, unsigned char * B, float *absmax, float *datatype,
830830 float * out, int lda, int ldb, int ldc, int blocksize, sycl::queue* stream
831831) {
832832 gemm_4bit_inference_bf16 (m, n, k, A, B, absmax, datatype, out, lda, ldb, ldc, blocksize, stream);
0 commit comments