From bba75d5e45887a2e553fa134d41f5cb89efd8c49 Mon Sep 17 00:00:00 2001 From: h-motoki Date: Fri, 27 Jun 2025 19:37:36 +0900 Subject: [PATCH] Set GEMM_PREFERED_SIZE for A64FX (8 for DOUBLE/XDOUBLE, 16 otherwise) --- param.h | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/param.h b/param.h index a75ba6fafa..97a666b10a 100644 --- a/param.h +++ b/param.h @@ -3701,6 +3701,12 @@ is a big desktop or server with abundant cache rather than a phone or embedded d #elif defined(A64FX) // 512-bit SVE +#if defined(XDOUBLE) || defined(DOUBLE) +#define GEMM_PREFERED_SIZE 8 +#else +#define GEMM_PREFERED_SIZE 16 +#endif + /* When all BLAS3 routines are implemeted with SVE, SGEMM_DEFAULT_UNROLL_M should be "sve_vl". Until then, just keep it different than DGEMM_DEFAULT_UNROLL_N to keep copy routines in both directions seperated. */ #define SGEMM_DEFAULT_UNROLL_M 4