reduced dgemm_unroll_m to work with 128-bit sve
author Bine Brank <binebrank@gmail.com>
Tue, 23 Nov 2021 20:18:08 +0000 (21:18 +0100)
committer Bine Brank <binebrank@gmail.com>
Tue, 23 Nov 2021 20:18:08 +0000 (21:18 +0100)
param.h

diff --git a/param.h b/param.h
index bbc52fa..0ccc4a4 100644 (file)
--- a/param.h
+++ b/param.h
@@ -3301,7 +3301,7 @@ is a big desktop or server with abundant cache rather than a phone or embedded d
 
 /* When all BLAS3 routines are implemeted with SVE, DGEMM_DEFAULT_UNROLL_M should be "sve_vl".
 Until then, just keep it different than DGEMM_DEFAULT_UNROLL_N to keep copy routines in both directions seperated. */
-#define DGEMM_DEFAULT_UNROLL_M  4 
+#define DGEMM_DEFAULT_UNROLL_M  2 
 #define DGEMM_DEFAULT_UNROLL_N  8
 
 #define CGEMM_DEFAULT_UNROLL_M  8