#endif
#ifdef __64BIT__
-#define STACKSIZE 400
+#define STACKSIZE 512
#define ALPHA_R_SP 296(SP)
#define ALPHA_I_SP 304(SP)
#define FZERO 312(SP)
li o32 , 32
li o48 , 48
- li T1, 256
- slwi T1, T1, 9 // 131072
- sub BBUFFER, A, T1 // temp buffer for B unrolled
+ li T1, 512 // NOTE(review): replaced code used A - 131072; offset is now A + 33554432 - confirm that region is reserved for this buffer
+ slwi T1, T1, 16 // T1 = 512 << 16 = 33554432 (0x2000000)
+ add BBUFFER, A, T1 // temp buffer for B unrolled, at A + T1
#ifdef __64BIT__
#endif
#ifdef __64BIT__
-#define STACKSIZE 340
+#define STACKSIZE 512
#define ALPHA_SP 296(SP)
#define FZERO 304(SP)
#else
li o32, 32
li o48, 48
- li T1, 256
- slwi T1, T1, 9 // 131072
- sub BBUFFER, A, T1 // temp buffer for B unrolled
+ li T1, 512 // NOTE(review): replaced code used A - 131072; offset is now A + 33554432 - confirm that region is reserved for this buffer
+ slwi T1, T1, 16 // T1 = 512 << 16 = 33554432 (0x2000000)
+ add BBUFFER, A, T1 // temp buffer for B unrolled, at A + T1
addi T1, SP, 300
stxsspx f1, o0 , T1
#define DNUMOPT 8
#define GEMM_DEFAULT_OFFSET_A 131072
-#define GEMM_DEFAULT_OFFSET_B 1024
+#define GEMM_DEFAULT_OFFSET_B 131072 /* same value as GEMM_DEFAULT_OFFSET_A */
#define GEMM_DEFAULT_ALIGN 0x03fffUL
#define SGEMM_DEFAULT_UNROLL_M 16
#define SGEMM_DEFAULT_Q 720
#define DGEMM_DEFAULT_Q 720
#define CGEMM_DEFAULT_Q 720
-#define ZGEMM_DEFAULT_Q 360
+#define ZGEMM_DEFAULT_Q 720 /* same value as SGEMM/DGEMM/CGEMM_DEFAULT_Q */
#define SGEMM_DEFAULT_R 14400
#define DGEMM_DEFAULT_R 14400
#define CGEMM_DEFAULT_R 14400
-#define ZGEMM_DEFAULT_R 7200
+#define ZGEMM_DEFAULT_R 14400 /* same value as SGEMM/DGEMM/CGEMM_DEFAULT_R */
#define SYMV_P 8