Fix z/ctrmv stack allocation on AMD Bulldozer and Barcelona targets
author Jerome Robert <jeromerobert@gmx.com>
Tue, 7 Jun 2016 14:11:09 +0000 (16:11 +0200)
committer Jerome Robert <jeromerobert@gmx.com>
Tue, 7 Jun 2016 14:11:09 +0000 (16:11 +0200)
* Hopefully, at least: this fix was found by trial and error (dark magic)
* Ref #786

interface/ztrmv.c

index 2be915c..1721afc 100644 (file)
@@ -243,6 +243,8 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
 #endif
   {
     buffer_size = ((n - 1) / DTB_ENTRIES) * 2 * DTB_ENTRIES + 32 / sizeof(FLOAT);
+    // It seems to be required for some K8 or Barcelona CPU
+    buffer_size += 8;
     if(incx != 1)
       buffer_size += n * 2;
   }