Merge pull request #907 from jeromerobert/bug786

Fix z/ctrmv stack allocation on AMD Bulldozer and Barcelona targets
This commit is contained in:
Zhang Xianyi
2016-06-27 10:04:54 -04:00
committed by GitHub

View File

@@ -243,6 +243,8 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
#endif
{
// Size the scratch buffer: the number of whole DTB_ENTRIES-sized blocks in
// (n - 1), times 2 * DTB_ENTRIES, plus the number of FLOATs that fit in
// 32 bytes.
// NOTE(review): the factor 2 presumably covers complex (re, im) pairs and the
// 32-byte term looks like alignment slack -- confirm against the kernels.
buffer_size = ((n - 1) / DTB_ENTRIES) * 2 * DTB_ENTRIES + 32 / sizeof(FLOAT);
// Extra padding of 8 elements; it seems to be required on some K8 or
// Barcelona CPUs.
buffer_size += 8;
// Non-unit stride on x: reserve a further 2 * n elements.
// NOTE(review): presumably room for a contiguous copy of x -- confirm.
if(incx != 1)
buffer_size += n * 2;
}