Merge pull request #907 from jeromerobert/bug786

Fix z/ctrmv stack allocation on AMD Bulldozer and Barcelona targets
This commit is contained in:
Zhang Xianyi 2016-06-27 10:04:54 -04:00 committed by GitHub
commit ca5c25c870
1 changed file with 2 additions and 0 deletions

View File

@ -243,6 +243,8 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
#endif #endif
{ {
buffer_size = ((n - 1) / DTB_ENTRIES) * 2 * DTB_ENTRIES + 32 / sizeof(FLOAT); buffer_size = ((n - 1) / DTB_ENTRIES) * 2 * DTB_ENTRIES + 32 / sizeof(FLOAT);
// It seems to be required for some K8 or Barcelona CPU
buffer_size += 8;
if(incx != 1) if(incx != 1)
buffer_size += n * 2; buffer_size += n * 2;
} }