Fixed #27. Temporarily work around axpy's low performance with small input sizes and multiple threads.
This commit is contained in:
parent
b3d1887745
commit
aeed8d6225
|
@ -25,6 +25,7 @@ x86/x86_64:
|
|||
* Fixed #28 a wrong result of dsdot on x86_64.
|
||||
* Fixed #32 a SEGFAULT bug of zdotc with gcc-4.6.
|
||||
* Fixed #33 ztrmm bug on Nehalem.
|
||||
* Worked around #27, the low performance of axpy with small input sizes and multiple threads.
|
||||
|
||||
MIPS64:
|
||||
* Fixed #28 a wrong result of dsdot on Loongson3A/MIPS64.
|
||||
|
|
|
@ -86,6 +86,10 @@ void CNAME(blasint n, FLOAT alpha, FLOAT *x, blasint incx, FLOAT *y, blasint inc
|
|||
if (incx == 0 || incy == 0)
|
||||
nthreads = 1;
|
||||
|
||||
// Temporarily work around the low performance with small input sizes and multiple threads.
|
||||
if (n <= 10000)
|
||||
nthreads = 1;
|
||||
|
||||
if (nthreads == 1) {
|
||||
#endif
|
||||
|
||||
|
|
Loading…
Reference in New Issue