Optimized standard BLAS Level 1 and Level 2 routines (excluding nrm2 functions) for z13 (double precision)

This commit is contained in:
Abdurrauf
2017-04-08 21:51:15 +04:00
parent 08786c4b95
commit 1cfdb2295d
26 changed files with 7230 additions and 26 deletions

View File

@@ -40,8 +40,12 @@
#include "common.h"
#ifdef FUNCTION_PROFILE
#include "functable.h"
#endif
// MULTI_THREAD_MINIMAL is the cutoff for n used by this routine's
// small-input work-around: when n <= MULTI_THREAD_MINIMAL, nthreads is
// forced to 1. Builds that define Z13 use 200000; all other builds use 10000.
#if defined(Z13)
#define MULTI_THREAD_MINIMAL 200000
#else
#define MULTI_THREAD_MINIMAL 10000
#endif
#ifndef CBLAS
void NAME(blasint *N, FLOAT *ALPHA, FLOAT *x, blasint *INCX, FLOAT *y, blasint *INCY){
@@ -88,7 +92,7 @@ void CNAME(blasint n, FLOAT alpha, FLOAT *x, blasint incx, FLOAT *y, blasint inc
//Temporarily work-around the low performance issue with small input size &
//multithreads.
if (n <= 10000)
if (n <= MULTI_THREAD_MINIMAL)
nthreads = 1;
if (nthreads == 1) {