Merge pull request #1971 from martin-frbg/trsm-threshold
Shift transition to multithreading towards larger matrix sizes
This commit is contained in:
commit
3f7bb87a2a
|
@ -81,6 +81,12 @@
|
||||||
#endif
|
#endif
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifndef COMPLEX
|
||||||
|
#define SMP_FACTOR 256
|
||||||
|
#else
|
||||||
|
#define SMP_FACTOR 128
|
||||||
|
#endif
|
||||||
|
|
||||||
static int (*trsm[])(blas_arg_t *, BLASLONG *, BLASLONG *, FLOAT *, FLOAT *, BLASLONG) = {
|
static int (*trsm[])(blas_arg_t *, BLASLONG *, BLASLONG *, FLOAT *, FLOAT *, BLASLONG) = {
|
||||||
#ifndef TRMM
|
#ifndef TRMM
|
||||||
TRSM_LNUU, TRSM_LNUN, TRSM_LNLU, TRSM_LNLN,
|
TRSM_LNUU, TRSM_LNUN, TRSM_LNLU, TRSM_LNLN,
|
||||||
|
@ -366,10 +372,14 @@ void CNAME(enum CBLAS_ORDER order,
|
||||||
mode |= (trans << BLAS_TRANSA_SHIFT);
|
mode |= (trans << BLAS_TRANSA_SHIFT);
|
||||||
mode |= (side << BLAS_RSIDE_SHIFT);
|
mode |= (side << BLAS_RSIDE_SHIFT);
|
||||||
|
|
||||||
if ( args.m < 2*GEMM_MULTITHREAD_THRESHOLD )
|
/*
|
||||||
|
if ( args.m < 2 * GEMM_MULTITHREAD_THRESHOLD )
|
||||||
args.nthreads = 1;
|
args.nthreads = 1;
|
||||||
else
|
else
|
||||||
if ( args.n < 2*GEMM_MULTITHREAD_THRESHOLD )
|
if ( args.n < 2 * GEMM_MULTITHREAD_THRESHOLD )
|
||||||
|
args.nthreads = 1;
|
||||||
|
*/
|
||||||
|
if ( args.m * args.n < SMP_FACTOR * GEMM_MULTITHREAD_THRESHOLD)
|
||||||
args.nthreads = 1;
|
args.nthreads = 1;
|
||||||
else
|
else
|
||||||
args.nthreads = num_cpu_avail(3);
|
args.nthreads = num_cpu_avail(3);
|
||||||
|
|
Loading…
Reference in New Issue