Merge pull request #3669 from VFerrari/fix_small_matrix_kernel
POWER: fix issues with the small matrix kernel
This commit is contained in:
commit
be5500e704
|
@@ -261,7 +261,7 @@ endif
 #For small matrix optimization
 ifeq ($(ARCH), x86_64)
 SMALL_MATRIX_OPT = 1
-else ifeq ($(CORE), POWER10)
+else ifeq ($(ARCH), power)
 SMALL_MATRIX_OPT = 1
 endif
 ifeq ($(SMALL_MATRIX_OPT), 1)
||||||
|
|
|
@@ -69,6 +69,7 @@ int CNAME(int transa, int transb, BLASLONG M, BLASLONG N, BLASLONG K, FLOAT alph
 
 #endif
 
+#ifdef SMP
 // Multi-threading execution outperforms (or approaches) the execution of the
 // small kernel.
 if (num_cpu_avail(3) > 1) {
@@ -77,6 +78,9 @@ int CNAME(int transa, int transb, BLASLONG M, BLASLONG N, BLASLONG K, FLOAT alph
 } else {
 return 1;
 }
+#else
+return 1;
+#endif
 
 #endif
 
||||||
|
|
Loading…
Reference in New Issue