Enabled GEMV assembly on POWER8

This commit is contained in:
Werner Saar 2016-03-04 12:53:31 +01:00
parent 4824b88fcb
commit d5130ce7e3
5 changed files with 31 additions and 8 deletions

View File

@@ -137,15 +137,16 @@ ZGEMM3MKERNEL = zgemm3m_kernel_4x4_sse3.S
#CSWAPKERNEL = ../arm/zswap.c #CSWAPKERNEL = ../arm/zswap.c
#ZSWAPKERNEL = ../arm/zswap.c #ZSWAPKERNEL = ../arm/zswap.c
# #
SGEMVNKERNEL = ../arm/gemv_n.c
DGEMVNKERNEL = ../arm/gemv_n.c
CGEMVNKERNEL = ../arm/zgemv_n.c
ZGEMVNKERNEL = ../arm/zgemv_n.c
SGEMVTKERNEL = ../arm/gemv_t.c #SGEMVNKERNEL = ../arm/gemv_n.c
DGEMVTKERNEL = ../arm/gemv_t.c #DGEMVNKERNEL = ../arm/gemv_n.c
CGEMVTKERNEL = ../arm/zgemv_t.c #CGEMVNKERNEL = ../arm/zgemv_n.c
ZGEMVTKERNEL = ../arm/zgemv_t.c #ZGEMVNKERNEL = ../arm/zgemv_n.c
#
#SGEMVTKERNEL = ../arm/gemv_t.c
#DGEMVTKERNEL = ../arm/gemv_t.c
#CGEMVTKERNEL = ../arm/zgemv_t.c
#ZGEMVTKERNEL = ../arm/zgemv_t.c
SSYMV_U_KERNEL = ../generic/symv_k.c SSYMV_U_KERNEL = ../generic/symv_k.c
SSYMV_L_KERNEL = ../generic/symv_k.c SSYMV_L_KERNEL = ../generic/symv_k.c

View File

@@ -174,6 +174,12 @@
#define PREFETCHSIZE_C 40 #define PREFETCHSIZE_C 40
#endif #endif
#ifdef POWER8
#define PREFETCHSIZE_A 96
#define PREFETCHSIZE_C 40
#endif
#ifndef NEEDPARAM #ifndef NEEDPARAM
#ifndef __64BIT__ #ifndef __64BIT__

View File

@@ -139,6 +139,11 @@
#define PREFETCHSIZE_C 8 #define PREFETCHSIZE_C 8
#endif #endif
#ifdef POWER8
#define PREFETCHSIZE_A 96
#define PREFETCHSIZE_C 8
#endif
#define y01 f0 #define y01 f0
#define y02 f1 #define y02 f1
#define y03 f2 #define y03 f2

View File

@@ -170,6 +170,11 @@
#define PREFETCHSIZE_C 24 #define PREFETCHSIZE_C 24
#endif #endif
#ifdef POWER8
#define PREFETCHSIZE_A 24
#define PREFETCHSIZE_C 24
#endif
#ifndef XCONJ #ifndef XCONJ
#define FMADDR FMADD #define FMADDR FMADD
#define FMSUBR FNMSUB #define FMSUBR FNMSUB

View File

@@ -144,6 +144,12 @@
#define PREFETCHSIZE_C 8 #define PREFETCHSIZE_C 8
#endif #endif
#ifdef POWER8
#define PREFETCHSIZE_A 24
#define PREFETCHSIZE_C 8
#endif
#if !(defined(CONJ) && defined(XCONJ)) #if !(defined(CONJ) && defined(XCONJ))
#define FMADDR FMADD #define FMADDR FMADD
#define FMSUBR FNMSUB #define FMSUBR FNMSUB