Merge pull request #3266 from martin-frbg/powerparam
Remove spurious casts from PPC parameters and fix compilation for older targets
This commit is contained in:
commit
2e8ff4a781
|
@ -54,3 +54,8 @@ ZTRSMKERNEL_LN = ztrsm_kernel_LN.S
|
||||||
ZTRSMKERNEL_LT = ztrsm_kernel_LT.S
|
ZTRSMKERNEL_LT = ztrsm_kernel_LT.S
|
||||||
ZTRSMKERNEL_RN = ztrsm_kernel_LT.S
|
ZTRSMKERNEL_RN = ztrsm_kernel_LT.S
|
||||||
ZTRSMKERNEL_RT = ztrsm_kernel_RT.S
|
ZTRSMKERNEL_RT = ztrsm_kernel_RT.S
|
||||||
|
|
||||||
|
CROTKERNEL = ../arm/zrot.c
|
||||||
|
ZROTKERNEL = ../arm/zrot.c
|
||||||
|
SGEMVNKERNEL = ../arm/gemv_n.c
|
||||||
|
SGEMVTKERNEL = ../arm/gemv_t.c
|
||||||
|
|
|
@ -16,11 +16,11 @@ ZASUMKERNEL = zasum_ppc440.S
|
||||||
SAXPYKERNEL = axpy_ppc440.S
|
SAXPYKERNEL = axpy_ppc440.S
|
||||||
DAXPYKERNEL = axpy_ppc440.S
|
DAXPYKERNEL = axpy_ppc440.S
|
||||||
ifneq ($(__BYTE_ORDER__),__ORDER_BIG_ENDIAN__)
|
ifneq ($(__BYTE_ORDER__),__ORDER_BIG_ENDIAN__)
|
||||||
CAXPYKERNEL = ../arm/zaxpy.c
|
|
||||||
ZAXPYKERNEL = ../arm/zaxpy.c
|
|
||||||
else
|
|
||||||
CAXPYKERNEL = zaxpy_ppc440.S
|
CAXPYKERNEL = zaxpy_ppc440.S
|
||||||
ZAXPYKERNEL = zaxpy_ppc440.S
|
ZAXPYKERNEL = zaxpy_ppc440.S
|
||||||
|
else
|
||||||
|
CAXPYKERNEL = ../arm/zaxpy.c
|
||||||
|
ZAXPYKERNEL = ../arm/zaxpy.c
|
||||||
endif
|
endif
|
||||||
|
|
||||||
SDOTKERNEL = dot_ppc440.S
|
SDOTKERNEL = dot_ppc440.S
|
||||||
|
|
|
@ -15,8 +15,13 @@ ZASUMKERNEL = zasum_ppc440.S
|
||||||
|
|
||||||
SAXPYKERNEL = axpy_ppc440.S
|
SAXPYKERNEL = axpy_ppc440.S
|
||||||
DAXPYKERNEL = axpy_ppc440.S
|
DAXPYKERNEL = axpy_ppc440.S
|
||||||
|
ifneq ($(__BYTE_ORDER__),__ORDER_BIG_ENDIAN__)
|
||||||
CAXPYKERNEL = zaxpy_ppc440.S
|
CAXPYKERNEL = zaxpy_ppc440.S
|
||||||
ZAXPYKERNEL = zaxpy_ppc440.S
|
ZAXPYKERNEL = zaxpy_ppc440.S
|
||||||
|
else
|
||||||
|
CAXPYKERNEL = ../arm/zaxpy.c
|
||||||
|
ZAXPYKERNEL = ../arm/zaxpy.c
|
||||||
|
endif
|
||||||
|
|
||||||
SDOTKERNEL = dot_ppc440.S
|
SDOTKERNEL = dot_ppc440.S
|
||||||
DDOTKERNEL = dot_ppc440.S
|
DDOTKERNEL = dot_ppc440.S
|
||||||
|
|
|
@ -159,6 +159,11 @@
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifdef POWER3
|
||||||
|
#define PREFETCHSIZE_A 16
|
||||||
|
#define PREFETCHSIZE_C 16
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef POWER4
|
#ifdef POWER4
|
||||||
#define PREFETCHSIZE_A 16
|
#define PREFETCHSIZE_A 16
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
|
|
|
@ -124,6 +124,11 @@
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifdef POWER3
|
||||||
|
#define PREFETCHSIZE_A 16
|
||||||
|
#define PREFETCHSIZE_C 16
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef POWER4
|
#ifdef POWER4
|
||||||
#define PREFETCHSIZE_A 48
|
#define PREFETCHSIZE_A 48
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
|
|
|
@ -155,6 +155,11 @@
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifdef POWER3
|
||||||
|
#define PREFETCHSIZE_A 34
|
||||||
|
#define PREFETCHSIZE_C 16
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef POWER4
|
#ifdef POWER4
|
||||||
#define PREFETCHSIZE_A 34
|
#define PREFETCHSIZE_A 34
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
|
|
|
@ -129,6 +129,11 @@
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifdef POWER3
|
||||||
|
#define PREFETCHSIZE_A 34
|
||||||
|
#define PREFETCHSIZE_C 16
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef POWER4
|
#ifdef POWER4
|
||||||
#define PREFETCHSIZE_A 34
|
#define PREFETCHSIZE_A 34
|
||||||
#define PREFETCHSIZE_C 16
|
#define PREFETCHSIZE_C 16
|
||||||
|
|
34
param.h
34
param.h
|
@ -72,13 +72,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#ifndef PARAM_H
|
#ifndef PARAM_H
|
||||||
#define PARAM_H
|
#define PARAM_H
|
||||||
|
|
||||||
#define LONGCAST (BLASLONG)
|
|
||||||
#if defined(__BYTE_ORDER__)
|
|
||||||
#if __GNUC__ < 9
|
|
||||||
#undef LONGCAST
|
|
||||||
#define LONGCAST
|
|
||||||
#endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#define SBGEMM_DEFAULT_UNROLL_N 4
|
#define SBGEMM_DEFAULT_UNROLL_N 4
|
||||||
#define SBGEMM_DEFAULT_UNROLL_M 8
|
#define SBGEMM_DEFAULT_UNROLL_M 8
|
||||||
|
@ -2096,7 +2089,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#ifdef PPCG4
|
#ifdef PPCG4
|
||||||
#define GEMM_DEFAULT_OFFSET_A 0
|
#define GEMM_DEFAULT_OFFSET_A 0
|
||||||
#define GEMM_DEFAULT_OFFSET_B 1024
|
#define GEMM_DEFAULT_OFFSET_B 1024
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 16
|
#define SGEMM_DEFAULT_UNROLL_M 16
|
||||||
#define SGEMM_DEFAULT_UNROLL_N 4
|
#define SGEMM_DEFAULT_UNROLL_N 4
|
||||||
|
@ -2127,7 +2120,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A 2688
|
#define GEMM_DEFAULT_OFFSET_A 2688
|
||||||
#define GEMM_DEFAULT_OFFSET_B 3072
|
#define GEMM_DEFAULT_OFFSET_B 3072
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x03fffUL
|
#define GEMM_DEFAULT_ALIGN 0x03fffUL
|
||||||
|
|
||||||
#if defined(__BYTE_ORDER__)&&(__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
#if defined(__BYTE_ORDER__)&&(__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 4
|
#define SGEMM_DEFAULT_UNROLL_M 4
|
||||||
|
@ -2176,7 +2169,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A (32 * 0)
|
#define GEMM_DEFAULT_OFFSET_A (32 * 0)
|
||||||
#define GEMM_DEFAULT_OFFSET_B (32 * 0)
|
#define GEMM_DEFAULT_OFFSET_B (32 * 0)
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 4
|
#define SGEMM_DEFAULT_UNROLL_M 4
|
||||||
#define SGEMM_DEFAULT_UNROLL_N 4
|
#define SGEMM_DEFAULT_UNROLL_N 4
|
||||||
|
@ -2212,7 +2205,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A (32 * 0)
|
#define GEMM_DEFAULT_OFFSET_A (32 * 0)
|
||||||
#define GEMM_DEFAULT_OFFSET_B (32 * 0)
|
#define GEMM_DEFAULT_OFFSET_B (32 * 0)
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 8
|
#define SGEMM_DEFAULT_UNROLL_M 8
|
||||||
#define SGEMM_DEFAULT_UNROLL_N 4
|
#define SGEMM_DEFAULT_UNROLL_N 4
|
||||||
|
@ -2247,7 +2240,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#if defined(POWER3) || defined(POWER4) || defined(POWER5)
|
#if defined(POWER3) || defined(POWER4) || defined(POWER5)
|
||||||
#define GEMM_DEFAULT_OFFSET_A 0
|
#define GEMM_DEFAULT_OFFSET_A 0
|
||||||
#define GEMM_DEFAULT_OFFSET_B 2048
|
#define GEMM_DEFAULT_OFFSET_B 2048
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 4
|
#define SGEMM_DEFAULT_UNROLL_M 4
|
||||||
#define SGEMM_DEFAULT_UNROLL_N 4
|
#define SGEMM_DEFAULT_UNROLL_N 4
|
||||||
|
@ -2271,6 +2264,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#define DGEMM_DEFAULT_Q 216
|
#define DGEMM_DEFAULT_Q 216
|
||||||
#define DGEMM_DEFAULT_R 1012
|
#define DGEMM_DEFAULT_R 1012
|
||||||
|
|
||||||
|
#define CGEMM_DEFAULT_P 256
|
||||||
|
#define CGEMM_DEFAULT_Q 104
|
||||||
|
#define CGEMM_DEFAULT_R 1012
|
||||||
|
|
||||||
#define ZGEMM_DEFAULT_P 256
|
#define ZGEMM_DEFAULT_P 256
|
||||||
#define ZGEMM_DEFAULT_Q 104
|
#define ZGEMM_DEFAULT_Q 104
|
||||||
#define ZGEMM_DEFAULT_R 1012
|
#define ZGEMM_DEFAULT_R 1012
|
||||||
|
@ -2288,6 +2285,11 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#define CGEMM_DEFAULT_P 144
|
#define CGEMM_DEFAULT_P 144
|
||||||
#define ZGEMM_DEFAULT_P 144
|
#define ZGEMM_DEFAULT_P 144
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#define SGEMM_DEFAULT_Q 256
|
||||||
|
#define CGEMM_DEFAULT_Q 256
|
||||||
|
#define DGEMM_DEFAULT_Q 256
|
||||||
|
#define ZGEMM_DEFAULT_Q 256
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#if defined(POWER5)
|
#if defined(POWER5)
|
||||||
|
@ -2320,7 +2322,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A 384
|
#define GEMM_DEFAULT_OFFSET_A 384
|
||||||
#define GEMM_DEFAULT_OFFSET_B 1024
|
#define GEMM_DEFAULT_OFFSET_B 1024
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x03fffUL
|
#define GEMM_DEFAULT_ALIGN 0x03fffUL
|
||||||
|
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 4
|
#define SGEMM_DEFAULT_UNROLL_M 4
|
||||||
#define SGEMM_DEFAULT_UNROLL_N 4
|
#define SGEMM_DEFAULT_UNROLL_N 4
|
||||||
|
@ -2353,7 +2355,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
#define GEMM_DEFAULT_OFFSET_A 0
|
#define GEMM_DEFAULT_OFFSET_A 0
|
||||||
#define GEMM_DEFAULT_OFFSET_B 65536
|
#define GEMM_DEFAULT_OFFSET_B 65536
|
||||||
|
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
#if defined(__32BIT__)
|
#if defined(__32BIT__)
|
||||||
#warning using BINARY32==POWER6
|
#warning using BINARY32==POWER6
|
||||||
#define SGEMM_DEFAULT_UNROLL_M 4
|
#define SGEMM_DEFAULT_UNROLL_M 4
|
||||||
|
@ -2406,7 +2408,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A 0
|
#define GEMM_DEFAULT_OFFSET_A 0
|
||||||
#define GEMM_DEFAULT_OFFSET_B 65536
|
#define GEMM_DEFAULT_OFFSET_B 65536
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SWITCH_RATIO 16
|
#define SWITCH_RATIO 16
|
||||||
#define GEMM_PREFERED_SIZE 16
|
#define GEMM_PREFERED_SIZE 16
|
||||||
|
@ -2445,7 +2447,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
#define GEMM_DEFAULT_OFFSET_A 0
|
#define GEMM_DEFAULT_OFFSET_A 0
|
||||||
#define GEMM_DEFAULT_OFFSET_B 65536
|
#define GEMM_DEFAULT_OFFSET_B 65536
|
||||||
#define GEMM_DEFAULT_ALIGN LONGCAST 0x0ffffUL
|
#define GEMM_DEFAULT_ALIGN 0x0ffffUL
|
||||||
|
|
||||||
#define SWITCH_RATIO 16
|
#define SWITCH_RATIO 16
|
||||||
#define GEMM_PREFERED_SIZE 16
|
#define GEMM_PREFERED_SIZE 16
|
||||||
|
|
Loading…
Reference in New Issue