Merge pull request #4699 from ChipKerchner/fixSwapVectorOrder
POWER: Fixing endianness issue in cswap/zswap kernel for AIX
This commit is contained in:
commit
ce96e0e50f
|
@ -58,6 +58,16 @@ static void cswap_kernel_32 (long n, float *x, float *y)
|
|||
"lxvp 62, 224(%3) \n\t"
|
||||
|
||||
|
||||
#if (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
||||
"stxv 32, 0(%3) \n\t"
|
||||
"stxv 33, 16(%3) \n\t"
|
||||
"stxv 34, 32(%3) \n\t"
|
||||
"stxv 35, 48(%3) \n\t"
|
||||
"stxv 36, 64(%3) \n\t"
|
||||
"stxv 37, 80(%3) \n\t"
|
||||
"stxv 38, 96(%3) \n\t"
|
||||
"stxv 39, 112(%3) \n\t"
|
||||
#else
|
||||
"stxv 33, 0(%3) \n\t"
|
||||
"stxv 32, 16(%3) \n\t"
|
||||
"stxv 35, 32(%3) \n\t"
|
||||
|
@ -66,9 +76,20 @@ static void cswap_kernel_32 (long n, float *x, float *y)
|
|||
"stxv 36, 80(%3) \n\t"
|
||||
"stxv 39, 96(%3) \n\t"
|
||||
"stxv 38, 112(%3) \n\t"
|
||||
#endif
|
||||
|
||||
"addi %3, %3, 128 \n\t"
|
||||
|
||||
#if (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
||||
"stxv 40, 0(%3) \n\t"
|
||||
"stxv 41, 16(%3) \n\t"
|
||||
"stxv 42, 32(%3) \n\t"
|
||||
"stxv 43, 48(%3) \n\t"
|
||||
"stxv 44, 64(%3) \n\t"
|
||||
"stxv 45, 80(%3) \n\t"
|
||||
"stxv 46, 96(%3) \n\t"
|
||||
"stxv 47, 112(%3) \n\t"
|
||||
#else
|
||||
"stxv 41, 0(%3) \n\t"
|
||||
"stxv 40, 16(%3) \n\t"
|
||||
"stxv 43, 32(%3) \n\t"
|
||||
|
@ -77,9 +98,20 @@ static void cswap_kernel_32 (long n, float *x, float *y)
|
|||
"stxv 44, 80(%3) \n\t"
|
||||
"stxv 47, 96(%3) \n\t"
|
||||
"stxv 46, 112(%3) \n\t"
|
||||
#endif
|
||||
|
||||
"addi %3, %3, 128 \n\t"
|
||||
|
||||
#if (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
||||
"stxv 48, 0(%4) \n\t"
|
||||
"stxv 49, 16(%4) \n\t"
|
||||
"stxv 50, 32(%4) \n\t"
|
||||
"stxv 51, 48(%4) \n\t"
|
||||
"stxv 52, 64(%4) \n\t"
|
||||
"stxv 53, 80(%4) \n\t"
|
||||
"stxv 54, 96(%4) \n\t"
|
||||
"stxv 55, 112(%4) \n\t"
|
||||
#else
|
||||
"stxv 49, 0(%4) \n\t"
|
||||
"stxv 48, 16(%4) \n\t"
|
||||
"stxv 51, 32(%4) \n\t"
|
||||
|
@ -88,9 +120,20 @@ static void cswap_kernel_32 (long n, float *x, float *y)
|
|||
"stxv 52, 80(%4) \n\t"
|
||||
"stxv 55, 96(%4) \n\t"
|
||||
"stxv 54, 112(%4) \n\t"
|
||||
#endif
|
||||
|
||||
"addi %4, %4, 128 \n\t"
|
||||
|
||||
#if (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
|
||||
"stxv 56, 0(%4) \n\t"
|
||||
"stxv 57, 16(%4) \n\t"
|
||||
"stxv 58, 32(%4) \n\t"
|
||||
"stxv 59, 48(%4) \n\t"
|
||||
"stxv 60, 64(%4) \n\t"
|
||||
"stxv 61, 80(%4) \n\t"
|
||||
"stxv 62, 96(%4) \n\t"
|
||||
"stxv 63, 112(%4) \n\t"
|
||||
#else
|
||||
"stxv 57, 0(%4) \n\t"
|
||||
"stxv 56, 16(%4) \n\t"
|
||||
"stxv 59, 32(%4) \n\t"
|
||||
|
@ -99,6 +142,7 @@ static void cswap_kernel_32 (long n, float *x, float *y)
|
|||
"stxv 60, 80(%4) \n\t"
|
||||
"stxv 63, 96(%4) \n\t"
|
||||
"stxv 62, 112(%4) \n\t"
|
||||
#endif
|
||||
|
||||
"addi %4, %4, 128 \n\t"
|
||||
|
||||
|
|
Loading…
Reference in New Issue