diff --git a/kernel/power/sbgemv_common.c b/kernel/power/sbgemv_common.c index ad040b371..156eadce7 100644 --- a/kernel/power/sbgemv_common.c +++ b/kernel/power/sbgemv_common.c @@ -111,11 +111,6 @@ FORCEINLINE vec_f32 vec_loadNHi_mult(vec_bf16 *in, vec_f32 v_inp0, BLASLONG n, v return (v_inp0 * v_in00); } -FORCEINLINE vec_f32 vec_loadNHi_vec(vec_bf16 *in, BLASLONG i, BLASLONG n, vec_bf16 zero) -{ - return vec_loadNHi(&in[i], n, zero); -} - FORCEINLINE void copy_x(BLASLONG n, IFLOAT *src, IFLOAT *dest, BLASLONG inc_src) { for (BLASLONG i = 0; i < n; i++) { diff --git a/kernel/power/sbgemv_t_vsx.c b/kernel/power/sbgemv_t_vsx.c index 272dccef7..9d5e6d997 100644 --- a/kernel/power/sbgemv_t_vsx.c +++ b/kernel/power/sbgemv_t_vsx.c @@ -66,7 +66,7 @@ static void BF16GEMV_T_VSX_1(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL temp0 += vec_loadN_mult(&va0[i], inp, n, zero); } else if (n) { - inp[0] = vec_loadNHi_vec(v_x, i, n, zero); + inp[0] = vec_loadNHi(&v_x[i], n, zero); temp0 += vec_loadNHi_mult(&va0[i], inp[0], n, zero); } @@ -105,7 +105,7 @@ static void BF16GEMV_T_VSX_2(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL temp0 += vec_loadN_mult(&va0[i], inp, n, zero); temp1 += vec_loadN_mult(&va1[i], inp, n, zero); } else if (n) { - inp[0] = vec_loadNHi_vec(v_x, i, n, zero); + inp[0] = vec_loadNHi(&v_x[i], n, zero); temp0 += vec_loadNHi_mult(&va0[i], inp[0], n, zero); temp1 += vec_loadNHi_mult(&va1[i], inp[0], n, zero); @@ -156,7 +156,7 @@ static void BF16GEMV_T_VSX_4(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL temp2 += vec_loadN_mult(&va2[i], inp, n, zero); temp3 += vec_loadN_mult(&va3[i], inp, n, zero); } else if (n) { - inp[0] = vec_loadNHi_vec(v_x, i, n, zero); + inp[0] = vec_loadNHi(&v_x[i], n, zero); temp0 += vec_loadNHi_mult(&va0[i], inp[0], n, zero); temp1 += vec_loadNHi_mult(&va1[i], inp[0], n, zero); @@ -245,7 +245,7 @@ static void BF16GEMV_T_VSX_8(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL temp6 += vec_loadN_mult(&va6[i], inp, n, zero); temp7 += vec_loadN_mult(&va7[i], inp, n, zero); } else if (n) { - inp[0] = vec_loadNHi_vec(v_x, i, n, zero); + inp[0] = vec_loadNHi(&v_x[i], n, zero); temp0 += vec_loadNHi_mult(&va0[i], inp[0], n, zero); temp1 += vec_loadNHi_mult(&va1[i], inp[0], n, zero);