Fix IDAMAX

2023-06-26 21:19:33 +02:00 · 2023-06-26 21:19:33 +02:00 · d6be5036d7
parent dc2439108d
commit d6be5036d7
1 changed files with 27 additions and 13 deletions
--- a/kernel/riscv64/iamax_vector.c
+++ b/kernel/riscv64/iamax_vector.c
@ -29,8 +29,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #include <math.h>
 #if defined(DOUBLE)
-
+#define VFMVFS_FLOAT vfmv_f_s_f64m1_f64
 #define ABS fabs
 #define VSETVL(n) vsetvl_e64m8(n)
 #define VSETVL_MAX vsetvlmax_e64m1()
 #define FLOAT_V_T vfloat64m8_t
@ -54,8 +53,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #define VADDVX_UINT vadd_vx_u64m8
 #define VMVVX_UINT vmv_v_x_u64m8
 #else
-
+#define VFMVFS_FLOAT vfmv_f_s_f32m1_f32
 #define ABS fabsf
 #define VSETVL(n) vsetvl_e32m8(n)
 #define VSETVL_MAX vsetvlmax_e32m1()
 #define FLOAT_V_T vfloat32m8_t
@ -85,7 +83,11 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
 {
 	BLASLONG i=0, j=0;
 	FLOAT maxf=0.0;
 #ifdef DOUBLE
        BLASLONG max_index = 0;
 #else
        unsigned int max_index = 0;
 #endif
 	if (n <= 0 || inc_x <= 0) return(max_index);
        FLOAT_V_T vx, v_max;
@ -117,11 +119,14 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                        j += gvl;
                }
                v_res = VFREDMAXVS_FLOAT(v_res, v_max, v_z0, gvl);
-                maxf = *((FLOAT*)&v_res);
+                maxf = VFMVFS_FLOAT(v_res);
                mask = VMFGEVF_FLOAT(v_max, maxf, gvl);
                max_index = VMFIRSTM(mask,gvl);
-                max_index = *((unsigned int*)&v_max_index+max_index);
+#ifdef DOUBLE
-
+		max_index = *((BLASLONG *)&v_max_index+max_index);
 #else
 		max_index = *((unsigned int *)&v_max_index+max_index);
 #endif
                if(j < n){
                        gvl = VSETVL(n-j);
                        vx = VLEV_FLOAT(&x[j], gvl);
@ -130,7 +135,7 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                        v_max = VFRSUBVF_MASK_FLOAT(mask, vx, vx, 0, gvl);
                        v_res = VFREDMAXVS_FLOAT(v_res, v_max, v_z0, gvl);
-                        FLOAT cur_maxf = *((FLOAT*)&v_res);
+                        FLOAT cur_maxf = VFMVFS_FLOAT(v_res);
                        if(cur_maxf > maxf){
                                //tail index
                                v_max_index = VIDV_UINT(gvl);
@ -138,7 +143,11 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                                mask = VMFGEVF_FLOAT(v_max, cur_maxf, gvl);
                                max_index = VMFIRSTM(mask,gvl);
 #ifdef DOUBLE
                                max_index = *((BLASLONG*)&v_max_index+max_index);
 #else
                                max_index = *((unsigned int*)&v_max_index+max_index);
 #endif
                        }
                }
        }else{
@ -165,11 +174,14 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                        idx += inc_v;
                }
                v_res = VFREDMAXVS_FLOAT(v_res, v_max, v_z0, gvl);
-                maxf = *((FLOAT*)&v_res);
+                maxf = VFMVFS_FLOAT(v_res);
                mask = VMFGEVF_FLOAT(v_max, maxf, gvl);
                max_index = VMFIRSTM(mask,gvl);
 #ifdef DOUBLE
                max_index = *((BLASLONG*)&v_max_index+max_index);
 #else
                max_index = *((unsigned int*)&v_max_index+max_index);
-
+#endif
                if(j < n){
                        gvl = VSETVL(n-j);
                        vx = VLSEV_FLOAT(&x[idx], stride_x, gvl);
@ -178,7 +190,7 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                        v_max = VFRSUBVF_MASK_FLOAT(mask, vx, vx, 0, gvl);
                        v_res = VFREDMAXVS_FLOAT(v_res, v_max, v_z0, gvl);
-                        FLOAT cur_maxf = *((FLOAT*)&v_res);
+                        FLOAT cur_maxf = VFMVFS_FLOAT(v_res);
                        if(cur_maxf > maxf){
                                //tail index
                                v_max_index = VIDV_UINT(gvl);
@ -186,11 +198,13 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
                                mask = VMFGEVF_FLOAT(v_max, cur_maxf, gvl);
                                max_index = VMFIRSTM(mask,gvl);
 #ifdef DOUBLE
                                max_index = *((BLASLONG*)&v_max_index+max_index);
 #else
                                max_index = *((unsigned int*)&v_max_index+max_index);
 #endif
                        }
                }
        }
 	return(max_index+1);
 }