[ZARCH] Fix iamax/imax single precision

This commit is contained in:
maamountki 2019-01-28 17:52:23 +02:00 committed by GitHub
parent 04873bb174
commit c7143c1019
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
6 changed files with 12 additions and 0 deletions

View File

@@ -248,6 +248,8 @@ static BLASLONG icamax_kernel_32(BLASLONG n, FLOAT *x, FLOAT *amax)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v2,%%v0 \n\t" "wfchsb %%v4,%%v2,%%v0 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"

View File

@@ -248,6 +248,8 @@ static BLASLONG icamin_kernel_32(BLASLONG n, FLOAT *x, FLOAT *amin)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v0,%%v2 \n\t" "wfchsb %%v4,%%v0,%%v2 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"

View File

@@ -216,6 +216,8 @@ static BLASLONG isamax_kernel_64(BLASLONG n, FLOAT *x, FLOAT *amax)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v2,%%v0 \n\t" "wfchsb %%v4,%%v2,%%v0 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"

View File

@@ -216,6 +216,8 @@ static BLASLONG isamin_kernel_64(BLASLONG n, FLOAT *x, FLOAT *amin)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v0,%%v2 \n\t" "wfchsb %%v4,%%v0,%%v2 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"

View File

@@ -192,6 +192,8 @@ static BLASLONG ismax_kernel_64(BLASLONG n, FLOAT *x, FLOAT *max)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v2,%%v0 \n\t" "wfchsb %%v4,%%v2,%%v0 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"

View File

@@ -192,6 +192,8 @@ static BLASLONG ismin_kernel_64(BLASLONG n, FLOAT *x, FLOAT *min)
"j 2f \n\t" "j 2f \n\t"
"1: \n\t" "1: \n\t"
"wfchsb %%v4,%%v0,%%v2 \n\t" "wfchsb %%v4,%%v0,%%v2 \n\t"
"vesrlg %%v4,%%v4,32 \n\t"
"vsegf %%v4,%%v4 \n\t"
"vsel %%v1,%%v3,%%v1,%%v4 \n\t" "vsel %%v1,%%v3,%%v1,%%v4 \n\t"
"vsel %%v0,%%v2,%%v0,%%v4 \n\t" "vsel %%v0,%%v2,%%v0,%%v4 \n\t"
"ste %%f0,%1 \n\t" "ste %%f0,%1 \n\t"