From a3cac9cca0fb81ae6b3c13275ad15999fdba0df0 Mon Sep 17 00:00:00 2001 From: Xianyi Zhang Date: Fri, 18 Dec 2020 11:53:23 +0800 Subject: [PATCH] Update sgemm kernel 1x4 for C910. --- kernel/riscv64/sgemm_kernel_16x4_c910v.c | 131 ++++++++++++++++------- 1 file changed, 94 insertions(+), 37 deletions(-) diff --git a/kernel/riscv64/sgemm_kernel_16x4_c910v.c b/kernel/riscv64/sgemm_kernel_16x4_c910v.c index 83507e744..65bde2fda 100644 --- a/kernel/riscv64/sgemm_kernel_16x4_c910v.c +++ b/kernel/riscv64/sgemm_kernel_16x4_c910v.c @@ -382,7 +382,7 @@ int CNAME(BLASLONG bm,BLASLONG bn,BLASLONG bk,FLOAT alpha,FLOAT* ba,FLOAT* bb,FL { BLASLONG i,j,k; FLOAT *C0,*C1,*C2,*C3; - FLOAT *ptrba,*ptrbb; + FLOAT *ptrba,*ptrbb, *tmpc; FLOAT loadb0,loadb1,loadb2,loadb3; FLOAT load0,load1,load2,load3,load4,load5,load6,load7; @@ -392,6 +392,7 @@ int CNAME(BLASLONG bm,BLASLONG bn,BLASLONG bk,FLOAT alpha,FLOAT* ba,FLOAT* bb,FL FLOAT res8,res9,res10,res11; FLOAT res12,res13,res14,res15; + for (j=0; j