Refs #171. Zero-pad the buffer so the sgemv_t x86 kernel does not load stale ("dirty") values from it.
This commit is contained in:
parent
fd3046b32a
commit
91ed4e4450
|
@ -236,6 +236,20 @@
|
||||||
jg .L06
|
jg .L06
|
||||||
ALIGN_4
|
ALIGN_4
|
||||||
|
|
||||||
|
// Zero-pad the buffer so that later reads do not pick up stale ("dirty")
// values left in it.
// Stores J = 8 - (M & 7) zero elements starting at Y1, advancing Y1 by SIZE
// per element. J is always in 1..8, so at least one zero is written; when M
// is a multiple of 8, a full 8 zeros are written.
// NOTE(review): presumably Y1 points just past the last element copied by the
// preceding .L06 loop, and SIZE is the 4-byte single-precision element size
// matching movss - confirm against the rest of the file.
|
||||||
|
movl M, I
|
||||||
|
movl $8, J
|
||||||
|
andl $7, I    // I = M & 7 (M modulo 8)
|
||||||
|
xorps %xmm0, %xmm0    // xmm0 = 0.0, the value used for padding
|
||||||
|
subl I, J    // J = 8 - (M & 7): number of zeros to store (1..8)
|
||||||
|
ALIGN_2
|
||||||
|
.L07:
|
||||||
|
movss %xmm0, 0 * SIZE(Y1)    // store one single-precision zero at Y1
|
||||||
|
addl $SIZE, Y1    // advance Y1 to the next element
|
||||||
|
decl J
|
||||||
|
jg .L07    // loop while the decremented J is still > 0
|
||||||
|
ALIGN_4
|
||||||
|
|
||||||
.L10:
|
.L10:
|
||||||
movl Y, Y1
|
movl Y, Y1
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue