Bugfix for Haswell cgemm and zgemm kernels
This commit is contained in:
parent
35f668bb14
commit
b94ea89f52
@@ -26,7 +26,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 **********************************************************************************/
 
 /*********************************************************************
-* 2013/11/13 Saar
+* 2014/06/28 Saar
 * BLASTEST : OK
 * CTEST : OK
 * TEST : OK
@@ -816,16 +816,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #ifdef WINDOWS_ABI
 movq %rdi, 48(%rsp)
 movq %rsi, 56(%rsp)
-movups %xmm6, 64(%rsp)
-movups %xmm7, 80(%rsp)
-movups %xmm8, 96(%rsp)
-movups %xmm9, 112(%rsp)
-movups %xmm10, 128(%rsp)
-movups %xmm11, 144(%rsp)
-movups %xmm12, 160(%rsp)
-movups %xmm13, 176(%rsp)
-movups %xmm14, 192(%rsp)
-movups %xmm15, 208(%rsp)
+vmovups %xmm6, 64(%rsp)
+vmovups %xmm7, 80(%rsp)
+vmovups %xmm8, 96(%rsp)
+vmovups %xmm9, 112(%rsp)
+vmovups %xmm10, 128(%rsp)
+vmovups %xmm11, 144(%rsp)
+vmovups %xmm12, 160(%rsp)
+vmovups %xmm13, 176(%rsp)
+vmovups %xmm14, 192(%rsp)
+vmovups %xmm15, 208(%rsp)
 
 movq ARG1, OLD_M
 movq ARG2, OLD_N
@@ -838,6 +838,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 movsd OLD_OFFSET, %xmm12
 #endif
 vmovaps %xmm3, %xmm0
+vmovsd OLD_ALPHA_I, %xmm1
 
 #else
 movq STACKSIZE + 8(%rsp), LDC
@@ -2253,6 +2254,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 
 .L999:
+vzeroupper
+
 movq SP, %rsp
 movq (%rsp), %rbx
 movq 8(%rsp), %rbp
@@ -2264,16 +2267,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #ifdef WINDOWS_ABI
 movq 48(%rsp), %rdi
 movq 56(%rsp), %rsi
-movups 64(%rsp), %xmm6
-movups 80(%rsp), %xmm7
-movups 96(%rsp), %xmm8
-movups 112(%rsp), %xmm9
-movups 128(%rsp), %xmm10
-movups 144(%rsp), %xmm11
-movups 160(%rsp), %xmm12
-movups 176(%rsp), %xmm13
-movups 192(%rsp), %xmm14
-movups 208(%rsp), %xmm15
+vmovups 64(%rsp), %xmm6
+vmovups 80(%rsp), %xmm7
+vmovups 96(%rsp), %xmm8
+vmovups 112(%rsp), %xmm9
+vmovups 128(%rsp), %xmm10
+vmovups 144(%rsp), %xmm11
+vmovups 160(%rsp), %xmm12
+vmovups 176(%rsp), %xmm13
+vmovups 192(%rsp), %xmm14
+vmovups 208(%rsp), %xmm15
 #endif
 
 addq $ STACKSIZE, %rsp
|
|
@@ -26,7 +26,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 **********************************************************************************/
 
 /********************************************************************************
-* 2013/11/13 Saar
+* 2014/06/28 Saar
 * BLASTEST : OK
 * CTEST : OK
 * TEST : OK
@@ -693,16 +693,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #ifdef WINDOWS_ABI
 movq %rdi, 48(%rsp)
 movq %rsi, 56(%rsp)
-movups %xmm6, 64(%rsp)
-movups %xmm7, 80(%rsp)
-movups %xmm8, 96(%rsp)
-movups %xmm9, 112(%rsp)
-movups %xmm10, 128(%rsp)
-movups %xmm11, 144(%rsp)
-movups %xmm12, 160(%rsp)
-movups %xmm13, 176(%rsp)
-movups %xmm14, 192(%rsp)
-movups %xmm15, 208(%rsp)
+vmovups %xmm6, 64(%rsp)
+vmovups %xmm7, 80(%rsp)
+vmovups %xmm8, 96(%rsp)
+vmovups %xmm9, 112(%rsp)
+vmovups %xmm10, 128(%rsp)
+vmovups %xmm11, 144(%rsp)
+vmovups %xmm12, 160(%rsp)
+vmovups %xmm13, 176(%rsp)
+vmovups %xmm14, 192(%rsp)
+vmovups %xmm15, 208(%rsp)
 
 movq ARG1, OLD_M
 movq ARG2, OLD_N
@@ -715,6 +715,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 movsd OLD_OFFSET, %xmm12
 #endif
 vmovaps %xmm3, %xmm0
+vmovsd OLD_ALPHA_I, %xmm1
 
 #else
 movq STACKSIZE + 8(%rsp), LDC
@@ -1781,6 +1782,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 
 .L999:
+vzeroupper
+
 movq SP, %rsp
 movq (%rsp), %rbx
 movq 8(%rsp), %rbp
@@ -1792,16 +1795,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #ifdef WINDOWS_ABI
 movq 48(%rsp), %rdi
 movq 56(%rsp), %rsi
-movups 64(%rsp), %xmm6
-movups 80(%rsp), %xmm7
-movups 96(%rsp), %xmm8
-movups 112(%rsp), %xmm9
-movups 128(%rsp), %xmm10
-movups 144(%rsp), %xmm11
-movups 160(%rsp), %xmm12
-movups 176(%rsp), %xmm13
-movups 192(%rsp), %xmm14
-movups 208(%rsp), %xmm15
+vmovups 64(%rsp), %xmm6
+vmovups 80(%rsp), %xmm7
+vmovups 96(%rsp), %xmm8
+vmovups 112(%rsp), %xmm9
+vmovups 128(%rsp), %xmm10
+vmovups 144(%rsp), %xmm11
+vmovups 160(%rsp), %xmm12
+vmovups 176(%rsp), %xmm13
+vmovups 192(%rsp), %xmm14
+vmovups 208(%rsp), %xmm15
 #endif
 
 addq $ STACKSIZE, %rsp
|
|
Loading…
Reference in New Issue