Use .p2align instead of .align for compatibility on Sandybridge as well

This commit is contained in:
Martin Kroeker
2018-02-24 19:43:15 +01:00
committed by GitHub
parent 2359c7c1a9
commit 7c1925acec
18 changed files with 32 additions and 32 deletions

View File

@@ -41,7 +41,7 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
"vxorpd %%ymm6, %%ymm6, %%ymm6 \n\t"
"vxorpd %%ymm7, %%ymm7, %%ymm7 \n\t"
-".align 16 \n\t"
+".p2align 4 \n\t"
"1: \n\t"
"vmovups (%2,%0,8), %%ymm12 \n\t" // 2 * x
"vmovups 32(%2,%0,8), %%ymm13 \n\t" // 2 * x