@@ -50,11 +50,11 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
5050 "vmulps (%5), %%ymm0 , %%ymm0 \n\t"
5151#endif
5252
53- ".align 16 \n\t"
53+ ".p2align 4 \n\t"
5454 "1: \n\t"
5555
5656 "vmovups (%2,%0,4), %%ymm5 \n\t" // 4 complex values from x
57- ".align 2 \n\t"
57+ ".p2align 1 \n\t"
5858 "vmovups 32(%2,%0,4), %%ymm7 \n\t" // 4 complex values from x
5959 "vmovups 64(%2,%0,4), %%ymm9 \n\t" // 4 complex values from x
6060 "vmovups 96(%2,%0,4), %%ymm11 \n\t" // 4 complex values from x
@@ -70,7 +70,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
7070 "vpermilps $0xb1 , %%ymm11, %%ymm10 \n\t" // exchange real and imag part
7171
7272 "vfmadd213ps (%3,%0,4), %%ymm0 , %%ymm5 \n\t"
73- ".align 2 \n\t"
73+ ".p2align 1 \n\t"
7474 "vfmadd213ps 32(%3,%0,4), %%ymm0 , %%ymm7 \n\t"
7575 "vfmadd213ps 64(%3,%0,4), %%ymm0 , %%ymm9 \n\t"
7676 "vfmadd213ps 96(%3,%0,4), %%ymm0 , %%ymm11 \n\t"
@@ -96,7 +96,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
9696 "vfmadd231ps %%ymm1 , %%ymm10, %%ymm15 \n\t"
9797
9898 "vmovups %%ymm5 , (%3,%0,4) \n\t"
99- ".align 2 \n\t"
99+ ".p2align 1 \n\t"
100100 "vmovups %%ymm7 , 32(%3,%0,4) \n\t"
101101 "vmovups %%ymm9 , 64(%3,%0,4) \n\t"
102102 "vmovups %%ymm11, 96(%3,%0,4) \n\t"
0 commit comments