Skip to content

Commit 7c1925a

Browse files
authored
Use .p2align instead of .align for compatibility on Sandybridge as well
1 parent 2359c7c commit 7c1925a

18 files changed

+32
-32
lines changed

kernel/x86_64/caxpy_microk_sandy-2.c

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -50,11 +50,11 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
5050
"vmulps (%5), %%ymm0 , %%ymm0 \n\t"
5151
#endif
5252

53-
".align 16 \n\t"
53+
".p2align 4 \n\t"
5454
"1: \n\t"
5555

5656
"vmovups (%2,%0,4), %%ymm5 \n\t" // 4 complex values from x
57-
".align 2 \n\t"
57+
".p2align 1 \n\t"
5858
"vmovups 32(%2,%0,4), %%ymm7 \n\t" // 4 complex values from x
5959
"vmovups 64(%2,%0,4), %%ymm9 \n\t" // 4 complex values from x
6060
"vmovups 96(%2,%0,4), %%ymm11 \n\t" // 4 complex values from x
@@ -85,7 +85,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
8585
"vaddps %%ymm10, %%ymm11, %%ymm11 \n\t"
8686

8787
"vmovups %%ymm5 , (%3,%0,4) \n\t"
88-
".align 2 \n\t"
88+
".p2align 1 \n\t"
8989
"vmovups %%ymm7 , 32(%3,%0,4) \n\t"
9090
"vmovups %%ymm9 , 64(%3,%0,4) \n\t"
9191
"vmovups %%ymm11, 96(%3,%0,4) \n\t"

kernel/x86_64/cdot_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@ static void cdot_kernel_16( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
4646
"vxorps %%ymm6, %%ymm6, %%ymm6 \n\t"
4747
"vxorps %%ymm7, %%ymm7, %%ymm7 \n\t"
4848

49-
".align 16 \n\t"
49+
".p2align 4 \n\t"
5050
"1: \n\t"
5151
"vmovups (%2,%0,4), %%ymm8 \n\t" // 2 * x
5252
"vmovups 32(%2,%0,4), %%ymm9 \n\t" // 2 * x

kernel/x86_64/daxpy_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ static void daxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
5050
"subq $16, %1 \n\t"
5151
"jz 2f \n\t"
5252

53-
".align 16 \n\t"
53+
".p2align 4 \n\t"
5454
"1: \n\t"
5555

5656
"vmulpd %%ymm4, %%ymm0, %%ymm4 \n\t"

kernel/x86_64/ddot_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -41,7 +41,7 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
4141
"vxorpd %%ymm6, %%ymm6, %%ymm6 \n\t"
4242
"vxorpd %%ymm7, %%ymm7, %%ymm7 \n\t"
4343

44-
".align 16 \n\t"
44+
".p2align 4 \n\t"
4545
"1: \n\t"
4646
"vmovups (%2,%0,8), %%ymm12 \n\t" // 2 * x
4747
"vmovups 32(%2,%0,8), %%ymm13 \n\t" // 2 * x

kernel/x86_64/dger_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -53,7 +53,7 @@ static void dger_kernel_16( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
5353
"subq $8, %1 \n\t"
5454
"jz 2f \n\t"
5555

56-
".align 8 \n\t"
56+
".p2align 3 \n\t"
5757
"1: \n\t"
5858

5959
"vmulpd %%xmm4, %%xmm0, %%xmm4 \n\t"

kernel/x86_64/dscal_microk_sandy-2.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -58,7 +58,7 @@ static void dscal_kernel_8( BLASLONG n, FLOAT *alpha, FLOAT *x)
5858
"subq $1 , %0 \n\t"
5959
"jz 2f \n\t"
6060

61-
".align 16 \n\t"
61+
".p2align 4 \n\t"
6262
"1: \n\t"
6363
"prefetcht0 640(%1) \n\t"
6464

@@ -156,7 +156,7 @@ static void dscal_kernel_8_zero( BLASLONG n, FLOAT *alpha, FLOAT *x)
156156
"cmpq $0, %0 \n\t"
157157
"je 2f \n\t"
158158

159-
".align 16 \n\t"
159+
".p2align 4 \n\t"
160160
"1: \n\t"
161161

162162
"vmovups %%xmm0 ,-128(%1) \n\t"

kernel/x86_64/dsymv_L_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -44,7 +44,7 @@ static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
4444
"vbroadcastsd 16(%8), %%ymm6 \n\t" // temp1[1]
4545
"vbroadcastsd 24(%8), %%ymm7 \n\t" // temp1[1]
4646

47-
".align 16 \n\t"
47+
".p2align 4 \n\t"
4848
"1: \n\t"
4949

5050
"vmovups (%3,%0,8), %%ymm9 \n\t" // 2 * y

kernel/x86_64/dsymv_U_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@ static void dsymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
4646
"vbroadcastsd 24(%8), %%ymm7 \n\t" // temp1[1]
4747
"xorq %0,%0 \n\t"
4848

49-
".align 16 \n\t"
49+
".p2align 4 \n\t"
5050
"1: \n\t"
5151

5252
"vmovups (%3,%0,8), %%ymm9 \n\t" // 2 * y

kernel/x86_64/saxpy_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ static void saxpy_kernel_16( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
5050
"subq $32, %1 \n\t"
5151
"jz 2f \n\t"
5252

53-
".align 16 \n\t"
53+
".p2align 4 \n\t"
5454
"1: \n\t"
5555

5656
"vmulps %%ymm4, %%ymm0, %%ymm4 \n\t"

kernel/x86_64/sdot_microk_sandy-2.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -41,7 +41,7 @@ static void sdot_kernel_16( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
4141
"vxorps %%ymm6, %%ymm6, %%ymm6 \n\t"
4242
"vxorps %%ymm7, %%ymm7, %%ymm7 \n\t"
4343

44-
".align 16 \n\t"
44+
".p2align 4 \n\t"
4545
"1: \n\t"
4646
"vmovups (%2,%0,4), %%ymm12 \n\t" // 2 * x
4747
"vmovups 32(%2,%0,4), %%ymm13 \n\t" // 2 * x

0 commit comments

Comments
 (0)