Skip to content

Commit a388c4b

Browse files
authored
Merge pull request #4872 from chenx97/ls3a-fix-stack-fpr-len
Use ldc1 and sdc1 for the prologue and epilogue on LOONGSON3A
2 parents f24b521 + ef94b96 commit a388c4b

File tree

1 file changed

+18
-18
lines changed

1 file changed

+18
-18
lines changed

kernel/mips64/cgemm_kernel_loongson3a_4x2_ps.S

Lines changed: 18 additions & 18 deletions
Original file line number | Diff line number | Diff line change
@@ -131,11 +131,11 @@
131131
sd $21, 40($sp)
132132
sd $22, 48($sp)
133133

134-
ST $f24, 56($sp)
135-
ST $f25, 64($sp)
136-
ST $f26, 72($sp)
137-
ST $f27, 80($sp)
138-
ST $f28, 88($sp)
134+
sdc1 $f24, 56($sp)
135+
sdc1 $f25, 64($sp)
136+
sdc1 $f26, 72($sp)
137+
sdc1 $f27, 80($sp)
138+
sdc1 $f28, 88($sp)
139139

140140
#if defined(TRMMKERNEL)
141141
sd $23, 96($sp)
@@ -146,10 +146,10 @@
146146
#endif
147147

148148
#ifndef __64BIT__
149-
ST $f20,120($sp)
150-
ST $f21,128($sp)
151-
ST $f22,136($sp)
152-
ST $f23,144($sp)
149+
sdc1 $f20,120($sp)
150+
sdc1 $f21,128($sp)
151+
sdc1 $f22,136($sp)
152+
sdc1 $f23,144($sp)
153153
#endif
154154

155155
.align 4
@@ -4000,11 +4000,11 @@
40004000
ld $21, 40($sp)
40014001
ld $22, 48($sp)
40024002

4003-
LD $f24, 56($sp)
4004-
LD $f25, 64($sp)
4005-
LD $f26, 72($sp)
4006-
LD $f27, 80($sp)
4007-
LD $f28, 88($sp)
4003+
ldc1 $f24, 56($sp)
4004+
ldc1 $f25, 64($sp)
4005+
ldc1 $f26, 72($sp)
4006+
ldc1 $f27, 80($sp)
4007+
ldc1 $f28, 88($sp)
40084008

40094009
#if defined(TRMMKERNEL)
40104010
ld $23, 96($sp)
@@ -4013,10 +4013,10 @@
40134013
#endif
40144014

40154015
#ifndef __64BIT__
4016-
LD $f20,120($sp)
4017-
LD $f21,128($sp)
4018-
LD $f22,136($sp)
4019-
LD $f23,144($sp)
4016+
ldc1 $f20,120($sp)
4017+
ldc1 $f21,128($sp)
4018+
ldc1 $f22,136($sp)
4019+
ldc1 $f23,144($sp)
40204020
#endif
40214021

40224022
daddiu $sp,$sp,STACKSIZE

0 commit comments

Comments
 (0)