Skip to content

Commit 729303e

Browse files
authored
Merge pull request #2643 from craft-zhang/cortex-a53
Improve performance of SGEMM on Arm Cortex-A53
2 parents 5479655 + 9b7877c commit 729303e

File tree

4 files changed

+1589
-353
lines changed

4 files changed

+1589
-353
lines changed

kernel/arm64/KERNEL.CORTEXA53

Lines changed: 1 addition & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -126,16 +126,9 @@ endif
126 126   SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
127 127   SGEMMITCOPYOBJ = sgemm_itcopy$(TSUFFIX).$(SUFFIX)
128 128   endif
129     - ifeq ($(SGEMM_UNROLL_N), 16)
    129 +
130 130   SGEMMOTCOPY = sgemm_tcopy_$(SGEMM_UNROLL_N).S
131     - else
132     - SGEMMOTCOPY = ../generic/gemm_tcopy_$(SGEMM_UNROLL_N).c
133     - endif
134     - ifeq ($(SGEMM_UNROLL_N), 4)
135 131   SGEMMONCOPY = sgemm_ncopy_$(SGEMM_UNROLL_N).S
136     - else
137     - SGEMMONCOPY = ../generic/gemm_ncopy_$(SGEMM_UNROLL_N).c
138     - endif
139 132   SGEMMONCOPYOBJ = sgemm_oncopy$(TSUFFIX).$(SUFFIX)
140 133   SGEMMOTCOPYOBJ = sgemm_otcopy$(TSUFFIX).$(SUFFIX)
141 134
0 commit comments

Comments (0)