Skip to content

Commit dcfe782

Browse files
authored
Merge pull request #4540 from ErnstPeng/feature-branch
Optimized ssymv and dsymv kernel LASX for LoongArch
2 parents 7804973 + 6546600 commit dcfe782

File tree

5 files changed

+1734
-0
lines changed

5 files changed

+1734
-0
lines changed

kernel/loongarch64/KERNEL.LOONGSON3R5

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -98,6 +98,9 @@ DGEMMOTCOPYOBJ = dgemm_otcopy$(TSUFFIX).$(SUFFIX)
 DGEMVNKERNEL = dgemv_n_8_lasx.S
 DGEMVTKERNEL = dgemv_t_8_lasx.S
 
+DSYMV_U_KERNEL = dsymv_U_lasx.S
+DSYMV_L_KERNEL = dsymv_L_lasx.S
+
 SGEMMKERNEL = sgemm_kernel_16x8_lasx.S
 SGEMMINCOPY = sgemm_ncopy_16_lasx.S
 SGEMMITCOPY = sgemm_tcopy_16_lasx.S
@@ -111,6 +114,9 @@ SGEMMOTCOPYOBJ = sgemm_otcopy$(TSUFFIX).$(SUFFIX)
 SGEMVNKERNEL = sgemv_n_8_lasx.S
 SGEMVTKERNEL = sgemv_t_8_lasx.S
 
+SSYMV_U_KERNEL = ssymv_U_lasx.S
+SSYMV_L_KERNEL = ssymv_L_lasx.S
+
 CGEMMKERNEL = cgemm_kernel_16x4_lasx.S
 CGEMMINCOPY = cgemm_ncopy_16_lasx.S
 CGEMMITCOPY = cgemm_tcopy_16_lasx.S

0 commit comments

Comments
 (0)