Skip to content

Commit 2241068

Browse files
authored
Merge pull request #3469 from martin-frbg/issue2986
Roll back SkylakeX DGEMM kernels to 4x8 when compiling for DYNAMIC_ARCH
2 parents 3e9a528 + 5378046 commit 2241068

File tree

2 files changed: 14 additions and 0 deletions.

kernel/x86_64/KERNEL.SKYLAKEX

Lines changed: 6 additions & 0 deletions
@@ -20,13 +20,19 @@ SGEMM_SMALL_K_B0_TN = sgemm_small_kernel_tn_skylakex.c
 SGEMM_SMALL_K_TT = sgemm_small_kernel_tt_skylakex.c
 SGEMM_SMALL_K_B0_TT = sgemm_small_kernel_tt_skylakex.c
 
+ifndef DYNAMIC_ARCH
 DGEMMKERNEL = dgemm_kernel_16x2_skylakex.c
 DTRMMKERNEL = dgemm_kernel_16x2_skylakex.c
 DGEMMINCOPY = ../generic/gemm_ncopy_16.c
 DGEMMITCOPY = dgemm_tcopy_16_skylakex.c
 DGEMMONCOPY = ../generic/gemm_ncopy_2.c
 DGEMMOTCOPY = ../generic/gemm_tcopy_2.c
 DTRSMKERNEL_RN = ../generic/trsm_kernel_RN.c
+else
+DGEMMKERNEL = dgemm_kernel_4x8_skylakex_2.c
+DGEMMONCOPY = dgemm_ncopy_8_skylakex.c
+DGEMMOTCOPY = dgemm_tcopy_8_skylakex.c
+endif
 DGEMM_SMALL_M_PERMIT = dgemm_small_kernel_permit_skylakex.c
 DGEMM_SMALL_K_NN = dgemm_small_kernel_nn_skylakex.c
 DGEMM_SMALL_K_B0_NN = dgemm_small_kernel_nn_skylakex.c

param.h

Lines changed: 8 additions & 0 deletions
@@ -1669,14 +1669,22 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 #else
 
 #define SGEMM_DEFAULT_UNROLL_M 16
+#ifndef DYNAMIC_ARCH
 #define DGEMM_DEFAULT_UNROLL_M 16
+#else
+#define DGEMM_DEFAULT_UNROLL_M 4
+#endif
 #define QGEMM_DEFAULT_UNROLL_M 2
 #define CGEMM_DEFAULT_UNROLL_M 8
 #define ZGEMM_DEFAULT_UNROLL_M 4
 #define XGEMM_DEFAULT_UNROLL_M 1
 
 #define SGEMM_DEFAULT_UNROLL_N 4
+#ifndef DYNAMIC_ARCH
 #define DGEMM_DEFAULT_UNROLL_N 2
+#else
+#define DGEMM_DEFAULT_UNROLL_N 8
+#endif
 #define QGEMM_DEFAULT_UNROLL_N 2
 #define CGEMM_DEFAULT_UNROLL_N 2
 #define ZGEMM_DEFAULT_UNROLL_N 2

0 commit comments

Comments (0)