Skip to content

Commit a897bc3

Browse files
authored
Merge pull request #99 from xianyi/develop
rebase
2 parents a0ada4b + 756802d commit a897bc3

13 files changed

+1993
-396
lines changed

Makefile.x86_64

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,10 @@ ifdef HAVE_SSE3
1212
ifndef DYNAMIC_ARCH
1313
CCOMMON_OPT += -msse3
1414
FCOMMON_OPT += -msse3
15+
ifdef HAVE_SSSE3
16+
CCOMMON_OPT += -mssse3
17+
FCOMMON_OPT += -mssse3
18+
endif
1519
endif
1620
endif
1721

@@ -60,7 +64,7 @@ endif
6064
endif
6165
endif
6266

63-
ifeq ($(CORE), HASWELL)
67+
ifeq ($(CORE), $(filter $(CORE), HASWELL ZEN SKYLAKEX COOPERLAKE))
6468
ifndef DYNAMIC_ARCH
6569
ifndef NO_AVX2
6670
ifeq ($(C_COMPILER), GCC)

cmake/cc.cmake

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,10 +109,25 @@ if (${CORE} STREQUAL "COOPERLAKE")
109109
if (NOT NO_AVX512)
110110
execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
111111
if (${GCC_VERSION} VERSION_GREATER 10.1 OR ${GCC_VERSION} VERSION_EQUAL 10.1)
112-
set (CCOMMON_OPT = "${CCOMMON_OPT} -march=cooperlake")
112+
set (CCOMMON_OPT "${CCOMMON_OPT} -march=cooperlake")
113113
else ()
114114
set (CCOMMON_OPT "${CCOMMON_OPT} -march=skylake-avx512")
115115
endif()
116116
endif ()
117117
endif ()
118118
endif ()
119+
120+
if (NOT DYNAMIC_ARCH)
121+
if (HAVE_AVX2)
122+
set (CCOMMON_OPT "${CCOMMON_OPT} -mavx2")
123+
endif ()
124+
if (HAVE_AVX)
125+
set (CCOMMON_OPT "${CCOMMON_OPT} -mavx")
126+
endif ()
127+
if (HAVE_SSE3)
128+
set (CCOMMON_OPT "${CCOMMON_OPT} -msse3")
129+
endif ()
130+
if (HAVE_SSSE3)
131+
set (CCOMMON_OPT "${CCOMMON_OPT} -mssse3")
132+
endif ()
133+
endif()

ctest/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ FILE(WRITE ${CMAKE_CURRENT_BINARY_DIR}/test_cblas_helper.sh
1212
foreach(float_type ${FLOAT_TYPES})
1313
string(SUBSTRING ${float_type} 0 1 float_char_upper)
1414
string(TOLOWER ${float_char_upper} float_char)
15-
if (${float_char} STREQUAL "h")
15+
if (${float_char} STREQUAL "b")
1616
continue()
1717
endif()
1818
#level1

kernel/Makefile

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,9 @@ include $(TOPDIR)/Makefile.system
88
ifdef HAVE_SSE3
99
CFLAGS += -msse3
1010
endif
11+
ifdef HAVE_SSSE3
12+
CFLAGS += -mssse3
13+
endif
1114

1215
ifeq ($(C_COMPILER), GCC)
1316
GCCVERSIONGTEQ9 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 9)
@@ -41,8 +44,8 @@ ifdef NO_AVX2
4144
endif
4245

4346
ifdef TARGET_CORE
44-
ifeq ($(TARGET_CORE), $(filter $(TARGET_CORE),PRESCOTT CORE2 PENRYN DUNNINGTON ATOM NANO NEHALEM BARCELONA BOBCAT BULLDOZER PILEDRIVER EXCAVATOR STEAMROLLER OPTERON_SSE3))
45-
override CFLAGS += -msse3
47+
ifeq ($(TARGET_CORE), $(filter $(TARGET_CORE),PRESCOTT CORE2 PENRYN DUNNINGTON ATOM NANO SANDYBRIDGE HASWELL NEHALEM ZEN BARCELONA BOBCAT BULLDOZER PILEDRIVER EXCAVATOR STEAMROLLER OPTERON_SSE3))
48+
override CFLAGS += -msse3 -mssse3
4649
endif
4750
ifeq ($(TARGET_CORE), COOPERLAKE)
4851
override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE)

kernel/power/KERNEL.POWER10

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -9,10 +9,10 @@ else
99

1010
SBGEMM_BETA = ../generic/gemm_beta.c
1111
SBGEMMKERNEL = sbgemm_kernel_power10.c
12-
SBGEMMINCOPY = ../generic/gemm_ncopy_16.c
13-
SBGEMMITCOPY = ../generic/gemm_tcopy_16.c
14-
SBGEMMONCOPY = ../generic/gemm_ncopy_8.c
15-
SBGEMMOTCOPY = ../generic/gemm_tcopy_8.c
12+
SBGEMMINCOPY = sbgemm_ncopy_16_power10.c
13+
SBGEMMITCOPY = sbgemm_tcopy_16_power10.c
14+
SBGEMMONCOPY = sbgemm_ncopy_8_power10.c
15+
SBGEMMOTCOPY = sbgemm_tcopy_8_power10.c
1616
SBGEMMINCOPYOBJ = sbgemm_incopy$(TSUFFIX).$(SUFFIX)
1717
SBGEMMITCOPYOBJ = sbgemm_itcopy$(TSUFFIX).$(SUFFIX)
1818
SBGEMMONCOPYOBJ = sbgemm_oncopy$(TSUFFIX).$(SUFFIX)

0 commit comments

Comments
 (0)