Skip to content

Commit 3853014

Browse files
authored
Merge pull request #1 from xianyi/develop
rebase
2 parents 52ed274 + f216186 commit 3853014

17 files changed

+1274
-205
lines changed

.travis.yml

Lines changed: 20 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -211,44 +211,48 @@ matrix:
211211

212212
- &test-macos
213213
os: osx
214-
osx_image: xcode10.1
214+
osx_image: xcode11.5
215215
before_script:
216216
- COMMON_FLAGS="DYNAMIC_ARCH=1 NUM_THREADS=32"
217-
- brew update
218-
- brew install gcc@8 # for gfortran
219217
script:
220218
- travis_wait 45 make QUIET_MAKE=1 $COMMON_FLAGS $BTYPE
221219
env:
222-
- BTYPE="TARGET=NEHALEM BINARY=64 INTERFACE64=1 FC=gfortran-8"
220+
- BTYPE="TARGET=NEHALEM BINARY=64 INTERFACE64=1 FC=gfortran-9"
223221

224222
- <<: *test-macos
225223
osx_image: xcode12
226224
before_script:
227225
- COMMON_FLAGS="DYNAMIC_ARCH=1 NUM_THREADS=32"
228226
- brew update
229-
- brew install gcc@10 # for gfortran
227+
- brew install gcc@10
230228
script:
231229
- travis_wait 45 make QUIET_MAKE=1 $COMMON_FLAGS $BTYPE
232230
env:
233231
- BTYPE="TARGET=NEHALEM BINARY=64 INTERFACE64=1 FC=gfortran-10"
234232

235-
- <<: *test-macos
236-
osx_image: xcode10.0
237-
env:
238-
- BTYPE="TARGET=NEHALEM BINARY=32 NOFORTRAN=1"
233+
# - <<: *test-macos
234+
# osx_image: xcode10
235+
# env:
236+
# - BTYPE="TARGET=NEHALEM BINARY=32 NOFORTRAN=1"
239237

240238
- <<: *test-macos
241-
osx_image: xcode10.1
239+
osx_image: xcode11.5
240+
before_script:
241+
- COMMON_FLAGS="DYNAMIC_ARCH=1 NUM_THREADS=32"
242+
- brew update
242243
env:
243-
- CC="/Applications/Xcode-10.1.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
244-
- CFLAGS="-O2 -Wno-macro-redefined -isysroot /Applications/Xcode-10.1.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS12.1.sdk -arch arm64 -miphoneos-version-min=10.0"
244+
# - CC="/Applications/Xcode-10.1.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
245+
# - CFLAGS="-O2 -Wno-macro-redefined -isysroot /Applications/Xcode-10.1.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS12.1.sdk -arch arm64 -miphoneos-version-min=10.0"
246+
- CC="/Applications/Xcode-11.5.GM.Seed.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
247+
- CFLAGS="-O2 -Wno-macro-redefined -isysroot /Applications/Xcode-11.5.GM.Seed.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS13.5.sdk -arch arm64 -miphoneos-version-min=10.0"
245248
- BTYPE="TARGET=ARMV8 BINARY=64 HOSTCC=clang NOFORTRAN=1"
246-
247249
- <<: *test-macos
248-
osx_image: xcode10.1
250+
osx_image: xcode11.5
249251
env:
250-
- CC="/Applications/Xcode-10.1.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
251-
- CFLAGS="-O2 -mno-thumb -Wno-macro-redefined -isysroot /Applications/Xcode-10.1.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS12.1.sdk -arch armv7 -miphoneos-version-min=5.1"
252+
# - CC="/Applications/Xcode-10.1.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
253+
# - CFLAGS="-O2 -mno-thumb -Wno-macro-redefined -isysroot /Applications/Xcode-10.1.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS12.1.sdk -arch armv7 -miphoneos-version-min=5.1"
254+
- CC="/Applications/Xcode-11.5.GM.Seed.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/clang"
255+
- CFLAGS="-O2 -mno-thumb -Wno-macro-redefined -isysroot /Applications/Xcode-11.5.GM.Seed.app/Contents/Developer/Platforms/iPhoneOS.platform/Developer/SDKs/iPhoneOS13.5.sdk -arch armv7 -miphoneos-version-min=5.1"
252256
- BTYPE="TARGET=ARMV7 HOSTCC=clang NOFORTRAN=1"
253257

254258
- &test-graviton2

Makefile

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -268,7 +268,11 @@ ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
268268
-@echo "POPTS = $(LAPACK_FPFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
269269
-@echo "FFLAGS_NOOPT = -O0 $(LAPACK_NOOPT)" >> $(NETLIB_LAPACK_DIR)/make.inc
270270
-@echo "PNOOPT = $(LAPACK_FPFLAGS) -O0" >> $(NETLIB_LAPACK_DIR)/make.inc
271+
ifeq ($(C_COMPILER)$(F_COMPILER)$(USE_OPENMP), CLANGGFORTRAN1)
272+
-@echo "LDFLAGS = $(FFLAGS) $(EXTRALIB) -lomp" >> $(NETLIB_LAPACK_DIR)/make.inc
273+
else
271274
-@echo "LDFLAGS = $(FFLAGS) $(EXTRALIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
275+
endif
272276
-@echo "CC = $(CC)" >> $(NETLIB_LAPACK_DIR)/make.inc
273277
-@echo "override CFLAGS = $(LAPACK_CFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
274278
-@echo "AR = $(AR)" >> $(NETLIB_LAPACK_DIR)/make.inc

Makefile.system

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1561,6 +1561,7 @@ export KERNELDIR
15611561
export FUNCTION_PROFILE
15621562
export TARGET_CORE
15631563
export NO_AVX512
1564+
export NO_AVX2
15641565
export BUILD_BFLOAT16
15651566

15661567
export SBGEMM_UNROLL_M

Makefile.x86

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -59,9 +59,11 @@ LIBATLAS = -L$(ATLASPATH)/32 -lcblas -lf77blas -latlas -lm
5959
else
6060
LIBATLAS = -L$(ATLASPATH)/32 -lptf77blas -lptatlas -lpthread -lm
6161
endif
62-
62+
ifdef HAVE_SSE2
63+
CCOMMON_OPT += -msse2
64+
FCOMMON_OPT += -msse2
65+
endif
6366
ifdef HAVE_SSE3
64-
ifndef DYNAMIC_ARCH
6567
CCOMMON_OPT += -msse3
6668
FCOMMON_OPT += -msse3
6769
ifdef HAVE_SSSE3
@@ -73,5 +75,4 @@ CCOMMON_OPT += -msse4.1
7375
FCOMMON_OPT += -msse4.1
7476
endif
7577
endif
76-
endif
7778

Makefile.x86_64

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,18 +20,24 @@ ifdef HAVE_SSE4_1
2020
CCOMMON_OPT += -msse4.1
2121
FCOMMON_OPT += -msse4.1
2222
endif
23+
ifndef OLDGCC
2324
ifdef HAVE_AVX
2425
CCOMMON_OPT += -mavx
2526
FCOMMON_OPT += -mavx
2627
endif
28+
endif
29+
ifndef NO_AVX2
2730
ifdef HAVE_AVX2
2831
CCOMMON_OPT += -mavx2
2932
FCOMMON_OPT += -mavx2
3033
endif
34+
endif
35+
ifndef OLDGCC
3136
ifdef HAVE_FMA3
3237
CCOMMON_OPT += -mfma
3338
FCOMMON_OPT += -mfma
3439
endif
40+
endif
3541

3642
ifeq ($(CORE), SKYLAKEX)
3743
ifndef DYNAMIC_ARCH

c_check

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -276,6 +276,15 @@ if ($data =~ /HAVE_C11/) {
276276
}
277277
}
278278

279+
if ($compiler eq "GCC" &&( ($architecture eq "x86") || ($architecture eq "x86_64"))) {
280+
$no_avx2 = 0;
281+
$oldgcc = 0;
282+
$data = `$compiler_name -dumpversion`;
283+
if ($data <= 4.6) {
284+
$no_avx2 = 1;
285+
$oldgcc = 1;
286+
}
287+
}
279288

280289
$data = `$compiler_name $flags -S ctest1.c && grep globl ctest1.s | head -n 1 && rm -f ctest1.s`;
281290

@@ -368,6 +377,8 @@ print MAKEFILE "CEXTRALIB=$linker_L $linker_l $linker_a\n";
368377
print MAKEFILE "HAVE_MSA=1\n" if $have_msa eq 1;
369378
print MAKEFILE "MSA_FLAGS=$msa_flags\n" if $have_msa eq 1;
370379
print MAKEFILE "NO_AVX512=1\n" if $no_avx512 eq 1;
380+
print MAKEFILE "NO_AVX2=1\n" if $no_avx2 eq 1;
381+
print MAKEFILE "OLDGCC=1\n" if $oldgcc eq 1;
371382

372383
$os =~ tr/[a-z]/[A-Z]/;
373384
$architecture =~ tr/[a-z]/[A-Z]/;

f_check

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -330,6 +330,9 @@ if ($link ne "") {
330330
$flags =~ s/\@/\,/g;
331331
$linker_L .= "-Wl,". $flags . " " ;
332332
}
333+
if ($flags =~ /-lgomp/ && $CC =~ /clang/) {
334+
$flags = "-lomp";
335+
}
333336

334337
if (
335338
($flags =~ /^\-l/)

getarch.c

Lines changed: 55 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -326,6 +326,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
326326
#define FORCE
327327
#define FORCE_INTEL
328328
#define ARCHITECTURE "X86"
329+
#ifdef NO_AVX2
330+
#define SUBARCHITECTURE "SANDYBRIDGE"
331+
#define ARCHCONFIG "-DSANDYBRIDGE " \
332+
"-DL1_DATA_SIZE=32768 -DL1_DATA_LINESIZE=64 " \
333+
"-DL2_SIZE=262144 -DL2_LINESIZE=64 " \
334+
"-DDTB_DEFAULT_ENTRIES=64 -DDTB_SIZE=4096 " \
335+
"-DHAVE_CMOV -DHAVE_MMX -DHAVE_SSE -DHAVE_SSE2 -DHAVE_SSE3 -DHAVE_SSSE3 -DHAVE_SSE4_1 -DHAVE_SSE4_2 -DHAVE_AVX"
336+
#define LIBNAME "sandybridge"
337+
#define CORENAME "SANDYBRIDGE"
338+
#else
329339
#define SUBARCHITECTURE "HASWELL"
330340
#define ARCHCONFIG "-DHASWELL " \
331341
"-DL1_DATA_SIZE=32768 -DL1_DATA_LINESIZE=64 " \
@@ -336,6 +346,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
336346
#define LIBNAME "haswell"
337347
#define CORENAME "HASWELL"
338348
#endif
349+
#endif
339350

340351
#ifdef FORCE_SKYLAKEX
341352
#ifdef NO_AVX512
@@ -551,6 +562,16 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
551562
#define FORCE
552563
#define FORCE_INTEL
553564
#define ARCHITECTURE "X86"
565+
#ifdef NO_AVX2
566+
#define SUBARCHITECTURE "SANDYBRIDGE"
567+
#define ARCHCONFIG "-DSANDYBRIDGE " \
568+
"-DL1_DATA_SIZE=32768 -DL1_DATA_LINESIZE=64 " \
569+
"-DL2_SIZE=262144 -DL2_LINESIZE=64 " \
570+
"-DDTB_DEFAULT_ENTRIES=64 -DDTB_SIZE=4096 " \
571+
"-DHAVE_CMOV -DHAVE_MMX -DHAVE_SSE -DHAVE_SSE2 -DHAVE_SSE3 -DHAVE_SSSE3 -DHAVE_SSE4_1 -DHAVE_SSE4_2 -DHAVE_AVX"
572+
#define LIBNAME "sandybridge"
573+
#define CORENAME "SANDYBRIDGE"
574+
#else
554575
#define SUBARCHITECTURE "ZEN"
555576
#define ARCHCONFIG "-DZEN " \
556577
"-DL1_CODE_SIZE=32768 -DL1_CODE_LINESIZE=64 -DL1_CODE_ASSOCIATIVE=8 " \
@@ -565,6 +586,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
565586
#define LIBNAME "zen"
566587
#define CORENAME "ZEN"
567588
#endif
589+
#endif
568590

569591

570592
#ifdef FORCE_SSE_GENERIC
@@ -983,6 +1005,20 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
9831005
#else
9841006
#endif
9851007

1008+
#ifdef FORCE_RISCV64_GENERIC
1009+
#define FORCE
1010+
#define ARCHITECTURE "RISCV64"
1011+
#define SUBARCHITECTURE "RISCV64_GENERIC"
1012+
#define SUBDIRNAME "riscv64"
1013+
#define ARCHCONFIG "-DRISCV64_GENERIC " \
1014+
"-DL1_DATA_SIZE=32768 -DL1_DATA_LINESIZE=32 " \
1015+
"-DL2_SIZE=1048576 -DL2_LINESIZE=32 " \
1016+
"-DDTB_DEFAULT_ENTRIES=128 -DDTB_SIZE=4096 -DL2_ASSOCIATIVE=4 "
1017+
#define LIBNAME "riscv64_generic"
1018+
#define CORENAME "RISCV64_GENERIC"
1019+
#else
1020+
#endif
1021+
9861022
#ifdef FORCE_CORTEXA15
9871023
#define FORCE
9881024
#define ARCHITECTURE "ARM"
@@ -1268,6 +1304,21 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
12681304
#define CORENAME "Z14"
12691305
#endif
12701306

1307+
#ifdef FORCE_C910V
1308+
#define FORCE
1309+
#define ARCHITECTURE "RISCV64"
1310+
#define SUBARCHITECTURE "C910V"
1311+
#define SUBDIRNAME "riscv64"
1312+
#define ARCHCONFIG "-DC910V " \
1313+
"-DL1_DATA_SIZE=32768 -DL1_DATA_LINESIZE=32 " \
1314+
"-DL2_SIZE=1048576 -DL2_LINESIZE=32 " \
1315+
"-DDTB_DEFAULT_ENTRIES=128 -DDTB_SIZE=4096 -DL2_ASSOCIATIVE=4 "
1316+
#define LIBNAME "c910v"
1317+
#define CORENAME "C910V"
1318+
#else
1319+
#endif
1320+
1321+
12711322
#ifndef FORCE
12721323

12731324
#ifdef USER_TARGET
@@ -1322,6 +1373,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
13221373
#define OPENBLAS_SUPPORTED
13231374
#endif
13241375

1376+
#ifdef __riscv
1377+
#include "cpuid_riscv64.c"
1378+
#endif
1379+
13251380
#ifdef __arm__
13261381
#include "cpuid_arm.c"
13271382
#define OPENBLAS_SUPPORTED

0 commit comments

Comments
 (0)