Skip to content

Commit 63d2609

Browse files
authored
Merge pull request #64 from xianyi/develop
rebase
2 parents fdd1b50 + 3a1b58d commit 63d2609

File tree

5 files changed

+26
-19
lines changed

5 files changed

+26
-19
lines changed

Makefile.system

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -797,11 +797,11 @@ endif
797797
ifeq ($(USE_OPENMP), 1)
798798
FCOMMON_OPT += -fopenmp
799799
endif
800-
ifeq ($(OSNAME), Linux)
801-
ifeq ($(ARCH), x86_64)
802-
FLANG_VENDOR := $(shell expr `$(FC) --version|cut -f 1 -d "."|head -1`)
803-
endif
804-
endif
800+
#ifeq ($(OSNAME), Linux)
801+
#ifeq ($(ARCH), x86_64)
802+
#FLANG_VENDOR := $(shell expr `$(FC) --version|cut -f 1 -d "."|head -1`)
803+
#endif
804+
#endif
805805
endif
806806

807807
ifeq ($(F_COMPILER), G77)
@@ -1276,7 +1276,8 @@ endif
12761276

12771277
override CFLAGS += $(COMMON_OPT) $(CCOMMON_OPT) -I$(TOPDIR)
12781278
override PFLAGS += $(COMMON_OPT) $(CCOMMON_OPT) -I$(TOPDIR) -DPROFILE $(COMMON_PROF)
1279-
ifeq ($(FLANG_VENDOR),AOCC)
1279+
#ifeq ($(FLANG_VENDOR),AOCC)
1280+
ifeq ($(F_COMPILER),FLANG)
12801281
override FFLAGS += $(filter-out -O2 -O3,$(COMMON_OPT)) -O1 $(FCOMMON_OPT)
12811282
else
12821283
override FFLAGS += $(COMMON_OPT) $(FCOMMON_OPT)

cmake/fc.cmake

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -16,6 +16,7 @@ if (${F_COMPILER} STREQUAL "FLANG")
1616
if (USE_OPENMP)
1717
set(FCOMMON_OPT "${FCOMMON_OPT} -fopenmp")
1818
endif ()
19+
set(FCOMMON_OPT "${FCOMMON_OPT} -frecursive")
1920
endif ()
2021

2122
if (${F_COMPILER} STREQUAL "G77")

cmake/system.cmake

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -417,6 +417,15 @@ if (${CMAKE_C_COMPILER} STREQUAL "LSB" OR ${CMAKE_SYSTEM_NAME} STREQUAL "Windows
417417
set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DLAPACK_COMPLEX_STRUCTURE")
418418
endif ()
419419

420+
if ("${CMAKE_BUILD_TYPE}" STREQUAL "Release")
421+
if ("${F_COMPILER}" STREQUAL "FLANG")
422+
set(FILTER_FLAGS "-O2;-O3")
423+
foreach (FILTER_FLAG ${FILTER_FLAGS})
424+
string(REPLACE ${FILTER_FLAG} "-O1" CMAKE_Fortran_FLAGS_RELEASE ${CMAKE_Fortran_FLAGS_RELEASE})
425+
endforeach ()
426+
endif ()
427+
endif ()
428+
420429
if (NOT DEFINED SUFFIX)
421430
set(SUFFIX o)
422431
endif ()

exports/Makefile

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -155,8 +155,12 @@ ifeq ($(F_COMPILER), INTEL)
155155
-Wl,--whole-archive $< -Wl,--no-whole-archive \
156156
-Wl,-soname,$(INTERNALNAME) $(EXTRALIB)
157157
$(CC) $(CFLAGS) $(LDFLAGS) -w -o linktest linktest.c ../$(LIBSONAME) $(FEXTRALIB) && echo OK.
158+
else ifeq ($(F_COMPILER), FLANG)
159+
$(FC) $(FFLAGS) $(LDFLAGS) -shared -o ../$(LIBSONAME) \
160+
-Wl,--whole-archive $< -Wl,--no-whole-archive \
161+
-Wl,-soname,$(INTERNALNAME) $(EXTRALIB)
162+
$(CC) $(CFLAGS) $(LDFLAGS) -w -o linktest linktest.c ../$(LIBSONAME) $(FEXTRALIB) && echo OK.
158163
else
159-
160164
ifneq ($(C_COMPILER), LSB)
161165
$(CC) $(CFLAGS) $(LDFLAGS) -shared -o ../$(LIBSONAME) \
162166
-Wl,--whole-archive $< -Wl,--no-whole-archive \

kernel/arm64/sgemm_kernel_8x8_cortexa53.S

Lines changed: 4 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -681,12 +681,12 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
681681
.macro INIT8x4
682682
fmov s16, wzr
683683
fmov s17, wzr
684+
fmov s18, wzr
685+
fmov s19, s16
684686
fmov s20, wzr
685687
fmov s21, s16
686-
fmov s24, wzr
687-
fmov s25, s16
688-
fmov s28, wzr
689-
fmov s29, s16
688+
fmov s22, wzr
689+
fmov s23, s16
690690
.endm
691691

692692
.macro KERNEL8x4_I
@@ -765,14 +765,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
765765
fmla v21.4s, v3.4s, v6.s[2]
766766
fmla v22.4s, v2.4s, v6.s[3]
767767
fmla v23.4s, v3.4s, v6.s[3]
768-
fmla v24.4s, v2.4s, v7.s[0]
769-
fmla v25.4s, v3.4s, v7.s[0]
770-
fmla v26.4s, v2.4s, v7.s[1]
771-
fmla v27.4s, v3.4s, v7.s[1]
772-
fmla v28.4s, v2.4s, v7.s[2]
773-
fmla v29.4s, v3.4s, v7.s[2]
774-
fmla v30.4s, v2.4s, v7.s[3]
775-
fmla v31.4s, v3.4s, v7.s[3]
776768
.endm
777769

778770
.macro KERNEL8x4_SUB

0 commit comments

Comments
 (0)