Skip to content

Commit 3aecafa

Browse files
authored
Change "HALF" and "sh" to "BFLOAT16" and "sb"
1 parent 756062a commit 3aecafa

File tree

4 files changed

+125
-125
lines changed

4 files changed

+125
-125
lines changed

kernel/CMakeLists.txt

Lines changed: 14 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -41,8 +41,8 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
4141
foreach (float_type ${FLOAT_TYPES})
4242
# a bit of metaprogramming here to pull out the appropriate KERNEL var
4343
string(SUBSTRING ${float_type} 0 1 float_char)
44-
if (${float_type} STREQUAL "HALF")
45-
set (float_char "SH")
44+
if (${float_type} STREQUAL "BFLOAT16")
45+
set (float_char "SB")
4646
endif ()
4747
GenerateNamedObjects("${KERNELDIR}/${${float_char}AMAXKERNEL}" "USE_ABS" "amax_k" false "" "" false ${float_type})
4848
GenerateNamedObjects("${KERNELDIR}/${${float_char}AMINKERNEL}" "USE_ABS;USE_MIN" "amin_k" false "" "" false ${float_type})
@@ -149,8 +149,8 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
149149
GenerateNamedObjects("generic/ger.c" "" "ger_k" false "" "" "" 3)
150150
foreach (float_type ${FLOAT_TYPES})
151151
string(SUBSTRING ${float_type} 0 1 float_char)
152-
if (${float_type} STREQUAL "HALF")
153-
set (float_char "SH")
152+
if (${float_type} STREQUAL "BFLOAT16")
153+
set (float_char "SB")
154154
endif ()
155155
if (${float_type} STREQUAL "COMPLEX" OR ${float_type} STREQUAL "ZCOMPLEX")
156156
GenerateNamedObjects("${KERNELDIR}/${${float_char}GERUKERNEL}" "" "geru_k" false "" "" false ${float_type})
@@ -208,13 +208,13 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
208208
GenerateNamedObjects("${KERNELDIR}/${SGEMMDIRECTPERFORMANT}" "" "gemm_direct_performant" false "" "" false SINGLE)
209209
endif()
210210

211-
foreach (float_type SINGLE DOUBLE HALF)
211+
foreach (float_type SINGLE DOUBLE BFLOAT16)
212212
string(SUBSTRING ${float_type} 0 1 float_char)
213-
if (${float_type} STREQUAL "HALF")
214-
if (NOT ${BUILD_HALF})
213+
if (${float_type} STREQUAL "BFLOAT16")
214+
if (NOT ${BUILD_BFLOAT16})
215215
continue ()
216216
else ()
217-
set (float_char "SH")
217+
set (float_char "SB")
218218
endif ()
219219
endif ()
220220
GenerateNamedObjects("${KERNELDIR}/${${float_char}GEMMKERNEL}" "" "gemm_kernel" false "" "" false ${float_type})
@@ -254,8 +254,8 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
254254

255255
foreach (float_type ${FLOAT_TYPES})
256256
string(SUBSTRING ${float_type} 0 1 float_char)
257-
if (${float_type} STREQUAL "HALF")
258-
set (float_char "SH")
257+
if (${float_type} STREQUAL "BFLOAT16")
258+
set (float_char "SB")
259259
endif ()
260260
if (${float_char}GEMMINCOPY)
261261
GenerateNamedObjects("${KERNELDIR}/${${float_char}GEMMINCOPY}" "${float_type}" "${${float_char}GEMMINCOPYOBJ}" false "" "" true ${float_type})
@@ -620,8 +620,8 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
620620
# Makefile.LA
621621
if(NOT NO_LAPACK)
622622
foreach (float_type ${FLOAT_TYPES})
623-
if (${float_type} STREQUAL "HALF")
624-
set (float_char "SH")
623+
if (${float_type} STREQUAL "BFLOAT16")
624+
set (float_char "SB")
625625
endif ()
626626
if (NOT DEFINED ${float_char}NEG_TCOPY)
627627
if (${float_char} STREQUAL "Z" OR ${float_char} STREQUAL "C" OR ${float_char} STREQUAL "X")
@@ -688,8 +688,8 @@ function (build_core TARGET_CORE KDIR TSUFFIX KERNEL_DEFINITIONS)
688688
foreach (float_type ${FLOAT_TYPES})
689689
# a bit of metaprogramming here to pull out the appropriate KERNEL var
690690
string(SUBSTRING ${float_type} 0 1 float_char)
691-
if (${float_type} STREQUAL "HALF")
692-
set (float_char "SH")
691+
if (${float_type} STREQUAL "BFLOAT16")
692+
set (float_char "SB")
693693
endif ()
694694
GenerateNamedObjects("generic/neg_tcopy_${${float_char}GEMM_UNROLL_M}.c" "" "neg_tcopy" false "" ${TSUFFIX} false ${float_type})
695695
GenerateNamedObjects("generic/laswp_ncopy_${${float_char}GEMM_UNROLL_N}.c" "" "laswp_ncopy" false "" ${TSUFFIX} false ${float_type})

kernel/Makefile.L1

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -262,9 +262,9 @@ ifndef XDOTKERNEL
262262
XDOTKERNEL = zdot.S
263263
endif
264264

265-
ifeq ($(BUILD_HALF),1)
266-
ifndef SHDOTKERNEL
267-
SHDOTKERNEL = ../x86_64/shdot.c
265+
ifeq ($(BUILD_BFLOAT16),1)
266+
ifndef SBDOTKERNEL
267+
SBDOTKERNEL = ../x86_64/sbdot.c
268268
endif
269269

270270
ifndef TOBF16KERNEL
@@ -530,11 +530,11 @@ XBLASOBJS += \
530530
xdotc_k$(TSUFFIX).$(SUFFIX) xdotu_k$(TSUFFIX).$(SUFFIX) xnrm2_k$(TSUFFIX).$(SUFFIX) xqrot_k$(TSUFFIX).$(SUFFIX) \
531531
xscal_k$(TSUFFIX).$(SUFFIX) xswap_k$(TSUFFIX).$(SUFFIX) xsum_k$(TSUFFIX).$(SUFFIX)
532532

533-
ifeq ($(BUILD_HALF),1)
533+
ifeq ($(BUILD_BFLOAT16),1)
534534
SHBLASOBJS += \
535-
shdot_k$(TSUFFIX).$(SUFFIX)
535+
sbdot_k$(TSUFFIX).$(SUFFIX)
536536
SHEXTOBJS += \
537-
shstobf16_k$(TSUFFIX).$(SUFFIX) shdtobf16_k$(TSUFFIX).$(SUFFIX)
537+
sbstobf16_k$(TSUFFIX).$(SUFFIX) sbdtobf16_k$(TSUFFIX).$(SUFFIX)
538538
SHEXTOBJS += \
539539
sbf16tos_k$(TSUFFIX).$(SUFFIX) dbf16tod_k$(TSUFFIX).$(SUFFIX)
540540
endif
@@ -757,12 +757,12 @@ $(KDIR)ddot_k$(TSUFFIX).$(SUFFIX) $(KDIR)ddot_k$(TPSUFFIX).$(PSUFFIX) : $(KERNEL
757757
$(KDIR)qdot_k$(TSUFFIX).$(SUFFIX) $(KDIR)qdot_k$(TPSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(QDOTKERNEL)
758758
$(CC) -c $(CFLAGS) -UCOMPLEX -DXDOUBLE $< -o $@
759759

760-
ifeq ($(BUILD_HALF),1)
761-
$(KDIR)shdot_k$(TSUFFIX).$(SUFFIX) $(KDIR)shdot_k$(TPSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SHDOTKERNEL)
760+
ifeq ($(BUILD_BFLOAT16),1)
761+
$(KDIR)sbdot_k$(TSUFFIX).$(SUFFIX) $(KDIR)sbdot_k$(TPSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SBDOTKERNEL)
762762
$(CC) -c $(CFLAGS) -UCOMPLEX $< -o $@
763-
$(KDIR)shstobf16_k$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(TOBF16KERNEL)
763+
$(KDIR)sbstobf16_k$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(TOBF16KERNEL)
764764
$(CC) -c $(CFLAGS) -UDOUBLE -DSINGLE $< -o $@
765-
$(KDIR)shdtobf16_k$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(TOBF16KERNEL)
765+
$(KDIR)sbdtobf16_k$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(TOBF16KERNEL)
766766
$(CC) -c $(CFLAGS) -DDOUBLE -USINGLE $< -o $@
767767
$(KDIR)sbf16tos_k$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(BF16TOKERNEL)
768768
$(CC) -c $(CFLAGS) -UDOUBLE -DSINGLE $< -o $@

kernel/Makefile.L3

Lines changed: 67 additions & 67 deletions
Original file line number | Diff line number | Diff line change
@@ -80,24 +80,24 @@ SGEMMDIRECTPERFORMANT = sgemm_direct_performant.c
8080
endif
8181
endif
8282

83-
ifeq ($(BUILD_HALF), 1)
84-
ifndef SHGEMMKERNEL
85-
SHGEMM_BETA = ../generic/gemm_beta.c
86-
SHGEMMKERNEL = ../generic/gemmkernel_2x2.c
87-
SHGEMMINCOPY = ../generic/gemm_ncopy_2.c
88-
SHGEMMITCOPY = ../generic/gemm_tcopy_2.c
89-
SHGEMMONCOPY = ../generic/gemm_ncopy_2.c
90-
SHGEMMOTCOPY = ../generic/gemm_tcopy_2.c
91-
SHGEMMINCOPYOBJ = shgemm_incopy$(TSUFFIX).$(SUFFIX)
92-
SHGEMMITCOPYOBJ = shgemm_itcopy$(TSUFFIX).$(SUFFIX)
93-
SHGEMMONCOPYOBJ = shgemm_oncopy$(TSUFFIX).$(SUFFIX)
94-
SHGEMMOTCOPYOBJ = shgemm_otcopy$(TSUFFIX).$(SUFFIX)
83+
ifeq ($(BUILD_BFLOAT16), 1)
84+
ifndef SBGEMMKERNEL
85+
SBGEMM_BETA = ../generic/gemm_beta.c
86+
SBGEMMKERNEL = ../generic/gemmkernel_2x2.c
87+
SBGEMMINCOPY = ../generic/gemm_ncopy_2.c
88+
SBGEMMITCOPY = ../generic/gemm_tcopy_2.c
89+
SBGEMMONCOPY = ../generic/gemm_ncopy_2.c
90+
SBGEMMOTCOPY = ../generic/gemm_tcopy_2.c
91+
SBGEMMINCOPYOBJ = sbgemm_incopy$(TSUFFIX).$(SUFFIX)
92+
SBGEMMITCOPYOBJ = sbgemm_itcopy$(TSUFFIX).$(SUFFIX)
93+
SBGEMMONCOPYOBJ = sbgemm_oncopy$(TSUFFIX).$(SUFFIX)
94+
SBGEMMOTCOPYOBJ = sbgemm_otcopy$(TSUFFIX).$(SUFFIX)
9595
endif
9696

9797
SHKERNELOBJS += \
98-
shgemm_kernel$(TSUFFIX).$(SUFFIX) \
99-
$(SHGEMMINCOPYOBJ) $(SHGEMMITCOPYOBJ) \
100-
$(SHGEMMONCOPYOBJ) $(SHGEMMOTCOPYOBJ)
98+
sbgemm_kernel$(TSUFFIX).$(SUFFIX) \
99+
$(SBGEMMINCOPYOBJ) $(SBGEMMITCOPYOBJ) \
100+
$(SBGEMMONCOPYOBJ) $(SBGEMMOTCOPYOBJ)
101101
endif
102102

103103
ifneq "$(or $(BUILD_SINGLE),$(BUILD_DOUBLE),$(BUILD_COMPLEX))" ""
@@ -149,7 +149,7 @@ XKERNELOBJS += \
149149
$(XGEMMINCOPYOBJ) $(XGEMMITCOPYOBJ) \
150150
$(XGEMMONCOPYOBJ) $(XGEMMOTCOPYOBJ)
151151

152-
ifeq ($(BUILD_HALF),1)
152+
ifeq ($(BUILD_BFLOAT16),1)
153153
SHBLASOBJS += $(SHKERNELOBJS)
154154
endif
155155
SBLASOBJS += $(SKERNELOBJS)
@@ -159,8 +159,8 @@ CBLASOBJS += $(CKERNELOBJS)
159159
ZBLASOBJS += $(ZKERNELOBJS)
160160
XBLASOBJS += $(XKERNELOBJS)
161161

162-
ifeq ($(BUILD_HALF),1)
163-
SHBLASOBJS += shgemm_beta$(TSUFFIX).$(SUFFIX)
162+
ifeq ($(BUILD_BFLOAT16),1)
163+
SHBLASOBJS += sbgemm_beta$(TSUFFIX).$(SUFFIX)
164164
endif
165165

166166
ifneq "$(or $(BUILD_SINGLE),$(BUILD_DOUBLE))" ""
@@ -492,11 +492,11 @@ ZBLASOBJS += \
492492
zgeadd_k$(TSUFFIX).$(SUFFIX)
493493
endif
494494

495-
ifeq ($(BUILD_HALF), 1)
496-
SHGEMMINCOPYOBJ_P = $(SHGEMMINCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
497-
SHGEMMITCOPYOBJ_P = $(SHGEMMITCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
498-
SHGEMMONCOPYOBJ_P = $(SHGEMMONCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
499-
SHGEMMOTCOPYOBJ_P = $(SHGEMMOTCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
495+
ifeq ($(BUILD_BFLOAT16), 1)
496+
SBGEMMINCOPYOBJ_P = $(SBGEMMINCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
497+
SBGEMMITCOPYOBJ_P = $(SBGEMMITCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
498+
SBGEMMONCOPYOBJ_P = $(SBGEMMONCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
499+
SBGEMMOTCOPYOBJ_P = $(SBGEMMOTCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
500500
endif
501501

502502
SGEMMINCOPYOBJ_P = $(SGEMMINCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
@@ -524,9 +524,9 @@ XGEMMITCOPYOBJ_P = $(XGEMMITCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
524524
XGEMMONCOPYOBJ_P = $(XGEMMONCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
525525
XGEMMOTCOPYOBJ_P = $(XGEMMOTCOPYOBJ:.$(SUFFIX)=.$(PSUFFIX))
526526

527-
ifeq ($(BUILD_HALF),1)
528-
$(KDIR)shgemm_beta$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SHGEMM_BETA)
529-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
527+
ifeq ($(BUILD_BFLOAT16),1)
528+
$(KDIR)sbgemm_beta$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SBGEMM_BETA)
529+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
530530
endif
531531

532532
$(KDIR)sgemm_beta$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SGEMM_BETA)
@@ -548,35 +548,35 @@ $(KDIR)xgemm_beta$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(XGEMM_BETA)
548548
$(CC) $(CFLAGS) -c -DXDOUBLE -DCOMPLEX $< -o $@
549549

550550

551-
ifeq ($(BUILD_HALF), 1)
551+
ifeq ($(BUILD_BFLOAT16), 1)
552552

553-
$(KDIR)$(SHGEMMONCOPYOBJ) : $(KERNELDIR)/$(SHGEMMONCOPY)
554-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
553+
$(KDIR)$(SBGEMMONCOPYOBJ) : $(KERNELDIR)/$(SBGEMMONCOPY)
554+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
555555

556-
$(KDIR)$(SHGEMMOTCOPYOBJ) : $(KERNELDIR)/$(SHGEMMOTCOPY)
556+
$(KDIR)$(SBGEMMOTCOPYOBJ) : $(KERNELDIR)/$(SBGEMMOTCOPY)
557557

558558
ifeq ($(OS), AIX)
559-
$(CC) $(CFLAGS) -S -DHALF -UDOUBLE -UCOMPLEX $< -o - > shgemmotcopy.s
560-
m4 shgemmotcopy.s > shgemmotcopy_nomacros.s
561-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX shgemmotcopy_nomacros.s -o $@
562-
rm shgemmotcopy.s shgemmotcopy_nomacros.s
559+
$(CC) $(CFLAGS) -S -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o - > sbgemmotcopy.s
560+
m4 sbgemmotcopy.s > sbgemmotcopy_nomacros.s
561+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX sbgemmotcopy_nomacros.s -o $@
562+
rm sbgemmotcopy.s sbgemmotcopy_nomacros.s
563563
else
564-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
564+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
565565
endif
566566

567-
ifneq ($(SHGEMM_UNROLL_M), $(SHGEMM_UNROLL_N))
567+
ifneq ($(SBGEMM_UNROLL_M), $(SBGEMM_UNROLL_N))
568568

569-
$(KDIR)$(SHGEMMINCOPYOBJ) : $(KERNELDIR)/$(SHGEMMINCOPY)
570-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
569+
$(KDIR)$(SBGEMMINCOPYOBJ) : $(KERNELDIR)/$(SBGEMMINCOPY)
570+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
571571

572-
$(KDIR)$(SHGEMMITCOPYOBJ) : $(KERNELDIR)/$(SHGEMMITCOPY)
572+
$(KDIR)$(SBGEMMITCOPYOBJ) : $(KERNELDIR)/$(SBGEMMITCOPY)
573573
ifeq ($(OS), AIX)
574-
$(CC) $(CFLAGS) -S -DHALF -UDOUBLE -UCOMPLEX $< -o - > shgemmitcopy.s
575-
m4 shgemmitcopy.s > shgemmitcopy_nomacros.s
576-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX shgemmitcopy_nomacros.s -o $@
577-
rm shgemmitcopy.s shgemmitcopy_nomacros.s
574+
$(CC) $(CFLAGS) -S -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o - > sbgemmitcopy.s
575+
m4 sbgemmitcopy.s > sbgemmitcopy_nomacros.s
576+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX sbgemmitcopy_nomacros.s -o $@
577+
rm sbgemmitcopy.s sbgemmitcopy_nomacros.s
578578
else
579-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
579+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
580580
endif
581581

582582
endif
@@ -746,16 +746,16 @@ $(KDIR)sgemm_direct$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SGEMMDIRECTKERNEL)
746746
$(CC) $(CFLAGS) -c -UDOUBLE -UCOMPLEX $< -o $@
747747
endif
748748

749-
ifeq ($(BUILD_HALF), 1)
749+
ifeq ($(BUILD_BFLOAT16), 1)
750750

751-
$(KDIR)shgemm_kernel$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SHGEMMKERNEL) $(SHGEMMDEPEND)
751+
$(KDIR)sbgemm_kernel$(TSUFFIX).$(SUFFIX) : $(KERNELDIR)/$(SBGEMMKERNEL) $(SBGEMMDEPEND)
752752
ifeq ($(OS), AIX)
753-
$(CC) $(CFLAGS) -S -DHALF -UDOUBLE -UCOMPLEX $< -o - > shgemm_kernel$(TSUFFIX).s
754-
m4 shgemm_kernel$(TSUFFIX).s > shgemm_kernel$(TSUFFIX)_nomacros.s
755-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX shgemm_kernel$(TSUFFIX)_nomacros.s -o $@
756-
rm shgemm_kernel$(TSUFFIX).s shgemm_kernel$(TSUFFIX)_nomacros.s
753+
$(CC) $(CFLAGS) -S -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o - > sbgemm_kernel$(TSUFFIX).s
754+
m4 sbgemm_kernel$(TSUFFIX).s > sbgemm_kernel$(TSUFFIX)_nomacros.s
755+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX sbgemm_kernel$(TSUFFIX)_nomacros.s -o $@
756+
rm sbgemm_kernel$(TSUFFIX).s sbgemm_kernel$(TSUFFIX)_nomacros.s
757757
else
758-
$(CC) $(CFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
758+
$(CC) $(CFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
759759
endif
760760
endif
761761

@@ -2375,9 +2375,9 @@ $(KDIR)xtrsm_oltncopy$(TSUFFIX).$(SUFFIX) : generic/ztrsm_ltcopy_$(XGEMM_UNROLL_
23752375
$(KDIR)sgemm_beta$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SGEMM_BETA)
23762376
$(CC) $(PFLAGS) -c -UDOUBLE -UCOMPLEX $< -o $@
23772377

2378-
ifeq ($(BUILD_HALF),1)
2379-
$(KDIR)shgemm_beta$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SHGEMM_BETA)
2380-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2378+
ifeq ($(BUILD_BFLOAT16),1)
2379+
$(KDIR)sbgemm_beta$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SBGEMM_BETA)
2380+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
23812381
endif
23822382

23832383
$(KDIR)dgemm_beta$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(DGEMM_BETA)
@@ -2396,19 +2396,19 @@ $(KDIR)xgemm_beta$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(XGEMM_BETA)
23962396
$(CC) $(PFLAGS) -c -DXDOUBLE -DCOMPLEX $< -o $@
23972397

23982398

2399-
ifeq ($(BUILD_HALF), 1)
2400-
$(SHGEMMONCOPYOBJ_P) : $(KERNELDIR)/$(SHGEMMONCOPY)
2401-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2399+
ifeq ($(BUILD_BFLOAT16), 1)
2400+
$(SBGEMMONCOPYOBJ_P) : $(KERNELDIR)/$(SBGEMMONCOPY)
2401+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
24022402

2403-
$(SHGEMMOTCOPYOBJ_P) : $(KERNELDIR)/$(SHGEMMOTCOPY)
2404-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2403+
$(SBGEMMOTCOPYOBJ_P) : $(KERNELDIR)/$(SBGEMMOTCOPY)
2404+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
24052405

2406-
ifneq ($(SHGEMM_UNROLL_M), $(SHGEMM_UNROLL_N))
2407-
$(SHGEMMINCOPYOBJ_P) : $(KERNELDIR)/$(SHGEMMINCOPY)
2408-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2406+
ifneq ($(SBGEMM_UNROLL_M), $(SBGEMM_UNROLL_N))
2407+
$(SBGEMMINCOPYOBJ_P) : $(KERNELDIR)/$(SBGEMMINCOPY)
2408+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
24092409

2410-
$(SHGEMMITCOPYOBJ_P) : $(KERNELDIR)/$(SHGEMMITCOPY)
2411-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2410+
$(SBGEMMITCOPYOBJ_P) : $(KERNELDIR)/$(SBGEMMITCOPY)
2411+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
24122412

24132413
endif
24142414
endif
@@ -2518,9 +2518,9 @@ endif
25182518
endif
25192519

25202520

2521-
ifeq ($(BUILD_HALF), 1)
2522-
$(KDIR)shgemm_kernel$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SHGEMMKERNEL) $(SHGEMMDEPEND)
2523-
$(CC) $(PFLAGS) -c -DHALF -UDOUBLE -UCOMPLEX $< -o $@
2521+
ifeq ($(BUILD_BFLOAT16), 1)
2522+
$(KDIR)sbgemm_kernel$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SBGEMMKERNEL) $(SBGEMMDEPEND)
2523+
$(CC) $(PFLAGS) -c -DBFLOAT16 -UDOUBLE -UCOMPLEX $< -o $@
25242524
endif
25252525

25262526
$(KDIR)sgemm_kernel$(TSUFFIX).$(PSUFFIX) : $(KERNELDIR)/$(SGEMMKERNEL) $(SGEMMDEPEND)

0 commit comments

Comments
 (0)