@@ -23,6 +23,10 @@ ifeq ($(BUILD_BFLOAT16),1)
23
23
SBBLASOBJS += sbgemm_nn.$(SUFFIX ) sbgemm_nt.$(SUFFIX ) sbgemm_tn.$(SUFFIX ) sbgemm_tt.$(SUFFIX )
24
24
endif
25
25
26
# Added hunk: when BUILD_HFLOAT16 is 1, append the four shgemm objects
# (nn, nt, tn, tt name suffixes) to SHBLASOBJS.
+ ifeq ($(BUILD_HFLOAT16),1)
27
+ SHBLASOBJS += shgemm_nn.$(SUFFIX) shgemm_nt.$(SUFFIX) shgemm_tn.$(SUFFIX) shgemm_tt.$(SUFFIX)
28
+ endif
29
+
26
30
SBLASOBJS += \
27
31
sgemm_nn.$(SUFFIX ) sgemm_nt.$(SUFFIX ) sgemm_tn.$(SUFFIX ) sgemm_tt.$(SUFFIX ) \
28
32
strmm_LNUU.$(SUFFIX ) strmm_LNUN.$(SUFFIX ) strmm_LNLU.$(SUFFIX ) strmm_LNLN.$(SUFFIX ) \
@@ -210,6 +214,9 @@ ifneq ($(USE_SIMPLE_THREADED_LEVEL3), 1)
210
214
# Context lines: when BUILD_BFLOAT16 is 1, append the four sbgemm_thread
# objects (nn, nt, tn, tt name suffixes) to SBBLASOBJS.
ifeq ($(BUILD_BFLOAT16),1)
211
215
SBBLASOBJS += sbgemm_thread_nn.$(SUFFIX) sbgemm_thread_nt.$(SUFFIX) sbgemm_thread_tn.$(SUFFIX) sbgemm_thread_tt.$(SUFFIX)
212
216
endif
217
# Added hunk: when BUILD_HFLOAT16 is 1, append the four shgemm_thread
# objects (nn, nt, tn, tt name suffixes) to SHBLASOBJS.
+ ifeq ($(BUILD_HFLOAT16),1)
218
+ SHBLASOBJS += shgemm_thread_nn.$(SUFFIX) shgemm_thread_nt.$(SUFFIX) shgemm_thread_tn.$(SUFFIX) shgemm_thread_tt.$(SUFFIX)
219
+ endif
213
220
# Context lines: unconditionally (within this hunk) append the threaded GEMM
# objects for the s, d and q prefixes to their respective object lists.
# Each list receives the nn, nt, tn and tt objects for its prefix.
SBLASOBJS += sgemm_thread_nn.$(SUFFIX) sgemm_thread_nt.$(SUFFIX) sgemm_thread_tn.$(SUFFIX) sgemm_thread_tt.$(SUFFIX)
214
221
DBLASOBJS += dgemm_thread_nn.$(SUFFIX) dgemm_thread_nt.$(SUFFIX) dgemm_thread_tn.$(SUFFIX) dgemm_thread_tt.$(SUFFIX)
215
222
QBLASOBJS += qgemm_thread_nn.$(SUFFIX) qgemm_thread_nt.$(SUFFIX) qgemm_thread_tn.$(SUFFIX) qgemm_thread_tt.$(SUFFIX)
@@ -355,6 +362,18 @@ sbgemm_tn.$(SUFFIX) : gemm.c level3.c ../../param.h
355
362
# Context rule: compile gemm.c (the first prerequisite, $<) into
# sbgemm_tt.$(SUFFIX) with HALF and TT defined and DOUBLE/COMPLEX undefined.
# level3.c and ../../param.h are prerequisites only, so editing either one
# triggers a rebuild. The output name is the file part of the target, $(@F).
sbgemm_tt.$(SUFFIX) : gemm.c level3.c ../../param.h
356
363
$(CC) $(CFLAGS) $(BLOCKS) -c -DHALF -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
357
364
365
# Added rules: build the four shgemm objects (nn, nt, tn, tt) for $(SUFFIX).
# Every rule compiles gemm.c (the first prerequisite, $<) with $(CFLAGS) and
# $(BLOCKS), defines HFLOAT16, undefines DOUBLE and COMPLEX, and defines one of
# NN / NT / TN / TT to match the target name. level3.c and ../../param.h are
# listed only so that a change to them triggers a rebuild. The object is
# written to the file part of the target, $(@F).
+ shgemm_nn.$(SUFFIX) : gemm.c level3.c ../../param.h
366
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
367
+
368
+ shgemm_nt.$(SUFFIX) : gemm.c level3.c ../../param.h
369
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNT $< -o $(@F)
370
+
371
+ shgemm_tn.$(SUFFIX) : gemm.c level3.c ../../param.h
372
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTN $< -o $(@F)
373
+
374
+ shgemm_tt.$(SUFFIX) : gemm.c level3.c ../../param.h
375
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
376
+
358
377
# Context rule: compile gemm.c ($<) into sgemm_nn.$(SUFFIX) with NN defined
# and DOUBLE/COMPLEX undefined. No HALF or HFLOAT16 define is passed here.
# level3.c and ../../param.h are rebuild-triggering prerequisites; the output
# name is the file part of the target, $(@F).
sgemm_nn.$(SUFFIX) : gemm.c level3.c ../../param.h
359
378
$(CC) $(CFLAGS) $(BLOCKS) -c -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
360
379
@@ -562,6 +581,18 @@ sbgemm_thread_tn.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
562
581
# Context rule: compile gemm.c ($<) into sbgemm_thread_tt.$(SUFFIX) with
# THREADED_LEVEL3, HALF and TT defined and DOUBLE/COMPLEX undefined.
# level3_thread.c and ../../param.h are rebuild-triggering prerequisites; the
# output name is the file part of the target, $(@F).
sbgemm_thread_tt.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
563
582
$(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHALF -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
564
583
584
# Added rules: build the four shgemm_thread objects (nn, nt, tn, tt) for
# $(SUFFIX). Every rule compiles gemm.c (the first prerequisite, $<) with
# $(CFLAGS) and $(BLOCKS), defines THREADED_LEVEL3 and HFLOAT16, undefines
# DOUBLE and COMPLEX, and defines one of NN / NT / TN / TT to match the target
# name. level3_thread.c and ../../param.h are listed only so that a change to
# them triggers a rebuild. The object is written to $(@F).
+ shgemm_thread_nn.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
585
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
586
+
587
+ shgemm_thread_nt.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
588
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNT $< -o $(@F)
589
+
590
+ shgemm_thread_tn.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
591
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTN $< -o $(@F)
592
+
593
+ shgemm_thread_tt.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
594
+ $(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
595
+
565
596
# Context rule: compile gemm.c ($<) into sgemm_thread_nn.$(SUFFIX) with
# THREADED_LEVEL3 and NN defined and DOUBLE/COMPLEX undefined.
# level3_thread.c and ../../param.h are rebuild-triggering prerequisites; the
# output name is the file part of the target, $(@F).
sgemm_thread_nn.$(SUFFIX) : gemm.c level3_thread.c ../../param.h
566
597
$(CC) $(CFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
567
598
@@ -2747,6 +2778,18 @@ sbgemm_tn.$(PSUFFIX) : gemm.c level3.c ../../param.h
2747
2778
# Context rule: $(PSUFFIX) counterpart of the sbgemm_tt rule. It compiles
# gemm.c ($<) with $(PFLAGS) instead of $(CFLAGS), with HALF and TT defined and
# DOUBLE/COMPLEX undefined. level3.c and ../../param.h are rebuild-triggering
# prerequisites; the output name is the file part of the target, $(@F).
sbgemm_tt.$(PSUFFIX) : gemm.c level3.c ../../param.h
2748
2779
$(CC) $(PFLAGS) $(BLOCKS) -c -DHALF -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
2749
2780
2781
# Added rules: build the four shgemm objects (nn, nt, tn, tt) for $(PSUFFIX).
# Every rule compiles gemm.c (the first prerequisite, $<) with $(PFLAGS) and
# $(BLOCKS), defines HFLOAT16, undefines DOUBLE and COMPLEX, and defines one of
# NN / NT / TN / TT to match the target name. level3.c and ../../param.h are
# listed only so that a change to them triggers a rebuild. The object is
# written to the file part of the target, $(@F).
+ shgemm_nn.$(PSUFFIX) : gemm.c level3.c ../../param.h
2782
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
2783
+
2784
+ shgemm_nt.$(PSUFFIX) : gemm.c level3.c ../../param.h
2785
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNT $< -o $(@F)
2786
+
2787
+ shgemm_tn.$(PSUFFIX) : gemm.c level3.c ../../param.h
2788
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTN $< -o $(@F)
2789
+
2790
+ shgemm_tt.$(PSUFFIX) : gemm.c level3.c ../../param.h
2791
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
2792
+
2750
2793
# Context rule: $(PSUFFIX) counterpart of the sgemm_nn rule. It compiles
# gemm.c ($<) with $(PFLAGS), with NN defined and DOUBLE/COMPLEX undefined.
# level3.c and ../../param.h are rebuild-triggering prerequisites; the output
# name is the file part of the target, $(@F).
sgemm_nn.$(PSUFFIX) : gemm.c level3.c ../../param.h
2751
2794
$(CC) $(PFLAGS) $(BLOCKS) -c -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
2752
2795
@@ -2970,6 +3013,18 @@ sbgemm_thread_tn.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
2970
3013
# Context rule: $(PSUFFIX) counterpart of the sbgemm_thread_tt rule. It
# compiles gemm.c ($<) with $(PFLAGS), with THREADED_LEVEL3, HALF and TT
# defined and DOUBLE/COMPLEX undefined. level3_thread.c and ../../param.h are
# rebuild-triggering prerequisites; the output name is $(@F).
sbgemm_thread_tt.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
2971
3014
$(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHALF -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
2972
3015
3016
# Added rules: build the four shgemm_thread objects (nn, nt, tn, tt) for
# $(PSUFFIX). Every rule compiles gemm.c (the first prerequisite, $<) with
# $(PFLAGS) and $(BLOCKS), defines THREADED_LEVEL3 and HFLOAT16, undefines
# DOUBLE and COMPLEX, and defines one of NN / NT / TN / TT to match the target
# name. level3_thread.c and ../../param.h are listed only so that a change to
# them triggers a rebuild. The object is written to $(@F).
+ shgemm_thread_nn.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
3017
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
3018
+
3019
+ shgemm_thread_nt.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
3020
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DNT $< -o $(@F)
3021
+
3022
+ shgemm_thread_tn.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
3023
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTN $< -o $(@F)
3024
+
3025
+ shgemm_thread_tt.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
3026
+ $(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -DHFLOAT16 -UDOUBLE -UCOMPLEX -DTT $< -o $(@F)
3027
+
2973
3028
# Context rule: $(PSUFFIX) counterpart of the sgemm_thread_nn rule. It
# compiles gemm.c ($<) with $(PFLAGS), with THREADED_LEVEL3 and NN defined and
# DOUBLE/COMPLEX undefined. level3_thread.c and ../../param.h are
# rebuild-triggering prerequisites; the output name is $(@F).
sgemm_thread_nn.$(PSUFFIX) : gemm.c level3_thread.c ../../param.h
2974
3029
$(CC) $(PFLAGS) $(BLOCKS) -c -DTHREADED_LEVEL3 -UDOUBLE -UCOMPLEX -DNN $< -o $(@F)
2975
3030
0 commit comments