update configuration of kernels for A64FX and ARMV8SVE
This commit is contained in:
parent
07fa6fa3b1
commit
d30157d891
|
@ -156,19 +156,30 @@ DTRMMLTCOPY_M = trmm_ltcopy_sve_v1.c
|
||||||
DSYMMUCOPY_M = symm_ucopy_sve.c
|
DSYMMUCOPY_M = symm_ucopy_sve.c
|
||||||
DSYMMLCOPY_M = symm_lcopy_sve.c
|
DSYMMLCOPY_M = symm_lcopy_sve.c
|
||||||
|
|
||||||
CGEMMKERNEL = cgemm_kernel_$(CGEMM_UNROLL_M)x$(CGEMM_UNROLL_N).S
|
CGEMMKERNEL = cgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
CTRMMKERNEL = ctrmm_kernel_$(CGEMM_UNROLL_M)x$(CGEMM_UNROLL_N).S
|
CTRMMKERNEL = ctrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
ifneq ($(CGEMM_UNROLL_M), $(CGEMM_UNROLL_N))
|
|
||||||
CGEMMINCOPY = ../generic/zgemm_ncopy_$(CGEMM_UNROLL_M).c
|
CGEMMINCOPY = cgemm_ncopy_sve_v1.c
|
||||||
CGEMMITCOPY = ../generic/zgemm_tcopy_$(CGEMM_UNROLL_M).c
|
CGEMMITCOPY = cgemm_tcopy_sve_v1.c
|
||||||
|
CGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
|
||||||
|
CGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
|
||||||
|
|
||||||
CGEMMINCOPYOBJ = cgemm_incopy$(TSUFFIX).$(SUFFIX)
|
CGEMMINCOPYOBJ = cgemm_incopy$(TSUFFIX).$(SUFFIX)
|
||||||
CGEMMITCOPYOBJ = cgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
CGEMMITCOPYOBJ = cgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
||||||
endif
|
|
||||||
CGEMMONCOPY = ../generic/zgemm_ncopy_$(CGEMM_UNROLL_N).c
|
|
||||||
CGEMMOTCOPY = ../generic/zgemm_tcopy_$(CGEMM_UNROLL_N).c
|
|
||||||
CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
||||||
CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
||||||
|
|
||||||
|
CTRMMUNCOPY_M = ztrmm_uncopy_sve_v1.c
|
||||||
|
CTRMMLNCOPY_M = ztrmm_lncopy_sve_v1.c
|
||||||
|
CTRMMUTCOPY_M = ztrmm_utcopy_sve_v1.c
|
||||||
|
CTRMMLTCOPY_M = ztrmm_ltcopy_sve_v1.c
|
||||||
|
|
||||||
|
CHEMMLTCOPY_M = chemm_ltcopy_sve.c
|
||||||
|
CHEMMUTCOPY_M = chemm_utcopy_sve.c
|
||||||
|
|
||||||
|
CSYMMUCOPY_M = zsymm_ucopy_sve.c
|
||||||
|
CSYMMLCOPY_M = zsymm_lcopy_sve.c
|
||||||
|
|
||||||
ZGEMMKERNEL = zgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
ZGEMMKERNEL = zgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
ZTRMMKERNEL = ztrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
ZTRMMKERNEL = ztrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
|
|
||||||
|
@ -190,3 +201,5 @@ ZTRMMLTCOPY_M = ztrmm_ltcopy_sve_v1.c
|
||||||
ZHEMMLTCOPY_M = zhemm_ltcopy_sve.c
|
ZHEMMLTCOPY_M = zhemm_ltcopy_sve.c
|
||||||
ZHEMMUTCOPY_M = zhemm_utcopy_sve.c
|
ZHEMMUTCOPY_M = zhemm_utcopy_sve.c
|
||||||
|
|
||||||
|
ZSYMMUCOPY_M = zsymm_ucopy_sve.c
|
||||||
|
ZSYMMLCOPY_M = zsymm_lcopy_sve.c
|
||||||
|
|
|
@ -156,28 +156,50 @@ DTRMMLTCOPY_M = trmm_ltcopy_sve_v1.c
|
||||||
DSYMMUCOPY_M = symm_ucopy_sve.c
|
DSYMMUCOPY_M = symm_ucopy_sve.c
|
||||||
DSYMMLCOPY_M = symm_lcopy_sve.c
|
DSYMMLCOPY_M = symm_lcopy_sve.c
|
||||||
|
|
||||||
CGEMMKERNEL = cgemm_kernel_$(CGEMM_UNROLL_M)x$(CGEMM_UNROLL_N).S
|
CGEMMKERNEL = cgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
CTRMMKERNEL = ctrmm_kernel_$(CGEMM_UNROLL_M)x$(CGEMM_UNROLL_N).S
|
CTRMMKERNEL = ctrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
ifneq ($(CGEMM_UNROLL_M), $(CGEMM_UNROLL_N))
|
|
||||||
CGEMMINCOPY = ../generic/zgemm_ncopy_$(CGEMM_UNROLL_M).c
|
CGEMMINCOPY = cgemm_ncopy_sve_v1.c
|
||||||
CGEMMITCOPY = ../generic/zgemm_tcopy_$(CGEMM_UNROLL_M).c
|
CGEMMITCOPY = cgemm_tcopy_sve_v1.c
|
||||||
|
CGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
|
||||||
|
CGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
|
||||||
|
|
||||||
CGEMMINCOPYOBJ = cgemm_incopy$(TSUFFIX).$(SUFFIX)
|
CGEMMINCOPYOBJ = cgemm_incopy$(TSUFFIX).$(SUFFIX)
|
||||||
CGEMMITCOPYOBJ = cgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
CGEMMITCOPYOBJ = cgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
||||||
endif
|
|
||||||
CGEMMONCOPY = ../generic/zgemm_ncopy_$(CGEMM_UNROLL_N).c
|
|
||||||
CGEMMOTCOPY = ../generic/zgemm_tcopy_$(CGEMM_UNROLL_N).c
|
|
||||||
CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
||||||
CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
||||||
|
|
||||||
ZGEMMKERNEL = zgemm_kernel_$(ZGEMM_UNROLL_M)x$(ZGEMM_UNROLL_N).S
|
CTRMMUNCOPY_M = ztrmm_uncopy_sve_v1.c
|
||||||
ZTRMMKERNEL = ztrmm_kernel_$(ZGEMM_UNROLL_M)x$(ZGEMM_UNROLL_N).S
|
CTRMMLNCOPY_M = ztrmm_lncopy_sve_v1.c
|
||||||
ifneq ($(ZGEMM_UNROLL_M), $(ZGEMM_UNROLL_N))
|
CTRMMUTCOPY_M = ztrmm_utcopy_sve_v1.c
|
||||||
ZGEMMINCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_M).c
|
CTRMMLTCOPY_M = ztrmm_ltcopy_sve_v1.c
|
||||||
ZGEMMITCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_M).c
|
|
||||||
ZGEMMINCOPYOBJ = zgemm_incopy$(TSUFFIX).$(SUFFIX)
|
CHEMMLTCOPY_M = chemm_ltcopy_sve.c
|
||||||
ZGEMMITCOPYOBJ = zgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
CHEMMUTCOPY_M = chemm_utcopy_sve.c
|
||||||
endif
|
|
||||||
|
CSYMMUCOPY_M = zsymm_ucopy_sve.c
|
||||||
|
CSYMMLCOPY_M = zsymm_lcopy_sve.c
|
||||||
|
|
||||||
|
ZGEMMKERNEL = zgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
|
ZTRMMKERNEL = ztrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
|
||||||
|
|
||||||
|
ZGEMMINCOPY = zgemm_ncopy_sve_v1.c
|
||||||
|
ZGEMMITCOPY = zgemm_tcopy_sve_v1.c
|
||||||
ZGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
|
ZGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
|
||||||
ZGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
|
ZGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
|
||||||
|
|
||||||
|
ZGEMMINCOPYOBJ = zgemm_incopy$(TSUFFIX).$(SUFFIX)
|
||||||
|
ZGEMMITCOPYOBJ = zgemm_itcopy$(TSUFFIX).$(SUFFIX)
|
||||||
ZGEMMONCOPYOBJ = zgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
ZGEMMONCOPYOBJ = zgemm_oncopy$(TSUFFIX).$(SUFFIX)
|
||||||
ZGEMMOTCOPYOBJ = zgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
ZGEMMOTCOPYOBJ = zgemm_otcopy$(TSUFFIX).$(SUFFIX)
|
||||||
|
|
||||||
|
ZTRMMUNCOPY_M = ztrmm_uncopy_sve_v1.c
|
||||||
|
ZTRMMLNCOPY_M = ztrmm_lncopy_sve_v1.c
|
||||||
|
ZTRMMUTCOPY_M = ztrmm_utcopy_sve_v1.c
|
||||||
|
ZTRMMLTCOPY_M = ztrmm_ltcopy_sve_v1.c
|
||||||
|
|
||||||
|
ZHEMMLTCOPY_M = zhemm_ltcopy_sve.c
|
||||||
|
ZHEMMUTCOPY_M = zhemm_utcopy_sve.c
|
||||||
|
|
||||||
|
ZSYMMUCOPY_M = zsymm_ucopy_sve.c
|
||||||
|
ZSYMMLCOPY_M = zsymm_lcopy_sve.c
|
||||||
|
|
Loading…
Reference in New Issue