Optimize cdot function for POWER10

This patch makes use of new POWER10 vector pair instructions for
loads and stores.
This commit is contained in:
Rajalakshmi Srinivasaraghavan
2021-01-15 13:40:34 -06:00
parent e378b24487
commit eff7c9166e
3 changed files with 185 additions and 4 deletions

View File

@@ -154,11 +154,7 @@ ZCOPYKERNEL = zcopy_power10.c
# Dot-product kernel selection: each *DOTKERNEL variable is assigned the name
# of a kernel source file. DSDOTKERNEL is assigned the same file as SDOTKERNEL.
# NOTE(review): these variables are presumably consumed by build rules outside
# this view -- confirm against the including Makefile.
SDOTKERNEL = sdot_power10.c
DDOTKERNEL = ddot_power10.c
DSDOTKERNEL = sdot_power10.c
# CDOTKERNEL is chosen at parse time: cdot_power9.S is used whenever
# GCCVERSIONGTEQ9 does not expand to exactly "1" (including when it is unset
# or empty); otherwise cdot.c is used.
# NOTE(review): GCCVERSIONGTEQ9 is defined outside this view; by its name it
# presumably flags a GCC version >= 9 -- confirm where it is set.
ifneq ($(GCCVERSIONGTEQ9),1)
CDOTKERNEL = cdot_power9.S
else
CDOTKERNEL = cdot.c
endif
# ZDOTKERNEL is assigned unconditionally.
ZDOTKERNEL = zdot.c
#
# SNRM2KERNEL is assigned a relative path into a sibling ../arm directory
# rather than a file name in the current directory.
SNRM2KERNEL = ../arm/nrm2.c