Add workaround for NVIDIA HPC mishandling of the asm DOT kernels
This commit is contained in:
parent
c2a8ebfe69
commit
0f27a03607
|
@ -70,10 +70,19 @@ DCOPYKERNEL = copy.S
|
||||||
CCOPYKERNEL = copy.S
|
CCOPYKERNEL = copy.S
|
||||||
ZCOPYKERNEL = copy.S
|
ZCOPYKERNEL = copy.S
|
||||||
|
|
||||||
|
# Real-valued DOT kernels.
# SDOT: when C_COMPILER is PGI the assembly kernel dot.S is selected; every
# other compiler gets the generic C implementation.
# NOTE(review): the change description says the asm DOT kernels are what
# NVIDIA HPC (presumably the compiler reported as PGI) mishandles, yet PGI
# is routed *to* dot.S here -- confirm this direction is intended.
ifeq ($(C_COMPILER), PGI)
SDOTKERNEL = dot.S
else
SDOTKERNEL = ../generic/dot.c
endif
# DDOT uses the assembly kernel regardless of compiler.
DDOTKERNEL = dot.S
|
||||||
|
# Complex DOT kernels: when C_COMPILER is PGI, CDOT and ZDOT are built from
# the C source ../arm/zdot.c; all other compilers keep the assembly zdot.S.
ifeq ($(C_COMPILER), PGI)
CDOTKERNEL = ../arm/zdot.c
ZDOTKERNEL = ../arm/zdot.c
else
CDOTKERNEL = zdot.S
ZDOTKERNEL = zdot.S
endif
# DSDOT does not depend on the compiler and stays on the assembly kernel.
DSDOTKERNEL = dot.S
|
||||||
|
|
||||||
SNRM2KERNEL = nrm2.S
|
SNRM2KERNEL = nrm2.S
|
||||||
|
|
Loading…
Reference in New Issue