undo slow dgemm/skylake microoptimization
the compare is more costly than the work
This commit is contained in:
parent
d74dc39b0f
commit
6d43c51ccf
|
@ -647,11 +647,9 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
|
|
||||||
#define SAVE2x2(ALPHA) \
|
#define SAVE2x2(ALPHA) \
|
||||||
if (ALPHA != 1.0) { \
|
xmm0 = _mm_set1_pd(ALPHA); \
|
||||||
xmm0 = _mm_set1_pd(ALPHA); \
|
xmm4 *= xmm0; \
|
||||||
xmm4 *= xmm0; \
|
xmm6 *= xmm0; \
|
||||||
xmm6 *= xmm0; \
|
|
||||||
} \
|
|
||||||
\
|
\
|
||||||
xmm4 += _mm_loadu_pd(CO1); \
|
xmm4 += _mm_loadu_pd(CO1); \
|
||||||
xmm6 += _mm_loadu_pd(CO1 + ldc); \
|
xmm6 += _mm_loadu_pd(CO1 + ldc); \
|
||||||
|
|
Loading…
Reference in New Issue