Update dgemm_kernel_4x8_skylakex_2.c

This commit is contained in:
wjc404 2019-11-28 19:56:35 +08:00 committed by GitHub
parent eb1e9c8c92
commit 934e601e93
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed files with 5 additions and 3 deletions

View File

@ -97,15 +97,17 @@
/* %10 for prefetch of C elements before storage; %4 = ldc(in bytes),%11 for prefetch of next B block */
#define INNER_KERNELm8(nn) \
"movq %3,%10;cmpq $16,%2;jb "#nn"001f;"\
"movq %3,%10;cmpq $18,%2;jb "#nn"001f;"\
#nn"008:\n\t"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
"prefetcht1 (%10); prefetcht1 63(%10); addq %4,%10;"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
"prefetcht1 (%11); addq $16,%11;"\
"subq $4,%2;cmpq $16,%2;jnb "#nn"008b;"\
INNER_KERNEL_k1m8n##nn "addq $64,%1;"\
"prefetcht1 (%11); addq $32,%11;"\
"subq $6,%2;cmpq $18,%2;jnb "#nn"008b;"\
"movq %3,%10;"\
#nn"001:\n\t"\
"cmpq $1,%2;jb "#nn"000f;"\