Merge pull request #898 from wernsaar/develop
added experimental support for optimized lapack fortran functions
This commit is contained in:
commit
f04af36ad0
File diff suppressed because it is too large
Load Diff
|
@ -54,29 +54,26 @@ DSTRM_LT_L4x16_LOOP_START:
|
||||||
|
|
||||||
addic. L, KK, 0
|
addic. L, KK, 0
|
||||||
ble- DSTRM_LT_L4x16_SAVE
|
ble- DSTRM_LT_L4x16_SAVE
|
||||||
|
mtctr L
|
||||||
|
|
||||||
DSTRM_LT_L4x16_LOOP:
|
DSTRM_LT_L4x16_LOOP:
|
||||||
|
|
||||||
dcbt AO, PRE
|
dcbt AO, PRE
|
||||||
dcbt BO, PRE
|
dcbt BO, PRE
|
||||||
KERNEL_16x4
|
KERNEL_16x4
|
||||||
addic. L, L, -1
|
bdz- DSTRM_LT_L4x16_SAVE
|
||||||
ble- DSTRM_LT_L4x16_SAVE
|
|
||||||
|
|
||||||
dcbt AO, PRE
|
dcbt AO, PRE
|
||||||
KERNEL_16x4
|
KERNEL_16x4
|
||||||
addic. L, L, -1
|
bdz- DSTRM_LT_L4x16_SAVE
|
||||||
ble- DSTRM_LT_L4x16_SAVE
|
|
||||||
|
|
||||||
dcbt AO, PRE
|
dcbt AO, PRE
|
||||||
KERNEL_16x4
|
KERNEL_16x4
|
||||||
addic. L, L, -1
|
bdz- DSTRM_LT_L4x16_SAVE
|
||||||
ble- DSTRM_LT_L4x16_SAVE
|
|
||||||
|
|
||||||
dcbt AO, PRE
|
dcbt AO, PRE
|
||||||
KERNEL_16x4
|
KERNEL_16x4
|
||||||
addic. L, L, -1
|
bdnz+ DSTRM_LT_L4x16_LOOP
|
||||||
bgt+ DSTRM_LT_L4x16_LOOP
|
|
||||||
|
|
||||||
|
|
||||||
DSTRM_LT_L4x16_SAVE:
|
DSTRM_LT_L4x16_SAVE:
|
||||||
|
|
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue