Optimized SGEMM kernel for ARMv6
This commit is contained in:
		
							parent
							
								
									3d5e792c72
								
							
						
					
					
						commit
						b42145834f
					
				|  | @ -26,7 +26,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
| *****************************************************************************/ | *****************************************************************************/ | ||||||
| 
 | 
 | ||||||
| /************************************************************************************** | /************************************************************************************** | ||||||
| * 2013/11/27 Saar | * 2013/11/28 Saar | ||||||
| * 	 BLASTEST 		: OK | * 	 BLASTEST 		: OK | ||||||
| * 	 CTEST			: OK | * 	 CTEST			: OK | ||||||
| * 	 TEST			: OK | * 	 TEST			: OK | ||||||
|  | @ -100,17 +100,12 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
| 
 | 
 | ||||||
| .macro KERNEL4x2_SUB
 | .macro KERNEL4x2_SUB
 | ||||||
| 
 | 
 | ||||||
| 	flds	s4 , [ BO ] | 	fldmias	AO! , { s0 - s3 } | ||||||
| 
 | 	fldmias	BO! , { s4 - s5 } | ||||||
| 	flds	s0 , [ AO ] |  | ||||||
| 	flds	s1 , [ AO, #4 ] |  | ||||||
| 
 | 
 | ||||||
| 	fmacs	s8  , s0,  s4 | 	fmacs	s8  , s0,  s4 | ||||||
| 	flds	s2 , [ AO, #8 ] |  | ||||||
| 	fmacs	s9  , s1,  s4 | 	fmacs	s9  , s1,  s4 | ||||||
| 	flds	s3 , [ AO, #12 ] |  | ||||||
| 	fmacs	s10  , s2,  s4 | 	fmacs	s10  , s2,  s4 | ||||||
| 	flds	s5 , [ BO, #4 ] |  | ||||||
| 	fmacs	s11  , s3,  s4 | 	fmacs	s11  , s3,  s4 | ||||||
| 
 | 
 | ||||||
| 	fmacs	s12  , s0,  s5 | 	fmacs	s12  , s0,  s5 | ||||||
|  | @ -118,9 +113,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
| 	fmacs	s14  , s2,  s5 | 	fmacs	s14  , s2,  s5 | ||||||
| 	fmacs	s15  , s3,  s5 | 	fmacs	s15  , s3,  s5 | ||||||
| 
 | 
 | ||||||
| 	add	AO , AO, #16 |  | ||||||
| 	add	BO , BO, #8 |  | ||||||
| 
 |  | ||||||
| .endm | .endm | ||||||
| 
 | 
 | ||||||
| .macro SAVE4x2
 | .macro SAVE4x2
 | ||||||
|  |  | ||||||
		Loading…
	
		Reference in New Issue