wernsaar
|
4be4db590c
|
Merge remote branch 'origin/develop' into armv7
|
2013-12-01 13:16:41 +01:00 |
wernsaar
|
5c648a8984
|
Merge remote branch 'origin/develop' into haswell
|
2013-12-01 11:25:33 +01:00 |
wernsaar
|
7581e2e9cb
|
merged common_x86.h and common_x86_64.h from develop
|
2013-12-01 11:23:36 +01:00 |
wernsaar
|
c44dc4dd3c
|
Merge remote branch 'origin/develop' into piledriver
|
2013-12-01 11:06:36 +01:00 |
wernsaar
|
ac7735e01f
|
merge from develop
|
2013-12-01 11:05:10 +01:00 |
wernsaar
|
271ceeba15
|
merged from develop
|
2013-12-01 10:58:22 +01:00 |
wernsaar
|
71eecaaf37
|
Merge remote branch 'origin/develop' into bulldozer
|
2013-12-01 10:53:39 +01:00 |
wernsaar
|
9d3fae15a8
|
Merge branch 'develop' into armv7
|
2013-12-01 10:12:07 +01:00 |
wernsaar
|
2d3c884294
|
added complex gemv kernels for ARMV6 and ARMV7
|
2013-11-29 17:06:33 +01:00 |
wernsaar
|
d54a061713
|
optimized gemv_n_vfp.S
|
2013-11-28 17:40:21 +01:00 |
wernsaar
|
86afb47e83
|
added optimized ctrmm kernel for ARMV6
|
2013-11-28 14:35:07 +01:00 |
wernsaar
|
42a4dff056
|
added optimized ztrmm kernel for ARMV6
|
2013-11-28 13:41:06 +01:00 |
wernsaar
|
5bc322a66c
|
optimized strmm kernel for ARMV6
|
2013-11-28 12:45:38 +01:00 |
wernsaar
|
dec7ad0dfd
|
optimized dtrmm kernel for ARMV7
|
2013-11-28 12:32:12 +01:00 |
wernsaar
|
274304bd03
|
add optimized cgemm kernel for ARMV6
|
2013-11-28 11:54:38 +01:00 |
wernsaar
|
5007a534c4
|
optimized zgemm kernel for ARMV6
|
2013-11-28 10:04:43 +01:00 |
wernsaar
|
a537d7d8d7
|
optimized zgemm_kernel_2x2_vfp.S
|
2013-11-28 08:33:44 +01:00 |
wernsaar
|
b42145834f
|
optimized sgemm kernel for ARMV6
|
2013-11-28 08:08:08 +01:00 |
wernsaar
|
3d5e792c72
|
optimized sgemm kernel for ARMV6
|
2013-11-27 18:38:32 +01:00 |
wernsaar
|
a9bd12da2c
|
optimized dgemm kernel for ARMV6
|
2013-11-27 17:37:38 +01:00 |
wernsaar
|
697e198e8a
|
added zgemm_kernel for ARMV6
|
2013-11-27 16:15:06 +01:00 |
wernsaar
|
36b0f7fe1d
|
added optimized gemv_t kernel for ARMV6
|
2013-11-25 19:31:27 +01:00 |
wernsaar
|
d2b20c5c51
|
add optimized axpy kernel
|
2013-11-25 12:25:58 +01:00 |
wernsaar
|
fd1d9fdb22
|
changed default optimization from -O2 to -O3 for ARMV8
|
2013-11-24 16:19:01 +01:00 |
wernsaar
|
fe5f46c330
|
added experimental support for ARMV8
|
2013-11-24 15:47:00 +01:00 |
wernsaar
|
e25de3d182
|
changed default optimization flag for ARM from -O2 to -O3
|
2013-11-24 13:22:49 +01:00 |
wernsaar
|
25c6050593
|
add single and double precision gemv_n kernel for ARMV6
|
2013-11-24 12:03:28 +01:00 |
wernsaar
|
12e02a00e0
|
added ncopy kernels for ARMV6
|
2013-11-24 08:46:47 +01:00 |
wernsaar
|
29a3196f56
|
added optimized sgemm and strmm kernel for ARMV6
|
2013-11-23 18:09:41 +01:00 |
wernsaar
|
8776a73773
|
added optimized dgemm and dtrmm kernel for ARMV6
|
2013-11-23 16:24:52 +01:00 |
wernsaar
|
7e84acd3e8
|
fixed a bug in the SAVE macros that was not found by any test routine
|
2013-11-23 14:35:19 +01:00 |
wernsaar
|
33d3ab6e09
|
small optimizations for zgemv kernels
|
2013-11-23 12:35:31 +01:00 |
wernsaar
|
9a0f978929
|
added nrm2 kernel for ARMV6
|
2013-11-22 17:21:10 +01:00 |
wernsaar
|
7f210587f0
|
renamed some ncopy and tcopy files
|
2013-11-22 00:20:25 +01:00 |
wernsaar
|
9f0a3a35b3
|
removed obsolete file sdot_vfpv3.S
|
2013-11-21 23:42:54 +01:00 |
wernsaar
|
dbae93110b
|
added sdot_vfp.S
|
2013-11-21 23:34:51 +01:00 |
wernsaar
|
19cd5c64a2
|
renamed swap_vfpv3.S to swap_vfp.S
|
2013-11-21 23:19:32 +01:00 |
wernsaar
|
9adf87495e
|
renamed some dot kernels
|
2013-11-21 23:07:51 +01:00 |
wernsaar
|
440db4cdda
|
delete rot_vfpv3.S
|
2013-11-21 22:52:24 +01:00 |
wernsaar
|
cd93cae5a7
|
renamed rot_vfpv3.S to rot_vfp.S
|
2013-11-21 22:49:28 +01:00 |
wernsaar
|
8565afb3c2
|
renamed asum_vfpv3.S to asum_vfp.S
|
2013-11-21 22:26:27 +01:00 |
wernsaar
|
5bf7cf8d67
|
renamed scal_vfpv3.S to scal_vfp.S
|
2013-11-21 22:03:36 +01:00 |
wernsaar
|
29a005c635
|
renamed iamax assembler kernel
|
2013-11-21 21:12:33 +01:00 |
wernsaar
|
f1be3a168a
|
renamed some BLAS kernels, which are compatible with ARMV6
|
2013-11-21 20:48:57 +01:00 |
wernsaar
|
410afda9b4
|
added cpu detection and target ARMV6, used in raspberry pi
|
2013-11-21 20:18:51 +01:00 |
wernsaar
|
bf04544902
|
added gemv_n kernel for single and double precision
|
2013-11-19 15:07:20 +01:00 |
wernsaar
|
86283c0be1
|
added gemv_t kernel for single and double precision
|
2013-11-19 09:55:54 +01:00 |
wernsaar
|
f27cabfd08
|
added nrm2 kernel for all precisions
|
2013-11-16 16:17:17 +01:00 |
wernsaar
|
23dd474cd0
|
added rot kernel for all precisions
|
2013-11-15 14:08:57 +01:00 |
wernsaar
|
f1b452e160
|
added scal kernel for all precisions
|
2013-11-15 11:56:43 +01:00 |