97f68f7f3a 
								
							 
						 
						
							
							
								
								Merge pull request  #169  from juliantaylor/sanity-check-cpu  
							
							... 
							
							
							
							add a sanity check on the detected cpu type 
							
						 
						
							2012-12-15 06:46:48 -08:00  
				
					
						
							
							
								 
						
							
								1138817dd2 
								
							 
						 
						
							
							
								
								add a sanity check on the detected cpu type  
							
							... 
							
							
							
							if we have 64 bit pointers we can't have a 32 bit cpu, so fall back to
the 64bit cpu fallback (prescott)
E.g. the cpu detection fails in amd qemu64 emulation (family 6 model 2)
causing it to use the uninitialized gotoblas_ATHLON 
							
						 
						
							2012-12-15 13:29:46 +01:00  
				
					
						
							
							
								 
						
							
								13f8fc0b1a 
								
							 
						 
						
							
							
								
								Write FMA4 flag to the configure file.  
							
							
							
						 
						
							2012-12-11 10:55:10 +01:00  
				
					
						
							
							
								 
						
							
								bdf8d9411e 
								
							 
						 
						
							
							
								
								Refs  #163 . Obtain the build configuration at runtime.  
							
							... 
							
							
							
							The openblas_get_config function returns the configuration string.
So far, it supports USE64BITINT, NO_CBLAS, NO_LAPACK, NO_LAPACKE,
DYNAMIC_ARCH, NO_AFFINITY.
Example:
 #include <stdio.h>
extern char * openblas_get_config();
void main()
{
  printf("%s\n",openblas_get_config());
  return;
} 
							
						 
						
							2012-12-10 15:52:51 +08:00  
				
					
						
							
							
								 
						
							
								bb10cb8442 
								
							 
						 
						
							
							
								
								Refs  #165 . fall back of DTB_DEFAULT_ENTRIES for some virtual machines.  
							
							
							
						 
						
							2012-12-10 11:51:39 +08:00  
				
					
						
							
							
								 
						
							
								d48cff8cf1 
								
							 
						 
						
							
							
								
								Added optimized sgemm_kernel  
							
							
							
						 
						
							2012-12-08 18:50:53 +01:00  
				
					
						
							
							
								 
						
							
								f19af5ecc0 
								
							 
						 
						
							
							
								
								Refs  #54 . Added AMD Bulldozer x86_64 dgemm kernel developed by Werner Saar <wernsaar at googlemail.com>  
							
							... 
							
							
							
							Based on the dgemm kernel for AMD Barcelona, he used AVX and FMA4 instructions.
Thanks, Werner Saar! 
							
						 
						
							2012-12-07 01:05:11 +08:00  
				
					
						
							
							
								 
						
							
								bfaaa975e6 
								
							 
						 
						
							
							
								
								Added BULLDOZER target. So far it uses barcelona kernels.  
							
							
							
						 
						
							2012-12-07 00:53:31 +08:00  
				
					
						
							
							
								 
						
							
								b7c0fa6bd2 
								
							 
						 
						
							
							
								
								Init AMD Bulldozer codebase.  
							
							
							
						 
						
							2012-12-06 07:29:54 -05:00  
				
					
						
							
							
								 
						
							
								7110d17146 
								
							 
						 
						
							
							
								
								Added -lgomp for generating DLL on Windows.  
							
							
							
						 
						
							2012-11-28 12:52:28 +08:00  
				
					
						
							
							
								 
						
							
								e01b3d4b54 
								
							 
						 
						
							
							
								
								Merge branch 'develop'  
							
							
							
						 
						
							2012-11-27 07:24:53 +08:00  
				
					
						
							
							
								 
						
							
								cea1a885b5 
								
							 
						 
						
							
							
								
								Refs  #154 . Fixed the build bug of dgemv_t on MinGW64.  
							
							
							
						 
						
							2012-11-27 07:24:04 +08:00  
				
					
						
							
							
								 
						
							
								f78eb335d6 
								
							 
						 
						
							
							
								
								Merge branch 'develop'  
							
							
							
						 
						
							2012-11-26 17:32:56 +08:00  
				
					
						
							
							
								 
						
							
								2345bdec68 
								
							 
						 
						
							
							
								
								Update the doc for 0.2.5 version.  
							
							
							
						 
						
							2012-11-26 17:32:25 +08:00  
				
					
						
							
							
								 
						
							
								5f0117385e 
								
							 
						 
						
							
							
								
								Refs  #154 . Fixed a SEGFAULT bug of dgemv_t when m is very large.  
							
							... 
							
							
							
							It overflowed the internal buffer. Thus, we split vector x into blocks when m is very large.
Thanks to @wangqian for this patch. 
							
						 
						
							2012-11-19 22:32:27 +08:00  
				
					
						
							
							
								 
						
							
								6caf1bab73 
								
							 
						 
						
							
							
								
								Fixed   #160 . Merge branch 'master' of  https://github.com/sebastien-villemot/OpenBLAS  into develop  
							
							
							
						 
						
							2012-11-15 18:21:04 +08:00  
				
					
						
							
							
								 
						
							
								01e3c984ce 
								
							 
						 
						
							
							
								
								Fix compilation with TARGET=GENERIC  
							
							... 
							
							
							
							Patch applied to Debian package 
							
						 
						
							2012-11-14 21:04:05 +01:00  
				
					
						
							
							
								 
						
							
								6751f7b9a7 
								
							 
						 
						
							
							
								
								Fixed   #157 . Only detect the number of physical CPU cores on Mac OSX.  
							
							
							
						 
						
							2012-11-13 15:48:57 +08:00  
				
					
						
							
							
								 
						
							
								d5717a97ea 
								
							 
						 
						
							
							
								
								Compile lapacke with ILP64 model when INTERFACE64=1  
							
							
							
						 
						
							2012-11-13 00:54:20 +08:00  
				
					
						
							
							
								 
						
							
								b45d43d295 
								
							 
						 
						
							
							
								
								Added the patch for lapacke example.  
							
							
							
						 
						
							2012-11-13 00:53:26 +08:00  
				
					
						
							
							
								 
						
							
								dcfb69c2b5 
								
							 
						 
						
							
							
								
								Merge branch 'master' of  https://github.com/alnsn/OpenBLAS  into develop  
							
							
							
						 
						
							2012-11-12 11:17:04 +08:00  
				
					
						
							
							
								 
						
							
								e85549ee11 
								
							 
						 
						
							
							
								
								Fix NetBSD build.  
							
							
							
						 
						
							2012-11-10 23:20:44 +00:00  
				
					
						
							
							
								 
						
							
								789f205177 
								
							 
						 
						
							
							
								
								Improved Makefile.rule for cross compiler.  
							
							
							
						 
						
							2012-11-09 00:14:20 +08:00  
				
					
						
							
							
								 
						
							
								378acfe826 
								
							 
						 
						
							
							
								
								Added NO_SHARED flag to disable generating the shared library.  
							
							
							
						 
						
							2012-11-09 00:14:15 +08:00  
				
					
						
							
							
								 
						
							
								538c764d2b 
								
							 
						 
						
							
							
								
								Refs  #153 . Restore the original CPU affinity when calling openblas_set_num_threads(1).  
							
							... 
							
							
							
							Please read the issue on github.com for details. 
							
						 
						
							2012-11-06 18:21:46 +08:00  
				
					
						
							
							
								 
						
							
								0f26a21624 
								
							 
						 
						
							
							
								
								Alternative approach to avoid command-line length while archiving lapacke -- Thanks Michel!  
							
							
							
						 
						
							2012-10-15 22:26:18 +02:00  
				
					
						
							
							
								 
						
							
								5c1efa1149 
								
							 
						 
						
							
							
								
								Fix installation step on Windows (regression from  e8306f623a)  
							
							... 
							
							
							
							Since the DLL now has a fixed name there is no need to install a versioned alias too. 
							
						 
						
							2012-10-15 22:13:37 +02:00  
				
					
						
							
							
								 
						
							
								ca4136cf41 
								
							 
						 
						
							
							
								
								Fixed   #147 : LAPACK symbols were not being exported for version 3.4.2  
							
							
							
						 
						
							2012-10-12 23:44:23 +02:00  
				
					
						
							
							
								 
						
							
								3a26470fb7 
								
							 
						 
						
							
							
								
								Merge branch 'develop'  
							
							
							
						 
						
							2012-10-09 20:08:28 +08:00  
				
					
						
							
							
								 
						
							
								6c5899dff5 
								
							 
						 
						
							
							
								
								Don't use xgetbv instruction when NO_AVX=1  
							
							
							
						 
						
							2012-10-09 14:52:35 +08:00  
				
					
						
							
							
								 
						
							
								2df2878dfc 
								
							 
						 
						
							
							
								
								Merge branch 'develop'  
							
							
							
						 
						
							2012-10-08 13:38:03 +08:00  
				
					
						
							
							
								 
						
							
								0b719945c5 
								
							 
						 
						
							
							
								
								Updated the doc for 0.2.4 version.  
							
							
							
						 
						
							2012-10-08 13:37:44 +08:00  
				
					
						
							
							
								 
						
							
								b1a54a0107 
								
							 
						 
						
							
							
								
								Fixed   #141 . make f77blas.h compatible with compilers which lack C99 complex number support.  
							
							... 
							
							
							
							Apply the patch from Tony @tonyhill. Thank you. 
							
						 
						
							2012-10-08 12:48:20 +08:00  
				
					
						
							
							
								 
						
							
								08c177ca36 
								
							 
						 
						
							
							
								
								Refs  #145 . Update LAPACK to 3.4.2 version.  
							
							
							
						 
						
							2012-09-29 23:14:39 +08:00  
				
					
						
							
							
								 
						
							
								2573311308 
								
							 
						 
						
							
							
								
								refs  #140 . Fixed zdot ABI incompatibility issue with GCC 4.7 on Win 32.  
							
							... 
							
							
							
							GCC 4.7 uses MSVC ABI on Win 32. This means the caller pops the hidden pointer for returning
aggregate structures larger than 8 bytes. 
							
						 
						
							2012-09-24 20:34:33 +08:00  
				
					
						
							
							
								 
						
							
								1d72b8bf1b 
								
							 
						 
						
							
							
								
								Fixed generating shared library bug on MIPS.  
							
							
							
						 
						
							2012-09-21 11:49:07 +00:00  
				
					
						
							
							
								 
						
							
								758e34efbb 
								
							 
						 
						
							
							
								
								Fixed the detection bug on Loongson 3A server.  
							
							
							
						 
						
							2012-09-21 10:14:07 +00:00  
				
					
						
							
							
								 
						
							
								735ca38b8f 
								
							 
						 
						
							
							
								
								Refs  #139 . Check whether the OS supports AVX at runtime.  
							
							
							
						 
						
							2012-09-18 15:46:20 +08:00  
				
					
						
							
							
								 
						
							
								f76a384841 
								
							 
						 
						
							
							
								
								Refs  #139 . Added NO_AVX flag to use old Nehalem kernels on Sandy Bridge.  
							
							... 
							
							
							
							For example, make NO_AVX=1 or make DYNAMIC_ARCH=1 NO_AVX=1 
							
						 
						
							2012-09-17 23:25:46 +08:00  
				
					
						
							
							
								 
						
							
								9419a43a7f 
								
							 
						 
						
							
							
								
								Fixed   #142 . Added the gesvd and potrs function families to common_interface.h.  
							
							
							
						 
						
							2012-09-14 15:15:08 +08:00  
				
					
						
							
							
								 
						
							
								b695680a33 
								
							 
						 
						
							
							
								
								Fixed   #143 . Don't generate cblas.h with NO_CBLAS.  
							
							
							
						 
						
							2012-09-14 14:06:14 +08:00  
				
					
						
							
							
								 
						
							
								d0e731e8b8 
								
							 
						 
						
							
							
								
								provide support for passing CFLAGS, FFLAGS, PFLAGS, FPFLAGS to make on the command line  
							
							
							
						 
						
							2012-08-21 00:31:12 -04:00  
				
					
						
							
							
								 
						
							
								48f075cfd5 
								
							 
						 
						
							
							
								
								Merge branch 'develop'  
							
							
							
						 
						
							2012-08-20 16:52:35 +08:00  
				
					
						
							
							
								 
						
							
								3e87648de3 
								
							 
						 
						
							
							
								
								Updated the doc for 0.2.3 version.  
							
							
							
						 
						
							2012-08-20 16:51:47 +08:00  
				
					
						
							
							
								 
						
							
								fe4ab95cd5 
								
							 
						 
						
							
							
								
								Refs  #136 . Fixed a bug about controlling the number of threads on Windows.  
							
							
							
						 
						
							2012-08-19 23:50:54 +08:00  
				
					
						
							
							
								 
						
							
								801383effe 
								
							 
						 
						
							
							
								
								Fixed a hang bug when shutting down the blas threads server on Windows. Added the feature of dynamically changing the number of threads on Windows.  
							
							
							
						 
						
							2012-08-14 18:34:32 +08:00  
				
					
						
							
							
								 
						
							
								54cd65e47f 
								
							 
						 
						
							
							
								
								Use sandy bridge kernel when DYNAMIC_ARCH=1.  
							
							
							
						 
						
							2012-08-13 15:25:08 +08:00  
				
					
						
							
							
								 
						
							
								a55821a2ec 
								
							 
						 
						
							
							
								
								Refs  #132 . Kill the threads when unloading the library.  
							
							
							
						 
						
							2012-08-11 21:33:15 +08:00  
				
					
						
							
							
								 
						
							
								068861a927 
								
							 
						 
						
							
							
								
								Refs  #133 . Users can set COMMON_OPT flag to control CFLAGS and FFLAGS.  
							
							
							
						 
						
							2012-08-10 14:36:26 +08:00  
				
					
						
							
							
								 
						
							
								d007cca61d 
								
							 
						 
						
							
							
								
								Refs  #134 . Fixed the building bug on IBM Power.  
							
							
							
						 
						
							2012-08-10 11:54:21 +08:00